| { |
| "best_global_step": null, |
| "best_metric": null, |
| "best_model_checkpoint": null, |
| "epoch": 7.0, |
| "eval_steps": 500, |
| "global_step": 6664, |
| "is_hyper_param_search": false, |
| "is_local_process_zero": true, |
| "is_world_process_zero": true, |
| "log_history": [ |
| { |
| "epoch": 0.005252100840336135, |
| "grad_norm": 14.420694283658325, |
| "learning_rate": 2.39880059970015e-07, |
| "loss": 0.8126, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.790475606918335, |
| "step": 5, |
| "valid_targets_mean": 1423.4, |
| "valid_targets_min": 715 |
| }, |
| { |
| "epoch": 0.01050420168067227, |
| "grad_norm": 15.311496330131531, |
| "learning_rate": 5.397301349325338e-07, |
| "loss": 0.8157, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.8297374248504639, |
| "step": 10, |
| "valid_targets_mean": 1407.8, |
| "valid_targets_min": 612 |
| }, |
| { |
| "epoch": 0.015756302521008403, |
| "grad_norm": 13.45958528833613, |
| "learning_rate": 8.395802098950526e-07, |
| "loss": 0.7879, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.7610906362533569, |
| "step": 15, |
| "valid_targets_mean": 1413.5, |
| "valid_targets_min": 714 |
| }, |
| { |
| "epoch": 0.02100840336134454, |
| "grad_norm": 11.905230272753508, |
| "learning_rate": 1.1394302848575713e-06, |
| "loss": 0.7735, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.753049373626709, |
| "step": 20, |
| "valid_targets_mean": 1450.1, |
| "valid_targets_min": 754 |
| }, |
| { |
| "epoch": 0.026260504201680673, |
| "grad_norm": 9.744011308309286, |
| "learning_rate": 1.43928035982009e-06, |
| "loss": 0.744, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.7382731437683105, |
| "step": 25, |
| "valid_targets_mean": 1481.1, |
| "valid_targets_min": 718 |
| }, |
| { |
| "epoch": 0.031512605042016806, |
| "grad_norm": 7.094821641510122, |
| "learning_rate": 1.7391304347826088e-06, |
| "loss": 0.7128, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.6914137601852417, |
| "step": 30, |
| "valid_targets_mean": 1530.8, |
| "valid_targets_min": 731 |
| }, |
| { |
| "epoch": 0.03676470588235294, |
| "grad_norm": 6.368906220458843, |
| "learning_rate": 2.0389805097451275e-06, |
| "loss": 0.6643, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.6466853022575378, |
| "step": 35, |
| "valid_targets_mean": 1416.6, |
| "valid_targets_min": 725 |
| }, |
| { |
| "epoch": 0.04201680672268908, |
| "grad_norm": 5.399102696758742, |
| "learning_rate": 2.3388305847076464e-06, |
| "loss": 0.6382, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.6274276971817017, |
| "step": 40, |
| "valid_targets_mean": 1371.5, |
| "valid_targets_min": 610 |
| }, |
| { |
| "epoch": 0.04726890756302521, |
| "grad_norm": 4.306253658085107, |
| "learning_rate": 2.6386806596701653e-06, |
| "loss": 0.5772, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.5616586208343506, |
| "step": 45, |
| "valid_targets_mean": 1484.7, |
| "valid_targets_min": 720 |
| }, |
| { |
| "epoch": 0.052521008403361345, |
| "grad_norm": 3.7077951595748515, |
| "learning_rate": 2.9385307346326843e-06, |
| "loss": 0.527, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.4847095012664795, |
| "step": 50, |
| "valid_targets_mean": 1365.5, |
| "valid_targets_min": 765 |
| }, |
| { |
| "epoch": 0.05777310924369748, |
| "grad_norm": 2.363263225041768, |
| "learning_rate": 3.2383808095952024e-06, |
| "loss": 0.4935, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.5059503316879272, |
| "step": 55, |
| "valid_targets_mean": 1234.7, |
| "valid_targets_min": 593 |
| }, |
| { |
| "epoch": 0.06302521008403361, |
| "grad_norm": 1.6467637243933408, |
| "learning_rate": 3.5382308845577213e-06, |
| "loss": 0.4679, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.44630974531173706, |
| "step": 60, |
| "valid_targets_mean": 1540.4, |
| "valid_targets_min": 704 |
| }, |
| { |
| "epoch": 0.06827731092436974, |
| "grad_norm": 1.5411024922038776, |
| "learning_rate": 3.83808095952024e-06, |
| "loss": 0.4446, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.41912999749183655, |
| "step": 65, |
| "valid_targets_mean": 1329.9, |
| "valid_targets_min": 722 |
| }, |
| { |
| "epoch": 0.07352941176470588, |
| "grad_norm": 1.244534525186305, |
| "learning_rate": 4.137931034482759e-06, |
| "loss": 0.4205, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.39288026094436646, |
| "step": 70, |
| "valid_targets_mean": 1549.6, |
| "valid_targets_min": 865 |
| }, |
| { |
| "epoch": 0.07878151260504201, |
| "grad_norm": 1.1996703760120404, |
| "learning_rate": 4.437781109445278e-06, |
| "loss": 0.4055, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.40949755907058716, |
| "step": 75, |
| "valid_targets_mean": 1507.4, |
| "valid_targets_min": 797 |
| }, |
| { |
| "epoch": 0.08403361344537816, |
| "grad_norm": 1.2896717545023444, |
| "learning_rate": 4.737631184407796e-06, |
| "loss": 0.4011, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.43845802545547485, |
| "step": 80, |
| "valid_targets_mean": 1542.4, |
| "valid_targets_min": 728 |
| }, |
| { |
| "epoch": 0.08928571428571429, |
| "grad_norm": 1.0177436395323942, |
| "learning_rate": 5.037481259370315e-06, |
| "loss": 0.3951, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.38916561007499695, |
| "step": 85, |
| "valid_targets_mean": 1595.2, |
| "valid_targets_min": 683 |
| }, |
| { |
| "epoch": 0.09453781512605042, |
| "grad_norm": 1.9249372968791647, |
| "learning_rate": 5.337331334332834e-06, |
| "loss": 0.3869, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.39647072553634644, |
| "step": 90, |
| "valid_targets_mean": 1401.6, |
| "valid_targets_min": 706 |
| }, |
| { |
| "epoch": 0.09978991596638656, |
| "grad_norm": 1.284016705259006, |
| "learning_rate": 5.6371814092953526e-06, |
| "loss": 0.3607, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3547477126121521, |
| "step": 95, |
| "valid_targets_mean": 1298.4, |
| "valid_targets_min": 625 |
| }, |
| { |
| "epoch": 0.10504201680672269, |
| "grad_norm": 1.0443779966069502, |
| "learning_rate": 5.937031484257871e-06, |
| "loss": 0.3572, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.35236796736717224, |
| "step": 100, |
| "valid_targets_mean": 1659.7, |
| "valid_targets_min": 790 |
| }, |
| { |
| "epoch": 0.11029411764705882, |
| "grad_norm": 1.0855951515574154, |
| "learning_rate": 6.2368815592203904e-06, |
| "loss": 0.3587, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3708180785179138, |
| "step": 105, |
| "valid_targets_mean": 1600.4, |
| "valid_targets_min": 684 |
| }, |
| { |
| "epoch": 0.11554621848739496, |
| "grad_norm": 1.1032891548957378, |
| "learning_rate": 6.536731634182909e-06, |
| "loss": 0.3475, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.322293221950531, |
| "step": 110, |
| "valid_targets_mean": 1338.3, |
| "valid_targets_min": 739 |
| }, |
| { |
| "epoch": 0.1207983193277311, |
| "grad_norm": 0.9768878378529005, |
| "learning_rate": 6.8365817091454274e-06, |
| "loss": 0.3369, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3234562277793884, |
| "step": 115, |
| "valid_targets_mean": 1456.2, |
| "valid_targets_min": 657 |
| }, |
| { |
| "epoch": 0.12605042016806722, |
| "grad_norm": 1.0487060724275885, |
| "learning_rate": 7.136431784107947e-06, |
| "loss": 0.329, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.32765859365463257, |
| "step": 120, |
| "valid_targets_mean": 1340.2, |
| "valid_targets_min": 783 |
| }, |
| { |
| "epoch": 0.13130252100840337, |
| "grad_norm": 1.1049013021741143, |
| "learning_rate": 7.436281859070465e-06, |
| "loss": 0.3235, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.31769877672195435, |
| "step": 125, |
| "valid_targets_mean": 1394.4, |
| "valid_targets_min": 734 |
| }, |
| { |
| "epoch": 0.13655462184873948, |
| "grad_norm": 1.0426803049134692, |
| "learning_rate": 7.736131934032984e-06, |
| "loss": 0.319, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3211321234703064, |
| "step": 130, |
| "valid_targets_mean": 1501.8, |
| "valid_targets_min": 678 |
| }, |
| { |
| "epoch": 0.14180672268907563, |
| "grad_norm": 1.0513598327816873, |
| "learning_rate": 8.035982008995503e-06, |
| "loss": 0.3162, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.31629741191864014, |
| "step": 135, |
| "valid_targets_mean": 1651.7, |
| "valid_targets_min": 843 |
| }, |
| { |
| "epoch": 0.14705882352941177, |
| "grad_norm": 1.0551559578309457, |
| "learning_rate": 8.335832083958023e-06, |
| "loss": 0.3204, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3266269564628601, |
| "step": 140, |
| "valid_targets_mean": 1632.1, |
| "valid_targets_min": 782 |
| }, |
| { |
| "epoch": 0.15231092436974789, |
| "grad_norm": 0.9612333107113046, |
| "learning_rate": 8.63568215892054e-06, |
| "loss": 0.306, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.33223849534988403, |
| "step": 145, |
| "valid_targets_mean": 1615.3, |
| "valid_targets_min": 957 |
| }, |
| { |
| "epoch": 0.15756302521008403, |
| "grad_norm": 1.0081404887340868, |
| "learning_rate": 8.93553223388306e-06, |
| "loss": 0.315, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.32516705989837646, |
| "step": 150, |
| "valid_targets_mean": 1482.9, |
| "valid_targets_min": 713 |
| }, |
| { |
| "epoch": 0.16281512605042017, |
| "grad_norm": 1.0468696423891182, |
| "learning_rate": 9.235382308845579e-06, |
| "loss": 0.3071, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3112391531467438, |
| "step": 155, |
| "valid_targets_mean": 1552.8, |
| "valid_targets_min": 726 |
| }, |
| { |
| "epoch": 0.16806722689075632, |
| "grad_norm": 0.9973569578712165, |
| "learning_rate": 9.535232383808097e-06, |
| "loss": 0.2979, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2998279333114624, |
| "step": 160, |
| "valid_targets_mean": 1590.4, |
| "valid_targets_min": 1147 |
| }, |
| { |
| "epoch": 0.17331932773109243, |
| "grad_norm": 1.2443677749688786, |
| "learning_rate": 9.835082458770614e-06, |
| "loss": 0.2954, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.30380943417549133, |
| "step": 165, |
| "valid_targets_mean": 1417.6, |
| "valid_targets_min": 700 |
| }, |
| { |
| "epoch": 0.17857142857142858, |
| "grad_norm": 1.1254552821617871, |
| "learning_rate": 1.0134932533733135e-05, |
| "loss": 0.284, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2681633234024048, |
| "step": 170, |
| "valid_targets_mean": 1255.4, |
| "valid_targets_min": 640 |
| }, |
| { |
| "epoch": 0.18382352941176472, |
| "grad_norm": 0.9851494239413889, |
| "learning_rate": 1.0434782608695653e-05, |
| "loss": 0.2881, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2868928611278534, |
| "step": 175, |
| "valid_targets_mean": 1566.6, |
| "valid_targets_min": 817 |
| }, |
| { |
| "epoch": 0.18907563025210083, |
| "grad_norm": 1.098473835442716, |
| "learning_rate": 1.0734632683658172e-05, |
| "loss": 0.286, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.27357298135757446, |
| "step": 180, |
| "valid_targets_mean": 1440.9, |
| "valid_targets_min": 724 |
| }, |
| { |
| "epoch": 0.19432773109243698, |
| "grad_norm": 1.1557321572729486, |
| "learning_rate": 1.103448275862069e-05, |
| "loss": 0.2938, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.29238957166671753, |
| "step": 185, |
| "valid_targets_mean": 1399.1, |
| "valid_targets_min": 657 |
| }, |
| { |
| "epoch": 0.19957983193277312, |
| "grad_norm": 1.1396871077620272, |
| "learning_rate": 1.1334332833583211e-05, |
| "loss": 0.2932, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2987218499183655, |
| "step": 190, |
| "valid_targets_mean": 1334.3, |
| "valid_targets_min": 746 |
| }, |
| { |
| "epoch": 0.20483193277310924, |
| "grad_norm": 1.1178689873643397, |
| "learning_rate": 1.1634182908545729e-05, |
| "loss": 0.2941, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.33798643946647644, |
| "step": 195, |
| "valid_targets_mean": 1452.8, |
| "valid_targets_min": 692 |
| }, |
| { |
| "epoch": 0.21008403361344538, |
| "grad_norm": 1.0854720395667985, |
| "learning_rate": 1.1934032983508246e-05, |
| "loss": 0.2816, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.25798511505126953, |
| "step": 200, |
| "valid_targets_mean": 1338.4, |
| "valid_targets_min": 682 |
| }, |
| { |
| "epoch": 0.21533613445378152, |
| "grad_norm": 1.1508679180169188, |
| "learning_rate": 1.2233883058470766e-05, |
| "loss": 0.2723, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.276319682598114, |
| "step": 205, |
| "valid_targets_mean": 1360.2, |
| "valid_targets_min": 703 |
| }, |
| { |
| "epoch": 0.22058823529411764, |
| "grad_norm": 0.990266456581399, |
| "learning_rate": 1.2533733133433283e-05, |
| "loss": 0.2973, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2741560935974121, |
| "step": 210, |
| "valid_targets_mean": 1520.9, |
| "valid_targets_min": 864 |
| }, |
| { |
| "epoch": 0.22584033613445378, |
| "grad_norm": 0.9411807898115928, |
| "learning_rate": 1.2833583208395803e-05, |
| "loss": 0.2983, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3527371883392334, |
| "step": 215, |
| "valid_targets_mean": 1814.6, |
| "valid_targets_min": 734 |
| }, |
| { |
| "epoch": 0.23109243697478993, |
| "grad_norm": 0.9509244068358998, |
| "learning_rate": 1.313343328335832e-05, |
| "loss": 0.2758, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.27980518341064453, |
| "step": 220, |
| "valid_targets_mean": 1478.3, |
| "valid_targets_min": 607 |
| }, |
| { |
| "epoch": 0.23634453781512604, |
| "grad_norm": 0.9802646448806872, |
| "learning_rate": 1.3433283358320841e-05, |
| "loss": 0.2797, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2757881283760071, |
| "step": 225, |
| "valid_targets_mean": 1497.9, |
| "valid_targets_min": 551 |
| }, |
| { |
| "epoch": 0.2415966386554622, |
| "grad_norm": 1.1416789358107773, |
| "learning_rate": 1.3733133433283359e-05, |
| "loss": 0.2842, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2863280773162842, |
| "step": 230, |
| "valid_targets_mean": 1550.5, |
| "valid_targets_min": 676 |
| }, |
| { |
| "epoch": 0.24684873949579833, |
| "grad_norm": 1.2243896073517977, |
| "learning_rate": 1.4032983508245878e-05, |
| "loss": 0.28, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2647148370742798, |
| "step": 235, |
| "valid_targets_mean": 1372.5, |
| "valid_targets_min": 904 |
| }, |
| { |
| "epoch": 0.25210084033613445, |
| "grad_norm": 1.0671177129673626, |
| "learning_rate": 1.4332833583208396e-05, |
| "loss": 0.2667, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2796405553817749, |
| "step": 240, |
| "valid_targets_mean": 1479.0, |
| "valid_targets_min": 859 |
| }, |
| { |
| "epoch": 0.25735294117647056, |
| "grad_norm": 1.1155587555825344, |
| "learning_rate": 1.4632683658170917e-05, |
| "loss": 0.267, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2673705816268921, |
| "step": 245, |
| "valid_targets_mean": 1234.8, |
| "valid_targets_min": 737 |
| }, |
| { |
| "epoch": 0.26260504201680673, |
| "grad_norm": 1.0111523665697042, |
| "learning_rate": 1.4932533733133435e-05, |
| "loss": 0.2816, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3024107813835144, |
| "step": 250, |
| "valid_targets_mean": 1363.2, |
| "valid_targets_min": 791 |
| }, |
| { |
| "epoch": 0.26785714285714285, |
| "grad_norm": 0.9398095246969382, |
| "learning_rate": 1.5232383808095954e-05, |
| "loss": 0.2773, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.28389376401901245, |
| "step": 255, |
| "valid_targets_mean": 1532.1, |
| "valid_targets_min": 786 |
| }, |
| { |
| "epoch": 0.27310924369747897, |
| "grad_norm": 0.9520954006331536, |
| "learning_rate": 1.5532233883058472e-05, |
| "loss": 0.2619, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.262344628572464, |
| "step": 260, |
| "valid_targets_mean": 1471.0, |
| "valid_targets_min": 944 |
| }, |
| { |
| "epoch": 0.27836134453781514, |
| "grad_norm": 0.9231810982153198, |
| "learning_rate": 1.5832083958020993e-05, |
| "loss": 0.268, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.25394904613494873, |
| "step": 265, |
| "valid_targets_mean": 1494.1, |
| "valid_targets_min": 1075 |
| }, |
| { |
| "epoch": 0.28361344537815125, |
| "grad_norm": 1.036465235131244, |
| "learning_rate": 1.613193403298351e-05, |
| "loss": 0.2693, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2542717456817627, |
| "step": 270, |
| "valid_targets_mean": 1340.9, |
| "valid_targets_min": 740 |
| }, |
| { |
| "epoch": 0.28886554621848737, |
| "grad_norm": 0.969535346268365, |
| "learning_rate": 1.6431784107946028e-05, |
| "loss": 0.2674, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2644956707954407, |
| "step": 275, |
| "valid_targets_mean": 1530.9, |
| "valid_targets_min": 727 |
| }, |
| { |
| "epoch": 0.29411764705882354, |
| "grad_norm": 1.095458178867704, |
| "learning_rate": 1.6731634182908546e-05, |
| "loss": 0.257, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2714339792728424, |
| "step": 280, |
| "valid_targets_mean": 1233.0, |
| "valid_targets_min": 636 |
| }, |
| { |
| "epoch": 0.29936974789915966, |
| "grad_norm": 0.989855094627666, |
| "learning_rate": 1.7031484257871064e-05, |
| "loss": 0.2571, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2507407069206238, |
| "step": 285, |
| "valid_targets_mean": 1246.8, |
| "valid_targets_min": 684 |
| }, |
| { |
| "epoch": 0.30462184873949577, |
| "grad_norm": 1.0834380820761222, |
| "learning_rate": 1.7331334332833585e-05, |
| "loss": 0.2479, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.26474529504776, |
| "step": 290, |
| "valid_targets_mean": 1392.5, |
| "valid_targets_min": 798 |
| }, |
| { |
| "epoch": 0.30987394957983194, |
| "grad_norm": 1.035539563074315, |
| "learning_rate": 1.7631184407796102e-05, |
| "loss": 0.2635, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.24842077493667603, |
| "step": 295, |
| "valid_targets_mean": 1319.9, |
| "valid_targets_min": 661 |
| }, |
| { |
| "epoch": 0.31512605042016806, |
| "grad_norm": 1.0392297368060632, |
| "learning_rate": 1.7931034482758623e-05, |
| "loss": 0.2567, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2532370090484619, |
| "step": 300, |
| "valid_targets_mean": 1554.4, |
| "valid_targets_min": 665 |
| }, |
| { |
| "epoch": 0.32037815126050423, |
| "grad_norm": 1.1437803903133303, |
| "learning_rate": 1.823088455772114e-05, |
| "loss": 0.2547, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.26745492219924927, |
| "step": 305, |
| "valid_targets_mean": 1417.8, |
| "valid_targets_min": 692 |
| }, |
| { |
| "epoch": 0.32563025210084034, |
| "grad_norm": 1.0470695391841682, |
| "learning_rate": 1.853073463268366e-05, |
| "loss": 0.2622, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.27369868755340576, |
| "step": 310, |
| "valid_targets_mean": 1223.8, |
| "valid_targets_min": 632 |
| }, |
| { |
| "epoch": 0.33088235294117646, |
| "grad_norm": 0.99682750228871, |
| "learning_rate": 1.8830584707646176e-05, |
| "loss": 0.2577, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2700139284133911, |
| "step": 315, |
| "valid_targets_mean": 1550.6, |
| "valid_targets_min": 922 |
| }, |
| { |
| "epoch": 0.33613445378151263, |
| "grad_norm": 0.9922010090048154, |
| "learning_rate": 1.9130434782608697e-05, |
| "loss": 0.2509, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.23878350853919983, |
| "step": 320, |
| "valid_targets_mean": 1542.2, |
| "valid_targets_min": 710 |
| }, |
| { |
| "epoch": 0.34138655462184875, |
| "grad_norm": 0.9969922099846812, |
| "learning_rate": 1.9430284857571215e-05, |
| "loss": 0.2564, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.24636775255203247, |
| "step": 325, |
| "valid_targets_mean": 1390.6, |
| "valid_targets_min": 750 |
| }, |
| { |
| "epoch": 0.34663865546218486, |
| "grad_norm": 0.9249347847273258, |
| "learning_rate": 1.9730134932533736e-05, |
| "loss": 0.2576, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.25145918130874634, |
| "step": 330, |
| "valid_targets_mean": 1515.5, |
| "valid_targets_min": 766 |
| }, |
| { |
| "epoch": 0.35189075630252103, |
| "grad_norm": 0.9954869233754978, |
| "learning_rate": 2.0029985007496254e-05, |
| "loss": 0.2675, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.23031079769134521, |
| "step": 335, |
| "valid_targets_mean": 1333.3, |
| "valid_targets_min": 748 |
| }, |
| { |
| "epoch": 0.35714285714285715, |
| "grad_norm": 1.0229626657604847, |
| "learning_rate": 2.0329835082458775e-05, |
| "loss": 0.2635, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2601286470890045, |
| "step": 340, |
| "valid_targets_mean": 1395.2, |
| "valid_targets_min": 682 |
| }, |
| { |
| "epoch": 0.36239495798319327, |
| "grad_norm": 0.9742753314709449, |
| "learning_rate": 2.0629685157421292e-05, |
| "loss": 0.2644, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2516604959964752, |
| "step": 345, |
| "valid_targets_mean": 1515.6, |
| "valid_targets_min": 738 |
| }, |
| { |
| "epoch": 0.36764705882352944, |
| "grad_norm": 1.0984493157523587, |
| "learning_rate": 2.092953523238381e-05, |
| "loss": 0.263, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.26009607315063477, |
| "step": 350, |
| "valid_targets_mean": 1312.8, |
| "valid_targets_min": 731 |
| }, |
| { |
| "epoch": 0.37289915966386555, |
| "grad_norm": 1.0124670927846027, |
| "learning_rate": 2.1229385307346328e-05, |
| "loss": 0.2634, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2756904661655426, |
| "step": 355, |
| "valid_targets_mean": 1492.9, |
| "valid_targets_min": 646 |
| }, |
| { |
| "epoch": 0.37815126050420167, |
| "grad_norm": 0.9303311281634132, |
| "learning_rate": 2.152923538230885e-05, |
| "loss": 0.2475, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.23849308490753174, |
| "step": 360, |
| "valid_targets_mean": 1369.1, |
| "valid_targets_min": 780 |
| }, |
| { |
| "epoch": 0.38340336134453784, |
| "grad_norm": 0.938627487391855, |
| "learning_rate": 2.1829085457271363e-05, |
| "loss": 0.2506, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.24323752522468567, |
| "step": 365, |
| "valid_targets_mean": 1521.9, |
| "valid_targets_min": 676 |
| }, |
| { |
| "epoch": 0.38865546218487396, |
| "grad_norm": 1.0170934463633303, |
| "learning_rate": 2.2128935532233884e-05, |
| "loss": 0.2615, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.23910865187644958, |
| "step": 370, |
| "valid_targets_mean": 1277.9, |
| "valid_targets_min": 687 |
| }, |
| { |
| "epoch": 0.3939075630252101, |
| "grad_norm": 0.9747309964507797, |
| "learning_rate": 2.2428785607196405e-05, |
| "loss": 0.2519, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2347027212381363, |
| "step": 375, |
| "valid_targets_mean": 1336.5, |
| "valid_targets_min": 703 |
| }, |
| { |
| "epoch": 0.39915966386554624, |
| "grad_norm": 1.0544024939800751, |
| "learning_rate": 2.2728635682158923e-05, |
| "loss": 0.2461, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.22451592981815338, |
| "step": 380, |
| "valid_targets_mean": 1288.1, |
| "valid_targets_min": 522 |
| }, |
| { |
| "epoch": 0.40441176470588236, |
| "grad_norm": 1.0293634003316077, |
| "learning_rate": 2.302848575712144e-05, |
| "loss": 0.2399, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2373955398797989, |
| "step": 385, |
| "valid_targets_mean": 1526.9, |
| "valid_targets_min": 764 |
| }, |
| { |
| "epoch": 0.4096638655462185, |
| "grad_norm": 1.0510698011217983, |
| "learning_rate": 2.3328335832083958e-05, |
| "loss": 0.2701, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.272568941116333, |
| "step": 390, |
| "valid_targets_mean": 1372.4, |
| "valid_targets_min": 548 |
| }, |
| { |
| "epoch": 0.41491596638655465, |
| "grad_norm": 1.0256066743434804, |
| "learning_rate": 2.362818590704648e-05, |
| "loss": 0.237, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2508437931537628, |
| "step": 395, |
| "valid_targets_mean": 1356.8, |
| "valid_targets_min": 694 |
| }, |
| { |
| "epoch": 0.42016806722689076, |
| "grad_norm": 0.918276243513663, |
| "learning_rate": 2.3928035982009e-05, |
| "loss": 0.249, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.26278817653656006, |
| "step": 400, |
| "valid_targets_mean": 1540.9, |
| "valid_targets_min": 823 |
| }, |
| { |
| "epoch": 0.4254201680672269, |
| "grad_norm": 0.829017462865176, |
| "learning_rate": 2.4227886056971515e-05, |
| "loss": 0.2182, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1897987425327301, |
| "step": 405, |
| "valid_targets_mean": 1442.4, |
| "valid_targets_min": 682 |
| }, |
| { |
| "epoch": 0.43067226890756305, |
| "grad_norm": 1.009337402964787, |
| "learning_rate": 2.4527736131934036e-05, |
| "loss": 0.2422, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.25567498803138733, |
| "step": 410, |
| "valid_targets_mean": 1407.6, |
| "valid_targets_min": 693 |
| }, |
| { |
| "epoch": 0.43592436974789917, |
| "grad_norm": 1.102110069443316, |
| "learning_rate": 2.4827586206896553e-05, |
| "loss": 0.2392, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.22340771555900574, |
| "step": 415, |
| "valid_targets_mean": 1197.8, |
| "valid_targets_min": 639 |
| }, |
| { |
| "epoch": 0.4411764705882353, |
| "grad_norm": 0.9439286600674722, |
| "learning_rate": 2.5127436281859074e-05, |
| "loss": 0.2466, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.22316749393939972, |
| "step": 420, |
| "valid_targets_mean": 1423.3, |
| "valid_targets_min": 685 |
| }, |
| { |
| "epoch": 0.44642857142857145, |
| "grad_norm": 0.9288887022810997, |
| "learning_rate": 2.542728635682159e-05, |
| "loss": 0.2356, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.22205528616905212, |
| "step": 425, |
| "valid_targets_mean": 1331.5, |
| "valid_targets_min": 827 |
| }, |
| { |
| "epoch": 0.45168067226890757, |
| "grad_norm": 0.918938060661647, |
| "learning_rate": 2.572713643178411e-05, |
| "loss": 0.2436, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.24578994512557983, |
| "step": 430, |
| "valid_targets_mean": 1381.7, |
| "valid_targets_min": 686 |
| }, |
| { |
| "epoch": 0.4569327731092437, |
| "grad_norm": 0.8450512785959888, |
| "learning_rate": 2.602698650674663e-05, |
| "loss": 0.2512, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.25319570302963257, |
| "step": 435, |
| "valid_targets_mean": 1472.2, |
| "valid_targets_min": 713 |
| }, |
| { |
| "epoch": 0.46218487394957986, |
| "grad_norm": 1.3247180796200522, |
| "learning_rate": 2.632683658170915e-05, |
| "loss": 0.2979, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.4720996022224426, |
| "step": 440, |
| "valid_targets_mean": 2248.9, |
| "valid_targets_min": 920 |
| }, |
| { |
| "epoch": 0.46743697478991597, |
| "grad_norm": 0.7756817606153216, |
| "learning_rate": 2.6626686656671666e-05, |
| "loss": 0.4381, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.4191029667854309, |
| "step": 445, |
| "valid_targets_mean": 3664.4, |
| "valid_targets_min": 746 |
| }, |
| { |
| "epoch": 0.4726890756302521, |
| "grad_norm": 0.8141822973818857, |
| "learning_rate": 2.6926536731634184e-05, |
| "loss": 0.4066, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.42180395126342773, |
| "step": 450, |
| "valid_targets_mean": 3591.1, |
| "valid_targets_min": 1635 |
| }, |
| { |
| "epoch": 0.47794117647058826, |
| "grad_norm": 0.6183205557943057, |
| "learning_rate": 2.7226386806596705e-05, |
| "loss": 0.399, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.37809157371520996, |
| "step": 455, |
| "valid_targets_mean": 4172.7, |
| "valid_targets_min": 777 |
| }, |
| { |
| "epoch": 0.4831932773109244, |
| "grad_norm": 0.6341645150900163, |
| "learning_rate": 2.752623688155922e-05, |
| "loss": 0.3807, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3980065882205963, |
| "step": 460, |
| "valid_targets_mean": 4040.2, |
| "valid_targets_min": 2187 |
| }, |
| { |
| "epoch": 0.4884453781512605, |
| "grad_norm": 0.7232188026091549, |
| "learning_rate": 2.782608695652174e-05, |
| "loss": 0.3993, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.39658811688423157, |
| "step": 465, |
| "valid_targets_mean": 3156.3, |
| "valid_targets_min": 1432 |
| }, |
| { |
| "epoch": 0.49369747899159666, |
| "grad_norm": 0.5975850484936072, |
| "learning_rate": 2.812593703148426e-05, |
| "loss": 0.377, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.35548049211502075, |
| "step": 470, |
| "valid_targets_mean": 3529.7, |
| "valid_targets_min": 767 |
| }, |
| { |
| "epoch": 0.4989495798319328, |
| "grad_norm": 0.6544292649550012, |
| "learning_rate": 2.8425787106446782e-05, |
| "loss": 0.3589, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.36396756768226624, |
| "step": 475, |
| "valid_targets_mean": 3485.6, |
| "valid_targets_min": 1488 |
| }, |
| { |
| "epoch": 0.5042016806722689, |
| "grad_norm": 0.5784234889060588, |
| "learning_rate": 2.8725637181409296e-05, |
| "loss": 0.3769, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3580145239830017, |
| "step": 480, |
| "valid_targets_mean": 3707.0, |
| "valid_targets_min": 578 |
| }, |
| { |
| "epoch": 0.509453781512605, |
| "grad_norm": 0.5809204879202081, |
| "learning_rate": 2.9025487256371818e-05, |
| "loss": 0.3991, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.37097570300102234, |
| "step": 485, |
| "valid_targets_mean": 4252.4, |
| "valid_targets_min": 1241 |
| }, |
| { |
| "epoch": 0.5147058823529411, |
| "grad_norm": 0.6518660166623274, |
| "learning_rate": 2.9325337331334335e-05, |
| "loss": 0.3791, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.39846816658973694, |
| "step": 490, |
| "valid_targets_mean": 4029.2, |
| "valid_targets_min": 807 |
| }, |
| { |
| "epoch": 0.5199579831932774, |
| "grad_norm": 0.5952710397208067, |
| "learning_rate": 2.9625187406296856e-05, |
| "loss": 0.3793, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.34132808446884155, |
| "step": 495, |
| "valid_targets_mean": 4507.0, |
| "valid_targets_min": 2011 |
| }, |
| { |
| "epoch": 0.5252100840336135, |
| "grad_norm": 0.5921750584078646, |
| "learning_rate": 2.992503748125937e-05, |
| "loss": 0.3773, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3380280137062073, |
| "step": 500, |
| "valid_targets_mean": 4268.2, |
| "valid_targets_min": 1329 |
| }, |
| { |
| "epoch": 0.5304621848739496, |
| "grad_norm": 0.7847684848643338, |
| "learning_rate": 3.022488755622189e-05, |
| "loss": 0.3692, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3614731431007385, |
| "step": 505, |
| "valid_targets_mean": 3858.9, |
| "valid_targets_min": 1366 |
| }, |
| { |
| "epoch": 0.5357142857142857, |
| "grad_norm": 0.6674187275757447, |
| "learning_rate": 3.052473763118441e-05, |
| "loss": 0.3796, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.36018460988998413, |
| "step": 510, |
| "valid_targets_mean": 3169.1, |
| "valid_targets_min": 1334 |
| }, |
| { |
| "epoch": 0.5409663865546218, |
| "grad_norm": 0.5809835935023818, |
| "learning_rate": 3.0824587706146934e-05, |
| "loss": 0.3895, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.34386080503463745, |
| "step": 515, |
| "valid_targets_mean": 4130.4, |
| "valid_targets_min": 1762 |
| }, |
| { |
| "epoch": 0.5462184873949579, |
| "grad_norm": 0.6856115085091843, |
| "learning_rate": 3.112443778110945e-05, |
| "loss": 0.3807, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3728490471839905, |
| "step": 520, |
| "valid_targets_mean": 3285.0, |
| "valid_targets_min": 855 |
| }, |
| { |
| "epoch": 0.5514705882352942, |
| "grad_norm": 0.7152310015109019, |
| "learning_rate": 3.142428785607197e-05, |
| "loss": 0.3934, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3993592858314514, |
| "step": 525, |
| "valid_targets_mean": 3298.2, |
| "valid_targets_min": 1269 |
| }, |
| { |
| "epoch": 0.5567226890756303, |
| "grad_norm": 0.7853116245952066, |
| "learning_rate": 3.172413793103448e-05, |
| "loss": 0.3929, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3852170705795288, |
| "step": 530, |
| "valid_targets_mean": 2740.4, |
| "valid_targets_min": 1041 |
| }, |
| { |
| "epoch": 0.5619747899159664, |
| "grad_norm": 0.7253886613797418, |
| "learning_rate": 3.2023988005997004e-05, |
| "loss": 0.3777, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3952094614505768, |
| "step": 535, |
| "valid_targets_mean": 2995.1, |
| "valid_targets_min": 1291 |
| }, |
| { |
| "epoch": 0.5672268907563025, |
| "grad_norm": 0.7947910205242297, |
| "learning_rate": 3.2323838080959525e-05, |
| "loss": 0.3671, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3840707540512085, |
| "step": 540, |
| "valid_targets_mean": 2811.6, |
| "valid_targets_min": 1133 |
| }, |
| { |
| "epoch": 0.5724789915966386, |
| "grad_norm": 0.7101634109805368, |
| "learning_rate": 3.262368815592204e-05, |
| "loss": 0.3656, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3580155372619629, |
| "step": 545, |
| "valid_targets_mean": 3709.5, |
| "valid_targets_min": 865 |
| }, |
| { |
| "epoch": 0.5777310924369747, |
| "grad_norm": 0.7401801947692503, |
| "learning_rate": 3.292353823088456e-05, |
| "loss": 0.3732, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.37310606241226196, |
| "step": 550, |
| "valid_targets_mean": 2960.6, |
| "valid_targets_min": 958 |
| }, |
| { |
| "epoch": 0.582983193277311, |
| "grad_norm": 0.6819266322867479, |
| "learning_rate": 3.3223388305847075e-05, |
| "loss": 0.3727, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.376257061958313, |
| "step": 555, |
| "valid_targets_mean": 3189.2, |
| "valid_targets_min": 771 |
| }, |
| { |
| "epoch": 0.5882352941176471, |
| "grad_norm": 0.5792785228231021, |
| "learning_rate": 3.3523238380809596e-05, |
| "loss": 0.3706, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3450887203216553, |
| "step": 560, |
| "valid_targets_mean": 3823.1, |
| "valid_targets_min": 1631 |
| }, |
| { |
| "epoch": 0.5934873949579832, |
| "grad_norm": 0.706870647311464, |
| "learning_rate": 3.382308845577212e-05, |
| "loss": 0.3699, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.33471646904945374, |
| "step": 565, |
| "valid_targets_mean": 2639.4, |
| "valid_targets_min": 908 |
| }, |
| { |
| "epoch": 0.5987394957983193, |
| "grad_norm": 0.8079454260503596, |
| "learning_rate": 3.412293853073464e-05, |
| "loss": 0.3653, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.39000123739242554, |
| "step": 570, |
| "valid_targets_mean": 2988.3, |
| "valid_targets_min": 1264 |
| }, |
| { |
| "epoch": 0.6039915966386554, |
| "grad_norm": 0.6685925501276144, |
| "learning_rate": 3.442278860569715e-05, |
| "loss": 0.3659, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3652319312095642, |
| "step": 575, |
| "valid_targets_mean": 3563.1, |
| "valid_targets_min": 1889 |
| }, |
| { |
| "epoch": 0.6092436974789915, |
| "grad_norm": 0.6271409370176393, |
| "learning_rate": 3.4722638680659673e-05, |
| "loss": 0.3594, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3371011018753052, |
| "step": 580, |
| "valid_targets_mean": 3737.9, |
| "valid_targets_min": 1075 |
| }, |
| { |
| "epoch": 0.6144957983193278, |
| "grad_norm": 0.7635609780961795, |
| "learning_rate": 3.5022488755622194e-05, |
| "loss": 0.3644, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3491378426551819, |
| "step": 585, |
| "valid_targets_mean": 2745.8, |
| "valid_targets_min": 1036 |
| }, |
| { |
| "epoch": 0.6197478991596639, |
| "grad_norm": 0.9486847263065615, |
| "learning_rate": 3.5322338830584716e-05, |
| "loss": 0.3682, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3554984927177429, |
| "step": 590, |
| "valid_targets_mean": 3516.4, |
| "valid_targets_min": 1162 |
| }, |
| { |
| "epoch": 0.625, |
| "grad_norm": 0.6979971886991938, |
| "learning_rate": 3.562218890554723e-05, |
| "loss": 0.3604, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3572150468826294, |
| "step": 595, |
| "valid_targets_mean": 3279.4, |
| "valid_targets_min": 1281 |
| }, |
| { |
| "epoch": 0.6302521008403361, |
| "grad_norm": 0.628571339160864, |
| "learning_rate": 3.592203898050975e-05, |
| "loss": 0.3601, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.32577332854270935, |
| "step": 600, |
| "valid_targets_mean": 3180.4, |
| "valid_targets_min": 1816 |
| }, |
| { |
| "epoch": 0.6355042016806722, |
| "grad_norm": 0.7162106687544288, |
| "learning_rate": 3.6221889055472265e-05, |
| "loss": 0.3733, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.36203664541244507, |
| "step": 605, |
| "valid_targets_mean": 2939.2, |
| "valid_targets_min": 1629 |
| }, |
| { |
| "epoch": 0.6407563025210085, |
| "grad_norm": 0.7531458122055458, |
| "learning_rate": 3.6521739130434786e-05, |
| "loss": 0.3618, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3718830943107605, |
| "step": 610, |
| "valid_targets_mean": 2755.7, |
| "valid_targets_min": 1254 |
| }, |
| { |
| "epoch": 0.6460084033613446, |
| "grad_norm": 0.7043721880651528, |
| "learning_rate": 3.68215892053973e-05, |
| "loss": 0.3629, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3637351989746094, |
| "step": 615, |
| "valid_targets_mean": 3390.2, |
| "valid_targets_min": 1973 |
| }, |
| { |
| "epoch": 0.6512605042016807, |
| "grad_norm": 0.7411003182380056, |
| "learning_rate": 3.712143928035982e-05, |
| "loss": 0.3638, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.35509952902793884, |
| "step": 620, |
| "valid_targets_mean": 2960.4, |
| "valid_targets_min": 1195 |
| }, |
| { |
| "epoch": 0.6565126050420168, |
| "grad_norm": 0.6916717573319705, |
| "learning_rate": 3.742128935532234e-05, |
| "loss": 0.3592, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.37266242504119873, |
| "step": 625, |
| "valid_targets_mean": 3181.4, |
| "valid_targets_min": 1244 |
| }, |
| { |
| "epoch": 0.6617647058823529, |
| "grad_norm": 0.6405799101681395, |
| "learning_rate": 3.772113943028486e-05, |
| "loss": 0.3642, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.351756751537323, |
| "step": 630, |
| "valid_targets_mean": 3464.2, |
| "valid_targets_min": 1421 |
| }, |
| { |
| "epoch": 0.667016806722689, |
| "grad_norm": 0.6665303943258725, |
| "learning_rate": 3.802098950524738e-05, |
| "loss": 0.3496, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.34305959939956665, |
| "step": 635, |
| "valid_targets_mean": 3443.1, |
| "valid_targets_min": 1097 |
| }, |
| { |
| "epoch": 0.6722689075630253, |
| "grad_norm": 0.6963251575164391, |
| "learning_rate": 3.83208395802099e-05, |
| "loss": 0.349, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.36686572432518005, |
| "step": 640, |
| "valid_targets_mean": 3891.4, |
| "valid_targets_min": 1168 |
| }, |
| { |
| "epoch": 0.6775210084033614, |
| "grad_norm": 0.6447119132301098, |
| "learning_rate": 3.862068965517242e-05, |
| "loss": 0.3547, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.35105079412460327, |
| "step": 645, |
| "valid_targets_mean": 3368.9, |
| "valid_targets_min": 1700 |
| }, |
| { |
| "epoch": 0.6827731092436975, |
| "grad_norm": 0.775468044490351, |
| "learning_rate": 3.8920539730134934e-05, |
| "loss": 0.3561, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.35495996475219727, |
| "step": 650, |
| "valid_targets_mean": 2497.1, |
| "valid_targets_min": 1261 |
| }, |
| { |
| "epoch": 0.6880252100840336, |
| "grad_norm": 0.6998673088388078, |
| "learning_rate": 3.9220389805097455e-05, |
| "loss": 0.37, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.373879611492157, |
| "step": 655, |
| "valid_targets_mean": 3391.2, |
| "valid_targets_min": 1124 |
| }, |
| { |
| "epoch": 0.6932773109243697, |
| "grad_norm": 0.6911940333174383, |
| "learning_rate": 3.9520239880059976e-05, |
| "loss": 0.3604, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3743062913417816, |
| "step": 660, |
| "valid_targets_mean": 3003.8, |
| "valid_targets_min": 1361 |
| }, |
| { |
| "epoch": 0.6985294117647058, |
| "grad_norm": 0.6312467853415549, |
| "learning_rate": 3.982008995502249e-05, |
| "loss": 0.3406, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3238492012023926, |
| "step": 665, |
| "valid_targets_mean": 3239.7, |
| "valid_targets_min": 1679 |
| }, |
| { |
| "epoch": 0.7037815126050421, |
| "grad_norm": 0.6929968801305512, |
| "learning_rate": 3.9999989022799437e-05, |
| "loss": 0.3559, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.374039888381958, |
| "step": 670, |
| "valid_targets_mean": 3101.2, |
| "valid_targets_min": 1739 |
| }, |
| { |
| "epoch": 0.7090336134453782, |
| "grad_norm": 0.7069459947278421, |
| "learning_rate": 3.9999865529431466e-05, |
| "loss": 0.3481, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3492530584335327, |
| "step": 675, |
| "valid_targets_mean": 2844.4, |
| "valid_targets_min": 1278 |
| }, |
| { |
| "epoch": 0.7142857142857143, |
| "grad_norm": 0.6222986155844251, |
| "learning_rate": 3.9999604822044886e-05, |
| "loss": 0.3406, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.327778160572052, |
| "step": 680, |
| "valid_targets_mean": 3563.4, |
| "valid_targets_min": 1522 |
| }, |
| { |
| "epoch": 0.7195378151260504, |
| "grad_norm": 0.6470886363287454, |
| "learning_rate": 3.999920690242835e-05, |
| "loss": 0.3288, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.33931905031204224, |
| "step": 685, |
| "valid_targets_mean": 3589.0, |
| "valid_targets_min": 464 |
| }, |
| { |
| "epoch": 0.7247899159663865, |
| "grad_norm": 0.5841030308921137, |
| "learning_rate": 3.999867177331189e-05, |
| "loss": 0.362, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3474075198173523, |
| "step": 690, |
| "valid_targets_mean": 3827.1, |
| "valid_targets_min": 1003 |
| }, |
| { |
| "epoch": 0.7300420168067226, |
| "grad_norm": 0.6944347153816217, |
| "learning_rate": 3.9997999438366895e-05, |
| "loss": 0.3424, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.36091533303260803, |
| "step": 695, |
| "valid_targets_mean": 3042.1, |
| "valid_targets_min": 1446 |
| }, |
| { |
| "epoch": 0.7352941176470589, |
| "grad_norm": 0.6583742822611474, |
| "learning_rate": 3.9997189902206065e-05, |
| "loss": 0.3494, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3591790199279785, |
| "step": 700, |
| "valid_targets_mean": 3257.8, |
| "valid_targets_min": 1256 |
| }, |
| { |
| "epoch": 0.740546218487395, |
| "grad_norm": 0.6796220489697876, |
| "learning_rate": 3.999624317038344e-05, |
| "loss": 0.3623, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3584475815296173, |
| "step": 705, |
| "valid_targets_mean": 3858.5, |
| "valid_targets_min": 1336 |
| }, |
| { |
| "epoch": 0.7457983193277311, |
| "grad_norm": 0.5779511153503359, |
| "learning_rate": 3.9995159249394303e-05, |
| "loss": 0.3632, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3402530550956726, |
| "step": 710, |
| "valid_targets_mean": 3821.1, |
| "valid_targets_min": 1275 |
| }, |
| { |
| "epoch": 0.7510504201680672, |
| "grad_norm": 0.6920943343973615, |
| "learning_rate": 3.999393814667517e-05, |
| "loss": 0.3394, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.35493505001068115, |
| "step": 715, |
| "valid_targets_mean": 2914.6, |
| "valid_targets_min": 644 |
| }, |
| { |
| "epoch": 0.7563025210084033, |
| "grad_norm": 0.6484863168026516, |
| "learning_rate": 3.9992579870603695e-05, |
| "loss": 0.336, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3329768478870392, |
| "step": 720, |
| "valid_targets_mean": 3083.4, |
| "valid_targets_min": 1397 |
| }, |
| { |
| "epoch": 0.7615546218487395, |
| "grad_norm": 0.7459309224625077, |
| "learning_rate": 3.999108443049869e-05, |
| "loss": 0.3408, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.35886648297309875, |
| "step": 725, |
| "valid_targets_mean": 2747.4, |
| "valid_targets_min": 1557 |
| }, |
| { |
| "epoch": 0.7668067226890757, |
| "grad_norm": 0.6643965239188359, |
| "learning_rate": 3.998945183661997e-05, |
| "loss": 0.3442, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3370826840400696, |
| "step": 730, |
| "valid_targets_mean": 3405.2, |
| "valid_targets_min": 1405 |
| }, |
| { |
| "epoch": 0.7720588235294118, |
| "grad_norm": 0.6311941065520537, |
| "learning_rate": 3.9987682100168376e-05, |
| "loss": 0.3432, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.32585620880126953, |
| "step": 735, |
| "valid_targets_mean": 3507.1, |
| "valid_targets_min": 1042 |
| }, |
| { |
| "epoch": 0.7773109243697479, |
| "grad_norm": 0.6934056789740213, |
| "learning_rate": 3.99857752332856e-05, |
| "loss": 0.3318, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3426210284233093, |
| "step": 740, |
| "valid_targets_mean": 3079.7, |
| "valid_targets_min": 858 |
| }, |
| { |
| "epoch": 0.782563025210084, |
| "grad_norm": 0.6683294329205226, |
| "learning_rate": 3.998373124905418e-05, |
| "loss": 0.3404, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3405384421348572, |
| "step": 745, |
| "valid_targets_mean": 2934.3, |
| "valid_targets_min": 1288 |
| }, |
| { |
| "epoch": 0.7878151260504201, |
| "grad_norm": 0.6089870902503931, |
| "learning_rate": 3.9981550161497375e-05, |
| "loss": 0.36, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3385617136955261, |
| "step": 750, |
| "valid_targets_mean": 3428.2, |
| "valid_targets_min": 1915 |
| }, |
| { |
| "epoch": 0.7930672268907563, |
| "grad_norm": 0.6028162675947055, |
| "learning_rate": 3.9979231985579074e-05, |
| "loss": 0.3484, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3657104969024658, |
| "step": 755, |
| "valid_targets_mean": 3764.9, |
| "valid_targets_min": 1244 |
| }, |
| { |
| "epoch": 0.7983193277310925, |
| "grad_norm": 0.7017817313652911, |
| "learning_rate": 3.99767767372037e-05, |
| "loss": 0.3304, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.33708494901657104, |
| "step": 760, |
| "valid_targets_mean": 3006.5, |
| "valid_targets_min": 1255 |
| }, |
| { |
| "epoch": 0.8035714285714286, |
| "grad_norm": 0.6788931537841902, |
| "learning_rate": 3.997418443321609e-05, |
| "loss": 0.3478, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3829076290130615, |
| "step": 765, |
| "valid_targets_mean": 3326.2, |
| "valid_targets_min": 1586 |
| }, |
| { |
| "epoch": 0.8088235294117647, |
| "grad_norm": 0.6396470227937194, |
| "learning_rate": 3.997145509140138e-05, |
| "loss": 0.3451, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3249973654747009, |
| "step": 770, |
| "valid_targets_mean": 3205.2, |
| "valid_targets_min": 1181 |
| }, |
| { |
| "epoch": 0.8140756302521008, |
| "grad_norm": 0.6959358945807129, |
| "learning_rate": 3.9968588730484896e-05, |
| "loss": 0.3302, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.35094955563545227, |
| "step": 775, |
| "valid_targets_mean": 2735.1, |
| "valid_targets_min": 974 |
| }, |
| { |
| "epoch": 0.819327731092437, |
| "grad_norm": 0.7121078872001974, |
| "learning_rate": 3.9965585370132013e-05, |
| "loss": 0.3355, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3337578773498535, |
| "step": 780, |
| "valid_targets_mean": 3735.8, |
| "valid_targets_min": 1681 |
| }, |
| { |
| "epoch": 0.8245798319327731, |
| "grad_norm": 0.731579949310607, |
| "learning_rate": 3.996244503094804e-05, |
| "loss": 0.3497, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.37752842903137207, |
| "step": 785, |
| "valid_targets_mean": 2883.7, |
| "valid_targets_min": 1171 |
| }, |
| { |
| "epoch": 0.8298319327731093, |
| "grad_norm": 0.6650190290860145, |
| "learning_rate": 3.995916773447804e-05, |
| "loss": 0.3574, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3751668930053711, |
| "step": 790, |
| "valid_targets_mean": 3324.1, |
| "valid_targets_min": 1455 |
| }, |
| { |
| "epoch": 0.8350840336134454, |
| "grad_norm": 0.6084187992006697, |
| "learning_rate": 3.995575350320671e-05, |
| "loss": 0.3363, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3428555428981781, |
| "step": 795, |
| "valid_targets_mean": 3948.6, |
| "valid_targets_min": 1529 |
| }, |
| { |
| "epoch": 0.8403361344537815, |
| "grad_norm": 0.6734592462466594, |
| "learning_rate": 3.995220236055824e-05, |
| "loss": 0.3662, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.36074283719062805, |
| "step": 800, |
| "valid_targets_mean": 3419.9, |
| "valid_targets_min": 1450 |
| }, |
| { |
| "epoch": 0.8455882352941176, |
| "grad_norm": 0.5774931076226504, |
| "learning_rate": 3.99485143308961e-05, |
| "loss": 0.3351, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3051412105560303, |
| "step": 805, |
| "valid_targets_mean": 3465.6, |
| "valid_targets_min": 1431 |
| }, |
| { |
| "epoch": 0.8508403361344538, |
| "grad_norm": 0.8400200119736569, |
| "learning_rate": 3.994468943952296e-05, |
| "loss": 0.3546, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.35333842039108276, |
| "step": 810, |
| "valid_targets_mean": 3085.4, |
| "valid_targets_min": 802 |
| }, |
| { |
| "epoch": 0.8560924369747899, |
| "grad_norm": 0.6336110237839332, |
| "learning_rate": 3.994072771268041e-05, |
| "loss": 0.362, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.347425639629364, |
| "step": 815, |
| "valid_targets_mean": 3230.6, |
| "valid_targets_min": 1433 |
| }, |
| { |
| "epoch": 0.8613445378151261, |
| "grad_norm": 0.6958422384825939, |
| "learning_rate": 3.993662917754885e-05, |
| "loss": 0.3478, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.35881751775741577, |
| "step": 820, |
| "valid_targets_mean": 2908.7, |
| "valid_targets_min": 614 |
| }, |
| { |
| "epoch": 0.8665966386554622, |
| "grad_norm": 0.7411583695170622, |
| "learning_rate": 3.993239386224732e-05, |
| "loss": 0.3536, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3721003532409668, |
| "step": 825, |
| "valid_targets_mean": 2748.8, |
| "valid_targets_min": 637 |
| }, |
| { |
| "epoch": 0.8718487394957983, |
| "grad_norm": 0.63511436606181, |
| "learning_rate": 3.992802179583322e-05, |
| "loss": 0.3513, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3608887195587158, |
| "step": 830, |
| "valid_targets_mean": 3297.7, |
| "valid_targets_min": 1683 |
| }, |
| { |
| "epoch": 0.8771008403361344, |
| "grad_norm": 0.6522816701659483, |
| "learning_rate": 3.9923513008302204e-05, |
| "loss": 0.3484, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.32889869809150696, |
| "step": 835, |
| "valid_targets_mean": 3406.1, |
| "valid_targets_min": 1913 |
| }, |
| { |
| "epoch": 0.8823529411764706, |
| "grad_norm": 0.5886512960386365, |
| "learning_rate": 3.991886753058792e-05, |
| "loss": 0.3322, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.32120782136917114, |
| "step": 840, |
| "valid_targets_mean": 3848.1, |
| "valid_targets_min": 1659 |
| }, |
| { |
| "epoch": 0.8876050420168067, |
| "grad_norm": 0.6037677731592493, |
| "learning_rate": 3.991408539456182e-05, |
| "loss": 0.3476, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.31538859009742737, |
| "step": 845, |
| "valid_targets_mean": 3390.7, |
| "valid_targets_min": 1390 |
| }, |
| { |
| "epoch": 0.8928571428571429, |
| "grad_norm": 0.7282746261851238, |
| "learning_rate": 3.990916663303293e-05, |
| "loss": 0.351, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.4035952389240265, |
| "step": 850, |
| "valid_targets_mean": 3338.5, |
| "valid_targets_min": 611 |
| }, |
| { |
| "epoch": 0.898109243697479, |
| "grad_norm": 0.8755920451444243, |
| "learning_rate": 3.990411127974762e-05, |
| "loss": 0.3411, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3417074978351593, |
| "step": 855, |
| "valid_targets_mean": 3389.6, |
| "valid_targets_min": 1451 |
| }, |
| { |
| "epoch": 0.9033613445378151, |
| "grad_norm": 0.6595337996347566, |
| "learning_rate": 3.989891936938939e-05, |
| "loss": 0.349, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.31698334217071533, |
| "step": 860, |
| "valid_targets_mean": 3097.9, |
| "valid_targets_min": 1459 |
| }, |
| { |
| "epoch": 0.9086134453781513, |
| "grad_norm": 0.7205543746187569, |
| "learning_rate": 3.9893590937578634e-05, |
| "loss": 0.3356, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.37621456384658813, |
| "step": 865, |
| "valid_targets_mean": 2619.4, |
| "valid_targets_min": 999 |
| }, |
| { |
| "epoch": 0.9138655462184874, |
| "grad_norm": 0.5683063041911645, |
| "learning_rate": 3.9888126020872375e-05, |
| "loss": 0.3317, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.31596362590789795, |
| "step": 870, |
| "valid_targets_mean": 3791.2, |
| "valid_targets_min": 1564 |
| }, |
| { |
| "epoch": 0.9191176470588235, |
| "grad_norm": 1.070844790253151, |
| "learning_rate": 3.988252465676401e-05, |
| "loss": 0.3364, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.33733999729156494, |
| "step": 875, |
| "valid_targets_mean": 3223.3, |
| "valid_targets_min": 1233 |
| }, |
| { |
| "epoch": 0.9243697478991597, |
| "grad_norm": 0.637333593228743, |
| "learning_rate": 3.98767868836831e-05, |
| "loss": 0.3193, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3216400146484375, |
| "step": 880, |
| "valid_targets_mean": 3439.2, |
| "valid_targets_min": 1524 |
| }, |
| { |
| "epoch": 0.9296218487394958, |
| "grad_norm": 0.5754820914455384, |
| "learning_rate": 3.987091274099504e-05, |
| "loss": 0.3239, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3149118423461914, |
| "step": 885, |
| "valid_targets_mean": 3744.9, |
| "valid_targets_min": 1375 |
| }, |
| { |
| "epoch": 0.9348739495798319, |
| "grad_norm": 0.6651917315458717, |
| "learning_rate": 3.986490226900084e-05, |
| "loss": 0.3368, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3212442398071289, |
| "step": 890, |
| "valid_targets_mean": 3036.2, |
| "valid_targets_min": 906 |
| }, |
| { |
| "epoch": 0.9401260504201681, |
| "grad_norm": 0.6067258438956236, |
| "learning_rate": 3.985875550893684e-05, |
| "loss": 0.3232, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.30532318353652954, |
| "step": 895, |
| "valid_targets_mean": 3766.5, |
| "valid_targets_min": 1246 |
| }, |
| { |
| "epoch": 0.9453781512605042, |
| "grad_norm": 0.6702408814712129, |
| "learning_rate": 3.9852472502974386e-05, |
| "loss": 0.3288, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3562542498111725, |
| "step": 900, |
| "valid_targets_mean": 3225.9, |
| "valid_targets_min": 1333 |
| }, |
| { |
| "epoch": 0.9506302521008403, |
| "grad_norm": 0.5790810375186305, |
| "learning_rate": 3.984605329421961e-05, |
| "loss": 0.3279, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.32805150747299194, |
| "step": 905, |
| "valid_targets_mean": 3751.3, |
| "valid_targets_min": 2264 |
| }, |
| { |
| "epoch": 0.9558823529411765, |
| "grad_norm": 0.5978703507597435, |
| "learning_rate": 3.983949792671307e-05, |
| "loss": 0.3481, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.347832053899765, |
| "step": 910, |
| "valid_targets_mean": 3505.2, |
| "valid_targets_min": 1454 |
| }, |
| { |
| "epoch": 0.9611344537815126, |
| "grad_norm": 0.624321623961909, |
| "learning_rate": 3.9832806445429486e-05, |
| "loss": 0.3425, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3324778378009796, |
| "step": 915, |
| "valid_targets_mean": 3385.7, |
| "valid_targets_min": 1430 |
| }, |
| { |
| "epoch": 0.9663865546218487, |
| "grad_norm": 0.6245540796780895, |
| "learning_rate": 3.982597889627742e-05, |
| "loss": 0.3348, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.317277729511261, |
| "step": 920, |
| "valid_targets_mean": 3201.6, |
| "valid_targets_min": 1433 |
| }, |
| { |
| "epoch": 0.9716386554621849, |
| "grad_norm": 0.6175278753890704, |
| "learning_rate": 3.981901532609896e-05, |
| "loss": 0.3239, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.32414883375167847, |
| "step": 925, |
| "valid_targets_mean": 3362.1, |
| "valid_targets_min": 1512 |
| }, |
| { |
| "epoch": 0.976890756302521, |
| "grad_norm": 0.6165488317026186, |
| "learning_rate": 3.9811915782669406e-05, |
| "loss": 0.3298, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.31244921684265137, |
| "step": 930, |
| "valid_targets_mean": 3643.9, |
| "valid_targets_min": 2048 |
| }, |
| { |
| "epoch": 0.9821428571428571, |
| "grad_norm": 0.6227928286121143, |
| "learning_rate": 3.980468031469691e-05, |
| "loss": 0.3463, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3477458953857422, |
| "step": 935, |
| "valid_targets_mean": 3107.1, |
| "valid_targets_min": 815 |
| }, |
| { |
| "epoch": 0.9873949579831933, |
| "grad_norm": 0.6175153136159267, |
| "learning_rate": 3.9797308971822206e-05, |
| "loss": 0.3446, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3596673607826233, |
| "step": 940, |
| "valid_targets_mean": 3339.4, |
| "valid_targets_min": 1878 |
| }, |
| { |
| "epoch": 0.9926470588235294, |
| "grad_norm": 0.6173093585223963, |
| "learning_rate": 3.978980180461821e-05, |
| "loss": 0.3367, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.33542400598526, |
| "step": 945, |
| "valid_targets_mean": 3394.6, |
| "valid_targets_min": 1727 |
| }, |
| { |
| "epoch": 0.9978991596638656, |
| "grad_norm": 0.6354828168457491, |
| "learning_rate": 3.9782158864589696e-05, |
| "loss": 0.3261, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3046625554561615, |
| "step": 950, |
| "valid_targets_mean": 2924.3, |
| "valid_targets_min": 1622 |
| }, |
| { |
| "epoch": 1.0031512605042017, |
| "grad_norm": 1.3016888810382736, |
| "learning_rate": 3.977438020417293e-05, |
| "loss": 0.3059, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2962370216846466, |
| "step": 955, |
| "valid_targets_mean": 1587.9, |
| "valid_targets_min": 788 |
| }, |
| { |
| "epoch": 1.0084033613445378, |
| "grad_norm": 1.178432388446946, |
| "learning_rate": 3.9766465876735354e-05, |
| "loss": 0.2533, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.23576419055461884, |
| "step": 960, |
| "valid_targets_mean": 1591.2, |
| "valid_targets_min": 957 |
| }, |
| { |
| "epoch": 1.013655462184874, |
| "grad_norm": 0.9417299138332059, |
| "learning_rate": 3.9758415936575155e-05, |
| "loss": 0.2443, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.23771171271800995, |
| "step": 965, |
| "valid_targets_mean": 1418.7, |
| "valid_targets_min": 796 |
| }, |
| { |
| "epoch": 1.01890756302521, |
| "grad_norm": 0.9391474883661355, |
| "learning_rate": 3.975023043892094e-05, |
| "loss": 0.2429, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.23540674149990082, |
| "step": 970, |
| "valid_targets_mean": 1389.0, |
| "valid_targets_min": 704 |
| }, |
| { |
| "epoch": 1.0241596638655461, |
| "grad_norm": 0.8489834118982603, |
| "learning_rate": 3.974190943993133e-05, |
| "loss": 0.2363, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.221901997923851, |
| "step": 975, |
| "valid_targets_mean": 1513.9, |
| "valid_targets_min": 638 |
| }, |
| { |
| "epoch": 1.0294117647058822, |
| "grad_norm": 0.830262362849459, |
| "learning_rate": 3.973345299669461e-05, |
| "loss": 0.2401, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.23195049166679382, |
| "step": 980, |
| "valid_targets_mean": 1482.3, |
| "valid_targets_min": 727 |
| }, |
| { |
| "epoch": 1.0346638655462186, |
| "grad_norm": 0.8915461834880904, |
| "learning_rate": 3.972486116722828e-05, |
| "loss": 0.2468, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.208994060754776, |
| "step": 985, |
| "valid_targets_mean": 1189.1, |
| "valid_targets_min": 655 |
| }, |
| { |
| "epoch": 1.0399159663865547, |
| "grad_norm": 0.9988345647892146, |
| "learning_rate": 3.971613401047872e-05, |
| "loss": 0.2285, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2332269549369812, |
| "step": 990, |
| "valid_targets_mean": 1299.6, |
| "valid_targets_min": 714 |
| }, |
| { |
| "epoch": 1.0451680672268908, |
| "grad_norm": 0.8523206270419763, |
| "learning_rate": 3.970727158632075e-05, |
| "loss": 0.2491, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.23563072085380554, |
| "step": 995, |
| "valid_targets_mean": 1407.6, |
| "valid_targets_min": 741 |
| }, |
| { |
| "epoch": 1.050420168067227, |
| "grad_norm": 1.0576241067376564, |
| "learning_rate": 3.969827395555721e-05, |
| "loss": 0.235, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2590252757072449, |
| "step": 1000, |
| "valid_targets_mean": 1544.1, |
| "valid_targets_min": 663 |
| }, |
| { |
| "epoch": 1.055672268907563, |
| "grad_norm": 1.1458471492556306, |
| "learning_rate": 3.968914117991857e-05, |
| "loss": 0.2286, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.230397567152977, |
| "step": 1005, |
| "valid_targets_mean": 1511.1, |
| "valid_targets_min": 632 |
| }, |
| { |
| "epoch": 1.0609243697478992, |
| "grad_norm": 0.9006777040659446, |
| "learning_rate": 3.967987332206249e-05, |
| "loss": 0.2396, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2451692819595337, |
| "step": 1010, |
| "valid_targets_mean": 1638.0, |
| "valid_targets_min": 933 |
| }, |
| { |
| "epoch": 1.0661764705882353, |
| "grad_norm": 0.7626623690643839, |
| "learning_rate": 3.967047044557341e-05, |
| "loss": 0.2329, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.22060266137123108, |
| "step": 1015, |
| "valid_targets_mean": 1526.9, |
| "valid_targets_min": 717 |
| }, |
| { |
| "epoch": 1.0714285714285714, |
| "grad_norm": 0.8215685697177867, |
| "learning_rate": 3.966093261496208e-05, |
| "loss": 0.2217, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2275817096233368, |
| "step": 1020, |
| "valid_targets_mean": 1387.4, |
| "valid_targets_min": 659 |
| }, |
| { |
| "epoch": 1.0766806722689075, |
| "grad_norm": 0.8698242331020952, |
| "learning_rate": 3.9651259895665146e-05, |
| "loss": 0.2212, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2096673548221588, |
| "step": 1025, |
| "valid_targets_mean": 1382.9, |
| "valid_targets_min": 642 |
| }, |
| { |
| "epoch": 1.0819327731092436, |
| "grad_norm": 0.768616027752401, |
| "learning_rate": 3.9641452354044687e-05, |
| "loss": 0.2263, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.20485013723373413, |
| "step": 1030, |
| "valid_targets_mean": 1312.1, |
| "valid_targets_min": 765 |
| }, |
| { |
| "epoch": 1.0871848739495797, |
| "grad_norm": 0.8590772693317404, |
| "learning_rate": 3.9631510057387765e-05, |
| "loss": 0.2403, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.24823632836341858, |
| "step": 1035, |
| "valid_targets_mean": 1397.6, |
| "valid_targets_min": 631 |
| }, |
| { |
| "epoch": 1.092436974789916, |
| "grad_norm": 0.9234663166300711, |
| "learning_rate": 3.962143307390596e-05, |
| "loss": 0.236, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2525438666343689, |
| "step": 1040, |
| "valid_targets_mean": 1419.4, |
| "valid_targets_min": 623 |
| }, |
| { |
| "epoch": 1.0976890756302522, |
| "grad_norm": 0.7428187089700554, |
| "learning_rate": 3.961122147273491e-05, |
| "loss": 0.2362, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.24657368659973145, |
| "step": 1045, |
| "valid_targets_mean": 1647.7, |
| "valid_targets_min": 818 |
| }, |
| { |
| "epoch": 1.1029411764705883, |
| "grad_norm": 0.7835107757413885, |
| "learning_rate": 3.9600875323933826e-05, |
| "loss": 0.2294, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.21424023807048798, |
| "step": 1050, |
| "valid_targets_mean": 1545.5, |
| "valid_targets_min": 776 |
| }, |
| { |
| "epoch": 1.1081932773109244, |
| "grad_norm": 0.8623930769993505, |
| "learning_rate": 3.959039469848502e-05, |
| "loss": 0.2274, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2390882670879364, |
| "step": 1055, |
| "valid_targets_mean": 1411.8, |
| "valid_targets_min": 623 |
| }, |
| { |
| "epoch": 1.1134453781512605, |
| "grad_norm": 0.8342187952076956, |
| "learning_rate": 3.9579779668293416e-05, |
| "loss": 0.2341, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.24478605389595032, |
| "step": 1060, |
| "valid_targets_mean": 1437.3, |
| "valid_targets_min": 742 |
| }, |
| { |
| "epoch": 1.1186974789915967, |
| "grad_norm": 0.8716802159762432, |
| "learning_rate": 3.956903030618605e-05, |
| "loss": 0.229, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.21243079006671906, |
| "step": 1065, |
| "valid_targets_mean": 1193.6, |
| "valid_targets_min": 611 |
| }, |
| { |
| "epoch": 1.1239495798319328, |
| "grad_norm": 0.8276094439043256, |
| "learning_rate": 3.955814668591156e-05, |
| "loss": 0.221, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2292919009923935, |
| "step": 1070, |
| "valid_targets_mean": 1514.0, |
| "valid_targets_min": 793 |
| }, |
| { |
| "epoch": 1.129201680672269, |
| "grad_norm": 0.8269530258415205, |
| "learning_rate": 3.9547128882139735e-05, |
| "loss": 0.2218, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2063109278678894, |
| "step": 1075, |
| "valid_targets_mean": 1379.1, |
| "valid_targets_min": 886 |
| }, |
| { |
| "epoch": 1.134453781512605, |
| "grad_norm": 0.7349504784818733, |
| "learning_rate": 3.9535976970460925e-05, |
| "loss": 0.222, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2086534947156906, |
| "step": 1080, |
| "valid_targets_mean": 1455.5, |
| "valid_targets_min": 991 |
| }, |
| { |
| "epoch": 1.1397058823529411, |
| "grad_norm": 0.7910940364262357, |
| "learning_rate": 3.9524691027385585e-05, |
| "loss": 0.2244, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.22840695083141327, |
| "step": 1085, |
| "valid_targets_mean": 1525.2, |
| "valid_targets_min": 908 |
| }, |
| { |
| "epoch": 1.1449579831932772, |
| "grad_norm": 0.9125068091813882, |
| "learning_rate": 3.95132711303437e-05, |
| "loss": 0.234, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.23359861969947815, |
| "step": 1090, |
| "valid_targets_mean": 1476.6, |
| "valid_targets_min": 680 |
| }, |
| { |
| "epoch": 1.1502100840336134, |
| "grad_norm": 0.7517080972876787, |
| "learning_rate": 3.9501717357684315e-05, |
| "loss": 0.2138, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.22301185131072998, |
| "step": 1095, |
| "valid_targets_mean": 1467.1, |
| "valid_targets_min": 803 |
| }, |
| { |
| "epoch": 1.1554621848739495, |
| "grad_norm": 0.8187151581180054, |
| "learning_rate": 3.9490029788674934e-05, |
| "loss": 0.224, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.22149021923542023, |
| "step": 1100, |
| "valid_targets_mean": 1341.3, |
| "valid_targets_min": 765 |
| }, |
| { |
| "epoch": 1.1607142857142858, |
| "grad_norm": 0.7811554150228613, |
| "learning_rate": 3.9478208503501e-05, |
| "loss": 0.2245, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.23048382997512817, |
| "step": 1105, |
| "valid_targets_mean": 1556.4, |
| "valid_targets_min": 804 |
| }, |
| { |
| "epoch": 1.165966386554622, |
| "grad_norm": 0.8232786153715305, |
| "learning_rate": 3.946625358326538e-05, |
| "loss": 0.2278, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.24594677984714508, |
| "step": 1110, |
| "valid_targets_mean": 1509.7, |
| "valid_targets_min": 675 |
| }, |
| { |
| "epoch": 1.171218487394958, |
| "grad_norm": 0.7583404192175697, |
| "learning_rate": 3.945416510998775e-05, |
| "loss": 0.2165, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.229123055934906, |
| "step": 1115, |
| "valid_targets_mean": 1408.4, |
| "valid_targets_min": 882 |
| }, |
| { |
| "epoch": 1.1764705882352942, |
| "grad_norm": 0.7798738937206717, |
| "learning_rate": 3.944194316660406e-05, |
| "loss": 0.216, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.20927229523658752, |
| "step": 1120, |
| "valid_targets_mean": 1449.8, |
| "valid_targets_min": 660 |
| }, |
| { |
| "epoch": 1.1817226890756303, |
| "grad_norm": 0.7782369720225292, |
| "learning_rate": 3.942958783696598e-05, |
| "loss": 0.205, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.21136952936649323, |
| "step": 1125, |
| "valid_targets_mean": 1489.8, |
| "valid_targets_min": 678 |
| }, |
| { |
| "epoch": 1.1869747899159664, |
| "grad_norm": 0.8389164365291358, |
| "learning_rate": 3.94170992058403e-05, |
| "loss": 0.2194, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2247747778892517, |
| "step": 1130, |
| "valid_targets_mean": 1379.1, |
| "valid_targets_min": 676 |
| }, |
| { |
| "epoch": 1.1922268907563025, |
| "grad_norm": 0.85218432627087, |
| "learning_rate": 3.9404477358908354e-05, |
| "loss": 0.2185, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.20599870383739471, |
| "step": 1135, |
| "valid_targets_mean": 1347.1, |
| "valid_targets_min": 794 |
| }, |
| { |
| "epoch": 1.1974789915966386, |
| "grad_norm": 0.7736857874589698, |
| "learning_rate": 3.9391722382765445e-05, |
| "loss": 0.2194, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2081984579563141, |
| "step": 1140, |
| "valid_targets_mean": 1372.6, |
| "valid_targets_min": 607 |
| }, |
| { |
| "epoch": 1.2027310924369747, |
| "grad_norm": 0.8143324846381077, |
| "learning_rate": 3.937883436492025e-05, |
| "loss": 0.2181, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.210773304104805, |
| "step": 1145, |
| "valid_targets_mean": 1323.6, |
| "valid_targets_min": 722 |
| }, |
| { |
| "epoch": 1.2079831932773109, |
| "grad_norm": 0.8168389117740881, |
| "learning_rate": 3.9365813393794186e-05, |
| "loss": 0.2306, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2400819957256317, |
| "step": 1150, |
| "valid_targets_mean": 1597.7, |
| "valid_targets_min": 858 |
| }, |
| { |
| "epoch": 1.213235294117647, |
| "grad_norm": 0.798484953443434, |
| "learning_rate": 3.9352659558720836e-05, |
| "loss": 0.2018, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.19974064826965332, |
| "step": 1155, |
| "valid_targets_mean": 1270.8, |
| "valid_targets_min": 689 |
| }, |
| { |
| "epoch": 1.2184873949579833, |
| "grad_norm": 0.7597271913919195, |
| "learning_rate": 3.933937294994535e-05, |
| "loss": 0.2306, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.22933819890022278, |
| "step": 1160, |
| "valid_targets_mean": 1388.2, |
| "valid_targets_min": 692 |
| }, |
| { |
| "epoch": 1.2237394957983194, |
| "grad_norm": 0.7412896199433119, |
| "learning_rate": 3.932595365862379e-05, |
| "loss": 0.2194, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2073134481906891, |
| "step": 1165, |
| "valid_targets_mean": 1447.2, |
| "valid_targets_min": 828 |
| }, |
| { |
| "epoch": 1.2289915966386555, |
| "grad_norm": 0.8029587259024663, |
| "learning_rate": 3.9312401776822504e-05, |
| "loss": 0.235, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.22155123949050903, |
| "step": 1170, |
| "valid_targets_mean": 1399.7, |
| "valid_targets_min": 618 |
| }, |
| { |
| "epoch": 1.2342436974789917, |
| "grad_norm": 0.753092266372571, |
| "learning_rate": 3.9298717397517546e-05, |
| "loss": 0.2104, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.20688486099243164, |
| "step": 1175, |
| "valid_targets_mean": 1454.3, |
| "valid_targets_min": 629 |
| }, |
| { |
| "epoch": 1.2394957983193278, |
| "grad_norm": 0.7552069088401491, |
| "learning_rate": 3.928490061459396e-05, |
| "loss": 0.2193, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2513880133628845, |
| "step": 1180, |
| "valid_targets_mean": 1746.1, |
| "valid_targets_min": 1071 |
| }, |
| { |
| "epoch": 1.2447478991596639, |
| "grad_norm": 0.7724105286503384, |
| "learning_rate": 3.927095152284521e-05, |
| "loss": 0.2215, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2342674434185028, |
| "step": 1185, |
| "valid_targets_mean": 1282.2, |
| "valid_targets_min": 677 |
| }, |
| { |
| "epoch": 1.25, |
| "grad_norm": 0.8255573649270425, |
| "learning_rate": 3.925687021797249e-05, |
| "loss": 0.2124, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.19916367530822754, |
| "step": 1190, |
| "valid_targets_mean": 1227.6, |
| "valid_targets_min": 679 |
| }, |
| { |
| "epoch": 1.2552521008403361, |
| "grad_norm": 0.7348173616246707, |
| "learning_rate": 3.924265679658407e-05, |
| "loss": 0.2127, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.20118603110313416, |
| "step": 1195, |
| "valid_targets_mean": 1319.1, |
| "valid_targets_min": 504 |
| }, |
| { |
| "epoch": 1.2605042016806722, |
| "grad_norm": 0.7536987070404887, |
| "learning_rate": 3.922831135619462e-05, |
| "loss": 0.2161, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.20859253406524658, |
| "step": 1200, |
| "valid_targets_mean": 1616.5, |
| "valid_targets_min": 1023 |
| }, |
| { |
| "epoch": 1.2657563025210083, |
| "grad_norm": 0.7577745081343713, |
| "learning_rate": 3.9213833995224605e-05, |
| "loss": 0.2203, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2004815638065338, |
| "step": 1205, |
| "valid_targets_mean": 1453.0, |
| "valid_targets_min": 661 |
| }, |
| { |
| "epoch": 1.2710084033613445, |
| "grad_norm": 0.7784879343054987, |
| "learning_rate": 3.919922481299952e-05, |
| "loss": 0.222, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.21279674768447876, |
| "step": 1210, |
| "valid_targets_mean": 1442.0, |
| "valid_targets_min": 889 |
| }, |
| { |
| "epoch": 1.2762605042016806, |
| "grad_norm": 0.7318237431101263, |
| "learning_rate": 3.918448390974928e-05, |
| "loss": 0.2088, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.20114900171756744, |
| "step": 1215, |
| "valid_targets_mean": 1548.4, |
| "valid_targets_min": 723 |
| }, |
| { |
| "epoch": 1.2815126050420167, |
| "grad_norm": 0.8439347277266402, |
| "learning_rate": 3.9169611386607476e-05, |
| "loss": 0.2142, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.20195883512496948, |
| "step": 1220, |
| "valid_targets_mean": 1359.8, |
| "valid_targets_min": 793 |
| }, |
| { |
| "epoch": 1.2867647058823528, |
| "grad_norm": 0.7840655198861911, |
| "learning_rate": 3.9154607345610746e-05, |
| "loss": 0.2145, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.22591176629066467, |
| "step": 1225, |
| "valid_targets_mean": 1478.6, |
| "valid_targets_min": 861 |
| }, |
| { |
| "epoch": 1.2920168067226891, |
| "grad_norm": 0.7776629349610283, |
| "learning_rate": 3.913947188969801e-05, |
| "loss": 0.2065, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.19768911600112915, |
| "step": 1230, |
| "valid_targets_mean": 1332.7, |
| "valid_targets_min": 752 |
| }, |
| { |
| "epoch": 1.2972689075630253, |
| "grad_norm": 0.7729134790563235, |
| "learning_rate": 3.912420512270981e-05, |
| "loss": 0.2142, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2305484265089035, |
| "step": 1235, |
| "valid_targets_mean": 1622.7, |
| "valid_targets_min": 789 |
| }, |
| { |
| "epoch": 1.3025210084033614, |
| "grad_norm": 0.8616431181942282, |
| "learning_rate": 3.910880714938757e-05, |
| "loss": 0.1921, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1932060420513153, |
| "step": 1240, |
| "valid_targets_mean": 1195.4, |
| "valid_targets_min": 567 |
| }, |
| { |
| "epoch": 1.3077731092436975, |
| "grad_norm": 0.7695069319629071, |
| "learning_rate": 3.909327807537288e-05, |
| "loss": 0.213, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.232661634683609, |
| "step": 1245, |
| "valid_targets_mean": 1504.5, |
| "valid_targets_min": 605 |
| }, |
| { |
| "epoch": 1.3130252100840336, |
| "grad_norm": 0.7113969327868939, |
| "learning_rate": 3.90776180072068e-05, |
| "loss": 0.2116, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.20750564336776733, |
| "step": 1250, |
| "valid_targets_mean": 1580.1, |
| "valid_targets_min": 746 |
| }, |
| { |
| "epoch": 1.3182773109243697, |
| "grad_norm": 0.7945153800878063, |
| "learning_rate": 3.906182705232909e-05, |
| "loss": 0.1997, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.20195449888706207, |
| "step": 1255, |
| "valid_targets_mean": 1158.2, |
| "valid_targets_min": 723 |
| }, |
| { |
| "epoch": 1.3235294117647058, |
| "grad_norm": 0.7587646804913716, |
| "learning_rate": 3.904590531907751e-05, |
| "loss": 0.2159, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.21249453723430634, |
| "step": 1260, |
| "valid_targets_mean": 1430.4, |
| "valid_targets_min": 855 |
| }, |
| { |
| "epoch": 1.328781512605042, |
| "grad_norm": 0.7185755186164045, |
| "learning_rate": 3.9029852916687034e-05, |
| "loss": 0.2103, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2006302922964096, |
| "step": 1265, |
| "valid_targets_mean": 1590.4, |
| "valid_targets_min": 902 |
| }, |
| { |
| "epoch": 1.334033613445378, |
| "grad_norm": 0.7257232800212272, |
| "learning_rate": 3.9013669955289136e-05, |
| "loss": 0.2135, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.20573708415031433, |
| "step": 1270, |
| "valid_targets_mean": 1521.5, |
| "valid_targets_min": 803 |
| }, |
| { |
| "epoch": 1.3392857142857144, |
| "grad_norm": 0.7974748283202712, |
| "learning_rate": 3.899735654591101e-05, |
| "loss": 0.21, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.22591374814510345, |
| "step": 1275, |
| "valid_targets_mean": 1455.2, |
| "valid_targets_min": 740 |
| }, |
| { |
| "epoch": 1.3445378151260505, |
| "grad_norm": 0.8433766016494005, |
| "learning_rate": 3.898091280047486e-05, |
| "loss": 0.207, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.20434291660785675, |
| "step": 1280, |
| "valid_targets_mean": 1279.4, |
| "valid_targets_min": 244 |
| }, |
| { |
| "epoch": 1.3497899159663866, |
| "grad_norm": 0.7810238280537369, |
| "learning_rate": 3.896433883179703e-05, |
| "loss": 0.2212, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.22051532566547394, |
| "step": 1285, |
| "valid_targets_mean": 1366.9, |
| "valid_targets_min": 714 |
| }, |
| { |
| "epoch": 1.3550420168067228, |
| "grad_norm": 0.9021667080271751, |
| "learning_rate": 3.894763475358736e-05, |
| "loss": 0.2124, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.19154158234596252, |
| "step": 1290, |
| "valid_targets_mean": 1220.5, |
| "valid_targets_min": 585 |
| }, |
| { |
| "epoch": 1.3602941176470589, |
| "grad_norm": 0.8197315751887221, |
| "learning_rate": 3.8930800680448275e-05, |
| "loss": 0.2202, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.230904221534729, |
| "step": 1295, |
| "valid_targets_mean": 1596.4, |
| "valid_targets_min": 1041 |
| }, |
| { |
| "epoch": 1.365546218487395, |
| "grad_norm": 0.7275089472098615, |
| "learning_rate": 3.891383672787411e-05, |
| "loss": 0.2138, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.20911553502082825, |
| "step": 1300, |
| "valid_targets_mean": 1401.3, |
| "valid_targets_min": 777 |
| }, |
| { |
| "epoch": 1.370798319327731, |
| "grad_norm": 0.7376318715306975, |
| "learning_rate": 3.889674301225025e-05, |
| "loss": 0.2162, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.19725364446640015, |
| "step": 1305, |
| "valid_targets_mean": 1546.8, |
| "valid_targets_min": 959 |
| }, |
| { |
| "epoch": 1.3760504201680672, |
| "grad_norm": 0.7408476899885955, |
| "learning_rate": 3.8879519650852356e-05, |
| "loss": 0.2053, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18753978610038757, |
| "step": 1310, |
| "valid_targets_mean": 1284.4, |
| "valid_targets_min": 620 |
| }, |
| { |
| "epoch": 1.3813025210084033, |
| "grad_norm": 0.7266684151521309, |
| "learning_rate": 3.886216676184555e-05, |
| "loss": 0.214, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.20051538944244385, |
| "step": 1315, |
| "valid_targets_mean": 1356.6, |
| "valid_targets_min": 656 |
| }, |
| { |
| "epoch": 1.3865546218487395, |
| "grad_norm": 0.7791953600527686, |
| "learning_rate": 3.8844684464283614e-05, |
| "loss": 0.2158, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.23191730678081512, |
| "step": 1320, |
| "valid_targets_mean": 1564.5, |
| "valid_targets_min": 697 |
| }, |
| { |
| "epoch": 1.3918067226890756, |
| "grad_norm": 0.6803022151794903, |
| "learning_rate": 3.882707287810817e-05, |
| "loss": 0.2039, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.20292726159095764, |
| "step": 1325, |
| "valid_targets_mean": 1604.7, |
| "valid_targets_min": 682 |
| }, |
| { |
| "epoch": 1.3970588235294117, |
| "grad_norm": 0.7109648477839206, |
| "learning_rate": 3.880933212414786e-05, |
| "loss": 0.2064, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.19687709212303162, |
| "step": 1330, |
| "valid_targets_mean": 1383.4, |
| "valid_targets_min": 730 |
| }, |
| { |
| "epoch": 1.4023109243697478, |
| "grad_norm": 0.7636435446308724, |
| "learning_rate": 3.87914623241175e-05, |
| "loss": 0.1977, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.19838300347328186, |
| "step": 1335, |
| "valid_targets_mean": 1482.5, |
| "valid_targets_min": 747 |
| }, |
| { |
| "epoch": 1.407563025210084, |
| "grad_norm": 0.7790600366170161, |
| "learning_rate": 3.877346360061728e-05, |
| "loss": 0.2213, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.20176908373832703, |
| "step": 1340, |
| "valid_targets_mean": 1603.6, |
| "valid_targets_min": 933 |
| }, |
| { |
| "epoch": 1.41281512605042, |
| "grad_norm": 0.7307120382472138, |
| "learning_rate": 3.8755336077131894e-05, |
| "loss": 0.2052, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.19978278875350952, |
| "step": 1345, |
| "valid_targets_mean": 1517.9, |
| "valid_targets_min": 799 |
| }, |
| { |
| "epoch": 1.4180672268907564, |
| "grad_norm": 0.7009558460825884, |
| "learning_rate": 3.873707987802967e-05, |
| "loss": 0.2027, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.20674484968185425, |
| "step": 1350, |
| "valid_targets_mean": 1516.2, |
| "valid_targets_min": 909 |
| }, |
| { |
| "epoch": 1.4233193277310925, |
| "grad_norm": 0.6935543353633367, |
| "learning_rate": 3.871869512856179e-05, |
| "loss": 0.1965, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.19707924127578735, |
| "step": 1355, |
| "valid_targets_mean": 1606.8, |
| "valid_targets_min": 741 |
| }, |
| { |
| "epoch": 1.4285714285714286, |
| "grad_norm": 0.7721082945840706, |
| "learning_rate": 3.870018195486138e-05, |
| "loss": 0.1903, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.20531484484672546, |
| "step": 1360, |
| "valid_targets_mean": 1328.7, |
| "valid_targets_min": 720 |
| }, |
| { |
| "epoch": 1.4338235294117647, |
| "grad_norm": 0.7736104466743927, |
| "learning_rate": 3.868154048394262e-05, |
| "loss": 0.2059, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.201510488986969, |
| "step": 1365, |
| "valid_targets_mean": 1396.2, |
| "valid_targets_min": 610 |
| }, |
| { |
| "epoch": 1.4390756302521008, |
| "grad_norm": 0.7550538776229306, |
| "learning_rate": 3.8662770843699944e-05, |
| "loss": 0.204, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2158433496952057, |
| "step": 1370, |
| "valid_targets_mean": 1352.9, |
| "valid_targets_min": 684 |
| }, |
| { |
| "epoch": 1.444327731092437, |
| "grad_norm": 0.6820026840811728, |
| "learning_rate": 3.8643873162907086e-05, |
| "loss": 0.2009, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.19932374358177185, |
| "step": 1375, |
| "valid_targets_mean": 1479.4, |
| "valid_targets_min": 874 |
| }, |
| { |
| "epoch": 1.449579831932773, |
| "grad_norm": 0.6850687148845401, |
| "learning_rate": 3.862484757121627e-05, |
| "loss": 0.2008, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.19579848647117615, |
| "step": 1380, |
| "valid_targets_mean": 1501.2, |
| "valid_targets_min": 765 |
| }, |
| { |
| "epoch": 1.4548319327731092, |
| "grad_norm": 0.6990618001541059, |
| "learning_rate": 3.860569419915727e-05, |
| "loss": 0.2082, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.20401817560195923, |
| "step": 1385, |
| "valid_targets_mean": 1419.9, |
| "valid_targets_min": 589 |
| }, |
| { |
| "epoch": 1.4600840336134453, |
| "grad_norm": 0.699051470230191, |
| "learning_rate": 3.858641317813653e-05, |
| "loss": 0.2151, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.23287919163703918, |
| "step": 1390, |
| "valid_targets_mean": 1587.2, |
| "valid_targets_min": 918 |
| }, |
| { |
| "epoch": 1.4653361344537816, |
| "grad_norm": 0.5943455101511255, |
| "learning_rate": 3.8567004640436234e-05, |
| "loss": 0.3011, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3295353651046753, |
| "step": 1395, |
| "valid_targets_mean": 3546.9, |
| "valid_targets_min": 702 |
| }, |
| { |
| "epoch": 1.4705882352941178, |
| "grad_norm": 0.570252231140088, |
| "learning_rate": 3.8547468719213476e-05, |
| "loss": 0.3267, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.33764392137527466, |
| "step": 1400, |
| "valid_targets_mean": 4000.6, |
| "valid_targets_min": 1005 |
| }, |
| { |
| "epoch": 1.4758403361344539, |
| "grad_norm": 0.5515303020894601, |
| "learning_rate": 3.852780554849925e-05, |
| "loss": 0.3055, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3034968376159668, |
| "step": 1405, |
| "valid_targets_mean": 4063.9, |
| "valid_targets_min": 1296 |
| }, |
| { |
| "epoch": 1.48109243697479, |
| "grad_norm": 0.5595030961730294, |
| "learning_rate": 3.850801526319761e-05, |
| "loss": 0.3004, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.288005530834198, |
| "step": 1410, |
| "valid_targets_mean": 3747.0, |
| "valid_targets_min": 1561 |
| }, |
| { |
| "epoch": 1.486344537815126, |
| "grad_norm": 0.5948008178131649, |
| "learning_rate": 3.84880979990847e-05, |
| "loss": 0.304, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.32669079303741455, |
| "step": 1415, |
| "valid_targets_mean": 3562.5, |
| "valid_targets_min": 1044 |
| }, |
| { |
| "epoch": 1.4915966386554622, |
| "grad_norm": 0.5216067222057376, |
| "learning_rate": 3.846805389280782e-05, |
| "loss": 0.3154, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2934839725494385, |
| "step": 1420, |
| "valid_targets_mean": 3911.4, |
| "valid_targets_min": 920 |
| }, |
| { |
| "epoch": 1.4968487394957983, |
| "grad_norm": 0.4836038411370819, |
| "learning_rate": 3.844788308188452e-05, |
| "loss": 0.2861, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3024061918258667, |
| "step": 1425, |
| "valid_targets_mean": 5753.8, |
| "valid_targets_min": 2060 |
| }, |
| { |
| "epoch": 1.5021008403361344, |
| "grad_norm": 0.5556606445880677, |
| "learning_rate": 3.8427585704701634e-05, |
| "loss": 0.3043, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.31254953145980835, |
| "step": 1430, |
| "valid_targets_mean": 3728.6, |
| "valid_targets_min": 467 |
| }, |
| { |
| "epoch": 1.5073529411764706, |
| "grad_norm": 0.5895498142754928, |
| "learning_rate": 3.840716190051433e-05, |
| "loss": 0.3141, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.32763177156448364, |
| "step": 1435, |
| "valid_targets_mean": 3554.0, |
| "valid_targets_min": 1689 |
| }, |
| { |
| "epoch": 1.5126050420168067, |
| "grad_norm": 0.54899724482139, |
| "learning_rate": 3.8386611809445155e-05, |
| "loss": 0.3091, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.30432096123695374, |
| "step": 1440, |
| "valid_targets_mean": 3708.1, |
| "valid_targets_min": 1697 |
| }, |
| { |
| "epoch": 1.5178571428571428, |
| "grad_norm": 0.6115854171093719, |
| "learning_rate": 3.8365935572483095e-05, |
| "loss": 0.3162, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3384946882724762, |
| "step": 1445, |
| "valid_targets_mean": 3652.6, |
| "valid_targets_min": 1223 |
| }, |
| { |
| "epoch": 1.523109243697479, |
| "grad_norm": 0.5435695015200867, |
| "learning_rate": 3.834513333148258e-05, |
| "loss": 0.3085, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3052658438682556, |
| "step": 1450, |
| "valid_targets_mean": 4036.1, |
| "valid_targets_min": 1552 |
| }, |
| { |
| "epoch": 1.528361344537815, |
| "grad_norm": 0.614280577128499, |
| "learning_rate": 3.832420522916252e-05, |
| "loss": 0.3084, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.316119909286499, |
| "step": 1455, |
| "valid_targets_mean": 3543.5, |
| "valid_targets_min": 1439 |
| }, |
| { |
| "epoch": 1.5336134453781511, |
| "grad_norm": 0.5885577114747288, |
| "learning_rate": 3.830315140910534e-05, |
| "loss": 0.3058, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.30280590057373047, |
| "step": 1460, |
| "valid_targets_mean": 3287.0, |
| "valid_targets_min": 1402 |
| }, |
| { |
| "epoch": 1.5388655462184873, |
| "grad_norm": 0.6135025188561368, |
| "learning_rate": 3.8281972015755965e-05, |
| "loss": 0.3204, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3206782341003418, |
| "step": 1465, |
| "valid_targets_mean": 3423.9, |
| "valid_targets_min": 1586 |
| }, |
| { |
| "epoch": 1.5441176470588234, |
| "grad_norm": 0.584621502686007, |
| "learning_rate": 3.826066719442086e-05, |
| "loss": 0.3117, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3108097314834595, |
| "step": 1470, |
| "valid_targets_mean": 3406.0, |
| "valid_targets_min": 1538 |
| }, |
| { |
| "epoch": 1.5493697478991597, |
| "grad_norm": 0.6706962593993887, |
| "learning_rate": 3.823923709126701e-05, |
| "loss": 0.3158, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.31825387477874756, |
| "step": 1475, |
| "valid_targets_mean": 2954.0, |
| "valid_targets_min": 1058 |
| }, |
| { |
| "epoch": 1.5546218487394958, |
| "grad_norm": 0.651116388475916, |
| "learning_rate": 3.821768185332095e-05, |
| "loss": 0.3305, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.32802870869636536, |
| "step": 1480, |
| "valid_targets_mean": 3051.8, |
| "valid_targets_min": 1362 |
| }, |
| { |
| "epoch": 1.559873949579832, |
| "grad_norm": 0.5745329146566351, |
| "learning_rate": 3.81960016284677e-05, |
| "loss": 0.3145, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3129153251647949, |
| "step": 1485, |
| "valid_targets_mean": 3620.5, |
| "valid_targets_min": 1392 |
| }, |
| { |
| "epoch": 1.565126050420168, |
| "grad_norm": 0.6580272364249068, |
| "learning_rate": 3.817419656544979e-05, |
| "loss": 0.3154, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3198480010032654, |
| "step": 1490, |
| "valid_targets_mean": 3103.6, |
| "valid_targets_min": 1267 |
| }, |
| { |
| "epoch": 1.5703781512605042, |
| "grad_norm": 0.6033632847231352, |
| "learning_rate": 3.815226681386626e-05, |
| "loss": 0.3079, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3069283664226532, |
| "step": 1495, |
| "valid_targets_mean": 3592.7, |
| "valid_targets_min": 1026 |
| }, |
| { |
| "epoch": 1.5756302521008403, |
| "grad_norm": 0.5732499269923438, |
| "learning_rate": 3.8130212524171576e-05, |
| "loss": 0.2966, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.30469539761543274, |
| "step": 1500, |
| "valid_targets_mean": 3632.1, |
| "valid_targets_min": 1785 |
| }, |
| { |
| "epoch": 1.5808823529411766, |
| "grad_norm": 0.5775861462441018, |
| "learning_rate": 3.810803384767465e-05, |
| "loss": 0.319, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2886812388896942, |
| "step": 1505, |
| "valid_targets_mean": 3557.1, |
| "valid_targets_min": 1957 |
| }, |
| { |
| "epoch": 1.5861344537815127, |
| "grad_norm": 0.5694130410160565, |
| "learning_rate": 3.808573093653777e-05, |
| "loss": 0.315, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2857256233692169, |
| "step": 1510, |
| "valid_targets_mean": 3230.6, |
| "valid_targets_min": 1570 |
| }, |
| { |
| "epoch": 1.5913865546218489, |
| "grad_norm": 0.6246265430681128, |
| "learning_rate": 3.806330394377556e-05, |
| "loss": 0.3086, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.30203184485435486, |
| "step": 1515, |
| "valid_targets_mean": 3023.7, |
| "valid_targets_min": 997 |
| }, |
| { |
| "epoch": 1.596638655462185, |
| "grad_norm": 0.658813587454356, |
| "learning_rate": 3.8040753023253956e-05, |
| "loss": 0.3007, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.33436664938926697, |
| "step": 1520, |
| "valid_targets_mean": 3056.6, |
| "valid_targets_min": 1293 |
| }, |
| { |
| "epoch": 1.601890756302521, |
| "grad_norm": 0.6211106779673433, |
| "learning_rate": 3.801807832968912e-05, |
| "loss": 0.3093, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.29863476753234863, |
| "step": 1525, |
| "valid_targets_mean": 2915.6, |
| "valid_targets_min": 1687 |
| }, |
| { |
| "epoch": 1.6071428571428572, |
| "grad_norm": 0.6368491555844873, |
| "learning_rate": 3.799528001864637e-05, |
| "loss": 0.3068, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.33547699451446533, |
| "step": 1530, |
| "valid_targets_mean": 2985.1, |
| "valid_targets_min": 1108 |
| }, |
| { |
| "epoch": 1.6123949579831933, |
| "grad_norm": 0.5840908746370534, |
| "learning_rate": 3.797235824653918e-05, |
| "loss": 0.3048, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3032509684562683, |
| "step": 1535, |
| "valid_targets_mean": 3195.0, |
| "valid_targets_min": 571 |
| }, |
| { |
| "epoch": 1.6176470588235294, |
| "grad_norm": 0.6352859314737174, |
| "learning_rate": 3.7949313170628006e-05, |
| "loss": 0.3143, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3243550956249237, |
| "step": 1540, |
| "valid_targets_mean": 3106.2, |
| "valid_targets_min": 738 |
| }, |
| { |
| "epoch": 1.6228991596638656, |
| "grad_norm": 0.6224156356901303, |
| "learning_rate": 3.79261449490193e-05, |
| "loss": 0.2955, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.30039089918136597, |
| "step": 1545, |
| "valid_targets_mean": 3189.5, |
| "valid_targets_min": 1896 |
| }, |
| { |
| "epoch": 1.6281512605042017, |
| "grad_norm": 0.6278005675540494, |
| "learning_rate": 3.7902853740664356e-05, |
| "loss": 0.3128, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3083696663379669, |
| "step": 1550, |
| "valid_targets_mean": 3278.9, |
| "valid_targets_min": 1177 |
| }, |
| { |
| "epoch": 1.6334033613445378, |
| "grad_norm": 0.5850412843704133, |
| "learning_rate": 3.7879439705358286e-05, |
| "loss": 0.3043, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3127497732639313, |
| "step": 1555, |
| "valid_targets_mean": 3398.8, |
| "valid_targets_min": 1270 |
| }, |
| { |
| "epoch": 1.638655462184874, |
| "grad_norm": 0.5805366053879955, |
| "learning_rate": 3.785590300373884e-05, |
| "loss": 0.3063, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.29494237899780273, |
| "step": 1560, |
| "valid_targets_mean": 3829.2, |
| "valid_targets_min": 1668 |
| }, |
| { |
| "epoch": 1.64390756302521, |
| "grad_norm": 0.569934576020579, |
| "learning_rate": 3.7832243797285385e-05, |
| "loss": 0.3052, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3094933032989502, |
| "step": 1565, |
| "valid_targets_mean": 3426.9, |
| "valid_targets_min": 1184 |
| }, |
| { |
| "epoch": 1.6491596638655461, |
| "grad_norm": 0.6159772681925453, |
| "learning_rate": 3.780846224831775e-05, |
| "loss": 0.3049, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3124518394470215, |
| "step": 1570, |
| "valid_targets_mean": 3523.6, |
| "valid_targets_min": 1858 |
| }, |
| { |
| "epoch": 1.6544117647058822, |
| "grad_norm": 0.5971056987489094, |
| "learning_rate": 3.7784558519995135e-05, |
| "loss": 0.3075, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.28216129541397095, |
| "step": 1575, |
| "valid_targets_mean": 3161.2, |
| "valid_targets_min": 922 |
| }, |
| { |
| "epoch": 1.6596638655462184, |
| "grad_norm": 0.699651916524887, |
| "learning_rate": 3.776053277631496e-05, |
| "loss": 0.3079, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.34362688660621643, |
| "step": 1580, |
| "valid_targets_mean": 2948.9, |
| "valid_targets_min": 1812 |
| }, |
| { |
| "epoch": 1.6649159663865545, |
| "grad_norm": 0.7182980448996313, |
| "learning_rate": 3.7736385182111785e-05, |
| "loss": 0.2979, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2877700626850128, |
| "step": 1585, |
| "valid_targets_mean": 3107.7, |
| "valid_targets_min": 977 |
| }, |
| { |
| "epoch": 1.6701680672268906, |
| "grad_norm": 0.5675825049010571, |
| "learning_rate": 3.771211590305614e-05, |
| "loss": 0.2923, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2754617929458618, |
| "step": 1590, |
| "valid_targets_mean": 3372.6, |
| "valid_targets_min": 810 |
| }, |
| { |
| "epoch": 1.675420168067227, |
| "grad_norm": 0.5802055167295502, |
| "learning_rate": 3.768772510565342e-05, |
| "loss": 0.2973, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.29426002502441406, |
| "step": 1595, |
| "valid_targets_mean": 3305.2, |
| "valid_targets_min": 1673 |
| }, |
| { |
| "epoch": 1.680672268907563, |
| "grad_norm": 0.5249464047322138, |
| "learning_rate": 3.76632129572427e-05, |
| "loss": 0.2977, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2580610513687134, |
| "step": 1600, |
| "valid_targets_mean": 3933.0, |
| "valid_targets_min": 1869 |
| }, |
| { |
| "epoch": 1.6859243697478992, |
| "grad_norm": 1.426921636472864, |
| "learning_rate": 3.763857962599565e-05, |
| "loss": 0.3098, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3049716353416443, |
| "step": 1605, |
| "valid_targets_mean": 3010.2, |
| "valid_targets_min": 1377 |
| }, |
| { |
| "epoch": 1.6911764705882353, |
| "grad_norm": 0.6454799620397031, |
| "learning_rate": 3.761382528091531e-05, |
| "loss": 0.3122, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.30134791135787964, |
| "step": 1610, |
| "valid_targets_mean": 3055.6, |
| "valid_targets_min": 1219 |
| }, |
| { |
| "epoch": 1.6964285714285714, |
| "grad_norm": 0.5717900298014066, |
| "learning_rate": 3.7588950091834986e-05, |
| "loss": 0.3049, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2911268174648285, |
| "step": 1615, |
| "valid_targets_mean": 3442.4, |
| "valid_targets_min": 1168 |
| }, |
| { |
| "epoch": 1.7016806722689075, |
| "grad_norm": 0.645609709718482, |
| "learning_rate": 3.756395422941706e-05, |
| "loss": 0.2833, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.30699074268341064, |
| "step": 1620, |
| "valid_targets_mean": 3041.9, |
| "valid_targets_min": 1955 |
| }, |
| { |
| "epoch": 1.7069327731092439, |
| "grad_norm": 0.5866883370447175, |
| "learning_rate": 3.753883786515181e-05, |
| "loss": 0.2999, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2968907654285431, |
| "step": 1625, |
| "valid_targets_mean": 3640.2, |
| "valid_targets_min": 1628 |
| }, |
| { |
| "epoch": 1.71218487394958, |
| "grad_norm": 0.5743154885711474, |
| "learning_rate": 3.751360117135628e-05, |
| "loss": 0.2881, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2586438059806824, |
| "step": 1630, |
| "valid_targets_mean": 3358.4, |
| "valid_targets_min": 1482 |
| }, |
| { |
| "epoch": 1.717436974789916, |
| "grad_norm": 0.5881142433423517, |
| "learning_rate": 3.7488244321173025e-05, |
| "loss": 0.2883, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.26784512400627136, |
| "step": 1635, |
| "valid_targets_mean": 3460.4, |
| "valid_targets_min": 904 |
| }, |
| { |
| "epoch": 1.7226890756302522, |
| "grad_norm": 0.6168171706911441, |
| "learning_rate": 3.746276748856898e-05, |
| "loss": 0.2982, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3478624224662781, |
| "step": 1640, |
| "valid_targets_mean": 3728.4, |
| "valid_targets_min": 1194 |
| }, |
| { |
| "epoch": 1.7279411764705883, |
| "grad_norm": 0.5755170388250846, |
| "learning_rate": 3.743717084833425e-05, |
| "loss": 0.3, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.30867037177085876, |
| "step": 1645, |
| "valid_targets_mean": 3940.4, |
| "valid_targets_min": 1658 |
| }, |
| { |
| "epoch": 1.7331932773109244, |
| "grad_norm": 0.6224361276979423, |
| "learning_rate": 3.741145457608093e-05, |
| "loss": 0.2957, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.31917211413383484, |
| "step": 1650, |
| "valid_targets_mean": 3536.9, |
| "valid_targets_min": 1423 |
| }, |
| { |
| "epoch": 1.7384453781512605, |
| "grad_norm": 0.6144445149004428, |
| "learning_rate": 3.738561884824183e-05, |
| "loss": 0.2996, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3049688935279846, |
| "step": 1655, |
| "valid_targets_mean": 3351.2, |
| "valid_targets_min": 2010 |
| }, |
| { |
| "epoch": 1.7436974789915967, |
| "grad_norm": 0.5954264479652966, |
| "learning_rate": 3.735966384206936e-05, |
| "loss": 0.3155, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.30082428455352783, |
| "step": 1660, |
| "valid_targets_mean": 3498.6, |
| "valid_targets_min": 1172 |
| }, |
| { |
| "epoch": 1.7489495798319328, |
| "grad_norm": 0.5715440496549611, |
| "learning_rate": 3.733358973563425e-05, |
| "loss": 0.2958, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2998632788658142, |
| "step": 1665, |
| "valid_targets_mean": 3863.8, |
| "valid_targets_min": 1229 |
| }, |
| { |
| "epoch": 1.754201680672269, |
| "grad_norm": 0.6026903585406433, |
| "learning_rate": 3.730739670782435e-05, |
| "loss": 0.2896, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2936575412750244, |
| "step": 1670, |
| "valid_targets_mean": 3600.5, |
| "valid_targets_min": 1523 |
| }, |
| { |
| "epoch": 1.759453781512605, |
| "grad_norm": 0.5960750461839239, |
| "learning_rate": 3.72810849383434e-05, |
| "loss": 0.2869, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.286255419254303, |
| "step": 1675, |
| "valid_targets_mean": 3623.9, |
| "valid_targets_min": 997 |
| }, |
| { |
| "epoch": 1.7647058823529411, |
| "grad_norm": 0.5856872929601087, |
| "learning_rate": 3.725465460770978e-05, |
| "loss": 0.2922, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.29570281505584717, |
| "step": 1680, |
| "valid_targets_mean": 3535.2, |
| "valid_targets_min": 621 |
| }, |
| { |
| "epoch": 1.7699579831932772, |
| "grad_norm": 0.6652466131769478, |
| "learning_rate": 3.7228105897255324e-05, |
| "loss": 0.293, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.29390841722488403, |
| "step": 1685, |
| "valid_targets_mean": 3071.5, |
| "valid_targets_min": 1282 |
| }, |
| { |
| "epoch": 1.7752100840336134, |
| "grad_norm": 0.5607387594187455, |
| "learning_rate": 3.7201438989124e-05, |
| "loss": 0.2794, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.25984397530555725, |
| "step": 1690, |
| "valid_targets_mean": 3779.1, |
| "valid_targets_min": 1421 |
| }, |
| { |
| "epoch": 1.7804621848739495, |
| "grad_norm": 0.5923487985204593, |
| "learning_rate": 3.717465406627074e-05, |
| "loss": 0.288, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.27242133021354675, |
| "step": 1695, |
| "valid_targets_mean": 3330.2, |
| "valid_targets_min": 1853 |
| }, |
| { |
| "epoch": 1.7857142857142856, |
| "grad_norm": 0.5899947816496157, |
| "learning_rate": 3.714775131246011e-05, |
| "loss": 0.314, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2966066002845764, |
| "step": 1700, |
| "valid_targets_mean": 3327.8, |
| "valid_targets_min": 1410 |
| }, |
| { |
| "epoch": 1.7909663865546217, |
| "grad_norm": 0.66060731387224, |
| "learning_rate": 3.71207309122651e-05, |
| "loss": 0.289, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2911011576652527, |
| "step": 1705, |
| "valid_targets_mean": 2920.6, |
| "valid_targets_min": 1305 |
| }, |
| { |
| "epoch": 1.7962184873949578, |
| "grad_norm": 0.5843889526857856, |
| "learning_rate": 3.709359305106585e-05, |
| "loss": 0.2926, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2868155837059021, |
| "step": 1710, |
| "valid_targets_mean": 3539.7, |
| "valid_targets_min": 996 |
| }, |
| { |
| "epoch": 1.8014705882352942, |
| "grad_norm": 0.586228171865445, |
| "learning_rate": 3.7066337915048354e-05, |
| "loss": 0.2895, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.27134719491004944, |
| "step": 1715, |
| "valid_targets_mean": 3357.1, |
| "valid_targets_min": 1349 |
| }, |
| { |
| "epoch": 1.8067226890756303, |
| "grad_norm": 0.606158452920606, |
| "learning_rate": 3.7038965691203205e-05, |
| "loss": 0.3019, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.31426700949668884, |
| "step": 1720, |
| "valid_targets_mean": 3613.5, |
| "valid_targets_min": 1248 |
| }, |
| { |
| "epoch": 1.8119747899159664, |
| "grad_norm": 0.5526990318942386, |
| "learning_rate": 3.701147656732431e-05, |
| "loss": 0.2812, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.24181315302848816, |
| "step": 1725, |
| "valid_targets_mean": 3327.4, |
| "valid_targets_min": 1109 |
| }, |
| { |
| "epoch": 1.8172268907563025, |
| "grad_norm": 0.6528173405719958, |
| "learning_rate": 3.6983870732007596e-05, |
| "loss": 0.2979, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2989552617073059, |
| "step": 1730, |
| "valid_targets_mean": 2790.8, |
| "valid_targets_min": 1649 |
| }, |
| { |
| "epoch": 1.8224789915966386, |
| "grad_norm": 0.6835745034650174, |
| "learning_rate": 3.695614837464972e-05, |
| "loss": 0.2895, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3165176808834076, |
| "step": 1735, |
| "valid_targets_mean": 2811.8, |
| "valid_targets_min": 1197 |
| }, |
| { |
| "epoch": 1.8277310924369747, |
| "grad_norm": 0.6755172073863958, |
| "learning_rate": 3.692830968544675e-05, |
| "loss": 0.306, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3160332441329956, |
| "step": 1740, |
| "valid_targets_mean": 3420.2, |
| "valid_targets_min": 1720 |
| }, |
| { |
| "epoch": 1.832983193277311, |
| "grad_norm": 0.6087751854436854, |
| "learning_rate": 3.690035485539291e-05, |
| "loss": 0.2993, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.29514777660369873, |
| "step": 1745, |
| "valid_targets_mean": 3542.7, |
| "valid_targets_min": 1054 |
| }, |
| { |
| "epoch": 1.8382352941176472, |
| "grad_norm": 0.6241785789650026, |
| "learning_rate": 3.6872284076279205e-05, |
| "loss": 0.2966, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2934738099575043, |
| "step": 1750, |
| "valid_targets_mean": 3049.7, |
| "valid_targets_min": 1643 |
| }, |
| { |
| "epoch": 1.8434873949579833, |
| "grad_norm": 0.5825825660256299, |
| "learning_rate": 3.684409754069215e-05, |
| "loss": 0.3039, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.30002132058143616, |
| "step": 1755, |
| "valid_targets_mean": 3757.8, |
| "valid_targets_min": 1135 |
| }, |
| { |
| "epoch": 1.8487394957983194, |
| "grad_norm": 0.6258913745185652, |
| "learning_rate": 3.681579544201244e-05, |
| "loss": 0.2952, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.290172278881073, |
| "step": 1760, |
| "valid_targets_mean": 3715.1, |
| "valid_targets_min": 1174 |
| }, |
| { |
| "epoch": 1.8539915966386555, |
| "grad_norm": 0.6554971879023268, |
| "learning_rate": 3.6787377974413614e-05, |
| "loss": 0.3127, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.32472649216651917, |
| "step": 1765, |
| "valid_targets_mean": 3321.9, |
| "valid_targets_min": 992 |
| }, |
| { |
| "epoch": 1.8592436974789917, |
| "grad_norm": 0.6104106962565312, |
| "learning_rate": 3.6758845332860734e-05, |
| "loss": 0.3036, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.320326030254364, |
| "step": 1770, |
| "valid_targets_mean": 3713.2, |
| "valid_targets_min": 1133 |
| }, |
| { |
| "epoch": 1.8644957983193278, |
| "grad_norm": 0.6602404199908332, |
| "learning_rate": 3.673019771310903e-05, |
| "loss": 0.3009, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3192262649536133, |
| "step": 1775, |
| "valid_targets_mean": 2961.8, |
| "valid_targets_min": 1195 |
| }, |
| { |
| "epoch": 1.8697478991596639, |
| "grad_norm": 0.9226641425449463, |
| "learning_rate": 3.670143531170258e-05, |
| "loss": 0.3044, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.30954253673553467, |
| "step": 1780, |
| "valid_targets_mean": 3012.6, |
| "valid_targets_min": 484 |
| }, |
| { |
| "epoch": 1.875, |
| "grad_norm": 0.5947567961611435, |
| "learning_rate": 3.667255832597294e-05, |
| "loss": 0.2982, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3080810010433197, |
| "step": 1785, |
| "valid_targets_mean": 3639.9, |
| "valid_targets_min": 1434 |
| }, |
| { |
| "epoch": 1.8802521008403361, |
| "grad_norm": 0.5635109826748741, |
| "learning_rate": 3.664356695403781e-05, |
| "loss": 0.2972, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2792786955833435, |
| "step": 1790, |
| "valid_targets_mean": 4017.4, |
| "valid_targets_min": 1349 |
| }, |
| { |
| "epoch": 1.8855042016806722, |
| "grad_norm": 0.7060376087001079, |
| "learning_rate": 3.661446139479965e-05, |
| "loss": 0.2965, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.31975793838500977, |
| "step": 1795, |
| "valid_targets_mean": 3178.8, |
| "valid_targets_min": 1434 |
| }, |
| { |
| "epoch": 1.8907563025210083, |
| "grad_norm": 0.5936744481364934, |
| "learning_rate": 3.658524184794436e-05, |
| "loss": 0.2927, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2860378324985504, |
| "step": 1800, |
| "valid_targets_mean": 3633.9, |
| "valid_targets_min": 521 |
| }, |
| { |
| "epoch": 1.8960084033613445, |
| "grad_norm": 0.5822754669183862, |
| "learning_rate": 3.655590851393984e-05, |
| "loss": 0.3049, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3000732660293579, |
| "step": 1805, |
| "valid_targets_mean": 3981.0, |
| "valid_targets_min": 1464 |
| }, |
| { |
| "epoch": 1.9012605042016806, |
| "grad_norm": 0.6913451388646343, |
| "learning_rate": 3.652646159403468e-05, |
| "loss": 0.3136, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3260645866394043, |
| "step": 1810, |
| "valid_targets_mean": 2612.0, |
| "valid_targets_min": 1239 |
| }, |
| { |
| "epoch": 1.9065126050420167, |
| "grad_norm": 0.6287538437173945, |
| "learning_rate": 3.649690129025675e-05, |
| "loss": 0.2841, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.29579633474349976, |
| "step": 1815, |
| "valid_targets_mean": 3489.8, |
| "valid_targets_min": 1457 |
| }, |
| { |
| "epoch": 1.9117647058823528, |
| "grad_norm": 0.6767664513173561, |
| "learning_rate": 3.6467227805411824e-05, |
| "loss": 0.2916, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.29462265968322754, |
| "step": 1820, |
| "valid_targets_mean": 3059.1, |
| "valid_targets_min": 1460 |
| }, |
| { |
| "epoch": 1.917016806722689, |
| "grad_norm": 0.6395995499615521, |
| "learning_rate": 3.6437441343082174e-05, |
| "loss": 0.2944, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3023369312286377, |
| "step": 1825, |
| "valid_targets_mean": 3259.2, |
| "valid_targets_min": 1084 |
| }, |
| { |
| "epoch": 1.9222689075630253, |
| "grad_norm": 0.5856128524517397, |
| "learning_rate": 3.6407542107625167e-05, |
| "loss": 0.2836, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.27946245670318604, |
| "step": 1830, |
| "valid_targets_mean": 3337.9, |
| "valid_targets_min": 1035 |
| }, |
| { |
| "epoch": 1.9275210084033614, |
| "grad_norm": 0.5516337340536542, |
| "learning_rate": 3.637753030417192e-05, |
| "loss": 0.282, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2830444574356079, |
| "step": 1835, |
| "valid_targets_mean": 4091.9, |
| "valid_targets_min": 1876 |
| }, |
| { |
| "epoch": 1.9327731092436975, |
| "grad_norm": 0.6188213113954284, |
| "learning_rate": 3.6347406138625805e-05, |
| "loss": 0.2869, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3005865812301636, |
| "step": 1840, |
| "valid_targets_mean": 3705.8, |
| "valid_targets_min": 1062 |
| }, |
| { |
| "epoch": 1.9380252100840336, |
| "grad_norm": 0.6342838492371049, |
| "learning_rate": 3.631716981766111e-05, |
| "loss": 0.2778, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2753984034061432, |
| "step": 1845, |
| "valid_targets_mean": 3030.8, |
| "valid_targets_min": 993 |
| }, |
| { |
| "epoch": 1.9432773109243697, |
| "grad_norm": 0.5880238709579537, |
| "learning_rate": 3.6286821548721594e-05, |
| "loss": 0.2822, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.28602135181427, |
| "step": 1850, |
| "valid_targets_mean": 3366.9, |
| "valid_targets_min": 873 |
| }, |
| { |
| "epoch": 1.9485294117647058, |
| "grad_norm": 0.5720082036013604, |
| "learning_rate": 3.625636154001904e-05, |
| "loss": 0.2821, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2676365375518799, |
| "step": 1855, |
| "valid_targets_mean": 3651.0, |
| "valid_targets_min": 1295 |
| }, |
| { |
| "epoch": 1.9537815126050422, |
| "grad_norm": 0.585699773613234, |
| "learning_rate": 3.622579000053186e-05, |
| "loss": 0.2902, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.29407864809036255, |
| "step": 1860, |
| "valid_targets_mean": 3583.6, |
| "valid_targets_min": 1598 |
| }, |
| { |
| "epoch": 1.9590336134453783, |
| "grad_norm": 0.6205691001395918, |
| "learning_rate": 3.619510714000368e-05, |
| "loss": 0.3088, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.27674800157546997, |
| "step": 1865, |
| "valid_targets_mean": 2903.2, |
| "valid_targets_min": 1123 |
| }, |
| { |
| "epoch": 1.9642857142857144, |
| "grad_norm": 0.7438366690160714, |
| "learning_rate": 3.616431316894181e-05, |
| "loss": 0.2938, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.31191760301589966, |
| "step": 1870, |
| "valid_targets_mean": 3116.1, |
| "valid_targets_min": 1621 |
| }, |
| { |
| "epoch": 1.9695378151260505, |
| "grad_norm": 0.6496526680316776, |
| "learning_rate": 3.613340829861592e-05, |
| "loss": 0.2777, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2977924346923828, |
| "step": 1875, |
| "valid_targets_mean": 3081.4, |
| "valid_targets_min": 1858 |
| }, |
| { |
| "epoch": 1.9747899159663866, |
| "grad_norm": 0.5707764114436218, |
| "learning_rate": 3.61023927410565e-05, |
| "loss": 0.2855, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.25262773036956787, |
| "step": 1880, |
| "valid_targets_mean": 3470.7, |
| "valid_targets_min": 420 |
| }, |
| { |
| "epoch": 1.9800420168067228, |
| "grad_norm": 0.601493220440057, |
| "learning_rate": 3.607126670905346e-05, |
| "loss": 0.2966, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2920111417770386, |
| "step": 1885, |
| "valid_targets_mean": 3584.2, |
| "valid_targets_min": 757 |
| }, |
| { |
| "epoch": 1.9852941176470589, |
| "grad_norm": 0.6874129379616689, |
| "learning_rate": 3.60400304161546e-05, |
| "loss": 0.3002, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2971467673778534, |
| "step": 1890, |
| "valid_targets_mean": 2940.8, |
| "valid_targets_min": 732 |
| }, |
| { |
| "epoch": 1.990546218487395, |
| "grad_norm": 0.6483438175679863, |
| "learning_rate": 3.600868407666426e-05, |
| "loss": 0.2939, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.29474449157714844, |
| "step": 1895, |
| "valid_targets_mean": 3248.2, |
| "valid_targets_min": 929 |
| }, |
| { |
| "epoch": 1.995798319327731, |
| "grad_norm": 0.5918173246249905, |
| "learning_rate": 3.597722790564172e-05, |
| "loss": 0.2929, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2911064624786377, |
| "step": 1900, |
| "valid_targets_mean": 3728.8, |
| "valid_targets_min": 1217 |
| }, |
| { |
| "epoch": 2.0010504201680672, |
| "grad_norm": 1.269479871339695, |
| "learning_rate": 3.5945662118899824e-05, |
| "loss": 0.2774, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.21561074256896973, |
| "step": 1905, |
| "valid_targets_mean": 1523.7, |
| "valid_targets_min": 544 |
| }, |
| { |
| "epoch": 2.0063025210084033, |
| "grad_norm": 0.834502760942854, |
| "learning_rate": 3.5913986933003455e-05, |
| "loss": 0.2186, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1978900134563446, |
| "step": 1910, |
| "valid_targets_mean": 1311.9, |
| "valid_targets_min": 632 |
| }, |
| { |
| "epoch": 2.0115546218487395, |
| "grad_norm": 0.8472702704612042, |
| "learning_rate": 3.5882202565268046e-05, |
| "loss": 0.2006, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.19883087277412415, |
| "step": 1915, |
| "valid_targets_mean": 1391.8, |
| "valid_targets_min": 514 |
| }, |
| { |
| "epoch": 2.0168067226890756, |
| "grad_norm": 0.8558019853903324, |
| "learning_rate": 3.58503092337581e-05, |
| "loss": 0.2006, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2164035588502884, |
| "step": 1920, |
| "valid_targets_mean": 1409.8, |
| "valid_targets_min": 701 |
| }, |
| { |
| "epoch": 2.0220588235294117, |
| "grad_norm": 0.755196603700863, |
| "learning_rate": 3.5818307157285705e-05, |
| "loss": 0.1905, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.20270323753356934, |
| "step": 1925, |
| "valid_targets_mean": 1448.8, |
| "valid_targets_min": 742 |
| }, |
| { |
| "epoch": 2.027310924369748, |
| "grad_norm": 0.7296703034732365, |
| "learning_rate": 3.5786196555409006e-05, |
| "loss": 0.1986, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18208900094032288, |
| "step": 1930, |
| "valid_targets_mean": 1219.5, |
| "valid_targets_min": 746 |
| }, |
| { |
| "epoch": 2.032563025210084, |
| "grad_norm": 0.7684329269994562, |
| "learning_rate": 3.575397764843073e-05, |
| "loss": 0.2071, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.19005586206912994, |
| "step": 1935, |
| "valid_targets_mean": 1416.7, |
| "valid_targets_min": 774 |
| }, |
| { |
| "epoch": 2.03781512605042, |
| "grad_norm": 0.7346120823737189, |
| "learning_rate": 3.572165065739664e-05, |
| "loss": 0.1847, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.173833429813385, |
| "step": 1940, |
| "valid_targets_mean": 1294.7, |
| "valid_targets_min": 648 |
| }, |
| { |
| "epoch": 2.043067226890756, |
| "grad_norm": 0.7872472114882302, |
| "learning_rate": 3.5689215804094053e-05, |
| "loss": 0.2128, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.19836294651031494, |
| "step": 1945, |
| "valid_targets_mean": 1322.9, |
| "valid_targets_min": 708 |
| }, |
| { |
| "epoch": 2.0483193277310923, |
| "grad_norm": 0.7139156271445127, |
| "learning_rate": 3.5656673311050285e-05, |
| "loss": 0.1869, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.166924387216568, |
| "step": 1950, |
| "valid_targets_mean": 1500.9, |
| "valid_targets_min": 788 |
| }, |
| { |
| "epoch": 2.0535714285714284, |
| "grad_norm": 0.7546720109875962, |
| "learning_rate": 3.562402340153115e-05, |
| "loss": 0.1969, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1813475340604782, |
| "step": 1955, |
| "valid_targets_mean": 1277.2, |
| "valid_targets_min": 615 |
| }, |
| { |
| "epoch": 2.0588235294117645, |
| "grad_norm": 0.8007930214332662, |
| "learning_rate": 3.559126629953942e-05, |
| "loss": 0.1966, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.19298464059829712, |
| "step": 1960, |
| "valid_targets_mean": 1355.1, |
| "valid_targets_min": 627 |
| }, |
| { |
| "epoch": 2.064075630252101, |
| "grad_norm": 1.0715850452767404, |
| "learning_rate": 3.5558402229813287e-05, |
| "loss": 0.197, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.19311118125915527, |
| "step": 1965, |
| "valid_targets_mean": 1323.2, |
| "valid_targets_min": 753 |
| }, |
| { |
| "epoch": 2.069327731092437, |
| "grad_norm": 0.7534257104768941, |
| "learning_rate": 3.552543141782483e-05, |
| "loss": 0.1896, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.19203367829322815, |
| "step": 1970, |
| "valid_targets_mean": 1427.2, |
| "valid_targets_min": 740 |
| }, |
| { |
| "epoch": 2.0745798319327733, |
| "grad_norm": 0.7434395907521474, |
| "learning_rate": 3.549235408977843e-05, |
| "loss": 0.1872, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.19772931933403015, |
| "step": 1975, |
| "valid_targets_mean": 1519.6, |
| "valid_targets_min": 642 |
| }, |
| { |
| "epoch": 2.0798319327731094, |
| "grad_norm": 0.7265121475274179, |
| "learning_rate": 3.545917047260928e-05, |
| "loss": 0.1787, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16659091413021088, |
| "step": 1980, |
| "valid_targets_mean": 1209.2, |
| "valid_targets_min": 518 |
| }, |
| { |
| "epoch": 2.0850840336134455, |
| "grad_norm": 0.7590657870156368, |
| "learning_rate": 3.542588079398179e-05, |
| "loss": 0.1988, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.20139284431934357, |
| "step": 1985, |
| "valid_targets_mean": 1439.6, |
| "valid_targets_min": 721 |
| }, |
| { |
| "epoch": 2.0903361344537816, |
| "grad_norm": 0.7606478486879998, |
| "learning_rate": 3.539248528228801e-05, |
| "loss": 0.1994, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1940763294696808, |
| "step": 1990, |
| "valid_targets_mean": 1469.9, |
| "valid_targets_min": 727 |
| }, |
| { |
| "epoch": 2.0955882352941178, |
| "grad_norm": 0.7061929545295577, |
| "learning_rate": 3.535898416664611e-05, |
| "loss": 0.2012, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.19255903363227844, |
| "step": 1995, |
| "valid_targets_mean": 1412.1, |
| "valid_targets_min": 803 |
| }, |
| { |
| "epoch": 2.100840336134454, |
| "grad_norm": 0.7887719103581653, |
| "learning_rate": 3.5325377676898766e-05, |
| "loss": 0.1958, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2186465561389923, |
| "step": 2000, |
| "valid_targets_mean": 1546.6, |
| "valid_targets_min": 698 |
| }, |
| { |
| "epoch": 2.10609243697479, |
| "grad_norm": 0.8070718344561886, |
| "learning_rate": 3.529166604361161e-05, |
| "loss": 0.1912, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2157689332962036, |
| "step": 2005, |
| "valid_targets_mean": 1728.5, |
| "valid_targets_min": 832 |
| }, |
| { |
| "epoch": 2.111344537815126, |
| "grad_norm": 0.6799684604036553, |
| "learning_rate": 3.525784949807162e-05, |
| "loss": 0.1942, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18615804612636566, |
| "step": 2010, |
| "valid_targets_mean": 1575.1, |
| "valid_targets_min": 891 |
| }, |
| { |
| "epoch": 2.116596638655462, |
| "grad_norm": 0.7859292131535734, |
| "learning_rate": 3.522392827228557e-05, |
| "loss": 0.194, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.20224624872207642, |
| "step": 2015, |
| "valid_targets_mean": 1346.5, |
| "valid_targets_min": 621 |
| }, |
| { |
| "epoch": 2.1218487394957983, |
| "grad_norm": 0.7769917237320048, |
| "learning_rate": 3.518990259897841e-05, |
| "loss": 0.1825, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16991014778614044, |
| "step": 2020, |
| "valid_targets_mean": 1285.5, |
| "valid_targets_min": 697 |
| }, |
| { |
| "epoch": 2.1271008403361344, |
| "grad_norm": 0.7202399948858199, |
| "learning_rate": 3.515577271159167e-05, |
| "loss": 0.1933, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1941305696964264, |
| "step": 2025, |
| "valid_targets_mean": 1565.5, |
| "valid_targets_min": 824 |
| }, |
| { |
| "epoch": 2.1323529411764706, |
| "grad_norm": 0.7845226485201681, |
| "learning_rate": 3.512153884428188e-05, |
| "loss": 0.1825, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17622260749340057, |
| "step": 2030, |
| "valid_targets_mean": 1331.2, |
| "valid_targets_min": 584 |
| }, |
| { |
| "epoch": 2.1376050420168067, |
| "grad_norm": 0.7398989600657419, |
| "learning_rate": 3.5087201231918944e-05, |
| "loss": 0.1922, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1894277185201645, |
| "step": 2035, |
| "valid_targets_mean": 1568.8, |
| "valid_targets_min": 1033 |
| }, |
| { |
| "epoch": 2.142857142857143, |
| "grad_norm": 0.7770180042406308, |
| "learning_rate": 3.505276011008454e-05, |
| "loss": 0.1929, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2185641974210739, |
| "step": 2040, |
| "valid_targets_mean": 1584.9, |
| "valid_targets_min": 1007 |
| }, |
| { |
| "epoch": 2.148109243697479, |
| "grad_norm": 0.78686344769378, |
| "learning_rate": 3.501821571507048e-05, |
| "loss": 0.1869, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1753498911857605, |
| "step": 2045, |
| "valid_targets_mean": 1267.1, |
| "valid_targets_min": 613 |
| }, |
| { |
| "epoch": 2.153361344537815, |
| "grad_norm": 1.063699580344548, |
| "learning_rate": 3.498356828387714e-05, |
| "loss": 0.189, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1909262090921402, |
| "step": 2050, |
| "valid_targets_mean": 1532.2, |
| "valid_targets_min": 768 |
| }, |
| { |
| "epoch": 2.158613445378151, |
| "grad_norm": 0.7643365744929539, |
| "learning_rate": 3.494881805421176e-05, |
| "loss": 0.1872, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16610810160636902, |
| "step": 2055, |
| "valid_targets_mean": 1112.7, |
| "valid_targets_min": 643 |
| }, |
| { |
| "epoch": 2.1638655462184873, |
| "grad_norm": 0.7926765771940254, |
| "learning_rate": 3.4913965264486894e-05, |
| "loss": 0.1948, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18852682411670685, |
| "step": 2060, |
| "valid_targets_mean": 1402.3, |
| "valid_targets_min": 841 |
| }, |
| { |
| "epoch": 2.1691176470588234, |
| "grad_norm": 0.729414923035659, |
| "learning_rate": 3.48790101538187e-05, |
| "loss": 0.1825, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18665212392807007, |
| "step": 2065, |
| "valid_targets_mean": 1577.6, |
| "valid_targets_min": 705 |
| }, |
| { |
| "epoch": 2.1743697478991595, |
| "grad_norm": 0.8405323016094074, |
| "learning_rate": 3.484395296202537e-05, |
| "loss": 0.185, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1933499127626419, |
| "step": 2070, |
| "valid_targets_mean": 1190.7, |
| "valid_targets_min": 716 |
| }, |
| { |
| "epoch": 2.1796218487394956, |
| "grad_norm": 0.7875851862101669, |
| "learning_rate": 3.480879392962541e-05, |
| "loss": 0.1741, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17440925538539886, |
| "step": 2075, |
| "valid_targets_mean": 1209.2, |
| "valid_targets_min": 627 |
| }, |
| { |
| "epoch": 2.184873949579832, |
| "grad_norm": 0.7185518361219825, |
| "learning_rate": 3.477353329783606e-05, |
| "loss": 0.184, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16545218229293823, |
| "step": 2080, |
| "valid_targets_mean": 1253.7, |
| "valid_targets_min": 619 |
| }, |
| { |
| "epoch": 2.190126050420168, |
| "grad_norm": 0.7600617986037965, |
| "learning_rate": 3.4738171308571595e-05, |
| "loss": 0.1863, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.19123047590255737, |
| "step": 2085, |
| "valid_targets_mean": 1403.3, |
| "valid_targets_min": 734 |
| }, |
| { |
| "epoch": 2.1953781512605044, |
| "grad_norm": 0.7730815354374817, |
| "learning_rate": 3.470270820444168e-05, |
| "loss": 0.1859, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18116678297519684, |
| "step": 2090, |
| "valid_targets_mean": 1356.3, |
| "valid_targets_min": 700 |
| }, |
| { |
| "epoch": 2.2006302521008405, |
| "grad_norm": 0.7542365322548513, |
| "learning_rate": 3.4667144228749697e-05, |
| "loss": 0.1893, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18537303805351257, |
| "step": 2095, |
| "valid_targets_mean": 1550.9, |
| "valid_targets_min": 892 |
| }, |
| { |
| "epoch": 2.2058823529411766, |
| "grad_norm": 0.7438888508924026, |
| "learning_rate": 3.463147962549109e-05, |
| "loss": 0.1864, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16940736770629883, |
| "step": 2100, |
| "valid_targets_mean": 1295.9, |
| "valid_targets_min": 711 |
| }, |
| { |
| "epoch": 2.2111344537815127, |
| "grad_norm": 0.7547714805297574, |
| "learning_rate": 3.459571463935168e-05, |
| "loss": 0.1818, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16632413864135742, |
| "step": 2105, |
| "valid_targets_mean": 1380.6, |
| "valid_targets_min": 694 |
| }, |
| { |
| "epoch": 2.216386554621849, |
| "grad_norm": 0.7974469156906152, |
| "learning_rate": 3.455984951570598e-05, |
| "loss": 0.1867, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.20498281717300415, |
| "step": 2110, |
| "valid_targets_mean": 1487.6, |
| "valid_targets_min": 818 |
| }, |
| { |
| "epoch": 2.221638655462185, |
| "grad_norm": 0.7460498917875708, |
| "learning_rate": 3.452388450061556e-05, |
| "loss": 0.1925, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1839742511510849, |
| "step": 2115, |
| "valid_targets_mean": 1640.1, |
| "valid_targets_min": 1011 |
| }, |
| { |
| "epoch": 2.226890756302521, |
| "grad_norm": 0.7976082882204165, |
| "learning_rate": 3.448781984082727e-05, |
| "loss": 0.1967, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1880989819765091, |
| "step": 2120, |
| "valid_targets_mean": 1356.1, |
| "valid_targets_min": 748 |
| }, |
| { |
| "epoch": 2.232142857142857, |
| "grad_norm": 0.8198726303330894, |
| "learning_rate": 3.4451655783771625e-05, |
| "loss": 0.1822, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.19785097241401672, |
| "step": 2125, |
| "valid_targets_mean": 1494.3, |
| "valid_targets_min": 699 |
| }, |
| { |
| "epoch": 2.2373949579831933, |
| "grad_norm": 0.7959727926112404, |
| "learning_rate": 3.4415392577561064e-05, |
| "loss": 0.1797, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17913001775741577, |
| "step": 2130, |
| "valid_targets_mean": 1201.1, |
| "valid_targets_min": 534 |
| }, |
| { |
| "epoch": 2.2426470588235294, |
| "grad_norm": 0.7163813248237905, |
| "learning_rate": 3.4379030470988285e-05, |
| "loss": 0.1909, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1842835247516632, |
| "step": 2135, |
| "valid_targets_mean": 1393.6, |
| "valid_targets_min": 687 |
| }, |
| { |
| "epoch": 2.2478991596638656, |
| "grad_norm": 0.7075959634728527, |
| "learning_rate": 3.4342569713524496e-05, |
| "loss": 0.1869, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18208453059196472, |
| "step": 2140, |
| "valid_targets_mean": 1363.2, |
| "valid_targets_min": 549 |
| }, |
| { |
| "epoch": 2.2531512605042017, |
| "grad_norm": 0.7211274630211372, |
| "learning_rate": 3.4306010555317735e-05, |
| "loss": 0.1797, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18160000443458557, |
| "step": 2145, |
| "valid_targets_mean": 1349.1, |
| "valid_targets_min": 725 |
| }, |
| { |
| "epoch": 2.258403361344538, |
| "grad_norm": 0.7402311941740003, |
| "learning_rate": 3.4269353247191135e-05, |
| "loss": 0.1802, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1999184489250183, |
| "step": 2150, |
| "valid_targets_mean": 1651.7, |
| "valid_targets_min": 852 |
| }, |
| { |
| "epoch": 2.263655462184874, |
| "grad_norm": 0.6795776738854672, |
| "learning_rate": 3.423259804064122e-05, |
| "loss": 0.1914, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18849042057991028, |
| "step": 2155, |
| "valid_targets_mean": 1559.5, |
| "valid_targets_min": 1010 |
| }, |
| { |
| "epoch": 2.26890756302521, |
| "grad_norm": 0.7308651601236005, |
| "learning_rate": 3.419574518783616e-05, |
| "loss": 0.1861, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17530426383018494, |
| "step": 2160, |
| "valid_targets_mean": 1387.0, |
| "valid_targets_min": 545 |
| }, |
| { |
| "epoch": 2.274159663865546, |
| "grad_norm": 0.8144354216387479, |
| "learning_rate": 3.4158794941614055e-05, |
| "loss": 0.1831, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.19270774722099304, |
| "step": 2165, |
| "valid_targets_mean": 1385.4, |
| "valid_targets_min": 843 |
| }, |
| { |
| "epoch": 2.2794117647058822, |
| "grad_norm": 0.631924641323973, |
| "learning_rate": 3.4121747555481216e-05, |
| "loss": 0.182, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.19547529518604279, |
| "step": 2170, |
| "valid_targets_mean": 1716.2, |
| "valid_targets_min": 802 |
| }, |
| { |
| "epoch": 2.2846638655462184, |
| "grad_norm": 0.7544602510753329, |
| "learning_rate": 3.4084603283610365e-05, |
| "loss": 0.1845, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18898774683475494, |
| "step": 2175, |
| "valid_targets_mean": 1409.9, |
| "valid_targets_min": 612 |
| }, |
| { |
| "epoch": 2.2899159663865545, |
| "grad_norm": 0.7250456296463277, |
| "learning_rate": 3.404736238083897e-05, |
| "loss": 0.1814, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17501644790172577, |
| "step": 2180, |
| "valid_targets_mean": 1415.8, |
| "valid_targets_min": 673 |
| }, |
| { |
| "epoch": 2.2951680672268906, |
| "grad_norm": 0.8001168867925627, |
| "learning_rate": 3.401002510266744e-05, |
| "loss": 0.1789, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18818825483322144, |
| "step": 2185, |
| "valid_targets_mean": 1332.9, |
| "valid_targets_min": 705 |
| }, |
| { |
| "epoch": 2.3004201680672267, |
| "grad_norm": 0.6987572245775185, |
| "learning_rate": 3.397259170525739e-05, |
| "loss": 0.1747, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16560634970664978, |
| "step": 2190, |
| "valid_targets_mean": 1402.1, |
| "valid_targets_min": 822 |
| }, |
| { |
| "epoch": 2.3056722689075633, |
| "grad_norm": 0.7531921047773884, |
| "learning_rate": 3.393506244542991e-05, |
| "loss": 0.1702, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16486376523971558, |
| "step": 2195, |
| "valid_targets_mean": 1272.8, |
| "valid_targets_min": 604 |
| }, |
| { |
| "epoch": 2.310924369747899, |
| "grad_norm": 0.6999344056695282, |
| "learning_rate": 3.389743758066374e-05, |
| "loss": 0.1866, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17392639815807343, |
| "step": 2200, |
| "valid_targets_mean": 1460.0, |
| "valid_targets_min": 647 |
| }, |
| { |
| "epoch": 2.3161764705882355, |
| "grad_norm": 0.7036250917228805, |
| "learning_rate": 3.385971736909357e-05, |
| "loss": 0.1777, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1617729663848877, |
| "step": 2205, |
| "valid_targets_mean": 1283.6, |
| "valid_targets_min": 613 |
| }, |
| { |
| "epoch": 2.3214285714285716, |
| "grad_norm": 0.7068382427421205, |
| "learning_rate": 3.382190206950822e-05, |
| "loss": 0.1801, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17291636765003204, |
| "step": 2210, |
| "valid_targets_mean": 1288.4, |
| "valid_targets_min": 713 |
| }, |
| { |
| "epoch": 2.3266806722689077, |
| "grad_norm": 0.663523616107997, |
| "learning_rate": 3.3783991941348916e-05, |
| "loss": 0.1823, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16455985605716705, |
| "step": 2215, |
| "valid_targets_mean": 1533.8, |
| "valid_targets_min": 892 |
| }, |
| { |
| "epoch": 2.331932773109244, |
| "grad_norm": 0.7721343986047551, |
| "learning_rate": 3.374598724470745e-05, |
| "loss": 0.1867, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.19193603098392487, |
| "step": 2220, |
| "valid_targets_mean": 1345.8, |
| "valid_targets_min": 772 |
| }, |
| { |
| "epoch": 2.33718487394958, |
| "grad_norm": 0.7240487637559474, |
| "learning_rate": 3.370788824032441e-05, |
| "loss": 0.1777, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1901538372039795, |
| "step": 2225, |
| "valid_targets_mean": 1601.2, |
| "valid_targets_min": 636 |
| }, |
| { |
| "epoch": 2.342436974789916, |
| "grad_norm": 0.7718537058087979, |
| "learning_rate": 3.366969518958746e-05, |
| "loss": 0.1781, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1778993457555771, |
| "step": 2230, |
| "valid_targets_mean": 1366.1, |
| "valid_targets_min": 641 |
| }, |
| { |
| "epoch": 2.347689075630252, |
| "grad_norm": 0.7977490601269798, |
| "learning_rate": 3.363140835452945e-05, |
| "loss": 0.1874, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.20514068007469177, |
| "step": 2235, |
| "valid_targets_mean": 1482.2, |
| "valid_targets_min": 818 |
| }, |
| { |
| "epoch": 2.3529411764705883, |
| "grad_norm": 0.7668591077227411, |
| "learning_rate": 3.3593027997826654e-05, |
| "loss": 0.1832, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1879502534866333, |
| "step": 2240, |
| "valid_targets_mean": 1420.5, |
| "valid_targets_min": 729 |
| }, |
| { |
| "epoch": 2.3581932773109244, |
| "grad_norm": 0.7855984838086749, |
| "learning_rate": 3.355455438279702e-05, |
| "loss": 0.1893, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.21655318140983582, |
| "step": 2245, |
| "valid_targets_mean": 1723.6, |
| "valid_targets_min": 1001 |
| }, |
| { |
| "epoch": 2.3634453781512605, |
| "grad_norm": 0.7364382070700145, |
| "learning_rate": 3.351598777339827e-05, |
| "loss": 0.1837, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1900310218334198, |
| "step": 2250, |
| "valid_targets_mean": 1626.4, |
| "valid_targets_min": 1175 |
| }, |
| { |
| "epoch": 2.3686974789915967, |
| "grad_norm": 0.7437939379036828, |
| "learning_rate": 3.3477328434226164e-05, |
| "loss": 0.1853, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.19543638825416565, |
| "step": 2255, |
| "valid_targets_mean": 1434.9, |
| "valid_targets_min": 779 |
| }, |
| { |
| "epoch": 2.3739495798319328, |
| "grad_norm": 0.7246181422661423, |
| "learning_rate": 3.343857663051264e-05, |
| "loss": 0.1867, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1804441660642624, |
| "step": 2260, |
| "valid_targets_mean": 1413.4, |
| "valid_targets_min": 730 |
| }, |
| { |
| "epoch": 2.379201680672269, |
| "grad_norm": 0.73443894447988, |
| "learning_rate": 3.339973262812403e-05, |
| "loss": 0.1742, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17590978741645813, |
| "step": 2265, |
| "valid_targets_mean": 1360.3, |
| "valid_targets_min": 564 |
| }, |
| { |
| "epoch": 2.384453781512605, |
| "grad_norm": 0.8777730335212939, |
| "learning_rate": 3.336079669355921e-05, |
| "loss": 0.1786, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18321183323860168, |
| "step": 2270, |
| "valid_targets_mean": 1550.0, |
| "valid_targets_min": 651 |
| }, |
| { |
| "epoch": 2.389705882352941, |
| "grad_norm": 0.7244538791290572, |
| "learning_rate": 3.332176909394777e-05, |
| "loss": 0.1838, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1737801432609558, |
| "step": 2275, |
| "valid_targets_mean": 1342.3, |
| "valid_targets_min": 716 |
| }, |
| { |
| "epoch": 2.3949579831932772, |
| "grad_norm": 0.7245107985964735, |
| "learning_rate": 3.3282650097048206e-05, |
| "loss": 0.1791, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1800583004951477, |
| "step": 2280, |
| "valid_targets_mean": 1339.6, |
| "valid_targets_min": 707 |
| }, |
| { |
| "epoch": 2.4002100840336134, |
| "grad_norm": 0.7235945312664076, |
| "learning_rate": 3.324343997124606e-05, |
| "loss": 0.1683, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15614992380142212, |
| "step": 2285, |
| "valid_targets_mean": 1459.4, |
| "valid_targets_min": 964 |
| }, |
| { |
| "epoch": 2.4054621848739495, |
| "grad_norm": 0.7567614980512993, |
| "learning_rate": 3.3204138985552094e-05, |
| "loss": 0.1841, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.20014092326164246, |
| "step": 2290, |
| "valid_targets_mean": 1562.7, |
| "valid_targets_min": 793 |
| }, |
| { |
| "epoch": 2.4107142857142856, |
| "grad_norm": 0.7418561305374557, |
| "learning_rate": 3.316474740960041e-05, |
| "loss": 0.188, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17074398696422577, |
| "step": 2295, |
| "valid_targets_mean": 1367.2, |
| "valid_targets_min": 727 |
| }, |
| { |
| "epoch": 2.4159663865546217, |
| "grad_norm": 0.7089430053862654, |
| "learning_rate": 3.312526551364667e-05, |
| "loss": 0.1716, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17129768431186676, |
| "step": 2300, |
| "valid_targets_mean": 1451.4, |
| "valid_targets_min": 734 |
| }, |
| { |
| "epoch": 2.421218487394958, |
| "grad_norm": 0.5820555364713835, |
| "learning_rate": 3.308569356856616e-05, |
| "loss": 0.1706, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1320435255765915, |
| "step": 2305, |
| "valid_targets_mean": 2171.5, |
| "valid_targets_min": 978 |
| }, |
| { |
| "epoch": 2.426470588235294, |
| "grad_norm": 0.6553889260546893, |
| "learning_rate": 3.3046031845851993e-05, |
| "loss": 0.1644, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16868937015533447, |
| "step": 2310, |
| "valid_targets_mean": 1519.2, |
| "valid_targets_min": 595 |
| }, |
| { |
| "epoch": 2.43172268907563, |
| "grad_norm": 0.7087358397507307, |
| "learning_rate": 3.3006280617613214e-05, |
| "loss": 0.1747, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17215979099273682, |
| "step": 2315, |
| "valid_targets_mean": 1396.3, |
| "valid_targets_min": 570 |
| }, |
| { |
| "epoch": 2.4369747899159666, |
| "grad_norm": 0.7369066907552546, |
| "learning_rate": 3.296644015657295e-05, |
| "loss": 0.1754, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18438240885734558, |
| "step": 2320, |
| "valid_targets_mean": 1494.4, |
| "valid_targets_min": 914 |
| }, |
| { |
| "epoch": 2.4422268907563023, |
| "grad_norm": 0.69010875765003, |
| "learning_rate": 3.292651073606652e-05, |
| "loss": 0.1719, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16703712940216064, |
| "step": 2325, |
| "valid_targets_mean": 1541.1, |
| "valid_targets_min": 1070 |
| }, |
| { |
| "epoch": 2.447478991596639, |
| "grad_norm": 0.7340635719059896, |
| "learning_rate": 3.288649263003958e-05, |
| "loss": 0.1748, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18820658326148987, |
| "step": 2330, |
| "valid_targets_mean": 1509.0, |
| "valid_targets_min": 626 |
| }, |
| { |
| "epoch": 2.452731092436975, |
| "grad_norm": 0.7197216030974956, |
| "learning_rate": 3.284638611304623e-05, |
| "loss": 0.1742, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17071965336799622, |
| "step": 2335, |
| "valid_targets_mean": 1484.4, |
| "valid_targets_min": 718 |
| }, |
| { |
| "epoch": 2.457983193277311, |
| "grad_norm": 0.7517975842539306, |
| "learning_rate": 3.280619146024714e-05, |
| "loss": 0.1846, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.19978466629981995, |
| "step": 2340, |
| "valid_targets_mean": 1505.0, |
| "valid_targets_min": 762 |
| }, |
| { |
| "epoch": 2.463235294117647, |
| "grad_norm": 0.7266865301196809, |
| "learning_rate": 3.2765908947407665e-05, |
| "loss": 0.2243, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2888498306274414, |
| "step": 2345, |
| "valid_targets_mean": 3602.9, |
| "valid_targets_min": 1698 |
| }, |
| { |
| "epoch": 2.4684873949579833, |
| "grad_norm": 0.5649119554586547, |
| "learning_rate": 3.2725538850895933e-05, |
| "loss": 0.2777, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.25794461369514465, |
| "step": 2350, |
| "valid_targets_mean": 3718.5, |
| "valid_targets_min": 533 |
| }, |
| { |
| "epoch": 2.4737394957983194, |
| "grad_norm": 0.7045726718503901, |
| "learning_rate": 3.268508144768096e-05, |
| "loss": 0.2725, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2772102653980255, |
| "step": 2355, |
| "valid_targets_mean": 3299.2, |
| "valid_targets_min": 835 |
| }, |
| { |
| "epoch": 2.4789915966386555, |
| "grad_norm": 0.564312940590048, |
| "learning_rate": 3.264453701533075e-05, |
| "loss": 0.2685, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2812797725200653, |
| "step": 2360, |
| "valid_targets_mean": 4040.6, |
| "valid_targets_min": 1201 |
| }, |
| { |
| "epoch": 2.4842436974789917, |
| "grad_norm": 0.6103845308794094, |
| "learning_rate": 3.260390583201041e-05, |
| "loss": 0.2546, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.26815706491470337, |
| "step": 2365, |
| "valid_targets_mean": 3995.7, |
| "valid_targets_min": 980 |
| }, |
| { |
| "epoch": 2.4894957983193278, |
| "grad_norm": 0.5643937322946125, |
| "learning_rate": 3.2563188176480217e-05, |
| "loss": 0.2817, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.31056275963783264, |
| "step": 2370, |
| "valid_targets_mean": 4070.5, |
| "valid_targets_min": 1744 |
| }, |
| { |
| "epoch": 2.494747899159664, |
| "grad_norm": 0.5232363392589175, |
| "learning_rate": 3.252238432809368e-05, |
| "loss": 0.2435, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.22355665266513824, |
| "step": 2375, |
| "valid_targets_mean": 3831.8, |
| "valid_targets_min": 1734 |
| }, |
| { |
| "epoch": 2.5, |
| "grad_norm": 0.666569390983386, |
| "learning_rate": 3.2481494566795716e-05, |
| "loss": 0.2587, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2557009756565094, |
| "step": 2380, |
| "valid_targets_mean": 4593.9, |
| "valid_targets_min": 1381 |
| }, |
| { |
| "epoch": 2.505252100840336, |
| "grad_norm": 0.5634090394701392, |
| "learning_rate": 3.244051917312061e-05, |
| "loss": 0.2671, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2774540185928345, |
| "step": 2385, |
| "valid_targets_mean": 3523.4, |
| "valid_targets_min": 1024 |
| }, |
| { |
| "epoch": 2.5105042016806722, |
| "grad_norm": 0.5827012399453538, |
| "learning_rate": 3.239945842819018e-05, |
| "loss": 0.2779, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.27029716968536377, |
| "step": 2390, |
| "valid_targets_mean": 3686.2, |
| "valid_targets_min": 2107 |
| }, |
| { |
| "epoch": 2.5157563025210083, |
| "grad_norm": 0.6119604303971371, |
| "learning_rate": 3.2358312613711804e-05, |
| "loss": 0.2674, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2673264741897583, |
| "step": 2395, |
| "valid_targets_mean": 3195.1, |
| "valid_targets_min": 802 |
| }, |
| { |
| "epoch": 2.5210084033613445, |
| "grad_norm": 0.5309909333341549, |
| "learning_rate": 3.231708201197653e-05, |
| "loss": 0.2697, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.27537453174591064, |
| "step": 2400, |
| "valid_targets_mean": 4344.2, |
| "valid_targets_min": 1597 |
| }, |
| { |
| "epoch": 2.5262605042016806, |
| "grad_norm": 0.6196309832297628, |
| "learning_rate": 3.227576690585706e-05, |
| "loss": 0.2717, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.27964839339256287, |
| "step": 2405, |
| "valid_targets_mean": 3039.4, |
| "valid_targets_min": 1535 |
| }, |
| { |
| "epoch": 2.5315126050420167, |
| "grad_norm": 0.6105328048520959, |
| "learning_rate": 3.223436757880591e-05, |
| "loss": 0.2655, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2900930643081665, |
| "step": 2410, |
| "valid_targets_mean": 3732.8, |
| "valid_targets_min": 1385 |
| }, |
| { |
| "epoch": 2.536764705882353, |
| "grad_norm": 0.6121657286750687, |
| "learning_rate": 3.219288431485337e-05, |
| "loss": 0.271, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.296478807926178, |
| "step": 2415, |
| "valid_targets_mean": 3802.3, |
| "valid_targets_min": 1451 |
| }, |
| { |
| "epoch": 2.542016806722689, |
| "grad_norm": 0.6645007327168074, |
| "learning_rate": 3.2151317398605646e-05, |
| "loss": 0.2782, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.29341888427734375, |
| "step": 2420, |
| "valid_targets_mean": 2909.6, |
| "valid_targets_min": 1269 |
| }, |
| { |
| "epoch": 2.5472689075630255, |
| "grad_norm": 0.6452736492861937, |
| "learning_rate": 3.2109667115242815e-05, |
| "loss": 0.2678, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2756231725215912, |
| "step": 2425, |
| "valid_targets_mean": 2893.6, |
| "valid_targets_min": 935 |
| }, |
| { |
| "epoch": 2.552521008403361, |
| "grad_norm": 0.6459381577493258, |
| "learning_rate": 3.206793375051694e-05, |
| "loss": 0.2821, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2834113836288452, |
| "step": 2430, |
| "valid_targets_mean": 3271.2, |
| "valid_targets_min": 1695 |
| }, |
| { |
| "epoch": 2.5577731092436977, |
| "grad_norm": 0.6599512718640789, |
| "learning_rate": 3.2026117590750086e-05, |
| "loss": 0.2787, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2733537554740906, |
| "step": 2435, |
| "valid_targets_mean": 3117.0, |
| "valid_targets_min": 671 |
| }, |
| { |
| "epoch": 2.5630252100840334, |
| "grad_norm": 0.567668736976835, |
| "learning_rate": 3.198421892283235e-05, |
| "loss": 0.2722, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2664722502231598, |
| "step": 2440, |
| "valid_targets_mean": 3738.3, |
| "valid_targets_min": 1020 |
| }, |
| { |
| "epoch": 2.56827731092437, |
| "grad_norm": 0.6231370164675432, |
| "learning_rate": 3.1942238034219885e-05, |
| "loss": 0.2675, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.28766465187072754, |
| "step": 2445, |
| "valid_targets_mean": 3198.6, |
| "valid_targets_min": 1889 |
| }, |
| { |
| "epoch": 2.5735294117647056, |
| "grad_norm": 0.6316291488754031, |
| "learning_rate": 3.190017521293296e-05, |
| "loss": 0.2649, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2555858790874481, |
| "step": 2450, |
| "valid_targets_mean": 3085.4, |
| "valid_targets_min": 1385 |
| }, |
| { |
| "epoch": 2.578781512605042, |
| "grad_norm": 0.6263309654818119, |
| "learning_rate": 3.185803074755395e-05, |
| "loss": 0.2695, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2710253596305847, |
| "step": 2455, |
| "valid_targets_mean": 3538.3, |
| "valid_targets_min": 1548 |
| }, |
| { |
| "epoch": 2.5840336134453783, |
| "grad_norm": 0.6117849557050007, |
| "learning_rate": 3.1815804927225363e-05, |
| "loss": 0.2718, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.26848098635673523, |
| "step": 2460, |
| "valid_targets_mean": 3289.2, |
| "valid_targets_min": 699 |
| }, |
| { |
| "epoch": 2.5892857142857144, |
| "grad_norm": 0.6124680799238794, |
| "learning_rate": 3.1773498041647876e-05, |
| "loss": 0.2706, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.27038100361824036, |
| "step": 2465, |
| "valid_targets_mean": 3072.8, |
| "valid_targets_min": 648 |
| }, |
| { |
| "epoch": 2.5945378151260505, |
| "grad_norm": 0.5501431568044479, |
| "learning_rate": 3.173111038107834e-05, |
| "loss": 0.2625, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2502066195011139, |
| "step": 2470, |
| "valid_targets_mean": 4004.5, |
| "valid_targets_min": 1851 |
| }, |
| { |
| "epoch": 2.5997899159663866, |
| "grad_norm": 0.5757740316879347, |
| "learning_rate": 3.168864223632776e-05, |
| "loss": 0.2665, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.26100954413414, |
| "step": 2475, |
| "valid_targets_mean": 3751.6, |
| "valid_targets_min": 1540 |
| }, |
| { |
| "epoch": 2.6050420168067228, |
| "grad_norm": 0.623122866098537, |
| "learning_rate": 3.1646093898759334e-05, |
| "loss": 0.2675, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.269726425409317, |
| "step": 2480, |
| "valid_targets_mean": 3402.6, |
| "valid_targets_min": 1410 |
| }, |
| { |
| "epoch": 2.610294117647059, |
| "grad_norm": 0.6140867953660799, |
| "learning_rate": 3.160346566028645e-05, |
| "loss": 0.2671, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.28402426838874817, |
| "step": 2485, |
| "valid_targets_mean": 3822.9, |
| "valid_targets_min": 2040 |
| }, |
| { |
| "epoch": 2.615546218487395, |
| "grad_norm": 0.6458360451166494, |
| "learning_rate": 3.156075781337068e-05, |
| "loss": 0.2722, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2804952561855316, |
| "step": 2490, |
| "valid_targets_mean": 2824.4, |
| "valid_targets_min": 1458 |
| }, |
| { |
| "epoch": 2.620798319327731, |
| "grad_norm": 0.614578628604973, |
| "learning_rate": 3.1517970651019735e-05, |
| "loss": 0.2673, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.267007976770401, |
| "step": 2495, |
| "valid_targets_mean": 3497.6, |
| "valid_targets_min": 1589 |
| }, |
| { |
| "epoch": 2.6260504201680672, |
| "grad_norm": 0.6550756431874655, |
| "learning_rate": 3.1475104466785536e-05, |
| "loss": 0.2628, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2752663195133209, |
| "step": 2500, |
| "valid_targets_mean": 2745.1, |
| "valid_targets_min": 513 |
| }, |
| { |
| "epoch": 2.6313025210084033, |
| "grad_norm": 0.7285449233093796, |
| "learning_rate": 3.143215955476211e-05, |
| "loss": 0.2695, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.30785495042800903, |
| "step": 2505, |
| "valid_targets_mean": 3143.5, |
| "valid_targets_min": 1636 |
| }, |
| { |
| "epoch": 2.6365546218487395, |
| "grad_norm": 0.5763401907930161, |
| "learning_rate": 3.138913620958365e-05, |
| "loss": 0.266, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.26492440700531006, |
| "step": 2510, |
| "valid_targets_mean": 3906.8, |
| "valid_targets_min": 2383 |
| }, |
| { |
| "epoch": 2.6418067226890756, |
| "grad_norm": 0.5946439618794739, |
| "learning_rate": 3.134603472642244e-05, |
| "loss": 0.2672, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.25987619161605835, |
| "step": 2515, |
| "valid_targets_mean": 3180.3, |
| "valid_targets_min": 1372 |
| }, |
| { |
| "epoch": 2.6470588235294117, |
| "grad_norm": 0.7017146713713763, |
| "learning_rate": 3.1302855400986866e-05, |
| "loss": 0.2652, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.25516122579574585, |
| "step": 2520, |
| "valid_targets_mean": 2634.1, |
| "valid_targets_min": 1401 |
| }, |
| { |
| "epoch": 2.652310924369748, |
| "grad_norm": 0.7063131822296524, |
| "learning_rate": 3.1259598529519336e-05, |
| "loss": 0.27, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2827465236186981, |
| "step": 2525, |
| "valid_targets_mean": 2937.3, |
| "valid_targets_min": 1504 |
| }, |
| { |
| "epoch": 2.657563025210084, |
| "grad_norm": 0.6322826497339568, |
| "learning_rate": 3.121626440879432e-05, |
| "loss": 0.2532, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.24802082777023315, |
| "step": 2530, |
| "valid_targets_mean": 3097.8, |
| "valid_targets_min": 1648 |
| }, |
| { |
| "epoch": 2.66281512605042, |
| "grad_norm": 0.6405774977690727, |
| "learning_rate": 3.117285333611625e-05, |
| "loss": 0.2679, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.247537761926651, |
| "step": 2535, |
| "valid_targets_mean": 3982.1, |
| "valid_targets_min": 959 |
| }, |
| { |
| "epoch": 2.668067226890756, |
| "grad_norm": 0.5925204140545449, |
| "learning_rate": 3.112936560931752e-05, |
| "loss": 0.2564, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.24100324511528015, |
| "step": 2540, |
| "valid_targets_mean": 3329.1, |
| "valid_targets_min": 1261 |
| }, |
| { |
| "epoch": 2.6733193277310923, |
| "grad_norm": 0.6277943771927688, |
| "learning_rate": 3.108580152675642e-05, |
| "loss": 0.2575, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2357967495918274, |
| "step": 2545, |
| "valid_targets_mean": 3185.8, |
| "valid_targets_min": 1294 |
| }, |
| { |
| "epoch": 2.678571428571429, |
| "grad_norm": 0.6292055198908869, |
| "learning_rate": 3.104216138731511e-05, |
| "loss": 0.2676, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2757669687271118, |
| "step": 2550, |
| "valid_targets_mean": 3340.1, |
| "valid_targets_min": 1432 |
| }, |
| { |
| "epoch": 2.6838235294117645, |
| "grad_norm": 0.6031199057951037, |
| "learning_rate": 3.0998445490397546e-05, |
| "loss": 0.2601, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.26977115869522095, |
| "step": 2555, |
| "valid_targets_mean": 3379.6, |
| "valid_targets_min": 742 |
| }, |
| { |
| "epoch": 2.689075630252101, |
| "grad_norm": 0.6624342295310539, |
| "learning_rate": 3.095465413592743e-05, |
| "loss": 0.276, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.27833864092826843, |
| "step": 2560, |
| "valid_targets_mean": 2969.1, |
| "valid_targets_min": 988 |
| }, |
| { |
| "epoch": 2.6943277310924367, |
| "grad_norm": 0.6361231679633825, |
| "learning_rate": 3.091078762434616e-05, |
| "loss": 0.265, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2749124765396118, |
| "step": 2565, |
| "valid_targets_mean": 3232.6, |
| "valid_targets_min": 654 |
| }, |
| { |
| "epoch": 2.6995798319327733, |
| "grad_norm": 0.616757107135465, |
| "learning_rate": 3.086684625661081e-05, |
| "loss": 0.2497, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2631353735923767, |
| "step": 2570, |
| "valid_targets_mean": 3125.7, |
| "valid_targets_min": 1328 |
| }, |
| { |
| "epoch": 2.7048319327731094, |
| "grad_norm": 0.6893720258364816, |
| "learning_rate": 3.082283033419197e-05, |
| "loss": 0.2647, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2686452567577362, |
| "step": 2575, |
| "valid_targets_mean": 3166.4, |
| "valid_targets_min": 1302 |
| }, |
| { |
| "epoch": 2.7100840336134455, |
| "grad_norm": 0.6092903528556366, |
| "learning_rate": 3.077874015907174e-05, |
| "loss": 0.2529, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2558513283729553, |
| "step": 2580, |
| "valid_targets_mean": 4101.6, |
| "valid_targets_min": 1701 |
| }, |
| { |
| "epoch": 2.7153361344537816, |
| "grad_norm": 0.5889526951400187, |
| "learning_rate": 3.073457603374167e-05, |
| "loss": 0.2533, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.25581663846969604, |
| "step": 2585, |
| "valid_targets_mean": 3677.3, |
| "valid_targets_min": 1319 |
| }, |
| { |
| "epoch": 2.7205882352941178, |
| "grad_norm": 0.642935413766165, |
| "learning_rate": 3.069033826120066e-05, |
| "loss": 0.2416, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.255086213350296, |
| "step": 2590, |
| "valid_targets_mean": 3259.8, |
| "valid_targets_min": 1194 |
| }, |
| { |
| "epoch": 2.725840336134454, |
| "grad_norm": 0.6235865519519191, |
| "learning_rate": 3.064602714495286e-05, |
| "loss": 0.2711, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.25447195768356323, |
| "step": 2595, |
| "valid_targets_mean": 2886.7, |
| "valid_targets_min": 1220 |
| }, |
| { |
| "epoch": 2.73109243697479, |
| "grad_norm": 0.5840881578880576, |
| "learning_rate": 3.060164298900565e-05, |
| "loss": 0.2541, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.25606703758239746, |
| "step": 2600, |
| "valid_targets_mean": 3948.4, |
| "valid_targets_min": 1742 |
| }, |
| { |
| "epoch": 2.736344537815126, |
| "grad_norm": 0.70617682044821, |
| "learning_rate": 3.055718609786749e-05, |
| "loss": 0.2641, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2716052234172821, |
| "step": 2605, |
| "valid_targets_mean": 2877.3, |
| "valid_targets_min": 1234 |
| }, |
| { |
| "epoch": 2.741596638655462, |
| "grad_norm": 0.6377305035799299, |
| "learning_rate": 3.051265677654585e-05, |
| "loss": 0.2687, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2713176906108856, |
| "step": 2610, |
| "valid_targets_mean": 3126.6, |
| "valid_targets_min": 1686 |
| }, |
| { |
| "epoch": 2.7468487394957983, |
| "grad_norm": 0.5626998875518994, |
| "learning_rate": 3.0468055330545162e-05, |
| "loss": 0.2651, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.23960676789283752, |
| "step": 2615, |
| "valid_targets_mean": 3957.4, |
| "valid_targets_min": 618 |
| }, |
| { |
| "epoch": 2.7521008403361344, |
| "grad_norm": 0.6556128296668272, |
| "learning_rate": 3.0423382065864653e-05, |
| "loss": 0.2577, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.25945764780044556, |
| "step": 2620, |
| "valid_targets_mean": 2844.3, |
| "valid_targets_min": 1364 |
| }, |
| { |
| "epoch": 2.7573529411764706, |
| "grad_norm": 0.6666237064634677, |
| "learning_rate": 3.0378637288996304e-05, |
| "loss": 0.2505, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.26987403631210327, |
| "step": 2625, |
| "valid_targets_mean": 3537.1, |
| "valid_targets_min": 1514 |
| }, |
| { |
| "epoch": 2.7626050420168067, |
| "grad_norm": 0.6590248047133942, |
| "learning_rate": 3.033382130692269e-05, |
| "loss": 0.2504, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.26807478070259094, |
| "step": 2630, |
| "valid_targets_mean": 2863.1, |
| "valid_targets_min": 1073 |
| }, |
| { |
| "epoch": 2.767857142857143, |
| "grad_norm": 0.6761466657105407, |
| "learning_rate": 3.0288934427114955e-05, |
| "loss": 0.2553, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.27322080731391907, |
| "step": 2635, |
| "valid_targets_mean": 2907.8, |
| "valid_targets_min": 1026 |
| }, |
| { |
| "epoch": 2.773109243697479, |
| "grad_norm": 0.6353889677418061, |
| "learning_rate": 3.0243976957530602e-05, |
| "loss": 0.2463, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.23086395859718323, |
| "step": 2640, |
| "valid_targets_mean": 2695.9, |
| "valid_targets_min": 1254 |
| }, |
| { |
| "epoch": 2.778361344537815, |
| "grad_norm": 0.7083565681570431, |
| "learning_rate": 3.0198949206611475e-05, |
| "loss": 0.2493, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.27140820026397705, |
| "step": 2645, |
| "valid_targets_mean": 3112.3, |
| "valid_targets_min": 720 |
| }, |
| { |
| "epoch": 2.783613445378151, |
| "grad_norm": 0.6445873412413864, |
| "learning_rate": 3.0153851483281582e-05, |
| "loss": 0.2574, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.29137080907821655, |
| "step": 2650, |
| "valid_targets_mean": 3687.8, |
| "valid_targets_min": 1817 |
| }, |
| { |
| "epoch": 2.7888655462184873, |
| "grad_norm": 0.6275537197106373, |
| "learning_rate": 3.010868409694499e-05, |
| "loss": 0.2617, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2466498464345932, |
| "step": 2655, |
| "valid_targets_mean": 3197.7, |
| "valid_targets_min": 1411 |
| }, |
| { |
| "epoch": 2.7941176470588234, |
| "grad_norm": 0.5902973797283267, |
| "learning_rate": 3.0063447357483712e-05, |
| "loss": 0.2595, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2413676530122757, |
| "step": 2660, |
| "valid_targets_mean": 3804.1, |
| "valid_targets_min": 2253 |
| }, |
| { |
| "epoch": 2.79936974789916, |
| "grad_norm": 0.6686261268710058, |
| "learning_rate": 3.0018141575255587e-05, |
| "loss": 0.2557, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2801203727722168, |
| "step": 2665, |
| "valid_targets_mean": 3269.8, |
| "valid_targets_min": 1860 |
| }, |
| { |
| "epoch": 2.8046218487394956, |
| "grad_norm": 0.5958481124800947, |
| "learning_rate": 2.9972767061092107e-05, |
| "loss": 0.2523, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.24206840991973877, |
| "step": 2670, |
| "valid_targets_mean": 3550.5, |
| "valid_targets_min": 1805 |
| }, |
| { |
| "epoch": 2.809873949579832, |
| "grad_norm": 0.5964898157229672, |
| "learning_rate": 2.9927324126296352e-05, |
| "loss": 0.2584, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.24410061538219452, |
| "step": 2675, |
| "valid_targets_mean": 3646.2, |
| "valid_targets_min": 1145 |
| }, |
| { |
| "epoch": 2.815126050420168, |
| "grad_norm": 0.6446057186222791, |
| "learning_rate": 2.98818130826408e-05, |
| "loss": 0.252, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2676333785057068, |
| "step": 2680, |
| "valid_targets_mean": 3167.9, |
| "valid_targets_min": 1722 |
| }, |
| { |
| "epoch": 2.8203781512605044, |
| "grad_norm": 0.7582205523508831, |
| "learning_rate": 2.9836234242365204e-05, |
| "loss": 0.2476, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.25383812189102173, |
| "step": 2685, |
| "valid_targets_mean": 2996.0, |
| "valid_targets_min": 1423 |
| }, |
| { |
| "epoch": 2.82563025210084, |
| "grad_norm": 0.6301709788550426, |
| "learning_rate": 2.979058791817447e-05, |
| "loss": 0.2661, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2749696969985962, |
| "step": 2690, |
| "valid_targets_mean": 3538.0, |
| "valid_targets_min": 1426 |
| }, |
| { |
| "epoch": 2.8308823529411766, |
| "grad_norm": 0.6480505666026394, |
| "learning_rate": 2.974487442323647e-05, |
| "loss": 0.2685, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2599114179611206, |
| "step": 2695, |
| "valid_targets_mean": 3115.1, |
| "valid_targets_min": 538 |
| }, |
| { |
| "epoch": 2.8361344537815127, |
| "grad_norm": 0.6882139342020044, |
| "learning_rate": 2.9699094071179938e-05, |
| "loss": 0.2552, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2708072364330292, |
| "step": 2700, |
| "valid_targets_mean": 2551.9, |
| "valid_targets_min": 537 |
| }, |
| { |
| "epoch": 2.841386554621849, |
| "grad_norm": 0.6582888441321656, |
| "learning_rate": 2.9653247176092286e-05, |
| "loss": 0.2684, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2539324164390564, |
| "step": 2705, |
| "valid_targets_mean": 3079.0, |
| "valid_targets_min": 845 |
| }, |
| { |
| "epoch": 2.846638655462185, |
| "grad_norm": 0.638833559343612, |
| "learning_rate": 2.9607334052517466e-05, |
| "loss": 0.2569, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.28745412826538086, |
| "step": 2710, |
| "valid_targets_mean": 3822.1, |
| "valid_targets_min": 1625 |
| }, |
| { |
| "epoch": 2.851890756302521, |
| "grad_norm": 0.7422015502102081, |
| "learning_rate": 2.9561355015453803e-05, |
| "loss": 0.2732, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.29670873284339905, |
| "step": 2715, |
| "valid_targets_mean": 2883.9, |
| "valid_targets_min": 1400 |
| }, |
| { |
| "epoch": 2.857142857142857, |
| "grad_norm": 0.6490748235477826, |
| "learning_rate": 2.9515310380351847e-05, |
| "loss": 0.2608, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.24093633890151978, |
| "step": 2720, |
| "valid_targets_mean": 3222.6, |
| "valid_targets_min": 1868 |
| }, |
| { |
| "epoch": 2.8623949579831933, |
| "grad_norm": 0.7372791077034592, |
| "learning_rate": 2.9469200463112186e-05, |
| "loss": 0.2659, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.25444963574409485, |
| "step": 2725, |
| "valid_targets_mean": 2862.1, |
| "valid_targets_min": 648 |
| }, |
| { |
| "epoch": 2.8676470588235294, |
| "grad_norm": 0.7192710572965154, |
| "learning_rate": 2.9423025580083298e-05, |
| "loss": 0.2623, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.245719313621521, |
| "step": 2730, |
| "valid_targets_mean": 3024.6, |
| "valid_targets_min": 1404 |
| }, |
| { |
| "epoch": 2.8728991596638656, |
| "grad_norm": 0.6647970803562331, |
| "learning_rate": 2.937678604805938e-05, |
| "loss": 0.268, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2540484070777893, |
| "step": 2735, |
| "valid_targets_mean": 3429.3, |
| "valid_targets_min": 814 |
| }, |
| { |
| "epoch": 2.8781512605042017, |
| "grad_norm": 0.612522922361621, |
| "learning_rate": 2.9330482184278168e-05, |
| "loss": 0.2619, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2477385699748993, |
| "step": 2740, |
| "valid_targets_mean": 3270.8, |
| "valid_targets_min": 953 |
| }, |
| { |
| "epoch": 2.883403361344538, |
| "grad_norm": 0.7016630866988153, |
| "learning_rate": 2.9284114306418758e-05, |
| "loss": 0.2545, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2649661898612976, |
| "step": 2745, |
| "valid_targets_mean": 3123.0, |
| "valid_targets_min": 1410 |
| }, |
| { |
| "epoch": 2.888655462184874, |
| "grad_norm": 0.6661752773535051, |
| "learning_rate": 2.923768273259942e-05, |
| "loss": 0.2639, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.263710081577301, |
| "step": 2750, |
| "valid_targets_mean": 3085.5, |
| "valid_targets_min": 530 |
| }, |
| { |
| "epoch": 2.89390756302521, |
| "grad_norm": 0.6197849509680783, |
| "learning_rate": 2.919118778137546e-05, |
| "loss": 0.2659, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.25989899039268494, |
| "step": 2755, |
| "valid_targets_mean": 3491.7, |
| "valid_targets_min": 1066 |
| }, |
| { |
| "epoch": 2.899159663865546, |
| "grad_norm": 0.594389488012544, |
| "learning_rate": 2.9144629771736954e-05, |
| "loss": 0.2689, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2792191207408905, |
| "step": 2760, |
| "valid_targets_mean": 3904.9, |
| "valid_targets_min": 1613 |
| }, |
| { |
| "epoch": 2.9044117647058822, |
| "grad_norm": 0.5752638283362668, |
| "learning_rate": 2.9098009023106645e-05, |
| "loss": 0.2538, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.23264659941196442, |
| "step": 2765, |
| "valid_targets_mean": 3731.6, |
| "valid_targets_min": 952 |
| }, |
| { |
| "epoch": 2.9096638655462184, |
| "grad_norm": 0.6490696888490648, |
| "learning_rate": 2.9051325855337684e-05, |
| "loss": 0.2605, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.26240965723991394, |
| "step": 2770, |
| "valid_targets_mean": 2823.0, |
| "valid_targets_min": 1025 |
| }, |
| { |
| "epoch": 2.9149159663865545, |
| "grad_norm": 0.6126363252048349, |
| "learning_rate": 2.90045805887115e-05, |
| "loss": 0.2539, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.27359646558761597, |
| "step": 2775, |
| "valid_targets_mean": 4032.0, |
| "valid_targets_min": 1397 |
| }, |
| { |
| "epoch": 2.9201680672268906, |
| "grad_norm": 0.6068839428847373, |
| "learning_rate": 2.8957773543935518e-05, |
| "loss": 0.2559, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2474924623966217, |
| "step": 2780, |
| "valid_targets_mean": 3534.0, |
| "valid_targets_min": 1920 |
| }, |
| { |
| "epoch": 2.9254201680672267, |
| "grad_norm": 0.6329791757885024, |
| "learning_rate": 2.8910905042141046e-05, |
| "loss": 0.2452, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.25704294443130493, |
| "step": 2785, |
| "valid_targets_mean": 3527.5, |
| "valid_targets_min": 1687 |
| }, |
| { |
| "epoch": 2.9306722689075633, |
| "grad_norm": 0.6948103907388832, |
| "learning_rate": 2.8863975404881022e-05, |
| "loss": 0.2574, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.30331847071647644, |
| "step": 2790, |
| "valid_targets_mean": 3213.0, |
| "valid_targets_min": 1564 |
| }, |
| { |
| "epoch": 2.935924369747899, |
| "grad_norm": 0.6352221742702212, |
| "learning_rate": 2.881698495412781e-05, |
| "loss": 0.2477, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2414446771144867, |
| "step": 2795, |
| "valid_targets_mean": 3689.7, |
| "valid_targets_min": 1947 |
| }, |
| { |
| "epoch": 2.9411764705882355, |
| "grad_norm": 0.6629581821365779, |
| "learning_rate": 2.8769934012271004e-05, |
| "loss": 0.2462, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.25725820660591125, |
| "step": 2800, |
| "valid_targets_mean": 2978.2, |
| "valid_targets_min": 1447 |
| }, |
| { |
| "epoch": 2.946428571428571, |
| "grad_norm": 0.6673202572073865, |
| "learning_rate": 2.8722822902115228e-05, |
| "loss": 0.2448, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.25360405445098877, |
| "step": 2805, |
| "valid_targets_mean": 3016.5, |
| "valid_targets_min": 1243 |
| }, |
| { |
| "epoch": 2.9516806722689077, |
| "grad_norm": 0.7063504788496237, |
| "learning_rate": 2.8675651946877884e-05, |
| "loss": 0.2506, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.27201586961746216, |
| "step": 2810, |
| "valid_targets_mean": 3199.0, |
| "valid_targets_min": 1679 |
| }, |
| { |
| "epoch": 2.956932773109244, |
| "grad_norm": 0.6749918994768315, |
| "learning_rate": 2.862842147018696e-05, |
| "loss": 0.2667, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2709447741508484, |
| "step": 2815, |
| "valid_targets_mean": 3001.2, |
| "valid_targets_min": 1695 |
| }, |
| { |
| "epoch": 2.96218487394958, |
| "grad_norm": 0.6389022545015189, |
| "learning_rate": 2.858113179607881e-05, |
| "loss": 0.2539, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.24959295988082886, |
| "step": 2820, |
| "valid_targets_mean": 3370.9, |
| "valid_targets_min": 1469 |
| }, |
| { |
| "epoch": 2.967436974789916, |
| "grad_norm": 0.7014173062929902, |
| "learning_rate": 2.8533783248995938e-05, |
| "loss": 0.2515, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.24700427055358887, |
| "step": 2825, |
| "valid_targets_mean": 3245.9, |
| "valid_targets_min": 1593 |
| }, |
| { |
| "epoch": 2.972689075630252, |
| "grad_norm": 0.6469956378099957, |
| "learning_rate": 2.848637615378475e-05, |
| "loss": 0.2509, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.27041953802108765, |
| "step": 2830, |
| "valid_targets_mean": 3130.5, |
| "valid_targets_min": 1664 |
| }, |
| { |
| "epoch": 2.9779411764705883, |
| "grad_norm": 0.6169242449395833, |
| "learning_rate": 2.8438910835693314e-05, |
| "loss": 0.2443, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.22996433079242706, |
| "step": 2835, |
| "valid_targets_mean": 3460.2, |
| "valid_targets_min": 1605 |
| }, |
| { |
| "epoch": 2.9831932773109244, |
| "grad_norm": 0.6394181377322952, |
| "learning_rate": 2.8391387620369192e-05, |
| "loss": 0.2729, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2803104519844055, |
| "step": 2840, |
| "valid_targets_mean": 3288.6, |
| "valid_targets_min": 842 |
| }, |
| { |
| "epoch": 2.9884453781512605, |
| "grad_norm": 0.6854150282623844, |
| "learning_rate": 2.834380683385714e-05, |
| "loss": 0.265, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2902924418449402, |
| "step": 2845, |
| "valid_targets_mean": 3601.4, |
| "valid_targets_min": 809 |
| }, |
| { |
| "epoch": 2.9936974789915967, |
| "grad_norm": 0.6051689785920974, |
| "learning_rate": 2.8296168802596892e-05, |
| "loss": 0.2543, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2509153187274933, |
| "step": 2850, |
| "valid_targets_mean": 3752.4, |
| "valid_targets_min": 2026 |
| }, |
| { |
| "epoch": 2.9989495798319328, |
| "grad_norm": 0.6083481456927304, |
| "learning_rate": 2.8248473853420933e-05, |
| "loss": 0.2533, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2585148811340332, |
| "step": 2855, |
| "valid_targets_mean": 3430.5, |
| "valid_targets_min": 1214 |
| }, |
| { |
| "epoch": 3.004201680672269, |
| "grad_norm": 0.7319423401810515, |
| "learning_rate": 2.8200722313552247e-05, |
| "loss": 0.2164, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2003440260887146, |
| "step": 2860, |
| "valid_targets_mean": 1489.3, |
| "valid_targets_min": 722 |
| }, |
| { |
| "epoch": 3.009453781512605, |
| "grad_norm": 0.717771718263267, |
| "learning_rate": 2.8152914510602073e-05, |
| "loss": 0.1742, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17707990109920502, |
| "step": 2865, |
| "valid_targets_mean": 1515.6, |
| "valid_targets_min": 725 |
| }, |
| { |
| "epoch": 3.014705882352941, |
| "grad_norm": 0.8226879595885981, |
| "learning_rate": 2.810505077256765e-05, |
| "loss": 0.1703, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18063870072364807, |
| "step": 2870, |
| "valid_targets_mean": 1443.1, |
| "valid_targets_min": 874 |
| }, |
| { |
| "epoch": 3.0199579831932772, |
| "grad_norm": 0.8338357187658497, |
| "learning_rate": 2.8057131427829983e-05, |
| "loss": 0.1696, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17110946774482727, |
| "step": 2875, |
| "valid_targets_mean": 1316.8, |
| "valid_targets_min": 615 |
| }, |
| { |
| "epoch": 3.0252100840336134, |
| "grad_norm": 0.7376091557217379, |
| "learning_rate": 2.800915680515157e-05, |
| "loss": 0.1698, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17430976033210754, |
| "step": 2880, |
| "valid_targets_mean": 1540.8, |
| "valid_targets_min": 715 |
| }, |
| { |
| "epoch": 3.0304621848739495, |
| "grad_norm": 0.7831042239119287, |
| "learning_rate": 2.7961127233674167e-05, |
| "loss": 0.1816, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2140425145626068, |
| "step": 2885, |
| "valid_targets_mean": 1648.9, |
| "valid_targets_min": 625 |
| }, |
| { |
| "epoch": 3.0357142857142856, |
| "grad_norm": 0.7415542108375209, |
| "learning_rate": 2.7913043042916513e-05, |
| "loss": 0.1653, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1582803726196289, |
| "step": 2890, |
| "valid_targets_mean": 1354.9, |
| "valid_targets_min": 761 |
| }, |
| { |
| "epoch": 3.0409663865546217, |
| "grad_norm": 0.715142653421594, |
| "learning_rate": 2.786490456277208e-05, |
| "loss": 0.1791, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.25299903750419617, |
| "step": 2895, |
| "valid_targets_mean": 1589.9, |
| "valid_targets_min": 703 |
| }, |
| { |
| "epoch": 3.046218487394958, |
| "grad_norm": 0.7873361806067022, |
| "learning_rate": 2.7816712123506796e-05, |
| "loss": 0.1668, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1710663139820099, |
| "step": 2900, |
| "valid_targets_mean": 1485.4, |
| "valid_targets_min": 733 |
| }, |
| { |
| "epoch": 3.051470588235294, |
| "grad_norm": 0.7770722242990561, |
| "learning_rate": 2.776846605575681e-05, |
| "loss": 0.1731, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1824086308479309, |
| "step": 2905, |
| "valid_targets_mean": 1712.8, |
| "valid_targets_min": 964 |
| }, |
| { |
| "epoch": 3.05672268907563, |
| "grad_norm": 0.7616729738480414, |
| "learning_rate": 2.772016669052618e-05, |
| "loss": 0.164, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1748737096786499, |
| "step": 2910, |
| "valid_targets_mean": 1498.4, |
| "valid_targets_min": 815 |
| }, |
| { |
| "epoch": 3.0619747899159666, |
| "grad_norm": 0.7583507582473836, |
| "learning_rate": 2.767181435918464e-05, |
| "loss": 0.1724, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1768401861190796, |
| "step": 2915, |
| "valid_targets_mean": 1677.5, |
| "valid_targets_min": 1027 |
| }, |
| { |
| "epoch": 3.0672268907563027, |
| "grad_norm": 0.7278307085282013, |
| "learning_rate": 2.7623409393465298e-05, |
| "loss": 0.166, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1581869125366211, |
| "step": 2920, |
| "valid_targets_mean": 1325.3, |
| "valid_targets_min": 570 |
| }, |
| { |
| "epoch": 3.072478991596639, |
| "grad_norm": 0.7617121869975262, |
| "learning_rate": 2.7574952125462386e-05, |
| "loss": 0.1577, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16011205315589905, |
| "step": 2925, |
| "valid_targets_mean": 1324.7, |
| "valid_targets_min": 548 |
| }, |
| { |
| "epoch": 3.077731092436975, |
| "grad_norm": 0.7554042058432768, |
| "learning_rate": 2.7526442887628962e-05, |
| "loss": 0.1553, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15193405747413635, |
| "step": 2930, |
| "valid_targets_mean": 1288.1, |
| "valid_targets_min": 682 |
| }, |
| { |
| "epoch": 3.082983193277311, |
| "grad_norm": 0.737075733110425, |
| "learning_rate": 2.7477882012774633e-05, |
| "loss": 0.162, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16672229766845703, |
| "step": 2935, |
| "valid_targets_mean": 1563.0, |
| "valid_targets_min": 911 |
| }, |
| { |
| "epoch": 3.088235294117647, |
| "grad_norm": 0.8359898452206559, |
| "learning_rate": 2.742926983406328e-05, |
| "loss": 0.175, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16956086456775665, |
| "step": 2940, |
| "valid_targets_mean": 1278.3, |
| "valid_targets_min": 597 |
| }, |
| { |
| "epoch": 3.0934873949579833, |
| "grad_norm": 0.7553756145118757, |
| "learning_rate": 2.7380606685010767e-05, |
| "loss": 0.1735, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17766933143138885, |
| "step": 2945, |
| "valid_targets_mean": 1552.1, |
| "valid_targets_min": 772 |
| }, |
| { |
| "epoch": 3.0987394957983194, |
| "grad_norm": 0.7472526084646638, |
| "learning_rate": 2.7331892899482654e-05, |
| "loss": 0.1697, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1692330241203308, |
| "step": 2950, |
| "valid_targets_mean": 1548.2, |
| "valid_targets_min": 940 |
| }, |
| { |
| "epoch": 3.1039915966386555, |
| "grad_norm": 0.6799508713485111, |
| "learning_rate": 2.7283128811691893e-05, |
| "loss": 0.1642, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.146545872092247, |
| "step": 2955, |
| "valid_targets_mean": 1334.6, |
| "valid_targets_min": 785 |
| }, |
| { |
| "epoch": 3.1092436974789917, |
| "grad_norm": 0.7171813544493029, |
| "learning_rate": 2.7234314756196564e-05, |
| "loss": 0.1689, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15770323574543, |
| "step": 2960, |
| "valid_targets_mean": 1404.9, |
| "valid_targets_min": 617 |
| }, |
| { |
| "epoch": 3.1144957983193278, |
| "grad_norm": 0.8566587780828107, |
| "learning_rate": 2.718545106789755e-05, |
| "loss": 0.1698, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17677560448646545, |
| "step": 2965, |
| "valid_targets_mean": 1266.8, |
| "valid_targets_min": 648 |
| }, |
| { |
| "epoch": 3.119747899159664, |
| "grad_norm": 0.8193397073508751, |
| "learning_rate": 2.713653808203626e-05, |
| "loss": 0.1581, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15627950429916382, |
| "step": 2970, |
| "valid_targets_mean": 1427.1, |
| "valid_targets_min": 634 |
| }, |
| { |
| "epoch": 3.125, |
| "grad_norm": 0.8274451736674825, |
| "learning_rate": 2.7087576134192305e-05, |
| "loss": 0.1606, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16775844991207123, |
| "step": 2975, |
| "valid_targets_mean": 1421.0, |
| "valid_targets_min": 774 |
| }, |
| { |
| "epoch": 3.130252100840336, |
| "grad_norm": 0.6953309030381479, |
| "learning_rate": 2.7038565560281252e-05, |
| "loss": 0.1607, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16650184988975525, |
| "step": 2980, |
| "valid_targets_mean": 1685.9, |
| "valid_targets_min": 563 |
| }, |
| { |
| "epoch": 3.1355042016806722, |
| "grad_norm": 0.8099890208928163, |
| "learning_rate": 2.6989506696552224e-05, |
| "loss": 0.1619, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16752278804779053, |
| "step": 2985, |
| "valid_targets_mean": 1378.0, |
| "valid_targets_min": 837 |
| }, |
| { |
| "epoch": 3.1407563025210083, |
| "grad_norm": 0.7795749997325356, |
| "learning_rate": 2.6940399879585685e-05, |
| "loss": 0.1627, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16560722887516022, |
| "step": 2990, |
| "valid_targets_mean": 1599.2, |
| "valid_targets_min": 803 |
| }, |
| { |
| "epoch": 3.1460084033613445, |
| "grad_norm": 0.7336389778027822, |
| "learning_rate": 2.6891245446291093e-05, |
| "loss": 0.1674, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14416930079460144, |
| "step": 2995, |
| "valid_targets_mean": 1380.4, |
| "valid_targets_min": 797 |
| }, |
| { |
| "epoch": 3.1512605042016806, |
| "grad_norm": 0.7490034715901619, |
| "learning_rate": 2.6842043733904578e-05, |
| "loss": 0.1593, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15650300681591034, |
| "step": 3000, |
| "valid_targets_mean": 1571.5, |
| "valid_targets_min": 646 |
| }, |
| { |
| "epoch": 3.1565126050420167, |
| "grad_norm": 0.8401911427116212, |
| "learning_rate": 2.6792795079986634e-05, |
| "loss": 0.1679, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17290136218070984, |
| "step": 3005, |
| "valid_targets_mean": 1447.8, |
| "valid_targets_min": 591 |
| }, |
| { |
| "epoch": 3.161764705882353, |
| "grad_norm": 0.8101203980462212, |
| "learning_rate": 2.6743499822419833e-05, |
| "loss": 0.1663, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18794336915016174, |
| "step": 3010, |
| "valid_targets_mean": 1512.7, |
| "valid_targets_min": 796 |
| }, |
| { |
| "epoch": 3.167016806722689, |
| "grad_norm": 0.7549079816000475, |
| "learning_rate": 2.669415829940646e-05, |
| "loss": 0.1578, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.148887038230896, |
| "step": 3015, |
| "valid_targets_mean": 1333.1, |
| "valid_targets_min": 848 |
| }, |
| { |
| "epoch": 3.172268907563025, |
| "grad_norm": 0.8655198786602623, |
| "learning_rate": 2.6644770849466226e-05, |
| "loss": 0.1575, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14870238304138184, |
| "step": 3020, |
| "valid_targets_mean": 1233.6, |
| "valid_targets_min": 665 |
| }, |
| { |
| "epoch": 3.177521008403361, |
| "grad_norm": 0.6869481556598374, |
| "learning_rate": 2.6595337811433925e-05, |
| "loss": 0.1573, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1471511870622635, |
| "step": 3025, |
| "valid_targets_mean": 1408.1, |
| "valid_targets_min": 652 |
| }, |
| { |
| "epoch": 3.1827731092436973, |
| "grad_norm": 0.8476070443290739, |
| "learning_rate": 2.654585952445714e-05, |
| "loss": 0.1563, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17854884266853333, |
| "step": 3030, |
| "valid_targets_mean": 1573.8, |
| "valid_targets_min": 662 |
| }, |
| { |
| "epoch": 3.1880252100840334, |
| "grad_norm": 0.759943747176002, |
| "learning_rate": 2.6496336327993882e-05, |
| "loss": 0.1566, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17004242539405823, |
| "step": 3035, |
| "valid_targets_mean": 1410.9, |
| "valid_targets_min": 770 |
| }, |
| { |
| "epoch": 3.19327731092437, |
| "grad_norm": 0.7914392244697611, |
| "learning_rate": 2.6446768561810264e-05, |
| "loss": 0.1581, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16128523647785187, |
| "step": 3040, |
| "valid_targets_mean": 1338.0, |
| "valid_targets_min": 842 |
| }, |
| { |
| "epoch": 3.198529411764706, |
| "grad_norm": 0.7573632096372179, |
| "learning_rate": 2.6397156565978198e-05, |
| "loss": 0.1623, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16719350218772888, |
| "step": 3045, |
| "valid_targets_mean": 1522.6, |
| "valid_targets_min": 773 |
| }, |
| { |
| "epoch": 3.203781512605042, |
| "grad_norm": 0.7823159419268372, |
| "learning_rate": 2.6347500680873043e-05, |
| "loss": 0.1599, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.170121967792511, |
| "step": 3050, |
| "valid_targets_mean": 1530.2, |
| "valid_targets_min": 807 |
| }, |
| { |
| "epoch": 3.2090336134453783, |
| "grad_norm": 0.7715992991548748, |
| "learning_rate": 2.6297801247171258e-05, |
| "loss": 0.1645, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14779695868492126, |
| "step": 3055, |
| "valid_targets_mean": 1266.6, |
| "valid_targets_min": 782 |
| }, |
| { |
| "epoch": 3.2142857142857144, |
| "grad_norm": 0.7213196908664066, |
| "learning_rate": 2.6248058605848097e-05, |
| "loss": 0.1512, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17193026840686798, |
| "step": 3060, |
| "valid_targets_mean": 1624.2, |
| "valid_targets_min": 634 |
| }, |
| { |
| "epoch": 3.2195378151260505, |
| "grad_norm": 0.7460107195452109, |
| "learning_rate": 2.6198273098175234e-05, |
| "loss": 0.1684, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1723858267068863, |
| "step": 3065, |
| "valid_targets_mean": 1508.1, |
| "valid_targets_min": 573 |
| }, |
| { |
| "epoch": 3.2247899159663866, |
| "grad_norm": 0.7033456921737298, |
| "learning_rate": 2.614844506571844e-05, |
| "loss": 0.1588, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16065514087677002, |
| "step": 3070, |
| "valid_targets_mean": 1645.1, |
| "valid_targets_min": 718 |
| }, |
| { |
| "epoch": 3.2300420168067228, |
| "grad_norm": 0.700948054604266, |
| "learning_rate": 2.609857485033525e-05, |
| "loss": 0.1648, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.13682524859905243, |
| "step": 3075, |
| "valid_targets_mean": 1385.9, |
| "valid_targets_min": 685 |
| }, |
| { |
| "epoch": 3.235294117647059, |
| "grad_norm": 0.8365081550151657, |
| "learning_rate": 2.6048662794172595e-05, |
| "loss": 0.156, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1537787914276123, |
| "step": 3080, |
| "valid_targets_mean": 1489.9, |
| "valid_targets_min": 744 |
| }, |
| { |
| "epoch": 3.240546218487395, |
| "grad_norm": 0.9620567262629217, |
| "learning_rate": 2.599870923966447e-05, |
| "loss": 0.1613, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15811693668365479, |
| "step": 3085, |
| "valid_targets_mean": 1253.3, |
| "valid_targets_min": 650 |
| }, |
| { |
| "epoch": 3.245798319327731, |
| "grad_norm": 0.7129512442205985, |
| "learning_rate": 2.5948714529529565e-05, |
| "loss": 0.1626, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16663914918899536, |
| "step": 3090, |
| "valid_targets_mean": 1337.3, |
| "valid_targets_min": 780 |
| }, |
| { |
| "epoch": 3.2510504201680672, |
| "grad_norm": 0.728601631393252, |
| "learning_rate": 2.5898679006768958e-05, |
| "loss": 0.1507, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14995308220386505, |
| "step": 3095, |
| "valid_targets_mean": 1344.5, |
| "valid_targets_min": 677 |
| }, |
| { |
| "epoch": 3.2563025210084033, |
| "grad_norm": 0.7807161695418345, |
| "learning_rate": 2.5848603014663702e-05, |
| "loss": 0.1554, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15245237946510315, |
| "step": 3100, |
| "valid_targets_mean": 1302.3, |
| "valid_targets_min": 727 |
| }, |
| { |
| "epoch": 3.2615546218487395, |
| "grad_norm": 0.7833067221288974, |
| "learning_rate": 2.579848689677252e-05, |
| "loss": 0.16, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.164436474442482, |
| "step": 3105, |
| "valid_targets_mean": 1489.2, |
| "valid_targets_min": 726 |
| }, |
| { |
| "epoch": 3.2668067226890756, |
| "grad_norm": 0.7582720046388419, |
| "learning_rate": 2.5748330996929414e-05, |
| "loss": 0.1641, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17622435092926025, |
| "step": 3110, |
| "valid_targets_mean": 1497.3, |
| "valid_targets_min": 669 |
| }, |
| { |
| "epoch": 3.2720588235294117, |
| "grad_norm": 0.6761627015093946, |
| "learning_rate": 2.5698135659241334e-05, |
| "loss": 0.1564, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14206218719482422, |
| "step": 3115, |
| "valid_targets_mean": 1376.9, |
| "valid_targets_min": 750 |
| }, |
| { |
| "epoch": 3.277310924369748, |
| "grad_norm": 0.7569519780492563, |
| "learning_rate": 2.564790122808579e-05, |
| "loss": 0.1572, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15797209739685059, |
| "step": 3120, |
| "valid_targets_mean": 1475.9, |
| "valid_targets_min": 736 |
| }, |
| { |
| "epoch": 3.282563025210084, |
| "grad_norm": 0.7724507253369616, |
| "learning_rate": 2.5597628048108504e-05, |
| "loss": 0.1598, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1651463806629181, |
| "step": 3125, |
| "valid_targets_mean": 1426.2, |
| "valid_targets_min": 694 |
| }, |
| { |
| "epoch": 3.28781512605042, |
| "grad_norm": 0.7583229755048851, |
| "learning_rate": 2.5547316464221058e-05, |
| "loss": 0.1569, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1635044515132904, |
| "step": 3130, |
| "valid_targets_mean": 1547.6, |
| "valid_targets_min": 753 |
| }, |
| { |
| "epoch": 3.293067226890756, |
| "grad_norm": 0.7492941228082307, |
| "learning_rate": 2.5496966821598493e-05, |
| "loss": 0.1513, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14868690073490143, |
| "step": 3135, |
| "valid_targets_mean": 1277.1, |
| "valid_targets_min": 809 |
| }, |
| { |
| "epoch": 3.2983193277310923, |
| "grad_norm": 0.7918115514025105, |
| "learning_rate": 2.5446579465676977e-05, |
| "loss": 0.1565, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14087459444999695, |
| "step": 3140, |
| "valid_targets_mean": 1292.3, |
| "valid_targets_min": 698 |
| }, |
| { |
| "epoch": 3.3035714285714284, |
| "grad_norm": 0.7674670047525459, |
| "learning_rate": 2.5396154742151407e-05, |
| "loss": 0.1457, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15545767545700073, |
| "step": 3145, |
| "valid_targets_mean": 1448.1, |
| "valid_targets_min": 750 |
| }, |
| { |
| "epoch": 3.3088235294117645, |
| "grad_norm": 0.8361476210011558, |
| "learning_rate": 2.5345692996973075e-05, |
| "loss": 0.1605, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17045646905899048, |
| "step": 3150, |
| "valid_targets_mean": 1472.6, |
| "valid_targets_min": 733 |
| }, |
| { |
| "epoch": 3.314075630252101, |
| "grad_norm": 0.7425956748582699, |
| "learning_rate": 2.5295194576347233e-05, |
| "loss": 0.156, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15749000012874603, |
| "step": 3155, |
| "valid_targets_mean": 1597.3, |
| "valid_targets_min": 907 |
| }, |
| { |
| "epoch": 3.3193277310924367, |
| "grad_norm": 0.778056511779034, |
| "learning_rate": 2.5244659826730774e-05, |
| "loss": 0.1519, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17436806857585907, |
| "step": 3160, |
| "valid_targets_mean": 1564.9, |
| "valid_targets_min": 898 |
| }, |
| { |
| "epoch": 3.3245798319327733, |
| "grad_norm": 0.7457317148773122, |
| "learning_rate": 2.519408909482984e-05, |
| "loss": 0.1579, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16804683208465576, |
| "step": 3165, |
| "valid_targets_mean": 1660.6, |
| "valid_targets_min": 1119 |
| }, |
| { |
| "epoch": 3.3298319327731094, |
| "grad_norm": 0.8015187816073955, |
| "learning_rate": 2.5143482727597427e-05, |
| "loss": 0.1572, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16357378661632538, |
| "step": 3170, |
| "valid_targets_mean": 1392.3, |
| "valid_targets_min": 700 |
| }, |
| { |
| "epoch": 3.3350840336134455, |
| "grad_norm": 0.7927587699859597, |
| "learning_rate": 2.509284107223102e-05, |
| "loss": 0.155, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15347766876220703, |
| "step": 3175, |
| "valid_targets_mean": 1407.8, |
| "valid_targets_min": 798 |
| }, |
| { |
| "epoch": 3.3403361344537816, |
| "grad_norm": 0.8291776111318878, |
| "learning_rate": 2.50421644761702e-05, |
| "loss": 0.155, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14594411849975586, |
| "step": 3180, |
| "valid_targets_mean": 1237.5, |
| "valid_targets_min": 589 |
| }, |
| { |
| "epoch": 3.3455882352941178, |
| "grad_norm": 0.786383044943235, |
| "learning_rate": 2.499145328709429e-05, |
| "loss": 0.1552, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1620325744152069, |
| "step": 3185, |
| "valid_targets_mean": 1363.2, |
| "valid_targets_min": 673 |
| }, |
| { |
| "epoch": 3.350840336134454, |
| "grad_norm": 0.8314225202905355, |
| "learning_rate": 2.4940707852919924e-05, |
| "loss": 0.1626, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1637428104877472, |
| "step": 3190, |
| "valid_targets_mean": 1297.5, |
| "valid_targets_min": 641 |
| }, |
| { |
| "epoch": 3.35609243697479, |
| "grad_norm": 0.8247848576495689, |
| "learning_rate": 2.488992852179868e-05, |
| "loss": 0.1534, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1613052636384964, |
| "step": 3195, |
| "valid_targets_mean": 1466.3, |
| "valid_targets_min": 701 |
| }, |
| { |
| "epoch": 3.361344537815126, |
| "grad_norm": 0.7169780960903507, |
| "learning_rate": 2.483911564211472e-05, |
| "loss": 0.1646, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1574411392211914, |
| "step": 3200, |
| "valid_targets_mean": 1801.2, |
| "valid_targets_min": 1202 |
| }, |
| { |
| "epoch": 3.366596638655462, |
| "grad_norm": 0.6906945355495036, |
| "learning_rate": 2.4788269562482355e-05, |
| "loss": 0.1575, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15213462710380554, |
| "step": 3205, |
| "valid_targets_mean": 1441.4, |
| "valid_targets_min": 657 |
| }, |
| { |
| "epoch": 3.3718487394957983, |
| "grad_norm": 0.7855731357671363, |
| "learning_rate": 2.4737390631743675e-05, |
| "loss": 0.1601, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15283282101154327, |
| "step": 3210, |
| "valid_targets_mean": 1442.9, |
| "valid_targets_min": 672 |
| }, |
| { |
| "epoch": 3.3771008403361344, |
| "grad_norm": 0.7999940593483418, |
| "learning_rate": 2.4686479198966146e-05, |
| "loss": 0.1561, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16701379418373108, |
| "step": 3215, |
| "valid_targets_mean": 1305.1, |
| "valid_targets_min": 723 |
| }, |
| { |
| "epoch": 3.3823529411764706, |
| "grad_norm": 0.7802222544911187, |
| "learning_rate": 2.463553561344024e-05, |
| "loss": 0.1492, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1388361155986786, |
| "step": 3220, |
| "valid_targets_mean": 1236.6, |
| "valid_targets_min": 732 |
| }, |
| { |
| "epoch": 3.3876050420168067, |
| "grad_norm": 0.7997658424367834, |
| "learning_rate": 2.4584560224677013e-05, |
| "loss": 0.1631, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14376091957092285, |
| "step": 3225, |
| "valid_targets_mean": 1261.1, |
| "valid_targets_min": 634 |
| }, |
| { |
| "epoch": 3.392857142857143, |
| "grad_norm": 0.7589895889200633, |
| "learning_rate": 2.4533553382405702e-05, |
| "loss": 0.1524, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16269132494926453, |
| "step": 3230, |
| "valid_targets_mean": 1451.1, |
| "valid_targets_min": 905 |
| }, |
| { |
| "epoch": 3.398109243697479, |
| "grad_norm": 0.9088457131074477, |
| "learning_rate": 2.4482515436571365e-05, |
| "loss": 0.149, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1583980917930603, |
| "step": 3235, |
| "valid_targets_mean": 1466.4, |
| "valid_targets_min": 596 |
| }, |
| { |
| "epoch": 3.403361344537815, |
| "grad_norm": 0.8253891514753098, |
| "learning_rate": 2.4431446737332437e-05, |
| "loss": 0.1514, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16583885252475739, |
| "step": 3240, |
| "valid_targets_mean": 1435.1, |
| "valid_targets_min": 756 |
| }, |
| { |
| "epoch": 3.408613445378151, |
| "grad_norm": 0.7126823695261846, |
| "learning_rate": 2.438034763505833e-05, |
| "loss": 0.1617, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14703774452209473, |
| "step": 3245, |
| "valid_targets_mean": 1411.8, |
| "valid_targets_min": 567 |
| }, |
| { |
| "epoch": 3.4138655462184873, |
| "grad_norm": 0.7389656217215542, |
| "learning_rate": 2.432921848032707e-05, |
| "loss": 0.1507, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14308568835258484, |
| "step": 3250, |
| "valid_targets_mean": 1495.9, |
| "valid_targets_min": 810 |
| }, |
| { |
| "epoch": 3.4191176470588234, |
| "grad_norm": 0.7063481251451478, |
| "learning_rate": 2.427805962392286e-05, |
| "loss": 0.1531, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15941093862056732, |
| "step": 3255, |
| "valid_targets_mean": 1643.2, |
| "valid_targets_min": 868 |
| }, |
| { |
| "epoch": 3.4243697478991595, |
| "grad_norm": 0.7292997254366875, |
| "learning_rate": 2.4226871416833683e-05, |
| "loss": 0.1434, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.146925687789917, |
| "step": 3260, |
| "valid_targets_mean": 1451.4, |
| "valid_targets_min": 824 |
| }, |
| { |
| "epoch": 3.4296218487394956, |
| "grad_norm": 0.7542406085374198, |
| "learning_rate": 2.4175654210248848e-05, |
| "loss": 0.1404, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.161025732755661, |
| "step": 3265, |
| "valid_targets_mean": 1615.9, |
| "valid_targets_min": 797 |
| }, |
| { |
| "epoch": 3.434873949579832, |
| "grad_norm": 0.6966112598828675, |
| "learning_rate": 2.4124408355556677e-05, |
| "loss": 0.1512, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1535557061433792, |
| "step": 3270, |
| "valid_targets_mean": 1596.5, |
| "valid_targets_min": 1043 |
| }, |
| { |
| "epoch": 3.440126050420168, |
| "grad_norm": 0.7555059854029672, |
| "learning_rate": 2.4073134204342014e-05, |
| "loss": 0.1523, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16238391399383545, |
| "step": 3275, |
| "valid_targets_mean": 1445.5, |
| "valid_targets_min": 920 |
| }, |
| { |
| "epoch": 3.4453781512605044, |
| "grad_norm": 0.8208149984721342, |
| "learning_rate": 2.4021832108383837e-05, |
| "loss": 0.1462, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15757635235786438, |
| "step": 3280, |
| "valid_targets_mean": 1437.9, |
| "valid_targets_min": 847 |
| }, |
| { |
| "epoch": 3.4506302521008405, |
| "grad_norm": 0.7056998799882124, |
| "learning_rate": 2.3970502419652854e-05, |
| "loss": 0.15, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15004190802574158, |
| "step": 3285, |
| "valid_targets_mean": 1559.1, |
| "valid_targets_min": 557 |
| }, |
| { |
| "epoch": 3.4558823529411766, |
| "grad_norm": 0.7958553721684484, |
| "learning_rate": 2.3919145490309076e-05, |
| "loss": 0.1513, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15160951018333435, |
| "step": 3290, |
| "valid_targets_mean": 1341.6, |
| "valid_targets_min": 594 |
| }, |
| { |
| "epoch": 3.4611344537815127, |
| "grad_norm": 0.703390230979893, |
| "learning_rate": 2.38677616726994e-05, |
| "loss": 0.1563, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1494627594947815, |
| "step": 3295, |
| "valid_targets_mean": 1747.5, |
| "valid_targets_min": 760 |
| }, |
| { |
| "epoch": 3.466386554621849, |
| "grad_norm": 0.6829115937221362, |
| "learning_rate": 2.381635131935521e-05, |
| "loss": 0.2567, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.27713343501091003, |
| "step": 3300, |
| "valid_targets_mean": 3387.2, |
| "valid_targets_min": 770 |
| }, |
| { |
| "epoch": 3.471638655462185, |
| "grad_norm": 0.5039365129794023, |
| "learning_rate": 2.3764914782989926e-05, |
| "loss": 0.2376, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.21012486517429352, |
| "step": 3305, |
| "valid_targets_mean": 4538.6, |
| "valid_targets_min": 1799 |
| }, |
| { |
| "epoch": 3.476890756302521, |
| "grad_norm": 0.5334008441824496, |
| "learning_rate": 2.3713452416496625e-05, |
| "loss": 0.2417, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2371271550655365, |
| "step": 3310, |
| "valid_targets_mean": 4182.4, |
| "valid_targets_min": 1560 |
| }, |
| { |
| "epoch": 3.482142857142857, |
| "grad_norm": 0.5252301039129134, |
| "learning_rate": 2.366196457294558e-05, |
| "loss": 0.2243, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.20833566784858704, |
| "step": 3315, |
| "valid_targets_mean": 4361.0, |
| "valid_targets_min": 1681 |
| }, |
| { |
| "epoch": 3.4873949579831933, |
| "grad_norm": 0.617549050257743, |
| "learning_rate": 2.3610451605581858e-05, |
| "loss": 0.2411, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2543012499809265, |
| "step": 3320, |
| "valid_targets_mean": 3627.6, |
| "valid_targets_min": 1374 |
| }, |
| { |
| "epoch": 3.4926470588235294, |
| "grad_norm": 0.6304506600012845, |
| "learning_rate": 2.3558913867822905e-05, |
| "loss": 0.2335, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.22949200868606567, |
| "step": 3325, |
| "valid_targets_mean": 3204.2, |
| "valid_targets_min": 1089 |
| }, |
| { |
| "epoch": 3.4978991596638656, |
| "grad_norm": 0.5586583847778026, |
| "learning_rate": 2.3507351713256105e-05, |
| "loss": 0.2229, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.23757925629615784, |
| "step": 3330, |
| "valid_targets_mean": 4203.4, |
| "valid_targets_min": 627 |
| }, |
| { |
| "epoch": 3.5031512605042017, |
| "grad_norm": 0.5579364042848073, |
| "learning_rate": 2.3455765495636353e-05, |
| "loss": 0.2318, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.23478400707244873, |
| "step": 3335, |
| "valid_targets_mean": 3778.9, |
| "valid_targets_min": 1574 |
| }, |
| { |
| "epoch": 3.508403361344538, |
| "grad_norm": 0.6191817742700788, |
| "learning_rate": 2.3404155568883643e-05, |
| "loss": 0.2425, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.25709354877471924, |
| "step": 3340, |
| "valid_targets_mean": 3704.9, |
| "valid_targets_min": 1921 |
| }, |
| { |
| "epoch": 3.513655462184874, |
| "grad_norm": 0.587021701284441, |
| "learning_rate": 2.3352522287080625e-05, |
| "loss": 0.2314, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.23616047203540802, |
| "step": 3345, |
| "valid_targets_mean": 3960.9, |
| "valid_targets_min": 1477 |
| }, |
| { |
| "epoch": 3.51890756302521, |
| "grad_norm": 0.6254607818726631, |
| "learning_rate": 2.3300866004470182e-05, |
| "loss": 0.2414, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.24480389058589935, |
| "step": 3350, |
| "valid_targets_mean": 3504.5, |
| "valid_targets_min": 1499 |
| }, |
| { |
| "epoch": 3.524159663865546, |
| "grad_norm": 0.5925836663255958, |
| "learning_rate": 2.324918707545302e-05, |
| "loss": 0.2396, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.26201432943344116, |
| "step": 3355, |
| "valid_targets_mean": 3803.8, |
| "valid_targets_min": 1013 |
| }, |
| { |
| "epoch": 3.5294117647058822, |
| "grad_norm": 0.5642203624546177, |
| "learning_rate": 2.3197485854585183e-05, |
| "loss": 0.2267, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2236984670162201, |
| "step": 3360, |
| "valid_targets_mean": 4146.8, |
| "valid_targets_min": 1543 |
| }, |
| { |
| "epoch": 3.5346638655462184, |
| "grad_norm": 0.6221598960605759, |
| "learning_rate": 2.3145762696575675e-05, |
| "loss": 0.2386, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.24771781265735626, |
| "step": 3365, |
| "valid_targets_mean": 3705.0, |
| "valid_targets_min": 2050 |
| }, |
| { |
| "epoch": 3.5399159663865545, |
| "grad_norm": 0.667308661071586, |
| "learning_rate": 2.3094017956283995e-05, |
| "loss": 0.2444, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2562797963619232, |
| "step": 3370, |
| "valid_targets_mean": 3287.6, |
| "valid_targets_min": 746 |
| }, |
| { |
| "epoch": 3.5451680672268906, |
| "grad_norm": 0.6591430962273881, |
| "learning_rate": 2.3042251988717728e-05, |
| "loss": 0.234, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.24168621003627777, |
| "step": 3375, |
| "valid_targets_mean": 3219.6, |
| "valid_targets_min": 1210 |
| }, |
| { |
| "epoch": 3.5504201680672267, |
| "grad_norm": 0.5861565049376661, |
| "learning_rate": 2.2990465149030077e-05, |
| "loss": 0.2408, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2576037347316742, |
| "step": 3380, |
| "valid_targets_mean": 3420.2, |
| "valid_targets_min": 1064 |
| }, |
| { |
| "epoch": 3.5556722689075633, |
| "grad_norm": 0.676375370367313, |
| "learning_rate": 2.2938657792517446e-05, |
| "loss": 0.2489, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.24123093485832214, |
| "step": 3385, |
| "valid_targets_mean": 2978.2, |
| "valid_targets_min": 1173 |
| }, |
| { |
| "epoch": 3.560924369747899, |
| "grad_norm": 0.7090066415466851, |
| "learning_rate": 2.2886830274617017e-05, |
| "loss": 0.2381, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2423102855682373, |
| "step": 3390, |
| "valid_targets_mean": 3106.8, |
| "valid_targets_min": 1165 |
| }, |
| { |
| "epoch": 3.5661764705882355, |
| "grad_norm": 0.6215177878656555, |
| "learning_rate": 2.2834982950904267e-05, |
| "loss": 0.2309, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.20194599032402039, |
| "step": 3395, |
| "valid_targets_mean": 3800.3, |
| "valid_targets_min": 1365 |
| }, |
| { |
| "epoch": 3.571428571428571, |
| "grad_norm": 0.6568484423092628, |
| "learning_rate": 2.2783116177090573e-05, |
| "loss": 0.2369, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2180924117565155, |
| "step": 3400, |
| "valid_targets_mean": 3020.4, |
| "valid_targets_min": 1051 |
| }, |
| { |
| "epoch": 3.5766806722689077, |
| "grad_norm": 0.72432526478877, |
| "learning_rate": 2.2731230309020762e-05, |
| "loss": 0.2335, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2589854300022125, |
| "step": 3405, |
| "valid_targets_mean": 2882.1, |
| "valid_targets_min": 1345 |
| }, |
| { |
| "epoch": 3.581932773109244, |
| "grad_norm": 0.647347676568134, |
| "learning_rate": 2.2679325702670642e-05, |
| "loss": 0.2387, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.23592257499694824, |
| "step": 3410, |
| "valid_targets_mean": 3123.4, |
| "valid_targets_min": 1747 |
| }, |
| { |
| "epoch": 3.58718487394958, |
| "grad_norm": 0.6321313310777158, |
| "learning_rate": 2.2627402714144586e-05, |
| "loss": 0.2422, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.23397618532180786, |
| "step": 3415, |
| "valid_targets_mean": 3041.9, |
| "valid_targets_min": 1166 |
| }, |
| { |
| "epoch": 3.592436974789916, |
| "grad_norm": 0.6163425879015834, |
| "learning_rate": 2.2575461699673085e-05, |
| "loss": 0.2353, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.24911564588546753, |
| "step": 3420, |
| "valid_targets_mean": 3629.4, |
| "valid_targets_min": 1511 |
| }, |
| { |
| "epoch": 3.597689075630252, |
| "grad_norm": 0.8662060186406194, |
| "learning_rate": 2.2523503015610303e-05, |
| "loss": 0.2217, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.219038188457489, |
| "step": 3425, |
| "valid_targets_mean": 3007.8, |
| "valid_targets_min": 869 |
| }, |
| { |
| "epoch": 3.6029411764705883, |
| "grad_norm": 0.6505678950823406, |
| "learning_rate": 2.2471527018431637e-05, |
| "loss": 0.2332, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2250857800245285, |
| "step": 3430, |
| "valid_targets_mean": 3147.4, |
| "valid_targets_min": 926 |
| }, |
| { |
| "epoch": 3.6081932773109244, |
| "grad_norm": 0.6624584977841851, |
| "learning_rate": 2.2419534064731238e-05, |
| "loss": 0.2359, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.22663256525993347, |
| "step": 3435, |
| "valid_targets_mean": 3047.1, |
| "valid_targets_min": 1016 |
| }, |
| { |
| "epoch": 3.6134453781512605, |
| "grad_norm": 0.68180528409829, |
| "learning_rate": 2.236752451121963e-05, |
| "loss": 0.2388, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2614358067512512, |
| "step": 3440, |
| "valid_targets_mean": 3288.3, |
| "valid_targets_min": 1367 |
| }, |
| { |
| "epoch": 3.6186974789915967, |
| "grad_norm": 0.5943225731704131, |
| "learning_rate": 2.2315498714721198e-05, |
| "loss": 0.2327, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2073296308517456, |
| "step": 3445, |
| "valid_targets_mean": 3621.2, |
| "valid_targets_min": 761 |
| }, |
| { |
| "epoch": 3.6239495798319328, |
| "grad_norm": 0.7143384166342921, |
| "learning_rate": 2.2263457032171762e-05, |
| "loss": 0.2297, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.22933131456375122, |
| "step": 3450, |
| "valid_targets_mean": 2664.7, |
| "valid_targets_min": 1480 |
| }, |
| { |
| "epoch": 3.629201680672269, |
| "grad_norm": 0.6637253904207627, |
| "learning_rate": 2.2211399820616154e-05, |
| "loss": 0.232, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.21584278345108032, |
| "step": 3455, |
| "valid_targets_mean": 3043.8, |
| "valid_targets_min": 1229 |
| }, |
| { |
| "epoch": 3.634453781512605, |
| "grad_norm": 0.6381313624483769, |
| "learning_rate": 2.2159327437205733e-05, |
| "loss": 0.2364, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.23317265510559082, |
| "step": 3460, |
| "valid_targets_mean": 3533.5, |
| "valid_targets_min": 1727 |
| }, |
| { |
| "epoch": 3.639705882352941, |
| "grad_norm": 0.6079366483063177, |
| "learning_rate": 2.210724023919595e-05, |
| "loss": 0.2337, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.23725667595863342, |
| "step": 3465, |
| "valid_targets_mean": 3763.2, |
| "valid_targets_min": 1860 |
| }, |
| { |
| "epoch": 3.6449579831932772, |
| "grad_norm": 0.6617853538852045, |
| "learning_rate": 2.205513858394389e-05, |
| "loss": 0.233, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.23891595005989075, |
| "step": 3470, |
| "valid_targets_mean": 3145.0, |
| "valid_targets_min": 1145 |
| }, |
| { |
| "epoch": 3.6502100840336134, |
| "grad_norm": 0.6931454910102819, |
| "learning_rate": 2.2003022828905832e-05, |
| "loss": 0.2342, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.24554722011089325, |
| "step": 3475, |
| "valid_targets_mean": 3148.6, |
| "valid_targets_min": 1363 |
| }, |
| { |
| "epoch": 3.6554621848739495, |
| "grad_norm": 0.6830097683535337, |
| "learning_rate": 2.19508933316348e-05, |
| "loss": 0.2227, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2083757519721985, |
| "step": 3480, |
| "valid_targets_mean": 3347.4, |
| "valid_targets_min": 1087 |
| }, |
| { |
| "epoch": 3.6607142857142856, |
| "grad_norm": 0.6284986422875785, |
| "learning_rate": 2.189875044977808e-05, |
| "loss": 0.2357, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.22864796221256256, |
| "step": 3485, |
| "valid_targets_mean": 4141.5, |
| "valid_targets_min": 730 |
| }, |
| { |
| "epoch": 3.6659663865546217, |
| "grad_norm": 0.6424551917347495, |
| "learning_rate": 2.1846594541074796e-05, |
| "loss": 0.2283, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.21687257289886475, |
| "step": 3490, |
| "valid_targets_mean": 3053.2, |
| "valid_targets_min": 1406 |
| }, |
| { |
| "epoch": 3.671218487394958, |
| "grad_norm": 0.6118476480500536, |
| "learning_rate": 2.179442596335345e-05, |
| "loss": 0.2217, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.21437662839889526, |
| "step": 3495, |
| "valid_targets_mean": 3413.8, |
| "valid_targets_min": 1833 |
| }, |
| { |
| "epoch": 3.6764705882352944, |
| "grad_norm": 0.6834904631426817, |
| "learning_rate": 2.174224507452945e-05, |
| "loss": 0.2307, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.23827575147151947, |
| "step": 3500, |
| "valid_targets_mean": 3292.0, |
| "valid_targets_min": 1182 |
| }, |
| { |
| "epoch": 3.68172268907563, |
| "grad_norm": 0.6540573235032019, |
| "learning_rate": 2.1690052232602677e-05, |
| "loss": 0.2306, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2561336159706116, |
| "step": 3505, |
| "valid_targets_mean": 3815.1, |
| "valid_targets_min": 1607 |
| }, |
| { |
| "epoch": 3.6869747899159666, |
| "grad_norm": 0.7038556545538145, |
| "learning_rate": 2.1637847795655022e-05, |
| "loss": 0.2357, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.23643259704113007, |
| "step": 3510, |
| "valid_targets_mean": 2850.3, |
| "valid_targets_min": 1358 |
| }, |
| { |
| "epoch": 3.6922268907563023, |
| "grad_norm": 0.6142418362337423, |
| "learning_rate": 2.1585632121847925e-05, |
| "loss": 0.2339, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2268371880054474, |
| "step": 3515, |
| "valid_targets_mean": 3897.3, |
| "valid_targets_min": 1757 |
| }, |
| { |
| "epoch": 3.697478991596639, |
| "grad_norm": 0.6018277229359115, |
| "learning_rate": 2.153340556941991e-05, |
| "loss": 0.2267, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.19471925497055054, |
| "step": 3520, |
| "valid_targets_mean": 3365.7, |
| "valid_targets_min": 1170 |
| }, |
| { |
| "epoch": 3.7027310924369745, |
| "grad_norm": 0.7817444103413864, |
| "learning_rate": 2.1481168496684145e-05, |
| "loss": 0.224, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.24332907795906067, |
| "step": 3525, |
| "valid_targets_mean": 2908.3, |
| "valid_targets_min": 474 |
| }, |
| { |
| "epoch": 3.707983193277311, |
| "grad_norm": 0.6733856863461328, |
| "learning_rate": 2.142892126202597e-05, |
| "loss": 0.2271, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.22530926764011383, |
| "step": 3530, |
| "valid_targets_mean": 3249.9, |
| "valid_targets_min": 1140 |
| }, |
| { |
| "epoch": 3.713235294117647, |
| "grad_norm": 0.6772781803626257, |
| "learning_rate": 2.137666422390045e-05, |
| "loss": 0.2233, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2468833178281784, |
| "step": 3535, |
| "valid_targets_mean": 3621.2, |
| "valid_targets_min": 2266 |
| }, |
| { |
| "epoch": 3.7184873949579833, |
| "grad_norm": 0.596320718539212, |
| "learning_rate": 2.132439774082991e-05, |
| "loss": 0.2084, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.19030636548995972, |
| "step": 3540, |
| "valid_targets_mean": 3192.4, |
| "valid_targets_min": 809 |
| }, |
| { |
| "epoch": 3.7237394957983194, |
| "grad_norm": 0.6683616408438122, |
| "learning_rate": 2.1272122171401467e-05, |
| "loss": 0.24, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2368716150522232, |
| "step": 3545, |
| "valid_targets_mean": 3176.4, |
| "valid_targets_min": 1059 |
| }, |
| { |
| "epoch": 3.7289915966386555, |
| "grad_norm": 0.5993575332277289, |
| "learning_rate": 2.1219837874264573e-05, |
| "loss": 0.2217, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.19735181331634521, |
| "step": 3550, |
| "valid_targets_mean": 3426.4, |
| "valid_targets_min": 964 |
| }, |
| { |
| "epoch": 3.7342436974789917, |
| "grad_norm": 0.6105324798756142, |
| "learning_rate": 2.116754520812857e-05, |
| "loss": 0.2313, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.22294853627681732, |
| "step": 3555, |
| "valid_targets_mean": 3946.7, |
| "valid_targets_min": 1105 |
| }, |
| { |
| "epoch": 3.7394957983193278, |
| "grad_norm": 0.7317392218199291, |
| "learning_rate": 2.111524453176022e-05, |
| "loss": 0.2324, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.23324161767959595, |
| "step": 3560, |
| "valid_targets_mean": 2534.7, |
| "valid_targets_min": 1460 |
| }, |
| { |
| "epoch": 3.744747899159664, |
| "grad_norm": 0.679940437130019, |
| "learning_rate": 2.1062936203981227e-05, |
| "loss": 0.243, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.23880356550216675, |
| "step": 3565, |
| "valid_targets_mean": 3673.0, |
| "valid_targets_min": 1091 |
| }, |
| { |
| "epoch": 3.75, |
| "grad_norm": 0.6386888401169865, |
| "learning_rate": 2.10106205836658e-05, |
| "loss": 0.2229, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.21099084615707397, |
| "step": 3570, |
| "valid_targets_mean": 3355.7, |
| "valid_targets_min": 1771 |
| }, |
| { |
| "epoch": 3.755252100840336, |
| "grad_norm": 0.609185135460291, |
| "learning_rate": 2.095829802973817e-05, |
| "loss": 0.2207, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.20622901618480682, |
| "step": 3575, |
| "valid_targets_mean": 3403.8, |
| "valid_targets_min": 1625 |
| }, |
| { |
| "epoch": 3.7605042016806722, |
| "grad_norm": 0.6933994920811911, |
| "learning_rate": 2.090596890117016e-05, |
| "loss": 0.2176, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.20166133344173431, |
| "step": 3580, |
| "valid_targets_mean": 3379.6, |
| "valid_targets_min": 1180 |
| }, |
| { |
| "epoch": 3.7657563025210083, |
| "grad_norm": 0.7001758773355745, |
| "learning_rate": 2.0853633556978674e-05, |
| "loss": 0.2214, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2164371758699417, |
| "step": 3585, |
| "valid_targets_mean": 3085.8, |
| "valid_targets_min": 1460 |
| }, |
| { |
| "epoch": 3.7710084033613445, |
| "grad_norm": 0.6982893325743658, |
| "learning_rate": 2.0801292356223265e-05, |
| "loss": 0.2245, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.22557231783866882, |
| "step": 3590, |
| "valid_targets_mean": 3090.9, |
| "valid_targets_min": 1079 |
| }, |
| { |
| "epoch": 3.7762605042016806, |
| "grad_norm": 0.6862429302576437, |
| "learning_rate": 2.0748945658003695e-05, |
| "loss": 0.2073, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.21564340591430664, |
| "step": 3595, |
| "valid_targets_mean": 2751.7, |
| "valid_targets_min": 1143 |
| }, |
| { |
| "epoch": 3.7815126050420167, |
| "grad_norm": 0.7486537584683461, |
| "learning_rate": 2.0696593821457392e-05, |
| "loss": 0.222, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2403099536895752, |
| "step": 3600, |
| "valid_targets_mean": 3262.4, |
| "valid_targets_min": 914 |
| }, |
| { |
| "epoch": 3.786764705882353, |
| "grad_norm": 0.6292490113807976, |
| "learning_rate": 2.064423720575709e-05, |
| "loss": 0.2365, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.21284765005111694, |
| "step": 3605, |
| "valid_targets_mean": 3452.1, |
| "valid_targets_min": 1312 |
| }, |
| { |
| "epoch": 3.792016806722689, |
| "grad_norm": 0.6731713864780883, |
| "learning_rate": 2.0591876170108257e-05, |
| "loss": 0.2228, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.23124480247497559, |
| "step": 3610, |
| "valid_targets_mean": 2805.6, |
| "valid_targets_min": 987 |
| }, |
| { |
| "epoch": 3.7972689075630255, |
| "grad_norm": 0.570026508038886, |
| "learning_rate": 2.0539511073746743e-05, |
| "loss": 0.2224, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.21886953711509705, |
| "step": 3615, |
| "valid_targets_mean": 4512.7, |
| "valid_targets_min": 1501 |
| }, |
| { |
| "epoch": 3.802521008403361, |
| "grad_norm": 0.6587414192570736, |
| "learning_rate": 2.0487142275936213e-05, |
| "loss": 0.2218, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.21692374348640442, |
| "step": 3620, |
| "valid_targets_mean": 3188.2, |
| "valid_targets_min": 1388 |
| }, |
| { |
| "epoch": 3.8077731092436977, |
| "grad_norm": 0.6975757464948207, |
| "learning_rate": 2.0434770135965743e-05, |
| "loss": 0.238, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.23684664070606232, |
| "step": 3625, |
| "valid_targets_mean": 3106.9, |
| "valid_targets_min": 1986 |
| }, |
| { |
| "epoch": 3.8130252100840334, |
| "grad_norm": 0.6390716602559315, |
| "learning_rate": 2.0382395013147347e-05, |
| "loss": 0.213, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.23830687999725342, |
| "step": 3630, |
| "valid_targets_mean": 3893.1, |
| "valid_targets_min": 1671 |
| }, |
| { |
| "epoch": 3.81827731092437, |
| "grad_norm": 0.6520611936803277, |
| "learning_rate": 2.033001726681349e-05, |
| "loss": 0.2184, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.19424161314964294, |
| "step": 3635, |
| "valid_targets_mean": 3246.8, |
| "valid_targets_min": 512 |
| }, |
| { |
| "epoch": 3.8235294117647056, |
| "grad_norm": 0.653877417451473, |
| "learning_rate": 2.027763725631463e-05, |
| "loss": 0.2257, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.21053674817085266, |
| "step": 3640, |
| "valid_targets_mean": 3285.3, |
| "valid_targets_min": 1202 |
| }, |
| { |
| "epoch": 3.828781512605042, |
| "grad_norm": 0.6519721595841632, |
| "learning_rate": 2.0225255341016794e-05, |
| "loss": 0.2395, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.22552523016929626, |
| "step": 3645, |
| "valid_targets_mean": 4012.8, |
| "valid_targets_min": 1645 |
| }, |
| { |
| "epoch": 3.8340336134453783, |
| "grad_norm": 0.6008225197326998, |
| "learning_rate": 2.017287188029904e-05, |
| "loss": 0.226, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.20129550993442535, |
| "step": 3650, |
| "valid_targets_mean": 3525.8, |
| "valid_targets_min": 1434 |
| }, |
| { |
| "epoch": 3.8392857142857144, |
| "grad_norm": 0.7071580358913306, |
| "learning_rate": 2.0120487233551035e-05, |
| "loss": 0.2369, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2568947672843933, |
| "step": 3655, |
| "valid_targets_mean": 3044.6, |
| "valid_targets_min": 1055 |
| }, |
| { |
| "epoch": 3.8445378151260505, |
| "grad_norm": 0.7176723110707379, |
| "learning_rate": 2.006810176017059e-05, |
| "loss": 0.2279, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.23161205649375916, |
| "step": 3660, |
| "valid_targets_mean": 3179.8, |
| "valid_targets_min": 1625 |
| }, |
| { |
| "epoch": 3.8497899159663866, |
| "grad_norm": 0.6943499018659017, |
| "learning_rate": 2.0015715819561205e-05, |
| "loss": 0.2328, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.24318306148052216, |
| "step": 3665, |
| "valid_targets_mean": 3399.9, |
| "valid_targets_min": 1147 |
| }, |
| { |
| "epoch": 3.8550420168067228, |
| "grad_norm": 0.6973815528618685, |
| "learning_rate": 1.9963329771129558e-05, |
| "loss": 0.2401, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.24660438299179077, |
| "step": 3670, |
| "valid_targets_mean": 2866.4, |
| "valid_targets_min": 998 |
| }, |
| { |
| "epoch": 3.860294117647059, |
| "grad_norm": 0.6342688826905563, |
| "learning_rate": 1.9910943974283066e-05, |
| "loss": 0.2331, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.23309576511383057, |
| "step": 3675, |
| "valid_targets_mean": 3480.4, |
| "valid_targets_min": 1078 |
| }, |
| { |
| "epoch": 3.865546218487395, |
| "grad_norm": 0.735979206541467, |
| "learning_rate": 1.9858558788427447e-05, |
| "loss": 0.2294, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.22612996399402618, |
| "step": 3680, |
| "valid_targets_mean": 2920.8, |
| "valid_targets_min": 1005 |
| }, |
| { |
| "epoch": 3.870798319327731, |
| "grad_norm": 0.6974844461519691, |
| "learning_rate": 1.9806174572964205e-05, |
| "loss": 0.2349, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.22539496421813965, |
| "step": 3685, |
| "valid_targets_mean": 2983.9, |
| "valid_targets_min": 719 |
| }, |
| { |
| "epoch": 3.8760504201680672, |
| "grad_norm": 0.7806658133125973, |
| "learning_rate": 1.975379168728819e-05, |
| "loss": 0.2367, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.25455334782600403, |
| "step": 3690, |
| "valid_targets_mean": 2842.1, |
| "valid_targets_min": 617 |
| }, |
| { |
| "epoch": 3.8813025210084033, |
| "grad_norm": 0.653382148721513, |
| "learning_rate": 1.9701410490785128e-05, |
| "loss": 0.2215, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.22338590025901794, |
| "step": 3695, |
| "valid_targets_mean": 3210.6, |
| "valid_targets_min": 1665 |
| }, |
| { |
| "epoch": 3.8865546218487395, |
| "grad_norm": 0.6977766979229648, |
| "learning_rate": 1.9649031342829178e-05, |
| "loss": 0.2357, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.24201029539108276, |
| "step": 3700, |
| "valid_targets_mean": 3020.0, |
| "valid_targets_min": 1076 |
| }, |
| { |
| "epoch": 3.8918067226890756, |
| "grad_norm": 0.6441901232419098, |
| "learning_rate": 1.9596654602780398e-05, |
| "loss": 0.2217, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2265818864107132, |
| "step": 3705, |
| "valid_targets_mean": 3548.8, |
| "valid_targets_min": 790 |
| }, |
| { |
| "epoch": 3.8970588235294117, |
| "grad_norm": 0.715226965706479, |
| "learning_rate": 1.9544280629982364e-05, |
| "loss": 0.2428, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.25313618779182434, |
| "step": 3710, |
| "valid_targets_mean": 3038.7, |
| "valid_targets_min": 937 |
| }, |
| { |
| "epoch": 3.902310924369748, |
| "grad_norm": 0.6360683211422588, |
| "learning_rate": 1.949190978375966e-05, |
| "loss": 0.2366, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.22172778844833374, |
| "step": 3715, |
| "valid_targets_mean": 3616.2, |
| "valid_targets_min": 981 |
| }, |
| { |
| "epoch": 3.907563025210084, |
| "grad_norm": 0.6393776390642489, |
| "learning_rate": 1.9439542423415413e-05, |
| "loss": 0.2158, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.205665722489357, |
| "step": 3720, |
| "valid_targets_mean": 3152.5, |
| "valid_targets_min": 1351 |
| }, |
| { |
| "epoch": 3.91281512605042, |
| "grad_norm": 0.6380081375418487, |
| "learning_rate": 1.9387178908228838e-05, |
| "loss": 0.2292, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.23773056268692017, |
| "step": 3725, |
| "valid_targets_mean": 4153.7, |
| "valid_targets_min": 1307 |
| }, |
| { |
| "epoch": 3.918067226890756, |
| "grad_norm": 0.5502610030856153, |
| "learning_rate": 1.933481959745276e-05, |
| "loss": 0.225, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2143445611000061, |
| "step": 3730, |
| "valid_targets_mean": 5039.1, |
| "valid_targets_min": 1587 |
| }, |
| { |
| "epoch": 3.9233193277310923, |
| "grad_norm": 0.5822473871522699, |
| "learning_rate": 1.9282464850311184e-05, |
| "loss": 0.2179, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.20977917313575745, |
| "step": 3735, |
| "valid_targets_mean": 4101.8, |
| "valid_targets_min": 1741 |
| }, |
| { |
| "epoch": 3.928571428571429, |
| "grad_norm": 0.5793820699573822, |
| "learning_rate": 1.9230115025996764e-05, |
| "loss": 0.2199, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.20586253702640533, |
| "step": 3740, |
| "valid_targets_mean": 3830.2, |
| "valid_targets_min": 856 |
| }, |
| { |
| "epoch": 3.9338235294117645, |
| "grad_norm": 0.7167408375172564, |
| "learning_rate": 1.9177770483668416e-05, |
| "loss": 0.2302, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.22084660828113556, |
| "step": 3745, |
| "valid_targets_mean": 3468.1, |
| "valid_targets_min": 1886 |
| }, |
| { |
| "epoch": 3.939075630252101, |
| "grad_norm": 0.6404425612951213, |
| "learning_rate": 1.912543158244881e-05, |
| "loss": 0.2174, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2383722960948944, |
| "step": 3750, |
| "valid_targets_mean": 3603.1, |
| "valid_targets_min": 832 |
| }, |
| { |
| "epoch": 3.9443277310924367, |
| "grad_norm": 0.6506827435964047, |
| "learning_rate": 1.9073098681421895e-05, |
| "loss": 0.2069, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.19391639530658722, |
| "step": 3755, |
| "valid_targets_mean": 3134.8, |
| "valid_targets_min": 1484 |
| }, |
| { |
| "epoch": 3.9495798319327733, |
| "grad_norm": 0.6963957310682597, |
| "learning_rate": 1.902077213963048e-05, |
| "loss": 0.2203, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.21799013018608093, |
| "step": 3760, |
| "valid_targets_mean": 3377.2, |
| "valid_targets_min": 1152 |
| }, |
| { |
| "epoch": 3.9548319327731094, |
| "grad_norm": 0.7783983083913816, |
| "learning_rate": 1.896845231607372e-05, |
| "loss": 0.238, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.27412140369415283, |
| "step": 3765, |
| "valid_targets_mean": 2750.6, |
| "valid_targets_min": 1128 |
| }, |
| { |
| "epoch": 3.9600840336134455, |
| "grad_norm": 0.6595123518563015, |
| "learning_rate": 1.8916139569704704e-05, |
| "loss": 0.2292, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2191227525472641, |
| "step": 3770, |
| "valid_targets_mean": 3052.4, |
| "valid_targets_min": 1156 |
| }, |
| { |
| "epoch": 3.9653361344537816, |
| "grad_norm": 0.6850818119709559, |
| "learning_rate": 1.886383425942795e-05, |
| "loss": 0.2229, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.21025024354457855, |
| "step": 3775, |
| "valid_targets_mean": 3002.1, |
| "valid_targets_min": 993 |
| }, |
| { |
| "epoch": 3.9705882352941178, |
| "grad_norm": 0.7391622979048171, |
| "learning_rate": 1.8811536744096956e-05, |
| "loss": 0.2154, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.22044730186462402, |
| "step": 3780, |
| "valid_targets_mean": 2914.0, |
| "valid_targets_min": 1275 |
| }, |
| { |
| "epoch": 3.975840336134454, |
| "grad_norm": 0.7238761932845064, |
| "learning_rate": 1.8759247382511748e-05, |
| "loss": 0.2242, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2314056158065796, |
| "step": 3785, |
| "valid_targets_mean": 3362.9, |
| "valid_targets_min": 1669 |
| }, |
| { |
| "epoch": 3.98109243697479, |
| "grad_norm": 0.6629448508084417, |
| "learning_rate": 1.8706966533416413e-05, |
| "loss": 0.2281, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2214796096086502, |
| "step": 3790, |
| "valid_targets_mean": 3065.4, |
| "valid_targets_min": 1233 |
| }, |
| { |
| "epoch": 3.986344537815126, |
| "grad_norm": 0.957526256499955, |
| "learning_rate": 1.8654694555496624e-05, |
| "loss": 0.2292, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.21655909717082977, |
| "step": 3795, |
| "valid_targets_mean": 3591.1, |
| "valid_targets_min": 1685 |
| }, |
| { |
| "epoch": 3.991596638655462, |
| "grad_norm": 0.6385611154020212, |
| "learning_rate": 1.860243180737721e-05, |
| "loss": 0.2315, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.23146796226501465, |
| "step": 3800, |
| "valid_targets_mean": 3571.6, |
| "valid_targets_min": 1793 |
| }, |
| { |
| "epoch": 3.9968487394957983, |
| "grad_norm": 0.6361743923463639, |
| "learning_rate": 1.8550178647619664e-05, |
| "loss": 0.2344, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.23826557397842407, |
| "step": 3805, |
| "valid_targets_mean": 3868.6, |
| "valid_targets_min": 1976 |
| }, |
| { |
| "epoch": 4.0021008403361344, |
| "grad_norm": 0.9276215598529717, |
| "learning_rate": 1.84979354347197e-05, |
| "loss": 0.2029, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17189082503318787, |
| "step": 3810, |
| "valid_targets_mean": 1553.1, |
| "valid_targets_min": 777 |
| }, |
| { |
| "epoch": 4.007352941176471, |
| "grad_norm": 0.866049721179808, |
| "learning_rate": 1.8445702527104782e-05, |
| "loss": 0.1654, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1560104489326477, |
| "step": 3815, |
| "valid_targets_mean": 1315.5, |
| "valid_targets_min": 705 |
| }, |
| { |
| "epoch": 4.012605042016807, |
| "grad_norm": 0.7548114470500479, |
| "learning_rate": 1.8393480283131677e-05, |
| "loss": 0.1496, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1479974240064621, |
| "step": 3820, |
| "valid_targets_mean": 1626.6, |
| "valid_targets_min": 906 |
| }, |
| { |
| "epoch": 4.017857142857143, |
| "grad_norm": 0.8337315927989255, |
| "learning_rate": 1.8341269061083996e-05, |
| "loss": 0.1512, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.12990880012512207, |
| "step": 3825, |
| "valid_targets_mean": 1316.2, |
| "valid_targets_min": 680 |
| }, |
| { |
| "epoch": 4.023109243697479, |
| "grad_norm": 0.8291733641726188, |
| "learning_rate": 1.8289069219169717e-05, |
| "loss": 0.1484, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15963760018348694, |
| "step": 3830, |
| "valid_targets_mean": 1752.4, |
| "valid_targets_min": 819 |
| }, |
| { |
| "epoch": 4.0283613445378155, |
| "grad_norm": 0.8304874985400824, |
| "learning_rate": 1.8236881115518766e-05, |
| "loss": 0.1498, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14934542775154114, |
| "step": 3835, |
| "valid_targets_mean": 1383.9, |
| "valid_targets_min": 734 |
| }, |
| { |
| "epoch": 4.033613445378151, |
| "grad_norm": 0.8052129046929378, |
| "learning_rate": 1.8184705108180516e-05, |
| "loss": 0.1579, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15371397137641907, |
| "step": 3840, |
| "valid_targets_mean": 1573.9, |
| "valid_targets_min": 930 |
| }, |
| { |
| "epoch": 4.038865546218488, |
| "grad_norm": 0.8085904112301928, |
| "learning_rate": 1.8132541555121353e-05, |
| "loss": 0.1364, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14829567074775696, |
| "step": 3845, |
| "valid_targets_mean": 1383.1, |
| "valid_targets_min": 737 |
| }, |
| { |
| "epoch": 4.044117647058823, |
| "grad_norm": 0.8018131771688088, |
| "learning_rate": 1.808039081422223e-05, |
| "loss": 0.1588, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1333727240562439, |
| "step": 3850, |
| "valid_targets_mean": 1518.7, |
| "valid_targets_min": 759 |
| }, |
| { |
| "epoch": 4.04936974789916, |
| "grad_norm": 0.8491004069838234, |
| "learning_rate": 1.802825324327618e-05, |
| "loss": 0.1447, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15288317203521729, |
| "step": 3855, |
| "valid_targets_mean": 1489.7, |
| "valid_targets_min": 753 |
| }, |
| { |
| "epoch": 4.054621848739496, |
| "grad_norm": 0.8165835733627114, |
| "learning_rate": 1.7976129199985886e-05, |
| "loss": 0.147, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1399635225534439, |
| "step": 3860, |
| "valid_targets_mean": 1304.5, |
| "valid_targets_min": 572 |
| }, |
| { |
| "epoch": 4.059873949579832, |
| "grad_norm": 0.7748737501704929, |
| "learning_rate": 1.7924019041961228e-05, |
| "loss": 0.1461, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14403750002384186, |
| "step": 3865, |
| "valid_targets_mean": 1409.2, |
| "valid_targets_min": 679 |
| }, |
| { |
| "epoch": 4.065126050420168, |
| "grad_norm": 0.8803098411860152, |
| "learning_rate": 1.7871923126716827e-05, |
| "loss": 0.1501, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15918989479541779, |
| "step": 3870, |
| "valid_targets_mean": 1331.1, |
| "valid_targets_min": 771 |
| }, |
| { |
| "epoch": 4.070378151260504, |
| "grad_norm": 0.753689435569324, |
| "learning_rate": 1.7819841811669573e-05, |
| "loss": 0.1342, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.13107150793075562, |
| "step": 3875, |
| "valid_targets_mean": 1473.2, |
| "valid_targets_min": 842 |
| }, |
| { |
| "epoch": 4.07563025210084, |
| "grad_norm": 0.7637352369796083, |
| "learning_rate": 1.7767775454136194e-05, |
| "loss": 0.1367, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.12565407156944275, |
| "step": 3880, |
| "valid_targets_mean": 1367.2, |
| "valid_targets_min": 822 |
| }, |
| { |
| "epoch": 4.080882352941177, |
| "grad_norm": 0.8931529994254264, |
| "learning_rate": 1.7715724411330806e-05, |
| "loss": 0.1381, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1554366648197174, |
| "step": 3885, |
| "valid_targets_mean": 1507.5, |
| "valid_targets_min": 675 |
| }, |
| { |
| "epoch": 4.086134453781512, |
| "grad_norm": 0.8058581428686146, |
| "learning_rate": 1.7663689040362446e-05, |
| "loss": 0.1444, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14042530953884125, |
| "step": 3890, |
| "valid_targets_mean": 1363.7, |
| "valid_targets_min": 892 |
| }, |
| { |
| "epoch": 4.091386554621849, |
| "grad_norm": 0.8507202166895215, |
| "learning_rate": 1.761166969823262e-05, |
| "loss": 0.1453, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.13831481337547302, |
| "step": 3895, |
| "valid_targets_mean": 1315.4, |
| "valid_targets_min": 656 |
| }, |
| { |
| "epoch": 4.0966386554621845, |
| "grad_norm": 0.7947736774793486, |
| "learning_rate": 1.7559666741832896e-05, |
| "loss": 0.1474, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.12960849702358246, |
| "step": 3900, |
| "valid_targets_mean": 1341.5, |
| "valid_targets_min": 681 |
| }, |
| { |
| "epoch": 4.101890756302521, |
| "grad_norm": 0.8251862770713435, |
| "learning_rate": 1.750768052794239e-05, |
| "loss": 0.1514, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15292903780937195, |
| "step": 3905, |
| "valid_targets_mean": 1436.5, |
| "valid_targets_min": 548 |
| }, |
| { |
| "epoch": 4.107142857142857, |
| "grad_norm": 0.799156965792982, |
| "learning_rate": 1.7455711413225372e-05, |
| "loss": 0.142, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.13684728741645813, |
| "step": 3910, |
| "valid_targets_mean": 1338.8, |
| "valid_targets_min": 658 |
| }, |
| { |
| "epoch": 4.112394957983193, |
| "grad_norm": 0.8117329071283277, |
| "learning_rate": 1.7403759754228794e-05, |
| "loss": 0.14, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.13306397199630737, |
| "step": 3915, |
| "valid_targets_mean": 1343.0, |
| "valid_targets_min": 650 |
| }, |
| { |
| "epoch": 4.117647058823529, |
| "grad_norm": 0.8678892755082293, |
| "learning_rate": 1.7351825907379837e-05, |
| "loss": 0.1426, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1487090289592743, |
| "step": 3920, |
| "valid_targets_mean": 1398.7, |
| "valid_targets_min": 734 |
| }, |
| { |
| "epoch": 4.1228991596638656, |
| "grad_norm": 0.8732015715863755, |
| "learning_rate": 1.7299910228983513e-05, |
| "loss": 0.1317, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14107802510261536, |
| "step": 3925, |
| "valid_targets_mean": 1339.1, |
| "valid_targets_min": 704 |
| }, |
| { |
| "epoch": 4.128151260504202, |
| "grad_norm": 0.8358116761683432, |
| "learning_rate": 1.7248013075220128e-05, |
| "loss": 0.14, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.13086049258708954, |
| "step": 3930, |
| "valid_targets_mean": 1377.6, |
| "valid_targets_min": 686 |
| }, |
| { |
| "epoch": 4.133403361344538, |
| "grad_norm": 0.882675069386114, |
| "learning_rate": 1.7196134802142945e-05, |
| "loss": 0.1393, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1546640843153, |
| "step": 3935, |
| "valid_targets_mean": 1540.8, |
| "valid_targets_min": 697 |
| }, |
| { |
| "epoch": 4.138655462184874, |
| "grad_norm": 0.7673275063053835, |
| "learning_rate": 1.7144275765675673e-05, |
| "loss": 0.1388, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.13223353028297424, |
| "step": 3940, |
| "valid_targets_mean": 1435.7, |
| "valid_targets_min": 779 |
| }, |
| { |
| "epoch": 4.14390756302521, |
| "grad_norm": 0.8161750428827426, |
| "learning_rate": 1.7092436321610042e-05, |
| "loss": 0.1482, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.147655189037323, |
| "step": 3945, |
| "valid_targets_mean": 1520.5, |
| "valid_targets_min": 729 |
| }, |
| { |
| "epoch": 4.149159663865547, |
| "grad_norm": 0.8361768379372263, |
| "learning_rate": 1.704061682560336e-05, |
| "loss": 0.1375, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.13745343685150146, |
| "step": 3950, |
| "valid_targets_mean": 1408.2, |
| "valid_targets_min": 661 |
| }, |
| { |
| "epoch": 4.154411764705882, |
| "grad_norm": 0.8345898800935504, |
| "learning_rate": 1.698881763317609e-05, |
| "loss": 0.1438, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.13992251455783844, |
| "step": 3955, |
| "valid_targets_mean": 1531.4, |
| "valid_targets_min": 847 |
| }, |
| { |
| "epoch": 4.159663865546219, |
| "grad_norm": 0.7875946022995587, |
| "learning_rate": 1.69370390997094e-05, |
| "loss": 0.1387, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.13176432251930237, |
| "step": 3960, |
| "valid_targets_mean": 1391.6, |
| "valid_targets_min": 758 |
| }, |
| { |
| "epoch": 4.1649159663865545, |
| "grad_norm": 0.7017178626610292, |
| "learning_rate": 1.6885281580442677e-05, |
| "loss": 0.142, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.114842988550663, |
| "step": 3965, |
| "valid_targets_mean": 1312.7, |
| "valid_targets_min": 800 |
| }, |
| { |
| "epoch": 4.170168067226891, |
| "grad_norm": 0.7974602402640565, |
| "learning_rate": 1.6833545430471194e-05, |
| "loss": 0.1374, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1272060126066208, |
| "step": 3970, |
| "valid_targets_mean": 1347.1, |
| "valid_targets_min": 803 |
| }, |
| { |
| "epoch": 4.175420168067227, |
| "grad_norm": 0.8100956763693268, |
| "learning_rate": 1.678183100474359e-05, |
| "loss": 0.1378, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.13280612230300903, |
| "step": 3975, |
| "valid_targets_mean": 1394.2, |
| "valid_targets_min": 749 |
| }, |
| { |
| "epoch": 4.180672268907563, |
| "grad_norm": 0.8839233586552578, |
| "learning_rate": 1.6730138658059448e-05, |
| "loss": 0.1279, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.13839851319789886, |
| "step": 3980, |
| "valid_targets_mean": 1372.1, |
| "valid_targets_min": 837 |
| }, |
| { |
| "epoch": 4.185924369747899, |
| "grad_norm": 0.7770716555066293, |
| "learning_rate": 1.667846874506689e-05, |
| "loss": 0.1345, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.12787684798240662, |
| "step": 3985, |
| "valid_targets_mean": 1425.2, |
| "valid_targets_min": 719 |
| }, |
| { |
| "epoch": 4.1911764705882355, |
| "grad_norm": 0.8263514960899874, |
| "learning_rate": 1.662682162026012e-05, |
| "loss": 0.1384, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14100591838359833, |
| "step": 3990, |
| "valid_targets_mean": 1423.1, |
| "valid_targets_min": 765 |
| }, |
| { |
| "epoch": 4.196428571428571, |
| "grad_norm": 0.8174867184649295, |
| "learning_rate": 1.6575197637976995e-05, |
| "loss": 0.1377, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14689315855503082, |
| "step": 3995, |
| "valid_targets_mean": 1509.8, |
| "valid_targets_min": 875 |
| }, |
| { |
| "epoch": 4.201680672268908, |
| "grad_norm": 0.8589762302363031, |
| "learning_rate": 1.652359715239661e-05, |
| "loss": 0.1368, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.13010036945343018, |
| "step": 4000, |
| "valid_targets_mean": 1292.4, |
| "valid_targets_min": 655 |
| }, |
| { |
| "epoch": 4.206932773109243, |
| "grad_norm": 0.8425688419243291, |
| "learning_rate": 1.6472020517536828e-05, |
| "loss": 0.14, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1463192105293274, |
| "step": 4005, |
| "valid_targets_mean": 1474.6, |
| "valid_targets_min": 669 |
| }, |
| { |
| "epoch": 4.21218487394958, |
| "grad_norm": 0.8171247963907109, |
| "learning_rate": 1.6420468087251907e-05, |
| "loss": 0.1321, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.13386958837509155, |
| "step": 4010, |
| "valid_targets_mean": 1377.2, |
| "valid_targets_min": 1046 |
| }, |
| { |
| "epoch": 4.217436974789916, |
| "grad_norm": 0.8221524193856137, |
| "learning_rate": 1.6368940215230026e-05, |
| "loss": 0.1398, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14860522747039795, |
| "step": 4015, |
| "valid_targets_mean": 1693.8, |
| "valid_targets_min": 703 |
| }, |
| { |
| "epoch": 4.222689075630252, |
| "grad_norm": 0.8080758516493216, |
| "learning_rate": 1.6317437254990875e-05, |
| "loss": 0.1413, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.13878750801086426, |
| "step": 4020, |
| "valid_targets_mean": 1473.4, |
| "valid_targets_min": 846 |
| }, |
| { |
| "epoch": 4.227941176470588, |
| "grad_norm": 0.8329372613650491, |
| "learning_rate": 1.626595955988325e-05, |
| "loss": 0.1445, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14070574939250946, |
| "step": 4025, |
| "valid_targets_mean": 1439.1, |
| "valid_targets_min": 764 |
| }, |
| { |
| "epoch": 4.233193277310924, |
| "grad_norm": 0.7819540997359885, |
| "learning_rate": 1.6214507483082593e-05, |
| "loss": 0.1315, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.13133744895458221, |
| "step": 4030, |
| "valid_targets_mean": 1577.8, |
| "valid_targets_min": 822 |
| }, |
| { |
| "epoch": 4.23844537815126, |
| "grad_norm": 0.7658805060914474, |
| "learning_rate": 1.6163081377588588e-05, |
| "loss": 0.131, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.13184303045272827, |
| "step": 4035, |
| "valid_targets_mean": 1500.7, |
| "valid_targets_min": 982 |
| }, |
| { |
| "epoch": 4.243697478991597, |
| "grad_norm": 0.7854703396401594, |
| "learning_rate": 1.6111681596222732e-05, |
| "loss": 0.1426, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.13113921880722046, |
| "step": 4040, |
| "valid_targets_mean": 1402.2, |
| "valid_targets_min": 713 |
| }, |
| { |
| "epoch": 4.248949579831933, |
| "grad_norm": 0.765545221207553, |
| "learning_rate": 1.606030849162593e-05, |
| "loss": 0.1336, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1270998865365982, |
| "step": 4045, |
| "valid_targets_mean": 1522.0, |
| "valid_targets_min": 721 |
| }, |
| { |
| "epoch": 4.254201680672269, |
| "grad_norm": 0.80112535205176, |
| "learning_rate": 1.600896241625605e-05, |
| "loss": 0.1314, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.13291269540786743, |
| "step": 4050, |
| "valid_targets_mean": 1373.8, |
| "valid_targets_min": 741 |
| }, |
| { |
| "epoch": 4.2594537815126055, |
| "grad_norm": 0.8177224842495399, |
| "learning_rate": 1.5957643722385532e-05, |
| "loss": 0.132, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14079031348228455, |
| "step": 4055, |
| "valid_targets_mean": 1517.9, |
| "valid_targets_min": 734 |
| }, |
| { |
| "epoch": 4.264705882352941, |
| "grad_norm": 0.795808535657422, |
| "learning_rate": 1.590635276209896e-05, |
| "loss": 0.1396, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.13821426033973694, |
| "step": 4060, |
| "valid_targets_mean": 1521.1, |
| "valid_targets_min": 744 |
| }, |
| { |
| "epoch": 4.269957983193278, |
| "grad_norm": 0.8258679101265551, |
| "learning_rate": 1.5855089887290634e-05, |
| "loss": 0.1391, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14685073494911194, |
| "step": 4065, |
| "valid_targets_mean": 1565.1, |
| "valid_targets_min": 620 |
| }, |
| { |
| "epoch": 4.275210084033613, |
| "grad_norm": 0.8117779327857177, |
| "learning_rate": 1.5803855449662175e-05, |
| "loss": 0.1323, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.13573217391967773, |
| "step": 4070, |
| "valid_targets_mean": 1411.9, |
| "valid_targets_min": 622 |
| }, |
| { |
| "epoch": 4.28046218487395, |
| "grad_norm": 0.7103133306723244, |
| "learning_rate": 1.5752649800720096e-05, |
| "loss": 0.1355, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14503194391727448, |
| "step": 4075, |
| "valid_targets_mean": 1797.2, |
| "valid_targets_min": 740 |
| }, |
| { |
| "epoch": 4.285714285714286, |
| "grad_norm": 0.7877525685043663, |
| "learning_rate": 1.5701473291773395e-05, |
| "loss": 0.1303, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.12483812868595123, |
| "step": 4080, |
| "valid_targets_mean": 1316.6, |
| "valid_targets_min": 694 |
| }, |
| { |
| "epoch": 4.290966386554622, |
| "grad_norm": 0.7744871393889592, |
| "learning_rate": 1.5650326273931166e-05, |
| "loss": 0.137, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.13510701060295105, |
| "step": 4085, |
| "valid_targets_mean": 1644.8, |
| "valid_targets_min": 902 |
| }, |
| { |
| "epoch": 4.296218487394958, |
| "grad_norm": 0.7786406479142675, |
| "learning_rate": 1.559920909810016e-05, |
| "loss": 0.1311, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.13013191521167755, |
| "step": 4090, |
| "valid_targets_mean": 1388.4, |
| "valid_targets_min": 674 |
| }, |
| { |
| "epoch": 4.301470588235294, |
| "grad_norm": 0.7764860246380487, |
| "learning_rate": 1.5548122114982393e-05, |
| "loss": 0.1272, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.12222108244895935, |
| "step": 4095, |
| "valid_targets_mean": 1277.5, |
| "valid_targets_min": 661 |
| }, |
| { |
| "epoch": 4.30672268907563, |
| "grad_norm": 0.8106042463016419, |
| "learning_rate": 1.5497065675072728e-05, |
| "loss": 0.1279, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14016015827655792, |
| "step": 4100, |
| "valid_targets_mean": 1502.6, |
| "valid_targets_min": 912 |
| }, |
| { |
| "epoch": 4.311974789915967, |
| "grad_norm": 0.8543220451468436, |
| "learning_rate": 1.5446040128656485e-05, |
| "loss": 0.1403, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14713945984840393, |
| "step": 4105, |
| "valid_targets_mean": 1561.8, |
| "valid_targets_min": 1181 |
| }, |
| { |
| "epoch": 4.317226890756302, |
| "grad_norm": 0.7953069524968457, |
| "learning_rate": 1.539504582580704e-05, |
| "loss": 0.1292, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.12721598148345947, |
| "step": 4110, |
| "valid_targets_mean": 1307.5, |
| "valid_targets_min": 773 |
| }, |
| { |
| "epoch": 4.322478991596639, |
| "grad_norm": 0.8097826390836019, |
| "learning_rate": 1.5344083116383395e-05, |
| "loss": 0.1339, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.12812337279319763, |
| "step": 4115, |
| "valid_targets_mean": 1381.6, |
| "valid_targets_min": 679 |
| }, |
| { |
| "epoch": 4.3277310924369745, |
| "grad_norm": 0.7958890094736837, |
| "learning_rate": 1.529315235002781e-05, |
| "loss": 0.1375, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14337149262428284, |
| "step": 4120, |
| "valid_targets_mean": 1599.2, |
| "valid_targets_min": 818 |
| }, |
| { |
| "epoch": 4.332983193277311, |
| "grad_norm": 0.783528991087372, |
| "learning_rate": 1.5242253876163399e-05, |
| "loss": 0.1351, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.12217546254396439, |
| "step": 4125, |
| "valid_targets_mean": 1385.0, |
| "valid_targets_min": 635 |
| }, |
| { |
| "epoch": 4.338235294117647, |
| "grad_norm": 0.8168471451852063, |
| "learning_rate": 1.5191388043991712e-05, |
| "loss": 0.1322, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.12848719954490662, |
| "step": 4130, |
| "valid_targets_mean": 1420.3, |
| "valid_targets_min": 592 |
| }, |
| { |
| "epoch": 4.343487394957983, |
| "grad_norm": 0.8687088982404517, |
| "learning_rate": 1.5140555202490359e-05, |
| "loss": 0.1335, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1381555199623108, |
| "step": 4135, |
| "valid_targets_mean": 1435.8, |
| "valid_targets_min": 662 |
| }, |
| { |
| "epoch": 4.348739495798319, |
| "grad_norm": 0.824701387692817, |
| "learning_rate": 1.5089755700410602e-05, |
| "loss": 0.1358, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.13314849138259888, |
| "step": 4140, |
| "valid_targets_mean": 1477.9, |
| "valid_targets_min": 622 |
| }, |
| { |
| "epoch": 4.3539915966386555, |
| "grad_norm": 1.1187004100398168, |
| "learning_rate": 1.5038989886274992e-05, |
| "loss": 0.1372, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1633179783821106, |
| "step": 4145, |
| "valid_targets_mean": 1382.3, |
| "valid_targets_min": 625 |
| }, |
| { |
| "epoch": 4.359243697478991, |
| "grad_norm": 0.843059495998902, |
| "learning_rate": 1.498825810837492e-05, |
| "loss": 0.1354, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.12570440769195557, |
| "step": 4150, |
| "valid_targets_mean": 1461.6, |
| "valid_targets_min": 888 |
| }, |
| { |
| "epoch": 4.364495798319328, |
| "grad_norm": 0.816554096771243, |
| "learning_rate": 1.4937560714768283e-05, |
| "loss": 0.1385, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1403723806142807, |
| "step": 4155, |
| "valid_targets_mean": 1461.2, |
| "valid_targets_min": 635 |
| }, |
| { |
| "epoch": 4.369747899159664, |
| "grad_norm": 0.8797104989098917, |
| "learning_rate": 1.4886898053277086e-05, |
| "loss": 0.1366, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15383698046207428, |
| "step": 4160, |
| "valid_targets_mean": 1542.3, |
| "valid_targets_min": 522 |
| }, |
| { |
| "epoch": 4.375, |
| "grad_norm": 0.7898626242305901, |
| "learning_rate": 1.4836270471485029e-05, |
| "loss": 0.1326, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.12376511842012405, |
| "step": 4165, |
| "valid_targets_mean": 1244.7, |
| "valid_targets_min": 697 |
| }, |
| { |
| "epoch": 4.380252100840336, |
| "grad_norm": 0.8780197054651814, |
| "learning_rate": 1.4785678316735144e-05, |
| "loss": 0.1308, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14664515852928162, |
| "step": 4170, |
| "valid_targets_mean": 1673.9, |
| "valid_targets_min": 730 |
| }, |
| { |
| "epoch": 4.385504201680672, |
| "grad_norm": 0.9346525477732902, |
| "learning_rate": 1.4735121936127406e-05, |
| "loss": 0.1321, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15194876492023468, |
| "step": 4175, |
| "valid_targets_mean": 1695.9, |
| "valid_targets_min": 719 |
| }, |
| { |
| "epoch": 4.390756302521009, |
| "grad_norm": 0.9211785858456039, |
| "learning_rate": 1.4684601676516366e-05, |
| "loss": 0.1318, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.138489231467247, |
| "step": 4180, |
| "valid_targets_mean": 1400.1, |
| "valid_targets_min": 745 |
| }, |
| { |
| "epoch": 4.3960084033613445, |
| "grad_norm": 0.8373085168906266, |
| "learning_rate": 1.4634117884508738e-05, |
| "loss": 0.1274, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.12678782641887665, |
| "step": 4185, |
| "valid_targets_mean": 1299.4, |
| "valid_targets_min": 680 |
| }, |
| { |
| "epoch": 4.401260504201681, |
| "grad_norm": 0.8325212171741512, |
| "learning_rate": 1.458367090646105e-05, |
| "loss": 0.1278, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1405733823776245, |
| "step": 4190, |
| "valid_targets_mean": 1521.1, |
| "valid_targets_min": 778 |
| }, |
| { |
| "epoch": 4.406512605042017, |
| "grad_norm": 0.9073092150371975, |
| "learning_rate": 1.4533261088477257e-05, |
| "loss": 0.141, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16051650047302246, |
| "step": 4195, |
| "valid_targets_mean": 1617.8, |
| "valid_targets_min": 851 |
| }, |
| { |
| "epoch": 4.411764705882353, |
| "grad_norm": 0.7397162950148408, |
| "learning_rate": 1.448288877640637e-05, |
| "loss": 0.1297, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.11534975469112396, |
| "step": 4200, |
| "valid_targets_mean": 1434.4, |
| "valid_targets_min": 692 |
| }, |
| { |
| "epoch": 4.417016806722689, |
| "grad_norm": 0.7733942072643732, |
| "learning_rate": 1.4432554315840082e-05, |
| "loss": 0.1279, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.12870749831199646, |
| "step": 4205, |
| "valid_targets_mean": 1500.7, |
| "valid_targets_min": 741 |
| }, |
| { |
| "epoch": 4.4222689075630255, |
| "grad_norm": 0.8287058084711577, |
| "learning_rate": 1.438225805211039e-05, |
| "loss": 0.1252, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.12352833896875381, |
| "step": 4210, |
| "valid_targets_mean": 1306.1, |
| "valid_targets_min": 639 |
| }, |
| { |
| "epoch": 4.427521008403361, |
| "grad_norm": 0.8460146278274804, |
| "learning_rate": 1.4332000330287248e-05, |
| "loss": 0.1163, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.11612292379140854, |
| "step": 4215, |
| "valid_targets_mean": 1381.9, |
| "valid_targets_min": 772 |
| }, |
| { |
| "epoch": 4.432773109243698, |
| "grad_norm": 0.8428338799366506, |
| "learning_rate": 1.428178149517617e-05, |
| "loss": 0.1303, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1271061897277832, |
| "step": 4220, |
| "valid_targets_mean": 1532.2, |
| "valid_targets_min": 765 |
| }, |
| { |
| "epoch": 4.438025210084033, |
| "grad_norm": 0.7764971458397468, |
| "learning_rate": 1.4231601891315876e-05, |
| "loss": 0.1255, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1206718236207962, |
| "step": 4225, |
| "valid_targets_mean": 1425.2, |
| "valid_targets_min": 695 |
| }, |
| { |
| "epoch": 4.44327731092437, |
| "grad_norm": 0.8017610552892988, |
| "learning_rate": 1.418146186297594e-05, |
| "loss": 0.1257, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.12809637188911438, |
| "step": 4230, |
| "valid_targets_mean": 1575.6, |
| "valid_targets_min": 807 |
| }, |
| { |
| "epoch": 4.448529411764706, |
| "grad_norm": 0.8204445283311675, |
| "learning_rate": 1.413136175415441e-05, |
| "loss": 0.1298, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1299220323562622, |
| "step": 4235, |
| "valid_targets_mean": 1367.1, |
| "valid_targets_min": 873 |
| }, |
| { |
| "epoch": 4.453781512605042, |
| "grad_norm": 0.8229673951166021, |
| "learning_rate": 1.4081301908575457e-05, |
| "loss": 0.1265, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.13332301378250122, |
| "step": 4240, |
| "valid_targets_mean": 1369.4, |
| "valid_targets_min": 591 |
| }, |
| { |
| "epoch": 4.459033613445378, |
| "grad_norm": 0.8025930909766332, |
| "learning_rate": 1.4031282669687035e-05, |
| "loss": 0.1291, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.11734200268983841, |
| "step": 4245, |
| "valid_targets_mean": 1319.9, |
| "valid_targets_min": 646 |
| }, |
| { |
| "epoch": 4.464285714285714, |
| "grad_norm": 0.9239894606873152, |
| "learning_rate": 1.3981304380658474e-05, |
| "loss": 0.1925, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.21401086449623108, |
| "step": 4250, |
| "valid_targets_mean": 4488.5, |
| "valid_targets_min": 1323 |
| }, |
| { |
| "epoch": 4.46953781512605, |
| "grad_norm": 0.6598274422549769, |
| "learning_rate": 1.3931367384378183e-05, |
| "loss": 0.2242, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2256534993648529, |
| "step": 4255, |
| "valid_targets_mean": 4344.8, |
| "valid_targets_min": 1631 |
| }, |
| { |
| "epoch": 4.474789915966387, |
| "grad_norm": 0.5777142536216642, |
| "learning_rate": 1.3881472023451262e-05, |
| "loss": 0.2173, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.21953260898590088, |
| "step": 4260, |
| "valid_targets_mean": 4358.4, |
| "valid_targets_min": 1509 |
| }, |
| { |
| "epoch": 4.480042016806722, |
| "grad_norm": 0.5644265671396247, |
| "learning_rate": 1.3831618640197153e-05, |
| "loss": 0.211, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.19617916643619537, |
| "step": 4265, |
| "valid_targets_mean": 4067.4, |
| "valid_targets_min": 2689 |
| }, |
| { |
| "epoch": 4.485294117647059, |
| "grad_norm": 0.6800329773093203, |
| "learning_rate": 1.3781807576647315e-05, |
| "loss": 0.202, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.19588659703731537, |
| "step": 4270, |
| "valid_targets_mean": 3231.8, |
| "valid_targets_min": 1184 |
| }, |
| { |
| "epoch": 4.4905462184873945, |
| "grad_norm": 0.583998108779037, |
| "learning_rate": 1.373203917454285e-05, |
| "loss": 0.2187, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18826688826084137, |
| "step": 4275, |
| "valid_targets_mean": 4015.0, |
| "valid_targets_min": 1413 |
| }, |
| { |
| "epoch": 4.495798319327731, |
| "grad_norm": 0.5993018924234834, |
| "learning_rate": 1.3682313775332186e-05, |
| "loss": 0.1913, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.20078253746032715, |
| "step": 4280, |
| "valid_targets_mean": 4218.1, |
| "valid_targets_min": 2160 |
| }, |
| { |
| "epoch": 4.501050420168067, |
| "grad_norm": 0.6213345974417059, |
| "learning_rate": 1.3632631720168705e-05, |
| "loss": 0.2102, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.21006864309310913, |
| "step": 4285, |
| "valid_targets_mean": 3998.2, |
| "valid_targets_min": 1654 |
| }, |
| { |
| "epoch": 4.506302521008403, |
| "grad_norm": 0.6454438419555589, |
| "learning_rate": 1.358299334990842e-05, |
| "loss": 0.2107, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.21891412138938904, |
| "step": 4290, |
| "valid_targets_mean": 3480.9, |
| "valid_targets_min": 1462 |
| }, |
| { |
| "epoch": 4.51155462184874, |
| "grad_norm": 0.5793855112485845, |
| "learning_rate": 1.3533399005107635e-05, |
| "loss": 0.214, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.19543211162090302, |
| "step": 4295, |
| "valid_targets_mean": 4008.8, |
| "valid_targets_min": 874 |
| }, |
| { |
| "epoch": 4.516806722689076, |
| "grad_norm": 0.5886149747788205, |
| "learning_rate": 1.3483849026020603e-05, |
| "loss": 0.2089, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.19601313769817352, |
| "step": 4300, |
| "valid_targets_mean": 3658.9, |
| "valid_targets_min": 953 |
| }, |
| { |
| "epoch": 4.522058823529412, |
| "grad_norm": 0.6162622988474424, |
| "learning_rate": 1.3434343752597199e-05, |
| "loss": 0.2143, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2158222198486328, |
| "step": 4305, |
| "valid_targets_mean": 4291.2, |
| "valid_targets_min": 1265 |
| }, |
| { |
| "epoch": 4.527310924369748, |
| "grad_norm": 0.5225855536952907, |
| "learning_rate": 1.3384883524480576e-05, |
| "loss": 0.2084, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1962510198354721, |
| "step": 4310, |
| "valid_targets_mean": 4939.0, |
| "valid_targets_min": 1596 |
| }, |
| { |
| "epoch": 4.532563025210084, |
| "grad_norm": 0.639285317945504, |
| "learning_rate": 1.333546868100486e-05, |
| "loss": 0.2098, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.20231905579566956, |
| "step": 4315, |
| "valid_targets_mean": 3340.8, |
| "valid_targets_min": 1759 |
| }, |
| { |
| "epoch": 4.53781512605042, |
| "grad_norm": 0.6692843580892279, |
| "learning_rate": 1.3286099561192784e-05, |
| "loss": 0.2128, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.21312329173088074, |
| "step": 4320, |
| "valid_targets_mean": 3084.3, |
| "valid_targets_min": 1353 |
| }, |
| { |
| "epoch": 4.543067226890757, |
| "grad_norm": 0.6120205294157653, |
| "learning_rate": 1.3236776503753397e-05, |
| "loss": 0.2112, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.19397076964378357, |
| "step": 4325, |
| "valid_targets_mean": 3763.4, |
| "valid_targets_min": 1643 |
| }, |
| { |
| "epoch": 4.548319327731092, |
| "grad_norm": 0.668479121847745, |
| "learning_rate": 1.3187499847079713e-05, |
| "loss": 0.2093, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2041492760181427, |
| "step": 4330, |
| "valid_targets_mean": 3227.9, |
| "valid_targets_min": 1269 |
| }, |
| { |
| "epoch": 4.553571428571429, |
| "grad_norm": 0.6752786859520122, |
| "learning_rate": 1.3138269929246427e-05, |
| "loss": 0.2217, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.22046181559562683, |
| "step": 4335, |
| "valid_targets_mean": 3324.2, |
| "valid_targets_min": 1681 |
| }, |
| { |
| "epoch": 4.5588235294117645, |
| "grad_norm": 0.6548319871768743, |
| "learning_rate": 1.308908708800753e-05, |
| "loss": 0.2125, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2117079198360443, |
| "step": 4340, |
| "valid_targets_mean": 3792.3, |
| "valid_targets_min": 1477 |
| }, |
| { |
| "epoch": 4.564075630252101, |
| "grad_norm": 0.6879232525076725, |
| "learning_rate": 1.3039951660794063e-05, |
| "loss": 0.2128, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.20829437673091888, |
| "step": 4345, |
| "valid_targets_mean": 3502.8, |
| "valid_targets_min": 662 |
| }, |
| { |
| "epoch": 4.569327731092437, |
| "grad_norm": 0.6897322297757514, |
| "learning_rate": 1.2990863984711773e-05, |
| "loss": 0.2062, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.21518868207931519, |
| "step": 4350, |
| "valid_targets_mean": 3320.8, |
| "valid_targets_min": 2077 |
| }, |
| { |
| "epoch": 4.574579831932773, |
| "grad_norm": 0.688837675359442, |
| "learning_rate": 1.294182439653878e-05, |
| "loss": 0.2003, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18814504146575928, |
| "step": 4355, |
| "valid_targets_mean": 2756.4, |
| "valid_targets_min": 1505 |
| }, |
| { |
| "epoch": 4.579831932773109, |
| "grad_norm": 0.7330677533755521, |
| "learning_rate": 1.2892833232723297e-05, |
| "loss": 0.2183, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.24092328548431396, |
| "step": 4360, |
| "valid_targets_mean": 3447.9, |
| "valid_targets_min": 1978 |
| }, |
| { |
| "epoch": 4.5850840336134455, |
| "grad_norm": 0.7241849761685287, |
| "learning_rate": 1.2843890829381303e-05, |
| "loss": 0.2165, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.26030996441841125, |
| "step": 4365, |
| "valid_targets_mean": 4194.2, |
| "valid_targets_min": 1490 |
| }, |
| { |
| "epoch": 4.590336134453781, |
| "grad_norm": 0.7026396424067808, |
| "learning_rate": 1.2794997522294263e-05, |
| "loss": 0.2035, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.21944516897201538, |
| "step": 4370, |
| "valid_targets_mean": 2970.4, |
| "valid_targets_min": 1422 |
| }, |
| { |
| "epoch": 4.595588235294118, |
| "grad_norm": 0.6259185795346857, |
| "learning_rate": 1.2746153646906766e-05, |
| "loss": 0.1976, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1922265887260437, |
| "step": 4375, |
| "valid_targets_mean": 3396.0, |
| "valid_targets_min": 1603 |
| }, |
| { |
| "epoch": 4.600840336134453, |
| "grad_norm": 0.7438486179833006, |
| "learning_rate": 1.2697359538324303e-05, |
| "loss": 0.2121, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.21673396229743958, |
| "step": 4380, |
| "valid_targets_mean": 2728.2, |
| "valid_targets_min": 863 |
| }, |
| { |
| "epoch": 4.60609243697479, |
| "grad_norm": 0.6370907634088678, |
| "learning_rate": 1.2648615531310907e-05, |
| "loss": 0.2024, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.19770187139511108, |
| "step": 4385, |
| "valid_targets_mean": 3677.7, |
| "valid_targets_min": 1208 |
| }, |
| { |
| "epoch": 4.6113445378151265, |
| "grad_norm": 0.68482682086709, |
| "learning_rate": 1.259992196028688e-05, |
| "loss": 0.2102, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2116718888282776, |
| "step": 4390, |
| "valid_targets_mean": 3316.8, |
| "valid_targets_min": 1501 |
| }, |
| { |
| "epoch": 4.616596638655462, |
| "grad_norm": 0.7052208338762722, |
| "learning_rate": 1.2551279159326495e-05, |
| "loss": 0.2127, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2252679467201233, |
| "step": 4395, |
| "valid_targets_mean": 3425.5, |
| "valid_targets_min": 1828 |
| }, |
| { |
| "epoch": 4.621848739495798, |
| "grad_norm": 0.6124764309205445, |
| "learning_rate": 1.2502687462155709e-05, |
| "loss": 0.202, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1903487741947174, |
| "step": 4400, |
| "valid_targets_mean": 3237.6, |
| "valid_targets_min": 1110 |
| }, |
| { |
| "epoch": 4.6271008403361344, |
| "grad_norm": 0.8771050749310795, |
| "learning_rate": 1.2454147202149865e-05, |
| "loss": 0.2051, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.21824470162391663, |
| "step": 4405, |
| "valid_targets_mean": 2931.8, |
| "valid_targets_min": 1283 |
| }, |
| { |
| "epoch": 4.632352941176471, |
| "grad_norm": 0.681928418139891, |
| "learning_rate": 1.2405658712331409e-05, |
| "loss": 0.2058, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.20178645849227905, |
| "step": 4410, |
| "valid_targets_mean": 3311.4, |
| "valid_targets_min": 1714 |
| }, |
| { |
| "epoch": 4.637605042016807, |
| "grad_norm": 0.7118807798201505, |
| "learning_rate": 1.2357222325367604e-05, |
| "loss": 0.2084, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.21912041306495667, |
| "step": 4415, |
| "valid_targets_mean": 3572.0, |
| "valid_targets_min": 1216 |
| }, |
| { |
| "epoch": 4.642857142857143, |
| "grad_norm": 0.6823054558978693, |
| "learning_rate": 1.2308838373568249e-05, |
| "loss": 0.2051, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.20421810448169708, |
| "step": 4420, |
| "valid_targets_mean": 3451.4, |
| "valid_targets_min": 924 |
| }, |
| { |
| "epoch": 4.648109243697479, |
| "grad_norm": 0.6938843637670672, |
| "learning_rate": 1.2260507188883395e-05, |
| "loss": 0.2049, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.19850008189678192, |
| "step": 4425, |
| "valid_targets_mean": 3175.6, |
| "valid_targets_min": 1292 |
| }, |
| { |
| "epoch": 4.6533613445378155, |
| "grad_norm": 0.7077142011650852, |
| "learning_rate": 1.2212229102901077e-05, |
| "loss": 0.2091, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2047484815120697, |
| "step": 4430, |
| "valid_targets_mean": 3533.4, |
| "valid_targets_min": 1265 |
| }, |
| { |
| "epoch": 4.658613445378151, |
| "grad_norm": 0.7159319249656814, |
| "learning_rate": 1.2164004446845037e-05, |
| "loss": 0.1944, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.20691466331481934, |
| "step": 4435, |
| "valid_targets_mean": 3325.9, |
| "valid_targets_min": 1394 |
| }, |
| { |
| "epoch": 4.663865546218488, |
| "grad_norm": 0.7559645592765224, |
| "learning_rate": 1.2115833551572438e-05, |
| "loss": 0.2142, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2295243889093399, |
| "step": 4440, |
| "valid_targets_mean": 3590.2, |
| "valid_targets_min": 1844 |
| }, |
| { |
| "epoch": 4.669117647058823, |
| "grad_norm": 0.7415198687787329, |
| "learning_rate": 1.2067716747571616e-05, |
| "loss": 0.1999, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.23479296267032623, |
| "step": 4445, |
| "valid_targets_mean": 3564.9, |
| "valid_targets_min": 1482 |
| }, |
| { |
| "epoch": 4.67436974789916, |
| "grad_norm": 0.688853324893974, |
| "learning_rate": 1.201965436495978e-05, |
| "loss": 0.2005, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.21714499592781067, |
| "step": 4450, |
| "valid_targets_mean": 3340.8, |
| "valid_targets_min": 1654 |
| }, |
| { |
| "epoch": 4.679621848739496, |
| "grad_norm": 0.7016909162355258, |
| "learning_rate": 1.1971646733480784e-05, |
| "loss": 0.2067, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.20046481490135193, |
| "step": 4455, |
| "valid_targets_mean": 2951.6, |
| "valid_targets_min": 584 |
| }, |
| { |
| "epoch": 4.684873949579832, |
| "grad_norm": 0.6941971218245336, |
| "learning_rate": 1.1923694182502848e-05, |
| "loss": 0.2035, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2116384208202362, |
| "step": 4460, |
| "valid_targets_mean": 3478.9, |
| "valid_targets_min": 1049 |
| }, |
| { |
| "epoch": 4.690126050420168, |
| "grad_norm": 0.6893303247496907, |
| "learning_rate": 1.1875797041016286e-05, |
| "loss": 0.2129, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2102683186531067, |
| "step": 4465, |
| "valid_targets_mean": 3287.8, |
| "valid_targets_min": 1350 |
| }, |
| { |
| "epoch": 4.695378151260504, |
| "grad_norm": 0.7350721707173831, |
| "learning_rate": 1.1827955637631283e-05, |
| "loss": 0.2089, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.21726731956005096, |
| "step": 4470, |
| "valid_targets_mean": 3590.0, |
| "valid_targets_min": 1624 |
| }, |
| { |
| "epoch": 4.70063025210084, |
| "grad_norm": 0.6938494286562441, |
| "learning_rate": 1.1780170300575602e-05, |
| "loss": 0.1884, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18289947509765625, |
| "step": 4475, |
| "valid_targets_mean": 2807.6, |
| "valid_targets_min": 916 |
| }, |
| { |
| "epoch": 4.705882352941177, |
| "grad_norm": 0.6412962232296662, |
| "learning_rate": 1.1732441357692353e-05, |
| "loss": 0.2057, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18760257959365845, |
| "step": 4480, |
| "valid_targets_mean": 3658.0, |
| "valid_targets_min": 2032 |
| }, |
| { |
| "epoch": 4.711134453781512, |
| "grad_norm": 0.7583818317813796, |
| "learning_rate": 1.1684769136437742e-05, |
| "loss": 0.2024, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.21241483092308044, |
| "step": 4485, |
| "valid_targets_mean": 3141.9, |
| "valid_targets_min": 1259 |
| }, |
| { |
| "epoch": 4.716386554621849, |
| "grad_norm": 0.6326913726737966, |
| "learning_rate": 1.1637153963878815e-05, |
| "loss": 0.195, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.19029675424098969, |
| "step": 4490, |
| "valid_targets_mean": 3575.4, |
| "valid_targets_min": 1183 |
| }, |
| { |
| "epoch": 4.7216386554621845, |
| "grad_norm": 0.6290790387214149, |
| "learning_rate": 1.1589596166691231e-05, |
| "loss": 0.192, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.21391956508159637, |
| "step": 4495, |
| "valid_targets_mean": 4193.9, |
| "valid_targets_min": 1101 |
| }, |
| { |
| "epoch": 4.726890756302521, |
| "grad_norm": 0.6475834579736413, |
| "learning_rate": 1.1542096071157012e-05, |
| "loss": 0.2114, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.20298393070697784, |
| "step": 4500, |
| "valid_targets_mean": 3821.9, |
| "valid_targets_min": 1726 |
| }, |
| { |
| "epoch": 4.732142857142857, |
| "grad_norm": 0.6979196464072809, |
| "learning_rate": 1.1494654003162285e-05, |
| "loss": 0.1993, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.20892876386642456, |
| "step": 4505, |
| "valid_targets_mean": 3171.0, |
| "valid_targets_min": 1669 |
| }, |
| { |
| "epoch": 4.737394957983193, |
| "grad_norm": 0.6535989262032701, |
| "learning_rate": 1.1447270288195089e-05, |
| "loss": 0.208, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.20477300882339478, |
| "step": 4510, |
| "valid_targets_mean": 3491.4, |
| "valid_targets_min": 1185 |
| }, |
| { |
| "epoch": 4.742647058823529, |
| "grad_norm": 0.7434999336674271, |
| "learning_rate": 1.1399945251343114e-05, |
| "loss": 0.215, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.23692408204078674, |
| "step": 4515, |
| "valid_targets_mean": 3283.9, |
| "valid_targets_min": 1091 |
| }, |
| { |
| "epoch": 4.7478991596638656, |
| "grad_norm": 0.7222774058425186, |
| "learning_rate": 1.1352679217291457e-05, |
| "loss": 0.2049, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2167915254831314, |
| "step": 4520, |
| "valid_targets_mean": 3654.3, |
| "valid_targets_min": 1352 |
| }, |
| { |
| "epoch": 4.753151260504202, |
| "grad_norm": 0.5928834886740821, |
| "learning_rate": 1.1305472510320419e-05, |
| "loss": 0.1978, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1938672959804535, |
| "step": 4525, |
| "valid_targets_mean": 4265.6, |
| "valid_targets_min": 1535 |
| }, |
| { |
| "epoch": 4.758403361344538, |
| "grad_norm": 0.7282043659742619, |
| "learning_rate": 1.1258325454303286e-05, |
| "loss": 0.1956, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1851435899734497, |
| "step": 4530, |
| "valid_targets_mean": 2997.0, |
| "valid_targets_min": 854 |
| }, |
| { |
| "epoch": 4.7636554621848735, |
| "grad_norm": 0.7451730107148029, |
| "learning_rate": 1.1211238372704073e-05, |
| "loss": 0.1919, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18663758039474487, |
| "step": 4535, |
| "valid_targets_mean": 2795.1, |
| "valid_targets_min": 1179 |
| }, |
| { |
| "epoch": 4.76890756302521, |
| "grad_norm": 0.7184545671700696, |
| "learning_rate": 1.1164211588575339e-05, |
| "loss": 0.1969, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.19145233929157257, |
| "step": 4540, |
| "valid_targets_mean": 3652.7, |
| "valid_targets_min": 1444 |
| }, |
| { |
| "epoch": 4.774159663865547, |
| "grad_norm": 0.7397780134283227, |
| "learning_rate": 1.1117245424555967e-05, |
| "loss": 0.1887, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1895849108695984, |
| "step": 4545, |
| "valid_targets_mean": 2500.1, |
| "valid_targets_min": 642 |
| }, |
| { |
| "epoch": 4.779411764705882, |
| "grad_norm": 0.6713856995898463, |
| "learning_rate": 1.1070340202868915e-05, |
| "loss": 0.1896, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1881069391965866, |
| "step": 4550, |
| "valid_targets_mean": 3590.1, |
| "valid_targets_min": 1637 |
| }, |
| { |
| "epoch": 4.784663865546219, |
| "grad_norm": 0.8087445793498248, |
| "learning_rate": 1.1023496245319056e-05, |
| "loss": 0.2125, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.24480175971984863, |
| "step": 4555, |
| "valid_targets_mean": 3466.0, |
| "valid_targets_min": 1175 |
| }, |
| { |
| "epoch": 4.7899159663865545, |
| "grad_norm": 0.7068565649556457, |
| "learning_rate": 1.0976713873290925e-05, |
| "loss": 0.1939, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.20139086246490479, |
| "step": 4560, |
| "valid_targets_mean": 3205.6, |
| "valid_targets_min": 1612 |
| }, |
| { |
| "epoch": 4.795168067226891, |
| "grad_norm": 0.6620926828840262, |
| "learning_rate": 1.0929993407746543e-05, |
| "loss": 0.2027, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.19388242065906525, |
| "step": 4565, |
| "valid_targets_mean": 3423.2, |
| "valid_targets_min": 1743 |
| }, |
| { |
| "epoch": 4.800420168067227, |
| "grad_norm": 0.6727413718092184, |
| "learning_rate": 1.0883335169223212e-05, |
| "loss": 0.2005, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1882367581129074, |
| "step": 4570, |
| "valid_targets_mean": 3168.8, |
| "valid_targets_min": 1398 |
| }, |
| { |
| "epoch": 4.805672268907563, |
| "grad_norm": 0.6558248286205179, |
| "learning_rate": 1.0836739477831297e-05, |
| "loss": 0.1994, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.20704635977745056, |
| "step": 4575, |
| "valid_targets_mean": 3489.9, |
| "valid_targets_min": 1558 |
| }, |
| { |
| "epoch": 4.810924369747899, |
| "grad_norm": 0.6847057248913088, |
| "learning_rate": 1.0790206653252055e-05, |
| "loss": 0.2032, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.20168985426425934, |
| "step": 4580, |
| "valid_targets_mean": 3278.1, |
| "valid_targets_min": 1445 |
| }, |
| { |
| "epoch": 4.8161764705882355, |
| "grad_norm": 0.6533366829855569, |
| "learning_rate": 1.0743737014735434e-05, |
| "loss": 0.1938, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18918371200561523, |
| "step": 4585, |
| "valid_targets_mean": 3682.9, |
| "valid_targets_min": 2000 |
| }, |
| { |
| "epoch": 4.821428571428571, |
| "grad_norm": 0.7708553362949551, |
| "learning_rate": 1.0697330881097857e-05, |
| "loss": 0.1956, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.19962045550346375, |
| "step": 4590, |
| "valid_targets_mean": 3065.2, |
| "valid_targets_min": 1243 |
| }, |
| { |
| "epoch": 4.826680672268908, |
| "grad_norm": 0.7089419295191447, |
| "learning_rate": 1.0650988570720077e-05, |
| "loss": 0.2091, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.20890700817108154, |
| "step": 4595, |
| "valid_targets_mean": 3286.4, |
| "valid_targets_min": 1223 |
| }, |
| { |
| "epoch": 4.831932773109243, |
| "grad_norm": 0.7147247615274656, |
| "learning_rate": 1.0604710401544963e-05, |
| "loss": 0.2103, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.19596712291240692, |
| "step": 4600, |
| "valid_targets_mean": 3027.9, |
| "valid_targets_min": 869 |
| }, |
| { |
| "epoch": 4.83718487394958, |
| "grad_norm": 0.7304597580233416, |
| "learning_rate": 1.0558496691075318e-05, |
| "loss": 0.2022, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.20904818177223206, |
| "step": 4605, |
| "valid_targets_mean": 3077.8, |
| "valid_targets_min": 1603 |
| }, |
| { |
| "epoch": 4.842436974789916, |
| "grad_norm": 0.7224217938478468, |
| "learning_rate": 1.0512347756371726e-05, |
| "loss": 0.206, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18744680285453796, |
| "step": 4610, |
| "valid_targets_mean": 2883.4, |
| "valid_targets_min": 721 |
| }, |
| { |
| "epoch": 4.847689075630252, |
| "grad_norm": 0.7107738441028865, |
| "learning_rate": 1.0466263914050362e-05, |
| "loss": 0.2078, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2116435468196869, |
| "step": 4615, |
| "valid_targets_mean": 3873.2, |
| "valid_targets_min": 1994 |
| }, |
| { |
| "epoch": 4.852941176470588, |
| "grad_norm": 0.7236551319922022, |
| "learning_rate": 1.0420245480280804e-05, |
| "loss": 0.2098, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18254084885120392, |
| "step": 4620, |
| "valid_targets_mean": 3090.9, |
| "valid_targets_min": 1066 |
| }, |
| { |
| "epoch": 4.858193277310924, |
| "grad_norm": 0.6924268052728789, |
| "learning_rate": 1.0374292770783891e-05, |
| "loss": 0.2099, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.21132606267929077, |
| "step": 4625, |
| "valid_targets_mean": 3609.6, |
| "valid_targets_min": 1648 |
| }, |
| { |
| "epoch": 4.86344537815126, |
| "grad_norm": 0.710132639844148, |
| "learning_rate": 1.0328406100829542e-05, |
| "loss": 0.2081, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.19806388020515442, |
| "step": 4630, |
| "valid_targets_mean": 3135.9, |
| "valid_targets_min": 1889 |
| }, |
| { |
| "epoch": 4.868697478991597, |
| "grad_norm": 8.223593196499644, |
| "learning_rate": 1.0282585785234578e-05, |
| "loss": 0.2083, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.21035614609718323, |
| "step": 4635, |
| "valid_targets_mean": 2491.6, |
| "valid_targets_min": 885 |
| }, |
| { |
| "epoch": 4.873949579831933, |
| "grad_norm": 0.6950690926035392, |
| "learning_rate": 1.023683213836061e-05, |
| "loss": 0.2101, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.20301932096481323, |
| "step": 4640, |
| "valid_targets_mean": 3529.4, |
| "valid_targets_min": 1257 |
| }, |
| { |
| "epoch": 4.879201680672269, |
| "grad_norm": 0.7338702013416679, |
| "learning_rate": 1.0191145474111823e-05, |
| "loss": 0.2063, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.20622602105140686, |
| "step": 4645, |
| "valid_targets_mean": 3178.1, |
| "valid_targets_min": 1372 |
| }, |
| { |
| "epoch": 4.884453781512605, |
| "grad_norm": 0.6717591588502287, |
| "learning_rate": 1.0145526105932872e-05, |
| "loss": 0.2012, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2017562985420227, |
| "step": 4650, |
| "valid_targets_mean": 3422.6, |
| "valid_targets_min": 1598 |
| }, |
| { |
| "epoch": 4.889705882352941, |
| "grad_norm": 0.76533252784604, |
| "learning_rate": 1.0099974346806714e-05, |
| "loss": 0.2065, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1944223940372467, |
| "step": 4655, |
| "valid_targets_mean": 2925.1, |
| "valid_targets_min": 1074 |
| }, |
| { |
| "epoch": 4.894957983193278, |
| "grad_norm": 0.6637317114328515, |
| "learning_rate": 1.0054490509252423e-05, |
| "loss": 0.2099, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.19309523701667786, |
| "step": 4660, |
| "valid_targets_mean": 3366.2, |
| "valid_targets_min": 980 |
| }, |
| { |
| "epoch": 4.900210084033613, |
| "grad_norm": 0.6982820833530574, |
| "learning_rate": 1.0009074905323118e-05, |
| "loss": 0.2175, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.21207424998283386, |
| "step": 4665, |
| "valid_targets_mean": 3100.1, |
| "valid_targets_min": 793 |
| }, |
| { |
| "epoch": 4.90546218487395, |
| "grad_norm": 0.6432617078880017, |
| "learning_rate": 9.963727846603784e-06, |
| "loss": 0.1976, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.21252809464931488, |
| "step": 4670, |
| "valid_targets_mean": 3674.5, |
| "valid_targets_min": 852 |
| }, |
| { |
| "epoch": 4.910714285714286, |
| "grad_norm": 0.7841146093401851, |
| "learning_rate": 9.918449644209087e-06, |
| "loss": 0.1984, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18188413977622986, |
| "step": 4675, |
| "valid_targets_mean": 2951.1, |
| "valid_targets_min": 1107 |
| }, |
| { |
| "epoch": 4.915966386554622, |
| "grad_norm": 0.7711023446249636, |
| "learning_rate": 9.873240608781341e-06, |
| "loss": 0.2054, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.20018140971660614, |
| "step": 4680, |
| "valid_targets_mean": 2839.9, |
| "valid_targets_min": 1298 |
| }, |
| { |
| "epoch": 4.921218487394958, |
| "grad_norm": 0.6720914422866899, |
| "learning_rate": 9.828101050488308e-06, |
| "loss": 0.1995, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.19184359908103943, |
| "step": 4685, |
| "valid_targets_mean": 3508.3, |
| "valid_targets_min": 1428 |
| }, |
| { |
| "epoch": 4.926470588235294, |
| "grad_norm": 0.6979997171728765, |
| "learning_rate": 9.783031279021063e-06, |
| "loss": 0.1949, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1979558765888214, |
| "step": 4690, |
| "valid_targets_mean": 3186.6, |
| "valid_targets_min": 1193 |
| }, |
| { |
| "epoch": 4.93172268907563, |
| "grad_norm": 0.6375536515405493, |
| "learning_rate": 9.738031603591926e-06, |
| "loss": 0.2031, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18585914373397827, |
| "step": 4695, |
| "valid_targets_mean": 3687.8, |
| "valid_targets_min": 1210 |
| }, |
| { |
| "epoch": 4.936974789915967, |
| "grad_norm": 0.6740300095798715, |
| "learning_rate": 9.69310233293227e-06, |
| "loss": 0.1963, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1872563362121582, |
| "step": 4700, |
| "valid_targets_mean": 3261.6, |
| "valid_targets_min": 974 |
| }, |
| { |
| "epoch": 4.942226890756302, |
| "grad_norm": 0.6728949238979616, |
| "learning_rate": 9.648243775290476e-06, |
| "loss": 0.1899, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1736118197441101, |
| "step": 4705, |
| "valid_targets_mean": 2934.8, |
| "valid_targets_min": 1575 |
| }, |
| { |
| "epoch": 4.947478991596639, |
| "grad_norm": 0.7317387069659124, |
| "learning_rate": 9.60345623842974e-06, |
| "loss": 0.1944, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.19196751713752747, |
| "step": 4710, |
| "valid_targets_mean": 3090.5, |
| "valid_targets_min": 1697 |
| }, |
| { |
| "epoch": 4.9527310924369745, |
| "grad_norm": 0.7423800247961655, |
| "learning_rate": 9.558740029626046e-06, |
| "loss": 0.1994, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.19240882992744446, |
| "step": 4715, |
| "valid_targets_mean": 3297.7, |
| "valid_targets_min": 897 |
| }, |
| { |
| "epoch": 4.957983193277311, |
| "grad_norm": 0.79806625760805, |
| "learning_rate": 9.51409545566597e-06, |
| "loss": 0.2198, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.22060896456241608, |
| "step": 4720, |
| "valid_targets_mean": 3071.2, |
| "valid_targets_min": 887 |
| }, |
| { |
| "epoch": 4.963235294117647, |
| "grad_norm": 0.7615537115059738, |
| "learning_rate": 9.469522822844663e-06, |
| "loss": 0.1948, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.20150801539421082, |
| "step": 4725, |
| "valid_targets_mean": 2714.7, |
| "valid_targets_min": 1279 |
| }, |
| { |
| "epoch": 4.968487394957983, |
| "grad_norm": 0.7230728317576487, |
| "learning_rate": 9.425022436963664e-06, |
| "loss": 0.1936, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17812782526016235, |
| "step": 4730, |
| "valid_targets_mean": 3112.9, |
| "valid_targets_min": 1021 |
| }, |
| { |
| "epoch": 4.973739495798319, |
| "grad_norm": 0.8017286637803975, |
| "learning_rate": 9.380594603328875e-06, |
| "loss": 0.2056, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.21535563468933105, |
| "step": 4735, |
| "valid_targets_mean": 3526.3, |
| "valid_targets_min": 654 |
| }, |
| { |
| "epoch": 4.9789915966386555, |
| "grad_norm": 0.7962974276395127, |
| "learning_rate": 9.336239626748432e-06, |
| "loss": 0.2009, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.24022144079208374, |
| "step": 4740, |
| "valid_targets_mean": 2941.2, |
| "valid_targets_min": 1039 |
| }, |
| { |
| "epoch": 4.984243697478991, |
| "grad_norm": 0.6987990811270663, |
| "learning_rate": 9.291957811530602e-06, |
| "loss": 0.208, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.20734629034996033, |
| "step": 4745, |
| "valid_targets_mean": 3804.6, |
| "valid_targets_min": 1737 |
| }, |
| { |
| "epoch": 4.989495798319328, |
| "grad_norm": 0.6320507915977177, |
| "learning_rate": 9.247749461481712e-06, |
| "loss": 0.2059, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17486436665058136, |
| "step": 4750, |
| "valid_targets_mean": 3503.6, |
| "valid_targets_min": 1276 |
| }, |
| { |
| "epoch": 4.994747899159664, |
| "grad_norm": 0.6565835428886582, |
| "learning_rate": 9.203614879904083e-06, |
| "loss": 0.21, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.21443158388137817, |
| "step": 4755, |
| "valid_targets_mean": 4137.7, |
| "valid_targets_min": 1572 |
| }, |
| { |
| "epoch": 5.0, |
| "grad_norm": 0.7198533786254716, |
| "learning_rate": 9.159554369593901e-06, |
| "loss": 0.2046, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2270594984292984, |
| "step": 4760, |
| "valid_targets_mean": 3715.1, |
| "valid_targets_min": 791 |
| }, |
| { |
| "epoch": 5.005252100840337, |
| "grad_norm": 0.7571959238315181, |
| "learning_rate": 9.115568232839193e-06, |
| "loss": 0.1534, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.13461460173130035, |
| "step": 4765, |
| "valid_targets_mean": 1423.4, |
| "valid_targets_min": 715 |
| }, |
| { |
| "epoch": 5.010504201680672, |
| "grad_norm": 0.8301602733718247, |
| "learning_rate": 9.071656771417721e-06, |
| "loss": 0.1363, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.12977659702301025, |
| "step": 4770, |
| "valid_targets_mean": 1407.8, |
| "valid_targets_min": 612 |
| }, |
| { |
| "epoch": 5.015756302521009, |
| "grad_norm": 0.8166485961728386, |
| "learning_rate": 9.027820286594902e-06, |
| "loss": 0.1336, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.13986307382583618, |
| "step": 4775, |
| "valid_targets_mean": 1413.5, |
| "valid_targets_min": 714 |
| }, |
| { |
| "epoch": 5.0210084033613445, |
| "grad_norm": 0.8634652135372101, |
| "learning_rate": 8.984059079121785e-06, |
| "loss": 0.1281, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.12289293855428696, |
| "step": 4780, |
| "valid_targets_mean": 1450.1, |
| "valid_targets_min": 754 |
| }, |
| { |
| "epoch": 5.026260504201681, |
| "grad_norm": 1.0868991923247484, |
| "learning_rate": 8.940373449232935e-06, |
| "loss": 0.1387, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1558552235364914, |
| "step": 4785, |
| "valid_targets_mean": 1481.1, |
| "valid_targets_min": 718 |
| }, |
| { |
| "epoch": 5.031512605042017, |
| "grad_norm": 0.8280248464569533, |
| "learning_rate": 8.896763696644405e-06, |
| "loss": 0.1378, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.13719496130943298, |
| "step": 4790, |
| "valid_targets_mean": 1530.8, |
| "valid_targets_min": 731 |
| }, |
| { |
| "epoch": 5.036764705882353, |
| "grad_norm": 0.8223621736586295, |
| "learning_rate": 8.853230120551693e-06, |
| "loss": 0.1238, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.12621982395648956, |
| "step": 4795, |
| "valid_targets_mean": 1416.6, |
| "valid_targets_min": 725 |
| }, |
| { |
| "epoch": 5.042016806722689, |
| "grad_norm": 0.870763805985631, |
| "learning_rate": 8.809773019627635e-06, |
| "loss": 0.1404, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.13102170825004578, |
| "step": 4800, |
| "valid_targets_mean": 1371.5, |
| "valid_targets_min": 610 |
| }, |
| { |
| "epoch": 5.0472689075630255, |
| "grad_norm": 0.8397454624147834, |
| "learning_rate": 8.766392692020413e-06, |
| "loss": 0.1263, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.12862995266914368, |
| "step": 4805, |
| "valid_targets_mean": 1484.7, |
| "valid_targets_min": 720 |
| }, |
| { |
| "epoch": 5.052521008403361, |
| "grad_norm": 0.7882246072954778, |
| "learning_rate": 8.723089435351497e-06, |
| "loss": 0.1306, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.11443109065294266, |
| "step": 4810, |
| "valid_targets_mean": 1365.5, |
| "valid_targets_min": 765 |
| }, |
| { |
| "epoch": 5.057773109243698, |
| "grad_norm": 0.8742920757552072, |
| "learning_rate": 8.679863546713559e-06, |
| "loss": 0.1256, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.127573624253273, |
| "step": 4815, |
| "valid_targets_mean": 1234.7, |
| "valid_targets_min": 593 |
| }, |
| { |
| "epoch": 5.063025210084033, |
| "grad_norm": 0.7920380834226816, |
| "learning_rate": 8.636715322668498e-06, |
| "loss": 0.1276, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.11717408895492554, |
| "step": 4820, |
| "valid_targets_mean": 1540.4, |
| "valid_targets_min": 704 |
| }, |
| { |
| "epoch": 5.06827731092437, |
| "grad_norm": 0.780341581121388, |
| "learning_rate": 8.593645059245365e-06, |
| "loss": 0.1243, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.11017392575740814, |
| "step": 4825, |
| "valid_targets_mean": 1329.9, |
| "valid_targets_min": 722 |
| }, |
| { |
| "epoch": 5.073529411764706, |
| "grad_norm": 0.7603227971883492, |
| "learning_rate": 8.550653051938333e-06, |
| "loss": 0.1181, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.11557639390230179, |
| "step": 4830, |
| "valid_targets_mean": 1549.6, |
| "valid_targets_min": 865 |
| }, |
| { |
| "epoch": 5.078781512605042, |
| "grad_norm": 0.9030555834076215, |
| "learning_rate": 8.507739595704695e-06, |
| "loss": 0.1192, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.13490742444992065, |
| "step": 4835, |
| "valid_targets_mean": 1507.4, |
| "valid_targets_min": 797 |
| }, |
| { |
| "epoch": 5.084033613445378, |
| "grad_norm": 0.954349785672474, |
| "learning_rate": 8.464904984962832e-06, |
| "loss": 0.1242, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14801670610904694, |
| "step": 4840, |
| "valid_targets_mean": 1542.4, |
| "valid_targets_min": 728 |
| }, |
| { |
| "epoch": 5.089285714285714, |
| "grad_norm": 0.9125020805445457, |
| "learning_rate": 8.422149513590151e-06, |
| "loss": 0.1271, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.13509975373744965, |
| "step": 4845, |
| "valid_targets_mean": 1595.2, |
| "valid_targets_min": 683 |
| }, |
| { |
| "epoch": 5.09453781512605, |
| "grad_norm": 0.871199900697412, |
| "learning_rate": 8.37947347492115e-06, |
| "loss": 0.1303, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.13447391986846924, |
| "step": 4850, |
| "valid_targets_mean": 1401.6, |
| "valid_targets_min": 706 |
| }, |
| { |
| "epoch": 5.099789915966387, |
| "grad_norm": 0.8629277026545269, |
| "learning_rate": 8.33687716174532e-06, |
| "loss": 0.1242, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.11550725251436234, |
| "step": 4855, |
| "valid_targets_mean": 1298.4, |
| "valid_targets_min": 625 |
| }, |
| { |
| "epoch": 5.105042016806722, |
| "grad_norm": 0.8030715253201013, |
| "learning_rate": 8.294360866305192e-06, |
| "loss": 0.1272, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1309053897857666, |
| "step": 4860, |
| "valid_targets_mean": 1659.7, |
| "valid_targets_min": 790 |
| }, |
| { |
| "epoch": 5.110294117647059, |
| "grad_norm": 0.9265947353354664, |
| "learning_rate": 8.251924880294317e-06, |
| "loss": 0.1264, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.13342975080013275, |
| "step": 4865, |
| "valid_targets_mean": 1600.4, |
| "valid_targets_min": 684 |
| }, |
| { |
| "epoch": 5.1155462184873945, |
| "grad_norm": 0.8041955738679034, |
| "learning_rate": 8.20956949485527e-06, |
| "loss": 0.1196, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1035323292016983, |
| "step": 4870, |
| "valid_targets_mean": 1338.3, |
| "valid_targets_min": 739 |
| }, |
| { |
| "epoch": 5.120798319327731, |
| "grad_norm": 0.8494495064085696, |
| "learning_rate": 8.167295000577622e-06, |
| "loss": 0.1197, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.11942795664072037, |
| "step": 4875, |
| "valid_targets_mean": 1456.2, |
| "valid_targets_min": 657 |
| }, |
| { |
| "epoch": 5.126050420168067, |
| "grad_norm": 1.0365198065360532, |
| "learning_rate": 8.125101687496e-06, |
| "loss": 0.1181, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.11641368269920349, |
| "step": 4880, |
| "valid_targets_mean": 1340.2, |
| "valid_targets_min": 783 |
| }, |
| { |
| "epoch": 5.131302521008403, |
| "grad_norm": 0.8635148283698016, |
| "learning_rate": 8.082989845088038e-06, |
| "loss": 0.1203, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.11869832128286362, |
| "step": 4885, |
| "valid_targets_mean": 1394.4, |
| "valid_targets_min": 734 |
| }, |
| { |
| "epoch": 5.13655462184874, |
| "grad_norm": 0.877173265352079, |
| "learning_rate": 8.040959762272441e-06, |
| "loss": 0.1232, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.12606994807720184, |
| "step": 4890, |
| "valid_targets_mean": 1501.8, |
| "valid_targets_min": 678 |
| }, |
| { |
| "epoch": 5.141806722689076, |
| "grad_norm": 0.9671178369518909, |
| "learning_rate": 7.999011727406995e-06, |
| "loss": 0.1224, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.12263111025094986, |
| "step": 4895, |
| "valid_targets_mean": 1651.7, |
| "valid_targets_min": 843 |
| }, |
| { |
| "epoch": 5.147058823529412, |
| "grad_norm": 0.8799343051970719, |
| "learning_rate": 7.957146028286524e-06, |
| "loss": 0.1285, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.13233694434165955, |
| "step": 4900, |
| "valid_targets_mean": 1632.1, |
| "valid_targets_min": 782 |
| }, |
| { |
| "epoch": 5.152310924369748, |
| "grad_norm": 0.8281302903839795, |
| "learning_rate": 7.915362952141017e-06, |
| "loss": 0.1215, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.13629840314388275, |
| "step": 4905, |
| "valid_targets_mean": 1615.3, |
| "valid_targets_min": 957 |
| }, |
| { |
| "epoch": 5.157563025210084, |
| "grad_norm": 0.9542718681795296, |
| "learning_rate": 7.873662785633594e-06, |
| "loss": 0.1291, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14337027072906494, |
| "step": 4910, |
| "valid_targets_mean": 1482.9, |
| "valid_targets_min": 713 |
| }, |
| { |
| "epoch": 5.16281512605042, |
| "grad_norm": 1.3637598590452737, |
| "learning_rate": 7.832045814858538e-06, |
| "loss": 0.1235, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.12161692976951599, |
| "step": 4915, |
| "valid_targets_mean": 1552.8, |
| "valid_targets_min": 726 |
| }, |
| { |
| "epoch": 5.168067226890757, |
| "grad_norm": 0.821599075602171, |
| "learning_rate": 7.790512325339367e-06, |
| "loss": 0.1169, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.12724722921848297, |
| "step": 4920, |
| "valid_targets_mean": 1590.4, |
| "valid_targets_min": 1147 |
| }, |
| { |
| "epoch": 5.173319327731092, |
| "grad_norm": 0.8859043037264651, |
| "learning_rate": 7.74906260202685e-06, |
| "loss": 0.1194, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1232469454407692, |
| "step": 4925, |
| "valid_targets_mean": 1417.6, |
| "valid_targets_min": 700 |
| }, |
| { |
| "epoch": 5.178571428571429, |
| "grad_norm": 0.8207302664180218, |
| "learning_rate": 7.707696929297053e-06, |
| "loss": 0.1116, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.10313037782907486, |
| "step": 4930, |
| "valid_targets_mean": 1255.4, |
| "valid_targets_min": 640 |
| }, |
| { |
| "epoch": 5.1838235294117645, |
| "grad_norm": 0.8196199367733106, |
| "learning_rate": 7.666415590949382e-06, |
| "loss": 0.1214, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.12141343951225281, |
| "step": 4935, |
| "valid_targets_mean": 1566.6, |
| "valid_targets_min": 817 |
| }, |
| { |
| "epoch": 5.189075630252101, |
| "grad_norm": 0.8397722105470354, |
| "learning_rate": 7.625218870204676e-06, |
| "loss": 0.1157, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.11369533091783524, |
| "step": 4940, |
| "valid_targets_mean": 1440.9, |
| "valid_targets_min": 724 |
| }, |
| { |
| "epoch": 5.194327731092437, |
| "grad_norm": 0.84723032993192, |
| "learning_rate": 7.584107049703195e-06, |
| "loss": 0.1194, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1220942959189415, |
| "step": 4945, |
| "valid_targets_mean": 1399.1, |
| "valid_targets_min": 657 |
| }, |
| { |
| "epoch": 5.199579831932773, |
| "grad_norm": 1.1583713663548252, |
| "learning_rate": 7.5430804115027615e-06, |
| "loss": 0.1222, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1239510029554367, |
| "step": 4950, |
| "valid_targets_mean": 1334.3, |
| "valid_targets_min": 746 |
| }, |
| { |
| "epoch": 5.204831932773109, |
| "grad_norm": 0.940619146388919, |
| "learning_rate": 7.502139237076744e-06, |
| "loss": 0.1203, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.13509805500507355, |
| "step": 4955, |
| "valid_targets_mean": 1452.8, |
| "valid_targets_min": 692 |
| }, |
| { |
| "epoch": 5.2100840336134455, |
| "grad_norm": 0.9031648217368532, |
| "learning_rate": 7.461283807312194e-06, |
| "loss": 0.117, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.10953864455223083, |
| "step": 4960, |
| "valid_targets_mean": 1338.4, |
| "valid_targets_min": 682 |
| }, |
| { |
| "epoch": 5.215336134453781, |
| "grad_norm": 0.7885774798170768, |
| "learning_rate": 7.420514402507886e-06, |
| "loss": 0.1134, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.11579865217208862, |
| "step": 4965, |
| "valid_targets_mean": 1360.2, |
| "valid_targets_min": 703 |
| }, |
| { |
| "epoch": 5.220588235294118, |
| "grad_norm": 0.8567753502507811, |
| "learning_rate": 7.379831302372389e-06, |
| "loss": 0.1264, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.12191884219646454, |
| "step": 4970, |
| "valid_targets_mean": 1520.9, |
| "valid_targets_min": 864 |
| }, |
| { |
| "epoch": 5.225840336134453, |
| "grad_norm": 0.9494851235486876, |
| "learning_rate": 7.3392347860221556e-06, |
| "loss": 0.1282, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16232752799987793, |
| "step": 4975, |
| "valid_targets_mean": 1814.6, |
| "valid_targets_min": 734 |
| }, |
| { |
| "epoch": 5.23109243697479, |
| "grad_norm": 0.8077534069393267, |
| "learning_rate": 7.298725131979629e-06, |
| "loss": 0.1143, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.11486963927745819, |
| "step": 4980, |
| "valid_targets_mean": 1478.3, |
| "valid_targets_min": 607 |
| }, |
| { |
| "epoch": 5.236344537815126, |
| "grad_norm": 0.8359577317112136, |
| "learning_rate": 7.258302618171287e-06, |
| "loss": 0.1153, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.11313410103321075, |
| "step": 4985, |
| "valid_targets_mean": 1497.9, |
| "valid_targets_min": 551 |
| }, |
| { |
| "epoch": 5.241596638655462, |
| "grad_norm": 0.9503036196925028, |
| "learning_rate": 7.217967521925775e-06, |
| "loss": 0.1215, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.12508943676948547, |
| "step": 4990, |
| "valid_targets_mean": 1550.5, |
| "valid_targets_min": 676 |
| }, |
| { |
| "epoch": 5.246848739495798, |
| "grad_norm": 0.8718205924513632, |
| "learning_rate": 7.177720119971998e-06, |
| "loss": 0.1179, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.11915310472249985, |
| "step": 4995, |
| "valid_targets_mean": 1372.5, |
| "valid_targets_min": 904 |
| }, |
| { |
| "epoch": 5.2521008403361344, |
| "grad_norm": 0.9288193265136786, |
| "learning_rate": 7.137560688437184e-06, |
| "loss": 0.1122, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.12416621297597885, |
| "step": 5000, |
| "valid_targets_mean": 1479.0, |
| "valid_targets_min": 859 |
| }, |
| { |
| "epoch": 5.257352941176471, |
| "grad_norm": 0.8635518493795323, |
| "learning_rate": 7.097489502845047e-06, |
| "loss": 0.1082, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.09854140877723694, |
| "step": 5005, |
| "valid_targets_mean": 1234.8, |
| "valid_targets_min": 737 |
| }, |
| { |
| "epoch": 5.262605042016807, |
| "grad_norm": 0.9381227734247657, |
| "learning_rate": 7.0575068381138525e-06, |
| "loss": 0.1246, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.12833383679389954, |
| "step": 5010, |
| "valid_targets_mean": 1363.2, |
| "valid_targets_min": 791 |
| }, |
| { |
| "epoch": 5.267857142857143, |
| "grad_norm": 0.8806803188401461, |
| "learning_rate": 7.0176129685545414e-06, |
| "loss": 0.1202, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.12506265938282013, |
| "step": 5015, |
| "valid_targets_mean": 1532.1, |
| "valid_targets_min": 786 |
| }, |
| { |
| "epoch": 5.273109243697479, |
| "grad_norm": 0.8640788078067893, |
| "learning_rate": 6.977808167868867e-06, |
| "loss": 0.1139, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1157342940568924, |
| "step": 5020, |
| "valid_targets_mean": 1471.0, |
| "valid_targets_min": 944 |
| }, |
| { |
| "epoch": 5.2783613445378155, |
| "grad_norm": 0.8116063638815398, |
| "learning_rate": 6.9380927091475085e-06, |
| "loss": 0.1159, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.10994266718626022, |
| "step": 5025, |
| "valid_targets_mean": 1494.1, |
| "valid_targets_min": 1075 |
| }, |
| { |
| "epoch": 5.283613445378151, |
| "grad_norm": 0.8409841937184768, |
| "learning_rate": 6.898466864868165e-06, |
| "loss": 0.1185, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1092015877366066, |
| "step": 5030, |
| "valid_targets_mean": 1340.9, |
| "valid_targets_min": 740 |
| }, |
| { |
| "epoch": 5.288865546218488, |
| "grad_norm": 0.8012571565338946, |
| "learning_rate": 6.858930906893751e-06, |
| "loss": 0.119, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.12151382863521576, |
| "step": 5035, |
| "valid_targets_mean": 1530.9, |
| "valid_targets_min": 727 |
| }, |
| { |
| "epoch": 5.294117647058823, |
| "grad_norm": 1.0099731756987655, |
| "learning_rate": 6.819485106470454e-06, |
| "loss": 0.1119, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.115475133061409, |
| "step": 5040, |
| "valid_targets_mean": 1233.0, |
| "valid_targets_min": 636 |
| }, |
| { |
| "epoch": 5.29936974789916, |
| "grad_norm": 0.8353570829541407, |
| "learning_rate": 6.780129734225949e-06, |
| "loss": 0.1155, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1095833033323288, |
| "step": 5045, |
| "valid_targets_mean": 1246.8, |
| "valid_targets_min": 684 |
| }, |
| { |
| "epoch": 5.304621848739496, |
| "grad_norm": 0.8983751034814326, |
| "learning_rate": 6.740865060167483e-06, |
| "loss": 0.1079, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1118505597114563, |
| "step": 5050, |
| "valid_targets_mean": 1392.5, |
| "valid_targets_min": 798 |
| }, |
| { |
| "epoch": 5.309873949579832, |
| "grad_norm": 0.8427967821093256, |
| "learning_rate": 6.701691353680049e-06, |
| "loss": 0.1195, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1080687940120697, |
| "step": 5055, |
| "valid_targets_mean": 1319.9, |
| "valid_targets_min": 661 |
| }, |
| { |
| "epoch": 5.315126050420168, |
| "grad_norm": 0.8079776828047187, |
| "learning_rate": 6.662608883524542e-06, |
| "loss": 0.118, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.11414103209972382, |
| "step": 5060, |
| "valid_targets_mean": 1554.4, |
| "valid_targets_min": 665 |
| }, |
| { |
| "epoch": 5.320378151260504, |
| "grad_norm": 0.9308438137878955, |
| "learning_rate": 6.6236179178359115e-06, |
| "loss": 0.1152, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.12251292169094086, |
| "step": 5065, |
| "valid_targets_mean": 1417.8, |
| "valid_targets_min": 692 |
| }, |
| { |
| "epoch": 5.32563025210084, |
| "grad_norm": 1.0492334793929392, |
| "learning_rate": 6.5847187241213e-06, |
| "loss": 0.1171, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.11902189999818802, |
| "step": 5070, |
| "valid_targets_mean": 1223.8, |
| "valid_targets_min": 632 |
| }, |
| { |
| "epoch": 5.330882352941177, |
| "grad_norm": 0.8741745375157363, |
| "learning_rate": 6.5459115692582386e-06, |
| "loss": 0.1184, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1177992969751358, |
| "step": 5075, |
| "valid_targets_mean": 1550.6, |
| "valid_targets_min": 922 |
| }, |
| { |
| "epoch": 5.336134453781512, |
| "grad_norm": 0.8231983027778437, |
| "learning_rate": 6.507196719492819e-06, |
| "loss": 0.115, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.11274613440036774, |
| "step": 5080, |
| "valid_targets_mean": 1542.2, |
| "valid_targets_min": 710 |
| }, |
| { |
| "epoch": 5.341386554621849, |
| "grad_norm": 0.838222313849615, |
| "learning_rate": 6.468574440437801e-06, |
| "loss": 0.1162, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.11383190006017685, |
| "step": 5085, |
| "valid_targets_mean": 1390.6, |
| "valid_targets_min": 750 |
| }, |
| { |
| "epoch": 5.3466386554621845, |
| "grad_norm": 0.8704926336132325, |
| "learning_rate": 6.43004499707089e-06, |
| "loss": 0.1154, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.12034046649932861, |
| "step": 5090, |
| "valid_targets_mean": 1515.5, |
| "valid_targets_min": 766 |
| }, |
| { |
| "epoch": 5.351890756302521, |
| "grad_norm": 0.7942910330002284, |
| "learning_rate": 6.3916086537328545e-06, |
| "loss": 0.1151, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.09943848103284836, |
| "step": 5095, |
| "valid_targets_mean": 1333.3, |
| "valid_targets_min": 748 |
| }, |
| { |
| "epoch": 5.357142857142857, |
| "grad_norm": 0.8272207055546795, |
| "learning_rate": 6.3532656741257145e-06, |
| "loss": 0.1196, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.11656372249126434, |
| "step": 5100, |
| "valid_targets_mean": 1395.2, |
| "valid_targets_min": 682 |
| }, |
| { |
| "epoch": 5.362394957983193, |
| "grad_norm": 0.8835103895559686, |
| "learning_rate": 6.315016321310965e-06, |
| "loss": 0.1223, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.11481855809688568, |
| "step": 5105, |
| "valid_targets_mean": 1515.6, |
| "valid_targets_min": 738 |
| }, |
| { |
| "epoch": 5.367647058823529, |
| "grad_norm": 0.8627265594469545, |
| "learning_rate": 6.276860857707727e-06, |
| "loss": 0.1153, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.11496169120073318, |
| "step": 5110, |
| "valid_targets_mean": 1312.8, |
| "valid_targets_min": 731 |
| }, |
| { |
| "epoch": 5.3728991596638656, |
| "grad_norm": 0.909694468472037, |
| "learning_rate": 6.238799545090994e-06, |
| "loss": 0.1215, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.12938551604747772, |
| "step": 5115, |
| "valid_targets_mean": 1492.9, |
| "valid_targets_min": 646 |
| }, |
| { |
| "epoch": 5.378151260504202, |
| "grad_norm": 0.8310216699675694, |
| "learning_rate": 6.20083264458981e-06, |
| "loss": 0.1099, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.10411947965621948, |
| "step": 5120, |
| "valid_targets_mean": 1369.1, |
| "valid_targets_min": 780 |
| }, |
| { |
| "epoch": 5.383403361344538, |
| "grad_norm": 0.8711155777854998, |
| "learning_rate": 6.162960416685469e-06, |
| "loss": 0.1109, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.11428333818912506, |
| "step": 5125, |
| "valid_targets_mean": 1521.9, |
| "valid_targets_min": 676 |
| }, |
| { |
| "epoch": 5.388655462184874, |
| "grad_norm": 0.870482484994608, |
| "learning_rate": 6.125183121209741e-06, |
| "loss": 0.1191, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.10633750259876251, |
| "step": 5130, |
| "valid_targets_mean": 1277.9, |
| "valid_targets_min": 687 |
| }, |
| { |
| "epoch": 5.39390756302521, |
| "grad_norm": 0.8795820034570103, |
| "learning_rate": 6.087501017343107e-06, |
| "loss": 0.1118, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.10446271300315857, |
| "step": 5135, |
| "valid_targets_mean": 1336.5, |
| "valid_targets_min": 703 |
| }, |
| { |
| "epoch": 5.399159663865547, |
| "grad_norm": 0.8575277820951928, |
| "learning_rate": 6.0499143636129384e-06, |
| "loss": 0.1105, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.10649226605892181, |
| "step": 5140, |
| "valid_targets_mean": 1288.1, |
| "valid_targets_min": 522 |
| }, |
| { |
| "epoch": 5.404411764705882, |
| "grad_norm": 0.8701860188774736, |
| "learning_rate": 6.012423417891766e-06, |
| "loss": 0.116, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.11557996273040771, |
| "step": 5145, |
| "valid_targets_mean": 1526.9, |
| "valid_targets_min": 764 |
| }, |
| { |
| "epoch": 5.409663865546219, |
| "grad_norm": 0.9973788403003421, |
| "learning_rate": 5.975028437395493e-06, |
| "loss": 0.124, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1302410513162613, |
| "step": 5150, |
| "valid_targets_mean": 1372.4, |
| "valid_targets_min": 548 |
| }, |
| { |
| "epoch": 5.4149159663865545, |
| "grad_norm": 0.8939645783701128, |
| "learning_rate": 5.937729678681612e-06, |
| "loss": 0.1082, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.11539514362812042, |
| "step": 5155, |
| "valid_targets_mean": 1356.8, |
| "valid_targets_min": 694 |
| }, |
| { |
| "epoch": 5.420168067226891, |
| "grad_norm": 0.8246273501078926, |
| "learning_rate": 5.9005273976474684e-06, |
| "loss": 0.1136, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.11548338830471039, |
| "step": 5160, |
| "valid_targets_mean": 1540.9, |
| "valid_targets_min": 823 |
| }, |
| { |
| "epoch": 5.425420168067227, |
| "grad_norm": 0.7236132877010878, |
| "learning_rate": 5.8634218495285126e-06, |
| "loss": 0.0987, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.08354189991950989, |
| "step": 5165, |
| "valid_targets_mean": 1442.4, |
| "valid_targets_min": 682 |
| }, |
| { |
| "epoch": 5.430672268907563, |
| "grad_norm": 0.8988049282372673, |
| "learning_rate": 5.8264132888965155e-06, |
| "loss": 0.1087, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.11418993771076202, |
| "step": 5170, |
| "valid_targets_mean": 1407.6, |
| "valid_targets_min": 693 |
| }, |
| { |
| "epoch": 5.435924369747899, |
| "grad_norm": 0.8655375216766177, |
| "learning_rate": 5.789501969657853e-06, |
| "loss": 0.1082, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.10003848373889923, |
| "step": 5175, |
| "valid_targets_mean": 1197.8, |
| "valid_targets_min": 639 |
| }, |
| { |
| "epoch": 5.4411764705882355, |
| "grad_norm": 0.8362323911596797, |
| "learning_rate": 5.752688145051761e-06, |
| "loss": 0.1083, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.09275621920824051, |
| "step": 5180, |
| "valid_targets_mean": 1423.3, |
| "valid_targets_min": 685 |
| }, |
| { |
| "epoch": 5.446428571428571, |
| "grad_norm": 0.8296465425650306, |
| "learning_rate": 5.715972067648561e-06, |
| "loss": 0.1078, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.10052791237831116, |
| "step": 5185, |
| "valid_targets_mean": 1331.5, |
| "valid_targets_min": 827 |
| }, |
| { |
| "epoch": 5.451680672268908, |
| "grad_norm": 0.8321903503583684, |
| "learning_rate": 5.679353989347989e-06, |
| "loss": 0.1124, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.10639987140893936, |
| "step": 5190, |
| "valid_targets_mean": 1381.7, |
| "valid_targets_min": 686 |
| }, |
| { |
| "epoch": 5.456932773109243, |
| "grad_norm": 0.8907023908538945, |
| "learning_rate": 5.642834161377408e-06, |
| "loss": 0.1107, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.11636456847190857, |
| "step": 5195, |
| "valid_targets_mean": 1472.2, |
| "valid_targets_min": 713 |
| }, |
| { |
| "epoch": 5.46218487394958, |
| "grad_norm": 1.304588509837649, |
| "learning_rate": 5.606412834290121e-06, |
| "loss": 0.1349, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2201894223690033, |
| "step": 5200, |
| "valid_targets_mean": 2248.9, |
| "valid_targets_min": 920 |
| }, |
| { |
| "epoch": 5.467436974789916, |
| "grad_norm": 1.075014973641161, |
| "learning_rate": 5.570090257963645e-06, |
| "loss": 0.2176, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2059841752052307, |
| "step": 5205, |
| "valid_targets_mean": 3664.4, |
| "valid_targets_min": 746 |
| }, |
| { |
| "epoch": 5.472689075630252, |
| "grad_norm": 0.8446914601975626, |
| "learning_rate": 5.533866681597981e-06, |
| "loss": 0.2023, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.20752739906311035, |
| "step": 5210, |
| "valid_targets_mean": 3591.1, |
| "valid_targets_min": 1635 |
| }, |
| { |
| "epoch": 5.477941176470588, |
| "grad_norm": 0.6615718547643281, |
| "learning_rate": 5.497742353713928e-06, |
| "loss": 0.1996, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1898113489151001, |
| "step": 5215, |
| "valid_targets_mean": 4172.7, |
| "valid_targets_min": 777 |
| }, |
| { |
| "epoch": 5.483193277310924, |
| "grad_norm": 0.6331051011117288, |
| "learning_rate": 5.461717522151371e-06, |
| "loss": 0.1901, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2003975212574005, |
| "step": 5220, |
| "valid_targets_mean": 4040.2, |
| "valid_targets_min": 2187 |
| }, |
| { |
| "epoch": 5.48844537815126, |
| "grad_norm": 0.6969541078527951, |
| "learning_rate": 5.4257924340675535e-06, |
| "loss": 0.1984, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18878155946731567, |
| "step": 5225, |
| "valid_targets_mean": 3156.3, |
| "valid_targets_min": 1432 |
| }, |
| { |
| "epoch": 5.493697478991597, |
| "grad_norm": 0.5916400175296245, |
| "learning_rate": 5.389967335935429e-06, |
| "loss": 0.189, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17551878094673157, |
| "step": 5230, |
| "valid_targets_mean": 3529.7, |
| "valid_targets_min": 767 |
| }, |
| { |
| "epoch": 5.498949579831933, |
| "grad_norm": 0.624324534174277, |
| "learning_rate": 5.3542424735419306e-06, |
| "loss": 0.1853, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17499442398548126, |
| "step": 5235, |
| "valid_targets_mean": 3485.6, |
| "valid_targets_min": 1488 |
| }, |
| { |
| "epoch": 5.504201680672269, |
| "grad_norm": 0.6222898231435748, |
| "learning_rate": 5.318618091986294e-06, |
| "loss": 0.1916, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17875801026821136, |
| "step": 5240, |
| "valid_targets_mean": 3707.0, |
| "valid_targets_min": 578 |
| }, |
| { |
| "epoch": 5.509453781512605, |
| "grad_norm": 0.6245877514119683, |
| "learning_rate": 5.283094435678398e-06, |
| "loss": 0.2027, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.19261011481285095, |
| "step": 5245, |
| "valid_targets_mean": 4252.4, |
| "valid_targets_min": 1241 |
| }, |
| { |
| "epoch": 5.514705882352941, |
| "grad_norm": 0.6826116098814055, |
| "learning_rate": 5.2476717483370685e-06, |
| "loss": 0.1939, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.21187934279441833, |
| "step": 5250, |
| "valid_targets_mean": 4029.2, |
| "valid_targets_min": 807 |
| }, |
| { |
| "epoch": 5.519957983193278, |
| "grad_norm": 0.5667810450047195, |
| "learning_rate": 5.212350272988394e-06, |
| "loss": 0.1907, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17751820385456085, |
| "step": 5255, |
| "valid_targets_mean": 4507.0, |
| "valid_targets_min": 2011 |
| }, |
| { |
| "epoch": 5.525210084033613, |
| "grad_norm": 0.6114125208911464, |
| "learning_rate": 5.177130251964088e-06, |
| "loss": 0.1976, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17235472798347473, |
| "step": 5260, |
| "valid_targets_mean": 4268.2, |
| "valid_targets_min": 1329 |
| }, |
| { |
| "epoch": 5.53046218487395, |
| "grad_norm": 0.6625902480426628, |
| "learning_rate": 5.1420119268998085e-06, |
| "loss": 0.1888, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18950673937797546, |
| "step": 5265, |
| "valid_targets_mean": 3858.9, |
| "valid_targets_min": 1366 |
| }, |
| { |
| "epoch": 5.535714285714286, |
| "grad_norm": 0.6651401874085916, |
| "learning_rate": 5.106995538733488e-06, |
| "loss": 0.1921, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17550374567508698, |
| "step": 5270, |
| "valid_targets_mean": 3169.1, |
| "valid_targets_min": 1334 |
| }, |
| { |
| "epoch": 5.540966386554622, |
| "grad_norm": 0.6231114187474077, |
| "learning_rate": 5.07208132770372e-06, |
| "loss": 0.1999, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18051046133041382, |
| "step": 5275, |
| "valid_targets_mean": 4130.4, |
| "valid_targets_min": 1762 |
| }, |
| { |
| "epoch": 5.546218487394958, |
| "grad_norm": 0.6708862310223077, |
| "learning_rate": 5.037269533348075e-06, |
| "loss": 0.1924, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.19089899957180023, |
| "step": 5280, |
| "valid_targets_mean": 3285.0, |
| "valid_targets_min": 855 |
| }, |
| { |
| "epoch": 5.551470588235294, |
| "grad_norm": 0.7236660627737345, |
| "learning_rate": 5.002560394501463e-06, |
| "loss": 0.1988, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2103574275970459, |
| "step": 5285, |
| "valid_targets_mean": 3298.2, |
| "valid_targets_min": 1269 |
| }, |
| { |
| "epoch": 5.55672268907563, |
| "grad_norm": 0.7530081580597202, |
| "learning_rate": 4.9679541492945135e-06, |
| "loss": 0.1988, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1874314844608307, |
| "step": 5290, |
| "valid_targets_mean": 2740.4, |
| "valid_targets_min": 1041 |
| }, |
| { |
| "epoch": 5.561974789915967, |
| "grad_norm": 0.7386136479775732, |
| "learning_rate": 4.933451035151913e-06, |
| "loss": 0.196, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.19821321964263916, |
| "step": 5295, |
| "valid_targets_mean": 2995.1, |
| "valid_targets_min": 1291 |
| }, |
| { |
| "epoch": 5.567226890756302, |
| "grad_norm": 0.72395057035861, |
| "learning_rate": 4.899051288790806e-06, |
| "loss": 0.185, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18655264377593994, |
| "step": 5300, |
| "valid_targets_mean": 2811.6, |
| "valid_targets_min": 1133 |
| }, |
| { |
| "epoch": 5.572478991596639, |
| "grad_norm": 0.7470437002909036, |
| "learning_rate": 4.86475514621916e-06, |
| "loss": 0.1945, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.19498442113399506, |
| "step": 5305, |
| "valid_targets_mean": 3709.5, |
| "valid_targets_min": 865 |
| }, |
| { |
| "epoch": 5.5777310924369745, |
| "grad_norm": 0.7302797839356747, |
| "learning_rate": 4.830562842734112e-06, |
| "loss": 0.1868, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18496988713741302, |
| "step": 5310, |
| "valid_targets_mean": 2960.6, |
| "valid_targets_min": 958 |
| }, |
| { |
| "epoch": 5.582983193277311, |
| "grad_norm": 0.7028513017526096, |
| "learning_rate": 4.796474612920421e-06, |
| "loss": 0.1973, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.19564983248710632, |
| "step": 5315, |
| "valid_targets_mean": 3189.2, |
| "valid_targets_min": 771 |
| }, |
| { |
| "epoch": 5.588235294117647, |
| "grad_norm": 0.6143075180595077, |
| "learning_rate": 4.762490690648813e-06, |
| "loss": 0.1941, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1765946000814438, |
| "step": 5320, |
| "valid_targets_mean": 3823.1, |
| "valid_targets_min": 1631 |
| }, |
| { |
| "epoch": 5.593487394957983, |
| "grad_norm": 0.7331719157365119, |
| "learning_rate": 4.728611309074374e-06, |
| "loss": 0.1882, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15561848878860474, |
| "step": 5325, |
| "valid_targets_mean": 2639.4, |
| "valid_targets_min": 908 |
| }, |
| { |
| "epoch": 5.598739495798319, |
| "grad_norm": 0.799889226199126, |
| "learning_rate": 4.694836700634975e-06, |
| "loss": 0.1892, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.20055752992630005, |
| "step": 5330, |
| "valid_targets_mean": 2988.3, |
| "valid_targets_min": 1264 |
| }, |
| { |
| "epoch": 5.6039915966386555, |
| "grad_norm": 0.7723682554917705, |
| "learning_rate": 4.661167097049668e-06, |
| "loss": 0.1886, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.19730721414089203, |
| "step": 5335, |
| "valid_targets_mean": 3563.1, |
| "valid_targets_min": 1889 |
| }, |
| { |
| "epoch": 5.609243697478991, |
| "grad_norm": 0.6899888581366523, |
| "learning_rate": 4.62760272931708e-06, |
| "loss": 0.1879, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17451027035713196, |
| "step": 5340, |
| "valid_targets_mean": 3737.9, |
| "valid_targets_min": 1075 |
| }, |
| { |
| "epoch": 5.614495798319328, |
| "grad_norm": 0.7422252794353547, |
| "learning_rate": 4.594143827713844e-06, |
| "loss": 0.1962, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17348533868789673, |
| "step": 5345, |
| "valid_targets_mean": 2745.8, |
| "valid_targets_min": 1036 |
| }, |
| { |
| "epoch": 5.619747899159664, |
| "grad_norm": 0.7524666990737761, |
| "learning_rate": 4.56079062179303e-06, |
| "loss": 0.1939, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1979708969593048, |
| "step": 5350, |
| "valid_targets_mean": 3516.4, |
| "valid_targets_min": 1162 |
| }, |
| { |
| "epoch": 5.625, |
| "grad_norm": 0.6922592034045233, |
| "learning_rate": 4.527543340382538e-06, |
| "loss": 0.1828, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17850226163864136, |
| "step": 5355, |
| "valid_targets_mean": 3279.4, |
| "valid_targets_min": 1281 |
| }, |
| { |
| "epoch": 5.630252100840336, |
| "grad_norm": 0.6631764263997426, |
| "learning_rate": 4.494402211583569e-06, |
| "loss": 0.1855, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16947326064109802, |
| "step": 5360, |
| "valid_targets_mean": 3180.4, |
| "valid_targets_min": 1816 |
| }, |
| { |
| "epoch": 5.635504201680672, |
| "grad_norm": 0.7291414927160216, |
| "learning_rate": 4.461367462769009e-06, |
| "loss": 0.1959, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18259739875793457, |
| "step": 5365, |
| "valid_targets_mean": 2939.2, |
| "valid_targets_min": 1629 |
| }, |
| { |
| "epoch": 5.640756302521009, |
| "grad_norm": 0.7503072179394285, |
| "learning_rate": 4.428439320581923e-06, |
| "loss": 0.1934, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1907494068145752, |
| "step": 5370, |
| "valid_targets_mean": 2755.7, |
| "valid_targets_min": 1254 |
| }, |
| { |
| "epoch": 5.6460084033613445, |
| "grad_norm": 0.7463064226667883, |
| "learning_rate": 4.3956180109339705e-06, |
| "loss": 0.1917, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.19494910538196564, |
| "step": 5375, |
| "valid_targets_mean": 3390.2, |
| "valid_targets_min": 1973 |
| }, |
| { |
| "epoch": 5.651260504201681, |
| "grad_norm": 0.7574766718662052, |
| "learning_rate": 4.362903759003849e-06, |
| "loss": 0.1872, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.175164133310318, |
| "step": 5380, |
| "valid_targets_mean": 2960.4, |
| "valid_targets_min": 1195 |
| }, |
| { |
| "epoch": 5.656512605042017, |
| "grad_norm": 0.7408855986734103, |
| "learning_rate": 4.33029678923576e-06, |
| "loss": 0.1828, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.19168353080749512, |
| "step": 5385, |
| "valid_targets_mean": 3181.4, |
| "valid_targets_min": 1244 |
| }, |
| { |
| "epoch": 5.661764705882353, |
| "grad_norm": 0.7242394613336414, |
| "learning_rate": 4.297797325337889e-06, |
| "loss": 0.1921, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1881379634141922, |
| "step": 5390, |
| "valid_targets_mean": 3464.2, |
| "valid_targets_min": 1421 |
| }, |
| { |
| "epoch": 5.667016806722689, |
| "grad_norm": 0.729199912715331, |
| "learning_rate": 4.265405590280822e-06, |
| "loss": 0.1867, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18175436556339264, |
| "step": 5395, |
| "valid_targets_mean": 3443.1, |
| "valid_targets_min": 1097 |
| }, |
| { |
| "epoch": 5.6722689075630255, |
| "grad_norm": 0.7780886091437504, |
| "learning_rate": 4.233121806296072e-06, |
| "loss": 0.1876, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.20643776655197144, |
| "step": 5400, |
| "valid_targets_mean": 3891.4, |
| "valid_targets_min": 1168 |
| }, |
| { |
| "epoch": 5.677521008403361, |
| "grad_norm": 2.0082601362553083, |
| "learning_rate": 4.200946194874514e-06, |
| "loss": 0.1895, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.19502270221710205, |
| "step": 5405, |
| "valid_targets_mean": 3368.9, |
| "valid_targets_min": 1700 |
| }, |
| { |
| "epoch": 5.682773109243698, |
| "grad_norm": 0.7542156394780143, |
| "learning_rate": 4.168878976764872e-06, |
| "loss": 0.1868, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17632341384887695, |
| "step": 5410, |
| "valid_targets_mean": 2497.1, |
| "valid_targets_min": 1261 |
| }, |
| { |
| "epoch": 5.688025210084033, |
| "grad_norm": 0.7204058422362926, |
| "learning_rate": 4.136920371972228e-06, |
| "loss": 0.1984, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1968623399734497, |
| "step": 5415, |
| "valid_targets_mean": 3391.2, |
| "valid_targets_min": 1124 |
| }, |
| { |
| "epoch": 5.69327731092437, |
| "grad_norm": 0.7514367050409141, |
| "learning_rate": 4.105070599756482e-06, |
| "loss": 0.1906, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1881876438856125, |
| "step": 5420, |
| "valid_targets_mean": 3003.8, |
| "valid_targets_min": 1361 |
| }, |
| { |
| "epoch": 5.698529411764706, |
| "grad_norm": 0.671835209360093, |
| "learning_rate": 4.073329878630856e-06, |
| "loss": 0.1829, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16645438969135284, |
| "step": 5425, |
| "valid_targets_mean": 3239.7, |
| "valid_targets_min": 1679 |
| }, |
| { |
| "epoch": 5.703781512605042, |
| "grad_norm": 0.7151451061634367, |
| "learning_rate": 4.041698426360425e-06, |
| "loss": 0.1883, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.190008282661438, |
| "step": 5430, |
| "valid_targets_mean": 3101.2, |
| "valid_targets_min": 1739 |
| }, |
| { |
| "epoch": 5.709033613445378, |
| "grad_norm": 0.8510471746451064, |
| "learning_rate": 4.010176459960569e-06, |
| "loss": 0.182, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.172542542219162, |
| "step": 5435, |
| "valid_targets_mean": 2844.4, |
| "valid_targets_min": 1278 |
| }, |
| { |
| "epoch": 5.714285714285714, |
| "grad_norm": 0.6595419486913193, |
| "learning_rate": 3.978764195695528e-06, |
| "loss": 0.186, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1725081354379654, |
| "step": 5440, |
| "valid_targets_mean": 3563.4, |
| "valid_targets_min": 1522 |
| }, |
| { |
| "epoch": 5.71953781512605, |
| "grad_norm": 0.7513983043013762, |
| "learning_rate": 3.947461849076912e-06, |
| "loss": 0.173, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1882949024438858, |
| "step": 5445, |
| "valid_targets_mean": 3589.0, |
| "valid_targets_min": 464 |
| }, |
| { |
| "epoch": 5.724789915966387, |
| "grad_norm": 0.6781411607065908, |
| "learning_rate": 3.916269634862193e-06, |
| "loss": 0.2004, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1876165270805359, |
| "step": 5450, |
| "valid_targets_mean": 3827.1, |
| "valid_targets_min": 1003 |
| }, |
| { |
| "epoch": 5.730042016806722, |
| "grad_norm": 0.7521498102078784, |
| "learning_rate": 3.885187767053269e-06, |
| "loss": 0.1826, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18409094214439392, |
| "step": 5455, |
| "valid_targets_mean": 3042.1, |
| "valid_targets_min": 1446 |
| }, |
| { |
| "epoch": 5.735294117647059, |
| "grad_norm": 0.6989125002761396, |
| "learning_rate": 3.854216458894973e-06, |
| "loss": 0.1915, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18674632906913757, |
| "step": 5460, |
| "valid_targets_mean": 3257.8, |
| "valid_targets_min": 1256 |
| }, |
| { |
| "epoch": 5.740546218487395, |
| "grad_norm": 0.7363983943406658, |
| "learning_rate": 3.823355922873606e-06, |
| "loss": 0.1939, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.20742374658584595, |
| "step": 5465, |
| "valid_targets_mean": 3858.5, |
| "valid_targets_min": 1336 |
| }, |
| { |
| "epoch": 5.745798319327731, |
| "grad_norm": 0.6688145340655683, |
| "learning_rate": 3.792606370715508e-06, |
| "loss": 0.1979, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18492421507835388, |
| "step": 5470, |
| "valid_targets_mean": 3821.1, |
| "valid_targets_min": 1275 |
| }, |
| { |
| "epoch": 5.751050420168067, |
| "grad_norm": 0.7198758184286466, |
| "learning_rate": 3.761968013385584e-06, |
| "loss": 0.1845, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1842348277568817, |
| "step": 5475, |
| "valid_targets_mean": 2914.6, |
| "valid_targets_min": 644 |
| }, |
| { |
| "epoch": 5.756302521008403, |
| "grad_norm": 0.71314811892582, |
| "learning_rate": 3.731441061085843e-06, |
| "loss": 0.1799, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17556104063987732, |
| "step": 5480, |
| "valid_targets_mean": 3083.4, |
| "valid_targets_min": 1397 |
| }, |
| { |
| "epoch": 5.76155462184874, |
| "grad_norm": 0.7631003279463335, |
| "learning_rate": 3.701025723253988e-06, |
| "loss": 0.1777, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17353874444961548, |
| "step": 5485, |
| "valid_targets_mean": 2747.4, |
| "valid_targets_min": 1557 |
| }, |
| { |
| "epoch": 5.766806722689076, |
| "grad_norm": 0.7552536091187607, |
| "learning_rate": 3.67072220856197e-06, |
| "loss": 0.18, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18228024244308472, |
| "step": 5490, |
| "valid_targets_mean": 3405.2, |
| "valid_targets_min": 1405 |
| }, |
| { |
| "epoch": 5.772058823529412, |
| "grad_norm": 0.7052066859512669, |
| "learning_rate": 3.640530724914517e-06, |
| "loss": 0.1817, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17114409804344177, |
| "step": 5495, |
| "valid_targets_mean": 3507.1, |
| "valid_targets_min": 1042 |
| }, |
| { |
| "epoch": 5.777310924369748, |
| "grad_norm": 0.7275066681746295, |
| "learning_rate": 3.61045147944777e-06, |
| "loss": 0.1661, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1737072765827179, |
| "step": 5500, |
| "valid_targets_mean": 3079.7, |
| "valid_targets_min": 858 |
| }, |
| { |
| "epoch": 5.782563025210084, |
| "grad_norm": 0.738557032225339, |
| "learning_rate": 3.5804846785278315e-06, |
| "loss": 0.1806, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17162227630615234, |
| "step": 5505, |
| "valid_targets_mean": 2934.3, |
| "valid_targets_min": 1288 |
| }, |
| { |
| "epoch": 5.78781512605042, |
| "grad_norm": 0.6881422147874104, |
| "learning_rate": 3.5506305277493326e-06, |
| "loss": 0.196, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17860713601112366, |
| "step": 5510, |
| "valid_targets_mean": 3428.2, |
| "valid_targets_min": 1915 |
| }, |
| { |
| "epoch": 5.793067226890757, |
| "grad_norm": 0.8082399213846237, |
| "learning_rate": 3.520889231934057e-06, |
| "loss": 0.1887, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2075139284133911, |
| "step": 5515, |
| "valid_targets_mean": 3764.9, |
| "valid_targets_min": 1244 |
| }, |
| { |
| "epoch": 5.798319327731092, |
| "grad_norm": 0.7470662206853251, |
| "learning_rate": 3.4912609951295084e-06, |
| "loss": 0.182, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18600235879421234, |
| "step": 5520, |
| "valid_targets_mean": 3006.5, |
| "valid_targets_min": 1255 |
| }, |
| { |
| "epoch": 5.803571428571429, |
| "grad_norm": 0.7396369320045814, |
| "learning_rate": 3.461746020607526e-06, |
| "loss": 0.1877, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.21041221916675568, |
| "step": 5525, |
| "valid_targets_mean": 3326.2, |
| "valid_targets_min": 1586 |
| }, |
| { |
| "epoch": 5.8088235294117645, |
| "grad_norm": 0.6985035686259948, |
| "learning_rate": 3.432344510862895e-06, |
| "loss": 0.1888, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16554896533489227, |
| "step": 5530, |
| "valid_targets_mean": 3205.2, |
| "valid_targets_min": 1181 |
| }, |
| { |
| "epoch": 5.814075630252101, |
| "grad_norm": 0.7863118868734756, |
| "learning_rate": 3.403056667611917e-06, |
| "loss": 0.1779, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17784982919692993, |
| "step": 5535, |
| "valid_targets_mean": 2735.1, |
| "valid_targets_min": 974 |
| }, |
| { |
| "epoch": 5.819327731092437, |
| "grad_norm": 0.740543140779203, |
| "learning_rate": 3.373882691791088e-06, |
| "loss": 0.1821, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.19035407900810242, |
| "step": 5540, |
| "valid_targets_mean": 3735.8, |
| "valid_targets_min": 1681 |
| }, |
| { |
| "epoch": 5.824579831932773, |
| "grad_norm": 0.774595013152137, |
| "learning_rate": 3.344822783555679e-06, |
| "loss": 0.1887, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.20152834057807922, |
| "step": 5545, |
| "valid_targets_mean": 2883.7, |
| "valid_targets_min": 1171 |
| }, |
| { |
| "epoch": 5.829831932773109, |
| "grad_norm": 0.807774445390228, |
| "learning_rate": 3.315877142278363e-06, |
| "loss": 0.2023, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.21530133485794067, |
| "step": 5550, |
| "valid_targets_mean": 3324.1, |
| "valid_targets_min": 1455 |
| }, |
| { |
| "epoch": 5.8350840336134455, |
| "grad_norm": 0.6932108713568098, |
| "learning_rate": 3.287045966547866e-06, |
| "loss": 0.1866, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.19992104172706604, |
| "step": 5555, |
| "valid_targets_mean": 3948.6, |
| "valid_targets_min": 1529 |
| }, |
| { |
| "epoch": 5.840336134453781, |
| "grad_norm": 0.7588685281732017, |
| "learning_rate": 3.258329454167599e-06, |
| "loss": 0.1956, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.20404741168022156, |
| "step": 5560, |
| "valid_targets_mean": 3419.9, |
| "valid_targets_min": 1450 |
| }, |
| { |
| "epoch": 5.845588235294118, |
| "grad_norm": 0.6654008948279083, |
| "learning_rate": 3.2297278021542833e-06, |
| "loss": 0.1813, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1653444766998291, |
| "step": 5565, |
| "valid_targets_mean": 3465.6, |
| "valid_targets_min": 1431 |
| }, |
| { |
| "epoch": 5.850840336134453, |
| "grad_norm": 0.7617245678374055, |
| "learning_rate": 3.201241206736614e-06, |
| "loss": 0.2007, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.19317778944969177, |
| "step": 5570, |
| "valid_targets_mean": 3085.4, |
| "valid_targets_min": 802 |
| }, |
| { |
| "epoch": 5.85609243697479, |
| "grad_norm": 0.7601710209752651, |
| "learning_rate": 3.1728698633539266e-06, |
| "loss": 0.1979, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1923319697380066, |
| "step": 5575, |
| "valid_targets_mean": 3230.6, |
| "valid_targets_min": 1433 |
| }, |
| { |
| "epoch": 5.8613445378151265, |
| "grad_norm": 0.8026621042498756, |
| "learning_rate": 3.1446139666548212e-06, |
| "loss": 0.1941, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.19206663966178894, |
| "step": 5580, |
| "valid_targets_mean": 2908.7, |
| "valid_targets_min": 614 |
| }, |
| { |
| "epoch": 5.866596638655462, |
| "grad_norm": 0.8143821059911558, |
| "learning_rate": 3.1164737104958707e-06, |
| "loss": 0.1916, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2039254605770111, |
| "step": 5585, |
| "valid_targets_mean": 2748.8, |
| "valid_targets_min": 637 |
| }, |
| { |
| "epoch": 5.871848739495798, |
| "grad_norm": 0.7917201537427566, |
| "learning_rate": 3.0884492879402452e-06, |
| "loss": 0.1983, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2050473690032959, |
| "step": 5590, |
| "valid_targets_mean": 3297.7, |
| "valid_targets_min": 1683 |
| }, |
| { |
| "epoch": 5.8771008403361344, |
| "grad_norm": 0.7656092656857109, |
| "learning_rate": 3.0605408912564184e-06, |
| "loss": 0.1932, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18506518006324768, |
| "step": 5595, |
| "valid_targets_mean": 3406.1, |
| "valid_targets_min": 1913 |
| }, |
| { |
| "epoch": 5.882352941176471, |
| "grad_norm": 0.7130368872222834, |
| "learning_rate": 3.032748711916851e-06, |
| "loss": 0.1839, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18892902135849, |
| "step": 5600, |
| "valid_targets_mean": 3848.1, |
| "valid_targets_min": 1659 |
| }, |
| { |
| "epoch": 5.887605042016807, |
| "grad_norm": 0.7127010208647905, |
| "learning_rate": 3.0050729405966495e-06, |
| "loss": 0.1939, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17573906481266022, |
| "step": 5605, |
| "valid_targets_mean": 3390.7, |
| "valid_targets_min": 1390 |
| }, |
| { |
| "epoch": 5.892857142857143, |
| "grad_norm": 0.7730291184647539, |
| "learning_rate": 2.9775137671722754e-06, |
| "loss": 0.1964, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2364846169948578, |
| "step": 5610, |
| "valid_targets_mean": 3338.5, |
| "valid_targets_min": 611 |
| }, |
| { |
| "epoch": 5.898109243697479, |
| "grad_norm": 0.7437425304974528, |
| "learning_rate": 2.9500713807202565e-06, |
| "loss": 0.1964, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1972287893295288, |
| "step": 5615, |
| "valid_targets_mean": 3389.6, |
| "valid_targets_min": 1451 |
| }, |
| { |
| "epoch": 5.9033613445378155, |
| "grad_norm": 0.7338868027074469, |
| "learning_rate": 2.9227459695158543e-06, |
| "loss": 0.191, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.165279358625412, |
| "step": 5620, |
| "valid_targets_mean": 3097.9, |
| "valid_targets_min": 1459 |
| }, |
| { |
| "epoch": 5.908613445378151, |
| "grad_norm": 0.8398618395284945, |
| "learning_rate": 2.895537721031809e-06, |
| "loss": 0.1865, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.20163550972938538, |
| "step": 5625, |
| "valid_targets_mean": 2619.4, |
| "valid_targets_min": 999 |
| }, |
| { |
| "epoch": 5.913865546218488, |
| "grad_norm": 0.6872190021050335, |
| "learning_rate": 2.8684468219370364e-06, |
| "loss": 0.1856, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17330724000930786, |
| "step": 5630, |
| "valid_targets_mean": 3791.2, |
| "valid_targets_min": 1564 |
| }, |
| { |
| "epoch": 5.919117647058823, |
| "grad_norm": 0.7915970239951657, |
| "learning_rate": 2.841473458095334e-06, |
| "loss": 0.1937, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.19606292247772217, |
| "step": 5635, |
| "valid_targets_mean": 3223.3, |
| "valid_targets_min": 1233 |
| }, |
| { |
| "epoch": 5.92436974789916, |
| "grad_norm": 0.7371089384298193, |
| "learning_rate": 2.8146178145641355e-06, |
| "loss": 0.178, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18127654492855072, |
| "step": 5640, |
| "valid_targets_mean": 3439.2, |
| "valid_targets_min": 1524 |
| }, |
| { |
| "epoch": 5.929621848739496, |
| "grad_norm": 0.7111215478308646, |
| "learning_rate": 2.787880075593217e-06, |
| "loss": 0.185, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18391185998916626, |
| "step": 5645, |
| "valid_targets_mean": 3744.9, |
| "valid_targets_min": 1375 |
| }, |
| { |
| "epoch": 5.934873949579832, |
| "grad_norm": 0.7280994223942271, |
| "learning_rate": 2.7612604246234355e-06, |
| "loss": 0.1925, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17705269157886505, |
| "step": 5650, |
| "valid_targets_mean": 3036.2, |
| "valid_targets_min": 906 |
| }, |
| { |
| "epoch": 5.940126050420168, |
| "grad_norm": 0.6242246207880907, |
| "learning_rate": 2.7347590442854867e-06, |
| "loss": 0.1785, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1647983193397522, |
| "step": 5655, |
| "valid_targets_mean": 3766.5, |
| "valid_targets_min": 1246 |
| }, |
| { |
| "epoch": 5.945378151260504, |
| "grad_norm": 0.7653759814637277, |
| "learning_rate": 2.7083761163986433e-06, |
| "loss": 0.1785, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.20250293612480164, |
| "step": 5660, |
| "valid_targets_mean": 3225.9, |
| "valid_targets_min": 1333 |
| }, |
| { |
| "epoch": 5.95063025210084, |
| "grad_norm": 0.7475006568229906, |
| "learning_rate": 2.682111821969493e-06, |
| "loss": 0.1819, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.19375839829444885, |
| "step": 5665, |
| "valid_targets_mean": 3751.3, |
| "valid_targets_min": 2264 |
| }, |
| { |
| "epoch": 5.955882352941177, |
| "grad_norm": 0.737881904148586, |
| "learning_rate": 2.6559663411907233e-06, |
| "loss": 0.2019, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1940421611070633, |
| "step": 5670, |
| "valid_targets_mean": 3505.2, |
| "valid_targets_min": 1454 |
| }, |
| { |
| "epoch": 5.961134453781512, |
| "grad_norm": 0.7664181534172059, |
| "learning_rate": 2.629939853439856e-06, |
| "loss": 0.1892, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18167239427566528, |
| "step": 5675, |
| "valid_targets_mean": 3385.7, |
| "valid_targets_min": 1430 |
| }, |
| { |
| "epoch": 5.966386554621849, |
| "grad_norm": 0.7497306698153924, |
| "learning_rate": 2.604032537278052e-06, |
| "loss": 0.1847, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1727236807346344, |
| "step": 5680, |
| "valid_targets_mean": 3201.6, |
| "valid_targets_min": 1433 |
| }, |
| { |
| "epoch": 5.9716386554621845, |
| "grad_norm": 0.7405178705998576, |
| "learning_rate": 2.5782445704488447e-06, |
| "loss": 0.1818, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1837659776210785, |
| "step": 5685, |
| "valid_targets_mean": 3362.1, |
| "valid_targets_min": 1512 |
| }, |
| { |
| "epoch": 5.976890756302521, |
| "grad_norm": 0.697865915003433, |
| "learning_rate": 2.5525761298769515e-06, |
| "loss": 0.188, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18182769417762756, |
| "step": 5690, |
| "valid_targets_mean": 3643.9, |
| "valid_targets_min": 2048 |
| }, |
| { |
| "epoch": 5.982142857142857, |
| "grad_norm": 0.7426309465732394, |
| "learning_rate": 2.527027391667054e-06, |
| "loss": 0.1945, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1931290328502655, |
| "step": 5695, |
| "valid_targets_mean": 3107.1, |
| "valid_targets_min": 815 |
| }, |
| { |
| "epoch": 5.987394957983193, |
| "grad_norm": 0.7413852866874329, |
| "learning_rate": 2.501598531102587e-06, |
| "loss": 0.1963, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.20602191984653473, |
| "step": 5700, |
| "valid_targets_mean": 3339.4, |
| "valid_targets_min": 1878 |
| }, |
| { |
| "epoch": 5.992647058823529, |
| "grad_norm": 0.8082149132119589, |
| "learning_rate": 2.47628972264452e-06, |
| "loss": 0.1972, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.21446332335472107, |
| "step": 5705, |
| "valid_targets_mean": 3394.6, |
| "valid_targets_min": 1727 |
| }, |
| { |
| "epoch": 5.9978991596638656, |
| "grad_norm": 0.673717887910672, |
| "learning_rate": 2.4511011399301944e-06, |
| "loss": 0.1884, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1594567894935608, |
| "step": 5710, |
| "valid_targets_mean": 2924.3, |
| "valid_targets_min": 1622 |
| }, |
| { |
| "epoch": 6.003151260504202, |
| "grad_norm": 0.888726685758785, |
| "learning_rate": 2.4260329557721107e-06, |
| "loss": 0.1686, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1586988866329193, |
| "step": 5715, |
| "valid_targets_mean": 1587.9, |
| "valid_targets_min": 788 |
| }, |
| { |
| "epoch": 6.008403361344538, |
| "grad_norm": 0.7892723724374661, |
| "learning_rate": 2.4010853421567237e-06, |
| "loss": 0.131, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.12804922461509705, |
| "step": 5720, |
| "valid_targets_mean": 1591.2, |
| "valid_targets_min": 957 |
| }, |
| { |
| "epoch": 6.013655462184874, |
| "grad_norm": 0.7624099131843867, |
| "learning_rate": 2.376258470243309e-06, |
| "loss": 0.1218, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.11783352494239807, |
| "step": 5725, |
| "valid_targets_mean": 1418.7, |
| "valid_targets_min": 796 |
| }, |
| { |
| "epoch": 6.01890756302521, |
| "grad_norm": 0.7792462436940873, |
| "learning_rate": 2.351552510362758e-06, |
| "loss": 0.1228, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.11473619192838669, |
| "step": 5730, |
| "valid_targets_mean": 1389.0, |
| "valid_targets_min": 704 |
| }, |
| { |
| "epoch": 6.024159663865547, |
| "grad_norm": 0.8703079476348818, |
| "learning_rate": 2.326967632016406e-06, |
| "loss": 0.1226, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.11579575389623642, |
| "step": 5735, |
| "valid_targets_mean": 1513.9, |
| "valid_targets_min": 638 |
| }, |
| { |
| "epoch": 6.029411764705882, |
| "grad_norm": 0.8915876673258326, |
| "learning_rate": 2.302504003874888e-06, |
| "loss": 0.1241, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.12122771143913269, |
| "step": 5740, |
| "valid_targets_mean": 1482.3, |
| "valid_targets_min": 727 |
| }, |
| { |
| "epoch": 6.034663865546219, |
| "grad_norm": 0.8177570400824066, |
| "learning_rate": 2.2781617937769675e-06, |
| "loss": 0.1256, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.10171643644571304, |
| "step": 5745, |
| "valid_targets_mean": 1189.1, |
| "valid_targets_min": 655 |
| }, |
| { |
| "epoch": 6.0399159663865545, |
| "grad_norm": 1.025573849186844, |
| "learning_rate": 2.2539411687283907e-06, |
| "loss": 0.1108, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1116051971912384, |
| "step": 5750, |
| "valid_targets_mean": 1299.6, |
| "valid_targets_min": 714 |
| }, |
| { |
| "epoch": 6.045168067226891, |
| "grad_norm": 0.873608647534603, |
| "learning_rate": 2.229842294900744e-06, |
| "loss": 0.1314, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1157689318060875, |
| "step": 5755, |
| "valid_targets_mean": 1407.6, |
| "valid_targets_min": 741 |
| }, |
| { |
| "epoch": 6.050420168067227, |
| "grad_norm": 0.9798749449474746, |
| "learning_rate": 2.205865337630302e-06, |
| "loss": 0.1219, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.13768497109413147, |
| "step": 5760, |
| "valid_targets_mean": 1544.1, |
| "valid_targets_min": 663 |
| }, |
| { |
| "epoch": 6.055672268907563, |
| "grad_norm": 0.916099508349051, |
| "learning_rate": 2.182010461416899e-06, |
| "loss": 0.115, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.11846692860126495, |
| "step": 5765, |
| "valid_targets_mean": 1511.1, |
| "valid_targets_min": 632 |
| }, |
| { |
| "epoch": 6.060924369747899, |
| "grad_norm": 0.8853677750337303, |
| "learning_rate": 2.158277829922817e-06, |
| "loss": 0.1186, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.12952449917793274, |
| "step": 5770, |
| "valid_targets_mean": 1638.0, |
| "valid_targets_min": 933 |
| }, |
| { |
| "epoch": 6.0661764705882355, |
| "grad_norm": 0.7694796846656141, |
| "learning_rate": 2.1346676059716253e-06, |
| "loss": 0.1188, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.11292778700590134, |
| "step": 5775, |
| "valid_targets_mean": 1526.9, |
| "valid_targets_min": 717 |
| }, |
| { |
| "epoch": 6.071428571428571, |
| "grad_norm": 0.8108257454301182, |
| "learning_rate": 2.1111799515471066e-06, |
| "loss": 0.1079, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1118139773607254, |
| "step": 5780, |
| "valid_targets_mean": 1387.4, |
| "valid_targets_min": 659 |
| }, |
| { |
| "epoch": 6.076680672268908, |
| "grad_norm": 0.816088021557387, |
| "learning_rate": 2.0878150277921195e-06, |
| "loss": 0.1076, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1065862700343132, |
| "step": 5785, |
| "valid_targets_mean": 1382.9, |
| "valid_targets_min": 642 |
| }, |
| { |
| "epoch": 6.081932773109243, |
| "grad_norm": 0.8469714058115316, |
| "learning_rate": 2.064572995007492e-06, |
| "loss": 0.1093, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.09756132960319519, |
| "step": 5790, |
| "valid_targets_mean": 1312.1, |
| "valid_targets_min": 765 |
| }, |
| { |
| "epoch": 6.08718487394958, |
| "grad_norm": 0.9292126584824716, |
| "learning_rate": 2.0414540126509274e-06, |
| "loss": 0.1195, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.11742901057004929, |
| "step": 5795, |
| "valid_targets_mean": 1397.6, |
| "valid_targets_min": 631 |
| }, |
| { |
| "epoch": 6.092436974789916, |
| "grad_norm": 0.9989157343383366, |
| "learning_rate": 2.0184582393359253e-06, |
| "loss": 0.1177, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.12957970798015594, |
| "step": 5800, |
| "valid_targets_mean": 1419.4, |
| "valid_targets_min": 623 |
| }, |
| { |
| "epoch": 6.097689075630252, |
| "grad_norm": 0.8687109853494948, |
| "learning_rate": 1.99558583283066e-06, |
| "loss": 0.118, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.12820440530776978, |
| "step": 5805, |
| "valid_targets_mean": 1647.7, |
| "valid_targets_min": 818 |
| }, |
| { |
| "epoch": 6.102941176470588, |
| "grad_norm": 0.8429889291483497, |
| "learning_rate": 1.9728369500569333e-06, |
| "loss": 0.1183, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.11039917171001434, |
| "step": 5810, |
| "valid_targets_mean": 1545.5, |
| "valid_targets_min": 776 |
| }, |
| { |
| "epoch": 6.108193277310924, |
| "grad_norm": 0.9401593816021946, |
| "learning_rate": 1.950211747089077e-06, |
| "loss": 0.1152, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.11282265186309814, |
| "step": 5815, |
| "valid_targets_mean": 1411.8, |
| "valid_targets_min": 623 |
| }, |
| { |
| "epoch": 6.11344537815126, |
| "grad_norm": 0.8579915255635823, |
| "learning_rate": 1.927710379152881e-06, |
| "loss": 0.1104, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.11633343994617462, |
| "step": 5820, |
| "valid_targets_mean": 1437.3, |
| "valid_targets_min": 742 |
| }, |
| { |
| "epoch": 6.118697478991597, |
| "grad_norm": 0.8470196779150363, |
| "learning_rate": 1.9053330006245452e-06, |
| "loss": 0.1086, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.0939580649137497, |
| "step": 5825, |
| "valid_targets_mean": 1193.6, |
| "valid_targets_min": 611 |
| }, |
| { |
| "epoch": 6.123949579831933, |
| "grad_norm": 0.8951203579512895, |
| "learning_rate": 1.8830797650296006e-06, |
| "loss": 0.1087, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.11357836425304413, |
| "step": 5830, |
| "valid_targets_mean": 1514.0, |
| "valid_targets_min": 793 |
| }, |
| { |
| "epoch": 6.129201680672269, |
| "grad_norm": 0.8204950266453027, |
| "learning_rate": 1.8609508250418628e-06, |
| "loss": 0.1089, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.10361876338720322, |
| "step": 5835, |
| "valid_targets_mean": 1379.1, |
| "valid_targets_min": 886 |
| }, |
| { |
| "epoch": 6.1344537815126055, |
| "grad_norm": 0.827334438729143, |
| "learning_rate": 1.8389463324823986e-06, |
| "loss": 0.1121, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.10381718724966049, |
| "step": 5840, |
| "valid_targets_mean": 1455.5, |
| "valid_targets_min": 991 |
| }, |
| { |
| "epoch": 6.139705882352941, |
| "grad_norm": 1.0670876809595125, |
| "learning_rate": 1.81706643831846e-06, |
| "loss": 0.113, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.11400048434734344, |
| "step": 5845, |
| "valid_targets_mean": 1525.2, |
| "valid_targets_min": 908 |
| }, |
| { |
| "epoch": 6.144957983193278, |
| "grad_norm": 0.9783834172435171, |
| "learning_rate": 1.7953112926624715e-06, |
| "loss": 0.119, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.11489921063184738, |
| "step": 5850, |
| "valid_targets_mean": 1476.6, |
| "valid_targets_min": 680 |
| }, |
| { |
| "epoch": 6.150210084033613, |
| "grad_norm": 0.8766319864539988, |
| "learning_rate": 1.7736810447709852e-06, |
| "loss": 0.1092, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.11097388714551926, |
| "step": 5855, |
| "valid_targets_mean": 1467.1, |
| "valid_targets_min": 803 |
| }, |
| { |
| "epoch": 6.15546218487395, |
| "grad_norm": 0.8785524728820334, |
| "learning_rate": 1.7521758430436553e-06, |
| "loss": 0.1158, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.10426779836416245, |
| "step": 5860, |
| "valid_targets_mean": 1341.3, |
| "valid_targets_min": 765 |
| }, |
| { |
| "epoch": 6.160714285714286, |
| "grad_norm": 0.8829153848682123, |
| "learning_rate": 1.7307958350222366e-06, |
| "loss": 0.1139, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.11685581505298615, |
| "step": 5865, |
| "valid_targets_mean": 1556.4, |
| "valid_targets_min": 804 |
| }, |
| { |
| "epoch": 6.165966386554622, |
| "grad_norm": 0.8180165865392631, |
| "learning_rate": 1.7095411673895545e-06, |
| "loss": 0.1147, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.11777027696371078, |
| "step": 5870, |
| "valid_targets_mean": 1509.7, |
| "valid_targets_min": 675 |
| }, |
| { |
| "epoch": 6.171218487394958, |
| "grad_norm": 0.8375114382633897, |
| "learning_rate": 1.6884119859685034e-06, |
| "loss": 0.1098, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.11995431780815125, |
| "step": 5875, |
| "valid_targets_mean": 1408.4, |
| "valid_targets_min": 882 |
| }, |
| { |
| "epoch": 6.176470588235294, |
| "grad_norm": 0.7972330265214028, |
| "learning_rate": 1.6674084357210562e-06, |
| "loss": 0.1071, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.10255067050457001, |
| "step": 5880, |
| "valid_targets_mean": 1449.8, |
| "valid_targets_min": 660 |
| }, |
| { |
| "epoch": 6.18172268907563, |
| "grad_norm": 0.8858809578498907, |
| "learning_rate": 1.6465306607472608e-06, |
| "loss": 0.102, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.10549542307853699, |
| "step": 5885, |
| "valid_targets_mean": 1489.8, |
| "valid_targets_min": 678 |
| }, |
| { |
| "epoch": 6.186974789915967, |
| "grad_norm": 0.9235725158063691, |
| "learning_rate": 1.625778804284246e-06, |
| "loss": 0.1083, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.10902103036642075, |
| "step": 5890, |
| "valid_targets_mean": 1379.1, |
| "valid_targets_min": 676 |
| }, |
| { |
| "epoch": 6.192226890756302, |
| "grad_norm": 0.8610604938191373, |
| "learning_rate": 1.6051530087052558e-06, |
| "loss": 0.1107, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.10405048727989197, |
| "step": 5895, |
| "valid_targets_mean": 1347.1, |
| "valid_targets_min": 794 |
| }, |
| { |
| "epoch": 6.197478991596639, |
| "grad_norm": 0.844841243204075, |
| "learning_rate": 1.5846534155186511e-06, |
| "loss": 0.1103, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1075349748134613, |
| "step": 5900, |
| "valid_targets_mean": 1372.6, |
| "valid_targets_min": 607 |
| }, |
| { |
| "epoch": 6.2027310924369745, |
| "grad_norm": 0.9299916077128926, |
| "learning_rate": 1.564280165366956e-06, |
| "loss": 0.1104, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.11143974959850311, |
| "step": 5905, |
| "valid_targets_mean": 1323.6, |
| "valid_targets_min": 722 |
| }, |
| { |
| "epoch": 6.207983193277311, |
| "grad_norm": 0.9520206844500675, |
| "learning_rate": 1.544033398025886e-06, |
| "loss": 0.1164, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.12437736988067627, |
| "step": 5910, |
| "valid_targets_mean": 1597.7, |
| "valid_targets_min": 858 |
| }, |
| { |
| "epoch": 6.213235294117647, |
| "grad_norm": 0.8264419715144223, |
| "learning_rate": 1.5239132524033951e-06, |
| "loss": 0.0983, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.09098273515701294, |
| "step": 5915, |
| "valid_targets_mean": 1270.8, |
| "valid_targets_min": 689 |
| }, |
| { |
| "epoch": 6.218487394957983, |
| "grad_norm": 0.9121347316675537, |
| "learning_rate": 1.50391986653871e-06, |
| "loss": 0.1151, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.10781864076852798, |
| "step": 5920, |
| "valid_targets_mean": 1388.2, |
| "valid_targets_min": 692 |
| }, |
| { |
| "epoch": 6.223739495798319, |
| "grad_norm": 0.8183103322870855, |
| "learning_rate": 1.4840533776013954e-06, |
| "loss": 0.1116, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.0995546281337738, |
| "step": 5925, |
| "valid_targets_mean": 1447.2, |
| "valid_targets_min": 828 |
| }, |
| { |
| "epoch": 6.2289915966386555, |
| "grad_norm": 0.8695709319336882, |
| "learning_rate": 1.4643139218904035e-06, |
| "loss": 0.1177, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1060028076171875, |
| "step": 5930, |
| "valid_targets_mean": 1399.7, |
| "valid_targets_min": 618 |
| }, |
| { |
| "epoch": 6.234243697478991, |
| "grad_norm": 0.7936160826191869, |
| "learning_rate": 1.4447016348331477e-06, |
| "loss": 0.1041, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.10275650769472122, |
| "step": 5935, |
| "valid_targets_mean": 1454.3, |
| "valid_targets_min": 629 |
| }, |
| { |
| "epoch": 6.239495798319328, |
| "grad_norm": 1.0003364025533468, |
| "learning_rate": 1.4252166509845777e-06, |
| "loss": 0.1087, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1305723935365677, |
| "step": 5940, |
| "valid_targets_mean": 1746.1, |
| "valid_targets_min": 1071 |
| }, |
| { |
| "epoch": 6.244747899159663, |
| "grad_norm": 0.9039823804020426, |
| "learning_rate": 1.4058591040262259e-06, |
| "loss": 0.1079, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1077783852815628, |
| "step": 5945, |
| "valid_targets_mean": 1282.2, |
| "valid_targets_min": 677 |
| }, |
| { |
| "epoch": 6.25, |
| "grad_norm": 0.8985676998446693, |
| "learning_rate": 1.3866291267653309e-06, |
| "loss": 0.1031, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.09621434658765793, |
| "step": 5950, |
| "valid_targets_mean": 1227.6, |
| "valid_targets_min": 679 |
| }, |
| { |
| "epoch": 6.255252100840336, |
| "grad_norm": 0.8526105872349939, |
| "learning_rate": 1.3675268511339067e-06, |
| "loss": 0.1043, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.09855210781097412, |
| "step": 5955, |
| "valid_targets_mean": 1319.1, |
| "valid_targets_min": 504 |
| }, |
| { |
| "epoch": 6.260504201680672, |
| "grad_norm": 0.8620937247837483, |
| "learning_rate": 1.3485524081878288e-06, |
| "loss": 0.1069, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1124173030257225, |
| "step": 5960, |
| "valid_targets_mean": 1616.5, |
| "valid_targets_min": 1023 |
| }, |
| { |
| "epoch": 6.265756302521009, |
| "grad_norm": 0.8269435472596893, |
| "learning_rate": 1.3297059281059533e-06, |
| "loss": 0.1092, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.10087428987026215, |
| "step": 5965, |
| "valid_targets_mean": 1453.0, |
| "valid_targets_min": 661 |
| }, |
| { |
| "epoch": 6.2710084033613445, |
| "grad_norm": 0.8464773093003739, |
| "learning_rate": 1.3109875401892146e-06, |
| "loss": 0.111, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.10120785981416702, |
| "step": 5970, |
| "valid_targets_mean": 1442.0, |
| "valid_targets_min": 889 |
| }, |
| { |
| "epoch": 6.276260504201681, |
| "grad_norm": 0.809843624015962, |
| "learning_rate": 1.2923973728597373e-06, |
| "loss": 0.1037, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.10031883418560028, |
| "step": 5975, |
| "valid_targets_mean": 1548.4, |
| "valid_targets_min": 723 |
| }, |
| { |
| "epoch": 6.281512605042017, |
| "grad_norm": 0.8939758957054761, |
| "learning_rate": 1.2739355536599508e-06, |
| "loss": 0.1095, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.10138392448425293, |
| "step": 5980, |
| "valid_targets_mean": 1359.8, |
| "valid_targets_min": 793 |
| }, |
| { |
| "epoch": 6.286764705882353, |
| "grad_norm": 0.9990516754583353, |
| "learning_rate": 1.2556022092517362e-06, |
| "loss": 0.1055, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.11516615748405457, |
| "step": 5985, |
| "valid_targets_mean": 1478.6, |
| "valid_targets_min": 861 |
| }, |
| { |
| "epoch": 6.292016806722689, |
| "grad_norm": 0.8483028409836717, |
| "learning_rate": 1.237397465415524e-06, |
| "loss": 0.1076, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.0986555963754654, |
| "step": 5990, |
| "valid_targets_mean": 1332.7, |
| "valid_targets_min": 752 |
| }, |
| { |
| "epoch": 6.2972689075630255, |
| "grad_norm": 0.9848150205283159, |
| "learning_rate": 1.2193214470494664e-06, |
| "loss": 0.1076, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.11558929085731506, |
| "step": 5995, |
| "valid_targets_mean": 1622.7, |
| "valid_targets_min": 789 |
| }, |
| { |
| "epoch": 6.302521008403361, |
| "grad_norm": 0.9238690287611016, |
| "learning_rate": 1.201374278168541e-06, |
| "loss": 0.0962, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.08862060308456421, |
| "step": 6000, |
| "valid_targets_mean": 1195.4, |
| "valid_targets_min": 567 |
| }, |
| { |
| "epoch": 6.307773109243698, |
| "grad_norm": 0.9550625507498628, |
| "learning_rate": 1.1835560819037429e-06, |
| "loss": 0.1082, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.12365525960922241, |
| "step": 6005, |
| "valid_targets_mean": 1504.5, |
| "valid_targets_min": 605 |
| }, |
| { |
| "epoch": 6.313025210084033, |
| "grad_norm": 0.8977013451179156, |
| "learning_rate": 1.1658669805012112e-06, |
| "loss": 0.1088, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.10444406419992447, |
| "step": 6010, |
| "valid_targets_mean": 1580.1, |
| "valid_targets_min": 746 |
| }, |
| { |
| "epoch": 6.31827731092437, |
| "grad_norm": 0.9626620928600009, |
| "learning_rate": 1.1483070953213904e-06, |
| "loss": 0.1017, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.09486856311559677, |
| "step": 6015, |
| "valid_targets_mean": 1158.2, |
| "valid_targets_min": 723 |
| }, |
| { |
| "epoch": 6.323529411764706, |
| "grad_norm": 0.857918445866971, |
| "learning_rate": 1.130876546838211e-06, |
| "loss": 0.1092, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.107955202460289, |
| "step": 6020, |
| "valid_targets_mean": 1430.4, |
| "valid_targets_min": 855 |
| }, |
| { |
| "epoch": 6.328781512605042, |
| "grad_norm": 0.8446463752304134, |
| "learning_rate": 1.1135754546382627e-06, |
| "loss": 0.111, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.10878735780715942, |
| "step": 6025, |
| "valid_targets_mean": 1590.4, |
| "valid_targets_min": 902 |
| }, |
| { |
| "epoch": 6.334033613445378, |
| "grad_norm": 0.8359256112732846, |
| "learning_rate": 1.0964039374199564e-06, |
| "loss": 0.108, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.10430100560188293, |
| "step": 6030, |
| "valid_targets_mean": 1521.5, |
| "valid_targets_min": 803 |
| }, |
| { |
| "epoch": 6.339285714285714, |
| "grad_norm": 0.9402998650985804, |
| "learning_rate": 1.07936211299273e-06, |
| "loss": 0.1083, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.11771460622549057, |
| "step": 6035, |
| "valid_targets_mean": 1455.2, |
| "valid_targets_min": 740 |
| }, |
| { |
| "epoch": 6.34453781512605, |
| "grad_norm": 0.8950360049257687, |
| "learning_rate": 1.0624500982762376e-06, |
| "loss": 0.1031, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.09641949832439423, |
| "step": 6040, |
| "valid_targets_mean": 1279.4, |
| "valid_targets_min": 244 |
| }, |
| { |
| "epoch": 6.349789915966387, |
| "grad_norm": 0.8797683867630403, |
| "learning_rate": 1.045668009299523e-06, |
| "loss": 0.1104, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.10380536317825317, |
| "step": 6045, |
| "valid_targets_mean": 1366.9, |
| "valid_targets_min": 714 |
| }, |
| { |
| "epoch": 6.355042016806722, |
| "grad_norm": 0.8500779068020419, |
| "learning_rate": 1.029015961200266e-06, |
| "loss": 0.1055, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.08908183872699738, |
| "step": 6050, |
| "valid_targets_mean": 1220.5, |
| "valid_targets_min": 585 |
| }, |
| { |
| "epoch": 6.360294117647059, |
| "grad_norm": 0.963766954956786, |
| "learning_rate": 1.012494068223946e-06, |
| "loss": 0.1142, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.11748844385147095, |
| "step": 6055, |
| "valid_targets_mean": 1596.4, |
| "valid_targets_min": 1041 |
| }, |
| { |
| "epoch": 6.3655462184873945, |
| "grad_norm": 1.013786349356977, |
| "learning_rate": 9.961024437230948e-07, |
| "loss": 0.1081, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.10118795186281204, |
| "step": 6060, |
| "valid_targets_mean": 1401.3, |
| "valid_targets_min": 777 |
| }, |
| { |
| "epoch": 6.370798319327731, |
| "grad_norm": 0.8907088069055336, |
| "learning_rate": 9.798412001565038e-07, |
| "loss": 0.1095, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.10110174119472504, |
| "step": 6065, |
| "valid_targets_mean": 1546.8, |
| "valid_targets_min": 959 |
| }, |
| { |
| "epoch": 6.376050420168067, |
| "grad_norm": 0.836878249917925, |
| "learning_rate": 9.63710449088453e-07, |
| "loss": 0.1052, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.0972297191619873, |
| "step": 6070, |
| "valid_targets_mean": 1284.4, |
| "valid_targets_min": 620 |
| }, |
| { |
| "epoch": 6.381302521008403, |
| "grad_norm": 0.8342602387448971, |
| "learning_rate": 9.477103011879408e-07, |
| "loss": 0.1035, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.0927862748503685, |
| "step": 6075, |
| "valid_targets_mean": 1356.6, |
| "valid_targets_min": 656 |
| }, |
| { |
| "epoch": 6.38655462184874, |
| "grad_norm": 0.9521526310876444, |
| "learning_rate": 9.318408662279399e-07, |
| "loss": 0.1113, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.12353593111038208, |
| "step": 6080, |
| "valid_targets_mean": 1564.5, |
| "valid_targets_min": 697 |
| }, |
| { |
| "epoch": 6.391806722689076, |
| "grad_norm": 0.8338141493940605, |
| "learning_rate": 9.161022530846253e-07, |
| "loss": 0.0993, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.09638993442058563, |
| "step": 6085, |
| "valid_targets_mean": 1604.7, |
| "valid_targets_min": 682 |
| }, |
| { |
| "epoch": 6.397058823529412, |
| "grad_norm": 0.9780093813312944, |
| "learning_rate": 9.004945697366452e-07, |
| "loss": 0.1, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.09383905678987503, |
| "step": 6090, |
| "valid_targets_mean": 1383.4, |
| "valid_targets_min": 730 |
| }, |
| { |
| "epoch": 6.402310924369748, |
| "grad_norm": 0.891231287791507, |
| "learning_rate": 8.850179232643641e-07, |
| "loss": 0.1047, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.10458773374557495, |
| "step": 6095, |
| "valid_targets_mean": 1482.5, |
| "valid_targets_min": 747 |
| }, |
| { |
| "epoch": 6.407563025210084, |
| "grad_norm": 0.8092854746476409, |
| "learning_rate": 8.696724198491369e-07, |
| "loss": 0.1152, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.10784599184989929, |
| "step": 6100, |
| "valid_targets_mean": 1603.6, |
| "valid_targets_min": 933 |
| }, |
| { |
| "epoch": 6.41281512605042, |
| "grad_norm": 0.9405797225301739, |
| "learning_rate": 8.544581647725825e-07, |
| "loss": 0.1025, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.10436847805976868, |
| "step": 6105, |
| "valid_targets_mean": 1517.9, |
| "valid_targets_min": 799 |
| }, |
| { |
| "epoch": 6.418067226890757, |
| "grad_norm": 0.8958196229325652, |
| "learning_rate": 8.393752624158603e-07, |
| "loss": 0.102, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.10442647337913513, |
| "step": 6110, |
| "valid_targets_mean": 1516.2, |
| "valid_targets_min": 909 |
| }, |
| { |
| "epoch": 6.423319327731092, |
| "grad_norm": 0.8319689597681014, |
| "learning_rate": 8.244238162589435e-07, |
| "loss": 0.0991, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.10206621140241623, |
| "step": 6115, |
| "valid_targets_mean": 1606.8, |
| "valid_targets_min": 741 |
| }, |
| { |
| "epoch": 6.428571428571429, |
| "grad_norm": 0.8710279467847112, |
| "learning_rate": 8.096039288799251e-07, |
| "loss": 0.0907, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.09631064534187317, |
| "step": 6120, |
| "valid_targets_mean": 1328.7, |
| "valid_targets_min": 720 |
| }, |
| { |
| "epoch": 6.4338235294117645, |
| "grad_norm": 0.8396789652735168, |
| "learning_rate": 7.949157019543064e-07, |
| "loss": 0.1038, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.10037371516227722, |
| "step": 6125, |
| "valid_targets_mean": 1396.2, |
| "valid_targets_min": 610 |
| }, |
| { |
| "epoch": 6.439075630252101, |
| "grad_norm": 0.8987178018129869, |
| "learning_rate": 7.803592362542911e-07, |
| "loss": 0.0992, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.10167519003152847, |
| "step": 6130, |
| "valid_targets_mean": 1352.9, |
| "valid_targets_min": 684 |
| }, |
| { |
| "epoch": 6.444327731092437, |
| "grad_norm": 0.8464981713812435, |
| "learning_rate": 7.659346316481086e-07, |
| "loss": 0.0978, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.09975661337375641, |
| "step": 6135, |
| "valid_targets_mean": 1479.4, |
| "valid_targets_min": 874 |
| }, |
| { |
| "epoch": 6.449579831932773, |
| "grad_norm": 0.8500419492524814, |
| "learning_rate": 7.516419870993296e-07, |
| "loss": 0.1026, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.09866391867399216, |
| "step": 6140, |
| "valid_targets_mean": 1501.2, |
| "valid_targets_min": 765 |
| }, |
| { |
| "epoch": 6.454831932773109, |
| "grad_norm": 0.8846021286748634, |
| "learning_rate": 7.374814006661667e-07, |
| "loss": 0.1004, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.0995045006275177, |
| "step": 6145, |
| "valid_targets_mean": 1419.9, |
| "valid_targets_min": 589 |
| }, |
| { |
| "epoch": 6.4600840336134455, |
| "grad_norm": 0.9586129744458028, |
| "learning_rate": 7.234529695008241e-07, |
| "loss": 0.1043, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1108023077249527, |
| "step": 6150, |
| "valid_targets_mean": 1587.2, |
| "valid_targets_min": 918 |
| }, |
| { |
| "epoch": 6.465336134453781, |
| "grad_norm": 1.136739780639734, |
| "learning_rate": 7.095567898488175e-07, |
| "loss": 0.188, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.20650501549243927, |
| "step": 6155, |
| "valid_targets_mean": 3546.9, |
| "valid_targets_min": 702 |
| }, |
| { |
| "epoch": 6.470588235294118, |
| "grad_norm": 1.156568540868847, |
| "learning_rate": 6.957929570483224e-07, |
| "loss": 0.2101, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2196894884109497, |
| "step": 6160, |
| "valid_targets_mean": 4000.6, |
| "valid_targets_min": 1005 |
| }, |
| { |
| "epoch": 6.475840336134453, |
| "grad_norm": 1.0910237455501957, |
| "learning_rate": 6.821615655295155e-07, |
| "loss": 0.1974, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.19706688821315765, |
| "step": 6165, |
| "valid_targets_mean": 4063.9, |
| "valid_targets_min": 1296 |
| }, |
| { |
| "epoch": 6.48109243697479, |
| "grad_norm": 0.9433508198462144, |
| "learning_rate": 6.686627088139253e-07, |
| "loss": 0.1925, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18134765326976776, |
| "step": 6170, |
| "valid_targets_mean": 3747.0, |
| "valid_targets_min": 1561 |
| }, |
| { |
| "epoch": 6.486344537815126, |
| "grad_norm": 0.9443013244173882, |
| "learning_rate": 6.552964795137895e-07, |
| "loss": 0.1905, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.206732839345932, |
| "step": 6175, |
| "valid_targets_mean": 3562.5, |
| "valid_targets_min": 1044 |
| }, |
| { |
| "epoch": 6.491596638655462, |
| "grad_norm": 0.7981181274477949, |
| "learning_rate": 6.420629693314317e-07, |
| "loss": 0.1932, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1745770275592804, |
| "step": 6180, |
| "valid_targets_mean": 3911.4, |
| "valid_targets_min": 920 |
| }, |
| { |
| "epoch": 6.496848739495798, |
| "grad_norm": 1.0053288601599724, |
| "learning_rate": 6.289622690586151e-07, |
| "loss": 0.1802, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.21677300333976746, |
| "step": 6185, |
| "valid_targets_mean": 5753.8, |
| "valid_targets_min": 2060 |
| }, |
| { |
| "epoch": 6.5021008403361344, |
| "grad_norm": 0.8097609883366772, |
| "learning_rate": 6.159944685759289e-07, |
| "loss": 0.1873, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.19428494572639465, |
| "step": 6190, |
| "valid_targets_mean": 3728.6, |
| "valid_targets_min": 467 |
| }, |
| { |
| "epoch": 6.507352941176471, |
| "grad_norm": 0.8064900139004815, |
| "learning_rate": 6.031596568521792e-07, |
| "loss": 0.1907, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.20241563022136688, |
| "step": 6195, |
| "valid_targets_mean": 3554.0, |
| "valid_targets_min": 1689 |
| }, |
| { |
| "epoch": 6.512605042016807, |
| "grad_norm": 0.776184144360134, |
| "learning_rate": 5.904579219437567e-07, |
| "loss": 0.1902, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1855916827917099, |
| "step": 6200, |
| "valid_targets_mean": 3708.1, |
| "valid_targets_min": 1697 |
| }, |
| { |
| "epoch": 6.517857142857143, |
| "grad_norm": 0.7831624701562231, |
| "learning_rate": 5.778893509940497e-07, |
| "loss": 0.1917, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2027127742767334, |
| "step": 6205, |
| "valid_targets_mean": 3652.6, |
| "valid_targets_min": 1223 |
| }, |
| { |
| "epoch": 6.523109243697479, |
| "grad_norm": 0.7592030323419526, |
| "learning_rate": 5.654540302328526e-07, |
| "loss": 0.1901, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18956655263900757, |
| "step": 6210, |
| "valid_targets_mean": 4036.1, |
| "valid_targets_min": 1552 |
| }, |
| { |
| "epoch": 6.5283613445378155, |
| "grad_norm": 0.7395667543125498, |
| "learning_rate": 5.531520449757465e-07, |
| "loss": 0.1866, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1876063048839569, |
| "step": 6215, |
| "valid_targets_mean": 3543.5, |
| "valid_targets_min": 1439 |
| }, |
| { |
| "epoch": 6.533613445378151, |
| "grad_norm": 0.7046765053549935, |
| "learning_rate": 5.409834796235447e-07, |
| "loss": 0.1864, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1793154776096344, |
| "step": 6220, |
| "valid_targets_mean": 3287.0, |
| "valid_targets_min": 1402 |
| }, |
| { |
| "epoch": 6.538865546218488, |
| "grad_norm": 0.7352367532176454, |
| "learning_rate": 5.28948417661701e-07, |
| "loss": 0.1922, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.19139184057712555, |
| "step": 6225, |
| "valid_targets_mean": 3423.9, |
| "valid_targets_min": 1586 |
| }, |
| { |
| "epoch": 6.544117647058823, |
| "grad_norm": 0.7217587370221558, |
| "learning_rate": 5.170469416597223e-07, |
| "loss": 0.1874, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18540339171886444, |
| "step": 6230, |
| "valid_targets_mean": 3406.0, |
| "valid_targets_min": 1538 |
| }, |
| { |
| "epoch": 6.54936974789916, |
| "grad_norm": 0.8448265208591422, |
| "learning_rate": 5.05279133270633e-07, |
| "loss": 0.1863, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18816813826560974, |
| "step": 6235, |
| "valid_targets_mean": 2954.0, |
| "valid_targets_min": 1058 |
| }, |
| { |
| "epoch": 6.554621848739496, |
| "grad_norm": 0.7796897965938916, |
| "learning_rate": 4.936450732303866e-07, |
| "loss": 0.2001, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.198177307844162, |
| "step": 6240, |
| "valid_targets_mean": 3051.8, |
| "valid_targets_min": 1362 |
| }, |
| { |
| "epoch": 6.559873949579832, |
| "grad_norm": 0.6964707697678552, |
| "learning_rate": 4.821448413573237e-07, |
| "loss": 0.1875, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1926005631685257, |
| "step": 6245, |
| "valid_targets_mean": 3620.5, |
| "valid_targets_min": 1392 |
| }, |
| { |
| "epoch": 6.565126050420168, |
| "grad_norm": 0.7685525826201484, |
| "learning_rate": 4.70778516551631e-07, |
| "loss": 0.1878, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18368004262447357, |
| "step": 6250, |
| "valid_targets_mean": 3103.6, |
| "valid_targets_min": 1267 |
| }, |
| { |
| "epoch": 6.570378151260504, |
| "grad_norm": 0.7299698999315323, |
| "learning_rate": 4.595461767947829e-07, |
| "loss": 0.1849, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.19365397095680237, |
| "step": 6255, |
| "valid_targets_mean": 3592.7, |
| "valid_targets_min": 1026 |
| }, |
| { |
| "epoch": 6.57563025210084, |
| "grad_norm": 0.7134849644818172, |
| "learning_rate": 4.484478991490249e-07, |
| "loss": 0.1767, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18238605558872223, |
| "step": 6260, |
| "valid_targets_mean": 3632.1, |
| "valid_targets_min": 1785 |
| }, |
| { |
| "epoch": 6.580882352941177, |
| "grad_norm": 0.7566638135613766, |
| "learning_rate": 4.374837597568338e-07, |
| "loss": 0.1937, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17180000245571136, |
| "step": 6265, |
| "valid_targets_mean": 3557.1, |
| "valid_targets_min": 1957 |
| }, |
| { |
| "epoch": 6.586134453781512, |
| "grad_norm": 0.7212160746237427, |
| "learning_rate": 4.266538338403936e-07, |
| "loss": 0.1937, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17052122950553894, |
| "step": 6270, |
| "valid_targets_mean": 3230.6, |
| "valid_targets_min": 1570 |
| }, |
| { |
| "epoch": 6.591386554621849, |
| "grad_norm": 0.7590336258795505, |
| "learning_rate": 4.159581957010894e-07, |
| "loss": 0.1834, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18137861788272858, |
| "step": 6275, |
| "valid_targets_mean": 3023.7, |
| "valid_targets_min": 997 |
| }, |
| { |
| "epoch": 6.5966386554621845, |
| "grad_norm": 0.7939812548685019, |
| "learning_rate": 4.0539691871898545e-07, |
| "loss": 0.1811, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.20064428448677063, |
| "step": 6280, |
| "valid_targets_mean": 3056.6, |
| "valid_targets_min": 1293 |
| }, |
| { |
| "epoch": 6.601890756302521, |
| "grad_norm": 0.7459390024198103, |
| "learning_rate": 3.949700753523344e-07, |
| "loss": 0.1833, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16911663115024567, |
| "step": 6285, |
| "valid_targets_mean": 2915.6, |
| "valid_targets_min": 1687 |
| }, |
| { |
| "epoch": 6.607142857142857, |
| "grad_norm": 0.8123891604766348, |
| "learning_rate": 3.8467773713707134e-07, |
| "loss": 0.1873, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.19759421050548553, |
| "step": 6290, |
| "valid_targets_mean": 2985.1, |
| "valid_targets_min": 1108 |
| }, |
| { |
| "epoch": 6.612394957983193, |
| "grad_norm": 0.7820274649796405, |
| "learning_rate": 3.7451997468632486e-07, |
| "loss": 0.1846, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17913171648979187, |
| "step": 6295, |
| "valid_targets_mean": 3195.0, |
| "valid_targets_min": 571 |
| }, |
| { |
| "epoch": 6.617647058823529, |
| "grad_norm": 0.7958593118852751, |
| "learning_rate": 3.6449685768993327e-07, |
| "loss": 0.1932, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.19205614924430847, |
| "step": 6300, |
| "valid_targets_mean": 3106.2, |
| "valid_targets_min": 738 |
| }, |
| { |
| "epoch": 6.6228991596638656, |
| "grad_norm": 0.727974701275133, |
| "learning_rate": 3.5460845491396944e-07, |
| "loss": 0.1798, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1842992901802063, |
| "step": 6305, |
| "valid_targets_mean": 3189.5, |
| "valid_targets_min": 1896 |
| }, |
| { |
| "epoch": 6.628151260504202, |
| "grad_norm": 0.737246932634588, |
| "learning_rate": 3.448548342002589e-07, |
| "loss": 0.184, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18911173939704895, |
| "step": 6310, |
| "valid_targets_mean": 3278.9, |
| "valid_targets_min": 1177 |
| }, |
| { |
| "epoch": 6.633403361344538, |
| "grad_norm": 0.7200101677641911, |
| "learning_rate": 3.352360624659312e-07, |
| "loss": 0.1844, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.19001314043998718, |
| "step": 6315, |
| "valid_targets_mean": 3398.8, |
| "valid_targets_min": 1270 |
| }, |
| { |
| "epoch": 6.6386554621848735, |
| "grad_norm": 0.6991330740624144, |
| "learning_rate": 3.2575220570294276e-07, |
| "loss": 0.186, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1835232377052307, |
| "step": 6320, |
| "valid_targets_mean": 3829.2, |
| "valid_targets_min": 1668 |
| }, |
| { |
| "epoch": 6.64390756302521, |
| "grad_norm": 0.6942560490970551, |
| "learning_rate": 3.164033289776369e-07, |
| "loss": 0.1857, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18814723193645477, |
| "step": 6325, |
| "valid_targets_mean": 3426.9, |
| "valid_targets_min": 1184 |
| }, |
| { |
| "epoch": 6.649159663865547, |
| "grad_norm": 0.7240553846645934, |
| "learning_rate": 3.071894964302935e-07, |
| "loss": 0.1851, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.19533832371234894, |
| "step": 6330, |
| "valid_targets_mean": 3523.6, |
| "valid_targets_min": 1858 |
| }, |
| { |
| "epoch": 6.654411764705882, |
| "grad_norm": 0.6784877207352158, |
| "learning_rate": 2.981107712746867e-07, |
| "loss": 0.181, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16024400293827057, |
| "step": 6335, |
| "valid_targets_mean": 3161.2, |
| "valid_targets_min": 922 |
| }, |
| { |
| "epoch": 6.659663865546219, |
| "grad_norm": 0.8123686861228415, |
| "learning_rate": 2.891672157976522e-07, |
| "loss": 0.1842, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.212624192237854, |
| "step": 6340, |
| "valid_targets_mean": 2948.9, |
| "valid_targets_min": 1812 |
| }, |
| { |
| "epoch": 6.6649159663865545, |
| "grad_norm": 0.7276516066486569, |
| "learning_rate": 2.803588913586608e-07, |
| "loss": 0.1867, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17187952995300293, |
| "step": 6345, |
| "valid_targets_mean": 3107.7, |
| "valid_targets_min": 977 |
| }, |
| { |
| "epoch": 6.670168067226891, |
| "grad_norm": 0.6887997469688529, |
| "learning_rate": 2.716858583894033e-07, |
| "loss": 0.1785, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16475774347782135, |
| "step": 6350, |
| "valid_targets_mean": 3372.6, |
| "valid_targets_min": 810 |
| }, |
| { |
| "epoch": 6.675420168067227, |
| "grad_norm": 0.7520402794788272, |
| "learning_rate": 2.6314817639335964e-07, |
| "loss": 0.1833, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17598888278007507, |
| "step": 6355, |
| "valid_targets_mean": 3305.2, |
| "valid_targets_min": 1673 |
| }, |
| { |
| "epoch": 6.680672268907563, |
| "grad_norm": 0.6523534201108536, |
| "learning_rate": 2.547459039454103e-07, |
| "loss": 0.183, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15471762418746948, |
| "step": 6360, |
| "valid_targets_mean": 3933.0, |
| "valid_targets_min": 1869 |
| }, |
| { |
| "epoch": 6.685924369747899, |
| "grad_norm": 0.8552212655149624, |
| "learning_rate": 2.4647909869142117e-07, |
| "loss": 0.1945, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.20678521692752838, |
| "step": 6365, |
| "valid_targets_mean": 3010.2, |
| "valid_targets_min": 1377 |
| }, |
| { |
| "epoch": 6.6911764705882355, |
| "grad_norm": 0.7322859160819369, |
| "learning_rate": 2.3834781734784817e-07, |
| "loss": 0.1877, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18106794357299805, |
| "step": 6370, |
| "valid_targets_mean": 3055.6, |
| "valid_targets_min": 1219 |
| }, |
| { |
| "epoch": 6.696428571428571, |
| "grad_norm": 0.738490804680364, |
| "learning_rate": 2.3035211570135995e-07, |
| "loss": 0.1888, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17908601462841034, |
| "step": 6375, |
| "valid_targets_mean": 3442.4, |
| "valid_targets_min": 1168 |
| }, |
| { |
| "epoch": 6.701680672268908, |
| "grad_norm": 0.7971361125915069, |
| "learning_rate": 2.224920486084403e-07, |
| "loss": 0.1707, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18598723411560059, |
| "step": 6380, |
| "valid_targets_mean": 3041.9, |
| "valid_targets_min": 1955 |
| }, |
| { |
| "epoch": 6.706932773109243, |
| "grad_norm": 0.7900277569565785, |
| "learning_rate": 2.1476766999502408e-07, |
| "loss": 0.1855, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18570013344287872, |
| "step": 6385, |
| "valid_targets_mean": 3640.2, |
| "valid_targets_min": 1628 |
| }, |
| { |
| "epoch": 6.71218487394958, |
| "grad_norm": 0.6556232945874763, |
| "learning_rate": 2.071790328561152e-07, |
| "loss": 0.1779, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1550453007221222, |
| "step": 6390, |
| "valid_targets_mean": 3358.4, |
| "valid_targets_min": 1482 |
| }, |
| { |
| "epoch": 6.717436974789916, |
| "grad_norm": 0.6812790984777259, |
| "learning_rate": 1.997261892554403e-07, |
| "loss": 0.1763, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15719173848628998, |
| "step": 6395, |
| "valid_targets_mean": 3460.4, |
| "valid_targets_min": 904 |
| }, |
| { |
| "epoch": 6.722689075630252, |
| "grad_norm": 0.7769101571262454, |
| "learning_rate": 1.9240919032506688e-07, |
| "loss": 0.1875, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2275974154472351, |
| "step": 6400, |
| "valid_targets_mean": 3728.4, |
| "valid_targets_min": 1194 |
| }, |
| { |
| "epoch": 6.727941176470588, |
| "grad_norm": 0.7389737083348429, |
| "learning_rate": 1.8522808626507683e-07, |
| "loss": 0.1859, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1957985758781433, |
| "step": 6405, |
| "valid_targets_mean": 3940.4, |
| "valid_targets_min": 1658 |
| }, |
| { |
| "epoch": 6.733193277310924, |
| "grad_norm": 0.77498392264914, |
| "learning_rate": 1.781829263432111e-07, |
| "loss": 0.1812, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1999933421611786, |
| "step": 6410, |
| "valid_targets_mean": 3536.9, |
| "valid_targets_min": 1423 |
| }, |
| { |
| "epoch": 6.73844537815126, |
| "grad_norm": 0.7005856165044073, |
| "learning_rate": 1.7127375889452569e-07, |
| "loss": 0.1853, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1850917786359787, |
| "step": 6415, |
| "valid_targets_mean": 3351.2, |
| "valid_targets_min": 2010 |
| }, |
| { |
| "epoch": 6.743697478991597, |
| "grad_norm": 0.7167520426399059, |
| "learning_rate": 1.6450063132107396e-07, |
| "loss": 0.196, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18986815214157104, |
| "step": 6420, |
| "valid_targets_mean": 3498.6, |
| "valid_targets_min": 1172 |
| }, |
| { |
| "epoch": 6.748949579831933, |
| "grad_norm": 0.6942759631181366, |
| "learning_rate": 1.5786359009156928e-07, |
| "loss": 0.186, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18716512620449066, |
| "step": 6425, |
| "valid_targets_mean": 3863.8, |
| "valid_targets_min": 1229 |
| }, |
| { |
| "epoch": 6.754201680672269, |
| "grad_norm": 0.6936745579008864, |
| "learning_rate": 1.5136268074107398e-07, |
| "loss": 0.1794, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1890535056591034, |
| "step": 6430, |
| "valid_targets_mean": 3600.5, |
| "valid_targets_min": 1523 |
| }, |
| { |
| "epoch": 6.759453781512605, |
| "grad_norm": 0.7070845571059466, |
| "learning_rate": 1.44997947870682e-07, |
| "loss": 0.1742, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17694947123527527, |
| "step": 6435, |
| "valid_targets_mean": 3623.9, |
| "valid_targets_min": 997 |
| }, |
| { |
| "epoch": 6.764705882352941, |
| "grad_norm": 0.7375315587768612, |
| "learning_rate": 1.3876943514721465e-07, |
| "loss": 0.1731, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17876756191253662, |
| "step": 6440, |
| "valid_targets_mean": 3535.2, |
| "valid_targets_min": 621 |
| }, |
| { |
| "epoch": 6.769957983193278, |
| "grad_norm": 0.7430227920142868, |
| "learning_rate": 1.3267718530292296e-07, |
| "loss": 0.1791, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18011704087257385, |
| "step": 6445, |
| "valid_targets_mean": 3071.5, |
| "valid_targets_min": 1282 |
| }, |
| { |
| "epoch": 6.775210084033613, |
| "grad_norm": 0.6530774473575953, |
| "learning_rate": 1.267212401351925e-07, |
| "loss": 0.1659, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1584375500679016, |
| "step": 6450, |
| "valid_targets_mean": 3779.1, |
| "valid_targets_min": 1421 |
| }, |
| { |
| "epoch": 6.78046218487395, |
| "grad_norm": 0.6882124626090157, |
| "learning_rate": 1.2090164050625907e-07, |
| "loss": 0.1722, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1654224693775177, |
| "step": 6455, |
| "valid_targets_mean": 3330.2, |
| "valid_targets_min": 1853 |
| }, |
| { |
| "epoch": 6.785714285714286, |
| "grad_norm": 0.7044440655396256, |
| "learning_rate": 1.1521842634292013e-07, |
| "loss": 0.1967, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17785203456878662, |
| "step": 6460, |
| "valid_targets_mean": 3327.8, |
| "valid_targets_min": 1410 |
| }, |
| { |
| "epoch": 6.790966386554622, |
| "grad_norm": 0.8200049965639139, |
| "learning_rate": 1.0967163663627044e-07, |
| "loss": 0.1765, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18418024480342865, |
| "step": 6465, |
| "valid_targets_mean": 2920.6, |
| "valid_targets_min": 1305 |
| }, |
| { |
| "epoch": 6.796218487394958, |
| "grad_norm": 0.7154441982579451, |
| "learning_rate": 1.0426130944143353e-07, |
| "loss": 0.1827, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1741981953382492, |
| "step": 6470, |
| "valid_targets_mean": 3539.7, |
| "valid_targets_min": 996 |
| }, |
| { |
| "epoch": 6.801470588235294, |
| "grad_norm": 0.6654603332753054, |
| "learning_rate": 9.898748187729513e-08, |
| "loss": 0.1806, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16577930748462677, |
| "step": 6475, |
| "valid_targets_mean": 3357.1, |
| "valid_targets_min": 1349 |
| }, |
| { |
| "epoch": 6.80672268907563, |
| "grad_norm": 0.8172505155020807, |
| "learning_rate": 9.385019012625007e-08, |
| "loss": 0.1893, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.21172448992729187, |
| "step": 6480, |
| "valid_targets_mean": 3613.5, |
| "valid_targets_min": 1248 |
| }, |
| { |
| "epoch": 6.811974789915967, |
| "grad_norm": 0.6891423541136645, |
| "learning_rate": 8.884946943395811e-08, |
| "loss": 0.1703, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14347678422927856, |
| "step": 6485, |
| "valid_targets_mean": 3327.4, |
| "valid_targets_min": 1109 |
| }, |
| { |
| "epoch": 6.817226890756302, |
| "grad_norm": 0.7516599357315075, |
| "learning_rate": 8.398535410910402e-08, |
| "loss": 0.1838, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18097805976867676, |
| "step": 6490, |
| "valid_targets_mean": 2790.8, |
| "valid_targets_min": 1649 |
| }, |
| { |
| "epoch": 6.822478991596639, |
| "grad_norm": 0.7616811039107437, |
| "learning_rate": 7.925787752314674e-08, |
| "loss": 0.1793, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18834054470062256, |
| "step": 6495, |
| "valid_targets_mean": 2811.8, |
| "valid_targets_min": 1197 |
| }, |
| { |
| "epoch": 6.8277310924369745, |
| "grad_norm": 0.7317487761588832, |
| "learning_rate": 7.466707211010838e-08, |
| "loss": 0.1919, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.20096731185913086, |
| "step": 6500, |
| "valid_targets_mean": 3420.2, |
| "valid_targets_min": 1720 |
| }, |
| { |
| "epoch": 6.832983193277311, |
| "grad_norm": 0.6976502515107287, |
| "learning_rate": 7.02129693663478e-08, |
| "loss": 0.1905, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18510772287845612, |
| "step": 6505, |
| "valid_targets_mean": 3542.7, |
| "valid_targets_min": 1054 |
| }, |
| { |
| "epoch": 6.838235294117647, |
| "grad_norm": 0.8023438462902227, |
| "learning_rate": 6.589559985033189e-08, |
| "loss": 0.1815, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17661021649837494, |
| "step": 6510, |
| "valid_targets_mean": 3049.7, |
| "valid_targets_min": 1643 |
| }, |
| { |
| "epoch": 6.843487394957983, |
| "grad_norm": 0.6905962109077173, |
| "learning_rate": 6.171499318244234e-08, |
| "loss": 0.1897, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.19038131833076477, |
| "step": 6515, |
| "valid_targets_mean": 3757.8, |
| "valid_targets_min": 1135 |
| }, |
| { |
| "epoch": 6.848739495798319, |
| "grad_norm": 0.7819298312536493, |
| "learning_rate": 5.767117804476696e-08, |
| "loss": 0.1895, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.188393235206604, |
| "step": 6520, |
| "valid_targets_mean": 3715.1, |
| "valid_targets_min": 1174 |
| }, |
| { |
| "epoch": 6.8539915966386555, |
| "grad_norm": 0.7603239023118682, |
| "learning_rate": 5.376418218089541e-08, |
| "loss": 0.1934, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.20249368250370026, |
| "step": 6525, |
| "valid_targets_mean": 3321.9, |
| "valid_targets_min": 992 |
| }, |
| { |
| "epoch": 6.859243697478991, |
| "grad_norm": 0.8027496504534014, |
| "learning_rate": 4.99940323957393e-08, |
| "loss": 0.1917, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2095927596092224, |
| "step": 6530, |
| "valid_targets_mean": 3713.2, |
| "valid_targets_min": 1133 |
| }, |
| { |
| "epoch": 6.864495798319328, |
| "grad_norm": 0.7827471840659329, |
| "learning_rate": 4.63607545553435e-08, |
| "loss": 0.1862, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.19427041709423065, |
| "step": 6535, |
| "valid_targets_mean": 2961.8, |
| "valid_targets_min": 1195 |
| }, |
| { |
| "epoch": 6.869747899159664, |
| "grad_norm": 0.8495916082471087, |
| "learning_rate": 4.2864373586706254e-08, |
| "loss": 0.1944, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.20868608355522156, |
| "step": 6540, |
| "valid_targets_mean": 3012.6, |
| "valid_targets_min": 484 |
| }, |
| { |
| "epoch": 6.875, |
| "grad_norm": 0.7058473937236638, |
| "learning_rate": 3.950491347761487e-08, |
| "loss": 0.1888, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.19130313396453857, |
| "step": 6545, |
| "valid_targets_mean": 3639.9, |
| "valid_targets_min": 1434 |
| }, |
| { |
| "epoch": 6.880252100840336, |
| "grad_norm": 0.8058046651510254, |
| "learning_rate": 3.628239727647254e-08, |
| "loss": 0.1846, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17615005373954773, |
| "step": 6550, |
| "valid_targets_mean": 4017.4, |
| "valid_targets_min": 1349 |
| }, |
| { |
| "epoch": 6.885504201680672, |
| "grad_norm": 0.7986547158784268, |
| "learning_rate": 3.319684709215176e-08, |
| "loss": 0.1907, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.20986217260360718, |
| "step": 6555, |
| "valid_targets_mean": 3178.8, |
| "valid_targets_min": 1434 |
| }, |
| { |
| "epoch": 6.890756302521009, |
| "grad_norm": 0.7069871681601839, |
| "learning_rate": 3.024828409383007e-08, |
| "loss": 0.1833, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18144480884075165, |
| "step": 6560, |
| "valid_targets_mean": 3633.9, |
| "valid_targets_min": 521 |
| }, |
| { |
| "epoch": 6.8960084033613445, |
| "grad_norm": 0.747775716498079, |
| "learning_rate": 2.743672851085233e-08, |
| "loss": 0.196, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.19807741045951843, |
| "step": 6565, |
| "valid_targets_mean": 3981.0, |
| "valid_targets_min": 1464 |
| }, |
| { |
| "epoch": 6.901260504201681, |
| "grad_norm": 1.0660860736808098, |
| "learning_rate": 2.4762199632588634e-08, |
| "loss": 0.1992, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1948835551738739, |
| "step": 6570, |
| "valid_targets_mean": 2612.0, |
| "valid_targets_min": 1239 |
| }, |
| { |
| "epoch": 6.906512605042017, |
| "grad_norm": 0.8171298625094956, |
| "learning_rate": 2.2224715808309983e-08, |
| "loss": 0.1787, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18982771039009094, |
| "step": 6575, |
| "valid_targets_mean": 3489.8, |
| "valid_targets_min": 1457 |
| }, |
| { |
| "epoch": 6.911764705882353, |
| "grad_norm": 0.7615110154926487, |
| "learning_rate": 1.9824294447043923e-08, |
| "loss": 0.1807, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.186547189950943, |
| "step": 6580, |
| "valid_targets_mean": 3059.1, |
| "valid_targets_min": 1460 |
| }, |
| { |
| "epoch": 6.917016806722689, |
| "grad_norm": 0.7778984161564974, |
| "learning_rate": 1.7560952017481313e-08, |
| "loss": 0.1893, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.19061462581157684, |
| "step": 6585, |
| "valid_targets_mean": 3259.2, |
| "valid_targets_min": 1084 |
| }, |
| { |
| "epoch": 6.9222689075630255, |
| "grad_norm": 0.7069596850632259, |
| "learning_rate": 1.5434704047836424e-08, |
| "loss": 0.1791, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17042481899261475, |
| "step": 6590, |
| "valid_targets_mean": 3337.9, |
| "valid_targets_min": 1035 |
| }, |
| { |
| "epoch": 6.927521008403361, |
| "grad_norm": 0.7072879579761938, |
| "learning_rate": 1.344556512576256e-08, |
| "loss": 0.1826, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.19188648462295532, |
| "step": 6595, |
| "valid_targets_mean": 4091.9, |
| "valid_targets_min": 1876 |
| }, |
| { |
| "epoch": 6.932773109243698, |
| "grad_norm": 0.7505076999505291, |
| "learning_rate": 1.1593548898236606e-08, |
| "loss": 0.1867, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1926942616701126, |
| "step": 6600, |
| "valid_targets_mean": 3705.8, |
| "valid_targets_min": 1062 |
| }, |
| { |
| "epoch": 6.938025210084033, |
| "grad_norm": 0.831906921551297, |
| "learning_rate": 9.878668071474639e-09, |
| "loss": 0.1745, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16769427061080933, |
| "step": 6605, |
| "valid_targets_mean": 3030.8, |
| "valid_targets_min": 993 |
| }, |
| { |
| "epoch": 6.94327731092437, |
| "grad_norm": 0.7424388421322633, |
| "learning_rate": 8.3009344108409e-09, |
| "loss": 0.1753, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17962056398391724, |
| "step": 6610, |
| "valid_targets_mean": 3366.9, |
| "valid_targets_min": 873 |
| }, |
| { |
| "epoch": 6.948529411764706, |
| "grad_norm": 0.676120936221246, |
| "learning_rate": 6.860358740763406e-09, |
| "loss": 0.1757, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17056873440742493, |
| "step": 6615, |
| "valid_targets_mean": 3651.0, |
| "valid_targets_min": 1295 |
| }, |
| { |
| "epoch": 6.953781512605042, |
| "grad_norm": 0.7276545536651401, |
| "learning_rate": 5.55695094467179e-09, |
| "loss": 0.1882, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.19623544812202454, |
| "step": 6620, |
| "valid_targets_mean": 3583.6, |
| "valid_targets_min": 1598 |
| }, |
| { |
| "epoch": 6.959033613445378, |
| "grad_norm": 0.7364736521570804, |
| "learning_rate": 4.3907199649151355e-09, |
| "loss": 0.198, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17404237389564514, |
| "step": 6625, |
| "valid_targets_mean": 2903.2, |
| "valid_targets_min": 1123 |
| }, |
| { |
| "epoch": 6.964285714285714, |
| "grad_norm": 0.8283192384968932, |
| "learning_rate": 3.361673802708687e-09, |
| "loss": 0.1845, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2022954821586609, |
| "step": 6630, |
| "valid_targets_mean": 3116.1, |
| "valid_targets_min": 1621 |
| }, |
| { |
| "epoch": 6.96953781512605, |
| "grad_norm": 0.853057291277257, |
| "learning_rate": 2.469819518080563e-09, |
| "loss": 0.1754, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.19089040160179138, |
| "step": 6635, |
| "valid_targets_mean": 3081.4, |
| "valid_targets_min": 1858 |
| }, |
| { |
| "epoch": 6.974789915966387, |
| "grad_norm": 0.6873113252451049, |
| "learning_rate": 1.7151632298140209e-09, |
| "loss": 0.1839, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15922731161117554, |
| "step": 6640, |
| "valid_targets_mean": 3470.7, |
| "valid_targets_min": 420 |
| }, |
| { |
| "epoch": 6.980042016806722, |
| "grad_norm": 0.754724576359931, |
| "learning_rate": 1.0977101154163727e-09, |
| "loss": 0.1916, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.19214347004890442, |
| "step": 6645, |
| "valid_targets_mean": 3584.2, |
| "valid_targets_min": 757 |
| }, |
| { |
| "epoch": 6.985294117647059, |
| "grad_norm": 0.8029047273305313, |
| "learning_rate": 6.174644110767958e-10, |
| "loss": 0.1899, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17756588757038116, |
| "step": 6650, |
| "valid_targets_mean": 2940.8, |
| "valid_targets_min": 732 |
| }, |
| { |
| "epoch": 6.990546218487395, |
| "grad_norm": 0.7749949104741897, |
| "learning_rate": 2.744294116419077e-10, |
| "loss": 0.1918, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18697890639305115, |
| "step": 6655, |
| "valid_targets_mean": 3248.2, |
| "valid_targets_min": 929 |
| }, |
| { |
| "epoch": 6.995798319327731, |
| "grad_norm": 0.7329373554307617, |
| "learning_rate": 6.860747058468064e-11, |
| "loss": 0.1959, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18864449858665466, |
| "step": 6660, |
| "valid_targets_mean": 3728.8, |
| "valid_targets_min": 1217 |
| }, |
| { |
| "epoch": 7.0, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2101745903491974, |
| "step": 6664, |
| "total_flos": 1189003618287616.0, |
| "train_loss": 0.21699104300674413, |
| "train_runtime": 24543.5183, |
| "train_samples_per_second": 4.344, |
| "train_steps_per_second": 0.272, |
| "valid_targets_mean": 3715.1, |
| "valid_targets_min": 791 |
| } |
| ], |
| "logging_steps": 5, |
| "max_steps": 6664, |
| "num_input_tokens_seen": 0, |
| "num_train_epochs": 7, |
| "save_steps": 200, |
| "stateful_callbacks": { |
| "TrainerControl": { |
| "args": { |
| "should_epoch_stop": false, |
| "should_evaluate": false, |
| "should_log": false, |
| "should_save": true, |
| "should_training_stop": true |
| }, |
| "attributes": {} |
| } |
| }, |
| "total_flos": 1189003618287616.0, |
| "train_batch_size": 1, |
| "trial_name": null, |
| "trial_params": null |
| } |
|
|