{ "best_global_step": null, "best_metric": null, "best_model_checkpoint": null, "epoch": 7.0, "eval_steps": 500, "global_step": 7140, "is_hyper_param_search": false, "is_local_process_zero": true, "is_world_process_zero": true, "log_history": [ { "epoch": 0.004901960784313725, "grad_norm": 10.20928865918908, "learning_rate": 2.2408963585434175e-07, "loss": 0.6185, "loss_nan_ranks": 0, "loss_rank_avg": 0.5775138139724731, "step": 5, "valid_targets_mean": 2510.1, "valid_targets_min": 783 }, { "epoch": 0.00980392156862745, "grad_norm": 9.23497201065913, "learning_rate": 5.042016806722689e-07, "loss": 0.5949, "loss_nan_ranks": 0, "loss_rank_avg": 0.573584794998169, "step": 10, "valid_targets_mean": 2837.1, "valid_targets_min": 700 }, { "epoch": 0.014705882352941176, "grad_norm": 11.158774276653146, "learning_rate": 7.843137254901962e-07, "loss": 0.644, "loss_nan_ranks": 0, "loss_rank_avg": 0.6744149327278137, "step": 15, "valid_targets_mean": 1654.6, "valid_targets_min": 516 }, { "epoch": 0.0196078431372549, "grad_norm": 9.567542813890764, "learning_rate": 1.0644257703081233e-06, "loss": 0.6143, "loss_nan_ranks": 0, "loss_rank_avg": 0.6221225261688232, "step": 20, "valid_targets_mean": 2297.6, "valid_targets_min": 998 }, { "epoch": 0.024509803921568627, "grad_norm": 10.35194264022352, "learning_rate": 1.3445378151260504e-06, "loss": 0.5931, "loss_nan_ranks": 0, "loss_rank_avg": 0.7201113700866699, "step": 25, "valid_targets_mean": 1942.3, "valid_targets_min": 719 }, { "epoch": 0.029411764705882353, "grad_norm": 6.019435455219015, "learning_rate": 1.6246498599439778e-06, "loss": 0.5995, "loss_nan_ranks": 0, "loss_rank_avg": 0.5141686201095581, "step": 30, "valid_targets_mean": 2379.7, "valid_targets_min": 608 }, { "epoch": 0.03431372549019608, "grad_norm": 5.347753558046135, "learning_rate": 1.904761904761905e-06, "loss": 0.5534, "loss_nan_ranks": 0, "loss_rank_avg": 0.5356568694114685, "step": 35, "valid_targets_mean": 2166.6, "valid_targets_min": 663 }, { "epoch": 0.0392156862745098, "grad_norm": 4.620742455700474, "learning_rate": 2.184873949579832e-06, "loss": 0.4874, "loss_nan_ranks": 0, "loss_rank_avg": 0.5212767124176025, "step": 40, "valid_targets_mean": 1865.9, "valid_targets_min": 524 }, { "epoch": 0.04411764705882353, "grad_norm": 3.4604614828952194, "learning_rate": 2.4649859943977594e-06, "loss": 0.4418, "loss_nan_ranks": 0, "loss_rank_avg": 0.4115924835205078, "step": 45, "valid_targets_mean": 2360.3, "valid_targets_min": 836 }, { "epoch": 0.049019607843137254, "grad_norm": 2.926821476599717, "learning_rate": 2.7450980392156867e-06, "loss": 0.426, "loss_nan_ranks": 0, "loss_rank_avg": 0.4429447650909424, "step": 50, "valid_targets_mean": 1996.1, "valid_targets_min": 968 }, { "epoch": 0.05392156862745098, "grad_norm": 1.9890421518892802, "learning_rate": 3.0252100840336137e-06, "loss": 0.4483, "loss_nan_ranks": 0, "loss_rank_avg": 0.4572969973087311, "step": 55, "valid_targets_mean": 1957.2, "valid_targets_min": 464 }, { "epoch": 0.058823529411764705, "grad_norm": 1.6865611538561944, "learning_rate": 3.305322128851541e-06, "loss": 0.3748, "loss_nan_ranks": 0, "loss_rank_avg": 0.39461690187454224, "step": 60, "valid_targets_mean": 1830.6, "valid_targets_min": 518 }, { "epoch": 0.06372549019607843, "grad_norm": 1.3527111817446995, "learning_rate": 3.585434173669468e-06, "loss": 0.3612, "loss_nan_ranks": 0, "loss_rank_avg": 0.4330475330352783, "step": 65, "valid_targets_mean": 1900.5, "valid_targets_min": 664 }, { "epoch": 0.06862745098039216, "grad_norm": 1.19163364826996, "learning_rate": 3.865546218487396e-06, "loss": 0.372, "loss_nan_ranks": 0, "loss_rank_avg": 0.3685574531555176, "step": 70, "valid_targets_mean": 1673.1, "valid_targets_min": 497 }, { "epoch": 0.07352941176470588, "grad_norm": 0.9397906346537187, "learning_rate": 4.145658263305323e-06, "loss": 0.3291, "loss_nan_ranks": 0, "loss_rank_avg": 0.3561197519302368, "step": 75, "valid_targets_mean": 2279.2, "valid_targets_min": 720 }, { "epoch": 0.0784313725490196, "grad_norm": 0.727700887008284, "learning_rate": 4.4257703081232496e-06, "loss": 0.3366, "loss_nan_ranks": 0, "loss_rank_avg": 0.2575701177120209, "step": 80, "valid_targets_mean": 2609.6, "valid_targets_min": 730 }, { "epoch": 0.08333333333333333, "grad_norm": 0.8886691451113053, "learning_rate": 4.705882352941177e-06, "loss": 0.2968, "loss_nan_ranks": 0, "loss_rank_avg": 0.29151153564453125, "step": 85, "valid_targets_mean": 1739.9, "valid_targets_min": 640 }, { "epoch": 0.08823529411764706, "grad_norm": 0.7084752420049867, "learning_rate": 4.985994397759104e-06, "loss": 0.3002, "loss_nan_ranks": 0, "loss_rank_avg": 0.2468690723180771, "step": 90, "valid_targets_mean": 2406.2, "valid_targets_min": 795 }, { "epoch": 0.09313725490196079, "grad_norm": 0.8183678064858451, "learning_rate": 5.266106442577032e-06, "loss": 0.3088, "loss_nan_ranks": 0, "loss_rank_avg": 0.2936941981315613, "step": 95, "valid_targets_mean": 2030.6, "valid_targets_min": 609 }, { "epoch": 0.09803921568627451, "grad_norm": 0.8376415918043708, "learning_rate": 5.546218487394959e-06, "loss": 0.2971, "loss_nan_ranks": 0, "loss_rank_avg": 0.3431953489780426, "step": 100, "valid_targets_mean": 2092.2, "valid_targets_min": 794 }, { "epoch": 0.10294117647058823, "grad_norm": 0.6813076714555519, "learning_rate": 5.826330532212886e-06, "loss": 0.2635, "loss_nan_ranks": 0, "loss_rank_avg": 0.2565889358520508, "step": 105, "valid_targets_mean": 2320.1, "valid_targets_min": 567 }, { "epoch": 0.10784313725490197, "grad_norm": 0.7381189363611336, "learning_rate": 6.106442577030814e-06, "loss": 0.2656, "loss_nan_ranks": 0, "loss_rank_avg": 0.2865998148918152, "step": 110, "valid_targets_mean": 2249.0, "valid_targets_min": 1219 }, { "epoch": 0.11274509803921569, "grad_norm": 0.6544891537578502, "learning_rate": 6.386554621848739e-06, "loss": 0.3004, "loss_nan_ranks": 0, "loss_rank_avg": 0.23120339214801788, "step": 115, "valid_targets_mean": 2653.5, "valid_targets_min": 337 }, { "epoch": 0.11764705882352941, "grad_norm": 0.7137286431407412, "learning_rate": 6.666666666666667e-06, "loss": 0.2751, "loss_nan_ranks": 0, "loss_rank_avg": 0.28938379883766174, "step": 120, "valid_targets_mean": 2329.7, "valid_targets_min": 540 }, { "epoch": 0.12254901960784313, "grad_norm": 0.7257208667414642, "learning_rate": 6.946778711484594e-06, "loss": 0.2771, "loss_nan_ranks": 0, "loss_rank_avg": 0.2607773244380951, "step": 125, "valid_targets_mean": 2316.9, "valid_targets_min": 619 }, { "epoch": 0.12745098039215685, "grad_norm": 0.7230258011962319, "learning_rate": 7.226890756302521e-06, "loss": 0.2603, "loss_nan_ranks": 0, "loss_rank_avg": 0.21410706639289856, "step": 130, "valid_targets_mean": 2270.0, "valid_targets_min": 665 }, { "epoch": 0.1323529411764706, "grad_norm": 0.5759410981582812, "learning_rate": 7.507002801120449e-06, "loss": 0.2497, "loss_nan_ranks": 0, "loss_rank_avg": 0.20663133263587952, "step": 135, "valid_targets_mean": 3114.1, "valid_targets_min": 721 }, { "epoch": 0.13725490196078433, "grad_norm": 0.7572665669740622, "learning_rate": 7.787114845938376e-06, "loss": 0.26, "loss_nan_ranks": 0, "loss_rank_avg": 0.2611826956272125, "step": 140, "valid_targets_mean": 2193.1, "valid_targets_min": 722 }, { "epoch": 0.14215686274509803, "grad_norm": 0.7714401933508285, "learning_rate": 8.067226890756303e-06, "loss": 0.2457, "loss_nan_ranks": 0, "loss_rank_avg": 0.2228604406118393, "step": 145, "valid_targets_mean": 2312.3, "valid_targets_min": 615 }, { "epoch": 0.14705882352941177, "grad_norm": 0.7473849126557415, "learning_rate": 8.34733893557423e-06, "loss": 0.264, "loss_nan_ranks": 0, "loss_rank_avg": 0.26429224014282227, "step": 150, "valid_targets_mean": 2596.1, "valid_targets_min": 582 }, { "epoch": 0.15196078431372548, "grad_norm": 0.8790059261164762, "learning_rate": 8.627450980392157e-06, "loss": 0.2516, "loss_nan_ranks": 0, "loss_rank_avg": 0.2524535357952118, "step": 155, "valid_targets_mean": 1923.6, "valid_targets_min": 807 }, { "epoch": 0.1568627450980392, "grad_norm": 0.6881021835316934, "learning_rate": 8.907563025210085e-06, "loss": 0.2303, "loss_nan_ranks": 0, "loss_rank_avg": 0.22635899484157562, "step": 160, "valid_targets_mean": 1896.2, "valid_targets_min": 602 }, { "epoch": 0.16176470588235295, "grad_norm": 0.690388606612483, "learning_rate": 9.187675070028012e-06, "loss": 0.2504, "loss_nan_ranks": 0, "loss_rank_avg": 0.21718770265579224, "step": 165, "valid_targets_mean": 1991.8, "valid_targets_min": 633 }, { "epoch": 0.16666666666666666, "grad_norm": 0.8425889137005795, "learning_rate": 9.467787114845938e-06, "loss": 0.2414, "loss_nan_ranks": 0, "loss_rank_avg": 0.23774409294128418, "step": 170, "valid_targets_mean": 1627.6, "valid_targets_min": 468 }, { "epoch": 0.1715686274509804, "grad_norm": 0.7091511823027294, "learning_rate": 9.747899159663867e-06, "loss": 0.2156, "loss_nan_ranks": 0, "loss_rank_avg": 0.1945105493068695, "step": 175, "valid_targets_mean": 2712.4, "valid_targets_min": 815 }, { "epoch": 0.17647058823529413, "grad_norm": 0.7962789255731376, "learning_rate": 1.0028011204481793e-05, "loss": 0.237, "loss_nan_ranks": 0, "loss_rank_avg": 0.30094513297080994, "step": 180, "valid_targets_mean": 1933.2, "valid_targets_min": 613 }, { "epoch": 0.18137254901960784, "grad_norm": 0.8709581990029245, "learning_rate": 1.030812324929972e-05, "loss": 0.2629, "loss_nan_ranks": 0, "loss_rank_avg": 0.24878257513046265, "step": 185, "valid_targets_mean": 2173.3, "valid_targets_min": 524 }, { "epoch": 0.18627450980392157, "grad_norm": 0.672591990213361, "learning_rate": 1.0588235294117648e-05, "loss": 0.2283, "loss_nan_ranks": 0, "loss_rank_avg": 0.21655958890914917, "step": 190, "valid_targets_mean": 2481.3, "valid_targets_min": 640 }, { "epoch": 0.19117647058823528, "grad_norm": 0.5077039092070841, "learning_rate": 1.0868347338935574e-05, "loss": 0.213, "loss_nan_ranks": 0, "loss_rank_avg": 0.18501999974250793, "step": 195, "valid_targets_mean": 3169.5, "valid_targets_min": 754 }, { "epoch": 0.19607843137254902, "grad_norm": 0.6393343276686302, "learning_rate": 1.1148459383753503e-05, "loss": 0.2507, "loss_nan_ranks": 0, "loss_rank_avg": 0.20450522005558014, "step": 200, "valid_targets_mean": 2330.5, "valid_targets_min": 752 }, { "epoch": 0.20098039215686275, "grad_norm": 0.7377664172401819, "learning_rate": 1.1428571428571429e-05, "loss": 0.2432, "loss_nan_ranks": 0, "loss_rank_avg": 0.24033306539058685, "step": 205, "valid_targets_mean": 2058.1, "valid_targets_min": 821 }, { "epoch": 0.20588235294117646, "grad_norm": 0.7084884926960634, "learning_rate": 1.1708683473389357e-05, "loss": 0.2375, "loss_nan_ranks": 0, "loss_rank_avg": 0.23557499051094055, "step": 210, "valid_targets_mean": 2050.4, "valid_targets_min": 720 }, { "epoch": 0.2107843137254902, "grad_norm": 1.0188002373707512, "learning_rate": 1.1988795518207284e-05, "loss": 0.2432, "loss_nan_ranks": 0, "loss_rank_avg": 0.29192501306533813, "step": 215, "valid_targets_mean": 1503.8, "valid_targets_min": 711 }, { "epoch": 0.21568627450980393, "grad_norm": 0.6626325047822198, "learning_rate": 1.2268907563025212e-05, "loss": 0.2158, "loss_nan_ranks": 0, "loss_rank_avg": 0.20884019136428833, "step": 220, "valid_targets_mean": 2474.2, "valid_targets_min": 699 }, { "epoch": 0.22058823529411764, "grad_norm": 0.6367170883319628, "learning_rate": 1.2549019607843138e-05, "loss": 0.2521, "loss_nan_ranks": 0, "loss_rank_avg": 0.2049025297164917, "step": 225, "valid_targets_mean": 2471.3, "valid_targets_min": 761 }, { "epoch": 0.22549019607843138, "grad_norm": 0.7420048828864545, "learning_rate": 1.2829131652661067e-05, "loss": 0.2128, "loss_nan_ranks": 0, "loss_rank_avg": 0.2391299456357956, "step": 230, "valid_targets_mean": 2442.0, "valid_targets_min": 634 }, { "epoch": 0.23039215686274508, "grad_norm": 0.9380517123817401, "learning_rate": 1.3109243697478993e-05, "loss": 0.2315, "loss_nan_ranks": 0, "loss_rank_avg": 0.2618740200996399, "step": 235, "valid_targets_mean": 1533.4, "valid_targets_min": 682 }, { "epoch": 0.23529411764705882, "grad_norm": 0.6743370799947248, "learning_rate": 1.338935574229692e-05, "loss": 0.2154, "loss_nan_ranks": 0, "loss_rank_avg": 0.2558346390724182, "step": 240, "valid_targets_mean": 2312.7, "valid_targets_min": 530 }, { "epoch": 0.24019607843137256, "grad_norm": 0.6221079049005317, "learning_rate": 1.3669467787114848e-05, "loss": 0.2151, "loss_nan_ranks": 0, "loss_rank_avg": 0.18583598732948303, "step": 245, "valid_targets_mean": 2520.4, "valid_targets_min": 746 }, { "epoch": 0.24509803921568626, "grad_norm": 0.8012148275172146, "learning_rate": 1.3949579831932774e-05, "loss": 0.2112, "loss_nan_ranks": 0, "loss_rank_avg": 0.22044017910957336, "step": 250, "valid_targets_mean": 2009.4, "valid_targets_min": 820 }, { "epoch": 0.25, "grad_norm": 0.6180778632070758, "learning_rate": 1.4229691876750703e-05, "loss": 0.1938, "loss_nan_ranks": 0, "loss_rank_avg": 0.18992581963539124, "step": 255, "valid_targets_mean": 2631.8, "valid_targets_min": 856 }, { "epoch": 0.2549019607843137, "grad_norm": 0.8993994771670876, "learning_rate": 1.4509803921568629e-05, "loss": 0.2093, "loss_nan_ranks": 0, "loss_rank_avg": 0.21689380705356598, "step": 260, "valid_targets_mean": 1633.8, "valid_targets_min": 324 }, { "epoch": 0.25980392156862747, "grad_norm": 0.8889748801968507, "learning_rate": 1.4789915966386557e-05, "loss": 0.2005, "loss_nan_ranks": 0, "loss_rank_avg": 0.2001081109046936, "step": 265, "valid_targets_mean": 2276.2, "valid_targets_min": 776 }, { "epoch": 0.2647058823529412, "grad_norm": 0.8677882826227222, "learning_rate": 1.5070028011204482e-05, "loss": 0.1971, "loss_nan_ranks": 0, "loss_rank_avg": 0.19296003878116608, "step": 270, "valid_targets_mean": 2239.6, "valid_targets_min": 820 }, { "epoch": 0.2696078431372549, "grad_norm": 0.786172042943967, "learning_rate": 1.535014005602241e-05, "loss": 0.2033, "loss_nan_ranks": 0, "loss_rank_avg": 0.20809459686279297, "step": 275, "valid_targets_mean": 1825.3, "valid_targets_min": 701 }, { "epoch": 0.27450980392156865, "grad_norm": 0.6695572664647559, "learning_rate": 1.5630252100840337e-05, "loss": 0.2001, "loss_nan_ranks": 0, "loss_rank_avg": 0.18365135788917542, "step": 280, "valid_targets_mean": 2497.1, "valid_targets_min": 681 }, { "epoch": 0.27941176470588236, "grad_norm": 0.8627662588551201, "learning_rate": 1.5910364145658263e-05, "loss": 0.2118, "loss_nan_ranks": 0, "loss_rank_avg": 0.22431831061840057, "step": 285, "valid_targets_mean": 2399.4, "valid_targets_min": 1180 }, { "epoch": 0.28431372549019607, "grad_norm": 0.8410412603652976, "learning_rate": 1.6190476190476193e-05, "loss": 0.2094, "loss_nan_ranks": 0, "loss_rank_avg": 0.20205965638160706, "step": 290, "valid_targets_mean": 1758.8, "valid_targets_min": 614 }, { "epoch": 0.28921568627450983, "grad_norm": 0.749243931310914, "learning_rate": 1.647058823529412e-05, "loss": 0.2169, "loss_nan_ranks": 0, "loss_rank_avg": 0.20068684220314026, "step": 295, "valid_targets_mean": 1806.8, "valid_targets_min": 589 }, { "epoch": 0.29411764705882354, "grad_norm": 1.1731365321469984, "learning_rate": 1.6750700280112046e-05, "loss": 0.2401, "loss_nan_ranks": 0, "loss_rank_avg": 0.3024446964263916, "step": 300, "valid_targets_mean": 1756.7, "valid_targets_min": 458 }, { "epoch": 0.29901960784313725, "grad_norm": 0.5547867627065093, "learning_rate": 1.7030812324929973e-05, "loss": 0.2019, "loss_nan_ranks": 0, "loss_rank_avg": 0.1652289479970932, "step": 305, "valid_targets_mean": 2662.3, "valid_targets_min": 700 }, { "epoch": 0.30392156862745096, "grad_norm": 0.6045886405973347, "learning_rate": 1.7310924369747902e-05, "loss": 0.1927, "loss_nan_ranks": 0, "loss_rank_avg": 0.14137142896652222, "step": 310, "valid_targets_mean": 3014.4, "valid_targets_min": 952 }, { "epoch": 0.3088235294117647, "grad_norm": 0.6337281237898196, "learning_rate": 1.759103641456583e-05, "loss": 0.1976, "loss_nan_ranks": 0, "loss_rank_avg": 0.1614706665277481, "step": 315, "valid_targets_mean": 2457.1, "valid_targets_min": 757 }, { "epoch": 0.3137254901960784, "grad_norm": 0.7994521931285774, "learning_rate": 1.7871148459383755e-05, "loss": 0.2204, "loss_nan_ranks": 0, "loss_rank_avg": 0.29927748441696167, "step": 320, "valid_targets_mean": 2256.4, "valid_targets_min": 858 }, { "epoch": 0.31862745098039214, "grad_norm": 0.6877920338669534, "learning_rate": 1.8151260504201682e-05, "loss": 0.2215, "loss_nan_ranks": 0, "loss_rank_avg": 0.18461309373378754, "step": 325, "valid_targets_mean": 2309.9, "valid_targets_min": 357 }, { "epoch": 0.3235294117647059, "grad_norm": 0.8324024546914552, "learning_rate": 1.843137254901961e-05, "loss": 0.1982, "loss_nan_ranks": 0, "loss_rank_avg": 0.19263777136802673, "step": 330, "valid_targets_mean": 1769.6, "valid_targets_min": 569 }, { "epoch": 0.3284313725490196, "grad_norm": 0.9991213846200081, "learning_rate": 1.8711484593837535e-05, "loss": 0.2142, "loss_nan_ranks": 0, "loss_rank_avg": 0.2420213520526886, "step": 335, "valid_targets_mean": 1401.4, "valid_targets_min": 801 }, { "epoch": 0.3333333333333333, "grad_norm": 0.6238168794305411, "learning_rate": 1.899159663865546e-05, "loss": 0.2151, "loss_nan_ranks": 0, "loss_rank_avg": 0.17140337824821472, "step": 340, "valid_targets_mean": 2009.0, "valid_targets_min": 580 }, { "epoch": 0.3382352941176471, "grad_norm": 0.6728967307166305, "learning_rate": 1.927170868347339e-05, "loss": 0.1932, "loss_nan_ranks": 0, "loss_rank_avg": 0.19629782438278198, "step": 345, "valid_targets_mean": 2363.2, "valid_targets_min": 610 }, { "epoch": 0.3431372549019608, "grad_norm": 0.6374538764985028, "learning_rate": 1.9551820728291318e-05, "loss": 0.1994, "loss_nan_ranks": 0, "loss_rank_avg": 0.1695806384086609, "step": 350, "valid_targets_mean": 2499.8, "valid_targets_min": 781 }, { "epoch": 0.3480392156862745, "grad_norm": 0.7086989901290757, "learning_rate": 1.9831932773109244e-05, "loss": 0.1895, "loss_nan_ranks": 0, "loss_rank_avg": 0.22146835923194885, "step": 355, "valid_targets_mean": 2031.7, "valid_targets_min": 779 }, { "epoch": 0.35294117647058826, "grad_norm": 0.8759913313729994, "learning_rate": 2.011204481792717e-05, "loss": 0.2152, "loss_nan_ranks": 0, "loss_rank_avg": 0.2633894681930542, "step": 360, "valid_targets_mean": 2092.2, "valid_targets_min": 815 }, { "epoch": 0.35784313725490197, "grad_norm": 0.5654576745582779, "learning_rate": 2.0392156862745097e-05, "loss": 0.1925, "loss_nan_ranks": 0, "loss_rank_avg": 0.15165485441684723, "step": 365, "valid_targets_mean": 2529.6, "valid_targets_min": 551 }, { "epoch": 0.3627450980392157, "grad_norm": 0.6916207113885678, "learning_rate": 2.0672268907563027e-05, "loss": 0.2389, "loss_nan_ranks": 0, "loss_rank_avg": 0.19615793228149414, "step": 370, "valid_targets_mean": 2093.1, "valid_targets_min": 734 }, { "epoch": 0.36764705882352944, "grad_norm": 0.8691395575013329, "learning_rate": 2.0952380952380954e-05, "loss": 0.1845, "loss_nan_ranks": 0, "loss_rank_avg": 0.2099282443523407, "step": 375, "valid_targets_mean": 2353.9, "valid_targets_min": 816 }, { "epoch": 0.37254901960784315, "grad_norm": 0.5336835398911135, "learning_rate": 2.123249299719888e-05, "loss": 0.1775, "loss_nan_ranks": 0, "loss_rank_avg": 0.15454989671707153, "step": 380, "valid_targets_mean": 2968.2, "valid_targets_min": 720 }, { "epoch": 0.37745098039215685, "grad_norm": 0.6264965338350452, "learning_rate": 2.1512605042016807e-05, "loss": 0.196, "loss_nan_ranks": 0, "loss_rank_avg": 0.19402390718460083, "step": 385, "valid_targets_mean": 2708.5, "valid_targets_min": 1008 }, { "epoch": 0.38235294117647056, "grad_norm": 0.6054769755806432, "learning_rate": 2.1792717086834733e-05, "loss": 0.1782, "loss_nan_ranks": 0, "loss_rank_avg": 0.16077178716659546, "step": 390, "valid_targets_mean": 2332.9, "valid_targets_min": 722 }, { "epoch": 0.3872549019607843, "grad_norm": 0.6871014526711019, "learning_rate": 2.2072829131652663e-05, "loss": 0.2083, "loss_nan_ranks": 0, "loss_rank_avg": 0.19740639626979828, "step": 395, "valid_targets_mean": 2283.4, "valid_targets_min": 678 }, { "epoch": 0.39215686274509803, "grad_norm": 0.6946444755001282, "learning_rate": 2.235294117647059e-05, "loss": 0.1962, "loss_nan_ranks": 0, "loss_rank_avg": 0.177214115858078, "step": 400, "valid_targets_mean": 2111.4, "valid_targets_min": 724 }, { "epoch": 0.39705882352941174, "grad_norm": 0.7039019894945975, "learning_rate": 2.2633053221288516e-05, "loss": 0.1985, "loss_nan_ranks": 0, "loss_rank_avg": 0.19564135372638702, "step": 405, "valid_targets_mean": 2236.6, "valid_targets_min": 627 }, { "epoch": 0.4019607843137255, "grad_norm": 0.7862930643002248, "learning_rate": 2.2913165266106443e-05, "loss": 0.1785, "loss_nan_ranks": 0, "loss_rank_avg": 0.17840075492858887, "step": 410, "valid_targets_mean": 1734.5, "valid_targets_min": 727 }, { "epoch": 0.4068627450980392, "grad_norm": 0.6757610019636033, "learning_rate": 2.3193277310924373e-05, "loss": 0.1725, "loss_nan_ranks": 0, "loss_rank_avg": 0.145016148686409, "step": 415, "valid_targets_mean": 1852.9, "valid_targets_min": 814 }, { "epoch": 0.4117647058823529, "grad_norm": 0.5408656516456666, "learning_rate": 2.34733893557423e-05, "loss": 0.1746, "loss_nan_ranks": 0, "loss_rank_avg": 0.1631423830986023, "step": 420, "valid_targets_mean": 3106.1, "valid_targets_min": 1037 }, { "epoch": 0.4166666666666667, "grad_norm": 0.5558016162889798, "learning_rate": 2.3753501400560226e-05, "loss": 0.1949, "loss_nan_ranks": 0, "loss_rank_avg": 0.1663081794977188, "step": 425, "valid_targets_mean": 2749.5, "valid_targets_min": 457 }, { "epoch": 0.4215686274509804, "grad_norm": 0.5880655917189165, "learning_rate": 2.4033613445378152e-05, "loss": 0.1873, "loss_nan_ranks": 0, "loss_rank_avg": 0.16312886774539948, "step": 430, "valid_targets_mean": 2623.3, "valid_targets_min": 745 }, { "epoch": 0.4264705882352941, "grad_norm": 0.7344574592722877, "learning_rate": 2.431372549019608e-05, "loss": 0.2279, "loss_nan_ranks": 0, "loss_rank_avg": 0.2649971544742584, "step": 435, "valid_targets_mean": 2264.2, "valid_targets_min": 694 }, { "epoch": 0.43137254901960786, "grad_norm": 0.6302873204915442, "learning_rate": 2.459383753501401e-05, "loss": 0.1704, "loss_nan_ranks": 0, "loss_rank_avg": 0.1764337718486786, "step": 440, "valid_targets_mean": 2357.9, "valid_targets_min": 747 }, { "epoch": 0.4362745098039216, "grad_norm": 0.7622364081121474, "learning_rate": 2.4873949579831935e-05, "loss": 0.198, "loss_nan_ranks": 0, "loss_rank_avg": 0.1960497498512268, "step": 445, "valid_targets_mean": 1879.4, "valid_targets_min": 620 }, { "epoch": 0.4411764705882353, "grad_norm": 0.7533017366222997, "learning_rate": 2.515406162464986e-05, "loss": 0.1812, "loss_nan_ranks": 0, "loss_rank_avg": 0.2160189002752304, "step": 450, "valid_targets_mean": 1974.1, "valid_targets_min": 657 }, { "epoch": 0.44607843137254904, "grad_norm": 0.634266879787467, "learning_rate": 2.5434173669467788e-05, "loss": 0.18, "loss_nan_ranks": 0, "loss_rank_avg": 0.2114112675189972, "step": 455, "valid_targets_mean": 2598.1, "valid_targets_min": 713 }, { "epoch": 0.45098039215686275, "grad_norm": 0.6398501184472496, "learning_rate": 2.5714285714285718e-05, "loss": 0.1651, "loss_nan_ranks": 0, "loss_rank_avg": 0.14820167422294617, "step": 460, "valid_targets_mean": 2284.9, "valid_targets_min": 722 }, { "epoch": 0.45588235294117646, "grad_norm": 0.6685908833242333, "learning_rate": 2.5994397759103644e-05, "loss": 0.1851, "loss_nan_ranks": 0, "loss_rank_avg": 0.17728768289089203, "step": 465, "valid_targets_mean": 2262.2, "valid_targets_min": 563 }, { "epoch": 0.46078431372549017, "grad_norm": 0.5843431974090029, "learning_rate": 2.627450980392157e-05, "loss": 0.1904, "loss_nan_ranks": 0, "loss_rank_avg": 0.181320920586586, "step": 470, "valid_targets_mean": 2510.9, "valid_targets_min": 775 }, { "epoch": 0.46568627450980393, "grad_norm": 0.4774970152103178, "learning_rate": 2.6554621848739497e-05, "loss": 0.1706, "loss_nan_ranks": 0, "loss_rank_avg": 0.12849435210227966, "step": 475, "valid_targets_mean": 3068.2, "valid_targets_min": 646 }, { "epoch": 0.47058823529411764, "grad_norm": 0.5934817185344419, "learning_rate": 2.6834733893557424e-05, "loss": 0.1807, "loss_nan_ranks": 0, "loss_rank_avg": 0.1902085244655609, "step": 480, "valid_targets_mean": 2842.9, "valid_targets_min": 961 }, { "epoch": 0.47549019607843135, "grad_norm": 0.8021530951461361, "learning_rate": 2.7114845938375354e-05, "loss": 0.1932, "loss_nan_ranks": 0, "loss_rank_avg": 0.22121350467205048, "step": 485, "valid_targets_mean": 1811.6, "valid_targets_min": 568 }, { "epoch": 0.4803921568627451, "grad_norm": 0.7090056473413902, "learning_rate": 2.739495798319328e-05, "loss": 0.1885, "loss_nan_ranks": 0, "loss_rank_avg": 0.20266397297382355, "step": 490, "valid_targets_mean": 2183.2, "valid_targets_min": 704 }, { "epoch": 0.4852941176470588, "grad_norm": 0.5565085839690194, "learning_rate": 2.7675070028011207e-05, "loss": 0.1893, "loss_nan_ranks": 0, "loss_rank_avg": 0.16087017953395844, "step": 495, "valid_targets_mean": 2603.2, "valid_targets_min": 675 }, { "epoch": 0.49019607843137253, "grad_norm": 0.716565785096359, "learning_rate": 2.7955182072829133e-05, "loss": 0.1912, "loss_nan_ranks": 0, "loss_rank_avg": 0.2089020311832428, "step": 500, "valid_targets_mean": 2193.8, "valid_targets_min": 502 }, { "epoch": 0.4950980392156863, "grad_norm": 0.6524679837642853, "learning_rate": 2.8235294117647063e-05, "loss": 0.1897, "loss_nan_ranks": 0, "loss_rank_avg": 0.19976428151130676, "step": 505, "valid_targets_mean": 2135.9, "valid_targets_min": 824 }, { "epoch": 0.5, "grad_norm": 0.5937060048137175, "learning_rate": 2.851540616246499e-05, "loss": 0.1961, "loss_nan_ranks": 0, "loss_rank_avg": 0.1664942055940628, "step": 510, "valid_targets_mean": 2461.0, "valid_targets_min": 559 }, { "epoch": 0.5049019607843137, "grad_norm": 0.7057958054146954, "learning_rate": 2.8795518207282916e-05, "loss": 0.2083, "loss_nan_ranks": 0, "loss_rank_avg": 0.19686059653759003, "step": 515, "valid_targets_mean": 2053.7, "valid_targets_min": 647 }, { "epoch": 0.5098039215686274, "grad_norm": 0.8351575004625197, "learning_rate": 2.9075630252100843e-05, "loss": 0.1949, "loss_nan_ranks": 0, "loss_rank_avg": 0.2226218283176422, "step": 520, "valid_targets_mean": 1817.9, "valid_targets_min": 518 }, { "epoch": 0.5147058823529411, "grad_norm": 0.9431458056923483, "learning_rate": 2.935574229691877e-05, "loss": 0.1727, "loss_nan_ranks": 0, "loss_rank_avg": 0.17681443691253662, "step": 525, "valid_targets_mean": 2532.9, "valid_targets_min": 793 }, { "epoch": 0.5196078431372549, "grad_norm": 0.6557987732231455, "learning_rate": 2.96358543417367e-05, "loss": 0.1787, "loss_nan_ranks": 0, "loss_rank_avg": 0.1878250688314438, "step": 530, "valid_targets_mean": 2121.4, "valid_targets_min": 848 }, { "epoch": 0.5245098039215687, "grad_norm": 0.6775473688447424, "learning_rate": 2.9915966386554626e-05, "loss": 0.1879, "loss_nan_ranks": 0, "loss_rank_avg": 0.19594591856002808, "step": 535, "valid_targets_mean": 2717.2, "valid_targets_min": 734 }, { "epoch": 0.5294117647058824, "grad_norm": 0.7493448799041711, "learning_rate": 3.0196078431372552e-05, "loss": 0.1726, "loss_nan_ranks": 0, "loss_rank_avg": 0.17323686182498932, "step": 540, "valid_targets_mean": 2848.9, "valid_targets_min": 737 }, { "epoch": 0.5343137254901961, "grad_norm": 0.6055245402355067, "learning_rate": 3.047619047619048e-05, "loss": 0.1914, "loss_nan_ranks": 0, "loss_rank_avg": 0.18262027204036713, "step": 545, "valid_targets_mean": 2384.7, "valid_targets_min": 803 }, { "epoch": 0.5392156862745098, "grad_norm": 0.9951931981576938, "learning_rate": 3.075630252100841e-05, "loss": 0.2105, "loss_nan_ranks": 0, "loss_rank_avg": 0.19094133377075195, "step": 550, "valid_targets_mean": 1880.9, "valid_targets_min": 536 }, { "epoch": 0.5441176470588235, "grad_norm": 0.5361891619372162, "learning_rate": 3.1036414565826335e-05, "loss": 0.1902, "loss_nan_ranks": 0, "loss_rank_avg": 0.18571898341178894, "step": 555, "valid_targets_mean": 2702.5, "valid_targets_min": 917 }, { "epoch": 0.5490196078431373, "grad_norm": 0.7382597364245482, "learning_rate": 3.131652661064426e-05, "loss": 0.1831, "loss_nan_ranks": 0, "loss_rank_avg": 0.20009863376617432, "step": 560, "valid_targets_mean": 1987.9, "valid_targets_min": 658 }, { "epoch": 0.553921568627451, "grad_norm": 0.49271312001793305, "learning_rate": 3.159663865546219e-05, "loss": 0.1723, "loss_nan_ranks": 0, "loss_rank_avg": 0.13765659928321838, "step": 565, "valid_targets_mean": 2502.9, "valid_targets_min": 613 }, { "epoch": 0.5588235294117647, "grad_norm": 0.6602153309510624, "learning_rate": 3.1876750700280114e-05, "loss": 0.1843, "loss_nan_ranks": 0, "loss_rank_avg": 0.17571693658828735, "step": 570, "valid_targets_mean": 1902.5, "valid_targets_min": 738 }, { "epoch": 0.5637254901960784, "grad_norm": 0.5846536461117092, "learning_rate": 3.215686274509804e-05, "loss": 0.1798, "loss_nan_ranks": 0, "loss_rank_avg": 0.15587720274925232, "step": 575, "valid_targets_mean": 2710.6, "valid_targets_min": 826 }, { "epoch": 0.5686274509803921, "grad_norm": 0.614800842745419, "learning_rate": 3.243697478991597e-05, "loss": 0.1917, "loss_nan_ranks": 0, "loss_rank_avg": 0.20170342922210693, "step": 580, "valid_targets_mean": 2353.9, "valid_targets_min": 635 }, { "epoch": 0.5735294117647058, "grad_norm": 0.7805665554727105, "learning_rate": 3.2717086834733894e-05, "loss": 0.189, "loss_nan_ranks": 0, "loss_rank_avg": 0.21049509942531586, "step": 585, "valid_targets_mean": 1816.6, "valid_targets_min": 621 }, { "epoch": 0.5784313725490197, "grad_norm": 0.7649845650415136, "learning_rate": 3.299719887955182e-05, "loss": 0.1875, "loss_nan_ranks": 0, "loss_rank_avg": 0.2008473128080368, "step": 590, "valid_targets_mean": 1650.5, "valid_targets_min": 697 }, { "epoch": 0.5833333333333334, "grad_norm": 0.6457466336174561, "learning_rate": 3.3277310924369754e-05, "loss": 0.1805, "loss_nan_ranks": 0, "loss_rank_avg": 0.17701813578605652, "step": 595, "valid_targets_mean": 1995.9, "valid_targets_min": 731 }, { "epoch": 0.5882352941176471, "grad_norm": 0.5562439326577053, "learning_rate": 3.355742296918768e-05, "loss": 0.1843, "loss_nan_ranks": 0, "loss_rank_avg": 0.1580512523651123, "step": 600, "valid_targets_mean": 2415.7, "valid_targets_min": 593 }, { "epoch": 0.5931372549019608, "grad_norm": 0.56877429322566, "learning_rate": 3.383753501400561e-05, "loss": 0.1753, "loss_nan_ranks": 0, "loss_rank_avg": 0.1642981469631195, "step": 605, "valid_targets_mean": 2748.0, "valid_targets_min": 1005 }, { "epoch": 0.5980392156862745, "grad_norm": 0.548679259946226, "learning_rate": 3.411764705882353e-05, "loss": 0.1778, "loss_nan_ranks": 0, "loss_rank_avg": 0.17865321040153503, "step": 610, "valid_targets_mean": 2435.0, "valid_targets_min": 546 }, { "epoch": 0.6029411764705882, "grad_norm": 0.631089481529247, "learning_rate": 3.439775910364146e-05, "loss": 0.1835, "loss_nan_ranks": 0, "loss_rank_avg": 0.19993621110916138, "step": 615, "valid_targets_mean": 2594.4, "valid_targets_min": 677 }, { "epoch": 0.6078431372549019, "grad_norm": 0.5810814829277858, "learning_rate": 3.4677871148459386e-05, "loss": 0.1795, "loss_nan_ranks": 0, "loss_rank_avg": 0.1496606171131134, "step": 620, "valid_targets_mean": 2420.2, "valid_targets_min": 611 }, { "epoch": 0.6127450980392157, "grad_norm": 0.6657496107127471, "learning_rate": 3.495798319327731e-05, "loss": 0.1959, "loss_nan_ranks": 0, "loss_rank_avg": 0.1836290955543518, "step": 625, "valid_targets_mean": 2130.9, "valid_targets_min": 705 }, { "epoch": 0.6176470588235294, "grad_norm": 0.5600295328636472, "learning_rate": 3.523809523809524e-05, "loss": 0.1579, "loss_nan_ranks": 0, "loss_rank_avg": 0.14458300173282623, "step": 630, "valid_targets_mean": 2431.5, "valid_targets_min": 765 }, { "epoch": 0.6225490196078431, "grad_norm": 0.49976024934437707, "learning_rate": 3.5518207282913166e-05, "loss": 0.1814, "loss_nan_ranks": 0, "loss_rank_avg": 0.17662914097309113, "step": 635, "valid_targets_mean": 3142.9, "valid_targets_min": 848 }, { "epoch": 0.6274509803921569, "grad_norm": 0.6240957673215978, "learning_rate": 3.57983193277311e-05, "loss": 0.1766, "loss_nan_ranks": 0, "loss_rank_avg": 0.20896753668785095, "step": 640, "valid_targets_mean": 2600.9, "valid_targets_min": 1251 }, { "epoch": 0.6323529411764706, "grad_norm": 0.7125271464926058, "learning_rate": 3.6078431372549025e-05, "loss": 0.1722, "loss_nan_ranks": 0, "loss_rank_avg": 0.17587466537952423, "step": 645, "valid_targets_mean": 2187.2, "valid_targets_min": 625 }, { "epoch": 0.6372549019607843, "grad_norm": 0.681219377242786, "learning_rate": 3.635854341736695e-05, "loss": 0.1839, "loss_nan_ranks": 0, "loss_rank_avg": 0.1565675586462021, "step": 650, "valid_targets_mean": 1880.1, "valid_targets_min": 578 }, { "epoch": 0.6421568627450981, "grad_norm": 0.540781252427908, "learning_rate": 3.663865546218488e-05, "loss": 0.1924, "loss_nan_ranks": 0, "loss_rank_avg": 0.16999506950378418, "step": 655, "valid_targets_mean": 2553.5, "valid_targets_min": 631 }, { "epoch": 0.6470588235294118, "grad_norm": 0.5599693819997887, "learning_rate": 3.6918767507002805e-05, "loss": 0.1795, "loss_nan_ranks": 0, "loss_rank_avg": 0.16493026912212372, "step": 660, "valid_targets_mean": 2483.2, "valid_targets_min": 771 }, { "epoch": 0.6519607843137255, "grad_norm": 0.6013502015737507, "learning_rate": 3.719887955182073e-05, "loss": 0.1566, "loss_nan_ranks": 0, "loss_rank_avg": 0.13749179244041443, "step": 665, "valid_targets_mean": 2236.2, "valid_targets_min": 720 }, { "epoch": 0.6568627450980392, "grad_norm": 0.8440572077136491, "learning_rate": 3.747899159663866e-05, "loss": 0.1867, "loss_nan_ranks": 0, "loss_rank_avg": 0.20680469274520874, "step": 670, "valid_targets_mean": 1549.4, "valid_targets_min": 645 }, { "epoch": 0.6617647058823529, "grad_norm": 0.49979150890191865, "learning_rate": 3.7759103641456584e-05, "loss": 0.1651, "loss_nan_ranks": 0, "loss_rank_avg": 0.1284269243478775, "step": 675, "valid_targets_mean": 2789.7, "valid_targets_min": 920 }, { "epoch": 0.6666666666666666, "grad_norm": 0.5527405271398915, "learning_rate": 3.803921568627451e-05, "loss": 0.1717, "loss_nan_ranks": 0, "loss_rank_avg": 0.16107848286628723, "step": 680, "valid_targets_mean": 2213.6, "valid_targets_min": 727 }, { "epoch": 0.6715686274509803, "grad_norm": 0.45853328959246625, "learning_rate": 3.8319327731092444e-05, "loss": 0.1474, "loss_nan_ranks": 0, "loss_rank_avg": 0.14330020546913147, "step": 685, "valid_targets_mean": 2835.4, "valid_targets_min": 700 }, { "epoch": 0.6764705882352942, "grad_norm": 0.6033883535487085, "learning_rate": 3.859943977591037e-05, "loss": 0.1871, "loss_nan_ranks": 0, "loss_rank_avg": 0.170333594083786, "step": 690, "valid_targets_mean": 2644.1, "valid_targets_min": 804 }, { "epoch": 0.6813725490196079, "grad_norm": 0.48758852132532277, "learning_rate": 3.88795518207283e-05, "loss": 0.1645, "loss_nan_ranks": 0, "loss_rank_avg": 0.12590698897838593, "step": 695, "valid_targets_mean": 3071.6, "valid_targets_min": 545 }, { "epoch": 0.6862745098039216, "grad_norm": 0.605661287906157, "learning_rate": 3.915966386554622e-05, "loss": 0.1915, "loss_nan_ranks": 0, "loss_rank_avg": 0.17962878942489624, "step": 700, "valid_targets_mean": 1955.1, "valid_targets_min": 652 }, { "epoch": 0.6911764705882353, "grad_norm": 0.5020242290872657, "learning_rate": 3.943977591036415e-05, "loss": 0.1733, "loss_nan_ranks": 0, "loss_rank_avg": 0.1520138829946518, "step": 705, "valid_targets_mean": 2484.9, "valid_targets_min": 824 }, { "epoch": 0.696078431372549, "grad_norm": 0.6111840324281157, "learning_rate": 3.971988795518208e-05, "loss": 0.1591, "loss_nan_ranks": 0, "loss_rank_avg": 0.15317299962043762, "step": 710, "valid_targets_mean": 2317.1, "valid_targets_min": 834 }, { "epoch": 0.7009803921568627, "grad_norm": 0.5706697841930912, "learning_rate": 4e-05, "loss": 0.1783, "loss_nan_ranks": 0, "loss_rank_avg": 0.1541549265384674, "step": 715, "valid_targets_mean": 2519.8, "valid_targets_min": 549 }, { "epoch": 0.7058823529411765, "grad_norm": 0.6242837873790525, "learning_rate": 3.9999940247222794e-05, "loss": 0.1756, "loss_nan_ranks": 0, "loss_rank_avg": 0.17146050930023193, "step": 720, "valid_targets_mean": 2097.7, "valid_targets_min": 648 }, { "epoch": 0.7107843137254902, "grad_norm": 0.6320865522891047, "learning_rate": 3.99997609892482e-05, "loss": 0.1757, "loss_nan_ranks": 0, "loss_rank_avg": 0.16714760661125183, "step": 725, "valid_targets_mean": 2100.1, "valid_targets_min": 567 }, { "epoch": 0.7156862745098039, "grad_norm": 0.6259492059085117, "learning_rate": 3.9999462227147346e-05, "loss": 0.1609, "loss_nan_ranks": 0, "loss_rank_avg": 0.1846911460161209, "step": 730, "valid_targets_mean": 2340.9, "valid_targets_min": 717 }, { "epoch": 0.7205882352941176, "grad_norm": 0.5649591929759424, "learning_rate": 3.999904396270541e-05, "loss": 0.1444, "loss_nan_ranks": 0, "loss_rank_avg": 0.14328107237815857, "step": 735, "valid_targets_mean": 1948.3, "valid_targets_min": 623 }, { "epoch": 0.7254901960784313, "grad_norm": 0.5989473820452854, "learning_rate": 3.999850619842165e-05, "loss": 0.1785, "loss_nan_ranks": 0, "loss_rank_avg": 0.19438403844833374, "step": 740, "valid_targets_mean": 2225.5, "valid_targets_min": 898 }, { "epoch": 0.7303921568627451, "grad_norm": 0.5877131427477353, "learning_rate": 3.9997848937509344e-05, "loss": 0.1702, "loss_nan_ranks": 0, "loss_rank_avg": 0.17539003491401672, "step": 745, "valid_targets_mean": 2403.7, "valid_targets_min": 610 }, { "epoch": 0.7352941176470589, "grad_norm": 0.6133368132701967, "learning_rate": 3.9997072183895813e-05, "loss": 0.1873, "loss_nan_ranks": 0, "loss_rank_avg": 0.17177073657512665, "step": 750, "valid_targets_mean": 2129.9, "valid_targets_min": 605 }, { "epoch": 0.7401960784313726, "grad_norm": 0.6243605903426748, "learning_rate": 3.999617594222238e-05, "loss": 0.1639, "loss_nan_ranks": 0, "loss_rank_avg": 0.20242561399936676, "step": 755, "valid_targets_mean": 1891.8, "valid_targets_min": 746 }, { "epoch": 0.7450980392156863, "grad_norm": 0.5781945029504527, "learning_rate": 3.999516021784433e-05, "loss": 0.2009, "loss_nan_ranks": 0, "loss_rank_avg": 0.2293742150068283, "step": 760, "valid_targets_mean": 2518.5, "valid_targets_min": 849 }, { "epoch": 0.75, "grad_norm": 0.5246759562973626, "learning_rate": 3.999402501683091e-05, "loss": 0.1678, "loss_nan_ranks": 0, "loss_rank_avg": 0.1456177830696106, "step": 765, "valid_targets_mean": 2379.1, "valid_targets_min": 716 }, { "epoch": 0.7549019607843137, "grad_norm": 1.3105893523432963, "learning_rate": 3.9992770345965246e-05, "loss": 0.1574, "loss_nan_ranks": 0, "loss_rank_avg": 0.16315758228302002, "step": 770, "valid_targets_mean": 2101.8, "valid_targets_min": 726 }, { "epoch": 0.7598039215686274, "grad_norm": 0.48875268576869824, "learning_rate": 3.999139621274435e-05, "loss": 0.1653, "loss_nan_ranks": 0, "loss_rank_avg": 0.14056408405303955, "step": 775, "valid_targets_mean": 2588.0, "valid_targets_min": 730 }, { "epoch": 0.7647058823529411, "grad_norm": 0.5815354015567381, "learning_rate": 3.998990262537906e-05, "loss": 0.1618, "loss_nan_ranks": 0, "loss_rank_avg": 0.1769942045211792, "step": 780, "valid_targets_mean": 2086.6, "valid_targets_min": 674 }, { "epoch": 0.7696078431372549, "grad_norm": 0.5580499155747178, "learning_rate": 3.998828959279397e-05, "loss": 0.1846, "loss_nan_ranks": 0, "loss_rank_avg": 0.16807660460472107, "step": 785, "valid_targets_mean": 2295.8, "valid_targets_min": 704 }, { "epoch": 0.7745098039215687, "grad_norm": 0.6543312744336789, "learning_rate": 3.998655712462739e-05, "loss": 0.1942, "loss_nan_ranks": 0, "loss_rank_avg": 0.23026910424232483, "step": 790, "valid_targets_mean": 2343.8, "valid_targets_min": 789 }, { "epoch": 0.7794117647058824, "grad_norm": 0.5133434881456423, "learning_rate": 3.9984705231231305e-05, "loss": 0.1665, "loss_nan_ranks": 0, "loss_rank_avg": 0.1757199764251709, "step": 795, "valid_targets_mean": 2698.2, "valid_targets_min": 947 }, { "epoch": 0.7843137254901961, "grad_norm": 0.4829365196833064, "learning_rate": 3.9982733923671285e-05, "loss": 0.1634, "loss_nan_ranks": 0, "loss_rank_avg": 0.1341038942337036, "step": 800, "valid_targets_mean": 2727.9, "valid_targets_min": 934 }, { "epoch": 0.7892156862745098, "grad_norm": 0.5478275817278946, "learning_rate": 3.998064321372645e-05, "loss": 0.1589, "loss_nan_ranks": 0, "loss_rank_avg": 0.17312784492969513, "step": 805, "valid_targets_mean": 2547.9, "valid_targets_min": 1030 }, { "epoch": 0.7941176470588235, "grad_norm": 0.5569452846395607, "learning_rate": 3.9978433113889374e-05, "loss": 0.1723, "loss_nan_ranks": 0, "loss_rank_avg": 0.19361044466495514, "step": 810, "valid_targets_mean": 2531.6, "valid_targets_min": 789 }, { "epoch": 0.7990196078431373, "grad_norm": 0.5416020837107107, "learning_rate": 3.997610363736601e-05, "loss": 0.1586, "loss_nan_ranks": 0, "loss_rank_avg": 0.156791090965271, "step": 815, "valid_targets_mean": 2386.6, "valid_targets_min": 788 }, { "epoch": 0.803921568627451, "grad_norm": 0.5762887091632245, "learning_rate": 3.997365479807562e-05, "loss": 0.1728, "loss_nan_ranks": 0, "loss_rank_avg": 0.19870856404304504, "step": 820, "valid_targets_mean": 2393.2, "valid_targets_min": 764 }, { "epoch": 0.8088235294117647, "grad_norm": 0.6286459807846932, "learning_rate": 3.997108661065072e-05, "loss": 0.1834, "loss_nan_ranks": 0, "loss_rank_avg": 0.2093677967786789, "step": 825, "valid_targets_mean": 2101.6, "valid_targets_min": 739 }, { "epoch": 0.8137254901960784, "grad_norm": 0.4993822078208516, "learning_rate": 3.996839909043693e-05, "loss": 0.178, "loss_nan_ranks": 0, "loss_rank_avg": 0.13117878139019012, "step": 830, "valid_targets_mean": 2134.5, "valid_targets_min": 705 }, { "epoch": 0.8186274509803921, "grad_norm": 0.6887032555539322, "learning_rate": 3.996559225349292e-05, "loss": 0.1667, "loss_nan_ranks": 0, "loss_rank_avg": 0.18981419503688812, "step": 835, "valid_targets_mean": 1885.4, "valid_targets_min": 767 }, { "epoch": 0.8235294117647058, "grad_norm": 0.4824669004092395, "learning_rate": 3.996266611659034e-05, "loss": 0.204, "loss_nan_ranks": 0, "loss_rank_avg": 0.1455826759338379, "step": 840, "valid_targets_mean": 2453.9, "valid_targets_min": 837 }, { "epoch": 0.8284313725490197, "grad_norm": 0.6045939644368779, "learning_rate": 3.995962069721367e-05, "loss": 0.1713, "loss_nan_ranks": 0, "loss_rank_avg": 0.1643049120903015, "step": 845, "valid_targets_mean": 1984.4, "valid_targets_min": 684 }, { "epoch": 0.8333333333333334, "grad_norm": 0.6432148110358881, "learning_rate": 3.995645601356011e-05, "loss": 0.1677, "loss_nan_ranks": 0, "loss_rank_avg": 0.1854993999004364, "step": 850, "valid_targets_mean": 1761.9, "valid_targets_min": 526 }, { "epoch": 0.8382352941176471, "grad_norm": 0.5344791129446362, "learning_rate": 3.995317208453955e-05, "loss": 0.1658, "loss_nan_ranks": 0, "loss_rank_avg": 0.14876899123191833, "step": 855, "valid_targets_mean": 2241.1, "valid_targets_min": 656 }, { "epoch": 0.8431372549019608, "grad_norm": 0.6242488703641825, "learning_rate": 3.994976892977437e-05, "loss": 0.191, "loss_nan_ranks": 0, "loss_rank_avg": 0.17894625663757324, "step": 860, "valid_targets_mean": 2074.5, "valid_targets_min": 735 }, { "epoch": 0.8480392156862745, "grad_norm": 0.7029980773261847, "learning_rate": 3.994624656959937e-05, "loss": 0.1824, "loss_nan_ranks": 0, "loss_rank_avg": 0.1853296309709549, "step": 865, "valid_targets_mean": 1878.5, "valid_targets_min": 933 }, { "epoch": 0.8529411764705882, "grad_norm": 0.5157657178693743, "learning_rate": 3.994260502506162e-05, "loss": 0.1537, "loss_nan_ranks": 0, "loss_rank_avg": 0.1443462073802948, "step": 870, "valid_targets_mean": 2428.6, "valid_targets_min": 471 }, { "epoch": 0.8578431372549019, "grad_norm": 0.614121702051816, "learning_rate": 3.9938844317920364e-05, "loss": 0.1602, "loss_nan_ranks": 0, "loss_rank_avg": 0.19413134455680847, "step": 875, "valid_targets_mean": 1949.9, "valid_targets_min": 605 }, { "epoch": 0.8627450980392157, "grad_norm": 0.584377991874969, "learning_rate": 3.9934964470646875e-05, "loss": 0.1795, "loss_nan_ranks": 0, "loss_rank_avg": 0.2134077399969101, "step": 880, "valid_targets_mean": 2511.8, "valid_targets_min": 699 }, { "epoch": 0.8676470588235294, "grad_norm": 0.5150088309759572, "learning_rate": 3.993096550642431e-05, "loss": 0.17, "loss_nan_ranks": 0, "loss_rank_avg": 0.13996057212352753, "step": 885, "valid_targets_mean": 2704.8, "valid_targets_min": 607 }, { "epoch": 0.8725490196078431, "grad_norm": 0.5550186393534331, "learning_rate": 3.99268474491476e-05, "loss": 0.1658, "loss_nan_ranks": 0, "loss_rank_avg": 0.17755350470542908, "step": 890, "valid_targets_mean": 2633.4, "valid_targets_min": 808 }, { "epoch": 0.8774509803921569, "grad_norm": 0.4441972349671847, "learning_rate": 3.9922610323423285e-05, "loss": 0.1572, "loss_nan_ranks": 0, "loss_rank_avg": 0.14680537581443787, "step": 895, "valid_targets_mean": 3068.7, "valid_targets_min": 720 }, { "epoch": 0.8823529411764706, "grad_norm": 0.5485344567306873, "learning_rate": 3.991825415456935e-05, "loss": 0.165, "loss_nan_ranks": 0, "loss_rank_avg": 0.1684146523475647, "step": 900, "valid_targets_mean": 2122.2, "valid_targets_min": 745 }, { "epoch": 0.8872549019607843, "grad_norm": 0.4650801011694969, "learning_rate": 3.991377896861513e-05, "loss": 0.1642, "loss_nan_ranks": 0, "loss_rank_avg": 0.15383949875831604, "step": 905, "valid_targets_mean": 2715.5, "valid_targets_min": 922 }, { "epoch": 0.8921568627450981, "grad_norm": 0.5320235845602149, "learning_rate": 3.99091847923011e-05, "loss": 0.1541, "loss_nan_ranks": 0, "loss_rank_avg": 0.15561532974243164, "step": 910, "valid_targets_mean": 2538.2, "valid_targets_min": 1012 }, { "epoch": 0.8970588235294118, "grad_norm": 0.45876070962592214, "learning_rate": 3.990447165307873e-05, "loss": 0.1712, "loss_nan_ranks": 0, "loss_rank_avg": 0.146046981215477, "step": 915, "valid_targets_mean": 2568.5, "valid_targets_min": 534 }, { "epoch": 0.9019607843137255, "grad_norm": 0.5921830084761494, "learning_rate": 3.989963957911035e-05, "loss": 0.1888, "loss_nan_ranks": 0, "loss_rank_avg": 0.17852135002613068, "step": 920, "valid_targets_mean": 2035.5, "valid_targets_min": 784 }, { "epoch": 0.9068627450980392, "grad_norm": 0.5578416790380244, "learning_rate": 3.989468859926893e-05, "loss": 0.1648, "loss_nan_ranks": 0, "loss_rank_avg": 0.15424934029579163, "step": 925, "valid_targets_mean": 2060.3, "valid_targets_min": 837 }, { "epoch": 0.9117647058823529, "grad_norm": 0.61427402855988, "learning_rate": 3.9889618743137954e-05, "loss": 0.1921, "loss_nan_ranks": 0, "loss_rank_avg": 0.20084241032600403, "step": 930, "valid_targets_mean": 2377.2, "valid_targets_min": 750 }, { "epoch": 0.9166666666666666, "grad_norm": 0.617879885813731, "learning_rate": 3.988443004101123e-05, "loss": 0.1618, "loss_nan_ranks": 0, "loss_rank_avg": 0.19452977180480957, "step": 935, "valid_targets_mean": 1994.8, "valid_targets_min": 761 }, { "epoch": 0.9215686274509803, "grad_norm": 0.5918025094232898, "learning_rate": 3.9879122523892686e-05, "loss": 0.1624, "loss_nan_ranks": 0, "loss_rank_avg": 0.16469812393188477, "step": 940, "valid_targets_mean": 1928.2, "valid_targets_min": 671 }, { "epoch": 0.9264705882352942, "grad_norm": 0.47030820264667533, "learning_rate": 3.987369622349621e-05, "loss": 0.1625, "loss_nan_ranks": 0, "loss_rank_avg": 0.1485341638326645, "step": 945, "valid_targets_mean": 2903.6, "valid_targets_min": 739 }, { "epoch": 0.9313725490196079, "grad_norm": 0.5720177758819267, "learning_rate": 3.986815117224546e-05, "loss": 0.1722, "loss_nan_ranks": 0, "loss_rank_avg": 0.23535758256912231, "step": 950, "valid_targets_mean": 2154.2, "valid_targets_min": 697 }, { "epoch": 0.9362745098039216, "grad_norm": 0.491844040588146, "learning_rate": 3.986248740327365e-05, "loss": 0.1639, "loss_nan_ranks": 0, "loss_rank_avg": 0.14158077538013458, "step": 955, "valid_targets_mean": 2549.4, "valid_targets_min": 787 }, { "epoch": 0.9411764705882353, "grad_norm": 0.6672714337590078, "learning_rate": 3.985670495042338e-05, "loss": 0.1757, "loss_nan_ranks": 0, "loss_rank_avg": 0.19034962356090546, "step": 960, "valid_targets_mean": 1762.1, "valid_targets_min": 513 }, { "epoch": 0.946078431372549, "grad_norm": 0.5107414628675888, "learning_rate": 3.98508038482464e-05, "loss": 0.1749, "loss_nan_ranks": 0, "loss_rank_avg": 0.16910362243652344, "step": 965, "valid_targets_mean": 2209.5, "valid_targets_min": 743 }, { "epoch": 0.9509803921568627, "grad_norm": 0.7159936896599701, "learning_rate": 3.984478413200345e-05, "loss": 0.1651, "loss_nan_ranks": 0, "loss_rank_avg": 0.18525683879852295, "step": 970, "valid_targets_mean": 2314.8, "valid_targets_min": 786 }, { "epoch": 0.9558823529411765, "grad_norm": 0.5069431684151768, "learning_rate": 3.983864583766399e-05, "loss": 0.1678, "loss_nan_ranks": 0, "loss_rank_avg": 0.15477177500724792, "step": 975, "valid_targets_mean": 2671.3, "valid_targets_min": 819 }, { "epoch": 0.9607843137254902, "grad_norm": 0.5442502847606222, "learning_rate": 3.983238900190604e-05, "loss": 0.1631, "loss_nan_ranks": 0, "loss_rank_avg": 0.1818421185016632, "step": 980, "valid_targets_mean": 2540.2, "valid_targets_min": 995 }, { "epoch": 0.9656862745098039, "grad_norm": 0.5846293701433558, "learning_rate": 3.9826013662115934e-05, "loss": 0.181, "loss_nan_ranks": 0, "loss_rank_avg": 0.15935450792312622, "step": 985, "valid_targets_mean": 2114.6, "valid_targets_min": 798 }, { "epoch": 0.9705882352941176, "grad_norm": 0.7518939257172016, "learning_rate": 3.981951985638811e-05, "loss": 0.1599, "loss_nan_ranks": 0, "loss_rank_avg": 0.16909798979759216, "step": 990, "valid_targets_mean": 1665.1, "valid_targets_min": 632 }, { "epoch": 0.9754901960784313, "grad_norm": 0.4994396623985315, "learning_rate": 3.981290762352483e-05, "loss": 0.1554, "loss_nan_ranks": 0, "loss_rank_avg": 0.14983665943145752, "step": 995, "valid_targets_mean": 2305.2, "valid_targets_min": 721 }, { "epoch": 0.9803921568627451, "grad_norm": 0.586025245179539, "learning_rate": 3.9806177003036046e-05, "loss": 0.1522, "loss_nan_ranks": 0, "loss_rank_avg": 0.16798822581768036, "step": 1000, "valid_targets_mean": 2330.8, "valid_targets_min": 837 }, { "epoch": 0.9852941176470589, "grad_norm": 1.0406909868224459, "learning_rate": 3.979932803513908e-05, "loss": 0.1587, "loss_nan_ranks": 0, "loss_rank_avg": 0.18792645633220673, "step": 1005, "valid_targets_mean": 2235.0, "valid_targets_min": 821 }, { "epoch": 0.9901960784313726, "grad_norm": 0.6058346652555415, "learning_rate": 3.979236076075841e-05, "loss": 0.1556, "loss_nan_ranks": 0, "loss_rank_avg": 0.17952141165733337, "step": 1010, "valid_targets_mean": 1793.4, "valid_targets_min": 446 }, { "epoch": 0.9950980392156863, "grad_norm": 0.5394004450746253, "learning_rate": 3.9785275221525447e-05, "loss": 0.1584, "loss_nan_ranks": 0, "loss_rank_avg": 0.1644574999809265, "step": 1015, "valid_targets_mean": 1957.1, "valid_targets_min": 650 }, { "epoch": 1.0, "grad_norm": 0.5123401147066629, "learning_rate": 3.977807145977824e-05, "loss": 0.1803, "loss_nan_ranks": 0, "loss_rank_avg": 0.17188802361488342, "step": 1020, "valid_targets_mean": 2460.4, "valid_targets_min": 979 }, { "epoch": 1.0049019607843137, "grad_norm": 0.5838212653448689, "learning_rate": 3.977074951856128e-05, "loss": 0.1523, "loss_nan_ranks": 0, "loss_rank_avg": 0.16549797356128693, "step": 1025, "valid_targets_mean": 2017.8, "valid_targets_min": 559 }, { "epoch": 1.0098039215686274, "grad_norm": 0.6174829915961145, "learning_rate": 3.976330944162519e-05, "loss": 0.1659, "loss_nan_ranks": 0, "loss_rank_avg": 0.20157307386398315, "step": 1030, "valid_targets_mean": 2135.1, "valid_targets_min": 714 }, { "epoch": 1.0147058823529411, "grad_norm": 0.4828068003627354, "learning_rate": 3.975575127342651e-05, "loss": 0.1523, "loss_nan_ranks": 0, "loss_rank_avg": 0.17932741343975067, "step": 1035, "valid_targets_mean": 2793.8, "valid_targets_min": 960 }, { "epoch": 1.0196078431372548, "grad_norm": 0.62074325806201, "learning_rate": 3.974807505912737e-05, "loss": 0.167, "loss_nan_ranks": 0, "loss_rank_avg": 0.20777440071105957, "step": 1040, "valid_targets_mean": 2069.4, "valid_targets_min": 884 }, { "epoch": 1.0245098039215685, "grad_norm": 0.5157537624193805, "learning_rate": 3.974028084459531e-05, "loss": 0.1429, "loss_nan_ranks": 0, "loss_rank_avg": 0.1442909985780716, "step": 1045, "valid_targets_mean": 2144.7, "valid_targets_min": 663 }, { "epoch": 1.0294117647058822, "grad_norm": 0.5275408083767269, "learning_rate": 3.973236867640291e-05, "loss": 0.144, "loss_nan_ranks": 0, "loss_rank_avg": 0.1591978371143341, "step": 1050, "valid_targets_mean": 2433.8, "valid_targets_min": 540 }, { "epoch": 1.0343137254901962, "grad_norm": 0.6054568333033143, "learning_rate": 3.972433860182757e-05, "loss": 0.1605, "loss_nan_ranks": 0, "loss_rank_avg": 0.1705915629863739, "step": 1055, "valid_targets_mean": 1799.0, "valid_targets_min": 864 }, { "epoch": 1.0392156862745099, "grad_norm": 0.6782539679662744, "learning_rate": 3.971619066885122e-05, "loss": 0.1687, "loss_nan_ranks": 0, "loss_rank_avg": 0.16509351134300232, "step": 1060, "valid_targets_mean": 1800.1, "valid_targets_min": 865 }, { "epoch": 1.0441176470588236, "grad_norm": 0.49281399947041626, "learning_rate": 3.9707924926160026e-05, "loss": 0.1586, "loss_nan_ranks": 0, "loss_rank_avg": 0.14969328045845032, "step": 1065, "valid_targets_mean": 2801.4, "valid_targets_min": 1152 }, { "epoch": 1.0490196078431373, "grad_norm": 0.588840531018445, "learning_rate": 3.96995414231441e-05, "loss": 0.1627, "loss_nan_ranks": 0, "loss_rank_avg": 0.1991569846868515, "step": 1070, "valid_targets_mean": 2264.0, "valid_targets_min": 700 }, { "epoch": 1.053921568627451, "grad_norm": 0.6841222391097739, "learning_rate": 3.969104020989718e-05, "loss": 0.1672, "loss_nan_ranks": 0, "loss_rank_avg": 0.21732574701309204, "step": 1075, "valid_targets_mean": 1794.9, "valid_targets_min": 590 }, { "epoch": 1.0588235294117647, "grad_norm": 0.515045459549045, "learning_rate": 3.96824213372164e-05, "loss": 0.1467, "loss_nan_ranks": 0, "loss_rank_avg": 0.1259552240371704, "step": 1080, "valid_targets_mean": 2122.6, "valid_targets_min": 723 }, { "epoch": 1.0637254901960784, "grad_norm": 0.5616565763943626, "learning_rate": 3.9673684856601915e-05, "loss": 0.1446, "loss_nan_ranks": 0, "loss_rank_avg": 0.14568236470222473, "step": 1085, "valid_targets_mean": 1993.7, "valid_targets_min": 663 }, { "epoch": 1.0686274509803921, "grad_norm": 0.5261562423211233, "learning_rate": 3.9664830820256605e-05, "loss": 0.1587, "loss_nan_ranks": 0, "loss_rank_avg": 0.1599075198173523, "step": 1090, "valid_targets_mean": 2128.1, "valid_targets_min": 726 }, { "epoch": 1.0735294117647058, "grad_norm": 0.43934072499401866, "learning_rate": 3.965585928108581e-05, "loss": 0.1519, "loss_nan_ranks": 0, "loss_rank_avg": 0.11759766191244125, "step": 1095, "valid_targets_mean": 2754.6, "valid_targets_min": 839 }, { "epoch": 1.0784313725490196, "grad_norm": 0.6033318921088762, "learning_rate": 3.964677029269697e-05, "loss": 0.1679, "loss_nan_ranks": 0, "loss_rank_avg": 0.13802024722099304, "step": 1100, "valid_targets_mean": 2244.1, "valid_targets_min": 694 }, { "epoch": 1.0833333333333333, "grad_norm": 0.5046328382489379, "learning_rate": 3.963756390939931e-05, "loss": 0.1452, "loss_nan_ranks": 0, "loss_rank_avg": 0.14507150650024414, "step": 1105, "valid_targets_mean": 2527.9, "valid_targets_min": 652 }, { "epoch": 1.088235294117647, "grad_norm": 0.5022528514006354, "learning_rate": 3.962824018620353e-05, "loss": 0.1536, "loss_nan_ranks": 0, "loss_rank_avg": 0.158194899559021, "step": 1110, "valid_targets_mean": 2257.4, "valid_targets_min": 786 }, { "epoch": 1.093137254901961, "grad_norm": 0.4675384543996388, "learning_rate": 3.9618799178821454e-05, "loss": 0.1572, "loss_nan_ranks": 0, "loss_rank_avg": 0.16208568215370178, "step": 1115, "valid_targets_mean": 2411.1, "valid_targets_min": 776 }, { "epoch": 1.0980392156862746, "grad_norm": 0.6462739777449577, "learning_rate": 3.960924094366574e-05, "loss": 0.1537, "loss_nan_ranks": 0, "loss_rank_avg": 0.17548783123493195, "step": 1120, "valid_targets_mean": 1877.2, "valid_targets_min": 559 }, { "epoch": 1.1029411764705883, "grad_norm": 0.5646237353311311, "learning_rate": 3.959956553784948e-05, "loss": 0.1339, "loss_nan_ranks": 0, "loss_rank_avg": 0.15153411030769348, "step": 1125, "valid_targets_mean": 2764.0, "valid_targets_min": 919 }, { "epoch": 1.107843137254902, "grad_norm": 0.4540975480652281, "learning_rate": 3.9589773019185924e-05, "loss": 0.1381, "loss_nan_ranks": 0, "loss_rank_avg": 0.12593434751033783, "step": 1130, "valid_targets_mean": 2523.4, "valid_targets_min": 892 }, { "epoch": 1.1127450980392157, "grad_norm": 0.5547544466967875, "learning_rate": 3.957986344618809e-05, "loss": 0.1448, "loss_nan_ranks": 0, "loss_rank_avg": 0.14328861236572266, "step": 1135, "valid_targets_mean": 2087.6, "valid_targets_min": 658 }, { "epoch": 1.1176470588235294, "grad_norm": 0.592476178518575, "learning_rate": 3.956983687806843e-05, "loss": 0.1607, "loss_nan_ranks": 0, "loss_rank_avg": 0.1588444709777832, "step": 1140, "valid_targets_mean": 1868.7, "valid_targets_min": 560 }, { "epoch": 1.1225490196078431, "grad_norm": 0.5970021551092038, "learning_rate": 3.955969337473846e-05, "loss": 0.1587, "loss_nan_ranks": 0, "loss_rank_avg": 0.15817104279994965, "step": 1145, "valid_targets_mean": 2292.9, "valid_targets_min": 764 }, { "epoch": 1.1274509803921569, "grad_norm": 0.5962854116508299, "learning_rate": 3.954943299680844e-05, "loss": 0.1578, "loss_nan_ranks": 0, "loss_rank_avg": 0.1732129156589508, "step": 1150, "valid_targets_mean": 2063.4, "valid_targets_min": 1125 }, { "epoch": 1.1323529411764706, "grad_norm": 0.6896713797977306, "learning_rate": 3.953905580558698e-05, "loss": 0.1539, "loss_nan_ranks": 0, "loss_rank_avg": 0.2036602646112442, "step": 1155, "valid_targets_mean": 1861.2, "valid_targets_min": 609 }, { "epoch": 1.1372549019607843, "grad_norm": 0.5073490806892655, "learning_rate": 3.952856186308068e-05, "loss": 0.1453, "loss_nan_ranks": 0, "loss_rank_avg": 0.15630340576171875, "step": 1160, "valid_targets_mean": 2235.9, "valid_targets_min": 720 }, { "epoch": 1.142156862745098, "grad_norm": 0.45334538233451205, "learning_rate": 3.951795123199375e-05, "loss": 0.152, "loss_nan_ranks": 0, "loss_rank_avg": 0.1358206868171692, "step": 1165, "valid_targets_mean": 2691.2, "valid_targets_min": 754 }, { "epoch": 1.1470588235294117, "grad_norm": 0.4652006849941343, "learning_rate": 3.950722397572766e-05, "loss": 0.1572, "loss_nan_ranks": 0, "loss_rank_avg": 0.14758041501045227, "step": 1170, "valid_targets_mean": 2904.9, "valid_targets_min": 1057 }, { "epoch": 1.1519607843137254, "grad_norm": 0.562043728061584, "learning_rate": 3.949638015838076e-05, "loss": 0.1452, "loss_nan_ranks": 0, "loss_rank_avg": 0.1432192176580429, "step": 1175, "valid_targets_mean": 1881.5, "valid_targets_min": 740 }, { "epoch": 1.156862745098039, "grad_norm": 0.7702082160549727, "learning_rate": 3.948541984474784e-05, "loss": 0.1439, "loss_nan_ranks": 0, "loss_rank_avg": 0.15741848945617676, "step": 1180, "valid_targets_mean": 2464.0, "valid_targets_min": 827 }, { "epoch": 1.161764705882353, "grad_norm": 0.5224013259456193, "learning_rate": 3.947434310031986e-05, "loss": 0.162, "loss_nan_ranks": 0, "loss_rank_avg": 0.14922982454299927, "step": 1185, "valid_targets_mean": 2077.6, "valid_targets_min": 679 }, { "epoch": 1.1666666666666667, "grad_norm": 0.5631555063513266, "learning_rate": 3.94631499912834e-05, "loss": 0.1566, "loss_nan_ranks": 0, "loss_rank_avg": 0.15543070435523987, "step": 1190, "valid_targets_mean": 2052.9, "valid_targets_min": 684 }, { "epoch": 1.1715686274509804, "grad_norm": 0.45985075769888245, "learning_rate": 3.945184058452044e-05, "loss": 0.1396, "loss_nan_ranks": 0, "loss_rank_avg": 0.15431955456733704, "step": 1195, "valid_targets_mean": 2501.5, "valid_targets_min": 680 }, { "epoch": 1.1764705882352942, "grad_norm": 0.544135678064552, "learning_rate": 3.944041494760779e-05, "loss": 0.1571, "loss_nan_ranks": 0, "loss_rank_avg": 0.14121049642562866, "step": 1200, "valid_targets_mean": 2084.9, "valid_targets_min": 534 }, { "epoch": 1.1813725490196079, "grad_norm": 0.43080987042558744, "learning_rate": 3.9428873148816815e-05, "loss": 0.1577, "loss_nan_ranks": 0, "loss_rank_avg": 0.12293718755245209, "step": 1205, "valid_targets_mean": 2903.8, "valid_targets_min": 638 }, { "epoch": 1.1862745098039216, "grad_norm": 0.5346019417820428, "learning_rate": 3.9417215257112975e-05, "loss": 0.1427, "loss_nan_ranks": 0, "loss_rank_avg": 0.13670134544372559, "step": 1210, "valid_targets_mean": 2017.1, "valid_targets_min": 659 }, { "epoch": 1.1911764705882353, "grad_norm": 0.5740555345382163, "learning_rate": 3.94054413421554e-05, "loss": 0.1467, "loss_nan_ranks": 0, "loss_rank_avg": 0.16550078988075256, "step": 1215, "valid_targets_mean": 2116.8, "valid_targets_min": 874 }, { "epoch": 1.196078431372549, "grad_norm": 0.5276636605184202, "learning_rate": 3.9393551474296506e-05, "loss": 0.1591, "loss_nan_ranks": 0, "loss_rank_avg": 0.13549819588661194, "step": 1220, "valid_targets_mean": 2193.8, "valid_targets_min": 1090 }, { "epoch": 1.2009803921568627, "grad_norm": 0.4329687250201491, "learning_rate": 3.938154572458156e-05, "loss": 0.143, "loss_nan_ranks": 0, "loss_rank_avg": 0.12151844054460526, "step": 1225, "valid_targets_mean": 2738.6, "valid_targets_min": 771 }, { "epoch": 1.2058823529411764, "grad_norm": 0.7280188503712324, "learning_rate": 3.936942416474825e-05, "loss": 0.1681, "loss_nan_ranks": 0, "loss_rank_avg": 0.20381173491477966, "step": 1230, "valid_targets_mean": 2216.9, "valid_targets_min": 567 }, { "epoch": 1.2107843137254901, "grad_norm": 0.6188709430418583, "learning_rate": 3.935718686722626e-05, "loss": 0.1721, "loss_nan_ranks": 0, "loss_rank_avg": 0.18018341064453125, "step": 1235, "valid_targets_mean": 1980.0, "valid_targets_min": 819 }, { "epoch": 1.215686274509804, "grad_norm": 0.49994332511469786, "learning_rate": 3.934483390513683e-05, "loss": 0.155, "loss_nan_ranks": 0, "loss_rank_avg": 0.13865551352500916, "step": 1240, "valid_targets_mean": 2634.1, "valid_targets_min": 744 }, { "epoch": 1.2205882352941178, "grad_norm": 0.4609019249907111, "learning_rate": 3.933236535229236e-05, "loss": 0.1394, "loss_nan_ranks": 0, "loss_rank_avg": 0.13344664871692657, "step": 1245, "valid_targets_mean": 2502.8, "valid_targets_min": 767 }, { "epoch": 1.2254901960784315, "grad_norm": 0.6946779226729973, "learning_rate": 3.931978128319591e-05, "loss": 0.1616, "loss_nan_ranks": 0, "loss_rank_avg": 0.18459130823612213, "step": 1250, "valid_targets_mean": 2516.1, "valid_targets_min": 648 }, { "epoch": 1.2303921568627452, "grad_norm": 0.3847744756653841, "learning_rate": 3.9307081773040774e-05, "loss": 0.1499, "loss_nan_ranks": 0, "loss_rank_avg": 0.11731822788715363, "step": 1255, "valid_targets_mean": 3076.5, "valid_targets_min": 802 }, { "epoch": 1.2352941176470589, "grad_norm": 0.4905255095526249, "learning_rate": 3.929426689771007e-05, "loss": 0.1476, "loss_nan_ranks": 0, "loss_rank_avg": 0.14215940237045288, "step": 1260, "valid_targets_mean": 2219.2, "valid_targets_min": 605 }, { "epoch": 1.2401960784313726, "grad_norm": 0.5140168836960785, "learning_rate": 3.9281336733776224e-05, "loss": 0.1549, "loss_nan_ranks": 0, "loss_rank_avg": 0.1484440267086029, "step": 1265, "valid_targets_mean": 2392.3, "valid_targets_min": 833 }, { "epoch": 1.2450980392156863, "grad_norm": 0.510281749270732, "learning_rate": 3.926829135850056e-05, "loss": 0.1441, "loss_nan_ranks": 0, "loss_rank_avg": 0.13769188523292542, "step": 1270, "valid_targets_mean": 2149.2, "valid_targets_min": 837 }, { "epoch": 1.25, "grad_norm": 0.47694160804760755, "learning_rate": 3.925513084983282e-05, "loss": 0.1412, "loss_nan_ranks": 0, "loss_rank_avg": 0.1289670467376709, "step": 1275, "valid_targets_mean": 2160.6, "valid_targets_min": 799 }, { "epoch": 1.2549019607843137, "grad_norm": 0.5769961746495987, "learning_rate": 3.924185528641071e-05, "loss": 0.1458, "loss_nan_ranks": 0, "loss_rank_avg": 0.16923269629478455, "step": 1280, "valid_targets_mean": 1923.4, "valid_targets_min": 572 }, { "epoch": 1.2598039215686274, "grad_norm": 0.5097251595214417, "learning_rate": 3.9228464747559384e-05, "loss": 0.1535, "loss_nan_ranks": 0, "loss_rank_avg": 0.14006245136260986, "step": 1285, "valid_targets_mean": 2251.9, "valid_targets_min": 837 }, { "epoch": 1.2647058823529411, "grad_norm": 0.48366970496366835, "learning_rate": 3.921495931329105e-05, "loss": 0.1635, "loss_nan_ranks": 0, "loss_rank_avg": 0.13093242049217224, "step": 1290, "valid_targets_mean": 2366.6, "valid_targets_min": 518 }, { "epoch": 1.2696078431372548, "grad_norm": 0.5781181664431445, "learning_rate": 3.920133906430442e-05, "loss": 0.1559, "loss_nan_ranks": 0, "loss_rank_avg": 0.1567743420600891, "step": 1295, "valid_targets_mean": 2257.6, "valid_targets_min": 745 }, { "epoch": 1.2745098039215685, "grad_norm": 0.41978393338444187, "learning_rate": 3.918760408198426e-05, "loss": 0.1392, "loss_nan_ranks": 0, "loss_rank_avg": 0.14441536366939545, "step": 1300, "valid_targets_mean": 2817.1, "valid_targets_min": 1095 }, { "epoch": 1.2794117647058822, "grad_norm": 0.5308275909805295, "learning_rate": 3.9173754448400914e-05, "loss": 0.1674, "loss_nan_ranks": 0, "loss_rank_avg": 0.16451840102672577, "step": 1305, "valid_targets_mean": 2491.2, "valid_targets_min": 541 }, { "epoch": 1.284313725490196, "grad_norm": 0.5311164209246302, "learning_rate": 3.915979024630978e-05, "loss": 0.1588, "loss_nan_ranks": 0, "loss_rank_avg": 0.14257512986660004, "step": 1310, "valid_targets_mean": 2018.1, "valid_targets_min": 570 }, { "epoch": 1.2892156862745099, "grad_norm": 0.4234229529058526, "learning_rate": 3.9145711559150854e-05, "loss": 0.1497, "loss_nan_ranks": 0, "loss_rank_avg": 0.1336820423603058, "step": 1315, "valid_targets_mean": 2803.6, "valid_targets_min": 676 }, { "epoch": 1.2941176470588236, "grad_norm": 0.5124680921691537, "learning_rate": 3.9131518471048194e-05, "loss": 0.1595, "loss_nan_ranks": 0, "loss_rank_avg": 0.16409265995025635, "step": 1320, "valid_targets_mean": 2254.1, "valid_targets_min": 591 }, { "epoch": 1.2990196078431373, "grad_norm": 0.5398508535353193, "learning_rate": 3.911721106680944e-05, "loss": 0.1489, "loss_nan_ranks": 0, "loss_rank_avg": 0.16770967841148376, "step": 1325, "valid_targets_mean": 2107.1, "valid_targets_min": 716 }, { "epoch": 1.303921568627451, "grad_norm": 0.47066254116435274, "learning_rate": 3.910278943192531e-05, "loss": 0.1592, "loss_nan_ranks": 0, "loss_rank_avg": 0.1523783802986145, "step": 1330, "valid_targets_mean": 2441.0, "valid_targets_min": 776 }, { "epoch": 1.3088235294117647, "grad_norm": 0.5302196796070335, "learning_rate": 3.9088253652569085e-05, "loss": 0.1489, "loss_nan_ranks": 0, "loss_rank_avg": 0.1501566767692566, "step": 1335, "valid_targets_mean": 2072.9, "valid_targets_min": 709 }, { "epoch": 1.3137254901960784, "grad_norm": 0.6412977475076532, "learning_rate": 3.907360381559608e-05, "loss": 0.1649, "loss_nan_ranks": 0, "loss_rank_avg": 0.14073000848293304, "step": 1340, "valid_targets_mean": 2276.2, "valid_targets_min": 612 }, { "epoch": 1.3186274509803921, "grad_norm": 0.5172240165827114, "learning_rate": 3.9058840008543136e-05, "loss": 0.1505, "loss_nan_ranks": 0, "loss_rank_avg": 0.14915066957473755, "step": 1345, "valid_targets_mean": 2422.1, "valid_targets_min": 244 }, { "epoch": 1.3235294117647058, "grad_norm": 0.4079599036566721, "learning_rate": 3.9043962319628096e-05, "loss": 0.1512, "loss_nan_ranks": 0, "loss_rank_avg": 0.11990423500537872, "step": 1350, "valid_targets_mean": 2620.1, "valid_targets_min": 514 }, { "epoch": 1.3284313725490196, "grad_norm": 0.48696050356601855, "learning_rate": 3.902897083774929e-05, "loss": 0.15, "loss_nan_ranks": 0, "loss_rank_avg": 0.13719043135643005, "step": 1355, "valid_targets_mean": 2365.3, "valid_targets_min": 864 }, { "epoch": 1.3333333333333333, "grad_norm": 0.5203167774413222, "learning_rate": 3.9013865652484984e-05, "loss": 0.1517, "loss_nan_ranks": 0, "loss_rank_avg": 0.15943309664726257, "step": 1360, "valid_targets_mean": 2323.3, "valid_targets_min": 801 }, { "epoch": 1.3382352941176472, "grad_norm": 0.549425828566385, "learning_rate": 3.8998646854092854e-05, "loss": 0.1535, "loss_nan_ranks": 0, "loss_rank_avg": 0.15190866589546204, "step": 1365, "valid_targets_mean": 2337.4, "valid_targets_min": 640 }, { "epoch": 1.343137254901961, "grad_norm": 0.600237727151271, "learning_rate": 3.898331453350944e-05, "loss": 0.1609, "loss_nan_ranks": 0, "loss_rank_avg": 0.20173123478889465, "step": 1370, "valid_targets_mean": 1845.9, "valid_targets_min": 520 }, { "epoch": 1.3480392156862746, "grad_norm": 0.5032072364639573, "learning_rate": 3.896786878234963e-05, "loss": 0.1488, "loss_nan_ranks": 0, "loss_rank_avg": 0.15287765860557556, "step": 1375, "valid_targets_mean": 2130.8, "valid_targets_min": 680 }, { "epoch": 1.3529411764705883, "grad_norm": 0.6833370573017062, "learning_rate": 3.8952309692906074e-05, "loss": 0.1595, "loss_nan_ranks": 0, "loss_rank_avg": 0.18234968185424805, "step": 1380, "valid_targets_mean": 1924.2, "valid_targets_min": 659 }, { "epoch": 1.357843137254902, "grad_norm": 0.41478093075036826, "learning_rate": 3.893663735814865e-05, "loss": 0.1559, "loss_nan_ranks": 0, "loss_rank_avg": 0.13855645060539246, "step": 1385, "valid_targets_mean": 2631.2, "valid_targets_min": 591 }, { "epoch": 1.3627450980392157, "grad_norm": 0.5585388314174717, "learning_rate": 3.89208518717239e-05, "loss": 0.1616, "loss_nan_ranks": 0, "loss_rank_avg": 0.1809864044189453, "step": 1390, "valid_targets_mean": 1917.9, "valid_targets_min": 785 }, { "epoch": 1.3676470588235294, "grad_norm": 0.4525025154823127, "learning_rate": 3.89049533279545e-05, "loss": 0.1508, "loss_nan_ranks": 0, "loss_rank_avg": 0.14793044328689575, "step": 1395, "valid_targets_mean": 2488.4, "valid_targets_min": 819 }, { "epoch": 1.3725490196078431, "grad_norm": 0.4840178712448558, "learning_rate": 3.888894182183866e-05, "loss": 0.1615, "loss_nan_ranks": 0, "loss_rank_avg": 0.1626589596271515, "step": 1400, "valid_targets_mean": 2406.2, "valid_targets_min": 607 }, { "epoch": 1.3774509803921569, "grad_norm": 0.47327404010363494, "learning_rate": 3.887281744904959e-05, "loss": 0.1531, "loss_nan_ranks": 0, "loss_rank_avg": 0.13927535712718964, "step": 1405, "valid_targets_mean": 2618.0, "valid_targets_min": 1047 }, { "epoch": 1.3823529411764706, "grad_norm": 0.5818804209128727, "learning_rate": 3.885658030593487e-05, "loss": 0.1415, "loss_nan_ranks": 0, "loss_rank_avg": 0.12791548669338226, "step": 1410, "valid_targets_mean": 2182.4, "valid_targets_min": 768 }, { "epoch": 1.3872549019607843, "grad_norm": 0.5149356554417958, "learning_rate": 3.884023048951597e-05, "loss": 0.1585, "loss_nan_ranks": 0, "loss_rank_avg": 0.17590127885341644, "step": 1415, "valid_targets_mean": 2380.0, "valid_targets_min": 741 }, { "epoch": 1.392156862745098, "grad_norm": 0.4027707139908952, "learning_rate": 3.8823768097487555e-05, "loss": 0.1473, "loss_nan_ranks": 0, "loss_rank_avg": 0.11872929334640503, "step": 1420, "valid_targets_mean": 2956.5, "valid_targets_min": 1389 }, { "epoch": 1.3970588235294117, "grad_norm": 0.5121711907073138, "learning_rate": 3.8807193228217006e-05, "loss": 0.1572, "loss_nan_ranks": 0, "loss_rank_avg": 0.15116044878959656, "step": 1425, "valid_targets_mean": 2139.8, "valid_targets_min": 715 }, { "epoch": 1.4019607843137254, "grad_norm": 0.4615092163821721, "learning_rate": 3.879050598074377e-05, "loss": 0.1539, "loss_nan_ranks": 0, "loss_rank_avg": 0.16094964742660522, "step": 1430, "valid_targets_mean": 2579.1, "valid_targets_min": 944 }, { "epoch": 1.406862745098039, "grad_norm": 0.4837425625903746, "learning_rate": 3.877370645477878e-05, "loss": 0.138, "loss_nan_ranks": 0, "loss_rank_avg": 0.1381511688232422, "step": 1435, "valid_targets_mean": 2226.8, "valid_targets_min": 363 }, { "epoch": 1.4117647058823528, "grad_norm": 0.49885604510183423, "learning_rate": 3.875679475070386e-05, "loss": 0.1446, "loss_nan_ranks": 0, "loss_rank_avg": 0.13402841985225677, "step": 1440, "valid_targets_mean": 1817.2, "valid_targets_min": 357 }, { "epoch": 1.4166666666666667, "grad_norm": 0.5948084146879866, "learning_rate": 3.873977096957115e-05, "loss": 0.1562, "loss_nan_ranks": 0, "loss_rank_avg": 0.15349772572517395, "step": 1445, "valid_targets_mean": 2068.1, "valid_targets_min": 721 }, { "epoch": 1.4215686274509804, "grad_norm": 0.43546114760012355, "learning_rate": 3.872263521310248e-05, "loss": 0.1581, "loss_nan_ranks": 0, "loss_rank_avg": 0.1208997517824173, "step": 1450, "valid_targets_mean": 2656.3, "valid_targets_min": 795 }, { "epoch": 1.4264705882352942, "grad_norm": 0.41007339804542614, "learning_rate": 3.870538758368874e-05, "loss": 0.1511, "loss_nan_ranks": 0, "loss_rank_avg": 0.12087947130203247, "step": 1455, "valid_targets_mean": 2850.0, "valid_targets_min": 689 }, { "epoch": 1.4313725490196079, "grad_norm": 0.5477355070675948, "learning_rate": 3.868802818438931e-05, "loss": 0.1443, "loss_nan_ranks": 0, "loss_rank_avg": 0.14966945350170135, "step": 1460, "valid_targets_mean": 2159.5, "valid_targets_min": 887 }, { "epoch": 1.4362745098039216, "grad_norm": 0.5084422208686458, "learning_rate": 3.8670557118931406e-05, "loss": 0.1523, "loss_nan_ranks": 0, "loss_rank_avg": 0.15912967920303345, "step": 1465, "valid_targets_mean": 2255.6, "valid_targets_min": 890 }, { "epoch": 1.4411764705882353, "grad_norm": 0.5106364860275668, "learning_rate": 3.8652974491709524e-05, "loss": 0.1634, "loss_nan_ranks": 0, "loss_rank_avg": 0.1488266885280609, "step": 1470, "valid_targets_mean": 2155.7, "valid_targets_min": 652 }, { "epoch": 1.446078431372549, "grad_norm": 0.5123306890644707, "learning_rate": 3.863528040778473e-05, "loss": 0.1528, "loss_nan_ranks": 0, "loss_rank_avg": 0.16354094445705414, "step": 1475, "valid_targets_mean": 2284.4, "valid_targets_min": 800 }, { "epoch": 1.4509803921568627, "grad_norm": 0.59057508765795, "learning_rate": 3.861747497288409e-05, "loss": 0.1648, "loss_nan_ranks": 0, "loss_rank_avg": 0.1789345145225525, "step": 1480, "valid_targets_mean": 2036.8, "valid_targets_min": 890 }, { "epoch": 1.4558823529411764, "grad_norm": 0.4268181984593978, "learning_rate": 3.859955829340002e-05, "loss": 0.1412, "loss_nan_ranks": 0, "loss_rank_avg": 0.13590224087238312, "step": 1485, "valid_targets_mean": 2580.3, "valid_targets_min": 523 }, { "epoch": 1.4607843137254901, "grad_norm": 0.5925211684186468, "learning_rate": 3.8581530476389665e-05, "loss": 0.1436, "loss_nan_ranks": 0, "loss_rank_avg": 0.1535499542951584, "step": 1490, "valid_targets_mean": 2115.8, "valid_targets_min": 549 }, { "epoch": 1.465686274509804, "grad_norm": 0.4175992000283523, "learning_rate": 3.8563391629574226e-05, "loss": 0.1494, "loss_nan_ranks": 0, "loss_rank_avg": 0.13089969754219055, "step": 1495, "valid_targets_mean": 2766.2, "valid_targets_min": 789 }, { "epoch": 1.4705882352941178, "grad_norm": 0.4916655913807976, "learning_rate": 3.8545141861338355e-05, "loss": 0.1484, "loss_nan_ranks": 0, "loss_rank_avg": 0.15090090036392212, "step": 1500, "valid_targets_mean": 2067.1, "valid_targets_min": 309 }, { "epoch": 1.4754901960784315, "grad_norm": 0.5271031406287625, "learning_rate": 3.8526781280729494e-05, "loss": 0.1613, "loss_nan_ranks": 0, "loss_rank_avg": 0.1575801819562912, "step": 1505, "valid_targets_mean": 2504.5, "valid_targets_min": 715 }, { "epoch": 1.4803921568627452, "grad_norm": 0.4701289225402125, "learning_rate": 3.85083099974572e-05, "loss": 0.1608, "loss_nan_ranks": 0, "loss_rank_avg": 0.15561668574810028, "step": 1510, "valid_targets_mean": 2856.8, "valid_targets_min": 774 }, { "epoch": 1.4852941176470589, "grad_norm": 0.5494676935044653, "learning_rate": 3.848972812189253e-05, "loss": 0.151, "loss_nan_ranks": 0, "loss_rank_avg": 0.18085089325904846, "step": 1515, "valid_targets_mean": 2039.9, "valid_targets_min": 626 }, { "epoch": 1.4901960784313726, "grad_norm": 0.6263018300453485, "learning_rate": 3.847103576506734e-05, "loss": 0.1491, "loss_nan_ranks": 0, "loss_rank_avg": 0.15949448943138123, "step": 1520, "valid_targets_mean": 1484.6, "valid_targets_min": 635 }, { "epoch": 1.4950980392156863, "grad_norm": 0.46999594845254383, "learning_rate": 3.845223303867366e-05, "loss": 0.1656, "loss_nan_ranks": 0, "loss_rank_avg": 0.13206514716148376, "step": 1525, "valid_targets_mean": 2437.2, "valid_targets_min": 593 }, { "epoch": 1.5, "grad_norm": 0.5255301328952996, "learning_rate": 3.8433320055063e-05, "loss": 0.1568, "loss_nan_ranks": 0, "loss_rank_avg": 0.15027153491973877, "step": 1530, "valid_targets_mean": 1982.6, "valid_targets_min": 707 }, { "epoch": 1.5049019607843137, "grad_norm": 0.5347904846455934, "learning_rate": 3.84142969272457e-05, "loss": 0.1635, "loss_nan_ranks": 0, "loss_rank_avg": 0.19537004828453064, "step": 1535, "valid_targets_mean": 2316.7, "valid_targets_min": 711 }, { "epoch": 1.5098039215686274, "grad_norm": 0.5646663834321809, "learning_rate": 3.8395163768890214e-05, "loss": 0.1566, "loss_nan_ranks": 0, "loss_rank_avg": 0.17573268711566925, "step": 1540, "valid_targets_mean": 1757.5, "valid_targets_min": 622 }, { "epoch": 1.5147058823529411, "grad_norm": 0.5658551765278447, "learning_rate": 3.837592069432248e-05, "loss": 0.15, "loss_nan_ranks": 0, "loss_rank_avg": 0.15337808430194855, "step": 1545, "valid_targets_mean": 2001.4, "valid_targets_min": 663 }, { "epoch": 1.5196078431372548, "grad_norm": 0.38422117950519047, "learning_rate": 3.8356567818525235e-05, "loss": 0.148, "loss_nan_ranks": 0, "loss_rank_avg": 0.11618193984031677, "step": 1550, "valid_targets_mean": 2760.7, "valid_targets_min": 853 }, { "epoch": 1.5245098039215685, "grad_norm": 0.5217212912328395, "learning_rate": 3.8337105257137264e-05, "loss": 0.1568, "loss_nan_ranks": 0, "loss_rank_avg": 0.15121859312057495, "step": 1555, "valid_targets_mean": 2225.5, "valid_targets_min": 737 }, { "epoch": 1.5294117647058822, "grad_norm": 0.5285773256463285, "learning_rate": 3.8317533126452773e-05, "loss": 0.1389, "loss_nan_ranks": 0, "loss_rank_avg": 0.15342125296592712, "step": 1560, "valid_targets_mean": 2033.9, "valid_targets_min": 765 }, { "epoch": 1.534313725490196, "grad_norm": 0.45981631765341807, "learning_rate": 3.829785154342069e-05, "loss": 0.1521, "loss_nan_ranks": 0, "loss_rank_avg": 0.13747870922088623, "step": 1565, "valid_targets_mean": 2533.3, "valid_targets_min": 629 }, { "epoch": 1.5392156862745097, "grad_norm": 0.4170627519498316, "learning_rate": 3.8278060625643945e-05, "loss": 0.1408, "loss_nan_ranks": 0, "loss_rank_avg": 0.1535811424255371, "step": 1570, "valid_targets_mean": 2868.6, "valid_targets_min": 943 }, { "epoch": 1.5441176470588234, "grad_norm": 0.3896454803749676, "learning_rate": 3.825816049137876e-05, "loss": 0.1478, "loss_nan_ranks": 0, "loss_rank_avg": 0.11401885747909546, "step": 1575, "valid_targets_mean": 2787.1, "valid_targets_min": 817 }, { "epoch": 1.5490196078431373, "grad_norm": 0.5002979894193942, "learning_rate": 3.823815125953396e-05, "loss": 0.1451, "loss_nan_ranks": 0, "loss_rank_avg": 0.1406538188457489, "step": 1580, "valid_targets_mean": 2422.6, "valid_targets_min": 689 }, { "epoch": 1.553921568627451, "grad_norm": 0.56850834145191, "learning_rate": 3.821803304967027e-05, "loss": 0.1425, "loss_nan_ranks": 0, "loss_rank_avg": 0.1491360068321228, "step": 1585, "valid_targets_mean": 1996.2, "valid_targets_min": 527 }, { "epoch": 1.5588235294117647, "grad_norm": 0.4998315996038415, "learning_rate": 3.819780598199958e-05, "loss": 0.1574, "loss_nan_ranks": 0, "loss_rank_avg": 0.15458178520202637, "step": 1590, "valid_targets_mean": 2790.4, "valid_targets_min": 748 }, { "epoch": 1.5637254901960784, "grad_norm": 0.6662479740719508, "learning_rate": 3.8177470177384227e-05, "loss": 0.1631, "loss_nan_ranks": 0, "loss_rank_avg": 0.1752540022134781, "step": 1595, "valid_targets_mean": 1685.2, "valid_targets_min": 474 }, { "epoch": 1.5686274509803921, "grad_norm": 0.46836465561013363, "learning_rate": 3.81570257573363e-05, "loss": 0.1429, "loss_nan_ranks": 0, "loss_rank_avg": 0.14558619260787964, "step": 1600, "valid_targets_mean": 2609.4, "valid_targets_min": 890 }, { "epoch": 1.5735294117647058, "grad_norm": 0.7066979739662512, "learning_rate": 3.813647284401689e-05, "loss": 0.1452, "loss_nan_ranks": 0, "loss_rank_avg": 0.1357910931110382, "step": 1605, "valid_targets_mean": 1793.6, "valid_targets_min": 574 }, { "epoch": 1.5784313725490198, "grad_norm": 0.49109212337132546, "learning_rate": 3.811581156023536e-05, "loss": 0.1577, "loss_nan_ranks": 0, "loss_rank_avg": 0.14518040418624878, "step": 1610, "valid_targets_mean": 2120.4, "valid_targets_min": 773 }, { "epoch": 1.5833333333333335, "grad_norm": 0.5111836333604469, "learning_rate": 3.809504202944861e-05, "loss": 0.1464, "loss_nan_ranks": 0, "loss_rank_avg": 0.14256779849529266, "step": 1615, "valid_targets_mean": 1982.6, "valid_targets_min": 696 }, { "epoch": 1.5882352941176472, "grad_norm": 0.9023676798605845, "learning_rate": 3.807416437576036e-05, "loss": 0.1528, "loss_nan_ranks": 0, "loss_rank_avg": 0.1626691222190857, "step": 1620, "valid_targets_mean": 1895.9, "valid_targets_min": 647 }, { "epoch": 1.593137254901961, "grad_norm": 0.5123255661123512, "learning_rate": 3.80531787239204e-05, "loss": 0.1586, "loss_nan_ranks": 0, "loss_rank_avg": 0.16807357966899872, "step": 1625, "valid_targets_mean": 2144.9, "valid_targets_min": 807 }, { "epoch": 1.5980392156862746, "grad_norm": 0.491171773292401, "learning_rate": 3.803208519932381e-05, "loss": 0.1849, "loss_nan_ranks": 0, "loss_rank_avg": 0.2099742591381073, "step": 1630, "valid_targets_mean": 2904.7, "valid_targets_min": 950 }, { "epoch": 1.6029411764705883, "grad_norm": 0.3905325983675772, "learning_rate": 3.8010883928010265e-05, "loss": 0.152, "loss_nan_ranks": 0, "loss_rank_avg": 0.1118234246969223, "step": 1635, "valid_targets_mean": 2854.1, "valid_targets_min": 700 }, { "epoch": 1.607843137254902, "grad_norm": 0.5356632738991045, "learning_rate": 3.798957503666325e-05, "loss": 0.1456, "loss_nan_ranks": 0, "loss_rank_avg": 0.17137929797172546, "step": 1640, "valid_targets_mean": 2408.6, "valid_targets_min": 655 }, { "epoch": 1.6127450980392157, "grad_norm": 0.47756403160814764, "learning_rate": 3.7968158652609306e-05, "loss": 0.1545, "loss_nan_ranks": 0, "loss_rank_avg": 0.13389216363430023, "step": 1645, "valid_targets_mean": 2166.3, "valid_targets_min": 724 }, { "epoch": 1.6176470588235294, "grad_norm": 0.6104217262915782, "learning_rate": 3.7946634903817284e-05, "loss": 0.1402, "loss_nan_ranks": 0, "loss_rank_avg": 0.17253968119621277, "step": 1650, "valid_targets_mean": 2078.8, "valid_targets_min": 529 }, { "epoch": 1.6225490196078431, "grad_norm": 0.7027710890124704, "learning_rate": 3.792500391889755e-05, "loss": 0.1412, "loss_nan_ranks": 0, "loss_rank_avg": 0.14878009259700775, "step": 1655, "valid_targets_mean": 2058.6, "valid_targets_min": 718 }, { "epoch": 1.6274509803921569, "grad_norm": 0.5478596948797649, "learning_rate": 3.790326582710125e-05, "loss": 0.1353, "loss_nan_ranks": 0, "loss_rank_avg": 0.14182859659194946, "step": 1660, "valid_targets_mean": 2234.1, "valid_targets_min": 650 }, { "epoch": 1.6323529411764706, "grad_norm": 0.5465599142774893, "learning_rate": 3.788142075831952e-05, "loss": 0.155, "loss_nan_ranks": 0, "loss_rank_avg": 0.15382519364356995, "step": 1665, "valid_targets_mean": 1936.5, "valid_targets_min": 952 }, { "epoch": 1.6372549019607843, "grad_norm": 0.577878109070135, "learning_rate": 3.7859468843082716e-05, "loss": 0.1506, "loss_nan_ranks": 0, "loss_rank_avg": 0.17845892906188965, "step": 1670, "valid_targets_mean": 2106.3, "valid_targets_min": 877 }, { "epoch": 1.642156862745098, "grad_norm": 0.48117276564009087, "learning_rate": 3.7837410212559623e-05, "loss": 0.1592, "loss_nan_ranks": 0, "loss_rank_avg": 0.14203675091266632, "step": 1675, "valid_targets_mean": 2077.6, "valid_targets_min": 729 }, { "epoch": 1.6470588235294117, "grad_norm": 0.5585520122750612, "learning_rate": 3.781524499855668e-05, "loss": 0.1463, "loss_nan_ranks": 0, "loss_rank_avg": 0.15015847980976105, "step": 1680, "valid_targets_mean": 1771.9, "valid_targets_min": 642 }, { "epoch": 1.6519607843137254, "grad_norm": 0.4289941836302043, "learning_rate": 3.779297333351721e-05, "loss": 0.1515, "loss_nan_ranks": 0, "loss_rank_avg": 0.11602067947387695, "step": 1685, "valid_targets_mean": 2702.9, "valid_targets_min": 750 }, { "epoch": 1.656862745098039, "grad_norm": 0.4886606859408909, "learning_rate": 3.777059535052059e-05, "loss": 0.1433, "loss_nan_ranks": 0, "loss_rank_avg": 0.15592262148857117, "step": 1690, "valid_targets_mean": 2242.9, "valid_targets_min": 856 }, { "epoch": 1.6617647058823528, "grad_norm": 0.603285219664727, "learning_rate": 3.774811118328149e-05, "loss": 0.1524, "loss_nan_ranks": 0, "loss_rank_avg": 0.18172068893909454, "step": 1695, "valid_targets_mean": 1707.1, "valid_targets_min": 529 }, { "epoch": 1.6666666666666665, "grad_norm": 0.5302230844470484, "learning_rate": 3.772552096614904e-05, "loss": 0.1493, "loss_nan_ranks": 0, "loss_rank_avg": 0.15116459131240845, "step": 1700, "valid_targets_mean": 2325.4, "valid_targets_min": 634 }, { "epoch": 1.6715686274509802, "grad_norm": 0.6006361801337328, "learning_rate": 3.7702824834106066e-05, "loss": 0.1456, "loss_nan_ranks": 0, "loss_rank_avg": 0.1827220320701599, "step": 1705, "valid_targets_mean": 2108.4, "valid_targets_min": 533 }, { "epoch": 1.6764705882352942, "grad_norm": 0.4592856246938828, "learning_rate": 3.768002292276826e-05, "loss": 0.1364, "loss_nan_ranks": 0, "loss_rank_avg": 0.12549643218517303, "step": 1710, "valid_targets_mean": 2249.1, "valid_targets_min": 724 }, { "epoch": 1.6813725490196079, "grad_norm": 0.6134998129989979, "learning_rate": 3.765711536838338e-05, "loss": 0.1481, "loss_nan_ranks": 0, "loss_rank_avg": 0.18850260972976685, "step": 1715, "valid_targets_mean": 1851.9, "valid_targets_min": 687 }, { "epoch": 1.6862745098039216, "grad_norm": 0.49997491291599816, "learning_rate": 3.763410230783042e-05, "loss": 0.1632, "loss_nan_ranks": 0, "loss_rank_avg": 0.203414186835289, "step": 1720, "valid_targets_mean": 2292.8, "valid_targets_min": 572 }, { "epoch": 1.6911764705882353, "grad_norm": 0.47966143153752505, "learning_rate": 3.7610983878618816e-05, "loss": 0.1439, "loss_nan_ranks": 0, "loss_rank_avg": 0.14274010062217712, "step": 1725, "valid_targets_mean": 2055.4, "valid_targets_min": 610 }, { "epoch": 1.696078431372549, "grad_norm": 0.5041314204689977, "learning_rate": 3.7587760218887595e-05, "loss": 0.1662, "loss_nan_ranks": 0, "loss_rank_avg": 0.17796386778354645, "step": 1730, "valid_targets_mean": 2114.6, "valid_targets_min": 598 }, { "epoch": 1.7009803921568627, "grad_norm": 0.5496728194221527, "learning_rate": 3.756443146740457e-05, "loss": 0.1527, "loss_nan_ranks": 0, "loss_rank_avg": 0.1596316248178482, "step": 1735, "valid_targets_mean": 1827.0, "valid_targets_min": 829 }, { "epoch": 1.7058823529411766, "grad_norm": 0.5933172007849838, "learning_rate": 3.7540997763565525e-05, "loss": 0.1389, "loss_nan_ranks": 0, "loss_rank_avg": 0.16515210270881653, "step": 1740, "valid_targets_mean": 1805.4, "valid_targets_min": 688 }, { "epoch": 1.7107843137254903, "grad_norm": 0.5533001908804063, "learning_rate": 3.751745924739333e-05, "loss": 0.1452, "loss_nan_ranks": 0, "loss_rank_avg": 0.16086289286613464, "step": 1745, "valid_targets_mean": 2245.2, "valid_targets_min": 637 }, { "epoch": 1.715686274509804, "grad_norm": 0.3625773782586867, "learning_rate": 3.7493816059537174e-05, "loss": 0.1389, "loss_nan_ranks": 0, "loss_rank_avg": 0.10024596750736237, "step": 1750, "valid_targets_mean": 2614.1, "valid_targets_min": 738 }, { "epoch": 1.7205882352941178, "grad_norm": 0.4920024696196442, "learning_rate": 3.747006834127166e-05, "loss": 0.1479, "loss_nan_ranks": 0, "loss_rank_avg": 0.1591131091117859, "step": 1755, "valid_targets_mean": 2266.2, "valid_targets_min": 744 }, { "epoch": 1.7254901960784315, "grad_norm": 0.40531676129734534, "learning_rate": 3.7446216234496e-05, "loss": 0.1618, "loss_nan_ranks": 0, "loss_rank_avg": 0.11736778914928436, "step": 1760, "valid_targets_mean": 2764.4, "valid_targets_min": 676 }, { "epoch": 1.7303921568627452, "grad_norm": 0.5413087543165096, "learning_rate": 3.742225988173315e-05, "loss": 0.1432, "loss_nan_ranks": 0, "loss_rank_avg": 0.16685521602630615, "step": 1765, "valid_targets_mean": 1968.8, "valid_targets_min": 610 }, { "epoch": 1.7352941176470589, "grad_norm": 0.5458227730487121, "learning_rate": 3.7398199426128995e-05, "loss": 0.1518, "loss_nan_ranks": 0, "loss_rank_avg": 0.14602074027061462, "step": 1770, "valid_targets_mean": 1909.1, "valid_targets_min": 812 }, { "epoch": 1.7401960784313726, "grad_norm": 0.4399415602242103, "learning_rate": 3.737403501145141e-05, "loss": 0.1442, "loss_nan_ranks": 0, "loss_rank_avg": 0.14302271604537964, "step": 1775, "valid_targets_mean": 2533.6, "valid_targets_min": 943 }, { "epoch": 1.7450980392156863, "grad_norm": 0.5607709048920859, "learning_rate": 3.7349766782089515e-05, "loss": 0.1496, "loss_nan_ranks": 0, "loss_rank_avg": 0.18201008439064026, "step": 1780, "valid_targets_mean": 1960.6, "valid_targets_min": 742 }, { "epoch": 1.75, "grad_norm": 0.5414297127263566, "learning_rate": 3.732539488305269e-05, "loss": 0.1478, "loss_nan_ranks": 0, "loss_rank_avg": 0.16086480021476746, "step": 1785, "valid_targets_mean": 2153.8, "valid_targets_min": 754 }, { "epoch": 1.7549019607843137, "grad_norm": 0.5278807774304168, "learning_rate": 3.73009194599698e-05, "loss": 0.1601, "loss_nan_ranks": 0, "loss_rank_avg": 0.15399423241615295, "step": 1790, "valid_targets_mean": 1997.1, "valid_targets_min": 570 }, { "epoch": 1.7598039215686274, "grad_norm": 0.5043590546147471, "learning_rate": 3.727634065908833e-05, "loss": 0.1663, "loss_nan_ranks": 0, "loss_rank_avg": 0.15289407968521118, "step": 1795, "valid_targets_mean": 2063.8, "valid_targets_min": 549 }, { "epoch": 1.7647058823529411, "grad_norm": 0.44386672927984044, "learning_rate": 3.725165862727341e-05, "loss": 0.1471, "loss_nan_ranks": 0, "loss_rank_avg": 0.1439841389656067, "step": 1800, "valid_targets_mean": 2574.6, "valid_targets_min": 724 }, { "epoch": 1.7696078431372548, "grad_norm": 0.6067341975360978, "learning_rate": 3.722687351200704e-05, "loss": 0.1515, "loss_nan_ranks": 0, "loss_rank_avg": 0.1851101666688919, "step": 1805, "valid_targets_mean": 1918.6, "valid_targets_min": 767 }, { "epoch": 1.7745098039215685, "grad_norm": 0.5472528253501442, "learning_rate": 3.720198546138718e-05, "loss": 0.1483, "loss_nan_ranks": 0, "loss_rank_avg": 0.1516643464565277, "step": 1810, "valid_targets_mean": 1931.3, "valid_targets_min": 635 }, { "epoch": 1.7794117647058822, "grad_norm": 0.5273521005478816, "learning_rate": 3.717699462412683e-05, "loss": 0.1403, "loss_nan_ranks": 0, "loss_rank_avg": 0.12933941185474396, "step": 1815, "valid_targets_mean": 2039.8, "valid_targets_min": 525 }, { "epoch": 1.784313725490196, "grad_norm": 0.6077315011956368, "learning_rate": 3.715190114955319e-05, "loss": 0.1531, "loss_nan_ranks": 0, "loss_rank_avg": 0.17466555535793304, "step": 1820, "valid_targets_mean": 1669.6, "valid_targets_min": 494 }, { "epoch": 1.7892156862745097, "grad_norm": 0.512358696269543, "learning_rate": 3.712670518760674e-05, "loss": 0.1617, "loss_nan_ranks": 0, "loss_rank_avg": 0.1617322564125061, "step": 1825, "valid_targets_mean": 2220.2, "valid_targets_min": 761 }, { "epoch": 1.7941176470588234, "grad_norm": 0.4336332041487301, "learning_rate": 3.7101406888840345e-05, "loss": 0.1485, "loss_nan_ranks": 0, "loss_rank_avg": 0.15320450067520142, "step": 1830, "valid_targets_mean": 2737.3, "valid_targets_min": 820 }, { "epoch": 1.7990196078431373, "grad_norm": 0.4883048284620736, "learning_rate": 3.707600640441837e-05, "loss": 0.1462, "loss_nan_ranks": 0, "loss_rank_avg": 0.13818612694740295, "step": 1835, "valid_targets_mean": 2208.4, "valid_targets_min": 490 }, { "epoch": 1.803921568627451, "grad_norm": 0.43072754382140194, "learning_rate": 3.705050388611577e-05, "loss": 0.1485, "loss_nan_ranks": 0, "loss_rank_avg": 0.13516834378242493, "step": 1840, "valid_targets_mean": 2813.6, "valid_targets_min": 695 }, { "epoch": 1.8088235294117647, "grad_norm": 0.48514804711619286, "learning_rate": 3.702489948631716e-05, "loss": 0.157, "loss_nan_ranks": 0, "loss_rank_avg": 0.1558280736207962, "step": 1845, "valid_targets_mean": 2298.6, "valid_targets_min": 848 }, { "epoch": 1.8137254901960784, "grad_norm": 0.43686024221397773, "learning_rate": 3.6999193358015955e-05, "loss": 0.1431, "loss_nan_ranks": 0, "loss_rank_avg": 0.13829517364501953, "step": 1850, "valid_targets_mean": 2430.9, "valid_targets_min": 769 }, { "epoch": 1.8186274509803921, "grad_norm": 0.41757476802350063, "learning_rate": 3.697338565481339e-05, "loss": 0.1385, "loss_nan_ranks": 0, "loss_rank_avg": 0.13145369291305542, "step": 1855, "valid_targets_mean": 2702.2, "valid_targets_min": 910 }, { "epoch": 1.8235294117647058, "grad_norm": 0.4474403426831047, "learning_rate": 3.694747653091768e-05, "loss": 0.1487, "loss_nan_ranks": 0, "loss_rank_avg": 0.1498376429080963, "step": 1860, "valid_targets_mean": 2116.8, "valid_targets_min": 1030 }, { "epoch": 1.8284313725490198, "grad_norm": 0.38358293329939164, "learning_rate": 3.692146614114303e-05, "loss": 0.1247, "loss_nan_ranks": 0, "loss_rank_avg": 0.10769416391849518, "step": 1865, "valid_targets_mean": 2927.0, "valid_targets_min": 748 }, { "epoch": 1.8333333333333335, "grad_norm": 0.4665869269944144, "learning_rate": 3.689535464090873e-05, "loss": 0.139, "loss_nan_ranks": 0, "loss_rank_avg": 0.1278778612613678, "step": 1870, "valid_targets_mean": 2084.3, "valid_targets_min": 459 }, { "epoch": 1.8382352941176472, "grad_norm": 0.5307097608707636, "learning_rate": 3.686914218623827e-05, "loss": 0.1549, "loss_nan_ranks": 0, "loss_rank_avg": 0.14258277416229248, "step": 1875, "valid_targets_mean": 2299.4, "valid_targets_min": 502 }, { "epoch": 1.843137254901961, "grad_norm": 0.6080976433925368, "learning_rate": 3.684282893375832e-05, "loss": 0.1608, "loss_nan_ranks": 0, "loss_rank_avg": 0.19785189628601074, "step": 1880, "valid_targets_mean": 1875.2, "valid_targets_min": 540 }, { "epoch": 1.8480392156862746, "grad_norm": 0.5217574684853883, "learning_rate": 3.681641504069789e-05, "loss": 0.1482, "loss_nan_ranks": 0, "loss_rank_avg": 0.16252940893173218, "step": 1885, "valid_targets_mean": 1984.9, "valid_targets_min": 698 }, { "epoch": 1.8529411764705883, "grad_norm": 0.47220196862435904, "learning_rate": 3.678990066488732e-05, "loss": 0.1465, "loss_nan_ranks": 0, "loss_rank_avg": 0.1338098645210266, "step": 1890, "valid_targets_mean": 2058.9, "valid_targets_min": 697 }, { "epoch": 1.857843137254902, "grad_norm": 0.6141551360587747, "learning_rate": 3.676328596475737e-05, "loss": 0.177, "loss_nan_ranks": 0, "loss_rank_avg": 0.16199412941932678, "step": 1895, "valid_targets_mean": 1510.5, "valid_targets_min": 605 }, { "epoch": 1.8627450980392157, "grad_norm": 0.5205786315285574, "learning_rate": 3.673657109933825e-05, "loss": 0.1374, "loss_nan_ranks": 0, "loss_rank_avg": 0.14440283179283142, "step": 1900, "valid_targets_mean": 1927.1, "valid_targets_min": 557 }, { "epoch": 1.8676470588235294, "grad_norm": 0.4953417684318436, "learning_rate": 3.6709756228258735e-05, "loss": 0.1514, "loss_nan_ranks": 0, "loss_rank_avg": 0.1402466744184494, "step": 1905, "valid_targets_mean": 2096.1, "valid_targets_min": 759 }, { "epoch": 1.8725490196078431, "grad_norm": 0.4604839145265826, "learning_rate": 3.66828415117451e-05, "loss": 0.15, "loss_nan_ranks": 0, "loss_rank_avg": 0.1322975754737854, "step": 1910, "valid_targets_mean": 2135.5, "valid_targets_min": 629 }, { "epoch": 1.8774509803921569, "grad_norm": 0.6455850290038503, "learning_rate": 3.665582711062025e-05, "loss": 0.1688, "loss_nan_ranks": 0, "loss_rank_avg": 0.22754456102848053, "step": 1915, "valid_targets_mean": 1907.5, "valid_targets_min": 617 }, { "epoch": 1.8823529411764706, "grad_norm": 0.4715702383406565, "learning_rate": 3.662871318630274e-05, "loss": 0.1414, "loss_nan_ranks": 0, "loss_rank_avg": 0.15306609869003296, "step": 1920, "valid_targets_mean": 2446.2, "valid_targets_min": 816 }, { "epoch": 1.8872549019607843, "grad_norm": 0.41736403813308404, "learning_rate": 3.6601499900805806e-05, "loss": 0.136, "loss_nan_ranks": 0, "loss_rank_avg": 0.13367821276187897, "step": 1925, "valid_targets_mean": 3024.9, "valid_targets_min": 1184 }, { "epoch": 1.892156862745098, "grad_norm": 0.5399907281651121, "learning_rate": 3.657418741673638e-05, "loss": 0.1473, "loss_nan_ranks": 0, "loss_rank_avg": 0.13740979135036469, "step": 1930, "valid_targets_mean": 1898.3, "valid_targets_min": 530 }, { "epoch": 1.8970588235294117, "grad_norm": 0.5478245298908677, "learning_rate": 3.654677589729413e-05, "loss": 0.1374, "loss_nan_ranks": 0, "loss_rank_avg": 0.14879709482192993, "step": 1935, "valid_targets_mean": 2260.4, "valid_targets_min": 329 }, { "epoch": 1.9019607843137254, "grad_norm": 0.5065828787704405, "learning_rate": 3.6519265506270514e-05, "loss": 0.1487, "loss_nan_ranks": 0, "loss_rank_avg": 0.1565818339586258, "step": 1940, "valid_targets_mean": 2250.4, "valid_targets_min": 424 }, { "epoch": 1.906862745098039, "grad_norm": 0.36373265285176326, "learning_rate": 3.649165640804775e-05, "loss": 0.1393, "loss_nan_ranks": 0, "loss_rank_avg": 0.11532604694366455, "step": 1945, "valid_targets_mean": 2804.2, "valid_targets_min": 919 }, { "epoch": 1.9117647058823528, "grad_norm": 0.5378415324082915, "learning_rate": 3.6463948767597865e-05, "loss": 0.1594, "loss_nan_ranks": 0, "loss_rank_avg": 0.1640024185180664, "step": 1950, "valid_targets_mean": 1955.8, "valid_targets_min": 796 }, { "epoch": 1.9166666666666665, "grad_norm": 0.5486860769413845, "learning_rate": 3.643614275048172e-05, "loss": 0.146, "loss_nan_ranks": 0, "loss_rank_avg": 0.13714325428009033, "step": 1955, "valid_targets_mean": 1825.2, "valid_targets_min": 647 }, { "epoch": 1.9215686274509802, "grad_norm": 0.4885348084048327, "learning_rate": 3.640823852284797e-05, "loss": 0.1615, "loss_nan_ranks": 0, "loss_rank_avg": 0.14006605744361877, "step": 1960, "valid_targets_mean": 2088.1, "valid_targets_min": 832 }, { "epoch": 1.9264705882352942, "grad_norm": 0.43492961451338746, "learning_rate": 3.6380236251432135e-05, "loss": 0.1541, "loss_nan_ranks": 0, "loss_rank_avg": 0.1264418661594391, "step": 1965, "valid_targets_mean": 2195.3, "valid_targets_min": 776 }, { "epoch": 1.9313725490196079, "grad_norm": 0.40264611933976796, "learning_rate": 3.635213610355556e-05, "loss": 0.1651, "loss_nan_ranks": 0, "loss_rank_avg": 0.13179033994674683, "step": 1970, "valid_targets_mean": 2733.8, "valid_targets_min": 568 }, { "epoch": 1.9362745098039216, "grad_norm": 0.36990460761813326, "learning_rate": 3.632393824712444e-05, "loss": 0.1279, "loss_nan_ranks": 0, "loss_rank_avg": 0.1107700914144516, "step": 1975, "valid_targets_mean": 2647.9, "valid_targets_min": 777 }, { "epoch": 1.9411764705882353, "grad_norm": 0.41248718120084454, "learning_rate": 3.6295642850628785e-05, "loss": 0.1391, "loss_nan_ranks": 0, "loss_rank_avg": 0.10980524122714996, "step": 1980, "valid_targets_mean": 2564.8, "valid_targets_min": 513 }, { "epoch": 1.946078431372549, "grad_norm": 0.43158575489604406, "learning_rate": 3.626725008314146e-05, "loss": 0.1503, "loss_nan_ranks": 0, "loss_rank_avg": 0.1632903516292572, "step": 1985, "valid_targets_mean": 2678.8, "valid_targets_min": 635 }, { "epoch": 1.9509803921568627, "grad_norm": 0.3745578920161323, "learning_rate": 3.623876011431714e-05, "loss": 0.1426, "loss_nan_ranks": 0, "loss_rank_avg": 0.11174066364765167, "step": 1990, "valid_targets_mean": 2612.4, "valid_targets_min": 593 }, { "epoch": 1.9558823529411766, "grad_norm": 0.5970799142780278, "learning_rate": 3.621017311439127e-05, "loss": 0.1586, "loss_nan_ranks": 0, "loss_rank_avg": 0.15000393986701965, "step": 1995, "valid_targets_mean": 2207.6, "valid_targets_min": 575 }, { "epoch": 1.9607843137254903, "grad_norm": 0.6391894361261641, "learning_rate": 3.6181489254179154e-05, "loss": 0.1717, "loss_nan_ranks": 0, "loss_rank_avg": 0.1867298036813736, "step": 2000, "valid_targets_mean": 1771.7, "valid_targets_min": 607 }, { "epoch": 1.965686274509804, "grad_norm": 0.5067121980202994, "learning_rate": 3.6152708705074805e-05, "loss": 0.1761, "loss_nan_ranks": 0, "loss_rank_avg": 0.2050846666097641, "step": 2005, "valid_targets_mean": 2280.9, "valid_targets_min": 793 }, { "epoch": 1.9705882352941178, "grad_norm": 0.42741514259257013, "learning_rate": 3.612383163904999e-05, "loss": 0.163, "loss_nan_ranks": 0, "loss_rank_avg": 0.16011744737625122, "step": 2010, "valid_targets_mean": 2644.6, "valid_targets_min": 826 }, { "epoch": 1.9754901960784315, "grad_norm": 0.4918328620919532, "learning_rate": 3.609485822865321e-05, "loss": 0.1345, "loss_nan_ranks": 0, "loss_rank_avg": 0.15025535225868225, "step": 2015, "valid_targets_mean": 2447.8, "valid_targets_min": 946 }, { "epoch": 1.9803921568627452, "grad_norm": 0.4516353716793599, "learning_rate": 3.606578864700863e-05, "loss": 0.1478, "loss_nan_ranks": 0, "loss_rank_avg": 0.13741713762283325, "step": 2020, "valid_targets_mean": 2252.0, "valid_targets_min": 935 }, { "epoch": 1.9852941176470589, "grad_norm": 0.5604190301899437, "learning_rate": 3.603662306781507e-05, "loss": 0.1611, "loss_nan_ranks": 0, "loss_rank_avg": 0.16286993026733398, "step": 2025, "valid_targets_mean": 2178.6, "valid_targets_min": 611 }, { "epoch": 1.9901960784313726, "grad_norm": 0.527379241441151, "learning_rate": 3.600736166534499e-05, "loss": 0.1461, "loss_nan_ranks": 0, "loss_rank_avg": 0.17896302044391632, "step": 2030, "valid_targets_mean": 1935.2, "valid_targets_min": 780 }, { "epoch": 1.9950980392156863, "grad_norm": 0.5231350069083546, "learning_rate": 3.597800461444337e-05, "loss": 0.1464, "loss_nan_ranks": 0, "loss_rank_avg": 0.15988443791866302, "step": 2035, "valid_targets_mean": 1890.6, "valid_targets_min": 602 }, { "epoch": 2.0, "grad_norm": 0.3655620271489274, "learning_rate": 3.5948552090526747e-05, "loss": 0.1388, "loss_nan_ranks": 0, "loss_rank_avg": 0.10807867348194122, "step": 2040, "valid_targets_mean": 2740.8, "valid_targets_min": 636 }, { "epoch": 2.0049019607843137, "grad_norm": 0.44853090320448885, "learning_rate": 3.591900426958214e-05, "loss": 0.1252, "loss_nan_ranks": 0, "loss_rank_avg": 0.12851010262966156, "step": 2045, "valid_targets_mean": 2482.2, "valid_targets_min": 1061 }, { "epoch": 2.0098039215686274, "grad_norm": 0.4583868678990238, "learning_rate": 3.5889361328165984e-05, "loss": 0.1255, "loss_nan_ranks": 0, "loss_rank_avg": 0.12361206114292145, "step": 2050, "valid_targets_mean": 2640.2, "valid_targets_min": 682 }, { "epoch": 2.014705882352941, "grad_norm": 0.552121520532339, "learning_rate": 3.5859623443403073e-05, "loss": 0.1442, "loss_nan_ranks": 0, "loss_rank_avg": 0.17563346028327942, "step": 2055, "valid_targets_mean": 2000.2, "valid_targets_min": 659 }, { "epoch": 2.019607843137255, "grad_norm": 0.5194438436937125, "learning_rate": 3.582979079298554e-05, "loss": 0.131, "loss_nan_ranks": 0, "loss_rank_avg": 0.14061996340751648, "step": 2060, "valid_targets_mean": 2127.3, "valid_targets_min": 596 }, { "epoch": 2.0245098039215685, "grad_norm": 0.47306084034707796, "learning_rate": 3.579986355517176e-05, "loss": 0.1338, "loss_nan_ranks": 0, "loss_rank_avg": 0.1396002471446991, "step": 2065, "valid_targets_mean": 2682.8, "valid_targets_min": 707 }, { "epoch": 2.0294117647058822, "grad_norm": 0.46665365715691065, "learning_rate": 3.576984190878528e-05, "loss": 0.1431, "loss_nan_ranks": 0, "loss_rank_avg": 0.14326587319374084, "step": 2070, "valid_targets_mean": 2272.3, "valid_targets_min": 791 }, { "epoch": 2.034313725490196, "grad_norm": 0.61689314251335, "learning_rate": 3.5739726033213785e-05, "loss": 0.1171, "loss_nan_ranks": 0, "loss_rank_avg": 0.14959578216075897, "step": 2075, "valid_targets_mean": 1627.8, "valid_targets_min": 660 }, { "epoch": 2.0392156862745097, "grad_norm": 0.5457065769996188, "learning_rate": 3.570951610840798e-05, "loss": 0.1377, "loss_nan_ranks": 0, "loss_rank_avg": 0.13586756587028503, "step": 2080, "valid_targets_mean": 2058.1, "valid_targets_min": 684 }, { "epoch": 2.0441176470588234, "grad_norm": 0.4753398929172197, "learning_rate": 3.567921231488057e-05, "loss": 0.1238, "loss_nan_ranks": 0, "loss_rank_avg": 0.11476504802703857, "step": 2085, "valid_targets_mean": 2186.1, "valid_targets_min": 722 }, { "epoch": 2.049019607843137, "grad_norm": 0.4759520403773523, "learning_rate": 3.564881483370512e-05, "loss": 0.1263, "loss_nan_ranks": 0, "loss_rank_avg": 0.10093535482883453, "step": 2090, "valid_targets_mean": 2484.3, "valid_targets_min": 944 }, { "epoch": 2.053921568627451, "grad_norm": 0.47588801985114326, "learning_rate": 3.561832384651506e-05, "loss": 0.1239, "loss_nan_ranks": 0, "loss_rank_avg": 0.12644708156585693, "step": 2095, "valid_targets_mean": 2357.6, "valid_targets_min": 715 }, { "epoch": 2.0588235294117645, "grad_norm": 0.7125143297196016, "learning_rate": 3.5587739535502454e-05, "loss": 0.133, "loss_nan_ranks": 0, "loss_rank_avg": 0.1273224800825119, "step": 2100, "valid_targets_mean": 2272.1, "valid_targets_min": 654 }, { "epoch": 2.063725490196078, "grad_norm": 0.5202077844278824, "learning_rate": 3.5557062083417094e-05, "loss": 0.1374, "loss_nan_ranks": 0, "loss_rank_avg": 0.1436024308204651, "step": 2105, "valid_targets_mean": 2256.0, "valid_targets_min": 805 }, { "epoch": 2.0686274509803924, "grad_norm": 0.6356593180787531, "learning_rate": 3.5526291673565256e-05, "loss": 0.134, "loss_nan_ranks": 0, "loss_rank_avg": 0.1912994682788849, "step": 2110, "valid_targets_mean": 2107.8, "valid_targets_min": 801 }, { "epoch": 2.073529411764706, "grad_norm": 0.40074516453340914, "learning_rate": 3.5495428489808696e-05, "loss": 0.1247, "loss_nan_ranks": 0, "loss_rank_avg": 0.11367502808570862, "step": 2115, "valid_targets_mean": 2840.8, "valid_targets_min": 602 }, { "epoch": 2.0784313725490198, "grad_norm": 0.592311502287731, "learning_rate": 3.546447271656351e-05, "loss": 0.126, "loss_nan_ranks": 0, "loss_rank_avg": 0.1876107156276703, "step": 2120, "valid_targets_mean": 2378.8, "valid_targets_min": 743 }, { "epoch": 2.0833333333333335, "grad_norm": 0.5815462989037039, "learning_rate": 3.5433424538799024e-05, "loss": 0.1498, "loss_nan_ranks": 0, "loss_rank_avg": 0.14821037650108337, "step": 2125, "valid_targets_mean": 2055.6, "valid_targets_min": 544 }, { "epoch": 2.088235294117647, "grad_norm": 0.5589277406530077, "learning_rate": 3.5402284142036733e-05, "loss": 0.1258, "loss_nan_ranks": 0, "loss_rank_avg": 0.1250324249267578, "step": 2130, "valid_targets_mean": 1668.1, "valid_targets_min": 545 }, { "epoch": 2.093137254901961, "grad_norm": 0.43853845260878704, "learning_rate": 3.5371051712349156e-05, "loss": 0.1324, "loss_nan_ranks": 0, "loss_rank_avg": 0.11538475751876831, "step": 2135, "valid_targets_mean": 2481.9, "valid_targets_min": 761 }, { "epoch": 2.0980392156862746, "grad_norm": 0.5412188024421883, "learning_rate": 3.533972743635874e-05, "loss": 0.1235, "loss_nan_ranks": 0, "loss_rank_avg": 0.15065398812294006, "step": 2140, "valid_targets_mean": 2122.2, "valid_targets_min": 703 }, { "epoch": 2.1029411764705883, "grad_norm": 0.511228541672383, "learning_rate": 3.530831150123672e-05, "loss": 0.13, "loss_nan_ranks": 0, "loss_rank_avg": 0.10731547325849533, "step": 2145, "valid_targets_mean": 2195.9, "valid_targets_min": 646 }, { "epoch": 2.107843137254902, "grad_norm": 0.6186996765892316, "learning_rate": 3.527680409470205e-05, "loss": 0.1302, "loss_nan_ranks": 0, "loss_rank_avg": 0.1374223530292511, "step": 2150, "valid_targets_mean": 1655.9, "valid_targets_min": 502 }, { "epoch": 2.1127450980392157, "grad_norm": 0.5274842444330995, "learning_rate": 3.524520540502021e-05, "loss": 0.1361, "loss_nan_ranks": 0, "loss_rank_avg": 0.125177264213562, "step": 2155, "valid_targets_mean": 1779.2, "valid_targets_min": 593 }, { "epoch": 2.1176470588235294, "grad_norm": 0.39573551657318656, "learning_rate": 3.521351562100218e-05, "loss": 0.1381, "loss_nan_ranks": 0, "loss_rank_avg": 0.09408603608608246, "step": 2160, "valid_targets_mean": 2624.2, "valid_targets_min": 679 }, { "epoch": 2.122549019607843, "grad_norm": 0.49074741867654176, "learning_rate": 3.518173493200318e-05, "loss": 0.1313, "loss_nan_ranks": 0, "loss_rank_avg": 0.12309744954109192, "step": 2165, "valid_targets_mean": 2309.3, "valid_targets_min": 673 }, { "epoch": 2.127450980392157, "grad_norm": 0.528817977555379, "learning_rate": 3.514986352792169e-05, "loss": 0.129, "loss_nan_ranks": 0, "loss_rank_avg": 0.11972697079181671, "step": 2170, "valid_targets_mean": 2068.5, "valid_targets_min": 730 }, { "epoch": 2.1323529411764706, "grad_norm": 0.47728039921295046, "learning_rate": 3.511790159919818e-05, "loss": 0.1298, "loss_nan_ranks": 0, "loss_rank_avg": 0.1214258000254631, "step": 2175, "valid_targets_mean": 2368.5, "valid_targets_min": 827 }, { "epoch": 2.1372549019607843, "grad_norm": 0.48897620372182415, "learning_rate": 3.508584933681406e-05, "loss": 0.119, "loss_nan_ranks": 0, "loss_rank_avg": 0.1263759583234787, "step": 2180, "valid_targets_mean": 2689.0, "valid_targets_min": 669 }, { "epoch": 2.142156862745098, "grad_norm": 0.5061688289772812, "learning_rate": 3.5053706932290496e-05, "loss": 0.1207, "loss_nan_ranks": 0, "loss_rank_avg": 0.11041820049285889, "step": 2185, "valid_targets_mean": 2251.2, "valid_targets_min": 654 }, { "epoch": 2.1470588235294117, "grad_norm": 0.43813308425959413, "learning_rate": 3.502147457768727e-05, "loss": 0.1227, "loss_nan_ranks": 0, "loss_rank_avg": 0.10830570757389069, "step": 2190, "valid_targets_mean": 2631.1, "valid_targets_min": 777 }, { "epoch": 2.1519607843137254, "grad_norm": 0.968182961952041, "learning_rate": 3.4989152465601674e-05, "loss": 0.123, "loss_nan_ranks": 0, "loss_rank_avg": 0.12635761499404907, "step": 2195, "valid_targets_mean": 2246.6, "valid_targets_min": 497 }, { "epoch": 2.156862745098039, "grad_norm": 0.49739085063558636, "learning_rate": 3.4956740789167295e-05, "loss": 0.1411, "loss_nan_ranks": 0, "loss_rank_avg": 0.13866953551769257, "step": 2200, "valid_targets_mean": 2214.8, "valid_targets_min": 779 }, { "epoch": 2.161764705882353, "grad_norm": 0.5962862027967147, "learning_rate": 3.492423974205289e-05, "loss": 0.1248, "loss_nan_ranks": 0, "loss_rank_avg": 0.15598756074905396, "step": 2205, "valid_targets_mean": 1891.1, "valid_targets_min": 792 }, { "epoch": 2.1666666666666665, "grad_norm": 0.5592001479661793, "learning_rate": 3.489164951846126e-05, "loss": 0.1337, "loss_nan_ranks": 0, "loss_rank_avg": 0.13359807431697845, "step": 2210, "valid_targets_mean": 2060.6, "valid_targets_min": 741 }, { "epoch": 2.1715686274509802, "grad_norm": 0.5689778264268539, "learning_rate": 3.485897031312803e-05, "loss": 0.1454, "loss_nan_ranks": 0, "loss_rank_avg": 0.15123270452022552, "step": 2215, "valid_targets_mean": 1901.0, "valid_targets_min": 720 }, { "epoch": 2.176470588235294, "grad_norm": 0.5298808530933589, "learning_rate": 3.482620232132053e-05, "loss": 0.1329, "loss_nan_ranks": 0, "loss_rank_avg": 0.1346893608570099, "step": 2220, "valid_targets_mean": 2066.5, "valid_targets_min": 744 }, { "epoch": 2.1813725490196076, "grad_norm": 0.49863038928798403, "learning_rate": 3.479334573883661e-05, "loss": 0.126, "loss_nan_ranks": 0, "loss_rank_avg": 0.1366402953863144, "step": 2225, "valid_targets_mean": 2096.5, "valid_targets_min": 447 }, { "epoch": 2.186274509803922, "grad_norm": 0.5628304884727421, "learning_rate": 3.476040076200349e-05, "loss": 0.1263, "loss_nan_ranks": 0, "loss_rank_avg": 0.1595756709575653, "step": 2230, "valid_targets_mean": 2224.7, "valid_targets_min": 776 }, { "epoch": 2.1911764705882355, "grad_norm": 0.5623315824364589, "learning_rate": 3.4727367587676526e-05, "loss": 0.135, "loss_nan_ranks": 0, "loss_rank_avg": 0.13027265667915344, "step": 2235, "valid_targets_mean": 1854.1, "valid_targets_min": 629 }, { "epoch": 2.196078431372549, "grad_norm": 0.473141662338017, "learning_rate": 3.469424641323814e-05, "loss": 0.1331, "loss_nan_ranks": 0, "loss_rank_avg": 0.12759196758270264, "step": 2240, "valid_targets_mean": 2349.1, "valid_targets_min": 518 }, { "epoch": 2.200980392156863, "grad_norm": 0.41221711934436744, "learning_rate": 3.4661037436596526e-05, "loss": 0.1241, "loss_nan_ranks": 0, "loss_rank_avg": 0.10086143016815186, "step": 2245, "valid_targets_mean": 2314.2, "valid_targets_min": 720 }, { "epoch": 2.2058823529411766, "grad_norm": 0.46078471255102504, "learning_rate": 3.462774085618456e-05, "loss": 0.1365, "loss_nan_ranks": 0, "loss_rank_avg": 0.13009145855903625, "step": 2250, "valid_targets_mean": 2152.8, "valid_targets_min": 747 }, { "epoch": 2.2107843137254903, "grad_norm": 0.4447788825171731, "learning_rate": 3.459435687095854e-05, "loss": 0.12, "loss_nan_ranks": 0, "loss_rank_avg": 0.1283532679080963, "step": 2255, "valid_targets_mean": 2686.1, "valid_targets_min": 564 }, { "epoch": 2.215686274509804, "grad_norm": 0.4495583706963151, "learning_rate": 3.456088568039706e-05, "loss": 0.1394, "loss_nan_ranks": 0, "loss_rank_avg": 0.12000022828578949, "step": 2260, "valid_targets_mean": 2626.5, "valid_targets_min": 887 }, { "epoch": 2.2205882352941178, "grad_norm": 0.4341070451837946, "learning_rate": 3.4527327484499774e-05, "loss": 0.1242, "loss_nan_ranks": 0, "loss_rank_avg": 0.11233153194189072, "step": 2265, "valid_targets_mean": 2346.6, "valid_targets_min": 649 }, { "epoch": 2.2254901960784315, "grad_norm": 0.6511108625477997, "learning_rate": 3.4493682483786224e-05, "loss": 0.13, "loss_nan_ranks": 0, "loss_rank_avg": 0.1597345620393753, "step": 2270, "valid_targets_mean": 1768.8, "valid_targets_min": 803 }, { "epoch": 2.230392156862745, "grad_norm": 0.5060816776168183, "learning_rate": 3.445995087929463e-05, "loss": 0.1306, "loss_nan_ranks": 0, "loss_rank_avg": 0.12492702901363373, "step": 2275, "valid_targets_mean": 1925.5, "valid_targets_min": 848 }, { "epoch": 2.235294117647059, "grad_norm": 0.3940204045235387, "learning_rate": 3.44261328725807e-05, "loss": 0.1382, "loss_nan_ranks": 0, "loss_rank_avg": 0.12375809997320175, "step": 2280, "valid_targets_mean": 2956.6, "valid_targets_min": 1185 }, { "epoch": 2.2401960784313726, "grad_norm": 0.444465719098011, "learning_rate": 3.439222866571642e-05, "loss": 0.1115, "loss_nan_ranks": 0, "loss_rank_avg": 0.12371980398893356, "step": 2285, "valid_targets_mean": 2072.8, "valid_targets_min": 598 }, { "epoch": 2.2450980392156863, "grad_norm": 0.4260395688487762, "learning_rate": 3.435823846128884e-05, "loss": 0.1414, "loss_nan_ranks": 0, "loss_rank_avg": 0.13873659074306488, "step": 2290, "valid_targets_mean": 2553.1, "valid_targets_min": 693 }, { "epoch": 2.25, "grad_norm": 0.43623375929776165, "learning_rate": 3.4324162462398866e-05, "loss": 0.1358, "loss_nan_ranks": 0, "loss_rank_avg": 0.11390223354101181, "step": 2295, "valid_targets_mean": 2437.5, "valid_targets_min": 661 }, { "epoch": 2.2549019607843137, "grad_norm": 0.3515272676523296, "learning_rate": 3.429000087266006e-05, "loss": 0.1264, "loss_nan_ranks": 0, "loss_rank_avg": 0.09347573667764664, "step": 2300, "valid_targets_mean": 3243.8, "valid_targets_min": 1082 }, { "epoch": 2.2598039215686274, "grad_norm": 0.4408806721575717, "learning_rate": 3.425575389619741e-05, "loss": 0.1349, "loss_nan_ranks": 0, "loss_rank_avg": 0.11834917962551117, "step": 2305, "valid_targets_mean": 2635.5, "valid_targets_min": 593 }, { "epoch": 2.264705882352941, "grad_norm": 0.5346131341964713, "learning_rate": 3.4221421737646104e-05, "loss": 0.1238, "loss_nan_ranks": 0, "loss_rank_avg": 0.12321878224611282, "step": 2310, "valid_targets_mean": 2153.0, "valid_targets_min": 754 }, { "epoch": 2.269607843137255, "grad_norm": 0.5305132857296478, "learning_rate": 3.418700460215033e-05, "loss": 0.1413, "loss_nan_ranks": 0, "loss_rank_avg": 0.12815603613853455, "step": 2315, "valid_targets_mean": 2050.9, "valid_targets_min": 762 }, { "epoch": 2.2745098039215685, "grad_norm": 0.48597505457985135, "learning_rate": 3.415250269536203e-05, "loss": 0.1305, "loss_nan_ranks": 0, "loss_rank_avg": 0.1451520174741745, "step": 2320, "valid_targets_mean": 2444.1, "valid_targets_min": 759 }, { "epoch": 2.2794117647058822, "grad_norm": 0.5662194806363534, "learning_rate": 3.411791622343967e-05, "loss": 0.1312, "loss_nan_ranks": 0, "loss_rank_avg": 0.13560031354427338, "step": 2325, "valid_targets_mean": 1847.0, "valid_targets_min": 818 }, { "epoch": 2.284313725490196, "grad_norm": 0.451292753609537, "learning_rate": 3.408324539304704e-05, "loss": 0.1133, "loss_nan_ranks": 0, "loss_rank_avg": 0.11846590787172318, "step": 2330, "valid_targets_mean": 2227.3, "valid_targets_min": 749 }, { "epoch": 2.2892156862745097, "grad_norm": 0.4404840749164589, "learning_rate": 3.404849041135197e-05, "loss": 0.1349, "loss_nan_ranks": 0, "loss_rank_avg": 0.11944162845611572, "step": 2335, "valid_targets_mean": 2625.9, "valid_targets_min": 722 }, { "epoch": 2.2941176470588234, "grad_norm": 0.4777756658786973, "learning_rate": 3.4013651486025135e-05, "loss": 0.1296, "loss_nan_ranks": 0, "loss_rank_avg": 0.12575772404670715, "step": 2340, "valid_targets_mean": 2447.4, "valid_targets_min": 666 }, { "epoch": 2.299019607843137, "grad_norm": 0.5519792965011824, "learning_rate": 3.3978728825238787e-05, "loss": 0.1432, "loss_nan_ranks": 0, "loss_rank_avg": 0.14594820141792297, "step": 2345, "valid_targets_mean": 2089.8, "valid_targets_min": 700 }, { "epoch": 2.303921568627451, "grad_norm": 0.5812553672215698, "learning_rate": 3.394372263766552e-05, "loss": 0.1291, "loss_nan_ranks": 0, "loss_rank_avg": 0.10362367331981659, "step": 2350, "valid_targets_mean": 2284.7, "valid_targets_min": 817 }, { "epoch": 2.3088235294117645, "grad_norm": 0.4691399073192363, "learning_rate": 3.390863313247702e-05, "loss": 0.1202, "loss_nan_ranks": 0, "loss_rank_avg": 0.11229017376899719, "step": 2355, "valid_targets_mean": 2364.8, "valid_targets_min": 680 }, { "epoch": 2.313725490196078, "grad_norm": 0.49890381302134496, "learning_rate": 3.3873460519342847e-05, "loss": 0.1354, "loss_nan_ranks": 0, "loss_rank_avg": 0.1161687970161438, "step": 2360, "valid_targets_mean": 2548.6, "valid_targets_min": 720 }, { "epoch": 2.318627450980392, "grad_norm": 0.48881421124675306, "learning_rate": 3.3838205008429114e-05, "loss": 0.1255, "loss_nan_ranks": 0, "loss_rank_avg": 0.10132157802581787, "step": 2365, "valid_targets_mean": 2347.0, "valid_targets_min": 677 }, { "epoch": 2.323529411764706, "grad_norm": 0.5687640140377678, "learning_rate": 3.38028668103973e-05, "loss": 0.1317, "loss_nan_ranks": 0, "loss_rank_avg": 0.15966284275054932, "step": 2370, "valid_targets_mean": 2005.6, "valid_targets_min": 842 }, { "epoch": 2.3284313725490198, "grad_norm": 0.5241977540459799, "learning_rate": 3.376744613640294e-05, "loss": 0.1325, "loss_nan_ranks": 0, "loss_rank_avg": 0.12451574206352234, "step": 2375, "valid_targets_mean": 2067.6, "valid_targets_min": 970 }, { "epoch": 2.3333333333333335, "grad_norm": 0.4441320290066578, "learning_rate": 3.37319431980944e-05, "loss": 0.1186, "loss_nan_ranks": 0, "loss_rank_avg": 0.12139909714460373, "step": 2380, "valid_targets_mean": 2486.1, "valid_targets_min": 776 }, { "epoch": 2.338235294117647, "grad_norm": 0.3958964877558289, "learning_rate": 3.369635820761162e-05, "loss": 0.1287, "loss_nan_ranks": 0, "loss_rank_avg": 0.10344143211841583, "step": 2385, "valid_targets_mean": 2639.9, "valid_targets_min": 820 }, { "epoch": 2.343137254901961, "grad_norm": 0.4235899191085017, "learning_rate": 3.3660691377584774e-05, "loss": 0.1294, "loss_nan_ranks": 0, "loss_rank_avg": 0.11542128026485443, "step": 2390, "valid_targets_mean": 2604.4, "valid_targets_min": 645 }, { "epoch": 2.3480392156862746, "grad_norm": 0.4510881066136338, "learning_rate": 3.362494292113308e-05, "loss": 0.1301, "loss_nan_ranks": 0, "loss_rank_avg": 0.1214420273900032, "step": 2395, "valid_targets_mean": 2498.9, "valid_targets_min": 1012 }, { "epoch": 2.3529411764705883, "grad_norm": 0.5100119277747269, "learning_rate": 3.358911305186351e-05, "loss": 0.1323, "loss_nan_ranks": 0, "loss_rank_avg": 0.1164846122264862, "step": 2400, "valid_targets_mean": 1774.4, "valid_targets_min": 572 }, { "epoch": 2.357843137254902, "grad_norm": 0.4567649270223125, "learning_rate": 3.355320198386947e-05, "loss": 0.1166, "loss_nan_ranks": 0, "loss_rank_avg": 0.10715487599372864, "step": 2405, "valid_targets_mean": 2297.6, "valid_targets_min": 673 }, { "epoch": 2.3627450980392157, "grad_norm": 0.4873938724406906, "learning_rate": 3.351720993172957e-05, "loss": 0.1272, "loss_nan_ranks": 0, "loss_rank_avg": 0.11813487857580185, "step": 2410, "valid_targets_mean": 2144.9, "valid_targets_min": 766 }, { "epoch": 2.3676470588235294, "grad_norm": 0.4469656890585901, "learning_rate": 3.3481137110506305e-05, "loss": 0.1219, "loss_nan_ranks": 0, "loss_rank_avg": 0.10170838981866837, "step": 2415, "valid_targets_mean": 2247.9, "valid_targets_min": 689 }, { "epoch": 2.372549019607843, "grad_norm": 0.47619819728984353, "learning_rate": 3.344498373574482e-05, "loss": 0.1317, "loss_nan_ranks": 0, "loss_rank_avg": 0.14894942939281464, "step": 2420, "valid_targets_mean": 2214.6, "valid_targets_min": 731 }, { "epoch": 2.377450980392157, "grad_norm": 0.5003725526992597, "learning_rate": 3.340875002347156e-05, "loss": 0.1368, "loss_nan_ranks": 0, "loss_rank_avg": 0.13846082985401154, "step": 2425, "valid_targets_mean": 2310.4, "valid_targets_min": 699 }, { "epoch": 2.3823529411764706, "grad_norm": 0.5491326217204983, "learning_rate": 3.337243619019301e-05, "loss": 0.1288, "loss_nan_ranks": 0, "loss_rank_avg": 0.1536971479654312, "step": 2430, "valid_targets_mean": 1858.8, "valid_targets_min": 715 }, { "epoch": 2.3872549019607843, "grad_norm": 0.5328613699348111, "learning_rate": 3.3336042452894425e-05, "loss": 0.1144, "loss_nan_ranks": 0, "loss_rank_avg": 0.11894248425960541, "step": 2435, "valid_targets_mean": 1888.1, "valid_targets_min": 658 }, { "epoch": 2.392156862745098, "grad_norm": 0.5532164249157558, "learning_rate": 3.329956902903848e-05, "loss": 0.126, "loss_nan_ranks": 0, "loss_rank_avg": 0.14720863103866577, "step": 2440, "valid_targets_mean": 2460.6, "valid_targets_min": 523 }, { "epoch": 2.3970588235294117, "grad_norm": 0.6305635545547962, "learning_rate": 3.326301613656402e-05, "loss": 0.1345, "loss_nan_ranks": 0, "loss_rank_avg": 0.16992811858654022, "step": 2445, "valid_targets_mean": 2158.1, "valid_targets_min": 834 }, { "epoch": 2.4019607843137254, "grad_norm": 0.47367213497868, "learning_rate": 3.322638399388472e-05, "loss": 0.1365, "loss_nan_ranks": 0, "loss_rank_avg": 0.12942060828208923, "step": 2450, "valid_targets_mean": 2176.0, "valid_targets_min": 913 }, { "epoch": 2.406862745098039, "grad_norm": 0.5708011022431659, "learning_rate": 3.318967281988782e-05, "loss": 0.1406, "loss_nan_ranks": 0, "loss_rank_avg": 0.1652604639530182, "step": 2455, "valid_targets_mean": 2101.6, "valid_targets_min": 819 }, { "epoch": 2.411764705882353, "grad_norm": 0.5099338224778304, "learning_rate": 3.3152882833932766e-05, "loss": 0.1178, "loss_nan_ranks": 0, "loss_rank_avg": 0.127591073513031, "step": 2460, "valid_targets_mean": 2128.4, "valid_targets_min": 615 }, { "epoch": 2.4166666666666665, "grad_norm": 0.5003755514174549, "learning_rate": 3.311601425584996e-05, "loss": 0.138, "loss_nan_ranks": 0, "loss_rank_avg": 0.13985368609428406, "step": 2465, "valid_targets_mean": 2125.7, "valid_targets_min": 740 }, { "epoch": 2.4215686274509802, "grad_norm": 0.5924950139777752, "learning_rate": 3.3079067305939366e-05, "loss": 0.1433, "loss_nan_ranks": 0, "loss_rank_avg": 0.14252334833145142, "step": 2470, "valid_targets_mean": 2268.9, "valid_targets_min": 1037 }, { "epoch": 2.426470588235294, "grad_norm": 0.5314224716211676, "learning_rate": 3.3042042204969296e-05, "loss": 0.1311, "loss_nan_ranks": 0, "loss_rank_avg": 0.14862433075904846, "step": 2475, "valid_targets_mean": 2261.7, "valid_targets_min": 560 }, { "epoch": 2.431372549019608, "grad_norm": 0.506747952151037, "learning_rate": 3.3004939174175e-05, "loss": 0.1357, "loss_nan_ranks": 0, "loss_rank_avg": 0.139796644449234, "step": 2480, "valid_targets_mean": 2169.8, "valid_targets_min": 735 }, { "epoch": 2.436274509803922, "grad_norm": 0.5891764902816398, "learning_rate": 3.296775843525739e-05, "loss": 0.127, "loss_nan_ranks": 0, "loss_rank_avg": 0.12421401590108871, "step": 2485, "valid_targets_mean": 1692.9, "valid_targets_min": 641 }, { "epoch": 2.4411764705882355, "grad_norm": 0.39384181544170843, "learning_rate": 3.293050021038171e-05, "loss": 0.1309, "loss_nan_ranks": 0, "loss_rank_avg": 0.12514618039131165, "step": 2490, "valid_targets_mean": 2835.9, "valid_targets_min": 890 }, { "epoch": 2.446078431372549, "grad_norm": 0.5466808342373171, "learning_rate": 3.289316472217621e-05, "loss": 0.1345, "loss_nan_ranks": 0, "loss_rank_avg": 0.15848739445209503, "step": 2495, "valid_targets_mean": 1778.9, "valid_targets_min": 602 }, { "epoch": 2.450980392156863, "grad_norm": 0.4536221374191153, "learning_rate": 3.285575219373079e-05, "loss": 0.1279, "loss_nan_ranks": 0, "loss_rank_avg": 0.11861887574195862, "step": 2500, "valid_targets_mean": 2401.6, "valid_targets_min": 809 }, { "epoch": 2.4558823529411766, "grad_norm": 0.39556844985138695, "learning_rate": 3.2818262848595696e-05, "loss": 0.1168, "loss_nan_ranks": 0, "loss_rank_avg": 0.09962082654237747, "step": 2505, "valid_targets_mean": 2596.6, "valid_targets_min": 922 }, { "epoch": 2.4607843137254903, "grad_norm": 0.5563691562257486, "learning_rate": 3.2780696910780185e-05, "loss": 0.1209, "loss_nan_ranks": 0, "loss_rank_avg": 0.14485809206962585, "step": 2510, "valid_targets_mean": 1906.2, "valid_targets_min": 696 }, { "epoch": 2.465686274509804, "grad_norm": 0.48374305437067666, "learning_rate": 3.274305460475116e-05, "loss": 0.1303, "loss_nan_ranks": 0, "loss_rank_avg": 0.1370125412940979, "step": 2515, "valid_targets_mean": 2272.5, "valid_targets_min": 680 }, { "epoch": 2.4705882352941178, "grad_norm": 0.4042482270802887, "learning_rate": 3.270533615543186e-05, "loss": 0.1577, "loss_nan_ranks": 0, "loss_rank_avg": 0.11950810253620148, "step": 2520, "valid_targets_mean": 2691.9, "valid_targets_min": 522 }, { "epoch": 2.4754901960784315, "grad_norm": 0.7546679032370863, "learning_rate": 3.2667541788200496e-05, "loss": 0.1359, "loss_nan_ranks": 0, "loss_rank_avg": 0.11613636463880539, "step": 2525, "valid_targets_mean": 2143.2, "valid_targets_min": 643 }, { "epoch": 2.480392156862745, "grad_norm": 0.41794384750016256, "learning_rate": 3.26296717288889e-05, "loss": 0.136, "loss_nan_ranks": 0, "loss_rank_avg": 0.1214665025472641, "step": 2530, "valid_targets_mean": 2751.1, "valid_targets_min": 1144 }, { "epoch": 2.485294117647059, "grad_norm": 0.5553263208758342, "learning_rate": 3.2591726203781205e-05, "loss": 0.1177, "loss_nan_ranks": 0, "loss_rank_avg": 0.13100360333919525, "step": 2535, "valid_targets_mean": 2431.9, "valid_targets_min": 693 }, { "epoch": 2.4901960784313726, "grad_norm": 0.47914372549026196, "learning_rate": 3.255370543961245e-05, "loss": 0.1336, "loss_nan_ranks": 0, "loss_rank_avg": 0.1484772264957428, "step": 2540, "valid_targets_mean": 2592.8, "valid_targets_min": 771 }, { "epoch": 2.4950980392156863, "grad_norm": 0.4662138254088204, "learning_rate": 3.2515609663567266e-05, "loss": 0.1361, "loss_nan_ranks": 0, "loss_rank_avg": 0.16803815960884094, "step": 2545, "valid_targets_mean": 2494.6, "valid_targets_min": 633 }, { "epoch": 2.5, "grad_norm": 0.3930868423643063, "learning_rate": 3.247743910327849e-05, "loss": 0.1211, "loss_nan_ranks": 0, "loss_rank_avg": 0.11918853223323822, "step": 2550, "valid_targets_mean": 2764.6, "valid_targets_min": 1225 }, { "epoch": 2.5049019607843137, "grad_norm": 0.5290514066877043, "learning_rate": 3.2439193986825835e-05, "loss": 0.1289, "loss_nan_ranks": 0, "loss_rank_avg": 0.1352325975894928, "step": 2555, "valid_targets_mean": 2115.9, "valid_targets_min": 519 }, { "epoch": 2.5098039215686274, "grad_norm": 0.46854808906106793, "learning_rate": 3.240087454273448e-05, "loss": 0.1295, "loss_nan_ranks": 0, "loss_rank_avg": 0.12803807854652405, "step": 2560, "valid_targets_mean": 2416.5, "valid_targets_min": 615 }, { "epoch": 2.514705882352941, "grad_norm": 0.43005809391608746, "learning_rate": 3.2362480999973744e-05, "loss": 0.1274, "loss_nan_ranks": 0, "loss_rank_avg": 0.1205533966422081, "step": 2565, "valid_targets_mean": 2505.1, "valid_targets_min": 1080 }, { "epoch": 2.519607843137255, "grad_norm": 0.547921133473076, "learning_rate": 3.2324013587955716e-05, "loss": 0.1248, "loss_nan_ranks": 0, "loss_rank_avg": 0.1539292335510254, "step": 2570, "valid_targets_mean": 2068.6, "valid_targets_min": 700 }, { "epoch": 2.5245098039215685, "grad_norm": 0.48177977616801043, "learning_rate": 3.228547253653386e-05, "loss": 0.1334, "loss_nan_ranks": 0, "loss_rank_avg": 0.13383543491363525, "step": 2575, "valid_targets_mean": 2834.5, "valid_targets_min": 790 }, { "epoch": 2.5294117647058822, "grad_norm": 0.4326265292915774, "learning_rate": 3.2246858076001674e-05, "loss": 0.1287, "loss_nan_ranks": 0, "loss_rank_avg": 0.12128859758377075, "step": 2580, "valid_targets_mean": 2535.4, "valid_targets_min": 986 }, { "epoch": 2.534313725490196, "grad_norm": 0.5318647060540064, "learning_rate": 3.2208170437091267e-05, "loss": 0.1199, "loss_nan_ranks": 0, "loss_rank_avg": 0.12436534464359283, "step": 2585, "valid_targets_mean": 2196.9, "valid_targets_min": 701 }, { "epoch": 2.5392156862745097, "grad_norm": 0.4846752026333883, "learning_rate": 3.216940985097203e-05, "loss": 0.1223, "loss_nan_ranks": 0, "loss_rank_avg": 0.1433335542678833, "step": 2590, "valid_targets_mean": 2433.1, "valid_targets_min": 727 }, { "epoch": 2.5441176470588234, "grad_norm": 0.4239896532044266, "learning_rate": 3.213057654924924e-05, "loss": 0.1257, "loss_nan_ranks": 0, "loss_rank_avg": 0.11380953341722488, "step": 2595, "valid_targets_mean": 2302.8, "valid_targets_min": 808 }, { "epoch": 2.549019607843137, "grad_norm": 0.44078999516335776, "learning_rate": 3.2091670763962645e-05, "loss": 0.127, "loss_nan_ranks": 0, "loss_rank_avg": 0.12046624720096588, "step": 2600, "valid_targets_mean": 2539.6, "valid_targets_min": 837 }, { "epoch": 2.553921568627451, "grad_norm": 0.5939898023952678, "learning_rate": 3.205269272758513e-05, "loss": 0.1252, "loss_nan_ranks": 0, "loss_rank_avg": 0.11827564239501953, "step": 2605, "valid_targets_mean": 2455.4, "valid_targets_min": 723 }, { "epoch": 2.5588235294117645, "grad_norm": 0.5448767219249958, "learning_rate": 3.201364267302128e-05, "loss": 0.1242, "loss_nan_ranks": 0, "loss_rank_avg": 0.13409531116485596, "step": 2610, "valid_targets_mean": 1850.7, "valid_targets_min": 731 }, { "epoch": 2.563725490196078, "grad_norm": 0.47561028426644697, "learning_rate": 3.1974520833606016e-05, "loss": 0.1222, "loss_nan_ranks": 0, "loss_rank_avg": 0.11841538548469543, "step": 2615, "valid_targets_mean": 2128.8, "valid_targets_min": 663 }, { "epoch": 2.568627450980392, "grad_norm": 0.5378413990458727, "learning_rate": 3.1935327443103195e-05, "loss": 0.1182, "loss_nan_ranks": 0, "loss_rank_avg": 0.12730035185813904, "step": 2620, "valid_targets_mean": 1888.8, "valid_targets_min": 741 }, { "epoch": 2.5735294117647056, "grad_norm": 0.4922033292560799, "learning_rate": 3.189606273570422e-05, "loss": 0.1395, "loss_nan_ranks": 0, "loss_rank_avg": 0.13984598219394684, "step": 2625, "valid_targets_mean": 2094.8, "valid_targets_min": 726 }, { "epoch": 2.5784313725490198, "grad_norm": 0.6332583070833103, "learning_rate": 3.18567269460266e-05, "loss": 0.1218, "loss_nan_ranks": 0, "loss_rank_avg": 0.1428709626197815, "step": 2630, "valid_targets_mean": 1739.6, "valid_targets_min": 843 }, { "epoch": 2.5833333333333335, "grad_norm": 0.5513161663336141, "learning_rate": 3.1817320309112625e-05, "loss": 0.1401, "loss_nan_ranks": 0, "loss_rank_avg": 0.14765672385692596, "step": 2635, "valid_targets_mean": 1715.8, "valid_targets_min": 795 }, { "epoch": 2.588235294117647, "grad_norm": 0.6440133895872631, "learning_rate": 3.1777843060427876e-05, "loss": 0.1301, "loss_nan_ranks": 0, "loss_rank_avg": 0.15483424067497253, "step": 2640, "valid_targets_mean": 1774.8, "valid_targets_min": 514 }, { "epoch": 2.593137254901961, "grad_norm": 0.5336887900173594, "learning_rate": 3.173829543585989e-05, "loss": 0.1515, "loss_nan_ranks": 0, "loss_rank_avg": 0.20561406016349792, "step": 2645, "valid_targets_mean": 2104.5, "valid_targets_min": 530 }, { "epoch": 2.5980392156862746, "grad_norm": 0.4490637951442281, "learning_rate": 3.1698677671716716e-05, "loss": 0.1176, "loss_nan_ranks": 0, "loss_rank_avg": 0.1061968132853508, "step": 2650, "valid_targets_mean": 1995.6, "valid_targets_min": 715 }, { "epoch": 2.6029411764705883, "grad_norm": 0.502444501852284, "learning_rate": 3.1658990004725464e-05, "loss": 0.136, "loss_nan_ranks": 0, "loss_rank_avg": 0.11915481835603714, "step": 2655, "valid_targets_mean": 2343.6, "valid_targets_min": 714 }, { "epoch": 2.607843137254902, "grad_norm": 0.5390839949044163, "learning_rate": 3.1619232672031e-05, "loss": 0.1382, "loss_nan_ranks": 0, "loss_rank_avg": 0.1582946479320526, "step": 2660, "valid_targets_mean": 2198.4, "valid_targets_min": 655 }, { "epoch": 2.6127450980392157, "grad_norm": 0.5051852498871383, "learning_rate": 3.157940591119442e-05, "loss": 0.144, "loss_nan_ranks": 0, "loss_rank_avg": 0.15259839594364166, "step": 2665, "valid_targets_mean": 1985.2, "valid_targets_min": 784 }, { "epoch": 2.6176470588235294, "grad_norm": 0.49993466913907697, "learning_rate": 3.153950996019166e-05, "loss": 0.1162, "loss_nan_ranks": 0, "loss_rank_avg": 0.12850934267044067, "step": 2670, "valid_targets_mean": 2113.2, "valid_targets_min": 526 }, { "epoch": 2.622549019607843, "grad_norm": 0.5137848708127476, "learning_rate": 3.149954505741214e-05, "loss": 0.1219, "loss_nan_ranks": 0, "loss_rank_avg": 0.1415955126285553, "step": 2675, "valid_targets_mean": 1886.8, "valid_targets_min": 806 }, { "epoch": 2.627450980392157, "grad_norm": 0.49292793100332416, "learning_rate": 3.1459511441657225e-05, "loss": 0.1382, "loss_nan_ranks": 0, "loss_rank_avg": 0.13631919026374817, "step": 2680, "valid_targets_mean": 2043.3, "valid_targets_min": 688 }, { "epoch": 2.6323529411764706, "grad_norm": 0.5216681230311012, "learning_rate": 3.141940935213891e-05, "loss": 0.1315, "loss_nan_ranks": 0, "loss_rank_avg": 0.12248043715953827, "step": 2685, "valid_targets_mean": 2078.9, "valid_targets_min": 605 }, { "epoch": 2.6372549019607843, "grad_norm": 0.4707375189641917, "learning_rate": 3.13792390284783e-05, "loss": 0.1354, "loss_nan_ranks": 0, "loss_rank_avg": 0.13096097111701965, "step": 2690, "valid_targets_mean": 2617.3, "valid_targets_min": 825 }, { "epoch": 2.642156862745098, "grad_norm": 0.5264160275079668, "learning_rate": 3.1339000710704234e-05, "loss": 0.1327, "loss_nan_ranks": 0, "loss_rank_avg": 0.1339496374130249, "step": 2695, "valid_targets_mean": 1860.3, "valid_targets_min": 691 }, { "epoch": 2.6470588235294117, "grad_norm": 1.8516330663101164, "learning_rate": 3.129869463925185e-05, "loss": 0.1452, "loss_nan_ranks": 0, "loss_rank_avg": 0.128217414021492, "step": 2700, "valid_targets_mean": 2713.3, "valid_targets_min": 869 }, { "epoch": 2.6519607843137254, "grad_norm": 0.5964001445350231, "learning_rate": 3.125832105496112e-05, "loss": 0.1194, "loss_nan_ranks": 0, "loss_rank_avg": 0.14027449488639832, "step": 2705, "valid_targets_mean": 1682.3, "valid_targets_min": 753 }, { "epoch": 2.656862745098039, "grad_norm": 0.46865445803340855, "learning_rate": 3.12178801990754e-05, "loss": 0.133, "loss_nan_ranks": 0, "loss_rank_avg": 0.15145006775856018, "step": 2710, "valid_targets_mean": 2126.5, "valid_targets_min": 692 }, { "epoch": 2.661764705882353, "grad_norm": 0.5266520204218963, "learning_rate": 3.1177372313240056e-05, "loss": 0.1408, "loss_nan_ranks": 0, "loss_rank_avg": 0.14159266650676727, "step": 2715, "valid_targets_mean": 2026.8, "valid_targets_min": 668 }, { "epoch": 2.6666666666666665, "grad_norm": 0.47431158065227663, "learning_rate": 3.1136797639500946e-05, "loss": 0.1327, "loss_nan_ranks": 0, "loss_rank_avg": 0.1264529824256897, "step": 2720, "valid_targets_mean": 2156.2, "valid_targets_min": 663 }, { "epoch": 2.6715686274509802, "grad_norm": 0.46172333007882593, "learning_rate": 3.109615642030302e-05, "loss": 0.1186, "loss_nan_ranks": 0, "loss_rank_avg": 0.12161999940872192, "step": 2725, "valid_targets_mean": 2365.8, "valid_targets_min": 596 }, { "epoch": 2.6764705882352944, "grad_norm": 0.5417612997694451, "learning_rate": 3.105544889848885e-05, "loss": 0.1422, "loss_nan_ranks": 0, "loss_rank_avg": 0.15983346104621887, "step": 2730, "valid_targets_mean": 1985.2, "valid_targets_min": 458 }, { "epoch": 2.681372549019608, "grad_norm": 0.5602903369720046, "learning_rate": 3.101467531729718e-05, "loss": 0.1274, "loss_nan_ranks": 0, "loss_rank_avg": 0.1274542212486267, "step": 2735, "valid_targets_mean": 1546.2, "valid_targets_min": 591 }, { "epoch": 2.686274509803922, "grad_norm": 0.4499642056569709, "learning_rate": 3.0973835920361485e-05, "loss": 0.1319, "loss_nan_ranks": 0, "loss_rank_avg": 0.12221525609493256, "step": 2740, "valid_targets_mean": 2619.2, "valid_targets_min": 923 }, { "epoch": 2.6911764705882355, "grad_norm": 0.49926621820934225, "learning_rate": 3.093293095170849e-05, "loss": 0.1272, "loss_nan_ranks": 0, "loss_rank_avg": 0.14079585671424866, "step": 2745, "valid_targets_mean": 1941.2, "valid_targets_min": 676 }, { "epoch": 2.696078431372549, "grad_norm": 0.47853732191376075, "learning_rate": 3.089196065575676e-05, "loss": 0.1178, "loss_nan_ranks": 0, "loss_rank_avg": 0.13084784150123596, "step": 2750, "valid_targets_mean": 2173.8, "valid_targets_min": 756 }, { "epoch": 2.700980392156863, "grad_norm": 0.4604079974584735, "learning_rate": 3.0850925277315193e-05, "loss": 0.1236, "loss_nan_ranks": 0, "loss_rank_avg": 0.1272059977054596, "step": 2755, "valid_targets_mean": 2368.0, "valid_targets_min": 720 }, { "epoch": 2.7058823529411766, "grad_norm": 0.5077703112679872, "learning_rate": 3.080982506158155e-05, "loss": 0.1288, "loss_nan_ranks": 0, "loss_rank_avg": 0.12848421931266785, "step": 2760, "valid_targets_mean": 1888.6, "valid_targets_min": 679 }, { "epoch": 2.7107843137254903, "grad_norm": 0.4333748156398904, "learning_rate": 3.076866025414107e-05, "loss": 0.1163, "loss_nan_ranks": 0, "loss_rank_avg": 0.10613423585891724, "step": 2765, "valid_targets_mean": 2228.8, "valid_targets_min": 650 }, { "epoch": 2.715686274509804, "grad_norm": 0.5617367615142488, "learning_rate": 3.072743110096487e-05, "loss": 0.136, "loss_nan_ranks": 0, "loss_rank_avg": 0.11530651152133942, "step": 2770, "valid_targets_mean": 2036.8, "valid_targets_min": 678 }, { "epoch": 2.7205882352941178, "grad_norm": 0.5711011470753721, "learning_rate": 3.0686137848408616e-05, "loss": 0.1384, "loss_nan_ranks": 0, "loss_rank_avg": 0.14303429424762726, "step": 2775, "valid_targets_mean": 1693.8, "valid_targets_min": 324 }, { "epoch": 2.7254901960784315, "grad_norm": 0.5488360852479225, "learning_rate": 3.064478074321095e-05, "loss": 0.1452, "loss_nan_ranks": 0, "loss_rank_avg": 0.1471487134695053, "step": 2780, "valid_targets_mean": 1827.1, "valid_targets_min": 570 }, { "epoch": 2.730392156862745, "grad_norm": 0.5149112512414382, "learning_rate": 3.060336003249206e-05, "loss": 0.137, "loss_nan_ranks": 0, "loss_rank_avg": 0.12844215333461761, "step": 2785, "valid_targets_mean": 1996.3, "valid_targets_min": 655 }, { "epoch": 2.735294117647059, "grad_norm": 0.5573426653011521, "learning_rate": 3.056187596375221e-05, "loss": 0.1271, "loss_nan_ranks": 0, "loss_rank_avg": 0.1358461081981659, "step": 2790, "valid_targets_mean": 1847.9, "valid_targets_min": 781 }, { "epoch": 2.7401960784313726, "grad_norm": 0.4614772672771677, "learning_rate": 3.052032878487022e-05, "loss": 0.1298, "loss_nan_ranks": 0, "loss_rank_avg": 0.13471747934818268, "step": 2795, "valid_targets_mean": 2591.0, "valid_targets_min": 734 }, { "epoch": 2.7450980392156863, "grad_norm": 0.5562205728473466, "learning_rate": 3.047871874410201e-05, "loss": 0.1307, "loss_nan_ranks": 0, "loss_rank_avg": 0.13988906145095825, "step": 2800, "valid_targets_mean": 1747.5, "valid_targets_min": 637 }, { "epoch": 2.75, "grad_norm": 0.5350979428814614, "learning_rate": 3.0437046090079165e-05, "loss": 0.1219, "loss_nan_ranks": 0, "loss_rank_avg": 0.12228747457265854, "step": 2805, "valid_targets_mean": 1716.3, "valid_targets_min": 734 }, { "epoch": 2.7549019607843137, "grad_norm": 0.5068335768270578, "learning_rate": 3.039531107180733e-05, "loss": 0.1274, "loss_nan_ranks": 0, "loss_rank_avg": 0.12163315713405609, "step": 2810, "valid_targets_mean": 2055.1, "valid_targets_min": 723 }, { "epoch": 2.7598039215686274, "grad_norm": 0.4353854673960122, "learning_rate": 3.0353513938664855e-05, "loss": 0.1309, "loss_nan_ranks": 0, "loss_rank_avg": 0.1248159259557724, "step": 2815, "valid_targets_mean": 2709.1, "valid_targets_min": 788 }, { "epoch": 2.764705882352941, "grad_norm": 0.5757889526569985, "learning_rate": 3.03116549404012e-05, "loss": 0.1276, "loss_nan_ranks": 0, "loss_rank_avg": 0.12588320672512054, "step": 2820, "valid_targets_mean": 1643.4, "valid_targets_min": 665 }, { "epoch": 2.769607843137255, "grad_norm": 0.4571194123253969, "learning_rate": 3.0269734327135514e-05, "loss": 0.1571, "loss_nan_ranks": 0, "loss_rank_avg": 0.1337161362171173, "step": 2825, "valid_targets_mean": 2302.4, "valid_targets_min": 970 }, { "epoch": 2.7745098039215685, "grad_norm": 0.452298983086843, "learning_rate": 3.0227752349355105e-05, "loss": 0.1352, "loss_nan_ranks": 0, "loss_rank_avg": 0.11990043520927429, "step": 2830, "valid_targets_mean": 2196.6, "valid_targets_min": 702 }, { "epoch": 2.7794117647058822, "grad_norm": 0.5137398992266271, "learning_rate": 3.018570925791395e-05, "loss": 0.1223, "loss_nan_ranks": 0, "loss_rank_avg": 0.12331690639257431, "step": 2835, "valid_targets_mean": 1878.5, "valid_targets_min": 612 }, { "epoch": 2.784313725490196, "grad_norm": 0.47457896935510097, "learning_rate": 3.0143605304031185e-05, "loss": 0.1212, "loss_nan_ranks": 0, "loss_rank_avg": 0.12229996919631958, "step": 2840, "valid_targets_mean": 2376.8, "valid_targets_min": 758 }, { "epoch": 2.7892156862745097, "grad_norm": 0.45690022114892714, "learning_rate": 3.0101440739289644e-05, "loss": 0.1185, "loss_nan_ranks": 0, "loss_rank_avg": 0.12366802990436554, "step": 2845, "valid_targets_mean": 2346.6, "valid_targets_min": 608 }, { "epoch": 2.7941176470588234, "grad_norm": 0.42759880074470524, "learning_rate": 3.00592158156343e-05, "loss": 0.1242, "loss_nan_ranks": 0, "loss_rank_avg": 0.10269932448863983, "step": 2850, "valid_targets_mean": 2301.4, "valid_targets_min": 839 }, { "epoch": 2.799019607843137, "grad_norm": 0.4304115392133804, "learning_rate": 3.00169307853708e-05, "loss": 0.1339, "loss_nan_ranks": 0, "loss_rank_avg": 0.11028525233268738, "step": 2855, "valid_targets_mean": 2272.4, "valid_targets_min": 788 }, { "epoch": 2.803921568627451, "grad_norm": 0.4605724095449812, "learning_rate": 2.9974585901163955e-05, "loss": 0.1268, "loss_nan_ranks": 0, "loss_rank_avg": 0.12313034385442734, "step": 2860, "valid_targets_mean": 2610.8, "valid_targets_min": 888 }, { "epoch": 2.8088235294117645, "grad_norm": 0.5421500878681277, "learning_rate": 2.9932181416036186e-05, "loss": 0.1313, "loss_nan_ranks": 0, "loss_rank_avg": 0.15357518196105957, "step": 2865, "valid_targets_mean": 2295.1, "valid_targets_min": 742 }, { "epoch": 2.813725490196078, "grad_norm": 0.4288979220922448, "learning_rate": 2.988971758336609e-05, "loss": 0.1446, "loss_nan_ranks": 0, "loss_rank_avg": 0.10890544950962067, "step": 2870, "valid_targets_mean": 2487.8, "valid_targets_min": 610 }, { "epoch": 2.818627450980392, "grad_norm": 0.5839474906818637, "learning_rate": 2.9847194656886846e-05, "loss": 0.1245, "loss_nan_ranks": 0, "loss_rank_avg": 0.1326325386762619, "step": 2875, "valid_targets_mean": 1586.2, "valid_targets_min": 523 }, { "epoch": 2.8235294117647056, "grad_norm": 0.3943595738679273, "learning_rate": 2.980461289068475e-05, "loss": 0.1172, "loss_nan_ranks": 0, "loss_rank_avg": 0.10610520839691162, "step": 2880, "valid_targets_mean": 2857.4, "valid_targets_min": 761 }, { "epoch": 2.8284313725490198, "grad_norm": 0.3995014892923764, "learning_rate": 2.97619725391977e-05, "loss": 0.1304, "loss_nan_ranks": 0, "loss_rank_avg": 0.10689753293991089, "step": 2885, "valid_targets_mean": 2595.2, "valid_targets_min": 917 }, { "epoch": 2.8333333333333335, "grad_norm": 0.4339660498932304, "learning_rate": 2.9719273857213607e-05, "loss": 0.1405, "loss_nan_ranks": 0, "loss_rank_avg": 0.11175128817558289, "step": 2890, "valid_targets_mean": 2714.3, "valid_targets_min": 524 }, { "epoch": 2.838235294117647, "grad_norm": 0.4824549484105122, "learning_rate": 2.967651709986898e-05, "loss": 0.1396, "loss_nan_ranks": 0, "loss_rank_avg": 0.1368466168642044, "step": 2895, "valid_targets_mean": 2335.1, "valid_targets_min": 725 }, { "epoch": 2.843137254901961, "grad_norm": 0.49320253448063933, "learning_rate": 2.9633702522647314e-05, "loss": 0.1218, "loss_nan_ranks": 0, "loss_rank_avg": 0.1290884166955948, "step": 2900, "valid_targets_mean": 2013.7, "valid_targets_min": 495 }, { "epoch": 2.8480392156862746, "grad_norm": 0.4512954249823614, "learning_rate": 2.959083038137758e-05, "loss": 0.1309, "loss_nan_ranks": 0, "loss_rank_avg": 0.11821623891592026, "step": 2905, "valid_targets_mean": 2283.9, "valid_targets_min": 582 }, { "epoch": 2.8529411764705883, "grad_norm": 0.48511395512197114, "learning_rate": 2.9547900932232755e-05, "loss": 0.126, "loss_nan_ranks": 0, "loss_rank_avg": 0.12425636500120163, "step": 2910, "valid_targets_mean": 2048.6, "valid_targets_min": 694 }, { "epoch": 2.857843137254902, "grad_norm": 0.5655839453858921, "learning_rate": 2.95049144317282e-05, "loss": 0.1413, "loss_nan_ranks": 0, "loss_rank_avg": 0.12589307129383087, "step": 2915, "valid_targets_mean": 1768.5, "valid_targets_min": 713 }, { "epoch": 2.8627450980392157, "grad_norm": 0.4545048327238555, "learning_rate": 2.9461871136720205e-05, "loss": 0.1266, "loss_nan_ranks": 0, "loss_rank_avg": 0.13439792394638062, "step": 2920, "valid_targets_mean": 2661.6, "valid_targets_min": 580 }, { "epoch": 2.8676470588235294, "grad_norm": 0.4197095410493635, "learning_rate": 2.9418771304404408e-05, "loss": 0.1151, "loss_nan_ranks": 0, "loss_rank_avg": 0.11430007219314575, "step": 2925, "valid_targets_mean": 2748.2, "valid_targets_min": 858 }, { "epoch": 2.872549019607843, "grad_norm": 0.4762686149288785, "learning_rate": 2.9375615192314272e-05, "loss": 0.1319, "loss_nan_ranks": 0, "loss_rank_avg": 0.13634362816810608, "step": 2930, "valid_targets_mean": 2192.4, "valid_targets_min": 744 }, { "epoch": 2.877450980392157, "grad_norm": 0.6573835179007171, "learning_rate": 2.9332403058319562e-05, "loss": 0.1423, "loss_nan_ranks": 0, "loss_rank_avg": 0.17557133734226227, "step": 2935, "valid_targets_mean": 1823.9, "valid_targets_min": 777 }, { "epoch": 2.8823529411764706, "grad_norm": 0.5697771049283034, "learning_rate": 2.928913516062477e-05, "loss": 0.1288, "loss_nan_ranks": 0, "loss_rank_avg": 0.13310866057872772, "step": 2940, "valid_targets_mean": 1937.6, "valid_targets_min": 765 }, { "epoch": 2.8872549019607843, "grad_norm": 0.4815531389610093, "learning_rate": 2.9245811757767605e-05, "loss": 0.1249, "loss_nan_ranks": 0, "loss_rank_avg": 0.10856365412473679, "step": 2945, "valid_targets_mean": 2188.1, "valid_targets_min": 725 }, { "epoch": 2.892156862745098, "grad_norm": 0.3525092757314404, "learning_rate": 2.920243310861743e-05, "loss": 0.1105, "loss_nan_ranks": 0, "loss_rank_avg": 0.08762288838624954, "step": 2950, "valid_targets_mean": 2877.1, "valid_targets_min": 633 }, { "epoch": 2.8970588235294117, "grad_norm": 0.44362286093916375, "learning_rate": 2.9158999472373727e-05, "loss": 0.1263, "loss_nan_ranks": 0, "loss_rank_avg": 0.1400848627090454, "step": 2955, "valid_targets_mean": 2650.9, "valid_targets_min": 747 }, { "epoch": 2.9019607843137254, "grad_norm": 0.466533540036814, "learning_rate": 2.911551110856453e-05, "loss": 0.128, "loss_nan_ranks": 0, "loss_rank_avg": 0.12361754477024078, "step": 2960, "valid_targets_mean": 2421.5, "valid_targets_min": 714 }, { "epoch": 2.906862745098039, "grad_norm": 0.4275932951009806, "learning_rate": 2.9071968277044885e-05, "loss": 0.1325, "loss_nan_ranks": 0, "loss_rank_avg": 0.11012598872184753, "step": 2965, "valid_targets_mean": 2530.9, "valid_targets_min": 696 }, { "epoch": 2.911764705882353, "grad_norm": 0.47645750491140126, "learning_rate": 2.9028371237995315e-05, "loss": 0.1274, "loss_nan_ranks": 0, "loss_rank_avg": 0.11943289637565613, "step": 2970, "valid_targets_mean": 2157.4, "valid_targets_min": 787 }, { "epoch": 2.9166666666666665, "grad_norm": 0.5751641720681621, "learning_rate": 2.8984720251920228e-05, "loss": 0.1259, "loss_nan_ranks": 0, "loss_rank_avg": 0.134115070104599, "step": 2975, "valid_targets_mean": 2491.7, "valid_targets_min": 855 }, { "epoch": 2.9215686274509802, "grad_norm": 0.5048594686042459, "learning_rate": 2.8941015579646388e-05, "loss": 0.1326, "loss_nan_ranks": 0, "loss_rank_avg": 0.1326657235622406, "step": 2980, "valid_targets_mean": 2276.6, "valid_targets_min": 715 }, { "epoch": 2.9264705882352944, "grad_norm": 0.5218701473555022, "learning_rate": 2.8897257482321354e-05, "loss": 0.1256, "loss_nan_ranks": 0, "loss_rank_avg": 0.1356755495071411, "step": 2985, "valid_targets_mean": 2125.2, "valid_targets_min": 716 }, { "epoch": 2.931372549019608, "grad_norm": 0.5719581951550526, "learning_rate": 2.88534462214119e-05, "loss": 0.1343, "loss_nan_ranks": 0, "loss_rank_avg": 0.13416975736618042, "step": 2990, "valid_targets_mean": 1582.3, "valid_targets_min": 618 }, { "epoch": 2.936274509803922, "grad_norm": 0.4676682934177474, "learning_rate": 2.8809582058702497e-05, "loss": 0.129, "loss_nan_ranks": 0, "loss_rank_avg": 0.13310152292251587, "step": 2995, "valid_targets_mean": 2478.7, "valid_targets_min": 738 }, { "epoch": 2.9411764705882355, "grad_norm": 0.5153112474110181, "learning_rate": 2.8765665256293683e-05, "loss": 0.121, "loss_nan_ranks": 0, "loss_rank_avg": 0.12872923910617828, "step": 3000, "valid_targets_mean": 2084.5, "valid_targets_min": 716 }, { "epoch": 2.946078431372549, "grad_norm": 0.4820570169126928, "learning_rate": 2.8721696076600553e-05, "loss": 0.1338, "loss_nan_ranks": 0, "loss_rank_avg": 0.1477794647216797, "step": 3005, "valid_targets_mean": 2277.9, "valid_targets_min": 606 }, { "epoch": 2.950980392156863, "grad_norm": 0.5316651065874668, "learning_rate": 2.8677674782351164e-05, "loss": 0.1244, "loss_nan_ranks": 0, "loss_rank_avg": 0.13892558217048645, "step": 3010, "valid_targets_mean": 2058.4, "valid_targets_min": 613 }, { "epoch": 2.9558823529411766, "grad_norm": 0.47285568304817926, "learning_rate": 2.863360163658498e-05, "loss": 0.1277, "loss_nan_ranks": 0, "loss_rank_avg": 0.10545437037944794, "step": 3015, "valid_targets_mean": 2418.2, "valid_targets_min": 1094 }, { "epoch": 2.9607843137254903, "grad_norm": 0.5576570344201479, "learning_rate": 2.8589476902651284e-05, "loss": 0.1265, "loss_nan_ranks": 0, "loss_rank_avg": 0.14480185508728027, "step": 3020, "valid_targets_mean": 2428.8, "valid_targets_min": 932 }, { "epoch": 2.965686274509804, "grad_norm": 0.3720697472883488, "learning_rate": 2.854530084420762e-05, "loss": 0.1085, "loss_nan_ranks": 0, "loss_rank_avg": 0.0960945338010788, "step": 3025, "valid_targets_mean": 2547.1, "valid_targets_min": 516 }, { "epoch": 2.9705882352941178, "grad_norm": 0.3715873526257619, "learning_rate": 2.85010737252182e-05, "loss": 0.1091, "loss_nan_ranks": 0, "loss_rank_avg": 0.10219788551330566, "step": 3030, "valid_targets_mean": 2670.9, "valid_targets_min": 669 }, { "epoch": 2.9754901960784315, "grad_norm": 0.6195399543085092, "learning_rate": 2.845679580995235e-05, "loss": 0.1561, "loss_nan_ranks": 0, "loss_rank_avg": 0.1750684678554535, "step": 3035, "valid_targets_mean": 1722.1, "valid_targets_min": 634 }, { "epoch": 2.980392156862745, "grad_norm": 0.44368210641722294, "learning_rate": 2.84124673629829e-05, "loss": 0.1174, "loss_nan_ranks": 0, "loss_rank_avg": 0.12278378009796143, "step": 3040, "valid_targets_mean": 2512.6, "valid_targets_min": 844 }, { "epoch": 2.985294117647059, "grad_norm": 0.5160554435392198, "learning_rate": 2.836808864918464e-05, "loss": 0.1325, "loss_nan_ranks": 0, "loss_rank_avg": 0.1273147016763687, "step": 3045, "valid_targets_mean": 2230.9, "valid_targets_min": 893 }, { "epoch": 2.9901960784313726, "grad_norm": 0.5018491404792775, "learning_rate": 2.8323659933732704e-05, "loss": 0.147, "loss_nan_ranks": 0, "loss_rank_avg": 0.14495849609375, "step": 3050, "valid_targets_mean": 2451.2, "valid_targets_min": 741 }, { "epoch": 2.9950980392156863, "grad_norm": 0.47228194271588314, "learning_rate": 2.827918148210101e-05, "loss": 0.1219, "loss_nan_ranks": 0, "loss_rank_avg": 0.12136131525039673, "step": 3055, "valid_targets_mean": 2365.8, "valid_targets_min": 858 }, { "epoch": 3.0, "grad_norm": 0.41747992787256166, "learning_rate": 2.823465356006066e-05, "loss": 0.1198, "loss_nan_ranks": 0, "loss_rank_avg": 0.0959467664361, "step": 3060, "valid_targets_mean": 2515.4, "valid_targets_min": 653 }, { "epoch": 3.0049019607843137, "grad_norm": 0.45268172105117166, "learning_rate": 2.819007643367835e-05, "loss": 0.1141, "loss_nan_ranks": 0, "loss_rank_avg": 0.107194684445858, "step": 3065, "valid_targets_mean": 2481.1, "valid_targets_min": 819 }, { "epoch": 3.0098039215686274, "grad_norm": 0.48782268263068046, "learning_rate": 2.814545036931479e-05, "loss": 0.1128, "loss_nan_ranks": 0, "loss_rank_avg": 0.10597293078899384, "step": 3070, "valid_targets_mean": 2368.9, "valid_targets_min": 780 }, { "epoch": 3.014705882352941, "grad_norm": 0.42013415537790194, "learning_rate": 2.810077563362312e-05, "loss": 0.0953, "loss_nan_ranks": 0, "loss_rank_avg": 0.09026814997196198, "step": 3075, "valid_targets_mean": 2636.4, "valid_targets_min": 706 }, { "epoch": 3.019607843137255, "grad_norm": 0.493550574092022, "learning_rate": 2.8056052493547277e-05, "loss": 0.1202, "loss_nan_ranks": 0, "loss_rank_avg": 0.12190809100866318, "step": 3080, "valid_targets_mean": 2430.9, "valid_targets_min": 692 }, { "epoch": 3.0245098039215685, "grad_norm": 0.5881502044936036, "learning_rate": 2.8011281216320446e-05, "loss": 0.1074, "loss_nan_ranks": 0, "loss_rank_avg": 0.11721500754356384, "step": 3085, "valid_targets_mean": 1814.4, "valid_targets_min": 640 }, { "epoch": 3.0294117647058822, "grad_norm": 0.5220105505984863, "learning_rate": 2.7966462069463454e-05, "loss": 0.1181, "loss_nan_ranks": 0, "loss_rank_avg": 0.11271218955516815, "step": 3090, "valid_targets_mean": 2519.4, "valid_targets_min": 704 }, { "epoch": 3.034313725490196, "grad_norm": 0.6222515663568035, "learning_rate": 2.792159532078314e-05, "loss": 0.1151, "loss_nan_ranks": 0, "loss_rank_avg": 0.13791202008724213, "step": 3095, "valid_targets_mean": 1671.6, "valid_targets_min": 723 }, { "epoch": 3.0392156862745097, "grad_norm": 0.5465811429304228, "learning_rate": 2.787668123837079e-05, "loss": 0.1144, "loss_nan_ranks": 0, "loss_rank_avg": 0.12078981846570969, "step": 3100, "valid_targets_mean": 1913.5, "valid_targets_min": 758 }, { "epoch": 3.0441176470588234, "grad_norm": 0.5118828378244067, "learning_rate": 2.7831720090600526e-05, "loss": 0.111, "loss_nan_ranks": 0, "loss_rank_avg": 0.11368224769830704, "step": 3105, "valid_targets_mean": 2430.1, "valid_targets_min": 974 }, { "epoch": 3.049019607843137, "grad_norm": 0.49206966044764583, "learning_rate": 2.778671214612768e-05, "loss": 0.1102, "loss_nan_ranks": 0, "loss_rank_avg": 0.1097177192568779, "step": 3110, "valid_targets_mean": 2724.2, "valid_targets_min": 878 }, { "epoch": 3.053921568627451, "grad_norm": 0.542050378970244, "learning_rate": 2.7741657673887234e-05, "loss": 0.1079, "loss_nan_ranks": 0, "loss_rank_avg": 0.11170881241559982, "step": 3115, "valid_targets_mean": 1963.5, "valid_targets_min": 759 }, { "epoch": 3.0588235294117645, "grad_norm": 0.4966603322376902, "learning_rate": 2.7696556943092163e-05, "loss": 0.1202, "loss_nan_ranks": 0, "loss_rank_avg": 0.10189454257488251, "step": 3120, "valid_targets_mean": 2127.2, "valid_targets_min": 757 }, { "epoch": 3.063725490196078, "grad_norm": 0.4162238126926009, "learning_rate": 2.7651410223231855e-05, "loss": 0.1218, "loss_nan_ranks": 0, "loss_rank_avg": 0.09815062582492828, "step": 3125, "valid_targets_mean": 2666.4, "valid_targets_min": 683 }, { "epoch": 3.0686274509803924, "grad_norm": 0.4999830676990576, "learning_rate": 2.7606217784070518e-05, "loss": 0.1132, "loss_nan_ranks": 0, "loss_rank_avg": 0.10285164415836334, "step": 3130, "valid_targets_mean": 2044.8, "valid_targets_min": 754 }, { "epoch": 3.073529411764706, "grad_norm": 0.45664697329434784, "learning_rate": 2.7560979895645508e-05, "loss": 0.1174, "loss_nan_ranks": 0, "loss_rank_avg": 0.1548200249671936, "step": 3135, "valid_targets_mean": 2774.8, "valid_targets_min": 789 }, { "epoch": 3.0784313725490198, "grad_norm": 0.6033862754408237, "learning_rate": 2.7515696828265778e-05, "loss": 0.1103, "loss_nan_ranks": 0, "loss_rank_avg": 0.11691197752952576, "step": 3140, "valid_targets_mean": 1985.6, "valid_targets_min": 714 }, { "epoch": 3.0833333333333335, "grad_norm": 0.5519436809793806, "learning_rate": 2.7470368852510235e-05, "loss": 0.1133, "loss_nan_ranks": 0, "loss_rank_avg": 0.12123852223157883, "step": 3145, "valid_targets_mean": 1779.9, "valid_targets_min": 687 }, { "epoch": 3.088235294117647, "grad_norm": 0.6712077515102802, "learning_rate": 2.7424996239226118e-05, "loss": 0.125, "loss_nan_ranks": 0, "loss_rank_avg": 0.13345475494861603, "step": 3150, "valid_targets_mean": 1769.3, "valid_targets_min": 511 }, { "epoch": 3.093137254901961, "grad_norm": 0.6947461203066284, "learning_rate": 2.73795792595274e-05, "loss": 0.1129, "loss_nan_ranks": 0, "loss_rank_avg": 0.136090487241745, "step": 3155, "valid_targets_mean": 1951.0, "valid_targets_min": 744 }, { "epoch": 3.0980392156862746, "grad_norm": 0.595632721442861, "learning_rate": 2.733411818479313e-05, "loss": 0.1198, "loss_nan_ranks": 0, "loss_rank_avg": 0.10106316208839417, "step": 3160, "valid_targets_mean": 2653.4, "valid_targets_min": 1135 }, { "epoch": 3.1029411764705883, "grad_norm": 0.5915082015158023, "learning_rate": 2.7288613286665877e-05, "loss": 0.1098, "loss_nan_ranks": 0, "loss_rank_avg": 0.11444532871246338, "step": 3165, "valid_targets_mean": 1782.6, "valid_targets_min": 832 }, { "epoch": 3.107843137254902, "grad_norm": 0.4258687271969111, "learning_rate": 2.724306483705004e-05, "loss": 0.1058, "loss_nan_ranks": 0, "loss_rank_avg": 0.10663177818059921, "step": 3170, "valid_targets_mean": 2679.2, "valid_targets_min": 858 }, { "epoch": 3.1127450980392157, "grad_norm": 0.5434705921669944, "learning_rate": 2.719747310811023e-05, "loss": 0.1169, "loss_nan_ranks": 0, "loss_rank_avg": 0.10878196358680725, "step": 3175, "valid_targets_mean": 1852.3, "valid_targets_min": 712 }, { "epoch": 3.1176470588235294, "grad_norm": 0.518948863407975, "learning_rate": 2.7151838372269724e-05, "loss": 0.1277, "loss_nan_ranks": 0, "loss_rank_avg": 0.10524100065231323, "step": 3180, "valid_targets_mean": 2033.2, "valid_targets_min": 776 }, { "epoch": 3.122549019607843, "grad_norm": 0.5670597404893448, "learning_rate": 2.7106160902208736e-05, "loss": 0.1139, "loss_nan_ranks": 0, "loss_rank_avg": 0.11880999803543091, "step": 3185, "valid_targets_mean": 1744.6, "valid_targets_min": 524 }, { "epoch": 3.127450980392157, "grad_norm": 0.4593924657033769, "learning_rate": 2.706044097086281e-05, "loss": 0.1062, "loss_nan_ranks": 0, "loss_rank_avg": 0.0906146839261055, "step": 3190, "valid_targets_mean": 2278.1, "valid_targets_min": 651 }, { "epoch": 3.1323529411764706, "grad_norm": 0.5302919704743427, "learning_rate": 2.701467885142126e-05, "loss": 0.1007, "loss_nan_ranks": 0, "loss_rank_avg": 0.11191104352474213, "step": 3195, "valid_targets_mean": 2203.2, "valid_targets_min": 798 }, { "epoch": 3.1372549019607843, "grad_norm": 0.46770851652221684, "learning_rate": 2.696887481732545e-05, "loss": 0.1083, "loss_nan_ranks": 0, "loss_rank_avg": 0.08962736278772354, "step": 3200, "valid_targets_mean": 2317.0, "valid_targets_min": 485 }, { "epoch": 3.142156862745098, "grad_norm": 0.461711248997322, "learning_rate": 2.6923029142267195e-05, "loss": 0.1086, "loss_nan_ranks": 0, "loss_rank_avg": 0.10215017199516296, "step": 3205, "valid_targets_mean": 2429.4, "valid_targets_min": 741 }, { "epoch": 3.1470588235294117, "grad_norm": 0.5124333477538516, "learning_rate": 2.6877142100187157e-05, "loss": 0.1114, "loss_nan_ranks": 0, "loss_rank_avg": 0.10358607769012451, "step": 3210, "valid_targets_mean": 1864.0, "valid_targets_min": 536 }, { "epoch": 3.1519607843137254, "grad_norm": 0.3616554988301426, "learning_rate": 2.6831213965273133e-05, "loss": 0.1061, "loss_nan_ranks": 0, "loss_rank_avg": 0.08923672884702682, "step": 3215, "valid_targets_mean": 2760.3, "valid_targets_min": 464 }, { "epoch": 3.156862745098039, "grad_norm": 0.5006444640458854, "learning_rate": 2.6785245011958498e-05, "loss": 0.1088, "loss_nan_ranks": 0, "loss_rank_avg": 0.10196967422962189, "step": 3220, "valid_targets_mean": 2452.2, "valid_targets_min": 894 }, { "epoch": 3.161764705882353, "grad_norm": 0.4732082212550895, "learning_rate": 2.6739235514920516e-05, "loss": 0.1089, "loss_nan_ranks": 0, "loss_rank_avg": 0.10402283817529678, "step": 3225, "valid_targets_mean": 2514.3, "valid_targets_min": 992 }, { "epoch": 3.1666666666666665, "grad_norm": 0.39259653455459503, "learning_rate": 2.6693185749078696e-05, "loss": 0.0996, "loss_nan_ranks": 0, "loss_rank_avg": 0.09591707587242126, "step": 3230, "valid_targets_mean": 2907.6, "valid_targets_min": 702 }, { "epoch": 3.1715686274509802, "grad_norm": 0.5506349591543678, "learning_rate": 2.6647095989593194e-05, "loss": 0.1088, "loss_nan_ranks": 0, "loss_rank_avg": 0.11052503436803818, "step": 3235, "valid_targets_mean": 2068.1, "valid_targets_min": 744 }, { "epoch": 3.176470588235294, "grad_norm": 0.5110012783834129, "learning_rate": 2.660096651186312e-05, "loss": 0.1029, "loss_nan_ranks": 0, "loss_rank_avg": 0.10590462386608124, "step": 3240, "valid_targets_mean": 2004.8, "valid_targets_min": 632 }, { "epoch": 3.1813725490196076, "grad_norm": 0.48429980261496486, "learning_rate": 2.65547975915249e-05, "loss": 0.1171, "loss_nan_ranks": 0, "loss_rank_avg": 0.10138334333896637, "step": 3245, "valid_targets_mean": 2139.9, "valid_targets_min": 697 }, { "epoch": 3.186274509803922, "grad_norm": 0.49960885032231134, "learning_rate": 2.6508589504450674e-05, "loss": 0.1131, "loss_nan_ranks": 0, "loss_rank_avg": 0.10819289833307266, "step": 3250, "valid_targets_mean": 1949.6, "valid_targets_min": 715 }, { "epoch": 3.1911764705882355, "grad_norm": 0.41048885954549186, "learning_rate": 2.6462342526746582e-05, "loss": 0.0986, "loss_nan_ranks": 0, "loss_rank_avg": 0.08373367786407471, "step": 3255, "valid_targets_mean": 2581.2, "valid_targets_min": 447 }, { "epoch": 3.196078431372549, "grad_norm": 0.5789520695615816, "learning_rate": 2.6416056934751163e-05, "loss": 0.1106, "loss_nan_ranks": 0, "loss_rank_avg": 0.09594295173883438, "step": 3260, "valid_targets_mean": 1791.2, "valid_targets_min": 503 }, { "epoch": 3.200980392156863, "grad_norm": 0.4565834458818512, "learning_rate": 2.6369733005033693e-05, "loss": 0.1097, "loss_nan_ranks": 0, "loss_rank_avg": 0.1069725751876831, "step": 3265, "valid_targets_mean": 2500.2, "valid_targets_min": 582 }, { "epoch": 3.2058823529411766, "grad_norm": 0.5371663721783211, "learning_rate": 2.6323371014392503e-05, "loss": 0.1136, "loss_nan_ranks": 0, "loss_rank_avg": 0.12323896586894989, "step": 3270, "valid_targets_mean": 2023.4, "valid_targets_min": 635 }, { "epoch": 3.2107843137254903, "grad_norm": 0.46676874397280727, "learning_rate": 2.6276971239853368e-05, "loss": 0.1159, "loss_nan_ranks": 0, "loss_rank_avg": 0.10574575513601303, "step": 3275, "valid_targets_mean": 2582.6, "valid_targets_min": 674 }, { "epoch": 3.215686274509804, "grad_norm": 0.47929248550882253, "learning_rate": 2.6230533958667833e-05, "loss": 0.1079, "loss_nan_ranks": 0, "loss_rank_avg": 0.10941387712955475, "step": 3280, "valid_targets_mean": 2438.4, "valid_targets_min": 682 }, { "epoch": 3.2205882352941178, "grad_norm": 0.4962450070888328, "learning_rate": 2.618405944831154e-05, "loss": 0.109, "loss_nan_ranks": 0, "loss_rank_avg": 0.10915249586105347, "step": 3285, "valid_targets_mean": 2119.5, "valid_targets_min": 704 }, { "epoch": 3.2254901960784315, "grad_norm": 0.4534435959489161, "learning_rate": 2.6137547986482607e-05, "loss": 0.1147, "loss_nan_ranks": 0, "loss_rank_avg": 0.09829148650169373, "step": 3290, "valid_targets_mean": 2296.5, "valid_targets_min": 761 }, { "epoch": 3.230392156862745, "grad_norm": 0.5648115539160723, "learning_rate": 2.6090999851099924e-05, "loss": 0.1189, "loss_nan_ranks": 0, "loss_rank_avg": 0.1307239532470703, "step": 3295, "valid_targets_mean": 2227.4, "valid_targets_min": 625 }, { "epoch": 3.235294117647059, "grad_norm": 0.5798437771314721, "learning_rate": 2.604441532030153e-05, "loss": 0.1023, "loss_nan_ranks": 0, "loss_rank_avg": 0.11284209787845612, "step": 3300, "valid_targets_mean": 1850.4, "valid_targets_min": 548 }, { "epoch": 3.2401960784313726, "grad_norm": 0.45163997776172005, "learning_rate": 2.599779467244294e-05, "loss": 0.1065, "loss_nan_ranks": 0, "loss_rank_avg": 0.09802794456481934, "step": 3305, "valid_targets_mean": 2635.2, "valid_targets_min": 803 }, { "epoch": 3.2450980392156863, "grad_norm": 0.5649182130019871, "learning_rate": 2.595113818609547e-05, "loss": 0.1104, "loss_nan_ranks": 0, "loss_rank_avg": 0.1129395067691803, "step": 3310, "valid_targets_mean": 1722.3, "valid_targets_min": 765 }, { "epoch": 3.25, "grad_norm": 0.4884299890008094, "learning_rate": 2.590444614004458e-05, "loss": 0.1054, "loss_nan_ranks": 0, "loss_rank_avg": 0.11049424111843109, "step": 3315, "valid_targets_mean": 2286.6, "valid_targets_min": 801 }, { "epoch": 3.2549019607843137, "grad_norm": 0.4484177235028694, "learning_rate": 2.585771881328821e-05, "loss": 0.1044, "loss_nan_ranks": 0, "loss_rank_avg": 0.08890993893146515, "step": 3320, "valid_targets_mean": 2585.2, "valid_targets_min": 548 }, { "epoch": 3.2598039215686274, "grad_norm": 0.5045433489277796, "learning_rate": 2.5810956485035125e-05, "loss": 0.1101, "loss_nan_ranks": 0, "loss_rank_avg": 0.12246538698673248, "step": 3325, "valid_targets_mean": 2569.7, "valid_targets_min": 927 }, { "epoch": 3.264705882352941, "grad_norm": 0.4652730472828903, "learning_rate": 2.5764159434703215e-05, "loss": 0.1251, "loss_nan_ranks": 0, "loss_rank_avg": 0.10294139385223389, "step": 3330, "valid_targets_mean": 2296.1, "valid_targets_min": 678 }, { "epoch": 3.269607843137255, "grad_norm": 0.5793296301279914, "learning_rate": 2.5717327941917855e-05, "loss": 0.1108, "loss_nan_ranks": 0, "loss_rank_avg": 0.09359988570213318, "step": 3335, "valid_targets_mean": 2318.1, "valid_targets_min": 593 }, { "epoch": 3.2745098039215685, "grad_norm": 0.5084318900806167, "learning_rate": 2.567046228651022e-05, "loss": 0.102, "loss_nan_ranks": 0, "loss_rank_avg": 0.11955564469099045, "step": 3340, "valid_targets_mean": 2201.9, "valid_targets_min": 663 }, { "epoch": 3.2794117647058822, "grad_norm": 0.6829491331460958, "learning_rate": 2.5623562748515615e-05, "loss": 0.117, "loss_nan_ranks": 0, "loss_rank_avg": 0.14061784744262695, "step": 3345, "valid_targets_mean": 1760.6, "valid_targets_min": 661 }, { "epoch": 3.284313725490196, "grad_norm": 0.5653936654283042, "learning_rate": 2.557662960817181e-05, "loss": 0.0989, "loss_nan_ranks": 0, "loss_rank_avg": 0.09769532829523087, "step": 3350, "valid_targets_mean": 2158.1, "valid_targets_min": 770 }, { "epoch": 3.2892156862745097, "grad_norm": 0.4175355963316871, "learning_rate": 2.552966314591735e-05, "loss": 0.1172, "loss_nan_ranks": 0, "loss_rank_avg": 0.08977030217647552, "step": 3355, "valid_targets_mean": 2686.6, "valid_targets_min": 659 }, { "epoch": 3.2941176470588234, "grad_norm": 0.4751300485635002, "learning_rate": 2.5482663642389883e-05, "loss": 0.1208, "loss_nan_ranks": 0, "loss_rank_avg": 0.08631863445043564, "step": 3360, "valid_targets_mean": 2316.3, "valid_targets_min": 627 }, { "epoch": 3.299019607843137, "grad_norm": 0.555883518092085, "learning_rate": 2.5435631378424504e-05, "loss": 0.1058, "loss_nan_ranks": 0, "loss_rank_avg": 0.10301592946052551, "step": 3365, "valid_targets_mean": 1677.7, "valid_targets_min": 688 }, { "epoch": 3.303921568627451, "grad_norm": 0.6179203271979932, "learning_rate": 2.5388566635052052e-05, "loss": 0.12, "loss_nan_ranks": 0, "loss_rank_avg": 0.1356745958328247, "step": 3370, "valid_targets_mean": 1944.9, "valid_targets_min": 747 }, { "epoch": 3.3088235294117645, "grad_norm": 0.4676890698107417, "learning_rate": 2.5341469693497434e-05, "loss": 0.1085, "loss_nan_ranks": 0, "loss_rank_avg": 0.11229351162910461, "step": 3375, "valid_targets_mean": 2420.8, "valid_targets_min": 821 }, { "epoch": 3.313725490196078, "grad_norm": 0.48905784664475677, "learning_rate": 2.529434083517796e-05, "loss": 0.1134, "loss_nan_ranks": 0, "loss_rank_avg": 0.11473777890205383, "step": 3380, "valid_targets_mean": 2472.6, "valid_targets_min": 776 }, { "epoch": 3.318627450980392, "grad_norm": 0.5941023968549567, "learning_rate": 2.5247180341701652e-05, "loss": 0.1125, "loss_nan_ranks": 0, "loss_rank_avg": 0.12429068982601166, "step": 3385, "valid_targets_mean": 1746.0, "valid_targets_min": 625 }, { "epoch": 3.323529411764706, "grad_norm": 0.4207492309955242, "learning_rate": 2.5199988494865545e-05, "loss": 0.119, "loss_nan_ranks": 0, "loss_rank_avg": 0.09677383303642273, "step": 3390, "valid_targets_mean": 2596.6, "valid_targets_min": 648 }, { "epoch": 3.3284313725490198, "grad_norm": 0.6212127423535296, "learning_rate": 2.5152765576654035e-05, "loss": 0.1042, "loss_nan_ranks": 0, "loss_rank_avg": 0.09490111470222473, "step": 3395, "valid_targets_mean": 2402.4, "valid_targets_min": 780 }, { "epoch": 3.3333333333333335, "grad_norm": 0.5428852197642803, "learning_rate": 2.5105511869237176e-05, "loss": 0.1155, "loss_nan_ranks": 0, "loss_rank_avg": 0.11736579239368439, "step": 3400, "valid_targets_mean": 2132.8, "valid_targets_min": 903 }, { "epoch": 3.338235294117647, "grad_norm": 0.6068835771442634, "learning_rate": 2.5058227654968986e-05, "loss": 0.1211, "loss_nan_ranks": 0, "loss_rank_avg": 0.1142382025718689, "step": 3405, "valid_targets_mean": 2071.6, "valid_targets_min": 878 }, { "epoch": 3.343137254901961, "grad_norm": 0.3980675116079957, "learning_rate": 2.5010913216385778e-05, "loss": 0.1119, "loss_nan_ranks": 0, "loss_rank_avg": 0.08887724578380585, "step": 3410, "valid_targets_mean": 2649.5, "valid_targets_min": 696 }, { "epoch": 3.3480392156862746, "grad_norm": 0.5921220488695144, "learning_rate": 2.496356883620448e-05, "loss": 0.1182, "loss_nan_ranks": 0, "loss_rank_avg": 0.13174962997436523, "step": 3415, "valid_targets_mean": 1664.5, "valid_targets_min": 690 }, { "epoch": 3.3529411764705883, "grad_norm": 0.4555660361067227, "learning_rate": 2.491619479732089e-05, "loss": 0.1092, "loss_nan_ranks": 0, "loss_rank_avg": 0.09527282416820526, "step": 3420, "valid_targets_mean": 2478.8, "valid_targets_min": 734 }, { "epoch": 3.357843137254902, "grad_norm": 0.6222613588669669, "learning_rate": 2.4868791382808053e-05, "loss": 0.1196, "loss_nan_ranks": 0, "loss_rank_avg": 0.12515193223953247, "step": 3425, "valid_targets_mean": 1625.1, "valid_targets_min": 612 }, { "epoch": 3.3627450980392157, "grad_norm": 0.5514835585510608, "learning_rate": 2.4821358875914546e-05, "loss": 0.1044, "loss_nan_ranks": 0, "loss_rank_avg": 0.12040072679519653, "step": 3430, "valid_targets_mean": 2105.8, "valid_targets_min": 663 }, { "epoch": 3.3676470588235294, "grad_norm": 0.5961299236034482, "learning_rate": 2.477389756006276e-05, "loss": 0.1153, "loss_nan_ranks": 0, "loss_rank_avg": 0.14823094010353088, "step": 3435, "valid_targets_mean": 2278.8, "valid_targets_min": 682 }, { "epoch": 3.372549019607843, "grad_norm": 0.6437966485612172, "learning_rate": 2.4726407718847237e-05, "loss": 0.1134, "loss_nan_ranks": 0, "loss_rank_avg": 0.12897151708602905, "step": 3440, "valid_targets_mean": 1771.4, "valid_targets_min": 643 }, { "epoch": 3.377450980392157, "grad_norm": 0.5267111874802913, "learning_rate": 2.4678889636032976e-05, "loss": 0.1072, "loss_nan_ranks": 0, "loss_rank_avg": 0.10938486456871033, "step": 3445, "valid_targets_mean": 1924.3, "valid_targets_min": 650 }, { "epoch": 3.3823529411764706, "grad_norm": 0.496231210125758, "learning_rate": 2.4631343595553707e-05, "loss": 0.1081, "loss_nan_ranks": 0, "loss_rank_avg": 0.09718477725982666, "step": 3450, "valid_targets_mean": 2110.4, "valid_targets_min": 853 }, { "epoch": 3.3872549019607843, "grad_norm": 0.7417323818704427, "learning_rate": 2.4583769881510243e-05, "loss": 0.1209, "loss_nan_ranks": 0, "loss_rank_avg": 0.12951020896434784, "step": 3455, "valid_targets_mean": 2396.2, "valid_targets_min": 720 }, { "epoch": 3.392156862745098, "grad_norm": 0.686014144744929, "learning_rate": 2.453616877816872e-05, "loss": 0.1199, "loss_nan_ranks": 0, "loss_rank_avg": 0.10813941061496735, "step": 3460, "valid_targets_mean": 2572.1, "valid_targets_min": 746 }, { "epoch": 3.3970588235294117, "grad_norm": 0.46956228200489375, "learning_rate": 2.4488540569958957e-05, "loss": 0.1034, "loss_nan_ranks": 0, "loss_rank_avg": 0.10174999386072159, "step": 3465, "valid_targets_mean": 2273.4, "valid_targets_min": 567 }, { "epoch": 3.4019607843137254, "grad_norm": 0.47202061673863827, "learning_rate": 2.4440885541472734e-05, "loss": 0.1111, "loss_nan_ranks": 0, "loss_rank_avg": 0.1065269336104393, "step": 3470, "valid_targets_mean": 2521.2, "valid_targets_min": 634 }, { "epoch": 3.406862745098039, "grad_norm": 0.4710834442443773, "learning_rate": 2.439320397746207e-05, "loss": 0.1008, "loss_nan_ranks": 0, "loss_rank_avg": 0.09578939527273178, "step": 3475, "valid_targets_mean": 2454.9, "valid_targets_min": 807 }, { "epoch": 3.411764705882353, "grad_norm": 0.534990938857518, "learning_rate": 2.434549616283755e-05, "loss": 0.1144, "loss_nan_ranks": 0, "loss_rank_avg": 0.13655036687850952, "step": 3480, "valid_targets_mean": 2208.6, "valid_targets_min": 916 }, { "epoch": 3.4166666666666665, "grad_norm": 0.5569406603515846, "learning_rate": 2.4297762382666628e-05, "loss": 0.1135, "loss_nan_ranks": 0, "loss_rank_avg": 0.11844809353351593, "step": 3485, "valid_targets_mean": 2206.2, "valid_targets_min": 1016 }, { "epoch": 3.4215686274509802, "grad_norm": 0.573221969522095, "learning_rate": 2.4250002922171887e-05, "loss": 0.1166, "loss_nan_ranks": 0, "loss_rank_avg": 0.1180095300078392, "step": 3490, "valid_targets_mean": 2059.7, "valid_targets_min": 719 }, { "epoch": 3.426470588235294, "grad_norm": 0.5023184061613964, "learning_rate": 2.4202218066729377e-05, "loss": 0.1244, "loss_nan_ranks": 0, "loss_rank_avg": 0.12228246033191681, "step": 3495, "valid_targets_mean": 2557.6, "valid_targets_min": 631 }, { "epoch": 3.431372549019608, "grad_norm": 0.4804109211903169, "learning_rate": 2.415440810186687e-05, "loss": 0.112, "loss_nan_ranks": 0, "loss_rank_avg": 0.12410437315702438, "step": 3500, "valid_targets_mean": 2642.3, "valid_targets_min": 662 }, { "epoch": 3.436274509803922, "grad_norm": 0.7160334396984808, "learning_rate": 2.4106573313262186e-05, "loss": 0.1105, "loss_nan_ranks": 0, "loss_rank_avg": 0.1095886379480362, "step": 3505, "valid_targets_mean": 2399.1, "valid_targets_min": 606 }, { "epoch": 3.4411764705882355, "grad_norm": 0.573633678368746, "learning_rate": 2.405871398674148e-05, "loss": 0.1036, "loss_nan_ranks": 0, "loss_rank_avg": 0.12151598930358887, "step": 3510, "valid_targets_mean": 1821.2, "valid_targets_min": 660 }, { "epoch": 3.446078431372549, "grad_norm": 0.47876480518730624, "learning_rate": 2.4010830408277507e-05, "loss": 0.1064, "loss_nan_ranks": 0, "loss_rank_avg": 0.1134987398982048, "step": 3515, "valid_targets_mean": 2287.1, "valid_targets_min": 867 }, { "epoch": 3.450980392156863, "grad_norm": 0.48121870038783876, "learning_rate": 2.3962922863987956e-05, "loss": 0.1132, "loss_nan_ranks": 0, "loss_rank_avg": 0.09954457730054855, "step": 3520, "valid_targets_mean": 2372.2, "valid_targets_min": 697 }, { "epoch": 3.4558823529411766, "grad_norm": 0.5242680043426456, "learning_rate": 2.3914991640133707e-05, "loss": 0.12, "loss_nan_ranks": 0, "loss_rank_avg": 0.15709488093852997, "step": 3525, "valid_targets_mean": 2238.8, "valid_targets_min": 840 }, { "epoch": 3.4607843137254903, "grad_norm": 0.43408849677146805, "learning_rate": 2.3867037023117123e-05, "loss": 0.1001, "loss_nan_ranks": 0, "loss_rank_avg": 0.08314131200313568, "step": 3530, "valid_targets_mean": 2221.2, "valid_targets_min": 699 }, { "epoch": 3.465686274509804, "grad_norm": 0.4397584871724824, "learning_rate": 2.3819059299480375e-05, "loss": 0.1284, "loss_nan_ranks": 0, "loss_rank_avg": 0.1028500497341156, "step": 3535, "valid_targets_mean": 2543.4, "valid_targets_min": 649 }, { "epoch": 3.4705882352941178, "grad_norm": 0.49009687013344777, "learning_rate": 2.3771058755903686e-05, "loss": 0.1047, "loss_nan_ranks": 0, "loss_rank_avg": 0.10757431387901306, "step": 3540, "valid_targets_mean": 2223.6, "valid_targets_min": 650 }, { "epoch": 3.4754901960784315, "grad_norm": 0.39557937893345524, "learning_rate": 2.372303567920362e-05, "loss": 0.1174, "loss_nan_ranks": 0, "loss_rank_avg": 0.09384208172559738, "step": 3545, "valid_targets_mean": 2953.0, "valid_targets_min": 1049 }, { "epoch": 3.480392156862745, "grad_norm": 0.4895551988114163, "learning_rate": 2.367499035633141e-05, "loss": 0.1239, "loss_nan_ranks": 0, "loss_rank_avg": 0.10619791597127914, "step": 3550, "valid_targets_mean": 1790.4, "valid_targets_min": 670 }, { "epoch": 3.485294117647059, "grad_norm": 0.5343919639111113, "learning_rate": 2.3626923074371196e-05, "loss": 0.1118, "loss_nan_ranks": 0, "loss_rank_avg": 0.112095907330513, "step": 3555, "valid_targets_mean": 2142.9, "valid_targets_min": 700 }, { "epoch": 3.4901960784313726, "grad_norm": 0.39309956805603796, "learning_rate": 2.357883412053834e-05, "loss": 0.0982, "loss_nan_ranks": 0, "loss_rank_avg": 0.07599136233329773, "step": 3560, "valid_targets_mean": 2629.5, "valid_targets_min": 715 }, { "epoch": 3.4950980392156863, "grad_norm": 0.5743979416820177, "learning_rate": 2.3530723782177702e-05, "loss": 0.1125, "loss_nan_ranks": 0, "loss_rank_avg": 0.11538234353065491, "step": 3565, "valid_targets_mean": 1909.1, "valid_targets_min": 580 }, { "epoch": 3.5, "grad_norm": 0.4267696073720374, "learning_rate": 2.3482592346761905e-05, "loss": 0.1125, "loss_nan_ranks": 0, "loss_rank_avg": 0.08938651531934738, "step": 3570, "valid_targets_mean": 2519.2, "valid_targets_min": 845 }, { "epoch": 3.5049019607843137, "grad_norm": 0.48972900333651787, "learning_rate": 2.3434440101889644e-05, "loss": 0.1036, "loss_nan_ranks": 0, "loss_rank_avg": 0.09942841529846191, "step": 3575, "valid_targets_mean": 2042.9, "valid_targets_min": 869 }, { "epoch": 3.5098039215686274, "grad_norm": 0.5748476170765656, "learning_rate": 2.338626733528396e-05, "loss": 0.1182, "loss_nan_ranks": 0, "loss_rank_avg": 0.1080469936132431, "step": 3580, "valid_targets_mean": 1870.4, "valid_targets_min": 468 }, { "epoch": 3.514705882352941, "grad_norm": 0.5453346260954157, "learning_rate": 2.3338074334790513e-05, "loss": 0.1075, "loss_nan_ranks": 0, "loss_rank_avg": 0.12305852770805359, "step": 3585, "valid_targets_mean": 2156.6, "valid_targets_min": 841 }, { "epoch": 3.519607843137255, "grad_norm": 0.4046360880578505, "learning_rate": 2.3289861388375857e-05, "loss": 0.1108, "loss_nan_ranks": 0, "loss_rank_avg": 0.08819185197353363, "step": 3590, "valid_targets_mean": 2738.9, "valid_targets_min": 799 }, { "epoch": 3.5245098039215685, "grad_norm": 0.6118714832043691, "learning_rate": 2.3241628784125746e-05, "loss": 0.109, "loss_nan_ranks": 0, "loss_rank_avg": 0.13428336381912231, "step": 3595, "valid_targets_mean": 1819.1, "valid_targets_min": 717 }, { "epoch": 3.5294117647058822, "grad_norm": 0.5313367384075776, "learning_rate": 2.319337681024338e-05, "loss": 0.1174, "loss_nan_ranks": 0, "loss_rank_avg": 0.13841737806797028, "step": 3600, "valid_targets_mean": 2279.8, "valid_targets_min": 774 }, { "epoch": 3.534313725490196, "grad_norm": 0.5936013371744282, "learning_rate": 2.314510575504771e-05, "loss": 0.1141, "loss_nan_ranks": 0, "loss_rank_avg": 0.12145009636878967, "step": 3605, "valid_targets_mean": 2184.8, "valid_targets_min": 863 }, { "epoch": 3.5392156862745097, "grad_norm": 0.4501094327540122, "learning_rate": 2.3096815906971685e-05, "loss": 0.1034, "loss_nan_ranks": 0, "loss_rank_avg": 0.10091482102870941, "step": 3610, "valid_targets_mean": 2419.2, "valid_targets_min": 961 }, { "epoch": 3.5441176470588234, "grad_norm": 0.5917686920531069, "learning_rate": 2.3048507554560565e-05, "loss": 0.1099, "loss_nan_ranks": 0, "loss_rank_avg": 0.11512914299964905, "step": 3615, "valid_targets_mean": 1797.6, "valid_targets_min": 563 }, { "epoch": 3.549019607843137, "grad_norm": 0.6255611571989778, "learning_rate": 2.3000180986470175e-05, "loss": 0.107, "loss_nan_ranks": 0, "loss_rank_avg": 0.13142108917236328, "step": 3620, "valid_targets_mean": 1911.9, "valid_targets_min": 576 }, { "epoch": 3.553921568627451, "grad_norm": 0.5167486005612478, "learning_rate": 2.2951836491465177e-05, "loss": 0.1022, "loss_nan_ranks": 0, "loss_rank_avg": 0.1105874553322792, "step": 3625, "valid_targets_mean": 2156.2, "valid_targets_min": 329 }, { "epoch": 3.5588235294117645, "grad_norm": 0.5154655734331977, "learning_rate": 2.290347435841736e-05, "loss": 0.111, "loss_nan_ranks": 0, "loss_rank_avg": 0.12183243036270142, "step": 3630, "valid_targets_mean": 2346.5, "valid_targets_min": 816 }, { "epoch": 3.563725490196078, "grad_norm": 0.5223303986667628, "learning_rate": 2.285509487630389e-05, "loss": 0.1198, "loss_nan_ranks": 0, "loss_rank_avg": 0.15623009204864502, "step": 3635, "valid_targets_mean": 2398.6, "valid_targets_min": 609 }, { "epoch": 3.568627450980392, "grad_norm": 0.4470634454069301, "learning_rate": 2.2806698334205612e-05, "loss": 0.1222, "loss_nan_ranks": 0, "loss_rank_avg": 0.11349236220121384, "step": 3640, "valid_targets_mean": 2423.0, "valid_targets_min": 744 }, { "epoch": 3.5735294117647056, "grad_norm": 0.5404202109658872, "learning_rate": 2.2758285021305312e-05, "loss": 0.1025, "loss_nan_ranks": 0, "loss_rank_avg": 0.10349144786596298, "step": 3645, "valid_targets_mean": 1936.6, "valid_targets_min": 598 }, { "epoch": 3.5784313725490198, "grad_norm": 0.530293394551295, "learning_rate": 2.2709855226885975e-05, "loss": 0.1195, "loss_nan_ranks": 0, "loss_rank_avg": 0.11319459229707718, "step": 3650, "valid_targets_mean": 2097.7, "valid_targets_min": 634 }, { "epoch": 3.5833333333333335, "grad_norm": 0.47036735332011803, "learning_rate": 2.266140924032908e-05, "loss": 0.1241, "loss_nan_ranks": 0, "loss_rank_avg": 0.10819728672504425, "step": 3655, "valid_targets_mean": 2694.6, "valid_targets_min": 1356 }, { "epoch": 3.588235294117647, "grad_norm": 0.5151780573315811, "learning_rate": 2.2612947351112836e-05, "loss": 0.1135, "loss_nan_ranks": 0, "loss_rank_avg": 0.1199716329574585, "step": 3660, "valid_targets_mean": 2438.4, "valid_targets_min": 924 }, { "epoch": 3.593137254901961, "grad_norm": 0.4298760911534975, "learning_rate": 2.2564469848810503e-05, "loss": 0.1049, "loss_nan_ranks": 0, "loss_rank_avg": 0.09393537044525146, "step": 3665, "valid_targets_mean": 2601.8, "valid_targets_min": 965 }, { "epoch": 3.5980392156862746, "grad_norm": 0.5502702790614998, "learning_rate": 2.2515977023088613e-05, "loss": 0.104, "loss_nan_ranks": 0, "loss_rank_avg": 0.13896121084690094, "step": 3670, "valid_targets_mean": 2215.3, "valid_targets_min": 778 }, { "epoch": 3.6029411764705883, "grad_norm": 0.578499401998039, "learning_rate": 2.246746916370527e-05, "loss": 0.1155, "loss_nan_ranks": 0, "loss_rank_avg": 0.12631025910377502, "step": 3675, "valid_targets_mean": 1959.6, "valid_targets_min": 560 }, { "epoch": 3.607843137254902, "grad_norm": 0.623239876434199, "learning_rate": 2.241894656050841e-05, "loss": 0.1117, "loss_nan_ranks": 0, "loss_rank_avg": 0.13602277636528015, "step": 3680, "valid_targets_mean": 1764.9, "valid_targets_min": 591 }, { "epoch": 3.6127450980392157, "grad_norm": 0.600465231043324, "learning_rate": 2.237040950343406e-05, "loss": 0.1194, "loss_nan_ranks": 0, "loss_rank_avg": 0.12396884709596634, "step": 3685, "valid_targets_mean": 1924.8, "valid_targets_min": 794 }, { "epoch": 3.6176470588235294, "grad_norm": 0.7319348639656394, "learning_rate": 2.2321858282504606e-05, "loss": 0.1325, "loss_nan_ranks": 0, "loss_rank_avg": 0.15651845932006836, "step": 3690, "valid_targets_mean": 1656.2, "valid_targets_min": 795 }, { "epoch": 3.622549019607843, "grad_norm": 0.5398063229503928, "learning_rate": 2.2273293187827093e-05, "loss": 0.104, "loss_nan_ranks": 0, "loss_rank_avg": 0.12730857729911804, "step": 3695, "valid_targets_mean": 1967.0, "valid_targets_min": 573 }, { "epoch": 3.627450980392157, "grad_norm": 0.7037019842887797, "learning_rate": 2.2224714509591436e-05, "loss": 0.115, "loss_nan_ranks": 0, "loss_rank_avg": 0.14245694875717163, "step": 3700, "valid_targets_mean": 1353.9, "valid_targets_min": 530 }, { "epoch": 3.6323529411764706, "grad_norm": 0.49584176697366805, "learning_rate": 2.2176122538068738e-05, "loss": 0.1088, "loss_nan_ranks": 0, "loss_rank_avg": 0.0984085351228714, "step": 3705, "valid_targets_mean": 2135.8, "valid_targets_min": 726 }, { "epoch": 3.6372549019607843, "grad_norm": 0.378093430237812, "learning_rate": 2.212751756360952e-05, "loss": 0.1005, "loss_nan_ranks": 0, "loss_rank_avg": 0.08473532646894455, "step": 3710, "valid_targets_mean": 2742.5, "valid_targets_min": 655 }, { "epoch": 3.642156862745098, "grad_norm": 0.45671211592262223, "learning_rate": 2.2078899876642e-05, "loss": 0.1145, "loss_nan_ranks": 0, "loss_rank_avg": 0.09947746247053146, "step": 3715, "valid_targets_mean": 2311.5, "valid_targets_min": 869 }, { "epoch": 3.6470588235294117, "grad_norm": 0.6022808568063974, "learning_rate": 2.2030269767670368e-05, "loss": 0.115, "loss_nan_ranks": 0, "loss_rank_avg": 0.12485545873641968, "step": 3720, "valid_targets_mean": 1894.9, "valid_targets_min": 753 }, { "epoch": 3.6519607843137254, "grad_norm": 0.4816296256677648, "learning_rate": 2.1981627527273023e-05, "loss": 0.1057, "loss_nan_ranks": 0, "loss_rank_avg": 0.1067422479391098, "step": 3725, "valid_targets_mean": 2501.2, "valid_targets_min": 765 }, { "epoch": 3.656862745098039, "grad_norm": 0.48952979423754794, "learning_rate": 2.1932973446100863e-05, "loss": 0.1064, "loss_nan_ranks": 0, "loss_rank_avg": 0.10704466700553894, "step": 3730, "valid_targets_mean": 2467.1, "valid_targets_min": 725 }, { "epoch": 3.661764705882353, "grad_norm": 0.5489743475632907, "learning_rate": 2.1884307814875537e-05, "loss": 0.1209, "loss_nan_ranks": 0, "loss_rank_avg": 0.1270291805267334, "step": 3735, "valid_targets_mean": 1769.5, "valid_targets_min": 534 }, { "epoch": 3.6666666666666665, "grad_norm": 0.4766948278075901, "learning_rate": 2.18356309243877e-05, "loss": 0.1088, "loss_nan_ranks": 0, "loss_rank_avg": 0.09539386630058289, "step": 3740, "valid_targets_mean": 2464.4, "valid_targets_min": 497 }, { "epoch": 3.6715686274509802, "grad_norm": 0.4847705657231007, "learning_rate": 2.1786943065495302e-05, "loss": 0.1113, "loss_nan_ranks": 0, "loss_rank_avg": 0.0939837098121643, "step": 3745, "valid_targets_mean": 2143.0, "valid_targets_min": 518 }, { "epoch": 3.6764705882352944, "grad_norm": 0.48673504467946466, "learning_rate": 2.173824452912181e-05, "loss": 0.1086, "loss_nan_ranks": 0, "loss_rank_avg": 0.10983025282621384, "step": 3750, "valid_targets_mean": 2503.6, "valid_targets_min": 731 }, { "epoch": 3.681372549019608, "grad_norm": 0.6394630567515267, "learning_rate": 2.1689535606254517e-05, "loss": 0.113, "loss_nan_ranks": 0, "loss_rank_avg": 0.13665525615215302, "step": 3755, "valid_targets_mean": 1859.1, "valid_targets_min": 424 }, { "epoch": 3.686274509803922, "grad_norm": 0.5404637568110688, "learning_rate": 2.164081658794276e-05, "loss": 0.1086, "loss_nan_ranks": 0, "loss_rank_avg": 0.11135978996753693, "step": 3760, "valid_targets_mean": 2087.4, "valid_targets_min": 784 }, { "epoch": 3.6911764705882355, "grad_norm": 0.5275619152100403, "learning_rate": 2.1592087765296186e-05, "loss": 0.1038, "loss_nan_ranks": 0, "loss_rank_avg": 0.1140526682138443, "step": 3765, "valid_targets_mean": 2225.5, "valid_targets_min": 1330 }, { "epoch": 3.696078431372549, "grad_norm": 0.4205808571949082, "learning_rate": 2.154334942948307e-05, "loss": 0.102, "loss_nan_ranks": 0, "loss_rank_avg": 0.09243638813495636, "step": 3770, "valid_targets_mean": 2574.8, "valid_targets_min": 789 }, { "epoch": 3.700980392156863, "grad_norm": 0.403760695863388, "learning_rate": 2.149460187172849e-05, "loss": 0.0959, "loss_nan_ranks": 0, "loss_rank_avg": 0.08560940623283386, "step": 3775, "valid_targets_mean": 2659.8, "valid_targets_min": 724 }, { "epoch": 3.7058823529411766, "grad_norm": 0.4755601372114485, "learning_rate": 2.144584538331264e-05, "loss": 0.1093, "loss_nan_ranks": 0, "loss_rank_avg": 0.12424452602863312, "step": 3780, "valid_targets_mean": 2388.5, "valid_targets_min": 609 }, { "epoch": 3.7107843137254903, "grad_norm": 0.5410875160432338, "learning_rate": 2.139708025556909e-05, "loss": 0.1185, "loss_nan_ranks": 0, "loss_rank_avg": 0.1277793049812317, "step": 3785, "valid_targets_mean": 2157.8, "valid_targets_min": 621 }, { "epoch": 3.715686274509804, "grad_norm": 0.5018258824660917, "learning_rate": 2.1348306779883004e-05, "loss": 0.1162, "loss_nan_ranks": 0, "loss_rank_avg": 0.11679060012102127, "step": 3790, "valid_targets_mean": 2386.1, "valid_targets_min": 674 }, { "epoch": 3.7205882352941178, "grad_norm": 0.4285080068758283, "learning_rate": 2.1299525247689466e-05, "loss": 0.1083, "loss_nan_ranks": 0, "loss_rank_avg": 0.08835404366254807, "step": 3795, "valid_targets_mean": 2637.9, "valid_targets_min": 929 }, { "epoch": 3.7254901960784315, "grad_norm": 0.530318250431301, "learning_rate": 2.1250735950471664e-05, "loss": 0.1225, "loss_nan_ranks": 0, "loss_rank_avg": 0.11783511936664581, "step": 3800, "valid_targets_mean": 2486.4, "valid_targets_min": 589 }, { "epoch": 3.730392156862745, "grad_norm": 0.44985130125257894, "learning_rate": 2.12019391797592e-05, "loss": 0.103, "loss_nan_ranks": 0, "loss_rank_avg": 0.08755841851234436, "step": 3805, "valid_targets_mean": 2712.6, "valid_targets_min": 939 }, { "epoch": 3.735294117647059, "grad_norm": 0.5286935035251132, "learning_rate": 2.1153135227126337e-05, "loss": 0.1053, "loss_nan_ranks": 0, "loss_rank_avg": 0.10353609919548035, "step": 3810, "valid_targets_mean": 2064.2, "valid_targets_min": 337 }, { "epoch": 3.7401960784313726, "grad_norm": 0.4601036655576194, "learning_rate": 2.1104324384190234e-05, "loss": 0.098, "loss_nan_ranks": 0, "loss_rank_avg": 0.10336270183324814, "step": 3815, "valid_targets_mean": 2523.7, "valid_targets_min": 790 }, { "epoch": 3.7450980392156863, "grad_norm": 0.561715253391712, "learning_rate": 2.105550694260925e-05, "loss": 0.1085, "loss_nan_ranks": 0, "loss_rank_avg": 0.10617645829916, "step": 3820, "valid_targets_mean": 1696.9, "valid_targets_min": 543 }, { "epoch": 3.75, "grad_norm": 0.508039672374628, "learning_rate": 2.1006683194081144e-05, "loss": 0.1106, "loss_nan_ranks": 0, "loss_rank_avg": 0.12362570315599442, "step": 3825, "valid_targets_mean": 2148.6, "valid_targets_min": 544 }, { "epoch": 3.7549019607843137, "grad_norm": 0.5062010089032453, "learning_rate": 2.0957853430341373e-05, "loss": 0.1065, "loss_nan_ranks": 0, "loss_rank_avg": 0.10452181100845337, "step": 3830, "valid_targets_mean": 2122.1, "valid_targets_min": 725 }, { "epoch": 3.7598039215686274, "grad_norm": 0.447000980086604, "learning_rate": 2.090901794316135e-05, "loss": 0.104, "loss_nan_ranks": 0, "loss_rank_avg": 0.09081129729747772, "step": 3835, "valid_targets_mean": 2808.3, "valid_targets_min": 922 }, { "epoch": 3.764705882352941, "grad_norm": 0.49795009536099594, "learning_rate": 2.086017702434666e-05, "loss": 0.1163, "loss_nan_ranks": 0, "loss_rank_avg": 0.12170379608869553, "step": 3840, "valid_targets_mean": 2495.4, "valid_targets_min": 720 }, { "epoch": 3.769607843137255, "grad_norm": 0.44563295566531946, "learning_rate": 2.081133096573535e-05, "loss": 0.1231, "loss_nan_ranks": 0, "loss_rank_avg": 0.1004648432135582, "step": 3845, "valid_targets_mean": 2524.3, "valid_targets_min": 737 }, { "epoch": 3.7745098039215685, "grad_norm": 0.47095104017094225, "learning_rate": 2.0762480059196207e-05, "loss": 0.1091, "loss_nan_ranks": 0, "loss_rank_avg": 0.09739089012145996, "step": 3850, "valid_targets_mean": 2408.9, "valid_targets_min": 809 }, { "epoch": 3.7794117647058822, "grad_norm": 0.4882628996629055, "learning_rate": 2.0713624596626945e-05, "loss": 0.1145, "loss_nan_ranks": 0, "loss_rank_avg": 0.10591503232717514, "step": 3855, "valid_targets_mean": 2017.6, "valid_targets_min": 564 }, { "epoch": 3.784313725490196, "grad_norm": 0.49785785642908204, "learning_rate": 2.0664764869952535e-05, "loss": 0.1098, "loss_nan_ranks": 0, "loss_rank_avg": 0.12032024562358856, "step": 3860, "valid_targets_mean": 2626.7, "valid_targets_min": 693 }, { "epoch": 3.7892156862745097, "grad_norm": 0.40453258551835614, "learning_rate": 2.061590117112341e-05, "loss": 0.1052, "loss_nan_ranks": 0, "loss_rank_avg": 0.1063418835401535, "step": 3865, "valid_targets_mean": 2805.0, "valid_targets_min": 848 }, { "epoch": 3.7941176470588234, "grad_norm": 0.4375416998410625, "learning_rate": 2.056703379211373e-05, "loss": 0.1078, "loss_nan_ranks": 0, "loss_rank_avg": 0.11425399035215378, "step": 3870, "valid_targets_mean": 2723.6, "valid_targets_min": 539 }, { "epoch": 3.799019607843137, "grad_norm": 0.45739452140837245, "learning_rate": 2.0518163024919677e-05, "loss": 0.1022, "loss_nan_ranks": 0, "loss_rank_avg": 0.09378018975257874, "step": 3875, "valid_targets_mean": 2357.4, "valid_targets_min": 693 }, { "epoch": 3.803921568627451, "grad_norm": 0.5672950655638906, "learning_rate": 2.0469289161557637e-05, "loss": 0.1059, "loss_nan_ranks": 0, "loss_rank_avg": 0.1068982183933258, "step": 3880, "valid_targets_mean": 2123.6, "valid_targets_min": 782 }, { "epoch": 3.8088235294117645, "grad_norm": 0.6099769627480358, "learning_rate": 2.042041249406253e-05, "loss": 0.1041, "loss_nan_ranks": 0, "loss_rank_avg": 0.1426199972629547, "step": 3885, "valid_targets_mean": 2168.8, "valid_targets_min": 740 }, { "epoch": 3.813725490196078, "grad_norm": 0.5004067455512964, "learning_rate": 2.0371533314486017e-05, "loss": 0.1033, "loss_nan_ranks": 0, "loss_rank_avg": 0.11419737339019775, "step": 3890, "valid_targets_mean": 2435.4, "valid_targets_min": 647 }, { "epoch": 3.818627450980392, "grad_norm": 0.5661678936881082, "learning_rate": 2.0322651914894754e-05, "loss": 0.109, "loss_nan_ranks": 0, "loss_rank_avg": 0.14499229192733765, "step": 3895, "valid_targets_mean": 2460.9, "valid_targets_min": 730 }, { "epoch": 3.8235294117647056, "grad_norm": 0.49732546990907106, "learning_rate": 2.02737685873687e-05, "loss": 0.1071, "loss_nan_ranks": 0, "loss_rank_avg": 0.11961804330348969, "step": 3900, "valid_targets_mean": 2059.0, "valid_targets_min": 704 }, { "epoch": 3.8284313725490198, "grad_norm": 0.4993481866260662, "learning_rate": 2.0224883623999313e-05, "loss": 0.114, "loss_nan_ranks": 0, "loss_rank_avg": 0.10117202252149582, "step": 3905, "valid_targets_mean": 2220.4, "valid_targets_min": 893 }, { "epoch": 3.8333333333333335, "grad_norm": 0.5538681599370652, "learning_rate": 2.0175997316887802e-05, "loss": 0.1139, "loss_nan_ranks": 0, "loss_rank_avg": 0.109494149684906, "step": 3910, "valid_targets_mean": 1981.0, "valid_targets_min": 661 }, { "epoch": 3.838235294117647, "grad_norm": 0.45218493019291356, "learning_rate": 2.012710995814345e-05, "loss": 0.1074, "loss_nan_ranks": 0, "loss_rank_avg": 0.09603475034236908, "step": 3915, "valid_targets_mean": 2731.0, "valid_targets_min": 862 }, { "epoch": 3.843137254901961, "grad_norm": 0.44119940995141127, "learning_rate": 2.0078221839881805e-05, "loss": 0.1203, "loss_nan_ranks": 0, "loss_rank_avg": 0.10505522787570953, "step": 3920, "valid_targets_mean": 2638.4, "valid_targets_min": 909 }, { "epoch": 3.8480392156862746, "grad_norm": 0.4960608782273173, "learning_rate": 2.0029333254222934e-05, "loss": 0.1212, "loss_nan_ranks": 0, "loss_rank_avg": 0.11102761328220367, "step": 3925, "valid_targets_mean": 1909.0, "valid_targets_min": 620 }, { "epoch": 3.8529411764705883, "grad_norm": 0.5586535920480638, "learning_rate": 1.9980444493289725e-05, "loss": 0.108, "loss_nan_ranks": 0, "loss_rank_avg": 0.12268592417240143, "step": 3930, "valid_targets_mean": 2376.0, "valid_targets_min": 725 }, { "epoch": 3.857843137254902, "grad_norm": 0.5393773385617813, "learning_rate": 1.9931555849206106e-05, "loss": 0.1101, "loss_nan_ranks": 0, "loss_rank_avg": 0.11982365697622299, "step": 3935, "valid_targets_mean": 2329.8, "valid_targets_min": 616 }, { "epoch": 3.8627450980392157, "grad_norm": 0.4725284612750934, "learning_rate": 1.9882667614095287e-05, "loss": 0.1088, "loss_nan_ranks": 0, "loss_rank_avg": 0.10902339220046997, "step": 3940, "valid_targets_mean": 2420.7, "valid_targets_min": 713 }, { "epoch": 3.8676470588235294, "grad_norm": 0.4171871943502758, "learning_rate": 1.9833780080078063e-05, "loss": 0.0977, "loss_nan_ranks": 0, "loss_rank_avg": 0.0916203111410141, "step": 3945, "valid_targets_mean": 2523.8, "valid_targets_min": 745 }, { "epoch": 3.872549019607843, "grad_norm": 0.5163398783108317, "learning_rate": 1.9784893539271026e-05, "loss": 0.1099, "loss_nan_ranks": 0, "loss_rank_avg": 0.10017865151166916, "step": 3950, "valid_targets_mean": 1958.1, "valid_targets_min": 680 }, { "epoch": 3.877450980392157, "grad_norm": 0.7754438443029995, "learning_rate": 1.9736008283784824e-05, "loss": 0.1298, "loss_nan_ranks": 0, "loss_rank_avg": 0.1341777741909027, "step": 3955, "valid_targets_mean": 1683.8, "valid_targets_min": 731 }, { "epoch": 3.8823529411764706, "grad_norm": 0.5273279125239405, "learning_rate": 1.9687124605722448e-05, "loss": 0.12, "loss_nan_ranks": 0, "loss_rank_avg": 0.12256628274917603, "step": 3960, "valid_targets_mean": 2042.1, "valid_targets_min": 790 }, { "epoch": 3.8872549019607843, "grad_norm": 0.4144565504865219, "learning_rate": 1.963824279717744e-05, "loss": 0.0989, "loss_nan_ranks": 0, "loss_rank_avg": 0.0842713862657547, "step": 3965, "valid_targets_mean": 2443.1, "valid_targets_min": 687 }, { "epoch": 3.892156862745098, "grad_norm": 0.5679541187571767, "learning_rate": 1.9589363150232194e-05, "loss": 0.1084, "loss_nan_ranks": 0, "loss_rank_avg": 0.11258754879236221, "step": 3970, "valid_targets_mean": 1869.7, "valid_targets_min": 844 }, { "epoch": 3.8970588235294117, "grad_norm": 0.5272383246437135, "learning_rate": 1.9540485956956166e-05, "loss": 0.1208, "loss_nan_ranks": 0, "loss_rank_avg": 0.12583494186401367, "step": 3975, "valid_targets_mean": 2390.6, "valid_targets_min": 733 }, { "epoch": 3.9019607843137254, "grad_norm": 0.49411797125684626, "learning_rate": 1.9491611509404156e-05, "loss": 0.1092, "loss_nan_ranks": 0, "loss_rank_avg": 0.11986801028251648, "step": 3980, "valid_targets_mean": 2076.8, "valid_targets_min": 683 }, { "epoch": 3.906862745098039, "grad_norm": 0.5683723121360503, "learning_rate": 1.9442740099614573e-05, "loss": 0.1286, "loss_nan_ranks": 0, "loss_rank_avg": 0.12163309752941132, "step": 3985, "valid_targets_mean": 2084.8, "valid_targets_min": 949 }, { "epoch": 3.911764705882353, "grad_norm": 0.4366403979214397, "learning_rate": 1.9393872019607658e-05, "loss": 0.1139, "loss_nan_ranks": 0, "loss_rank_avg": 0.10083067417144775, "step": 3990, "valid_targets_mean": 2892.9, "valid_targets_min": 790 }, { "epoch": 3.9166666666666665, "grad_norm": 0.47443132807924027, "learning_rate": 1.9345007561383755e-05, "loss": 0.0997, "loss_nan_ranks": 0, "loss_rank_avg": 0.09945064783096313, "step": 3995, "valid_targets_mean": 2261.6, "valid_targets_min": 998 }, { "epoch": 3.9215686274509802, "grad_norm": 0.6756799450871543, "learning_rate": 1.929614701692159e-05, "loss": 0.1219, "loss_nan_ranks": 0, "loss_rank_avg": 0.1440548300743103, "step": 4000, "valid_targets_mean": 1480.9, "valid_targets_min": 684 }, { "epoch": 3.9264705882352944, "grad_norm": 0.6431235449873466, "learning_rate": 1.924729067817646e-05, "loss": 0.1093, "loss_nan_ranks": 0, "loss_rank_avg": 0.12017422914505005, "step": 4005, "valid_targets_mean": 1699.6, "valid_targets_min": 521 }, { "epoch": 3.931372549019608, "grad_norm": 0.5361794880222236, "learning_rate": 1.919843883707858e-05, "loss": 0.1043, "loss_nan_ranks": 0, "loss_rank_avg": 0.12894302606582642, "step": 4010, "valid_targets_mean": 2346.9, "valid_targets_min": 810 }, { "epoch": 3.936274509803922, "grad_norm": 0.5846150875543148, "learning_rate": 1.9149591785531256e-05, "loss": 0.1127, "loss_nan_ranks": 0, "loss_rank_avg": 0.12245102971792221, "step": 4015, "valid_targets_mean": 1880.8, "valid_targets_min": 677 }, { "epoch": 3.9411764705882355, "grad_norm": 0.6251138407178463, "learning_rate": 1.9100749815409185e-05, "loss": 0.1075, "loss_nan_ranks": 0, "loss_rank_avg": 0.1449219137430191, "step": 4020, "valid_targets_mean": 1870.9, "valid_targets_min": 625 }, { "epoch": 3.946078431372549, "grad_norm": 0.4889900134198115, "learning_rate": 1.905191321855671e-05, "loss": 0.1081, "loss_nan_ranks": 0, "loss_rank_avg": 0.10330167412757874, "step": 4025, "valid_targets_mean": 2078.4, "valid_targets_min": 695 }, { "epoch": 3.950980392156863, "grad_norm": 0.4651475351048309, "learning_rate": 1.9003082286786056e-05, "loss": 0.1115, "loss_nan_ranks": 0, "loss_rank_avg": 0.1023440957069397, "step": 4030, "valid_targets_mean": 2225.9, "valid_targets_min": 647 }, { "epoch": 3.9558823529411766, "grad_norm": 0.4021607738658494, "learning_rate": 1.895425731187561e-05, "loss": 0.0951, "loss_nan_ranks": 0, "loss_rank_avg": 0.08778274804353714, "step": 4035, "valid_targets_mean": 2479.3, "valid_targets_min": 602 }, { "epoch": 3.9607843137254903, "grad_norm": 0.6217464371869531, "learning_rate": 1.8905438585568148e-05, "loss": 0.1233, "loss_nan_ranks": 0, "loss_rank_avg": 0.12868231534957886, "step": 4040, "valid_targets_mean": 1891.4, "valid_targets_min": 754 }, { "epoch": 3.965686274509804, "grad_norm": 0.4856130983795896, "learning_rate": 1.8856626399569114e-05, "loss": 0.1046, "loss_nan_ranks": 0, "loss_rank_avg": 0.112669438123703, "step": 4045, "valid_targets_mean": 2243.1, "valid_targets_min": 534 }, { "epoch": 3.9705882352941178, "grad_norm": 0.4750769123731014, "learning_rate": 1.880782104554489e-05, "loss": 0.098, "loss_nan_ranks": 0, "loss_rank_avg": 0.09736385941505432, "step": 4050, "valid_targets_mean": 2243.9, "valid_targets_min": 482 }, { "epoch": 3.9754901960784315, "grad_norm": 0.405301707427997, "learning_rate": 1.875902281512101e-05, "loss": 0.1037, "loss_nan_ranks": 0, "loss_rank_avg": 0.08424034714698792, "step": 4055, "valid_targets_mean": 2575.7, "valid_targets_min": 848 }, { "epoch": 3.980392156862745, "grad_norm": 0.4561960422936826, "learning_rate": 1.8710231999880446e-05, "loss": 0.1052, "loss_nan_ranks": 0, "loss_rank_avg": 0.09456402063369751, "step": 4060, "valid_targets_mean": 2422.7, "valid_targets_min": 613 }, { "epoch": 3.985294117647059, "grad_norm": 0.3696563343388035, "learning_rate": 1.866144889136189e-05, "loss": 0.0976, "loss_nan_ranks": 0, "loss_rank_avg": 0.07512452453374863, "step": 4065, "valid_targets_mean": 2838.2, "valid_targets_min": 823 }, { "epoch": 3.9901960784313726, "grad_norm": 0.46963438097328625, "learning_rate": 1.861267378105795e-05, "loss": 0.1116, "loss_nan_ranks": 0, "loss_rank_avg": 0.12728336453437805, "step": 4070, "valid_targets_mean": 2365.9, "valid_targets_min": 591 }, { "epoch": 3.9950980392156863, "grad_norm": 0.4803268550916603, "learning_rate": 1.856390696041345e-05, "loss": 0.1158, "loss_nan_ranks": 0, "loss_rank_avg": 0.10719768702983856, "step": 4075, "valid_targets_mean": 2434.1, "valid_targets_min": 812 }, { "epoch": 4.0, "grad_norm": 0.5293457714014153, "learning_rate": 1.8515148720823703e-05, "loss": 0.1031, "loss_nan_ranks": 0, "loss_rank_avg": 0.10042376816272736, "step": 4080, "valid_targets_mean": 1962.6, "valid_targets_min": 623 }, { "epoch": 4.004901960784314, "grad_norm": 0.5644338107149101, "learning_rate": 1.846639935363272e-05, "loss": 0.0947, "loss_nan_ranks": 0, "loss_rank_avg": 0.09875704348087311, "step": 4085, "valid_targets_mean": 1990.8, "valid_targets_min": 780 }, { "epoch": 4.009803921568627, "grad_norm": 0.4444963540738002, "learning_rate": 1.8417659150131507e-05, "loss": 0.0906, "loss_nan_ranks": 0, "loss_rank_avg": 0.07949922233819962, "step": 4090, "valid_targets_mean": 2462.4, "valid_targets_min": 472 }, { "epoch": 4.014705882352941, "grad_norm": 0.5230285801588905, "learning_rate": 1.8368928401556334e-05, "loss": 0.0913, "loss_nan_ranks": 0, "loss_rank_avg": 0.09187965095043182, "step": 4095, "valid_targets_mean": 2216.2, "valid_targets_min": 715 }, { "epoch": 4.019607843137255, "grad_norm": 0.444478652714691, "learning_rate": 1.8320207399086936e-05, "loss": 0.091, "loss_nan_ranks": 0, "loss_rank_avg": 0.08924181759357452, "step": 4100, "valid_targets_mean": 2502.8, "valid_targets_min": 520 }, { "epoch": 4.0245098039215685, "grad_norm": 0.4467580920948847, "learning_rate": 1.827149643384484e-05, "loss": 0.0838, "loss_nan_ranks": 0, "loss_rank_avg": 0.0863981693983078, "step": 4105, "valid_targets_mean": 3037.9, "valid_targets_min": 960 }, { "epoch": 4.029411764705882, "grad_norm": 0.5074124961478061, "learning_rate": 1.8222795796891596e-05, "loss": 0.093, "loss_nan_ranks": 0, "loss_rank_avg": 0.09525004774332047, "step": 4110, "valid_targets_mean": 2213.2, "valid_targets_min": 776 }, { "epoch": 4.034313725490196, "grad_norm": 0.4688138171504505, "learning_rate": 1.8174105779227038e-05, "loss": 0.0834, "loss_nan_ranks": 0, "loss_rank_avg": 0.07826852798461914, "step": 4115, "valid_targets_mean": 2524.2, "valid_targets_min": 704 }, { "epoch": 4.03921568627451, "grad_norm": 0.5495964133592056, "learning_rate": 1.8125426671787535e-05, "loss": 0.0829, "loss_nan_ranks": 0, "loss_rank_avg": 0.08855336904525757, "step": 4120, "valid_targets_mean": 2184.7, "valid_targets_min": 742 }, { "epoch": 4.044117647058823, "grad_norm": 0.6649719549369908, "learning_rate": 1.8076758765444272e-05, "loss": 0.0954, "loss_nan_ranks": 0, "loss_rank_avg": 0.10872084647417068, "step": 4125, "valid_targets_mean": 1982.1, "valid_targets_min": 905 }, { "epoch": 4.049019607843137, "grad_norm": 0.558854630746821, "learning_rate": 1.8028102351001515e-05, "loss": 0.087, "loss_nan_ranks": 0, "loss_rank_avg": 0.07840010523796082, "step": 4130, "valid_targets_mean": 2404.1, "valid_targets_min": 635 }, { "epoch": 4.053921568627451, "grad_norm": 0.5709714861960441, "learning_rate": 1.7979457719194847e-05, "loss": 0.1013, "loss_nan_ranks": 0, "loss_rank_avg": 0.09838423132896423, "step": 4135, "valid_targets_mean": 2030.4, "valid_targets_min": 715 }, { "epoch": 4.0588235294117645, "grad_norm": 0.6188829630512815, "learning_rate": 1.7930825160689448e-05, "loss": 0.1066, "loss_nan_ranks": 0, "loss_rank_avg": 0.14148059487342834, "step": 4140, "valid_targets_mean": 1973.7, "valid_targets_min": 678 }, { "epoch": 4.063725490196078, "grad_norm": 0.5426801567468893, "learning_rate": 1.7882204966078377e-05, "loss": 0.1098, "loss_nan_ranks": 0, "loss_rank_avg": 0.09950780123472214, "step": 4145, "valid_targets_mean": 2231.3, "valid_targets_min": 801 }, { "epoch": 4.068627450980392, "grad_norm": 0.47654840956847533, "learning_rate": 1.7833597425880786e-05, "loss": 0.1008, "loss_nan_ranks": 0, "loss_rank_avg": 0.0965999960899353, "step": 4150, "valid_targets_mean": 2403.3, "valid_targets_min": 712 }, { "epoch": 4.073529411764706, "grad_norm": 0.5293696212843991, "learning_rate": 1.7785002830540225e-05, "loss": 0.0871, "loss_nan_ranks": 0, "loss_rank_avg": 0.08954203128814697, "step": 4155, "valid_targets_mean": 2344.8, "valid_targets_min": 538 }, { "epoch": 4.078431372549019, "grad_norm": 0.5975080969452089, "learning_rate": 1.7736421470422915e-05, "loss": 0.0865, "loss_nan_ranks": 0, "loss_rank_avg": 0.09741682559251785, "step": 4160, "valid_targets_mean": 2047.7, "valid_targets_min": 660 }, { "epoch": 4.083333333333333, "grad_norm": 0.48604759979340684, "learning_rate": 1.7687853635815953e-05, "loss": 0.0943, "loss_nan_ranks": 0, "loss_rank_avg": 0.08825595676898956, "step": 4165, "valid_targets_mean": 2451.2, "valid_targets_min": 1195 }, { "epoch": 4.088235294117647, "grad_norm": 0.5268849125233499, "learning_rate": 1.7639299616925645e-05, "loss": 0.0897, "loss_nan_ranks": 0, "loss_rank_avg": 0.13385260105133057, "step": 4170, "valid_targets_mean": 2277.0, "valid_targets_min": 718 }, { "epoch": 4.0931372549019605, "grad_norm": 0.492794433426126, "learning_rate": 1.7590759703875752e-05, "loss": 0.0926, "loss_nan_ranks": 0, "loss_rank_avg": 0.10988749563694, "step": 4175, "valid_targets_mean": 2417.8, "valid_targets_min": 847 }, { "epoch": 4.098039215686274, "grad_norm": 0.6013133531068834, "learning_rate": 1.7542234186705722e-05, "loss": 0.0941, "loss_nan_ranks": 0, "loss_rank_avg": 0.09224649518728256, "step": 4180, "valid_targets_mean": 1765.2, "valid_targets_min": 721 }, { "epoch": 4.102941176470588, "grad_norm": 0.7495395672799343, "learning_rate": 1.7493723355368995e-05, "loss": 0.1011, "loss_nan_ranks": 0, "loss_rank_avg": 0.10524407029151917, "step": 4185, "valid_targets_mean": 1362.1, "valid_targets_min": 595 }, { "epoch": 4.107843137254902, "grad_norm": 0.6364621332679006, "learning_rate": 1.744522749973127e-05, "loss": 0.1011, "loss_nan_ranks": 0, "loss_rank_avg": 0.08376060426235199, "step": 4190, "valid_targets_mean": 1726.0, "valid_targets_min": 732 }, { "epoch": 4.112745098039215, "grad_norm": 0.5201856732191488, "learning_rate": 1.7396746909568748e-05, "loss": 0.0934, "loss_nan_ranks": 0, "loss_rank_avg": 0.0875372588634491, "step": 4195, "valid_targets_mean": 2352.5, "valid_targets_min": 541 }, { "epoch": 4.117647058823529, "grad_norm": 0.49596492927230623, "learning_rate": 1.7348281874566417e-05, "loss": 0.0909, "loss_nan_ranks": 0, "loss_rank_avg": 0.08408987522125244, "step": 4200, "valid_targets_mean": 2508.0, "valid_targets_min": 891 }, { "epoch": 4.122549019607843, "grad_norm": 0.5693396360569704, "learning_rate": 1.7299832684316323e-05, "loss": 0.085, "loss_nan_ranks": 0, "loss_rank_avg": 0.09746822714805603, "step": 4205, "valid_targets_mean": 2194.4, "valid_targets_min": 618 }, { "epoch": 4.127450980392156, "grad_norm": 0.43092782426008985, "learning_rate": 1.725139962831584e-05, "loss": 0.0917, "loss_nan_ranks": 0, "loss_rank_avg": 0.09253295511007309, "step": 4210, "valid_targets_mean": 2626.4, "valid_targets_min": 610 }, { "epoch": 4.132352941176471, "grad_norm": 0.4724890600327457, "learning_rate": 1.7202982995965912e-05, "loss": 0.0948, "loss_nan_ranks": 0, "loss_rank_avg": 0.0815335363149643, "step": 4215, "valid_targets_mean": 2930.8, "valid_targets_min": 720 }, { "epoch": 4.137254901960785, "grad_norm": 0.5689305179379935, "learning_rate": 1.7154583076569376e-05, "loss": 0.0986, "loss_nan_ranks": 0, "loss_rank_avg": 0.08635899424552917, "step": 4220, "valid_targets_mean": 2238.6, "valid_targets_min": 676 }, { "epoch": 4.142156862745098, "grad_norm": 0.47177819632108414, "learning_rate": 1.7106200159329197e-05, "loss": 0.0872, "loss_nan_ranks": 0, "loss_rank_avg": 0.08042912185192108, "step": 4225, "valid_targets_mean": 2839.6, "valid_targets_min": 867 }, { "epoch": 4.147058823529412, "grad_norm": 0.48065078368458986, "learning_rate": 1.705783453334673e-05, "loss": 0.0943, "loss_nan_ranks": 0, "loss_rank_avg": 0.08426964282989502, "step": 4230, "valid_targets_mean": 2610.4, "valid_targets_min": 950 }, { "epoch": 4.151960784313726, "grad_norm": 0.6553478415791882, "learning_rate": 1.7009486487620024e-05, "loss": 0.1046, "loss_nan_ranks": 0, "loss_rank_avg": 0.09982205182313919, "step": 4235, "valid_targets_mean": 1791.4, "valid_targets_min": 662 }, { "epoch": 4.1568627450980395, "grad_norm": 0.6041270719163585, "learning_rate": 1.6961156311042085e-05, "loss": 0.0959, "loss_nan_ranks": 0, "loss_rank_avg": 0.11420536041259766, "step": 4240, "valid_targets_mean": 2226.8, "valid_targets_min": 801 }, { "epoch": 4.161764705882353, "grad_norm": 0.5619416375343212, "learning_rate": 1.6912844292399143e-05, "loss": 0.0955, "loss_nan_ranks": 0, "loss_rank_avg": 0.0868932455778122, "step": 4245, "valid_targets_mean": 1945.8, "valid_targets_min": 829 }, { "epoch": 4.166666666666667, "grad_norm": 0.6065314115589832, "learning_rate": 1.6864550720368915e-05, "loss": 0.0953, "loss_nan_ranks": 0, "loss_rank_avg": 0.11492280662059784, "step": 4250, "valid_targets_mean": 2105.5, "valid_targets_min": 907 }, { "epoch": 4.171568627450981, "grad_norm": 0.5544175260955679, "learning_rate": 1.6816275883518917e-05, "loss": 0.0886, "loss_nan_ranks": 0, "loss_rank_avg": 0.08502060174942017, "step": 4255, "valid_targets_mean": 2211.4, "valid_targets_min": 515 }, { "epoch": 4.176470588235294, "grad_norm": 0.5310513730362705, "learning_rate": 1.6768020070304704e-05, "loss": 0.0905, "loss_nan_ranks": 0, "loss_rank_avg": 0.09640628099441528, "step": 4260, "valid_targets_mean": 2702.8, "valid_targets_min": 621 }, { "epoch": 4.181372549019608, "grad_norm": 0.7288794320718324, "learning_rate": 1.6719783569068154e-05, "loss": 0.0955, "loss_nan_ranks": 0, "loss_rank_avg": 0.10868661850690842, "step": 4265, "valid_targets_mean": 1660.6, "valid_targets_min": 524 }, { "epoch": 4.186274509803922, "grad_norm": 0.49490583836739976, "learning_rate": 1.6671566668035765e-05, "loss": 0.094, "loss_nan_ranks": 0, "loss_rank_avg": 0.08493231236934662, "step": 4270, "valid_targets_mean": 2460.1, "valid_targets_min": 485 }, { "epoch": 4.1911764705882355, "grad_norm": 0.548822021790285, "learning_rate": 1.6623369655316915e-05, "loss": 0.0975, "loss_nan_ranks": 0, "loss_rank_avg": 0.09106888622045517, "step": 4275, "valid_targets_mean": 2058.1, "valid_targets_min": 610 }, { "epoch": 4.196078431372549, "grad_norm": 0.5580145934153147, "learning_rate": 1.657519281890213e-05, "loss": 0.0871, "loss_nan_ranks": 0, "loss_rank_avg": 0.08765994012355804, "step": 4280, "valid_targets_mean": 1777.9, "valid_targets_min": 726 }, { "epoch": 4.200980392156863, "grad_norm": 0.45822454413438735, "learning_rate": 1.6527036446661396e-05, "loss": 0.0929, "loss_nan_ranks": 0, "loss_rank_avg": 0.08106301724910736, "step": 4285, "valid_targets_mean": 3128.1, "valid_targets_min": 988 }, { "epoch": 4.205882352941177, "grad_norm": 0.6180110752258359, "learning_rate": 1.647890082634241e-05, "loss": 0.096, "loss_nan_ranks": 0, "loss_rank_avg": 0.1506294459104538, "step": 4290, "valid_targets_mean": 2282.9, "valid_targets_min": 867 }, { "epoch": 4.21078431372549, "grad_norm": 0.5445669104444656, "learning_rate": 1.6430786245568865e-05, "loss": 0.0844, "loss_nan_ranks": 0, "loss_rank_avg": 0.09008940309286118, "step": 4295, "valid_targets_mean": 2389.7, "valid_targets_min": 812 }, { "epoch": 4.215686274509804, "grad_norm": 0.5055418184306785, "learning_rate": 1.638269299183875e-05, "loss": 0.0932, "loss_nan_ranks": 0, "loss_rank_avg": 0.08286339044570923, "step": 4300, "valid_targets_mean": 2237.7, "valid_targets_min": 647 }, { "epoch": 4.220588235294118, "grad_norm": 0.453249556971749, "learning_rate": 1.6334621352522606e-05, "loss": 0.0912, "loss_nan_ranks": 0, "loss_rank_avg": 0.09033799916505814, "step": 4305, "valid_targets_mean": 2639.6, "valid_targets_min": 695 }, { "epoch": 4.2254901960784315, "grad_norm": 0.6613125276955629, "learning_rate": 1.6286571614861845e-05, "loss": 0.1013, "loss_nan_ranks": 0, "loss_rank_avg": 0.09440892934799194, "step": 4310, "valid_targets_mean": 1669.6, "valid_targets_min": 625 }, { "epoch": 4.230392156862745, "grad_norm": 0.5980358240831692, "learning_rate": 1.6238544065966974e-05, "loss": 0.0972, "loss_nan_ranks": 0, "loss_rank_avg": 0.09913182258605957, "step": 4315, "valid_targets_mean": 1975.6, "valid_targets_min": 622 }, { "epoch": 4.235294117647059, "grad_norm": 0.511127190936502, "learning_rate": 1.6190538992815945e-05, "loss": 0.1012, "loss_nan_ranks": 0, "loss_rank_avg": 0.11423664540052414, "step": 4320, "valid_targets_mean": 2052.5, "valid_targets_min": 541 }, { "epoch": 4.240196078431373, "grad_norm": 0.5626942407060462, "learning_rate": 1.6142556682252404e-05, "loss": 0.0953, "loss_nan_ranks": 0, "loss_rank_avg": 0.09917297214269638, "step": 4325, "valid_targets_mean": 2183.7, "valid_targets_min": 697 }, { "epoch": 4.245098039215686, "grad_norm": 0.6911199917714397, "learning_rate": 1.609459742098398e-05, "loss": 0.1068, "loss_nan_ranks": 0, "loss_rank_avg": 0.14647285640239716, "step": 4330, "valid_targets_mean": 1848.5, "valid_targets_min": 740 }, { "epoch": 4.25, "grad_norm": 0.531542801596997, "learning_rate": 1.604666149558057e-05, "loss": 0.0868, "loss_nan_ranks": 0, "loss_rank_avg": 0.09663405269384384, "step": 4335, "valid_targets_mean": 2882.6, "valid_targets_min": 1324 }, { "epoch": 4.254901960784314, "grad_norm": 0.5773829854027778, "learning_rate": 1.5998749192472666e-05, "loss": 0.1095, "loss_nan_ranks": 0, "loss_rank_avg": 0.11062102019786835, "step": 4340, "valid_targets_mean": 1834.8, "valid_targets_min": 447 }, { "epoch": 4.259803921568627, "grad_norm": 0.5691933965635515, "learning_rate": 1.595086079794955e-05, "loss": 0.0996, "loss_nan_ranks": 0, "loss_rank_avg": 0.08927673101425171, "step": 4345, "valid_targets_mean": 1940.2, "valid_targets_min": 542 }, { "epoch": 4.264705882352941, "grad_norm": 0.46575860504404326, "learning_rate": 1.5902996598157705e-05, "loss": 0.0976, "loss_nan_ranks": 0, "loss_rank_avg": 0.09074290096759796, "step": 4350, "valid_targets_mean": 2670.6, "valid_targets_min": 788 }, { "epoch": 4.269607843137255, "grad_norm": 0.4873669002421505, "learning_rate": 1.5855156879099012e-05, "loss": 0.093, "loss_nan_ranks": 0, "loss_rank_avg": 0.08654345571994781, "step": 4355, "valid_targets_mean": 2558.1, "valid_targets_min": 963 }, { "epoch": 4.2745098039215685, "grad_norm": 0.57544806936859, "learning_rate": 1.5807341926629073e-05, "loss": 0.0922, "loss_nan_ranks": 0, "loss_rank_avg": 0.10240624845027924, "step": 4360, "valid_targets_mean": 2204.3, "valid_targets_min": 740 }, { "epoch": 4.279411764705882, "grad_norm": 0.667247621859043, "learning_rate": 1.575955202645551e-05, "loss": 0.1035, "loss_nan_ranks": 0, "loss_rank_avg": 0.11562317609786987, "step": 4365, "valid_targets_mean": 2166.3, "valid_targets_min": 809 }, { "epoch": 4.284313725490196, "grad_norm": 0.5322428960008451, "learning_rate": 1.571178746413625e-05, "loss": 0.0957, "loss_nan_ranks": 0, "loss_rank_avg": 0.09002898633480072, "step": 4370, "valid_targets_mean": 2169.4, "valid_targets_min": 700 }, { "epoch": 4.28921568627451, "grad_norm": 0.44379666480899166, "learning_rate": 1.5664048525077827e-05, "loss": 0.0948, "loss_nan_ranks": 0, "loss_rank_avg": 0.07158397883176804, "step": 4375, "valid_targets_mean": 3081.1, "valid_targets_min": 748 }, { "epoch": 4.294117647058823, "grad_norm": 0.5134899363308195, "learning_rate": 1.5616335494533644e-05, "loss": 0.1019, "loss_nan_ranks": 0, "loss_rank_avg": 0.085150808095932, "step": 4380, "valid_targets_mean": 2649.4, "valid_targets_min": 910 }, { "epoch": 4.299019607843137, "grad_norm": 0.5633333659303986, "learning_rate": 1.5568648657602316e-05, "loss": 0.0902, "loss_nan_ranks": 0, "loss_rank_avg": 0.08845022320747375, "step": 4385, "valid_targets_mean": 1813.4, "valid_targets_min": 721 }, { "epoch": 4.303921568627451, "grad_norm": 0.4207910793387121, "learning_rate": 1.5520988299225942e-05, "loss": 0.0994, "loss_nan_ranks": 0, "loss_rank_avg": 0.08506350219249725, "step": 4390, "valid_targets_mean": 3005.1, "valid_targets_min": 718 }, { "epoch": 4.3088235294117645, "grad_norm": 0.5975251690244275, "learning_rate": 1.5473354704188397e-05, "loss": 0.1012, "loss_nan_ranks": 0, "loss_rank_avg": 0.08913823962211609, "step": 4395, "valid_targets_mean": 1923.8, "valid_targets_min": 728 }, { "epoch": 4.313725490196078, "grad_norm": 0.5423697805466529, "learning_rate": 1.5425748157113632e-05, "loss": 0.1007, "loss_nan_ranks": 0, "loss_rank_avg": 0.1019233986735344, "step": 4400, "valid_targets_mean": 2368.1, "valid_targets_min": 682 }, { "epoch": 4.318627450980392, "grad_norm": 0.5387628160624569, "learning_rate": 1.5378168942464003e-05, "loss": 0.0852, "loss_nan_ranks": 0, "loss_rank_avg": 0.09121586382389069, "step": 4405, "valid_targets_mean": 2608.4, "valid_targets_min": 596 }, { "epoch": 4.323529411764706, "grad_norm": 0.5633768847500502, "learning_rate": 1.5330617344538517e-05, "loss": 0.0932, "loss_nan_ranks": 0, "loss_rank_avg": 0.08939993381500244, "step": 4410, "valid_targets_mean": 1958.5, "valid_targets_min": 704 }, { "epoch": 4.328431372549019, "grad_norm": 0.7836118578665316, "learning_rate": 1.528309364747118e-05, "loss": 0.0949, "loss_nan_ranks": 0, "loss_rank_avg": 0.12606091797351837, "step": 4415, "valid_targets_mean": 1545.8, "valid_targets_min": 682 }, { "epoch": 4.333333333333333, "grad_norm": 0.7139630949750333, "learning_rate": 1.5235598135229291e-05, "loss": 0.0998, "loss_nan_ranks": 0, "loss_rank_avg": 0.10998935997486115, "step": 4420, "valid_targets_mean": 2041.0, "valid_targets_min": 826 }, { "epoch": 4.338235294117647, "grad_norm": 0.6463858784540754, "learning_rate": 1.5188131091611715e-05, "loss": 0.0944, "loss_nan_ranks": 0, "loss_rank_avg": 0.11081689596176147, "step": 4425, "valid_targets_mean": 1975.4, "valid_targets_min": 788 }, { "epoch": 4.3431372549019605, "grad_norm": 0.6052231565253691, "learning_rate": 1.5140692800247218e-05, "loss": 0.1046, "loss_nan_ranks": 0, "loss_rank_avg": 0.09583979099988937, "step": 4430, "valid_targets_mean": 1846.4, "valid_targets_min": 648 }, { "epoch": 4.348039215686274, "grad_norm": 0.46120014193765946, "learning_rate": 1.5093283544592776e-05, "loss": 0.0908, "loss_nan_ranks": 0, "loss_rank_avg": 0.08437848836183548, "step": 4435, "valid_targets_mean": 2861.5, "valid_targets_min": 511 }, { "epoch": 4.352941176470588, "grad_norm": 0.4357769914711236, "learning_rate": 1.504590360793186e-05, "loss": 0.0875, "loss_nan_ranks": 0, "loss_rank_avg": 0.07600148022174835, "step": 4440, "valid_targets_mean": 2830.0, "valid_targets_min": 742 }, { "epoch": 4.357843137254902, "grad_norm": 0.7829148140428298, "learning_rate": 1.4998553273372732e-05, "loss": 0.0873, "loss_nan_ranks": 0, "loss_rank_avg": 0.10139364749193192, "step": 4445, "valid_targets_mean": 1361.4, "valid_targets_min": 720 }, { "epoch": 4.362745098039215, "grad_norm": 0.5434292008208409, "learning_rate": 1.4951232823846807e-05, "loss": 0.0965, "loss_nan_ranks": 0, "loss_rank_avg": 0.07670040428638458, "step": 4450, "valid_targets_mean": 2044.3, "valid_targets_min": 640 }, { "epoch": 4.367647058823529, "grad_norm": 0.45939612712149325, "learning_rate": 1.490394254210691e-05, "loss": 0.0988, "loss_nan_ranks": 0, "loss_rank_avg": 0.07639499008655548, "step": 4455, "valid_targets_mean": 2279.1, "valid_targets_min": 646 }, { "epoch": 4.372549019607844, "grad_norm": 0.5477638681309787, "learning_rate": 1.4856682710725605e-05, "loss": 0.0937, "loss_nan_ranks": 0, "loss_rank_avg": 0.09940779954195023, "step": 4460, "valid_targets_mean": 2314.7, "valid_targets_min": 812 }, { "epoch": 4.377450980392156, "grad_norm": 0.6193221420104923, "learning_rate": 1.4809453612093507e-05, "loss": 0.1, "loss_nan_ranks": 0, "loss_rank_avg": 0.12221089005470276, "step": 4465, "valid_targets_mean": 2122.3, "valid_targets_min": 680 }, { "epoch": 4.382352941176471, "grad_norm": 0.5363699703866529, "learning_rate": 1.4762255528417609e-05, "loss": 0.0823, "loss_nan_ranks": 0, "loss_rank_avg": 0.0714312195777893, "step": 4470, "valid_targets_mean": 2175.7, "valid_targets_min": 597 }, { "epoch": 4.387254901960785, "grad_norm": 0.3973947214228722, "learning_rate": 1.4715088741719555e-05, "loss": 0.0802, "loss_nan_ranks": 0, "loss_rank_avg": 0.06857871264219284, "step": 4475, "valid_targets_mean": 3006.4, "valid_targets_min": 739 }, { "epoch": 4.392156862745098, "grad_norm": 0.6548559347394757, "learning_rate": 1.4667953533833994e-05, "loss": 0.093, "loss_nan_ranks": 0, "loss_rank_avg": 0.10961537063121796, "step": 4480, "valid_targets_mean": 1610.0, "valid_targets_min": 572 }, { "epoch": 4.397058823529412, "grad_norm": 0.6143204977429464, "learning_rate": 1.46208501864069e-05, "loss": 0.094, "loss_nan_ranks": 0, "loss_rank_avg": 0.12123645842075348, "step": 4485, "valid_targets_mean": 2003.9, "valid_targets_min": 773 }, { "epoch": 4.401960784313726, "grad_norm": 0.5182077364235051, "learning_rate": 1.4573778980893842e-05, "loss": 0.0843, "loss_nan_ranks": 0, "loss_rank_avg": 0.08992286771535873, "step": 4490, "valid_targets_mean": 2517.8, "valid_targets_min": 669 }, { "epoch": 4.4068627450980395, "grad_norm": 0.48022364706715087, "learning_rate": 1.4526740198558345e-05, "loss": 0.095, "loss_nan_ranks": 0, "loss_rank_avg": 0.07461203634738922, "step": 4495, "valid_targets_mean": 2504.1, "valid_targets_min": 387 }, { "epoch": 4.411764705882353, "grad_norm": 0.6520442662505085, "learning_rate": 1.4479734120470202e-05, "loss": 0.0959, "loss_nan_ranks": 0, "loss_rank_avg": 0.089952252805233, "step": 4500, "valid_targets_mean": 2090.4, "valid_targets_min": 898 }, { "epoch": 4.416666666666667, "grad_norm": 0.6404826866372381, "learning_rate": 1.4432761027503788e-05, "loss": 0.0964, "loss_nan_ranks": 0, "loss_rank_avg": 0.10904596745967865, "step": 4505, "valid_targets_mean": 1745.3, "valid_targets_min": 350 }, { "epoch": 4.421568627450981, "grad_norm": 0.5056249456016008, "learning_rate": 1.4385821200336368e-05, "loss": 0.0866, "loss_nan_ranks": 0, "loss_rank_avg": 0.08835747838020325, "step": 4510, "valid_targets_mean": 2380.8, "valid_targets_min": 776 }, { "epoch": 4.426470588235294, "grad_norm": 0.6402655121728962, "learning_rate": 1.4338914919446452e-05, "loss": 0.0957, "loss_nan_ranks": 0, "loss_rank_avg": 0.11426950991153717, "step": 4515, "valid_targets_mean": 1765.1, "valid_targets_min": 673 }, { "epoch": 4.431372549019608, "grad_norm": 0.48332863889117145, "learning_rate": 1.42920424651121e-05, "loss": 0.0891, "loss_nan_ranks": 0, "loss_rank_avg": 0.07937314361333847, "step": 4520, "valid_targets_mean": 2311.2, "valid_targets_min": 539 }, { "epoch": 4.436274509803922, "grad_norm": 0.583535718159293, "learning_rate": 1.424520411740923e-05, "loss": 0.0922, "loss_nan_ranks": 0, "loss_rank_avg": 0.08863136917352676, "step": 4525, "valid_targets_mean": 2048.4, "valid_targets_min": 907 }, { "epoch": 4.4411764705882355, "grad_norm": 0.4337974903941218, "learning_rate": 1.419840015620999e-05, "loss": 0.0938, "loss_nan_ranks": 0, "loss_rank_avg": 0.09409506618976593, "step": 4530, "valid_targets_mean": 2672.8, "valid_targets_min": 694 }, { "epoch": 4.446078431372549, "grad_norm": 0.5747359814706138, "learning_rate": 1.415163086118105e-05, "loss": 0.1089, "loss_nan_ranks": 0, "loss_rank_avg": 0.09305723011493683, "step": 4535, "valid_targets_mean": 2288.3, "valid_targets_min": 589 }, { "epoch": 4.450980392156863, "grad_norm": 0.5368082314568046, "learning_rate": 1.4104896511781916e-05, "loss": 0.0956, "loss_nan_ranks": 0, "loss_rank_avg": 0.08980883657932281, "step": 4540, "valid_targets_mean": 2108.5, "valid_targets_min": 679 }, { "epoch": 4.455882352941177, "grad_norm": 0.4427323912880307, "learning_rate": 1.4058197387263327e-05, "loss": 0.0827, "loss_nan_ranks": 0, "loss_rank_avg": 0.07779604941606522, "step": 4545, "valid_targets_mean": 2846.7, "valid_targets_min": 865 }, { "epoch": 4.46078431372549, "grad_norm": 0.5754395884162968, "learning_rate": 1.4011533766665512e-05, "loss": 0.0932, "loss_nan_ranks": 0, "loss_rank_avg": 0.11345474421977997, "step": 4550, "valid_targets_mean": 2048.6, "valid_targets_min": 731 }, { "epoch": 4.465686274509804, "grad_norm": 0.7338185572895771, "learning_rate": 1.396490592881656e-05, "loss": 0.0909, "loss_nan_ranks": 0, "loss_rank_avg": 0.09632228314876556, "step": 4555, "valid_targets_mean": 1559.9, "valid_targets_min": 759 }, { "epoch": 4.470588235294118, "grad_norm": 0.6497231280991327, "learning_rate": 1.3918314152330758e-05, "loss": 0.0973, "loss_nan_ranks": 0, "loss_rank_avg": 0.09701061248779297, "step": 4560, "valid_targets_mean": 1984.2, "valid_targets_min": 858 }, { "epoch": 4.4754901960784315, "grad_norm": 0.4926967911541651, "learning_rate": 1.3871758715606905e-05, "loss": 0.0932, "loss_nan_ranks": 0, "loss_rank_avg": 0.0813327506184578, "step": 4565, "valid_targets_mean": 2670.1, "valid_targets_min": 762 }, { "epoch": 4.480392156862745, "grad_norm": 0.6155351420308762, "learning_rate": 1.3825239896826678e-05, "loss": 0.0938, "loss_nan_ranks": 0, "loss_rank_avg": 0.09319113940000534, "step": 4570, "valid_targets_mean": 1925.0, "valid_targets_min": 700 }, { "epoch": 4.485294117647059, "grad_norm": 0.5286966094801919, "learning_rate": 1.3778757973952916e-05, "loss": 0.0976, "loss_nan_ranks": 0, "loss_rank_avg": 0.10444878786802292, "step": 4575, "valid_targets_mean": 2229.3, "valid_targets_min": 616 }, { "epoch": 4.490196078431373, "grad_norm": 0.6034568137100172, "learning_rate": 1.3732313224728034e-05, "loss": 0.0967, "loss_nan_ranks": 0, "loss_rank_avg": 0.08842505514621735, "step": 4580, "valid_targets_mean": 2529.2, "valid_targets_min": 823 }, { "epoch": 4.495098039215686, "grad_norm": 0.49921650284434393, "learning_rate": 1.3685905926672307e-05, "loss": 0.0918, "loss_nan_ranks": 0, "loss_rank_avg": 0.09927654266357422, "step": 4585, "valid_targets_mean": 2443.6, "valid_targets_min": 780 }, { "epoch": 4.5, "grad_norm": 0.5430297012879352, "learning_rate": 1.3639536357082213e-05, "loss": 0.1082, "loss_nan_ranks": 0, "loss_rank_avg": 0.07649785280227661, "step": 4590, "valid_targets_mean": 2006.4, "valid_targets_min": 664 }, { "epoch": 4.504901960784314, "grad_norm": 0.5544828568038234, "learning_rate": 1.3593204793028827e-05, "loss": 0.0939, "loss_nan_ranks": 0, "loss_rank_avg": 0.10276834666728973, "step": 4595, "valid_targets_mean": 2263.1, "valid_targets_min": 799 }, { "epoch": 4.509803921568627, "grad_norm": 0.4257567508568936, "learning_rate": 1.3546911511356109e-05, "loss": 0.0873, "loss_nan_ranks": 0, "loss_rank_avg": 0.06598569452762604, "step": 4600, "valid_targets_mean": 2500.6, "valid_targets_min": 620 }, { "epoch": 4.514705882352941, "grad_norm": 0.5350814926710116, "learning_rate": 1.3500656788679259e-05, "loss": 0.0939, "loss_nan_ranks": 0, "loss_rank_avg": 0.08269689232110977, "step": 4605, "valid_targets_mean": 2247.2, "valid_targets_min": 774 }, { "epoch": 4.519607843137255, "grad_norm": 0.5071553325687435, "learning_rate": 1.3454440901383105e-05, "loss": 0.0993, "loss_nan_ranks": 0, "loss_rank_avg": 0.08212989568710327, "step": 4610, "valid_targets_mean": 2416.6, "valid_targets_min": 752 }, { "epoch": 4.5245098039215685, "grad_norm": 0.48521769183282765, "learning_rate": 1.3408264125620409e-05, "loss": 0.0962, "loss_nan_ranks": 0, "loss_rank_avg": 0.09017767012119293, "step": 4615, "valid_targets_mean": 2546.1, "valid_targets_min": 635 }, { "epoch": 4.529411764705882, "grad_norm": 0.5302744572378841, "learning_rate": 1.3362126737310218e-05, "loss": 0.0854, "loss_nan_ranks": 0, "loss_rank_avg": 0.07743710279464722, "step": 4620, "valid_targets_mean": 2307.6, "valid_targets_min": 614 }, { "epoch": 4.534313725490196, "grad_norm": 0.5819255012958557, "learning_rate": 1.3316029012136251e-05, "loss": 0.0945, "loss_nan_ranks": 0, "loss_rank_avg": 0.09885326027870178, "step": 4625, "valid_targets_mean": 2172.9, "valid_targets_min": 677 }, { "epoch": 4.53921568627451, "grad_norm": 0.49414618949329153, "learning_rate": 1.3269971225545222e-05, "loss": 0.0852, "loss_nan_ranks": 0, "loss_rank_avg": 0.09445025026798248, "step": 4630, "valid_targets_mean": 2684.0, "valid_targets_min": 762 }, { "epoch": 4.544117647058823, "grad_norm": 0.5097040673012775, "learning_rate": 1.322395365274518e-05, "loss": 0.0887, "loss_nan_ranks": 0, "loss_rank_avg": 0.09663759171962738, "step": 4635, "valid_targets_mean": 2331.1, "valid_targets_min": 807 }, { "epoch": 4.549019607843137, "grad_norm": 0.5251723752326636, "learning_rate": 1.317797656870392e-05, "loss": 0.0918, "loss_nan_ranks": 0, "loss_rank_avg": 0.08932511508464813, "step": 4640, "valid_targets_mean": 2332.5, "valid_targets_min": 652 }, { "epoch": 4.553921568627451, "grad_norm": 0.6185932099393986, "learning_rate": 1.3132040248147275e-05, "loss": 0.0883, "loss_nan_ranks": 0, "loss_rank_avg": 0.0976918414235115, "step": 4645, "valid_targets_mean": 2019.3, "valid_targets_min": 675 }, { "epoch": 4.5588235294117645, "grad_norm": 0.6806589296776067, "learning_rate": 1.3086144965557533e-05, "loss": 0.0959, "loss_nan_ranks": 0, "loss_rank_avg": 0.11448152363300323, "step": 4650, "valid_targets_mean": 1729.6, "valid_targets_min": 788 }, { "epoch": 4.563725490196078, "grad_norm": 0.5779608518902201, "learning_rate": 1.3040290995171741e-05, "loss": 0.0924, "loss_nan_ranks": 0, "loss_rank_avg": 0.07267005741596222, "step": 4655, "valid_targets_mean": 2079.3, "valid_targets_min": 788 }, { "epoch": 4.568627450980392, "grad_norm": 0.6828527890624431, "learning_rate": 1.2994478610980105e-05, "loss": 0.1063, "loss_nan_ranks": 0, "loss_rank_avg": 0.11123380064964294, "step": 4660, "valid_targets_mean": 1486.1, "valid_targets_min": 807 }, { "epoch": 4.573529411764706, "grad_norm": 0.5564317445708631, "learning_rate": 1.2948708086724358e-05, "loss": 0.0981, "loss_nan_ranks": 0, "loss_rank_avg": 0.09014254063367844, "step": 4665, "valid_targets_mean": 2018.9, "valid_targets_min": 459 }, { "epoch": 4.578431372549019, "grad_norm": 0.48228755801063306, "learning_rate": 1.2902979695896078e-05, "loss": 0.085, "loss_nan_ranks": 0, "loss_rank_avg": 0.07801198959350586, "step": 4670, "valid_targets_mean": 2877.0, "valid_targets_min": 567 }, { "epoch": 4.583333333333333, "grad_norm": 0.5410741347026093, "learning_rate": 1.2857293711735106e-05, "loss": 0.0936, "loss_nan_ranks": 0, "loss_rank_avg": 0.10315775126218796, "step": 4675, "valid_targets_mean": 2320.1, "valid_targets_min": 959 }, { "epoch": 4.588235294117647, "grad_norm": 0.6455727403969245, "learning_rate": 1.2811650407227896e-05, "loss": 0.1052, "loss_nan_ranks": 0, "loss_rank_avg": 0.10891681909561157, "step": 4680, "valid_targets_mean": 1875.6, "valid_targets_min": 761 }, { "epoch": 4.5931372549019605, "grad_norm": 0.6265275777081649, "learning_rate": 1.2766050055105845e-05, "loss": 0.0926, "loss_nan_ranks": 0, "loss_rank_avg": 0.0980343222618103, "step": 4685, "valid_targets_mean": 2058.0, "valid_targets_min": 661 }, { "epoch": 4.598039215686274, "grad_norm": 0.5365945342201405, "learning_rate": 1.2720492927843742e-05, "loss": 0.1006, "loss_nan_ranks": 0, "loss_rank_avg": 0.08697868138551712, "step": 4690, "valid_targets_mean": 2090.6, "valid_targets_min": 727 }, { "epoch": 4.602941176470588, "grad_norm": 0.3810046962990753, "learning_rate": 1.267497929765807e-05, "loss": 0.0982, "loss_nan_ranks": 0, "loss_rank_avg": 0.0712059885263443, "step": 4695, "valid_targets_mean": 3317.7, "valid_targets_min": 698 }, { "epoch": 4.607843137254902, "grad_norm": 0.5918911867571459, "learning_rate": 1.2629509436505396e-05, "loss": 0.0927, "loss_nan_ranks": 0, "loss_rank_avg": 0.0884181559085846, "step": 4700, "valid_targets_mean": 2422.4, "valid_targets_min": 566 }, { "epoch": 4.612745098039216, "grad_norm": 0.5213457877084579, "learning_rate": 1.2584083616080787e-05, "loss": 0.1024, "loss_nan_ranks": 0, "loss_rank_avg": 0.0884481742978096, "step": 4705, "valid_targets_mean": 2052.0, "valid_targets_min": 502 }, { "epoch": 4.617647058823529, "grad_norm": 0.567330475510558, "learning_rate": 1.2538702107816121e-05, "loss": 0.0936, "loss_nan_ranks": 0, "loss_rank_avg": 0.11953169852495193, "step": 4710, "valid_targets_mean": 2700.6, "valid_targets_min": 626 }, { "epoch": 4.622549019607844, "grad_norm": 0.6026523328666679, "learning_rate": 1.2493365182878527e-05, "loss": 0.0943, "loss_nan_ranks": 0, "loss_rank_avg": 0.09880198538303375, "step": 4715, "valid_targets_mean": 1875.8, "valid_targets_min": 602 }, { "epoch": 4.627450980392156, "grad_norm": 0.5441784314363494, "learning_rate": 1.2448073112168716e-05, "loss": 0.0868, "loss_nan_ranks": 0, "loss_rank_avg": 0.09551490843296051, "step": 4720, "valid_targets_mean": 2144.7, "valid_targets_min": 759 }, { "epoch": 4.632352941176471, "grad_norm": 0.5798838689286685, "learning_rate": 1.2402826166319382e-05, "loss": 0.0949, "loss_nan_ranks": 0, "loss_rank_avg": 0.1071678102016449, "step": 4725, "valid_targets_mean": 2335.9, "valid_targets_min": 859 }, { "epoch": 4.637254901960784, "grad_norm": 0.6052688653087752, "learning_rate": 1.2357624615693605e-05, "loss": 0.0942, "loss_nan_ranks": 0, "loss_rank_avg": 0.10750146210193634, "step": 4730, "valid_targets_mean": 2203.2, "valid_targets_min": 591 }, { "epoch": 4.642156862745098, "grad_norm": 0.5546544496485989, "learning_rate": 1.2312468730383195e-05, "loss": 0.0969, "loss_nan_ranks": 0, "loss_rank_avg": 0.10274793952703476, "step": 4735, "valid_targets_mean": 2163.4, "valid_targets_min": 523 }, { "epoch": 4.647058823529412, "grad_norm": 0.5533444220155, "learning_rate": 1.2267358780207105e-05, "loss": 0.1015, "loss_nan_ranks": 0, "loss_rank_avg": 0.1120515763759613, "step": 4740, "valid_targets_mean": 2334.5, "valid_targets_min": 785 }, { "epoch": 4.651960784313726, "grad_norm": 0.5676611492306864, "learning_rate": 1.2222295034709827e-05, "loss": 0.1005, "loss_nan_ranks": 0, "loss_rank_avg": 0.09991104900836945, "step": 4745, "valid_targets_mean": 2311.3, "valid_targets_min": 638 }, { "epoch": 4.6568627450980395, "grad_norm": 0.48304589572378387, "learning_rate": 1.2177277763159746e-05, "loss": 0.0897, "loss_nan_ranks": 0, "loss_rank_avg": 0.07975605130195618, "step": 4750, "valid_targets_mean": 2585.1, "valid_targets_min": 776 }, { "epoch": 4.661764705882353, "grad_norm": 0.4820375384596627, "learning_rate": 1.2132307234547565e-05, "loss": 0.1059, "loss_nan_ranks": 0, "loss_rank_avg": 0.12615613639354706, "step": 4755, "valid_targets_mean": 2636.7, "valid_targets_min": 592 }, { "epoch": 4.666666666666667, "grad_norm": 0.6077582225101309, "learning_rate": 1.2087383717584684e-05, "loss": 0.0981, "loss_nan_ranks": 0, "loss_rank_avg": 0.0969112291932106, "step": 4760, "valid_targets_mean": 2067.4, "valid_targets_min": 780 }, { "epoch": 4.671568627450981, "grad_norm": 0.5582574957902202, "learning_rate": 1.2042507480701587e-05, "loss": 0.0865, "loss_nan_ranks": 0, "loss_rank_avg": 0.07808205485343933, "step": 4765, "valid_targets_mean": 2271.1, "valid_targets_min": 783 }, { "epoch": 4.676470588235294, "grad_norm": 0.5228146595740085, "learning_rate": 1.1997678792046252e-05, "loss": 0.087, "loss_nan_ranks": 0, "loss_rank_avg": 0.10070804506540298, "step": 4770, "valid_targets_mean": 2396.7, "valid_targets_min": 768 }, { "epoch": 4.681372549019608, "grad_norm": 0.8866670649854181, "learning_rate": 1.1952897919482549e-05, "loss": 0.0996, "loss_nan_ranks": 0, "loss_rank_avg": 0.11867621541023254, "step": 4775, "valid_targets_mean": 1673.6, "valid_targets_min": 665 }, { "epoch": 4.686274509803922, "grad_norm": 0.7094125157085205, "learning_rate": 1.1908165130588633e-05, "loss": 0.1008, "loss_nan_ranks": 0, "loss_rank_avg": 0.1672782450914383, "step": 4780, "valid_targets_mean": 1552.0, "valid_targets_min": 548 }, { "epoch": 4.6911764705882355, "grad_norm": 0.5321239377206641, "learning_rate": 1.1863480692655326e-05, "loss": 0.1093, "loss_nan_ranks": 0, "loss_rank_avg": 0.09801702201366425, "step": 4785, "valid_targets_mean": 2317.7, "valid_targets_min": 1126 }, { "epoch": 4.696078431372549, "grad_norm": 0.5302224100951789, "learning_rate": 1.1818844872684566e-05, "loss": 0.0903, "loss_nan_ranks": 0, "loss_rank_avg": 0.0928771048784256, "step": 4790, "valid_targets_mean": 2279.2, "valid_targets_min": 690 }, { "epoch": 4.700980392156863, "grad_norm": 0.6024447446598006, "learning_rate": 1.1774257937387774e-05, "loss": 0.0798, "loss_nan_ranks": 0, "loss_rank_avg": 0.08303597569465637, "step": 4795, "valid_targets_mean": 2043.1, "valid_targets_min": 342 }, { "epoch": 4.705882352941177, "grad_norm": 0.5604418830899587, "learning_rate": 1.1729720153184264e-05, "loss": 0.0945, "loss_nan_ranks": 0, "loss_rank_avg": 0.10681148618459702, "step": 4800, "valid_targets_mean": 2133.1, "valid_targets_min": 753 }, { "epoch": 4.71078431372549, "grad_norm": 0.49573708522463433, "learning_rate": 1.1685231786199664e-05, "loss": 0.1036, "loss_nan_ranks": 0, "loss_rank_avg": 0.08099532872438431, "step": 4805, "valid_targets_mean": 2240.6, "valid_targets_min": 790 }, { "epoch": 4.715686274509804, "grad_norm": 0.5709774627312741, "learning_rate": 1.164079310226434e-05, "loss": 0.089, "loss_nan_ranks": 0, "loss_rank_avg": 0.10106971859931946, "step": 4810, "valid_targets_mean": 2072.1, "valid_targets_min": 726 }, { "epoch": 4.720588235294118, "grad_norm": 0.5301681363435597, "learning_rate": 1.1596404366911744e-05, "loss": 0.1003, "loss_nan_ranks": 0, "loss_rank_avg": 0.10889250785112381, "step": 4815, "valid_targets_mean": 2291.0, "valid_targets_min": 588 }, { "epoch": 4.7254901960784315, "grad_norm": 0.5065174062499794, "learning_rate": 1.1552065845376915e-05, "loss": 0.0987, "loss_nan_ranks": 0, "loss_rank_avg": 0.09046753495931625, "step": 4820, "valid_targets_mean": 2729.2, "valid_targets_min": 909 }, { "epoch": 4.730392156862745, "grad_norm": 0.46010715663863505, "learning_rate": 1.1507777802594831e-05, "loss": 0.0907, "loss_nan_ranks": 0, "loss_rank_avg": 0.0826692283153534, "step": 4825, "valid_targets_mean": 2386.8, "valid_targets_min": 570 }, { "epoch": 4.735294117647059, "grad_norm": 0.48984283135483603, "learning_rate": 1.146354050319884e-05, "loss": 0.085, "loss_nan_ranks": 0, "loss_rank_avg": 0.0765889436006546, "step": 4830, "valid_targets_mean": 2352.8, "valid_targets_min": 652 }, { "epoch": 4.740196078431373, "grad_norm": 0.6000883358087854, "learning_rate": 1.1419354211519104e-05, "loss": 0.0993, "loss_nan_ranks": 0, "loss_rank_avg": 0.09945641458034515, "step": 4835, "valid_targets_mean": 2212.0, "valid_targets_min": 632 }, { "epoch": 4.745098039215686, "grad_norm": 0.4978854046536584, "learning_rate": 1.1375219191580973e-05, "loss": 0.0881, "loss_nan_ranks": 0, "loss_rank_avg": 0.08206206560134888, "step": 4840, "valid_targets_mean": 2067.2, "valid_targets_min": 760 }, { "epoch": 4.75, "grad_norm": 0.5315947439144812, "learning_rate": 1.133113570710346e-05, "loss": 0.0984, "loss_nan_ranks": 0, "loss_rank_avg": 0.0920734703540802, "step": 4845, "valid_targets_mean": 1935.8, "valid_targets_min": 518 }, { "epoch": 4.754901960784314, "grad_norm": 0.4716458449566336, "learning_rate": 1.1287104021497617e-05, "loss": 0.1046, "loss_nan_ranks": 0, "loss_rank_avg": 0.08418993651866913, "step": 4850, "valid_targets_mean": 2616.8, "valid_targets_min": 731 }, { "epoch": 4.759803921568627, "grad_norm": 0.5301504010187645, "learning_rate": 1.1243124397864999e-05, "loss": 0.1052, "loss_nan_ranks": 0, "loss_rank_avg": 0.10015548765659332, "step": 4855, "valid_targets_mean": 2534.8, "valid_targets_min": 1040 }, { "epoch": 4.764705882352941, "grad_norm": 0.4463389854552508, "learning_rate": 1.1199197098996079e-05, "loss": 0.0907, "loss_nan_ranks": 0, "loss_rank_avg": 0.0668463408946991, "step": 4860, "valid_targets_mean": 2604.6, "valid_targets_min": 726 }, { "epoch": 4.769607843137255, "grad_norm": 0.5763709238343063, "learning_rate": 1.1155322387368663e-05, "loss": 0.0905, "loss_nan_ranks": 0, "loss_rank_avg": 0.08877779543399811, "step": 4865, "valid_targets_mean": 2057.5, "valid_targets_min": 609 }, { "epoch": 4.7745098039215685, "grad_norm": 0.4666198250671742, "learning_rate": 1.1111500525146326e-05, "loss": 0.0874, "loss_nan_ranks": 0, "loss_rank_avg": 0.07614760100841522, "step": 4870, "valid_targets_mean": 2428.4, "valid_targets_min": 903 }, { "epoch": 4.779411764705882, "grad_norm": 0.6826323097336842, "learning_rate": 1.1067731774176883e-05, "loss": 0.1004, "loss_nan_ranks": 0, "loss_rank_avg": 0.09942520409822464, "step": 4875, "valid_targets_mean": 1747.4, "valid_targets_min": 726 }, { "epoch": 4.784313725490196, "grad_norm": 0.7934705417827008, "learning_rate": 1.1024016395990758e-05, "loss": 0.1029, "loss_nan_ranks": 0, "loss_rank_avg": 0.10979147255420685, "step": 4880, "valid_targets_mean": 1707.7, "valid_targets_min": 755 }, { "epoch": 4.78921568627451, "grad_norm": 0.5251535439314821, "learning_rate": 1.0980354651799488e-05, "loss": 0.0866, "loss_nan_ranks": 0, "loss_rank_avg": 0.09340649098157883, "step": 4885, "valid_targets_mean": 2131.6, "valid_targets_min": 744 }, { "epoch": 4.794117647058823, "grad_norm": 0.5444234009344121, "learning_rate": 1.0936746802494124e-05, "loss": 0.0932, "loss_nan_ranks": 0, "loss_rank_avg": 0.10292315483093262, "step": 4890, "valid_targets_mean": 2253.0, "valid_targets_min": 514 }, { "epoch": 4.799019607843137, "grad_norm": 0.4878077628758911, "learning_rate": 1.0893193108643671e-05, "loss": 0.0889, "loss_nan_ranks": 0, "loss_rank_avg": 0.09365487098693848, "step": 4895, "valid_targets_mean": 2397.1, "valid_targets_min": 567 }, { "epoch": 4.803921568627451, "grad_norm": 0.5545755624860067, "learning_rate": 1.084969383049354e-05, "loss": 0.0907, "loss_nan_ranks": 0, "loss_rank_avg": 0.09213241934776306, "step": 4900, "valid_targets_mean": 2270.0, "valid_targets_min": 727 }, { "epoch": 4.8088235294117645, "grad_norm": 0.6017361382666815, "learning_rate": 1.0806249227964e-05, "loss": 0.1001, "loss_nan_ranks": 0, "loss_rank_avg": 0.09305038303136826, "step": 4905, "valid_targets_mean": 1651.3, "valid_targets_min": 720 }, { "epoch": 4.813725490196078, "grad_norm": 0.48831061998554787, "learning_rate": 1.0762859560648634e-05, "loss": 0.1014, "loss_nan_ranks": 0, "loss_rank_avg": 0.08866013586521149, "step": 4910, "valid_targets_mean": 2533.8, "valid_targets_min": 655 }, { "epoch": 4.818627450980392, "grad_norm": 0.5436658478885745, "learning_rate": 1.0719525087812737e-05, "loss": 0.1074, "loss_nan_ranks": 0, "loss_rank_avg": 0.10058622062206268, "step": 4915, "valid_targets_mean": 2305.4, "valid_targets_min": 765 }, { "epoch": 4.823529411764706, "grad_norm": 0.5264234660847347, "learning_rate": 1.0676246068391816e-05, "loss": 0.0919, "loss_nan_ranks": 0, "loss_rank_avg": 0.09133768826723099, "step": 4920, "valid_targets_mean": 2342.2, "valid_targets_min": 691 }, { "epoch": 4.828431372549019, "grad_norm": 0.5865401723602275, "learning_rate": 1.0633022760990046e-05, "loss": 0.1001, "loss_nan_ranks": 0, "loss_rank_avg": 0.0870981216430664, "step": 4925, "valid_targets_mean": 2040.4, "valid_targets_min": 523 }, { "epoch": 4.833333333333333, "grad_norm": 0.5066015819283176, "learning_rate": 1.0589855423878679e-05, "loss": 0.0936, "loss_nan_ranks": 0, "loss_rank_avg": 0.09252853691577911, "step": 4930, "valid_targets_mean": 2513.6, "valid_targets_min": 770 }, { "epoch": 4.838235294117647, "grad_norm": 0.5163264858489794, "learning_rate": 1.0546744314994549e-05, "loss": 0.087, "loss_nan_ranks": 0, "loss_rank_avg": 0.08159564435482025, "step": 4935, "valid_targets_mean": 1908.4, "valid_targets_min": 559 }, { "epoch": 4.8431372549019605, "grad_norm": 0.542313951486232, "learning_rate": 1.0503689691938512e-05, "loss": 0.0913, "loss_nan_ranks": 0, "loss_rank_avg": 0.1150393933057785, "step": 4940, "valid_targets_mean": 2331.6, "valid_targets_min": 750 }, { "epoch": 4.848039215686274, "grad_norm": 0.5435833906831937, "learning_rate": 1.046069181197389e-05, "loss": 0.1007, "loss_nan_ranks": 0, "loss_rank_avg": 0.09760939329862595, "step": 4945, "valid_targets_mean": 2145.4, "valid_targets_min": 773 }, { "epoch": 4.852941176470588, "grad_norm": 0.4369663282479705, "learning_rate": 1.041775093202495e-05, "loss": 0.0996, "loss_nan_ranks": 0, "loss_rank_avg": 0.08269096910953522, "step": 4950, "valid_targets_mean": 3061.4, "valid_targets_min": 765 }, { "epoch": 4.857843137254902, "grad_norm": 0.4758291844439797, "learning_rate": 1.0374867308675388e-05, "loss": 0.087, "loss_nan_ranks": 0, "loss_rank_avg": 0.09057286381721497, "step": 4955, "valid_targets_mean": 2415.4, "valid_targets_min": 791 }, { "epoch": 4.862745098039216, "grad_norm": 0.6272118961769553, "learning_rate": 1.0332041198166754e-05, "loss": 0.0778, "loss_nan_ranks": 0, "loss_rank_avg": 0.09164794534444809, "step": 4960, "valid_targets_mean": 1584.6, "valid_targets_min": 623 }, { "epoch": 4.867647058823529, "grad_norm": 0.5576322781572296, "learning_rate": 1.0289272856396954e-05, "loss": 0.1, "loss_nan_ranks": 0, "loss_rank_avg": 0.1521686166524887, "step": 4965, "valid_targets_mean": 2158.5, "valid_targets_min": 629 }, { "epoch": 4.872549019607844, "grad_norm": 0.49324132743081855, "learning_rate": 1.0246562538918721e-05, "loss": 0.087, "loss_nan_ranks": 0, "loss_rank_avg": 0.09149819612503052, "step": 4970, "valid_targets_mean": 2297.7, "valid_targets_min": 663 }, { "epoch": 4.877450980392156, "grad_norm": 0.5383819550781447, "learning_rate": 1.020391050093805e-05, "loss": 0.0908, "loss_nan_ranks": 0, "loss_rank_avg": 0.10303015261888504, "step": 4975, "valid_targets_mean": 2042.1, "valid_targets_min": 722 }, { "epoch": 4.882352941176471, "grad_norm": 0.527883183046873, "learning_rate": 1.0161316997312709e-05, "loss": 0.0859, "loss_nan_ranks": 0, "loss_rank_avg": 0.08816616982221603, "step": 4980, "valid_targets_mean": 2140.2, "valid_targets_min": 591 }, { "epoch": 4.887254901960784, "grad_norm": 0.4867613644619435, "learning_rate": 1.0118782282550716e-05, "loss": 0.0828, "loss_nan_ranks": 0, "loss_rank_avg": 0.10141561925411224, "step": 4985, "valid_targets_mean": 2612.1, "valid_targets_min": 783 }, { "epoch": 4.892156862745098, "grad_norm": 0.5079271131229582, "learning_rate": 1.0076306610808814e-05, "loss": 0.0915, "loss_nan_ranks": 0, "loss_rank_avg": 0.11670317500829697, "step": 4990, "valid_targets_mean": 2409.9, "valid_targets_min": 671 }, { "epoch": 4.897058823529412, "grad_norm": 0.40829801958468664, "learning_rate": 1.0033890235890927e-05, "loss": 0.0921, "loss_nan_ranks": 0, "loss_rank_avg": 0.08440542221069336, "step": 4995, "valid_targets_mean": 3008.8, "valid_targets_min": 602 }, { "epoch": 4.901960784313726, "grad_norm": 0.5894884163587373, "learning_rate": 9.99153341124668e-06, "loss": 0.0934, "loss_nan_ranks": 0, "loss_rank_avg": 0.11752729117870331, "step": 5000, "valid_targets_mean": 1987.6, "valid_targets_min": 759 }, { "epoch": 4.9068627450980395, "grad_norm": 0.6283199481005249, "learning_rate": 9.949236389969867e-06, "loss": 0.1045, "loss_nan_ranks": 0, "loss_rank_avg": 0.09560035169124603, "step": 5005, "valid_targets_mean": 1691.4, "valid_targets_min": 754 }, { "epoch": 4.911764705882353, "grad_norm": 0.7708788939045854, "learning_rate": 9.906999424796924e-06, "loss": 0.0993, "loss_nan_ranks": 0, "loss_rank_avg": 0.12335900217294693, "step": 5010, "valid_targets_mean": 1527.1, "valid_targets_min": 637 }, { "epoch": 4.916666666666667, "grad_norm": 0.5051261469161019, "learning_rate": 9.864822768105456e-06, "loss": 0.0995, "loss_nan_ranks": 0, "loss_rank_avg": 0.09845969825983047, "step": 5015, "valid_targets_mean": 2510.3, "valid_targets_min": 650 }, { "epoch": 4.921568627450981, "grad_norm": 0.6859191386588651, "learning_rate": 9.822706671912705e-06, "loss": 0.0933, "loss_nan_ranks": 0, "loss_rank_avg": 0.11246706545352936, "step": 5020, "valid_targets_mean": 1509.5, "valid_targets_min": 608 }, { "epoch": 4.926470588235294, "grad_norm": 0.6250735945680871, "learning_rate": 9.780651387874039e-06, "loss": 0.0953, "loss_nan_ranks": 0, "loss_rank_avg": 0.09886276721954346, "step": 5025, "valid_targets_mean": 1722.8, "valid_targets_min": 569 }, { "epoch": 4.931372549019608, "grad_norm": 0.6608007328070579, "learning_rate": 9.738657167281451e-06, "loss": 0.1108, "loss_nan_ranks": 0, "loss_rank_avg": 0.10095824301242828, "step": 5030, "valid_targets_mean": 1996.3, "valid_targets_min": 592 }, { "epoch": 4.936274509803922, "grad_norm": 0.5050703755720812, "learning_rate": 9.696724261062079e-06, "loss": 0.0893, "loss_nan_ranks": 0, "loss_rank_avg": 0.09285195171833038, "step": 5035, "valid_targets_mean": 2361.6, "valid_targets_min": 683 }, { "epoch": 4.9411764705882355, "grad_norm": 0.5243779388155254, "learning_rate": 9.654852919776689e-06, "loss": 0.0897, "loss_nan_ranks": 0, "loss_rank_avg": 0.07373321056365967, "step": 5040, "valid_targets_mean": 2309.0, "valid_targets_min": 606 }, { "epoch": 4.946078431372549, "grad_norm": 0.5484866741806738, "learning_rate": 9.613043393618162e-06, "loss": 0.0941, "loss_nan_ranks": 0, "loss_rank_avg": 0.08428633958101273, "step": 5045, "valid_targets_mean": 2396.1, "valid_targets_min": 820 }, { "epoch": 4.950980392156863, "grad_norm": 0.4760131574819217, "learning_rate": 9.57129593241004e-06, "loss": 0.0968, "loss_nan_ranks": 0, "loss_rank_avg": 0.09283538162708282, "step": 5050, "valid_targets_mean": 2947.1, "valid_targets_min": 1134 }, { "epoch": 4.955882352941177, "grad_norm": 0.7049917083821713, "learning_rate": 9.529610785604995e-06, "loss": 0.0949, "loss_nan_ranks": 0, "loss_rank_avg": 0.10550940036773682, "step": 5055, "valid_targets_mean": 1514.4, "valid_targets_min": 672 }, { "epoch": 4.96078431372549, "grad_norm": 0.48941292868914, "learning_rate": 9.487988202283345e-06, "loss": 0.0902, "loss_nan_ranks": 0, "loss_rank_avg": 0.0809384286403656, "step": 5060, "valid_targets_mean": 2195.8, "valid_targets_min": 512 }, { "epoch": 4.965686274509804, "grad_norm": 0.5931382077234513, "learning_rate": 9.446428431151591e-06, "loss": 0.087, "loss_nan_ranks": 0, "loss_rank_avg": 0.08493739366531372, "step": 5065, "valid_targets_mean": 2018.6, "valid_targets_min": 457 }, { "epoch": 4.970588235294118, "grad_norm": 0.5893891050217172, "learning_rate": 9.404931720540918e-06, "loss": 0.0924, "loss_nan_ranks": 0, "loss_rank_avg": 0.11142192035913467, "step": 5070, "valid_targets_mean": 2016.1, "valid_targets_min": 459 }, { "epoch": 4.9754901960784315, "grad_norm": 0.6663388117976916, "learning_rate": 9.363498318405679e-06, "loss": 0.0921, "loss_nan_ranks": 0, "loss_rank_avg": 0.10338947176933289, "step": 5075, "valid_targets_mean": 1906.9, "valid_targets_min": 762 }, { "epoch": 4.980392156862745, "grad_norm": 0.5702917919323601, "learning_rate": 9.322128472321973e-06, "loss": 0.093, "loss_nan_ranks": 0, "loss_rank_avg": 0.09254737198352814, "step": 5080, "valid_targets_mean": 2369.6, "valid_targets_min": 718 }, { "epoch": 4.985294117647059, "grad_norm": 0.6006989977907731, "learning_rate": 9.280822429486117e-06, "loss": 0.0863, "loss_nan_ranks": 0, "loss_rank_avg": 0.10931229591369629, "step": 5085, "valid_targets_mean": 1962.5, "valid_targets_min": 713 }, { "epoch": 4.990196078431373, "grad_norm": 0.6041195773866957, "learning_rate": 9.239580436713178e-06, "loss": 0.1032, "loss_nan_ranks": 0, "loss_rank_avg": 0.09572377055883408, "step": 5090, "valid_targets_mean": 2157.7, "valid_targets_min": 507 }, { "epoch": 4.995098039215686, "grad_norm": 0.6617547843586967, "learning_rate": 9.198402740435527e-06, "loss": 0.0981, "loss_nan_ranks": 0, "loss_rank_avg": 0.132956400513649, "step": 5095, "valid_targets_mean": 2033.6, "valid_targets_min": 681 }, { "epoch": 5.0, "grad_norm": 0.47759667778213716, "learning_rate": 9.157289586701328e-06, "loss": 0.0901, "loss_nan_ranks": 0, "loss_rank_avg": 0.08661957085132599, "step": 5100, "valid_targets_mean": 2665.0, "valid_targets_min": 837 }, { "epoch": 5.004901960784314, "grad_norm": 0.4604848433671045, "learning_rate": 9.116241221173103e-06, "loss": 0.0867, "loss_nan_ranks": 0, "loss_rank_avg": 0.07293270528316498, "step": 5105, "valid_targets_mean": 2602.8, "valid_targets_min": 818 }, { "epoch": 5.009803921568627, "grad_norm": 0.5911007179196364, "learning_rate": 9.075257889126234e-06, "loss": 0.0851, "loss_nan_ranks": 0, "loss_rank_avg": 0.08851397782564163, "step": 5110, "valid_targets_mean": 2199.7, "valid_targets_min": 652 }, { "epoch": 5.014705882352941, "grad_norm": 0.5015517934829464, "learning_rate": 9.0343398354475e-06, "loss": 0.0741, "loss_nan_ranks": 0, "loss_rank_avg": 0.0782584622502327, "step": 5115, "valid_targets_mean": 2538.9, "valid_targets_min": 704 }, { "epoch": 5.019607843137255, "grad_norm": 0.5541843585633855, "learning_rate": 8.993487304633648e-06, "loss": 0.0819, "loss_nan_ranks": 0, "loss_rank_avg": 0.07696060091257095, "step": 5120, "valid_targets_mean": 2012.0, "valid_targets_min": 635 }, { "epoch": 5.0245098039215685, "grad_norm": 0.5085417438896622, "learning_rate": 8.952700540789884e-06, "loss": 0.0894, "loss_nan_ranks": 0, "loss_rank_avg": 0.07348785549402237, "step": 5125, "valid_targets_mean": 2494.4, "valid_targets_min": 940 }, { "epoch": 5.029411764705882, "grad_norm": 0.5189146300290645, "learning_rate": 8.911979787628456e-06, "loss": 0.0736, "loss_nan_ranks": 0, "loss_rank_avg": 0.07135240733623505, "step": 5130, "valid_targets_mean": 2331.8, "valid_targets_min": 785 }, { "epoch": 5.034313725490196, "grad_norm": 0.6293919997645581, "learning_rate": 8.871325288467188e-06, "loss": 0.0986, "loss_nan_ranks": 0, "loss_rank_avg": 0.10753931850194931, "step": 5135, "valid_targets_mean": 2485.3, "valid_targets_min": 703 }, { "epoch": 5.03921568627451, "grad_norm": 0.5845395385864605, "learning_rate": 8.830737286227972e-06, "loss": 0.0819, "loss_nan_ranks": 0, "loss_rank_avg": 0.09616108238697052, "step": 5140, "valid_targets_mean": 2392.1, "valid_targets_min": 799 }, { "epoch": 5.044117647058823, "grad_norm": 0.5407442298797527, "learning_rate": 8.790216023435411e-06, "loss": 0.0937, "loss_nan_ranks": 0, "loss_rank_avg": 0.08268275856971741, "step": 5145, "valid_targets_mean": 2277.2, "valid_targets_min": 619 }, { "epoch": 5.049019607843137, "grad_norm": 0.5343504627780364, "learning_rate": 8.74976174221531e-06, "loss": 0.0755, "loss_nan_ranks": 0, "loss_rank_avg": 0.07687253504991531, "step": 5150, "valid_targets_mean": 2395.2, "valid_targets_min": 731 }, { "epoch": 5.053921568627451, "grad_norm": 0.503203022422961, "learning_rate": 8.709374684293221e-06, "loss": 0.0795, "loss_nan_ranks": 0, "loss_rank_avg": 0.07528114318847656, "step": 5155, "valid_targets_mean": 2509.9, "valid_targets_min": 424 }, { "epoch": 5.0588235294117645, "grad_norm": 0.4820740870162874, "learning_rate": 8.669055090993041e-06, "loss": 0.0726, "loss_nan_ranks": 0, "loss_rank_avg": 0.06485399603843689, "step": 5160, "valid_targets_mean": 2117.0, "valid_targets_min": 704 }, { "epoch": 5.063725490196078, "grad_norm": 0.6534311563959244, "learning_rate": 8.628803203235536e-06, "loss": 0.0957, "loss_nan_ranks": 0, "loss_rank_avg": 0.11405531316995621, "step": 5165, "valid_targets_mean": 2078.2, "valid_targets_min": 687 }, { "epoch": 5.068627450980392, "grad_norm": 0.5159605033551381, "learning_rate": 8.588619261536904e-06, "loss": 0.0823, "loss_nan_ranks": 0, "loss_rank_avg": 0.07087569683790207, "step": 5170, "valid_targets_mean": 2643.9, "valid_targets_min": 700 }, { "epoch": 5.073529411764706, "grad_norm": 0.6120277300768532, "learning_rate": 8.548503506007363e-06, "loss": 0.0877, "loss_nan_ranks": 0, "loss_rank_avg": 0.08435557782649994, "step": 5175, "valid_targets_mean": 1904.4, "valid_targets_min": 203 }, { "epoch": 5.078431372549019, "grad_norm": 0.5750915500710682, "learning_rate": 8.508456176349698e-06, "loss": 0.0868, "loss_nan_ranks": 0, "loss_rank_avg": 0.07057558000087738, "step": 5180, "valid_targets_mean": 2130.0, "valid_targets_min": 902 }, { "epoch": 5.083333333333333, "grad_norm": 0.5929571350769494, "learning_rate": 8.468477511857826e-06, "loss": 0.0792, "loss_nan_ranks": 0, "loss_rank_avg": 0.08237534761428833, "step": 5185, "valid_targets_mean": 2016.9, "valid_targets_min": 712 }, { "epoch": 5.088235294117647, "grad_norm": 0.49073426404229986, "learning_rate": 8.42856775141537e-06, "loss": 0.0818, "loss_nan_ranks": 0, "loss_rank_avg": 0.07128225266933441, "step": 5190, "valid_targets_mean": 2563.1, "valid_targets_min": 700 }, { "epoch": 5.0931372549019605, "grad_norm": 0.5348493318460731, "learning_rate": 8.388727133494219e-06, "loss": 0.0783, "loss_nan_ranks": 0, "loss_rank_avg": 0.06887640058994293, "step": 5195, "valid_targets_mean": 2482.9, "valid_targets_min": 623 }, { "epoch": 5.098039215686274, "grad_norm": 0.5146171818297789, "learning_rate": 8.348955896153146e-06, "loss": 0.0807, "loss_nan_ranks": 0, "loss_rank_avg": 0.07764531672000885, "step": 5200, "valid_targets_mean": 2469.7, "valid_targets_min": 771 }, { "epoch": 5.102941176470588, "grad_norm": 0.5561557225636563, "learning_rate": 8.30925427703633e-06, "loss": 0.0919, "loss_nan_ranks": 0, "loss_rank_avg": 0.11974679678678513, "step": 5205, "valid_targets_mean": 2453.7, "valid_targets_min": 722 }, { "epoch": 5.107843137254902, "grad_norm": 0.6539916720138971, "learning_rate": 8.269622513371971e-06, "loss": 0.0768, "loss_nan_ranks": 0, "loss_rank_avg": 0.09084124863147736, "step": 5210, "valid_targets_mean": 1766.9, "valid_targets_min": 342 }, { "epoch": 5.112745098039215, "grad_norm": 0.5429121808535396, "learning_rate": 8.230060841970875e-06, "loss": 0.0754, "loss_nan_ranks": 0, "loss_rank_avg": 0.07802797853946686, "step": 5215, "valid_targets_mean": 2213.3, "valid_targets_min": 612 }, { "epoch": 5.117647058823529, "grad_norm": 0.5083279394937158, "learning_rate": 8.190569499225008e-06, "loss": 0.0814, "loss_nan_ranks": 0, "loss_rank_avg": 0.06983786821365356, "step": 5220, "valid_targets_mean": 2548.4, "valid_targets_min": 837 }, { "epoch": 5.122549019607843, "grad_norm": 0.5465649932109973, "learning_rate": 8.1511487211061e-06, "loss": 0.0892, "loss_nan_ranks": 0, "loss_rank_avg": 0.07368411868810654, "step": 5225, "valid_targets_mean": 2058.0, "valid_targets_min": 539 }, { "epoch": 5.127450980392156, "grad_norm": 0.558225572156942, "learning_rate": 8.111798743164267e-06, "loss": 0.0911, "loss_nan_ranks": 0, "loss_rank_avg": 0.08299843966960907, "step": 5230, "valid_targets_mean": 1902.3, "valid_targets_min": 589 }, { "epoch": 5.132352941176471, "grad_norm": 0.5136237271349839, "learning_rate": 8.072519800526542e-06, "loss": 0.0763, "loss_nan_ranks": 0, "loss_rank_avg": 0.07817132771015167, "step": 5235, "valid_targets_mean": 2501.4, "valid_targets_min": 643 }, { "epoch": 5.137254901960785, "grad_norm": 0.498321689726259, "learning_rate": 8.033312127895518e-06, "loss": 0.0759, "loss_nan_ranks": 0, "loss_rank_avg": 0.09710898995399475, "step": 5240, "valid_targets_mean": 2590.6, "valid_targets_min": 543 }, { "epoch": 5.142156862745098, "grad_norm": 0.7408036748383444, "learning_rate": 7.994175959547939e-06, "loss": 0.0836, "loss_nan_ranks": 0, "loss_rank_avg": 0.11459003388881683, "step": 5245, "valid_targets_mean": 1611.8, "valid_targets_min": 602 }, { "epoch": 5.147058823529412, "grad_norm": 0.4975297290259382, "learning_rate": 7.95511152933327e-06, "loss": 0.0802, "loss_nan_ranks": 0, "loss_rank_avg": 0.06459469348192215, "step": 5250, "valid_targets_mean": 2624.0, "valid_targets_min": 687 }, { "epoch": 5.151960784313726, "grad_norm": 0.7561461760461909, "learning_rate": 7.916119070672325e-06, "loss": 0.0861, "loss_nan_ranks": 0, "loss_rank_avg": 0.0870676040649414, "step": 5255, "valid_targets_mean": 1697.4, "valid_targets_min": 761 }, { "epoch": 5.1568627450980395, "grad_norm": 0.5210675746878989, "learning_rate": 7.87719881655588e-06, "loss": 0.0844, "loss_nan_ranks": 0, "loss_rank_avg": 0.06843873858451843, "step": 5260, "valid_targets_mean": 2269.1, "valid_targets_min": 659 }, { "epoch": 5.161764705882353, "grad_norm": 0.5338645649878168, "learning_rate": 7.83835099954327e-06, "loss": 0.0981, "loss_nan_ranks": 0, "loss_rank_avg": 0.0681375116109848, "step": 5265, "valid_targets_mean": 2572.6, "valid_targets_min": 790 }, { "epoch": 5.166666666666667, "grad_norm": 0.651416544867339, "learning_rate": 7.799575851760982e-06, "loss": 0.0864, "loss_nan_ranks": 0, "loss_rank_avg": 0.08005984127521515, "step": 5270, "valid_targets_mean": 2171.5, "valid_targets_min": 605 }, { "epoch": 5.171568627450981, "grad_norm": 0.6330539334076882, "learning_rate": 7.76087360490129e-06, "loss": 0.0861, "loss_nan_ranks": 0, "loss_rank_avg": 0.09047305583953857, "step": 5275, "valid_targets_mean": 1923.2, "valid_targets_min": 548 }, { "epoch": 5.176470588235294, "grad_norm": 0.44154350607425974, "learning_rate": 7.722244490220873e-06, "loss": 0.0681, "loss_nan_ranks": 0, "loss_rank_avg": 0.06011586636304855, "step": 5280, "valid_targets_mean": 3123.1, "valid_targets_min": 788 }, { "epoch": 5.181372549019608, "grad_norm": 0.5534899671335772, "learning_rate": 7.683688738539414e-06, "loss": 0.0845, "loss_nan_ranks": 0, "loss_rank_avg": 0.0851341038942337, "step": 5285, "valid_targets_mean": 2315.2, "valid_targets_min": 841 }, { "epoch": 5.186274509803922, "grad_norm": 0.568120445090173, "learning_rate": 7.64520658023824e-06, "loss": 0.0915, "loss_nan_ranks": 0, "loss_rank_avg": 0.0778503492474556, "step": 5290, "valid_targets_mean": 2170.7, "valid_targets_min": 678 }, { "epoch": 5.1911764705882355, "grad_norm": 0.4820906324235686, "learning_rate": 7.606798245258941e-06, "loss": 0.0949, "loss_nan_ranks": 0, "loss_rank_avg": 0.11274714022874832, "step": 5295, "valid_targets_mean": 2448.4, "valid_targets_min": 697 }, { "epoch": 5.196078431372549, "grad_norm": 0.5565416986397015, "learning_rate": 7.568463963101982e-06, "loss": 0.0858, "loss_nan_ranks": 0, "loss_rank_avg": 0.07629026472568512, "step": 5300, "valid_targets_mean": 2519.6, "valid_targets_min": 564 }, { "epoch": 5.200980392156863, "grad_norm": 0.5875632797684447, "learning_rate": 7.530203962825331e-06, "loss": 0.0767, "loss_nan_ranks": 0, "loss_rank_avg": 0.07195107638835907, "step": 5305, "valid_targets_mean": 2161.2, "valid_targets_min": 567 }, { "epoch": 5.205882352941177, "grad_norm": 0.5878351907497511, "learning_rate": 7.4920184730431275e-06, "loss": 0.0776, "loss_nan_ranks": 0, "loss_rank_avg": 0.06824355572462082, "step": 5310, "valid_targets_mean": 2125.2, "valid_targets_min": 792 }, { "epoch": 5.21078431372549, "grad_norm": 0.6921615760995266, "learning_rate": 7.453907721924285e-06, "loss": 0.0773, "loss_nan_ranks": 0, "loss_rank_avg": 0.08252941071987152, "step": 5315, "valid_targets_mean": 1936.6, "valid_targets_min": 538 }, { "epoch": 5.215686274509804, "grad_norm": 0.6435003909309579, "learning_rate": 7.415871937191111e-06, "loss": 0.0737, "loss_nan_ranks": 0, "loss_rank_avg": 0.07561911642551422, "step": 5320, "valid_targets_mean": 2016.7, "valid_targets_min": 635 }, { "epoch": 5.220588235294118, "grad_norm": 0.5023546345333582, "learning_rate": 7.377911346117992e-06, "loss": 0.0799, "loss_nan_ranks": 0, "loss_rank_avg": 0.06859388202428818, "step": 5325, "valid_targets_mean": 2208.1, "valid_targets_min": 816 }, { "epoch": 5.2254901960784315, "grad_norm": 0.6998975765045649, "learning_rate": 7.340026175530002e-06, "loss": 0.0997, "loss_nan_ranks": 0, "loss_rank_avg": 0.1062772274017334, "step": 5330, "valid_targets_mean": 1918.6, "valid_targets_min": 761 }, { "epoch": 5.230392156862745, "grad_norm": 0.62750845180046, "learning_rate": 7.302216651801546e-06, "loss": 0.0872, "loss_nan_ranks": 0, "loss_rank_avg": 0.07626760005950928, "step": 5335, "valid_targets_mean": 1799.3, "valid_targets_min": 718 }, { "epoch": 5.235294117647059, "grad_norm": 0.5543171693917915, "learning_rate": 7.264483000855036e-06, "loss": 0.0839, "loss_nan_ranks": 0, "loss_rank_avg": 0.07348915934562683, "step": 5340, "valid_targets_mean": 2069.6, "valid_targets_min": 754 }, { "epoch": 5.240196078431373, "grad_norm": 0.7983146319280329, "learning_rate": 7.226825448159524e-06, "loss": 0.0791, "loss_nan_ranks": 0, "loss_rank_avg": 0.08151835203170776, "step": 5345, "valid_targets_mean": 1926.6, "valid_targets_min": 783 }, { "epoch": 5.245098039215686, "grad_norm": 0.5799482989527313, "learning_rate": 7.1892442187293324e-06, "loss": 0.0869, "loss_nan_ranks": 0, "loss_rank_avg": 0.12980447709560394, "step": 5350, "valid_targets_mean": 2295.6, "valid_targets_min": 750 }, { "epoch": 5.25, "grad_norm": 0.4881711367941992, "learning_rate": 7.151739537122755e-06, "loss": 0.083, "loss_nan_ranks": 0, "loss_rank_avg": 0.06775844097137451, "step": 5355, "valid_targets_mean": 2253.4, "valid_targets_min": 621 }, { "epoch": 5.254901960784314, "grad_norm": 0.5353490999682617, "learning_rate": 7.114311627440675e-06, "loss": 0.071, "loss_nan_ranks": 0, "loss_rank_avg": 0.0793384313583374, "step": 5360, "valid_targets_mean": 2420.6, "valid_targets_min": 697 }, { "epoch": 5.259803921568627, "grad_norm": 0.538659559297651, "learning_rate": 7.076960713325242e-06, "loss": 0.0783, "loss_nan_ranks": 0, "loss_rank_avg": 0.0664932131767273, "step": 5365, "valid_targets_mean": 2518.3, "valid_targets_min": 591 }, { "epoch": 5.264705882352941, "grad_norm": 0.6568125968077196, "learning_rate": 7.039687017958545e-06, "loss": 0.0854, "loss_nan_ranks": 0, "loss_rank_avg": 0.0847780704498291, "step": 5370, "valid_targets_mean": 1899.9, "valid_targets_min": 706 }, { "epoch": 5.269607843137255, "grad_norm": 0.6122298995911225, "learning_rate": 7.002490764061274e-06, "loss": 0.0914, "loss_nan_ranks": 0, "loss_rank_avg": 0.09091790020465851, "step": 5375, "valid_targets_mean": 1925.0, "valid_targets_min": 609 }, { "epoch": 5.2745098039215685, "grad_norm": 0.922364301866522, "learning_rate": 6.965372173891369e-06, "loss": 0.0744, "loss_nan_ranks": 0, "loss_rank_avg": 0.07770726084709167, "step": 5380, "valid_targets_mean": 1841.9, "valid_targets_min": 543 }, { "epoch": 5.279411764705882, "grad_norm": 0.5027301818761994, "learning_rate": 6.928331469242709e-06, "loss": 0.074, "loss_nan_ranks": 0, "loss_rank_avg": 0.07609498500823975, "step": 5385, "valid_targets_mean": 2420.9, "valid_targets_min": 797 }, { "epoch": 5.284313725490196, "grad_norm": 0.5073890103240528, "learning_rate": 6.891368871443795e-06, "loss": 0.0756, "loss_nan_ranks": 0, "loss_rank_avg": 0.0688600093126297, "step": 5390, "valid_targets_mean": 2477.0, "valid_targets_min": 740 }, { "epoch": 5.28921568627451, "grad_norm": 0.5298744083568486, "learning_rate": 6.854484601356426e-06, "loss": 0.0845, "loss_nan_ranks": 0, "loss_rank_avg": 0.07411527633666992, "step": 5395, "valid_targets_mean": 2140.9, "valid_targets_min": 363 }, { "epoch": 5.294117647058823, "grad_norm": 0.5242195295040767, "learning_rate": 6.817678879374341e-06, "loss": 0.0687, "loss_nan_ranks": 0, "loss_rank_avg": 0.06534264236688614, "step": 5400, "valid_targets_mean": 2309.1, "valid_targets_min": 656 }, { "epoch": 5.299019607843137, "grad_norm": 0.4536802947760404, "learning_rate": 6.7809519254219655e-06, "loss": 0.0815, "loss_nan_ranks": 0, "loss_rank_avg": 0.06536039710044861, "step": 5405, "valid_targets_mean": 2977.7, "valid_targets_min": 816 }, { "epoch": 5.303921568627451, "grad_norm": 0.5065375359596163, "learning_rate": 6.744303958953043e-06, "loss": 0.0842, "loss_nan_ranks": 0, "loss_rank_avg": 0.07473203539848328, "step": 5410, "valid_targets_mean": 2966.2, "valid_targets_min": 1232 }, { "epoch": 5.3088235294117645, "grad_norm": 0.5342380006283294, "learning_rate": 6.707735198949344e-06, "loss": 0.0744, "loss_nan_ranks": 0, "loss_rank_avg": 0.07432928681373596, "step": 5415, "valid_targets_mean": 2556.4, "valid_targets_min": 594 }, { "epoch": 5.313725490196078, "grad_norm": 0.6116252161599829, "learning_rate": 6.671245863919374e-06, "loss": 0.0862, "loss_nan_ranks": 0, "loss_rank_avg": 0.09420572221279144, "step": 5420, "valid_targets_mean": 1872.7, "valid_targets_min": 663 }, { "epoch": 5.318627450980392, "grad_norm": 0.38722492088167965, "learning_rate": 6.634836171897048e-06, "loss": 0.0739, "loss_nan_ranks": 0, "loss_rank_avg": 0.06971578299999237, "step": 5425, "valid_targets_mean": 3064.0, "valid_targets_min": 549 }, { "epoch": 5.323529411764706, "grad_norm": 0.48575352597613497, "learning_rate": 6.598506340440373e-06, "loss": 0.081, "loss_nan_ranks": 0, "loss_rank_avg": 0.07496002316474915, "step": 5430, "valid_targets_mean": 2613.2, "valid_targets_min": 771 }, { "epoch": 5.328431372549019, "grad_norm": 0.5766518334984045, "learning_rate": 6.562256586630198e-06, "loss": 0.0797, "loss_nan_ranks": 0, "loss_rank_avg": 0.07142172753810883, "step": 5435, "valid_targets_mean": 2121.6, "valid_targets_min": 812 }, { "epoch": 5.333333333333333, "grad_norm": 0.5616562487814789, "learning_rate": 6.526087127068857e-06, "loss": 0.0811, "loss_nan_ranks": 0, "loss_rank_avg": 0.07984551787376404, "step": 5440, "valid_targets_mean": 2259.9, "valid_targets_min": 757 }, { "epoch": 5.338235294117647, "grad_norm": 0.5297286772555554, "learning_rate": 6.489998177878925e-06, "loss": 0.0907, "loss_nan_ranks": 0, "loss_rank_avg": 0.07350513339042664, "step": 5445, "valid_targets_mean": 2587.9, "valid_targets_min": 765 }, { "epoch": 5.3431372549019605, "grad_norm": 0.4643067993227384, "learning_rate": 6.453989954701882e-06, "loss": 0.0892, "loss_nan_ranks": 0, "loss_rank_avg": 0.0627140998840332, "step": 5450, "valid_targets_mean": 2341.8, "valid_targets_min": 665 }, { "epoch": 5.348039215686274, "grad_norm": 0.7694605309291938, "learning_rate": 6.418062672696877e-06, "loss": 0.0958, "loss_nan_ranks": 0, "loss_rank_avg": 0.10127004981040955, "step": 5455, "valid_targets_mean": 1646.6, "valid_targets_min": 530 }, { "epoch": 5.352941176470588, "grad_norm": 0.6921060023364909, "learning_rate": 6.382216546539395e-06, "loss": 0.0877, "loss_nan_ranks": 0, "loss_rank_avg": 0.08449102193117142, "step": 5460, "valid_targets_mean": 2167.2, "valid_targets_min": 485 }, { "epoch": 5.357843137254902, "grad_norm": 0.6955216056484889, "learning_rate": 6.346451790419992e-06, "loss": 0.08, "loss_nan_ranks": 0, "loss_rank_avg": 0.07503059506416321, "step": 5465, "valid_targets_mean": 1879.7, "valid_targets_min": 698 }, { "epoch": 5.362745098039215, "grad_norm": 0.42726578395620934, "learning_rate": 6.310768618043011e-06, "loss": 0.0667, "loss_nan_ranks": 0, "loss_rank_avg": 0.06386620551347733, "step": 5470, "valid_targets_mean": 2749.9, "valid_targets_min": 933 }, { "epoch": 5.367647058823529, "grad_norm": 0.5327119640641524, "learning_rate": 6.275167242625331e-06, "loss": 0.0859, "loss_nan_ranks": 0, "loss_rank_avg": 0.06920159608125687, "step": 5475, "valid_targets_mean": 2259.7, "valid_targets_min": 781 }, { "epoch": 5.372549019607844, "grad_norm": 0.5250883694648594, "learning_rate": 6.239647876895045e-06, "loss": 0.0753, "loss_nan_ranks": 0, "loss_rank_avg": 0.07292656600475311, "step": 5480, "valid_targets_mean": 2220.8, "valid_targets_min": 704 }, { "epoch": 5.377450980392156, "grad_norm": 0.6092967365208375, "learning_rate": 6.204210733090241e-06, "loss": 0.0823, "loss_nan_ranks": 0, "loss_rank_avg": 0.09393665939569473, "step": 5485, "valid_targets_mean": 2369.6, "valid_targets_min": 732 }, { "epoch": 5.382352941176471, "grad_norm": 0.6038113201133489, "learning_rate": 6.168856022957685e-06, "loss": 0.0869, "loss_nan_ranks": 0, "loss_rank_avg": 0.09418021887540817, "step": 5490, "valid_targets_mean": 2383.8, "valid_targets_min": 751 }, { "epoch": 5.387254901960785, "grad_norm": 0.5057934505834986, "learning_rate": 6.133583957751585e-06, "loss": 0.0816, "loss_nan_ranks": 0, "loss_rank_avg": 0.07620443403720856, "step": 5495, "valid_targets_mean": 2849.1, "valid_targets_min": 592 }, { "epoch": 5.392156862745098, "grad_norm": 0.5776768115860323, "learning_rate": 6.098394748232333e-06, "loss": 0.0874, "loss_nan_ranks": 0, "loss_rank_avg": 0.08147083967924118, "step": 5500, "valid_targets_mean": 2674.8, "valid_targets_min": 622 }, { "epoch": 5.397058823529412, "grad_norm": 0.6709503859844336, "learning_rate": 6.063288604665227e-06, "loss": 0.0777, "loss_nan_ranks": 0, "loss_rank_avg": 0.10320451855659485, "step": 5505, "valid_targets_mean": 1907.4, "valid_targets_min": 474 }, { "epoch": 5.401960784313726, "grad_norm": 0.5332746140305541, "learning_rate": 6.028265736819234e-06, "loss": 0.0945, "loss_nan_ranks": 0, "loss_rank_avg": 0.08802657574415207, "step": 5510, "valid_targets_mean": 2443.4, "valid_targets_min": 676 }, { "epoch": 5.4068627450980395, "grad_norm": 0.5303408521919405, "learning_rate": 5.993326353965705e-06, "loss": 0.0852, "loss_nan_ranks": 0, "loss_rank_avg": 0.07660799473524094, "step": 5515, "valid_targets_mean": 2294.6, "valid_targets_min": 721 }, { "epoch": 5.411764705882353, "grad_norm": 0.5504797907176615, "learning_rate": 5.958470664877154e-06, "loss": 0.0775, "loss_nan_ranks": 0, "loss_rank_avg": 0.0719451829791069, "step": 5520, "valid_targets_mean": 2223.8, "valid_targets_min": 759 }, { "epoch": 5.416666666666667, "grad_norm": 0.5048702357817372, "learning_rate": 5.9236988778260144e-06, "loss": 0.0805, "loss_nan_ranks": 0, "loss_rank_avg": 0.07212197780609131, "step": 5525, "valid_targets_mean": 2394.9, "valid_targets_min": 776 }, { "epoch": 5.421568627450981, "grad_norm": 0.5582414610550838, "learning_rate": 5.8890112005833565e-06, "loss": 0.0811, "loss_nan_ranks": 0, "loss_rank_avg": 0.1013210117816925, "step": 5530, "valid_targets_mean": 2547.2, "valid_targets_min": 535 }, { "epoch": 5.426470588235294, "grad_norm": 0.5997664325867221, "learning_rate": 5.854407840417693e-06, "loss": 0.0925, "loss_nan_ranks": 0, "loss_rank_avg": 0.11854314804077148, "step": 5535, "valid_targets_mean": 2110.2, "valid_targets_min": 713 }, { "epoch": 5.431372549019608, "grad_norm": 0.5953673256263169, "learning_rate": 5.819889004093719e-06, "loss": 0.0777, "loss_nan_ranks": 0, "loss_rank_avg": 0.09450195729732513, "step": 5540, "valid_targets_mean": 2220.2, "valid_targets_min": 711 }, { "epoch": 5.436274509803922, "grad_norm": 0.6808012844229521, "learning_rate": 5.785454897871059e-06, "loss": 0.0917, "loss_nan_ranks": 0, "loss_rank_avg": 0.12832430005073547, "step": 5545, "valid_targets_mean": 2311.3, "valid_targets_min": 742 }, { "epoch": 5.4411764705882355, "grad_norm": 0.5726522699115283, "learning_rate": 5.751105727503057e-06, "loss": 0.0787, "loss_nan_ranks": 0, "loss_rank_avg": 0.0782998651266098, "step": 5550, "valid_targets_mean": 2264.9, "valid_targets_min": 485 }, { "epoch": 5.446078431372549, "grad_norm": 0.5868036175605869, "learning_rate": 5.716841698235553e-06, "loss": 0.0899, "loss_nan_ranks": 0, "loss_rank_avg": 0.07577871531248093, "step": 5555, "valid_targets_mean": 1881.0, "valid_targets_min": 777 }, { "epoch": 5.450980392156863, "grad_norm": 0.5728814564653399, "learning_rate": 5.682663014805631e-06, "loss": 0.088, "loss_nan_ranks": 0, "loss_rank_avg": 0.08744935691356659, "step": 5560, "valid_targets_mean": 2001.8, "valid_targets_min": 640 }, { "epoch": 5.455882352941177, "grad_norm": 0.5131924143447337, "learning_rate": 5.648569881440422e-06, "loss": 0.0871, "loss_nan_ranks": 0, "loss_rank_avg": 0.0721743106842041, "step": 5565, "valid_targets_mean": 2405.6, "valid_targets_min": 604 }, { "epoch": 5.46078431372549, "grad_norm": 0.635324527204431, "learning_rate": 5.6145625018558715e-06, "loss": 0.0831, "loss_nan_ranks": 0, "loss_rank_avg": 0.10122652351856232, "step": 5570, "valid_targets_mean": 2350.2, "valid_targets_min": 598 }, { "epoch": 5.465686274509804, "grad_norm": 0.6267729572441716, "learning_rate": 5.580641079255509e-06, "loss": 0.0961, "loss_nan_ranks": 0, "loss_rank_avg": 0.10425372421741486, "step": 5575, "valid_targets_mean": 1768.8, "valid_targets_min": 790 }, { "epoch": 5.470588235294118, "grad_norm": 0.5930960268540582, "learning_rate": 5.54680581632925e-06, "loss": 0.0777, "loss_nan_ranks": 0, "loss_rank_avg": 0.07789880037307739, "step": 5580, "valid_targets_mean": 2379.4, "valid_targets_min": 580 }, { "epoch": 5.4754901960784315, "grad_norm": 0.5411247803074882, "learning_rate": 5.513056915252195e-06, "loss": 0.084, "loss_nan_ranks": 0, "loss_rank_avg": 0.07947784662246704, "step": 5585, "valid_targets_mean": 2909.1, "valid_targets_min": 852 }, { "epoch": 5.480392156862745, "grad_norm": 0.5846627085120992, "learning_rate": 5.479394577683404e-06, "loss": 0.0797, "loss_nan_ranks": 0, "loss_rank_avg": 0.07893018424510956, "step": 5590, "valid_targets_mean": 2389.6, "valid_targets_min": 673 }, { "epoch": 5.485294117647059, "grad_norm": 0.5935404654101385, "learning_rate": 5.44581900476469e-06, "loss": 0.0799, "loss_nan_ranks": 0, "loss_rank_avg": 0.08584611862897873, "step": 5595, "valid_targets_mean": 2056.1, "valid_targets_min": 684 }, { "epoch": 5.490196078431373, "grad_norm": 0.5868161180417224, "learning_rate": 5.412330397119419e-06, "loss": 0.0742, "loss_nan_ranks": 0, "loss_rank_avg": 0.07897976040840149, "step": 5600, "valid_targets_mean": 2170.9, "valid_targets_min": 708 }, { "epoch": 5.495098039215686, "grad_norm": 0.5805575731061238, "learning_rate": 5.3789289548513326e-06, "loss": 0.0785, "loss_nan_ranks": 0, "loss_rank_avg": 0.09302123636007309, "step": 5605, "valid_targets_mean": 2172.2, "valid_targets_min": 800 }, { "epoch": 5.5, "grad_norm": 0.6347183322088364, "learning_rate": 5.345614877543313e-06, "loss": 0.0817, "loss_nan_ranks": 0, "loss_rank_avg": 0.07956665754318237, "step": 5610, "valid_targets_mean": 1914.4, "valid_targets_min": 750 }, { "epoch": 5.504901960784314, "grad_norm": 0.7293893954848631, "learning_rate": 5.312388364256229e-06, "loss": 0.1007, "loss_nan_ranks": 0, "loss_rank_avg": 0.10558699816465378, "step": 5615, "valid_targets_mean": 1635.8, "valid_targets_min": 688 }, { "epoch": 5.509803921568627, "grad_norm": 0.5270248184938987, "learning_rate": 5.279249613527735e-06, "loss": 0.0742, "loss_nan_ranks": 0, "loss_rank_avg": 0.06831567734479904, "step": 5620, "valid_targets_mean": 2452.7, "valid_targets_min": 734 }, { "epoch": 5.514705882352941, "grad_norm": 0.5350392884902185, "learning_rate": 5.246198823371063e-06, "loss": 0.0736, "loss_nan_ranks": 0, "loss_rank_avg": 0.06904664635658264, "step": 5625, "valid_targets_mean": 2162.8, "valid_targets_min": 808 }, { "epoch": 5.519607843137255, "grad_norm": 0.6344941061658974, "learning_rate": 5.213236191273854e-06, "loss": 0.0884, "loss_nan_ranks": 0, "loss_rank_avg": 0.09255999326705933, "step": 5630, "valid_targets_mean": 2347.1, "valid_targets_min": 865 }, { "epoch": 5.5245098039215685, "grad_norm": 0.6020792880176296, "learning_rate": 5.180361914196996e-06, "loss": 0.0879, "loss_nan_ranks": 0, "loss_rank_avg": 0.09349136054515839, "step": 5635, "valid_targets_mean": 2380.8, "valid_targets_min": 607 }, { "epoch": 5.529411764705882, "grad_norm": 0.5956397945862633, "learning_rate": 5.147576188573433e-06, "loss": 0.0836, "loss_nan_ranks": 0, "loss_rank_avg": 0.09244567155838013, "step": 5640, "valid_targets_mean": 2050.1, "valid_targets_min": 567 }, { "epoch": 5.534313725490196, "grad_norm": 0.5153802600162333, "learning_rate": 5.114879210306967e-06, "loss": 0.0772, "loss_nan_ranks": 0, "loss_rank_avg": 0.06410102546215057, "step": 5645, "valid_targets_mean": 2220.6, "valid_targets_min": 560 }, { "epoch": 5.53921568627451, "grad_norm": 0.5903655078820536, "learning_rate": 5.0822711747711365e-06, "loss": 0.0802, "loss_nan_ranks": 0, "loss_rank_avg": 0.07721748948097229, "step": 5650, "valid_targets_mean": 2455.4, "valid_targets_min": 521 }, { "epoch": 5.544117647058823, "grad_norm": 0.5429688822860307, "learning_rate": 5.049752276808002e-06, "loss": 0.0841, "loss_nan_ranks": 0, "loss_rank_avg": 0.0777660384774208, "step": 5655, "valid_targets_mean": 2515.0, "valid_targets_min": 680 }, { "epoch": 5.549019607843137, "grad_norm": 0.5604176522917697, "learning_rate": 5.0173227107270065e-06, "loss": 0.0901, "loss_nan_ranks": 0, "loss_rank_avg": 0.08657435327768326, "step": 5660, "valid_targets_mean": 2180.7, "valid_targets_min": 733 }, { "epoch": 5.553921568627451, "grad_norm": 0.5281339651549892, "learning_rate": 4.984982670303818e-06, "loss": 0.0733, "loss_nan_ranks": 0, "loss_rank_avg": 0.06807395815849304, "step": 5665, "valid_targets_mean": 2235.6, "valid_targets_min": 593 }, { "epoch": 5.5588235294117645, "grad_norm": 0.5690739702658926, "learning_rate": 4.952732348779165e-06, "loss": 0.0743, "loss_nan_ranks": 0, "loss_rank_avg": 0.06617975234985352, "step": 5670, "valid_targets_mean": 2433.0, "valid_targets_min": 720 }, { "epoch": 5.563725490196078, "grad_norm": 0.5656611047345302, "learning_rate": 4.920571938857665e-06, "loss": 0.0716, "loss_nan_ranks": 0, "loss_rank_avg": 0.08199770003557205, "step": 5675, "valid_targets_mean": 2496.0, "valid_targets_min": 742 }, { "epoch": 5.568627450980392, "grad_norm": 0.5265721948588862, "learning_rate": 4.88850163270671e-06, "loss": 0.0753, "loss_nan_ranks": 0, "loss_rank_avg": 0.07681460678577423, "step": 5680, "valid_targets_mean": 2276.1, "valid_targets_min": 634 }, { "epoch": 5.573529411764706, "grad_norm": 0.43922395927036295, "learning_rate": 4.856521621955282e-06, "loss": 0.0772, "loss_nan_ranks": 0, "loss_rank_avg": 0.06098077446222305, "step": 5685, "valid_targets_mean": 2503.2, "valid_targets_min": 816 }, { "epoch": 5.578431372549019, "grad_norm": 0.5517412995836757, "learning_rate": 4.824632097692816e-06, "loss": 0.0739, "loss_nan_ranks": 0, "loss_rank_avg": 0.07269728183746338, "step": 5690, "valid_targets_mean": 2103.2, "valid_targets_min": 835 }, { "epoch": 5.583333333333333, "grad_norm": 0.5648727695267294, "learning_rate": 4.7928332504680876e-06, "loss": 0.0759, "loss_nan_ranks": 0, "loss_rank_avg": 0.07408298552036285, "step": 5695, "valid_targets_mean": 2224.1, "valid_targets_min": 725 }, { "epoch": 5.588235294117647, "grad_norm": 0.4929550418851452, "learning_rate": 4.761125270288041e-06, "loss": 0.0772, "loss_nan_ranks": 0, "loss_rank_avg": 0.074101522564888, "step": 5700, "valid_targets_mean": 2437.9, "valid_targets_min": 533 }, { "epoch": 5.5931372549019605, "grad_norm": 0.6146098190528329, "learning_rate": 4.72950834661666e-06, "loss": 0.0815, "loss_nan_ranks": 0, "loss_rank_avg": 0.09067805856466293, "step": 5705, "valid_targets_mean": 2192.0, "valid_targets_min": 613 }, { "epoch": 5.598039215686274, "grad_norm": 0.5713767381680502, "learning_rate": 4.69798266837384e-06, "loss": 0.0752, "loss_nan_ranks": 0, "loss_rank_avg": 0.0734923854470253, "step": 5710, "valid_targets_mean": 2141.4, "valid_targets_min": 729 }, { "epoch": 5.602941176470588, "grad_norm": 0.530929712629617, "learning_rate": 4.666548423934265e-06, "loss": 0.0735, "loss_nan_ranks": 0, "loss_rank_avg": 0.07157990336418152, "step": 5715, "valid_targets_mean": 2109.9, "valid_targets_min": 595 }, { "epoch": 5.607843137254902, "grad_norm": 0.6962615608499858, "learning_rate": 4.635205801126286e-06, "loss": 0.0831, "loss_nan_ranks": 0, "loss_rank_avg": 0.11094634234905243, "step": 5720, "valid_targets_mean": 1813.5, "valid_targets_min": 727 }, { "epoch": 5.612745098039216, "grad_norm": 0.4782088252652507, "learning_rate": 4.603954987230765e-06, "loss": 0.0783, "loss_nan_ranks": 0, "loss_rank_avg": 0.07033517956733704, "step": 5725, "valid_targets_mean": 2793.8, "valid_targets_min": 573 }, { "epoch": 5.617647058823529, "grad_norm": 0.5951363588950894, "learning_rate": 4.572796168980007e-06, "loss": 0.0818, "loss_nan_ranks": 0, "loss_rank_avg": 0.07607996463775635, "step": 5730, "valid_targets_mean": 2104.0, "valid_targets_min": 798 }, { "epoch": 5.622549019607844, "grad_norm": 0.4987162833335496, "learning_rate": 4.541729532556598e-06, "loss": 0.0795, "loss_nan_ranks": 0, "loss_rank_avg": 0.07763554155826569, "step": 5735, "valid_targets_mean": 2146.9, "valid_targets_min": 526 }, { "epoch": 5.627450980392156, "grad_norm": 0.5669056837913017, "learning_rate": 4.5107552635923125e-06, "loss": 0.0798, "loss_nan_ranks": 0, "loss_rank_avg": 0.07391584664583206, "step": 5740, "valid_targets_mean": 2252.2, "valid_targets_min": 761 }, { "epoch": 5.632352941176471, "grad_norm": 0.4535207599733533, "learning_rate": 4.479873547167015e-06, "loss": 0.0784, "loss_nan_ranks": 0, "loss_rank_avg": 0.07132834196090698, "step": 5745, "valid_targets_mean": 2706.5, "valid_targets_min": 655 }, { "epoch": 5.637254901960784, "grad_norm": 0.5964000308881082, "learning_rate": 4.449084567807544e-06, "loss": 0.0703, "loss_nan_ranks": 0, "loss_rank_avg": 0.07358132302761078, "step": 5750, "valid_targets_mean": 1825.4, "valid_targets_min": 688 }, { "epoch": 5.642156862745098, "grad_norm": 0.551048381068549, "learning_rate": 4.41838850948659e-06, "loss": 0.0895, "loss_nan_ranks": 0, "loss_rank_avg": 0.0815672054886818, "step": 5755, "valid_targets_mean": 2226.1, "valid_targets_min": 721 }, { "epoch": 5.647058823529412, "grad_norm": 0.6183042975984667, "learning_rate": 4.38778555562164e-06, "loss": 0.0877, "loss_nan_ranks": 0, "loss_rank_avg": 0.08897422254085541, "step": 5760, "valid_targets_mean": 2168.8, "valid_targets_min": 640 }, { "epoch": 5.651960784313726, "grad_norm": 0.516411332728326, "learning_rate": 4.357275889073833e-06, "loss": 0.0747, "loss_nan_ranks": 0, "loss_rank_avg": 0.07211611419916153, "step": 5765, "valid_targets_mean": 2329.8, "valid_targets_min": 954 }, { "epoch": 5.6568627450980395, "grad_norm": 0.6726342729830591, "learning_rate": 4.326859692146898e-06, "loss": 0.0823, "loss_nan_ranks": 0, "loss_rank_avg": 0.07956632971763611, "step": 5770, "valid_targets_mean": 1732.2, "valid_targets_min": 574 }, { "epoch": 5.661764705882353, "grad_norm": 0.6069399571516791, "learning_rate": 4.296537146586061e-06, "loss": 0.0809, "loss_nan_ranks": 0, "loss_rank_avg": 0.08645060658454895, "step": 5775, "valid_targets_mean": 2165.1, "valid_targets_min": 617 }, { "epoch": 5.666666666666667, "grad_norm": 0.6122057076391019, "learning_rate": 4.266308433576955e-06, "loss": 0.087, "loss_nan_ranks": 0, "loss_rank_avg": 0.07423560321331024, "step": 5780, "valid_targets_mean": 2185.4, "valid_targets_min": 817 }, { "epoch": 5.671568627450981, "grad_norm": 0.5318258105059224, "learning_rate": 4.236173733744542e-06, "loss": 0.0829, "loss_nan_ranks": 0, "loss_rank_avg": 0.07637228816747665, "step": 5785, "valid_targets_mean": 2447.4, "valid_targets_min": 667 }, { "epoch": 5.676470588235294, "grad_norm": 0.5769559464124637, "learning_rate": 4.206133227152014e-06, "loss": 0.0765, "loss_nan_ranks": 0, "loss_rank_avg": 0.06808263808488846, "step": 5790, "valid_targets_mean": 2259.2, "valid_targets_min": 756 }, { "epoch": 5.681372549019608, "grad_norm": 0.5541240828900388, "learning_rate": 4.1761870932997374e-06, "loss": 0.0882, "loss_nan_ranks": 0, "loss_rank_avg": 0.09163584560155869, "step": 5795, "valid_targets_mean": 2225.0, "valid_targets_min": 647 }, { "epoch": 5.686274509803922, "grad_norm": 0.7151472521157439, "learning_rate": 4.146335511124186e-06, "loss": 0.0894, "loss_nan_ranks": 0, "loss_rank_avg": 0.07315774261951447, "step": 5800, "valid_targets_mean": 2137.9, "valid_targets_min": 719 }, { "epoch": 5.6911764705882355, "grad_norm": 0.5293164265887055, "learning_rate": 4.11657865899685e-06, "loss": 0.0815, "loss_nan_ranks": 0, "loss_rank_avg": 0.08617638051509857, "step": 5805, "valid_targets_mean": 2464.4, "valid_targets_min": 813 }, { "epoch": 5.696078431372549, "grad_norm": 1.0791096159670817, "learning_rate": 4.086916714723183e-06, "loss": 0.0768, "loss_nan_ranks": 0, "loss_rank_avg": 0.10144323855638504, "step": 5810, "valid_targets_mean": 1979.8, "valid_targets_min": 791 }, { "epoch": 5.700980392156863, "grad_norm": 0.5517469532362859, "learning_rate": 4.057349855541557e-06, "loss": 0.0753, "loss_nan_ranks": 0, "loss_rank_avg": 0.07608313858509064, "step": 5815, "valid_targets_mean": 2220.6, "valid_targets_min": 740 }, { "epoch": 5.705882352941177, "grad_norm": 0.4856089404958147, "learning_rate": 4.02787825812214e-06, "loss": 0.0786, "loss_nan_ranks": 0, "loss_rank_avg": 0.06653439998626709, "step": 5820, "valid_targets_mean": 2393.6, "valid_targets_min": 678 }, { "epoch": 5.71078431372549, "grad_norm": 0.6100738421759316, "learning_rate": 3.998502098565924e-06, "loss": 0.0839, "loss_nan_ranks": 0, "loss_rank_avg": 0.08721679449081421, "step": 5825, "valid_targets_mean": 2000.5, "valid_targets_min": 599 }, { "epoch": 5.715686274509804, "grad_norm": 0.4645738101717131, "learning_rate": 3.969221552403626e-06, "loss": 0.086, "loss_nan_ranks": 0, "loss_rank_avg": 0.06543716788291931, "step": 5830, "valid_targets_mean": 2722.8, "valid_targets_min": 757 }, { "epoch": 5.720588235294118, "grad_norm": 0.6813920591255378, "learning_rate": 3.940036794594633e-06, "loss": 0.0794, "loss_nan_ranks": 0, "loss_rank_avg": 0.0911283940076828, "step": 5835, "valid_targets_mean": 1840.8, "valid_targets_min": 788 }, { "epoch": 5.7254901960784315, "grad_norm": 0.7151713477093936, "learning_rate": 3.910947999525985e-06, "loss": 0.0884, "loss_nan_ranks": 0, "loss_rank_avg": 0.11087524890899658, "step": 5840, "valid_targets_mean": 1622.9, "valid_targets_min": 692 }, { "epoch": 5.730392156862745, "grad_norm": 0.5463288856443642, "learning_rate": 3.881955341011303e-06, "loss": 0.0777, "loss_nan_ranks": 0, "loss_rank_avg": 0.07577422261238098, "step": 5845, "valid_targets_mean": 2336.6, "valid_targets_min": 778 }, { "epoch": 5.735294117647059, "grad_norm": 0.6439262012281611, "learning_rate": 3.853058992289782e-06, "loss": 0.085, "loss_nan_ranks": 0, "loss_rank_avg": 0.09771288931369781, "step": 5850, "valid_targets_mean": 1823.0, "valid_targets_min": 526 }, { "epoch": 5.740196078431373, "grad_norm": 0.7531604446568076, "learning_rate": 3.824259126025123e-06, "loss": 0.0889, "loss_nan_ranks": 0, "loss_rank_avg": 0.0781392902135849, "step": 5855, "valid_targets_mean": 1648.1, "valid_targets_min": 246 }, { "epoch": 5.745098039215686, "grad_norm": 0.5736859529863001, "learning_rate": 3.7955559143045296e-06, "loss": 0.0757, "loss_nan_ranks": 0, "loss_rank_avg": 0.07947244495153427, "step": 5860, "valid_targets_mean": 2443.7, "valid_targets_min": 557 }, { "epoch": 5.75, "grad_norm": 0.543099315036524, "learning_rate": 3.7669495286376667e-06, "loss": 0.0854, "loss_nan_ranks": 0, "loss_rank_avg": 0.08552545309066772, "step": 5865, "valid_targets_mean": 2266.9, "valid_targets_min": 765 }, { "epoch": 5.754901960784314, "grad_norm": 0.4491128637598562, "learning_rate": 3.738440139955628e-06, "loss": 0.0836, "loss_nan_ranks": 0, "loss_rank_avg": 0.06782278418540955, "step": 5870, "valid_targets_mean": 2791.9, "valid_targets_min": 357 }, { "epoch": 5.759803921568627, "grad_norm": 0.5223104359168639, "learning_rate": 3.7100279186099263e-06, "loss": 0.0726, "loss_nan_ranks": 0, "loss_rank_avg": 0.06796294450759888, "step": 5875, "valid_targets_mean": 1959.1, "valid_targets_min": 711 }, { "epoch": 5.764705882352941, "grad_norm": 0.49720653904211687, "learning_rate": 3.6817130343714814e-06, "loss": 0.0819, "loss_nan_ranks": 0, "loss_rank_avg": 0.07060331106185913, "step": 5880, "valid_targets_mean": 2528.8, "valid_targets_min": 777 }, { "epoch": 5.769607843137255, "grad_norm": 0.5702908165008694, "learning_rate": 3.6534956564295844e-06, "loss": 0.0773, "loss_nan_ranks": 0, "loss_rank_avg": 0.07758490741252899, "step": 5885, "valid_targets_mean": 2392.8, "valid_targets_min": 820 }, { "epoch": 5.7745098039215685, "grad_norm": 0.5124808107408252, "learning_rate": 3.625375953390906e-06, "loss": 0.0804, "loss_nan_ranks": 0, "loss_rank_avg": 0.08320645987987518, "step": 5890, "valid_targets_mean": 2681.4, "valid_targets_min": 975 }, { "epoch": 5.779411764705882, "grad_norm": 0.535163800457717, "learning_rate": 3.597354093278489e-06, "loss": 0.0836, "loss_nan_ranks": 0, "loss_rank_avg": 0.08327630162239075, "step": 5895, "valid_targets_mean": 2386.8, "valid_targets_min": 777 }, { "epoch": 5.784313725490196, "grad_norm": 0.5751280657945049, "learning_rate": 3.5694302435307248e-06, "loss": 0.0815, "loss_nan_ranks": 0, "loss_rank_avg": 0.083884596824646, "step": 5900, "valid_targets_mean": 2702.4, "valid_targets_min": 691 }, { "epoch": 5.78921568627451, "grad_norm": 0.47314846704263797, "learning_rate": 3.5416045710003632e-06, "loss": 0.0843, "loss_nan_ranks": 0, "loss_rank_avg": 0.09700559079647064, "step": 5905, "valid_targets_mean": 2672.6, "valid_targets_min": 512 }, { "epoch": 5.794117647058823, "grad_norm": 0.47095171471968333, "learning_rate": 3.5138772419535315e-06, "loss": 0.0858, "loss_nan_ranks": 0, "loss_rank_avg": 0.06798610091209412, "step": 5910, "valid_targets_mean": 2714.8, "valid_targets_min": 693 }, { "epoch": 5.799019607843137, "grad_norm": 0.49993363026960297, "learning_rate": 3.4862484220687277e-06, "loss": 0.0751, "loss_nan_ranks": 0, "loss_rank_avg": 0.0669768750667572, "step": 5915, "valid_targets_mean": 2422.4, "valid_targets_min": 791 }, { "epoch": 5.803921568627451, "grad_norm": 0.5832018709883363, "learning_rate": 3.458718276435813e-06, "loss": 0.0842, "loss_nan_ranks": 0, "loss_rank_avg": 0.08323369920253754, "step": 5920, "valid_targets_mean": 2593.4, "valid_targets_min": 804 }, { "epoch": 5.8088235294117645, "grad_norm": 0.60658841552699, "learning_rate": 3.4312869695550634e-06, "loss": 0.0761, "loss_nan_ranks": 0, "loss_rank_avg": 0.0748073011636734, "step": 5925, "valid_targets_mean": 1869.9, "valid_targets_min": 788 }, { "epoch": 5.813725490196078, "grad_norm": 0.48601904801057055, "learning_rate": 3.403954665336149e-06, "loss": 0.0669, "loss_nan_ranks": 0, "loss_rank_avg": 0.06104360893368721, "step": 5930, "valid_targets_mean": 2344.1, "valid_targets_min": 812 }, { "epoch": 5.818627450980392, "grad_norm": 0.5235780006216862, "learning_rate": 3.3767215270971755e-06, "loss": 0.0867, "loss_nan_ranks": 0, "loss_rank_avg": 0.11922559142112732, "step": 5935, "valid_targets_mean": 2289.8, "valid_targets_min": 858 }, { "epoch": 5.823529411764706, "grad_norm": 0.6324375338401088, "learning_rate": 3.349587717563709e-06, "loss": 0.0802, "loss_nan_ranks": 0, "loss_rank_avg": 0.08978225290775299, "step": 5940, "valid_targets_mean": 2146.6, "valid_targets_min": 618 }, { "epoch": 5.828431372549019, "grad_norm": 0.6014931507395612, "learning_rate": 3.322553398867807e-06, "loss": 0.0853, "loss_nan_ranks": 0, "loss_rank_avg": 0.07696583867073059, "step": 5945, "valid_targets_mean": 1989.6, "valid_targets_min": 559 }, { "epoch": 5.833333333333333, "grad_norm": 0.6125932724999763, "learning_rate": 3.295618732547021e-06, "loss": 0.0897, "loss_nan_ranks": 0, "loss_rank_avg": 0.12296289205551147, "step": 5950, "valid_targets_mean": 2366.6, "valid_targets_min": 387 }, { "epoch": 5.838235294117647, "grad_norm": 0.58654531214764, "learning_rate": 3.2687838795434623e-06, "loss": 0.0846, "loss_nan_ranks": 0, "loss_rank_avg": 0.07440722733736038, "step": 5955, "valid_targets_mean": 2124.7, "valid_targets_min": 464 }, { "epoch": 5.8431372549019605, "grad_norm": 0.6024776452686876, "learning_rate": 3.242049000202838e-06, "loss": 0.0843, "loss_nan_ranks": 0, "loss_rank_avg": 0.08400903642177582, "step": 5960, "valid_targets_mean": 2285.9, "valid_targets_min": 458 }, { "epoch": 5.848039215686274, "grad_norm": 0.6422151134830493, "learning_rate": 3.215414254273468e-06, "loss": 0.088, "loss_nan_ranks": 0, "loss_rank_avg": 0.11055001616477966, "step": 5965, "valid_targets_mean": 2167.0, "valid_targets_min": 786 }, { "epoch": 5.852941176470588, "grad_norm": 0.6620300611104084, "learning_rate": 3.18887980090536e-06, "loss": 0.0847, "loss_nan_ranks": 0, "loss_rank_avg": 0.08255288749933243, "step": 5970, "valid_targets_mean": 1708.4, "valid_targets_min": 677 }, { "epoch": 5.857843137254902, "grad_norm": 0.5930788009232768, "learning_rate": 3.16244579864925e-06, "loss": 0.0841, "loss_nan_ranks": 0, "loss_rank_avg": 0.08282943069934845, "step": 5975, "valid_targets_mean": 2136.5, "valid_targets_min": 826 }, { "epoch": 5.862745098039216, "grad_norm": 0.6669457051379303, "learning_rate": 3.1361124054556312e-06, "loss": 0.0832, "loss_nan_ranks": 0, "loss_rank_avg": 0.10319022089242935, "step": 5980, "valid_targets_mean": 2080.8, "valid_targets_min": 985 }, { "epoch": 5.867647058823529, "grad_norm": 0.7614162676195864, "learning_rate": 3.1098797786738433e-06, "loss": 0.085, "loss_nan_ranks": 0, "loss_rank_avg": 0.09599629044532776, "step": 5985, "valid_targets_mean": 1428.2, "valid_targets_min": 597 }, { "epoch": 5.872549019607844, "grad_norm": 0.5860425697430323, "learning_rate": 3.0837480750511182e-06, "loss": 0.078, "loss_nan_ranks": 0, "loss_rank_avg": 0.10159435868263245, "step": 5990, "valid_targets_mean": 2192.9, "valid_targets_min": 940 }, { "epoch": 5.877450980392156, "grad_norm": 0.5054169362663372, "learning_rate": 3.0577174507316496e-06, "loss": 0.0742, "loss_nan_ranks": 0, "loss_rank_avg": 0.06875654309988022, "step": 5995, "valid_targets_mean": 2596.9, "valid_targets_min": 536 }, { "epoch": 5.882352941176471, "grad_norm": 0.5199111577493412, "learning_rate": 3.031788061255634e-06, "loss": 0.0847, "loss_nan_ranks": 0, "loss_rank_avg": 0.07488842308521271, "step": 6000, "valid_targets_mean": 2414.6, "valid_targets_min": 673 }, { "epoch": 5.887254901960784, "grad_norm": 0.563203147883309, "learning_rate": 3.005960061558386e-06, "loss": 0.0824, "loss_nan_ranks": 0, "loss_rank_avg": 0.07726642489433289, "step": 6005, "valid_targets_mean": 2126.5, "valid_targets_min": 654 }, { "epoch": 5.892156862745098, "grad_norm": 0.8120718693179341, "learning_rate": 2.980233605969374e-06, "loss": 0.0697, "loss_nan_ranks": 0, "loss_rank_avg": 0.09062586724758148, "step": 6010, "valid_targets_mean": 2541.3, "valid_targets_min": 727 }, { "epoch": 5.897058823529412, "grad_norm": 0.6852211896553415, "learning_rate": 2.9546088482113046e-06, "loss": 0.0781, "loss_nan_ranks": 0, "loss_rank_avg": 0.07951194047927856, "step": 6015, "valid_targets_mean": 1838.3, "valid_targets_min": 892 }, { "epoch": 5.901960784313726, "grad_norm": 0.5527062870733078, "learning_rate": 2.9290859413992322e-06, "loss": 0.074, "loss_nan_ranks": 0, "loss_rank_avg": 0.07983888685703278, "step": 6020, "valid_targets_mean": 2328.2, "valid_targets_min": 555 }, { "epoch": 5.9068627450980395, "grad_norm": 0.5587593159739197, "learning_rate": 2.903665038039616e-06, "loss": 0.0884, "loss_nan_ranks": 0, "loss_rank_avg": 0.07825113087892532, "step": 6025, "valid_targets_mean": 2058.4, "valid_targets_min": 669 }, { "epoch": 5.911764705882353, "grad_norm": 0.6497842414090926, "learning_rate": 2.8783462900294035e-06, "loss": 0.0882, "loss_nan_ranks": 0, "loss_rank_avg": 0.09731444716453552, "step": 6030, "valid_targets_mean": 1918.4, "valid_targets_min": 720 }, { "epoch": 5.916666666666667, "grad_norm": 0.5685987854033889, "learning_rate": 2.8531298486551564e-06, "loss": 0.0769, "loss_nan_ranks": 0, "loss_rank_avg": 0.07977601885795593, "step": 6035, "valid_targets_mean": 2517.5, "valid_targets_min": 695 }, { "epoch": 5.921568627450981, "grad_norm": 0.6558953205650121, "learning_rate": 2.8280158645921042e-06, "loss": 0.0834, "loss_nan_ranks": 0, "loss_rank_avg": 0.07963621616363525, "step": 6040, "valid_targets_mean": 2447.0, "valid_targets_min": 900 }, { "epoch": 5.926470588235294, "grad_norm": 0.5166248894196765, "learning_rate": 2.803004487903287e-06, "loss": 0.0739, "loss_nan_ranks": 0, "loss_rank_avg": 0.07894115149974823, "step": 6045, "valid_targets_mean": 2478.1, "valid_targets_min": 727 }, { "epoch": 5.931372549019608, "grad_norm": 0.6029700113130794, "learning_rate": 2.778095868038617e-06, "loss": 0.075, "loss_nan_ranks": 0, "loss_rank_avg": 0.0775521844625473, "step": 6050, "valid_targets_mean": 1711.4, "valid_targets_min": 509 }, { "epoch": 5.936274509803922, "grad_norm": 0.6580105250928281, "learning_rate": 2.753290153834023e-06, "loss": 0.0851, "loss_nan_ranks": 0, "loss_rank_avg": 0.08928344398736954, "step": 6055, "valid_targets_mean": 1875.9, "valid_targets_min": 888 }, { "epoch": 5.9411764705882355, "grad_norm": 0.5678302569504097, "learning_rate": 2.728587493510535e-06, "loss": 0.0777, "loss_nan_ranks": 0, "loss_rank_avg": 0.07457900792360306, "step": 6060, "valid_targets_mean": 2254.5, "valid_targets_min": 865 }, { "epoch": 5.946078431372549, "grad_norm": 0.6494590024071005, "learning_rate": 2.7039880346734016e-06, "loss": 0.0771, "loss_nan_ranks": 0, "loss_rank_avg": 0.09324674308300018, "step": 6065, "valid_targets_mean": 1873.6, "valid_targets_min": 659 }, { "epoch": 5.950980392156863, "grad_norm": 0.4673173745041048, "learning_rate": 2.679491924311226e-06, "loss": 0.0851, "loss_nan_ranks": 0, "loss_rank_avg": 0.07084433734416962, "step": 6070, "valid_targets_mean": 2818.4, "valid_targets_min": 957 }, { "epoch": 5.955882352941177, "grad_norm": 0.6025288740140903, "learning_rate": 2.655099308795077e-06, "loss": 0.0776, "loss_nan_ranks": 0, "loss_rank_avg": 0.08057056367397308, "step": 6075, "valid_targets_mean": 1935.4, "valid_targets_min": 656 }, { "epoch": 5.96078431372549, "grad_norm": 0.6488585540480777, "learning_rate": 2.630810333877598e-06, "loss": 0.087, "loss_nan_ranks": 0, "loss_rank_avg": 0.08397980779409409, "step": 6080, "valid_targets_mean": 1951.4, "valid_targets_min": 848 }, { "epoch": 5.965686274509804, "grad_norm": 0.5375473700344824, "learning_rate": 2.606625144692165e-06, "loss": 0.0813, "loss_nan_ranks": 0, "loss_rank_avg": 0.07249542325735092, "step": 6085, "valid_targets_mean": 2204.8, "valid_targets_min": 798 }, { "epoch": 5.970588235294118, "grad_norm": 0.5006793601077577, "learning_rate": 2.582543885752e-06, "loss": 0.0777, "loss_nan_ranks": 0, "loss_rank_avg": 0.06924687325954437, "step": 6090, "valid_targets_mean": 2698.9, "valid_targets_min": 923 }, { "epoch": 5.9754901960784315, "grad_norm": 0.5050408076456617, "learning_rate": 2.5585667009493053e-06, "loss": 0.0813, "loss_nan_ranks": 0, "loss_rank_avg": 0.06595446169376373, "step": 6095, "valid_targets_mean": 2226.9, "valid_targets_min": 614 }, { "epoch": 5.980392156862745, "grad_norm": 0.5315306645380031, "learning_rate": 2.534693733554425e-06, "loss": 0.0964, "loss_nan_ranks": 0, "loss_rank_avg": 0.08023549616336823, "step": 6100, "valid_targets_mean": 2730.5, "valid_targets_min": 720 }, { "epoch": 5.985294117647059, "grad_norm": 0.703760578715545, "learning_rate": 2.510925126214969e-06, "loss": 0.0803, "loss_nan_ranks": 0, "loss_rank_avg": 0.09702526032924652, "step": 6105, "valid_targets_mean": 1739.1, "valid_targets_min": 637 }, { "epoch": 5.990196078431373, "grad_norm": 0.4674576209361368, "learning_rate": 2.487261020954972e-06, "loss": 0.0879, "loss_nan_ranks": 0, "loss_rank_avg": 0.06910908222198486, "step": 6110, "valid_targets_mean": 2932.8, "valid_targets_min": 824 }, { "epoch": 5.995098039215686, "grad_norm": 0.5152485984762009, "learning_rate": 2.4637015591740276e-06, "loss": 0.0721, "loss_nan_ranks": 0, "loss_rank_avg": 0.06391312181949615, "step": 6115, "valid_targets_mean": 2238.2, "valid_targets_min": 697 }, { "epoch": 6.0, "grad_norm": 0.6130671169794297, "learning_rate": 2.440246881646464e-06, "loss": 0.0788, "loss_nan_ranks": 0, "loss_rank_avg": 0.08633176982402802, "step": 6120, "valid_targets_mean": 1896.4, "valid_targets_min": 704 }, { "epoch": 6.004901960784314, "grad_norm": 0.5430984365740257, "learning_rate": 2.416897128520499e-06, "loss": 0.0688, "loss_nan_ranks": 0, "loss_rank_avg": 0.07396151125431061, "step": 6125, "valid_targets_mean": 2240.2, "valid_targets_min": 685 }, { "epoch": 6.009803921568627, "grad_norm": 0.5763052421927343, "learning_rate": 2.393652439317382e-06, "loss": 0.066, "loss_nan_ranks": 0, "loss_rank_avg": 0.07698511332273483, "step": 6130, "valid_targets_mean": 1928.5, "valid_targets_min": 572 }, { "epoch": 6.014705882352941, "grad_norm": 0.48819703817877225, "learning_rate": 2.370512952930595e-06, "loss": 0.0718, "loss_nan_ranks": 0, "loss_rank_avg": 0.06292486190795898, "step": 6135, "valid_targets_mean": 2492.7, "valid_targets_min": 543 }, { "epoch": 6.019607843137255, "grad_norm": 0.5671829047793151, "learning_rate": 2.3474788076249988e-06, "loss": 0.0798, "loss_nan_ranks": 0, "loss_rank_avg": 0.07058997452259064, "step": 6140, "valid_targets_mean": 2339.8, "valid_targets_min": 888 }, { "epoch": 6.0245098039215685, "grad_norm": 0.5496278977860942, "learning_rate": 2.3245501410359972e-06, "loss": 0.0809, "loss_nan_ranks": 0, "loss_rank_avg": 0.07255090028047562, "step": 6145, "valid_targets_mean": 2154.3, "valid_targets_min": 482 }, { "epoch": 6.029411764705882, "grad_norm": 0.4937862359973531, "learning_rate": 2.301727090168744e-06, "loss": 0.0676, "loss_nan_ranks": 0, "loss_rank_avg": 0.0625627338886261, "step": 6150, "valid_targets_mean": 2450.2, "valid_targets_min": 642 }, { "epoch": 6.034313725490196, "grad_norm": 0.5717628053168052, "learning_rate": 2.2790097913973154e-06, "loss": 0.0713, "loss_nan_ranks": 0, "loss_rank_avg": 0.07228903472423553, "step": 6155, "valid_targets_mean": 2367.8, "valid_targets_min": 534 }, { "epoch": 6.03921568627451, "grad_norm": 0.5785020160716992, "learning_rate": 2.256398380463869e-06, "loss": 0.075, "loss_nan_ranks": 0, "loss_rank_avg": 0.09864409267902374, "step": 6160, "valid_targets_mean": 2456.7, "valid_targets_min": 794 }, { "epoch": 6.044117647058823, "grad_norm": 0.804246675079279, "learning_rate": 2.233892992477873e-06, "loss": 0.0809, "loss_nan_ranks": 0, "loss_rank_avg": 0.0953570306301117, "step": 6165, "valid_targets_mean": 1702.3, "valid_targets_min": 697 }, { "epoch": 6.049019607843137, "grad_norm": 0.5222243433110547, "learning_rate": 2.211493761915271e-06, "loss": 0.0658, "loss_nan_ranks": 0, "loss_rank_avg": 0.06962548196315765, "step": 6170, "valid_targets_mean": 2213.9, "valid_targets_min": 490 }, { "epoch": 6.053921568627451, "grad_norm": 0.7161229915529039, "learning_rate": 2.1892008226176763e-06, "loss": 0.0898, "loss_nan_ranks": 0, "loss_rank_avg": 0.10996219515800476, "step": 6175, "valid_targets_mean": 1936.4, "valid_targets_min": 687 }, { "epoch": 6.0588235294117645, "grad_norm": 0.5057245594944937, "learning_rate": 2.1670143077916015e-06, "loss": 0.0729, "loss_nan_ranks": 0, "loss_rank_avg": 0.06661894172430038, "step": 6180, "valid_targets_mean": 2843.9, "valid_targets_min": 776 }, { "epoch": 6.063725490196078, "grad_norm": 0.6052163077723632, "learning_rate": 2.1449343500076304e-06, "loss": 0.077, "loss_nan_ranks": 0, "loss_rank_avg": 0.06724628806114197, "step": 6185, "valid_targets_mean": 2032.4, "valid_targets_min": 594 }, { "epoch": 6.068627450980392, "grad_norm": 0.7024005601958995, "learning_rate": 2.1229610811996503e-06, "loss": 0.0803, "loss_nan_ranks": 0, "loss_rank_avg": 0.07796479761600494, "step": 6190, "valid_targets_mean": 1835.6, "valid_targets_min": 684 }, { "epoch": 6.073529411764706, "grad_norm": 0.45302602525860136, "learning_rate": 2.101094632664038e-06, "loss": 0.074, "loss_nan_ranks": 0, "loss_rank_avg": 0.06258255243301392, "step": 6195, "valid_targets_mean": 2617.1, "valid_targets_min": 692 }, { "epoch": 6.078431372549019, "grad_norm": 0.5491802706652505, "learning_rate": 2.0793351350588953e-06, "loss": 0.0817, "loss_nan_ranks": 0, "loss_rank_avg": 0.06602051109075546, "step": 6200, "valid_targets_mean": 2098.4, "valid_targets_min": 716 }, { "epoch": 6.083333333333333, "grad_norm": 0.6543025395149007, "learning_rate": 2.057682718403269e-06, "loss": 0.0804, "loss_nan_ranks": 0, "loss_rank_avg": 0.0722709521651268, "step": 6205, "valid_targets_mean": 1912.4, "valid_targets_min": 509 }, { "epoch": 6.088235294117647, "grad_norm": 0.7439931048575309, "learning_rate": 2.036137512076353e-06, "loss": 0.077, "loss_nan_ranks": 0, "loss_rank_avg": 0.09067465364933014, "step": 6210, "valid_targets_mean": 1648.8, "valid_targets_min": 684 }, { "epoch": 6.0931372549019605, "grad_norm": 0.4120655244655399, "learning_rate": 2.0146996448167443e-06, "loss": 0.0834, "loss_nan_ranks": 0, "loss_rank_avg": 0.051044829189777374, "step": 6215, "valid_targets_mean": 2614.7, "valid_targets_min": 878 }, { "epoch": 6.098039215686274, "grad_norm": 0.5495070413200112, "learning_rate": 1.993369244721659e-06, "loss": 0.0775, "loss_nan_ranks": 0, "loss_rank_avg": 0.0813751369714737, "step": 6220, "valid_targets_mean": 2856.7, "valid_targets_min": 841 }, { "epoch": 6.102941176470588, "grad_norm": 0.5365374420440991, "learning_rate": 1.9721464392461564e-06, "loss": 0.0673, "loss_nan_ranks": 0, "loss_rank_avg": 0.06650418788194656, "step": 6225, "valid_targets_mean": 2202.2, "valid_targets_min": 387 }, { "epoch": 6.107843137254902, "grad_norm": 0.7655061230649243, "learning_rate": 1.951031355202386e-06, "loss": 0.0755, "loss_nan_ranks": 0, "loss_rank_avg": 0.09154021739959717, "step": 6230, "valid_targets_mean": 2112.3, "valid_targets_min": 669 }, { "epoch": 6.112745098039215, "grad_norm": 0.6562468194054213, "learning_rate": 1.930024118758853e-06, "loss": 0.0743, "loss_nan_ranks": 0, "loss_rank_avg": 0.08058568090200424, "step": 6235, "valid_targets_mean": 2077.5, "valid_targets_min": 675 }, { "epoch": 6.117647058823529, "grad_norm": 0.6095516260099263, "learning_rate": 1.909124855439617e-06, "loss": 0.0771, "loss_nan_ranks": 0, "loss_rank_avg": 0.09607884287834167, "step": 6240, "valid_targets_mean": 2540.3, "valid_targets_min": 557 }, { "epoch": 6.122549019607843, "grad_norm": 0.5325419229723192, "learning_rate": 1.8883336901235849e-06, "loss": 0.0753, "loss_nan_ranks": 0, "loss_rank_avg": 0.06588293612003326, "step": 6245, "valid_targets_mean": 2171.6, "valid_targets_min": 611 }, { "epoch": 6.127450980392156, "grad_norm": 0.5276564470921136, "learning_rate": 1.86765074704375e-06, "loss": 0.0795, "loss_nan_ranks": 0, "loss_rank_avg": 0.06421571224927902, "step": 6250, "valid_targets_mean": 2687.8, "valid_targets_min": 610 }, { "epoch": 6.132352941176471, "grad_norm": 0.5575953855054443, "learning_rate": 1.847076149786433e-06, "loss": 0.0696, "loss_nan_ranks": 0, "loss_rank_avg": 0.06234298646450043, "step": 6255, "valid_targets_mean": 2139.8, "valid_targets_min": 799 }, { "epoch": 6.137254901960785, "grad_norm": 0.49891548427790866, "learning_rate": 1.826610021290569e-06, "loss": 0.0716, "loss_nan_ranks": 0, "loss_rank_avg": 0.06937284022569656, "step": 6260, "valid_targets_mean": 2843.1, "valid_targets_min": 681 }, { "epoch": 6.142156862745098, "grad_norm": 0.6665462095056259, "learning_rate": 1.8062524838469574e-06, "loss": 0.0762, "loss_nan_ranks": 0, "loss_rank_avg": 0.08383327722549438, "step": 6265, "valid_targets_mean": 2028.3, "valid_targets_min": 700 }, { "epoch": 6.147058823529412, "grad_norm": 0.6691471419132663, "learning_rate": 1.7860036590975439e-06, "loss": 0.0776, "loss_nan_ranks": 0, "loss_rank_avg": 0.08335322141647339, "step": 6270, "valid_targets_mean": 1612.1, "valid_targets_min": 593 }, { "epoch": 6.151960784313726, "grad_norm": 0.6285610224128853, "learning_rate": 1.7658636680346776e-06, "loss": 0.0681, "loss_nan_ranks": 0, "loss_rank_avg": 0.0754515677690506, "step": 6275, "valid_targets_mean": 2081.2, "valid_targets_min": 784 }, { "epoch": 6.1568627450980395, "grad_norm": 0.572293098108352, "learning_rate": 1.745832631000395e-06, "loss": 0.0739, "loss_nan_ranks": 0, "loss_rank_avg": 0.06705275923013687, "step": 6280, "valid_targets_mean": 2276.4, "valid_targets_min": 927 }, { "epoch": 6.161764705882353, "grad_norm": 0.45124349299968974, "learning_rate": 1.7259106676857084e-06, "loss": 0.0695, "loss_nan_ranks": 0, "loss_rank_avg": 0.0617854930460453, "step": 6285, "valid_targets_mean": 2758.0, "valid_targets_min": 734 }, { "epoch": 6.166666666666667, "grad_norm": 0.628955391242213, "learning_rate": 1.7060978971298791e-06, "loss": 0.071, "loss_nan_ranks": 0, "loss_rank_avg": 0.06164342910051346, "step": 6290, "valid_targets_mean": 2637.5, "valid_targets_min": 958 }, { "epoch": 6.171568627450981, "grad_norm": 0.5621167700542326, "learning_rate": 1.6863944377197162e-06, "loss": 0.0662, "loss_nan_ranks": 0, "loss_rank_avg": 0.06263579428195953, "step": 6295, "valid_targets_mean": 2171.8, "valid_targets_min": 703 }, { "epoch": 6.176470588235294, "grad_norm": 0.5736760579865152, "learning_rate": 1.666800407188862e-06, "loss": 0.0831, "loss_nan_ranks": 0, "loss_rank_avg": 0.11034345626831055, "step": 6300, "valid_targets_mean": 2621.9, "valid_targets_min": 811 }, { "epoch": 6.181372549019608, "grad_norm": 0.5192244127522521, "learning_rate": 1.6473159226170898e-06, "loss": 0.0739, "loss_nan_ranks": 0, "loss_rank_avg": 0.06342881917953491, "step": 6305, "valid_targets_mean": 2492.2, "valid_targets_min": 760 }, { "epoch": 6.186274509803922, "grad_norm": 0.5645893985791716, "learning_rate": 1.6279411004296042e-06, "loss": 0.0741, "loss_nan_ranks": 0, "loss_rank_avg": 0.07318265736103058, "step": 6310, "valid_targets_mean": 2655.1, "valid_targets_min": 770 }, { "epoch": 6.1911764705882355, "grad_norm": 0.4889759389855647, "learning_rate": 1.6086760563963478e-06, "loss": 0.0726, "loss_nan_ranks": 0, "loss_rank_avg": 0.068635493516922, "step": 6315, "valid_targets_mean": 2335.9, "valid_targets_min": 750 }, { "epoch": 6.196078431372549, "grad_norm": 0.4874921438984983, "learning_rate": 1.5895209056313166e-06, "loss": 0.068, "loss_nan_ranks": 0, "loss_rank_avg": 0.06178947165608406, "step": 6320, "valid_targets_mean": 2636.8, "valid_targets_min": 765 }, { "epoch": 6.200980392156863, "grad_norm": 0.4891287624222315, "learning_rate": 1.5704757625918454e-06, "loss": 0.0691, "loss_nan_ranks": 0, "loss_rank_avg": 0.06538208574056625, "step": 6325, "valid_targets_mean": 3014.9, "valid_targets_min": 1074 }, { "epoch": 6.205882352941177, "grad_norm": 0.5999748822792935, "learning_rate": 1.5515407410779636e-06, "loss": 0.0717, "loss_nan_ranks": 0, "loss_rank_avg": 0.08500402420759201, "step": 6330, "valid_targets_mean": 2314.1, "valid_targets_min": 859 }, { "epoch": 6.21078431372549, "grad_norm": 0.49689354235234345, "learning_rate": 1.5327159542316784e-06, "loss": 0.0705, "loss_nan_ranks": 0, "loss_rank_avg": 0.07124780118465424, "step": 6335, "valid_targets_mean": 2509.1, "valid_targets_min": 775 }, { "epoch": 6.215686274509804, "grad_norm": 0.4661213868566254, "learning_rate": 1.5140015145363163e-06, "loss": 0.0822, "loss_nan_ranks": 0, "loss_rank_avg": 0.05759389325976372, "step": 6340, "valid_targets_mean": 2664.4, "valid_targets_min": 647 }, { "epoch": 6.220588235294118, "grad_norm": 0.6441063247249776, "learning_rate": 1.4953975338158545e-06, "loss": 0.0678, "loss_nan_ranks": 0, "loss_rank_avg": 0.059634268283843994, "step": 6345, "valid_targets_mean": 1688.2, "valid_targets_min": 683 }, { "epoch": 6.2254901960784315, "grad_norm": 0.6443076433004111, "learning_rate": 1.4769041232342464e-06, "loss": 0.0795, "loss_nan_ranks": 0, "loss_rank_avg": 0.10399801284074783, "step": 6350, "valid_targets_mean": 2111.4, "valid_targets_min": 830 }, { "epoch": 6.230392156862745, "grad_norm": 0.5315458798893512, "learning_rate": 1.458521393294754e-06, "loss": 0.0704, "loss_nan_ranks": 0, "loss_rank_avg": 0.061626315116882324, "step": 6355, "valid_targets_mean": 2154.8, "valid_targets_min": 734 }, { "epoch": 6.235294117647059, "grad_norm": 0.5879437478837025, "learning_rate": 1.4402494538392975e-06, "loss": 0.0736, "loss_nan_ranks": 0, "loss_rank_avg": 0.06649856269359589, "step": 6360, "valid_targets_mean": 1821.4, "valid_targets_min": 864 }, { "epoch": 6.240196078431373, "grad_norm": 0.4657404472137014, "learning_rate": 1.4220884140477841e-06, "loss": 0.0663, "loss_nan_ranks": 0, "loss_rank_avg": 0.05414208024740219, "step": 6365, "valid_targets_mean": 2473.9, "valid_targets_min": 719 }, { "epoch": 6.245098039215686, "grad_norm": 0.5742416534799186, "learning_rate": 1.4040383824374738e-06, "loss": 0.0734, "loss_nan_ranks": 0, "loss_rank_avg": 0.07009696960449219, "step": 6370, "valid_targets_mean": 2067.3, "valid_targets_min": 713 }, { "epoch": 6.25, "grad_norm": 0.6270014269516866, "learning_rate": 1.386099466862314e-06, "loss": 0.0792, "loss_nan_ranks": 0, "loss_rank_avg": 0.07653535902500153, "step": 6375, "valid_targets_mean": 1960.4, "valid_targets_min": 722 }, { "epoch": 6.254901960784314, "grad_norm": 0.566807267759067, "learning_rate": 1.3682717745123154e-06, "loss": 0.0733, "loss_nan_ranks": 0, "loss_rank_avg": 0.08027191460132599, "step": 6380, "valid_targets_mean": 2312.1, "valid_targets_min": 835 }, { "epoch": 6.259803921568627, "grad_norm": 0.5502588217275843, "learning_rate": 1.3505554119128861e-06, "loss": 0.071, "loss_nan_ranks": 0, "loss_rank_avg": 0.0736890435218811, "step": 6385, "valid_targets_mean": 1971.5, "valid_targets_min": 723 }, { "epoch": 6.264705882352941, "grad_norm": 0.5131370822262248, "learning_rate": 1.3329504849242114e-06, "loss": 0.0679, "loss_nan_ranks": 0, "loss_rank_avg": 0.06139993295073509, "step": 6390, "valid_targets_mean": 2139.0, "valid_targets_min": 697 }, { "epoch": 6.269607843137255, "grad_norm": 0.6748155034034762, "learning_rate": 1.3154570987406202e-06, "loss": 0.0777, "loss_nan_ranks": 0, "loss_rank_avg": 0.06903311610221863, "step": 6395, "valid_targets_mean": 1693.1, "valid_targets_min": 629 }, { "epoch": 6.2745098039215685, "grad_norm": 0.5579527424856937, "learning_rate": 1.2980753578899563e-06, "loss": 0.0733, "loss_nan_ranks": 0, "loss_rank_avg": 0.07270924001932144, "step": 6400, "valid_targets_mean": 2242.1, "valid_targets_min": 526 }, { "epoch": 6.279411764705882, "grad_norm": 0.6649096720503214, "learning_rate": 1.2808053662329422e-06, "loss": 0.0693, "loss_nan_ranks": 0, "loss_rank_avg": 0.07944712042808533, "step": 6405, "valid_targets_mean": 1749.5, "valid_targets_min": 634 }, { "epoch": 6.284313725490196, "grad_norm": 0.4422205331028691, "learning_rate": 1.2636472269625833e-06, "loss": 0.0733, "loss_nan_ranks": 0, "loss_rank_avg": 0.05389444902539253, "step": 6410, "valid_targets_mean": 2626.2, "valid_targets_min": 539 }, { "epoch": 6.28921568627451, "grad_norm": 0.5066639539553149, "learning_rate": 1.2466010426035214e-06, "loss": 0.0794, "loss_nan_ranks": 0, "loss_rank_avg": 0.06264401972293854, "step": 6415, "valid_targets_mean": 2138.4, "valid_targets_min": 655 }, { "epoch": 6.294117647058823, "grad_norm": 0.7673642339162735, "learning_rate": 1.2296669150114381e-06, "loss": 0.0781, "loss_nan_ranks": 0, "loss_rank_avg": 0.08284231275320053, "step": 6420, "valid_targets_mean": 1619.0, "valid_targets_min": 826 }, { "epoch": 6.299019607843137, "grad_norm": 0.5811878185494508, "learning_rate": 1.2128449453724556e-06, "loss": 0.0738, "loss_nan_ranks": 0, "loss_rank_avg": 0.07080619782209396, "step": 6425, "valid_targets_mean": 2293.2, "valid_targets_min": 671 }, { "epoch": 6.303921568627451, "grad_norm": 0.4888633277532672, "learning_rate": 1.1961352342025135e-06, "loss": 0.066, "loss_nan_ranks": 0, "loss_rank_avg": 0.05815008282661438, "step": 6430, "valid_targets_mean": 2700.2, "valid_targets_min": 712 }, { "epoch": 6.3088235294117645, "grad_norm": 0.6944638611542142, "learning_rate": 1.1795378813467727e-06, "loss": 0.075, "loss_nan_ranks": 0, "loss_rank_avg": 0.08229673653841019, "step": 6435, "valid_targets_mean": 1831.1, "valid_targets_min": 757 }, { "epoch": 6.313725490196078, "grad_norm": 0.5615966039821809, "learning_rate": 1.1630529859790318e-06, "loss": 0.0926, "loss_nan_ranks": 0, "loss_rank_avg": 0.061017826199531555, "step": 6440, "valid_targets_mean": 2502.1, "valid_targets_min": 657 }, { "epoch": 6.318627450980392, "grad_norm": 0.6763422320122082, "learning_rate": 1.1466806466011127e-06, "loss": 0.0882, "loss_nan_ranks": 0, "loss_rank_avg": 0.08773969858884811, "step": 6445, "valid_targets_mean": 1737.6, "valid_targets_min": 357 }, { "epoch": 6.323529411764706, "grad_norm": 0.5777497347614018, "learning_rate": 1.1304209610422933e-06, "loss": 0.0675, "loss_nan_ranks": 0, "loss_rank_avg": 0.06521066278219223, "step": 6450, "valid_targets_mean": 2161.2, "valid_targets_min": 522 }, { "epoch": 6.328431372549019, "grad_norm": 0.5679910722880794, "learning_rate": 1.1142740264587104e-06, "loss": 0.0654, "loss_nan_ranks": 0, "loss_rank_avg": 0.05448193848133087, "step": 6455, "valid_targets_mean": 2527.9, "valid_targets_min": 710 }, { "epoch": 6.333333333333333, "grad_norm": 0.509042676333728, "learning_rate": 1.0982399393327813e-06, "loss": 0.0736, "loss_nan_ranks": 0, "loss_rank_avg": 0.07492335885763168, "step": 6460, "valid_targets_mean": 2692.8, "valid_targets_min": 612 }, { "epoch": 6.338235294117647, "grad_norm": 0.6072611147130427, "learning_rate": 1.0823187954726322e-06, "loss": 0.0786, "loss_nan_ranks": 0, "loss_rank_avg": 0.07300375401973724, "step": 6465, "valid_targets_mean": 2096.9, "valid_targets_min": 592 }, { "epoch": 6.3431372549019605, "grad_norm": 1.5730165234423314, "learning_rate": 1.0665106900115174e-06, "loss": 0.0706, "loss_nan_ranks": 0, "loss_rank_avg": 0.07045087218284607, "step": 6470, "valid_targets_mean": 2194.9, "valid_targets_min": 677 }, { "epoch": 6.348039215686274, "grad_norm": 0.5320050036216825, "learning_rate": 1.0508157174072563e-06, "loss": 0.072, "loss_nan_ranks": 0, "loss_rank_avg": 0.06787510216236115, "step": 6475, "valid_targets_mean": 2446.6, "valid_targets_min": 683 }, { "epoch": 6.352941176470588, "grad_norm": 0.597125652728074, "learning_rate": 1.0352339714416715e-06, "loss": 0.0792, "loss_nan_ranks": 0, "loss_rank_avg": 0.08531296253204346, "step": 6480, "valid_targets_mean": 2121.9, "valid_targets_min": 682 }, { "epoch": 6.357843137254902, "grad_norm": 0.7163258924570245, "learning_rate": 1.0197655452200172e-06, "loss": 0.0916, "loss_nan_ranks": 0, "loss_rank_avg": 0.08984912186861038, "step": 6485, "valid_targets_mean": 1824.8, "valid_targets_min": 641 }, { "epoch": 6.362745098039215, "grad_norm": 0.5664824321655607, "learning_rate": 1.0044105311704455e-06, "loss": 0.0762, "loss_nan_ranks": 0, "loss_rank_avg": 0.07289232313632965, "step": 6490, "valid_targets_mean": 2176.4, "valid_targets_min": 748 }, { "epoch": 6.367647058823529, "grad_norm": 0.6202502575591109, "learning_rate": 9.891690210434235e-07, "loss": 0.0756, "loss_nan_ranks": 0, "loss_rank_avg": 0.07717530429363251, "step": 6495, "valid_targets_mean": 1831.9, "valid_targets_min": 616 }, { "epoch": 6.372549019607844, "grad_norm": 0.5595520685931048, "learning_rate": 9.740411059112031e-07, "loss": 0.0996, "loss_nan_ranks": 0, "loss_rank_avg": 0.06521070003509521, "step": 6500, "valid_targets_mean": 1985.8, "valid_targets_min": 638 }, { "epoch": 6.377450980392156, "grad_norm": 0.6126975781808517, "learning_rate": 9.590268761672838e-07, "loss": 0.0713, "loss_nan_ranks": 0, "loss_rank_avg": 0.08089681714773178, "step": 6505, "valid_targets_mean": 1971.1, "valid_targets_min": 680 }, { "epoch": 6.382352941176471, "grad_norm": 0.5778356925814528, "learning_rate": 9.441264215258595e-07, "loss": 0.0798, "loss_nan_ranks": 0, "loss_rank_avg": 0.07549488544464111, "step": 6510, "valid_targets_mean": 1980.7, "valid_targets_min": 619 }, { "epoch": 6.387254901960785, "grad_norm": 0.5593674597722778, "learning_rate": 9.293398310212831e-07, "loss": 0.0781, "loss_nan_ranks": 0, "loss_rank_avg": 0.0599190816283226, "step": 6515, "valid_targets_mean": 2093.8, "valid_targets_min": 675 }, { "epoch": 6.392156862745098, "grad_norm": 0.6399167415852633, "learning_rate": 9.146671930075412e-07, "loss": 0.0792, "loss_nan_ranks": 0, "loss_rank_avg": 0.10022995620965958, "step": 6520, "valid_targets_mean": 1830.9, "valid_targets_min": 727 }, { "epoch": 6.397058823529412, "grad_norm": 0.6140652768928999, "learning_rate": 9.00108595157716e-07, "loss": 0.0713, "loss_nan_ranks": 0, "loss_rank_avg": 0.07537797093391418, "step": 6525, "valid_targets_mean": 2011.1, "valid_targets_min": 698 }, { "epoch": 6.401960784313726, "grad_norm": 0.7285222625014569, "learning_rate": 8.856641244634767e-07, "loss": 0.0764, "loss_nan_ranks": 0, "loss_rank_avg": 0.09332075715065002, "step": 6530, "valid_targets_mean": 1789.8, "valid_targets_min": 930 }, { "epoch": 6.4068627450980395, "grad_norm": 0.542847290160346, "learning_rate": 8.713338672345451e-07, "loss": 0.0709, "loss_nan_ranks": 0, "loss_rank_avg": 0.06750819832086563, "step": 6535, "valid_targets_mean": 2273.8, "valid_targets_min": 731 }, { "epoch": 6.411764705882353, "grad_norm": 0.5668560043361112, "learning_rate": 8.571179090981885e-07, "loss": 0.0751, "loss_nan_ranks": 0, "loss_rank_avg": 0.07465088367462158, "step": 6540, "valid_targets_mean": 2430.4, "valid_targets_min": 847 }, { "epoch": 6.416666666666667, "grad_norm": 0.6375632023114209, "learning_rate": 8.430163349987075e-07, "loss": 0.0851, "loss_nan_ranks": 0, "loss_rank_avg": 0.07439914345741272, "step": 6545, "valid_targets_mean": 1622.2, "valid_targets_min": 800 }, { "epoch": 6.421568627450981, "grad_norm": 0.5292873557345532, "learning_rate": 8.290292291969226e-07, "loss": 0.0824, "loss_nan_ranks": 0, "loss_rank_avg": 0.0702093094587326, "step": 6550, "valid_targets_mean": 2615.8, "valid_targets_min": 1126 }, { "epoch": 6.426470588235294, "grad_norm": 0.5216899096730249, "learning_rate": 8.151566752696704e-07, "loss": 0.0776, "loss_nan_ranks": 0, "loss_rank_avg": 0.08521877229213715, "step": 6555, "valid_targets_mean": 2622.1, "valid_targets_min": 564 }, { "epoch": 6.431372549019608, "grad_norm": 0.6567140287942022, "learning_rate": 8.013987561093217e-07, "loss": 0.0795, "loss_nan_ranks": 0, "loss_rank_avg": 0.07485121488571167, "step": 6560, "valid_targets_mean": 1729.0, "valid_targets_min": 513 }, { "epoch": 6.436274509803922, "grad_norm": 0.601647391705643, "learning_rate": 7.877555539232551e-07, "loss": 0.0777, "loss_nan_ranks": 0, "loss_rank_avg": 0.08071115612983704, "step": 6565, "valid_targets_mean": 2257.5, "valid_targets_min": 745 }, { "epoch": 6.4411764705882355, "grad_norm": 0.562631688655108, "learning_rate": 7.742271502333998e-07, "loss": 0.0738, "loss_nan_ranks": 0, "loss_rank_avg": 0.09080608189105988, "step": 6570, "valid_targets_mean": 2499.1, "valid_targets_min": 698 }, { "epoch": 6.446078431372549, "grad_norm": 0.5329236768943743, "learning_rate": 7.608136258757248e-07, "loss": 0.0748, "loss_nan_ranks": 0, "loss_rank_avg": 0.06047336757183075, "step": 6575, "valid_targets_mean": 2170.6, "valid_targets_min": 591 }, { "epoch": 6.450980392156863, "grad_norm": 0.5275499144973336, "learning_rate": 7.475150609997595e-07, "loss": 0.0766, "loss_nan_ranks": 0, "loss_rank_avg": 0.0709349513053894, "step": 6580, "valid_targets_mean": 2400.8, "valid_targets_min": 648 }, { "epoch": 6.455882352941177, "grad_norm": 0.5101600270500972, "learning_rate": 7.343315350681246e-07, "loss": 0.0809, "loss_nan_ranks": 0, "loss_rank_avg": 0.07443030178546906, "step": 6585, "valid_targets_mean": 2751.6, "valid_targets_min": 1062 }, { "epoch": 6.46078431372549, "grad_norm": 0.592728343239668, "learning_rate": 7.212631268560466e-07, "loss": 0.0737, "loss_nan_ranks": 0, "loss_rank_avg": 0.06636979430913925, "step": 6590, "valid_targets_mean": 2612.5, "valid_targets_min": 809 }, { "epoch": 6.465686274509804, "grad_norm": 0.5073605489538774, "learning_rate": 7.083099144508976e-07, "loss": 0.07, "loss_nan_ranks": 0, "loss_rank_avg": 0.06348920613527298, "step": 6595, "valid_targets_mean": 2609.2, "valid_targets_min": 692 }, { "epoch": 6.470588235294118, "grad_norm": 0.4888244064732885, "learning_rate": 6.95471975251718e-07, "loss": 0.0676, "loss_nan_ranks": 0, "loss_rank_avg": 0.07031454145908356, "step": 6600, "valid_targets_mean": 2671.5, "valid_targets_min": 803 }, { "epoch": 6.4754901960784315, "grad_norm": 0.48986840780382246, "learning_rate": 6.827493859687572e-07, "loss": 0.0685, "loss_nan_ranks": 0, "loss_rank_avg": 0.05794578790664673, "step": 6605, "valid_targets_mean": 2573.7, "valid_targets_min": 864 }, { "epoch": 6.480392156862745, "grad_norm": 0.5823150173486473, "learning_rate": 6.701422226230225e-07, "loss": 0.0721, "loss_nan_ranks": 0, "loss_rank_avg": 0.0833081379532814, "step": 6610, "valid_targets_mean": 2362.8, "valid_targets_min": 610 }, { "epoch": 6.485294117647059, "grad_norm": 0.5286454997343215, "learning_rate": 6.57650560545815e-07, "loss": 0.0744, "loss_nan_ranks": 0, "loss_rank_avg": 0.06765834242105484, "step": 6615, "valid_targets_mean": 2444.2, "valid_targets_min": 637 }, { "epoch": 6.490196078431373, "grad_norm": 0.6399951864881893, "learning_rate": 6.452744743782835e-07, "loss": 0.0733, "loss_nan_ranks": 0, "loss_rank_avg": 0.08042435348033905, "step": 6620, "valid_targets_mean": 1860.4, "valid_targets_min": 705 }, { "epoch": 6.495098039215686, "grad_norm": 0.5739546748120099, "learning_rate": 6.330140380709826e-07, "loss": 0.0712, "loss_nan_ranks": 0, "loss_rank_avg": 0.07454740256071091, "step": 6625, "valid_targets_mean": 2359.0, "valid_targets_min": 567 }, { "epoch": 6.5, "grad_norm": 0.5924429822824983, "learning_rate": 6.208693248834241e-07, "loss": 0.0828, "loss_nan_ranks": 0, "loss_rank_avg": 0.10847502946853638, "step": 6630, "valid_targets_mean": 1880.0, "valid_targets_min": 594 }, { "epoch": 6.504901960784314, "grad_norm": 0.618365600846528, "learning_rate": 6.088404073836374e-07, "loss": 0.0875, "loss_nan_ranks": 0, "loss_rank_avg": 0.07501372694969177, "step": 6635, "valid_targets_mean": 2034.2, "valid_targets_min": 642 }, { "epoch": 6.509803921568627, "grad_norm": 0.7514817551450208, "learning_rate": 5.969273574477519e-07, "loss": 0.0748, "loss_nan_ranks": 0, "loss_rank_avg": 0.09385409951210022, "step": 6640, "valid_targets_mean": 1769.9, "valid_targets_min": 704 }, { "epoch": 6.514705882352941, "grad_norm": 0.6156340459167169, "learning_rate": 5.851302462595465e-07, "loss": 0.0747, "loss_nan_ranks": 0, "loss_rank_avg": 0.06911460310220718, "step": 6645, "valid_targets_mean": 2101.6, "valid_targets_min": 605 }, { "epoch": 6.519607843137255, "grad_norm": 0.6492120191653313, "learning_rate": 5.734491443100342e-07, "loss": 0.0689, "loss_nan_ranks": 0, "loss_rank_avg": 0.07696253806352615, "step": 6650, "valid_targets_mean": 1681.4, "valid_targets_min": 597 }, { "epoch": 6.5245098039215685, "grad_norm": 0.6462025577850812, "learning_rate": 5.618841213970472e-07, "loss": 0.0787, "loss_nan_ranks": 0, "loss_rank_avg": 0.08429364860057831, "step": 6655, "valid_targets_mean": 1914.6, "valid_targets_min": 613 }, { "epoch": 6.529411764705882, "grad_norm": 0.6186638590533011, "learning_rate": 5.504352466248097e-07, "loss": 0.0748, "loss_nan_ranks": 0, "loss_rank_avg": 0.08027391880750656, "step": 6660, "valid_targets_mean": 1882.0, "valid_targets_min": 719 }, { "epoch": 6.534313725490196, "grad_norm": 0.5970585117284097, "learning_rate": 5.391025884035239e-07, "loss": 0.0735, "loss_nan_ranks": 0, "loss_rank_avg": 0.07223717123270035, "step": 6665, "valid_targets_mean": 1795.7, "valid_targets_min": 614 }, { "epoch": 6.53921568627451, "grad_norm": 0.6393704732605341, "learning_rate": 5.278862144489716e-07, "loss": 0.0807, "loss_nan_ranks": 0, "loss_rank_avg": 0.07152163982391357, "step": 6670, "valid_targets_mean": 2575.4, "valid_targets_min": 741 }, { "epoch": 6.544117647058823, "grad_norm": 0.6110025268089397, "learning_rate": 5.16786191782106e-07, "loss": 0.0689, "loss_nan_ranks": 0, "loss_rank_avg": 0.07727265357971191, "step": 6675, "valid_targets_mean": 2013.5, "valid_targets_min": 632 }, { "epoch": 6.549019607843137, "grad_norm": 0.6890547681596108, "learning_rate": 5.058025867286387e-07, "loss": 0.076, "loss_nan_ranks": 0, "loss_rank_avg": 0.08940169960260391, "step": 6680, "valid_targets_mean": 1832.7, "valid_targets_min": 636 }, { "epoch": 6.553921568627451, "grad_norm": 0.526821095063165, "learning_rate": 4.949354649186666e-07, "loss": 0.0726, "loss_nan_ranks": 0, "loss_rank_avg": 0.09530247747898102, "step": 6685, "valid_targets_mean": 2345.0, "valid_targets_min": 468 }, { "epoch": 6.5588235294117645, "grad_norm": 0.5638933046634943, "learning_rate": 4.841848912862568e-07, "loss": 0.0842, "loss_nan_ranks": 0, "loss_rank_avg": 0.06429076939821243, "step": 6690, "valid_targets_mean": 2157.4, "valid_targets_min": 962 }, { "epoch": 6.563725490196078, "grad_norm": 0.7151405526912445, "learning_rate": 4.7355093006907325e-07, "loss": 0.0837, "loss_nan_ranks": 0, "loss_rank_avg": 0.06609296798706055, "step": 6695, "valid_targets_mean": 1982.6, "valid_targets_min": 744 }, { "epoch": 6.568627450980392, "grad_norm": 0.5698233570409097, "learning_rate": 4.630336448079864e-07, "loss": 0.0698, "loss_nan_ranks": 0, "loss_rank_avg": 0.07055316120386124, "step": 6700, "valid_targets_mean": 2221.2, "valid_targets_min": 700 }, { "epoch": 6.573529411764706, "grad_norm": 0.6362640401880392, "learning_rate": 4.5263309834669753e-07, "loss": 0.0728, "loss_nan_ranks": 0, "loss_rank_avg": 0.07047757506370544, "step": 6705, "valid_targets_mean": 2399.4, "valid_targets_min": 651 }, { "epoch": 6.578431372549019, "grad_norm": 0.624490274090889, "learning_rate": 4.423493528313638e-07, "loss": 0.0738, "loss_nan_ranks": 0, "loss_rank_avg": 0.07188694179058075, "step": 6710, "valid_targets_mean": 2270.2, "valid_targets_min": 602 }, { "epoch": 6.583333333333333, "grad_norm": 0.6588545635409063, "learning_rate": 4.3218246971021394e-07, "loss": 0.0763, "loss_nan_ranks": 0, "loss_rank_avg": 0.10030744224786758, "step": 6715, "valid_targets_mean": 1812.2, "valid_targets_min": 613 }, { "epoch": 6.588235294117647, "grad_norm": 0.6143564999883911, "learning_rate": 4.2213250973319964e-07, "loss": 0.0759, "loss_nan_ranks": 0, "loss_rank_avg": 0.1096772700548172, "step": 6720, "valid_targets_mean": 2134.1, "valid_targets_min": 700 }, { "epoch": 6.5931372549019605, "grad_norm": 0.6373064405570183, "learning_rate": 4.121995329516293e-07, "loss": 0.0757, "loss_nan_ranks": 0, "loss_rank_avg": 0.075977623462677, "step": 6725, "valid_targets_mean": 1834.6, "valid_targets_min": 598 }, { "epoch": 6.598039215686274, "grad_norm": 0.5775137974021963, "learning_rate": 4.0238359871779045e-07, "loss": 0.0763, "loss_nan_ranks": 0, "loss_rank_avg": 0.07746519148349762, "step": 6730, "valid_targets_mean": 2040.2, "valid_targets_min": 729 }, { "epoch": 6.602941176470588, "grad_norm": 0.6154801243115351, "learning_rate": 3.926847656846189e-07, "loss": 0.0811, "loss_nan_ranks": 0, "loss_rank_avg": 0.07492032647132874, "step": 6735, "valid_targets_mean": 1690.9, "valid_targets_min": 516 }, { "epoch": 6.607843137254902, "grad_norm": 0.5285933942636529, "learning_rate": 3.831030918053369e-07, "loss": 0.068, "loss_nan_ranks": 0, "loss_rank_avg": 0.06620896607637405, "step": 6740, "valid_targets_mean": 2294.8, "valid_targets_min": 955 }, { "epoch": 6.612745098039216, "grad_norm": 0.5893823543019614, "learning_rate": 3.736386343331044e-07, "loss": 0.0818, "loss_nan_ranks": 0, "loss_rank_avg": 0.09671109914779663, "step": 6745, "valid_targets_mean": 2318.4, "valid_targets_min": 853 }, { "epoch": 6.617647058823529, "grad_norm": 0.5462674467458982, "learning_rate": 3.64291449820684e-07, "loss": 0.0748, "loss_nan_ranks": 0, "loss_rank_avg": 0.061107758432626724, "step": 6750, "valid_targets_mean": 2305.8, "valid_targets_min": 634 }, { "epoch": 6.622549019607844, "grad_norm": 0.6074116112610899, "learning_rate": 3.5506159412010076e-07, "loss": 0.0731, "loss_nan_ranks": 0, "loss_rank_avg": 0.06659223139286041, "step": 6755, "valid_targets_mean": 2211.5, "valid_targets_min": 756 }, { "epoch": 6.627450980392156, "grad_norm": 0.5632099448887126, "learning_rate": 3.4594912238230307e-07, "loss": 0.0715, "loss_nan_ranks": 0, "loss_rank_avg": 0.0652645155787468, "step": 6760, "valid_targets_mean": 2370.2, "valid_targets_min": 502 }, { "epoch": 6.632352941176471, "grad_norm": 0.4944591686617319, "learning_rate": 3.3695408905684456e-07, "loss": 0.0817, "loss_nan_ranks": 0, "loss_rank_avg": 0.054533012211322784, "step": 6765, "valid_targets_mean": 2398.9, "valid_targets_min": 649 }, { "epoch": 6.637254901960784, "grad_norm": 0.5915700018309602, "learning_rate": 3.280765478915449e-07, "loss": 0.0704, "loss_nan_ranks": 0, "loss_rank_avg": 0.07783752679824829, "step": 6770, "valid_targets_mean": 2240.8, "valid_targets_min": 682 }, { "epoch": 6.642156862745098, "grad_norm": 0.49047093994848395, "learning_rate": 3.193165519321739e-07, "loss": 0.0704, "loss_nan_ranks": 0, "loss_rank_avg": 0.0692506730556488, "step": 6775, "valid_targets_mean": 2598.6, "valid_targets_min": 1083 }, { "epoch": 6.647058823529412, "grad_norm": 0.5773913930901008, "learning_rate": 3.1067415352214583e-07, "loss": 0.0798, "loss_nan_ranks": 0, "loss_rank_avg": 0.07195072621107101, "step": 6780, "valid_targets_mean": 2246.1, "valid_targets_min": 654 }, { "epoch": 6.651960784313726, "grad_norm": 0.6854796204536878, "learning_rate": 3.0214940430218996e-07, "loss": 0.078, "loss_nan_ranks": 0, "loss_rank_avg": 0.08964002132415771, "step": 6785, "valid_targets_mean": 1977.6, "valid_targets_min": 636 }, { "epoch": 6.6568627450980395, "grad_norm": 0.589375571510179, "learning_rate": 2.9374235521005157e-07, "loss": 0.0697, "loss_nan_ranks": 0, "loss_rank_avg": 0.0778995007276535, "step": 6790, "valid_targets_mean": 2066.0, "valid_targets_min": 659 }, { "epoch": 6.661764705882353, "grad_norm": 0.5131243023890815, "learning_rate": 2.8545305648018274e-07, "loss": 0.0691, "loss_nan_ranks": 0, "loss_rank_avg": 0.0669882595539093, "step": 6795, "valid_targets_mean": 2585.2, "valid_targets_min": 910 }, { "epoch": 6.666666666666667, "grad_norm": 0.57976654440454, "learning_rate": 2.772815576434429e-07, "loss": 0.0732, "loss_nan_ranks": 0, "loss_rank_avg": 0.07049468159675598, "step": 6800, "valid_targets_mean": 2076.2, "valid_targets_min": 923 }, { "epoch": 6.671568627450981, "grad_norm": 0.6333760051695486, "learning_rate": 2.6922790752681004e-07, "loss": 0.0723, "loss_nan_ranks": 0, "loss_rank_avg": 0.08557892590761185, "step": 6805, "valid_targets_mean": 2019.9, "valid_targets_min": 615 }, { "epoch": 6.676470588235294, "grad_norm": 0.5500510919093051, "learning_rate": 2.6129215425307884e-07, "loss": 0.0748, "loss_nan_ranks": 0, "loss_rank_avg": 0.07296749949455261, "step": 6810, "valid_targets_mean": 2380.2, "valid_targets_min": 961 }, { "epoch": 6.681372549019608, "grad_norm": 0.5284267171327073, "learning_rate": 2.534743452405786e-07, "loss": 0.0783, "loss_nan_ranks": 0, "loss_rank_avg": 0.07741603255271912, "step": 6815, "valid_targets_mean": 2762.5, "valid_targets_min": 821 }, { "epoch": 6.686274509803922, "grad_norm": 0.5208764125308674, "learning_rate": 2.4577452720289554e-07, "loss": 0.073, "loss_nan_ranks": 0, "loss_rank_avg": 0.06157371401786804, "step": 6820, "valid_targets_mean": 2351.6, "valid_targets_min": 744 }, { "epoch": 6.6911764705882355, "grad_norm": 0.7033957323624661, "learning_rate": 2.3819274614857114e-07, "loss": 0.0731, "loss_nan_ranks": 0, "loss_rank_avg": 0.06887654215097427, "step": 6825, "valid_targets_mean": 1957.0, "valid_targets_min": 717 }, { "epoch": 6.696078431372549, "grad_norm": 0.5497440299921376, "learning_rate": 2.3072904738085766e-07, "loss": 0.0799, "loss_nan_ranks": 0, "loss_rank_avg": 0.06968720257282257, "step": 6830, "valid_targets_mean": 2151.9, "valid_targets_min": 649 }, { "epoch": 6.700980392156863, "grad_norm": 0.5027531856286584, "learning_rate": 2.2338347549742956e-07, "loss": 0.0729, "loss_nan_ranks": 0, "loss_rank_avg": 0.07394878566265106, "step": 6835, "valid_targets_mean": 2225.8, "valid_targets_min": 824 }, { "epoch": 6.705882352941177, "grad_norm": 0.4273091436307248, "learning_rate": 2.1615607439011698e-07, "loss": 0.0653, "loss_nan_ranks": 0, "loss_rank_avg": 0.05667303502559662, "step": 6840, "valid_targets_mean": 3133.9, "valid_targets_min": 852 }, { "epoch": 6.71078431372549, "grad_norm": 0.5815477377429077, "learning_rate": 2.0904688724464828e-07, "loss": 0.0845, "loss_nan_ranks": 0, "loss_rank_avg": 0.08845975250005722, "step": 6845, "valid_targets_mean": 2000.3, "valid_targets_min": 549 }, { "epoch": 6.715686274509804, "grad_norm": 1.2981100793881648, "learning_rate": 2.0205595654039012e-07, "loss": 0.0655, "loss_nan_ranks": 0, "loss_rank_avg": 0.06515184044837952, "step": 6850, "valid_targets_mean": 2063.4, "valid_targets_min": 1143 }, { "epoch": 6.720588235294118, "grad_norm": 0.6841758509817507, "learning_rate": 1.9518332405009887e-07, "loss": 0.0798, "loss_nan_ranks": 0, "loss_rank_avg": 0.07749398797750473, "step": 6855, "valid_targets_mean": 1602.4, "valid_targets_min": 732 }, { "epoch": 6.7254901960784315, "grad_norm": 0.4924527381520498, "learning_rate": 1.8842903083965857e-07, "loss": 0.0694, "loss_nan_ranks": 0, "loss_rank_avg": 0.06516847014427185, "step": 6860, "valid_targets_mean": 2914.9, "valid_targets_min": 591 }, { "epoch": 6.730392156862745, "grad_norm": 0.6303188289451982, "learning_rate": 1.8179311726784777e-07, "loss": 0.0757, "loss_nan_ranks": 0, "loss_rank_avg": 0.07469521462917328, "step": 6865, "valid_targets_mean": 2210.1, "valid_targets_min": 811 }, { "epoch": 6.735294117647059, "grad_norm": 0.8053913454744731, "learning_rate": 1.7527562298609524e-07, "loss": 0.0666, "loss_nan_ranks": 0, "loss_rank_avg": 0.06828522682189941, "step": 6870, "valid_targets_mean": 1897.0, "valid_targets_min": 582 }, { "epoch": 6.740196078431373, "grad_norm": 0.5568843332211943, "learning_rate": 1.6887658693823583e-07, "loss": 0.0678, "loss_nan_ranks": 0, "loss_rank_avg": 0.07886748015880585, "step": 6875, "valid_targets_mean": 2553.4, "valid_targets_min": 916 }, { "epoch": 6.745098039215686, "grad_norm": 0.691870344299773, "learning_rate": 1.6259604736029057e-07, "loss": 0.0666, "loss_nan_ranks": 0, "loss_rank_avg": 0.0789848044514656, "step": 6880, "valid_targets_mean": 1709.3, "valid_targets_min": 664 }, { "epoch": 6.75, "grad_norm": 0.5896811602843932, "learning_rate": 1.564340417802246e-07, "loss": 0.0717, "loss_nan_ranks": 0, "loss_rank_avg": 0.07563844323158264, "step": 6885, "valid_targets_mean": 2423.1, "valid_targets_min": 424 }, { "epoch": 6.754901960784314, "grad_norm": 0.5474320570604836, "learning_rate": 1.503906070177341e-07, "loss": 0.0947, "loss_nan_ranks": 0, "loss_rank_avg": 0.08105449378490448, "step": 6890, "valid_targets_mean": 2342.6, "valid_targets_min": 791 }, { "epoch": 6.759803921568627, "grad_norm": 0.6121453772298724, "learning_rate": 1.4446577918401982e-07, "loss": 0.073, "loss_nan_ranks": 0, "loss_rank_avg": 0.07447556406259537, "step": 6895, "valid_targets_mean": 2341.2, "valid_targets_min": 549 }, { "epoch": 6.764705882352941, "grad_norm": 0.6114492732117995, "learning_rate": 1.38659593681576e-07, "loss": 0.083, "loss_nan_ranks": 0, "loss_rank_avg": 0.07287880033254623, "step": 6900, "valid_targets_mean": 2059.4, "valid_targets_min": 774 }, { "epoch": 6.769607843137255, "grad_norm": 0.6588140419762275, "learning_rate": 1.3297208520397064e-07, "loss": 0.0797, "loss_nan_ranks": 0, "loss_rank_avg": 0.07726430892944336, "step": 6905, "valid_targets_mean": 1786.8, "valid_targets_min": 246 }, { "epoch": 6.7745098039215685, "grad_norm": 0.5657506011735933, "learning_rate": 1.274032877356457e-07, "loss": 0.0778, "loss_nan_ranks": 0, "loss_rank_avg": 0.07481957226991653, "step": 6910, "valid_targets_mean": 2344.2, "valid_targets_min": 655 }, { "epoch": 6.779411764705882, "grad_norm": 0.5928810950417512, "learning_rate": 1.219532345517127e-07, "loss": 0.0709, "loss_nan_ranks": 0, "loss_rank_avg": 0.06960079818964005, "step": 6915, "valid_targets_mean": 1776.4, "valid_targets_min": 503 }, { "epoch": 6.784313725490196, "grad_norm": 0.6762501537064162, "learning_rate": 1.1662195821775746e-07, "loss": 0.0776, "loss_nan_ranks": 0, "loss_rank_avg": 0.0917593464255333, "step": 6920, "valid_targets_mean": 1760.2, "valid_targets_min": 839 }, { "epoch": 6.78921568627451, "grad_norm": 0.5864555760924591, "learning_rate": 1.1140949058963125e-07, "loss": 0.0892, "loss_nan_ranks": 0, "loss_rank_avg": 0.08153297007083893, "step": 6925, "valid_targets_mean": 2450.8, "valid_targets_min": 1001 }, { "epoch": 6.794117647058823, "grad_norm": 0.6232735656011807, "learning_rate": 1.0631586281327988e-07, "loss": 0.0891, "loss_nan_ranks": 0, "loss_rank_avg": 0.08557818084955215, "step": 6930, "valid_targets_mean": 1834.9, "valid_targets_min": 766 }, { "epoch": 6.799019607843137, "grad_norm": 0.5980549584459026, "learning_rate": 1.0134110532454167e-07, "loss": 0.0659, "loss_nan_ranks": 0, "loss_rank_avg": 0.06608110666275024, "step": 6935, "valid_targets_mean": 2118.2, "valid_targets_min": 646 }, { "epoch": 6.803921568627451, "grad_norm": 0.5574126476293245, "learning_rate": 9.648524784897418e-08, "loss": 0.0839, "loss_nan_ranks": 0, "loss_rank_avg": 0.07937115430831909, "step": 6940, "valid_targets_mean": 2194.7, "valid_targets_min": 746 }, { "epoch": 6.8088235294117645, "grad_norm": 0.5488303476404753, "learning_rate": 9.17483194016744e-08, "loss": 0.0794, "loss_nan_ranks": 0, "loss_rank_avg": 0.09899978339672089, "step": 6945, "valid_targets_mean": 2651.8, "valid_targets_min": 732 }, { "epoch": 6.813725490196078, "grad_norm": 0.5878960633853861, "learning_rate": 8.713034828710554e-08, "loss": 0.0807, "loss_nan_ranks": 0, "loss_rank_avg": 0.07570293545722961, "step": 6950, "valid_targets_mean": 2299.9, "valid_targets_min": 774 }, { "epoch": 6.818627450980392, "grad_norm": 0.5334957139961155, "learning_rate": 8.26313620989283e-08, "loss": 0.082, "loss_nan_ranks": 0, "loss_rank_avg": 0.07348759472370148, "step": 6955, "valid_targets_mean": 2329.1, "valid_targets_min": 858 }, { "epoch": 6.823529411764706, "grad_norm": 0.5061147065315302, "learning_rate": 7.825138771983432e-08, "loss": 0.069, "loss_nan_ranks": 0, "loss_rank_avg": 0.05788544565439224, "step": 6960, "valid_targets_mean": 2415.1, "valid_targets_min": 714 }, { "epoch": 6.828431372549019, "grad_norm": 0.5150049175490301, "learning_rate": 7.399045132138627e-08, "loss": 0.0792, "loss_nan_ranks": 0, "loss_rank_avg": 0.06460592150688171, "step": 6965, "valid_targets_mean": 2752.2, "valid_targets_min": 713 }, { "epoch": 6.833333333333333, "grad_norm": 0.4705212783129525, "learning_rate": 6.98485783638625e-08, "loss": 0.0744, "loss_nan_ranks": 0, "loss_rank_avg": 0.0671989843249321, "step": 6970, "valid_targets_mean": 2491.8, "valid_targets_min": 743 }, { "epoch": 6.838235294117647, "grad_norm": 0.5857825766534208, "learning_rate": 6.582579359610597e-08, "loss": 0.0754, "loss_nan_ranks": 0, "loss_rank_avg": 0.07692444324493408, "step": 6975, "valid_targets_mean": 2063.6, "valid_targets_min": 567 }, { "epoch": 6.8431372549019605, "grad_norm": 0.5021496002955151, "learning_rate": 6.192212105537109e-08, "loss": 0.078, "loss_nan_ranks": 0, "loss_rank_avg": 0.08223918080329895, "step": 6980, "valid_targets_mean": 2688.7, "valid_targets_min": 686 }, { "epoch": 6.848039215686274, "grad_norm": 0.4348685643630877, "learning_rate": 5.813758406718606e-08, "loss": 0.0689, "loss_nan_ranks": 0, "loss_rank_avg": 0.05415298044681549, "step": 6985, "valid_targets_mean": 2850.8, "valid_targets_min": 597 }, { "epoch": 6.852941176470588, "grad_norm": 0.5560387400479142, "learning_rate": 5.4472205245208463e-08, "loss": 0.0813, "loss_nan_ranks": 0, "loss_rank_avg": 0.06583650410175323, "step": 6990, "valid_targets_mean": 2302.1, "valid_targets_min": 758 }, { "epoch": 6.857843137254902, "grad_norm": 0.565742943832882, "learning_rate": 5.092600649109658e-08, "loss": 0.0784, "loss_nan_ranks": 0, "loss_rank_avg": 0.06734960526227951, "step": 6995, "valid_targets_mean": 2259.1, "valid_targets_min": 763 }, { "epoch": 6.862745098039216, "grad_norm": 0.5171417741345915, "learning_rate": 4.7499008994373875e-08, "loss": 0.0727, "loss_nan_ranks": 0, "loss_rank_avg": 0.06790250539779663, "step": 7000, "valid_targets_mean": 2513.7, "valid_targets_min": 953 }, { "epoch": 6.867647058823529, "grad_norm": 0.503597251844863, "learning_rate": 4.4191233232300235e-08, "loss": 0.0685, "loss_nan_ranks": 0, "loss_rank_avg": 0.06478115916252136, "step": 7005, "valid_targets_mean": 2516.2, "valid_targets_min": 530 }, { "epoch": 6.872549019607844, "grad_norm": 0.6054050789758687, "learning_rate": 4.10026989697565e-08, "loss": 0.0707, "loss_nan_ranks": 0, "loss_rank_avg": 0.06746941804885864, "step": 7010, "valid_targets_mean": 2090.3, "valid_targets_min": 1144 }, { "epoch": 6.877450980392156, "grad_norm": 0.5606095020900572, "learning_rate": 3.793342525911792e-08, "loss": 0.0857, "loss_nan_ranks": 0, "loss_rank_avg": 0.0673239454627037, "step": 7015, "valid_targets_mean": 2314.0, "valid_targets_min": 869 }, { "epoch": 6.882352941176471, "grad_norm": 0.6021982902697057, "learning_rate": 3.4983430440149733e-08, "loss": 0.0831, "loss_nan_ranks": 0, "loss_rank_avg": 0.10573314130306244, "step": 7020, "valid_targets_mean": 2055.6, "valid_targets_min": 681 }, { "epoch": 6.887254901960784, "grad_norm": 0.5568757053589237, "learning_rate": 3.215273213988734e-08, "loss": 0.0764, "loss_nan_ranks": 0, "loss_rank_avg": 0.07062698900699615, "step": 7025, "valid_targets_mean": 2395.8, "valid_targets_min": 724 }, { "epoch": 6.892156862745098, "grad_norm": 0.7240829790900177, "learning_rate": 2.9441347272543e-08, "loss": 0.0719, "loss_nan_ranks": 0, "loss_rank_avg": 0.0858493223786354, "step": 7030, "valid_targets_mean": 1650.8, "valid_targets_min": 748 }, { "epoch": 6.897058823529412, "grad_norm": 0.6349762124135037, "learning_rate": 2.6849292039390352e-08, "loss": 0.0685, "loss_nan_ranks": 0, "loss_rank_avg": 0.0749552771449089, "step": 7035, "valid_targets_mean": 1839.1, "valid_targets_min": 544 }, { "epoch": 6.901960784313726, "grad_norm": 0.5676422569750085, "learning_rate": 2.4376581928682307e-08, "loss": 0.0931, "loss_nan_ranks": 0, "loss_rank_avg": 0.06373101472854614, "step": 7040, "valid_targets_mean": 2116.4, "valid_targets_min": 678 }, { "epoch": 6.9068627450980395, "grad_norm": 0.5744939628095065, "learning_rate": 2.2023231715546655e-08, "loss": 0.0721, "loss_nan_ranks": 0, "loss_rank_avg": 0.06783310323953629, "step": 7045, "valid_targets_mean": 2597.4, "valid_targets_min": 813 }, { "epoch": 6.911764705882353, "grad_norm": 0.6284874290227057, "learning_rate": 1.9789255461906132e-08, "loss": 0.0809, "loss_nan_ranks": 0, "loss_rank_avg": 0.08478754758834839, "step": 7050, "valid_targets_mean": 2029.5, "valid_targets_min": 531 }, { "epoch": 6.916666666666667, "grad_norm": 0.5411737246105554, "learning_rate": 1.7674666516387383e-08, "loss": 0.0718, "loss_nan_ranks": 0, "loss_rank_avg": 0.06868691742420197, "step": 7055, "valid_targets_mean": 2305.8, "valid_targets_min": 673 }, { "epoch": 6.921568627450981, "grad_norm": 0.49737197499649116, "learning_rate": 1.56794775142477e-08, "loss": 0.0735, "loss_nan_ranks": 0, "loss_rank_avg": 0.06329074501991272, "step": 7060, "valid_targets_mean": 2280.2, "valid_targets_min": 589 }, { "epoch": 6.926470588235294, "grad_norm": 0.6751026916886007, "learning_rate": 1.380370037729728e-08, "loss": 0.0717, "loss_nan_ranks": 0, "loss_rank_avg": 0.08442050218582153, "step": 7065, "valid_targets_mean": 2083.4, "valid_targets_min": 659 }, { "epoch": 6.931372549019608, "grad_norm": 0.5030081784740777, "learning_rate": 1.204734631382154e-08, "loss": 0.0862, "loss_nan_ranks": 0, "loss_rank_avg": 0.06494186818599701, "step": 7070, "valid_targets_mean": 2563.1, "valid_targets_min": 869 }, { "epoch": 6.936274509803922, "grad_norm": 0.5113385667698365, "learning_rate": 1.0410425818525582e-08, "loss": 0.0749, "loss_nan_ranks": 0, "loss_rank_avg": 0.07213737070560455, "step": 7075, "valid_targets_mean": 2695.8, "valid_targets_min": 800 }, { "epoch": 6.9411764705882355, "grad_norm": 0.6583346196023455, "learning_rate": 8.892948672465373e-09, "loss": 0.078, "loss_nan_ranks": 0, "loss_rank_avg": 0.07703264057636261, "step": 7080, "valid_targets_mean": 2112.5, "valid_targets_min": 728 }, { "epoch": 6.946078431372549, "grad_norm": 0.4106397687578483, "learning_rate": 7.494923942985566e-09, "loss": 0.0689, "loss_nan_ranks": 0, "loss_rank_avg": 0.05719529092311859, "step": 7085, "valid_targets_mean": 3062.9, "valid_targets_min": 634 }, { "epoch": 6.950980392156863, "grad_norm": 0.5361202378127926, "learning_rate": 6.216359983675091e-09, "loss": 0.0725, "loss_nan_ranks": 0, "loss_rank_avg": 0.0644589364528656, "step": 7090, "valid_targets_mean": 2359.8, "valid_targets_min": 682 }, { "epoch": 6.955882352941177, "grad_norm": 0.5868554124771347, "learning_rate": 5.057264434307208e-09, "loss": 0.0747, "loss_nan_ranks": 0, "loss_rank_avg": 0.06894619762897491, "step": 7095, "valid_targets_mean": 2037.6, "valid_targets_min": 835 }, { "epoch": 6.96078431372549, "grad_norm": 0.5026454645152694, "learning_rate": 4.017644220797312e-09, "loss": 0.0685, "loss_nan_ranks": 0, "loss_rank_avg": 0.06370195746421814, "step": 7100, "valid_targets_mean": 2236.1, "valid_targets_min": 822 }, { "epoch": 6.965686274509804, "grad_norm": 0.5172626012676429, "learning_rate": 3.097505555169633e-09, "loss": 0.071, "loss_nan_ranks": 0, "loss_rank_avg": 0.07044585049152374, "step": 7105, "valid_targets_mean": 2222.4, "valid_targets_min": 536 }, { "epoch": 6.970588235294118, "grad_norm": 0.48563914103910366, "learning_rate": 2.2968539355061603e-09, "loss": 0.0641, "loss_nan_ranks": 0, "loss_rank_avg": 0.060300637036561966, "step": 7110, "valid_targets_mean": 2759.5, "valid_targets_min": 819 }, { "epoch": 6.9754901960784315, "grad_norm": 0.5009744586716859, "learning_rate": 1.6156941459222197e-09, "loss": 0.0748, "loss_nan_ranks": 0, "loss_rank_avg": 0.08746712654829025, "step": 7115, "valid_targets_mean": 2686.8, "valid_targets_min": 928 }, { "epoch": 6.980392156862745, "grad_norm": 0.6099074515269169, "learning_rate": 1.0540302565376081e-09, "loss": 0.0655, "loss_nan_ranks": 0, "loss_rank_avg": 0.06961031258106232, "step": 7120, "valid_targets_mean": 2117.1, "valid_targets_min": 788 }, { "epoch": 6.985294117647059, "grad_norm": 0.5865242816170935, "learning_rate": 6.118656234499476e-10, "loss": 0.071, "loss_nan_ranks": 0, "loss_rank_avg": 0.07421500980854034, "step": 7125, "valid_targets_mean": 2357.5, "valid_targets_min": 744 }, { "epoch": 6.990196078431373, "grad_norm": 0.5149688957802767, "learning_rate": 2.892028887147014e-10, "loss": 0.0717, "loss_nan_ranks": 0, "loss_rank_avg": 0.06031516194343567, "step": 7130, "valid_targets_mean": 2506.4, "valid_targets_min": 704 }, { "epoch": 6.995098039215686, "grad_norm": 0.6304851349269752, "learning_rate": 8.604398032963091e-11, "loss": 0.0967, "loss_nan_ranks": 0, "loss_rank_avg": 0.08709007501602173, "step": 7135, "valid_targets_mean": 2069.6, "valid_targets_min": 737 }, { "epoch": 7.0, "grad_norm": 0.48718293954798514, "learning_rate": 2.3901122303549018e-12, "loss": 0.0753, "loss_nan_ranks": 0, "loss_rank_avg": 0.059055425226688385, "step": 7140, "valid_targets_mean": 2420.6, "valid_targets_min": 743 }, { "epoch": 7.0, "loss_nan_ranks": 0, "loss_rank_avg": 0.059055425226688385, "step": 7140, "total_flos": 1483460788355072.0, "train_loss": 0.12303723783469668, "train_runtime": 34233.4373, "train_samples_per_second": 3.334, "train_steps_per_second": 0.209, "valid_targets_mean": 2420.6, "valid_targets_min": 743 } ], "logging_steps": 5, "max_steps": 7140, "num_input_tokens_seen": 0, "num_train_epochs": 7, "save_steps": 200, "stateful_callbacks": { "TrainerControl": { "args": { "should_epoch_stop": false, "should_evaluate": false, "should_log": false, "should_save": true, "should_training_stop": true }, "attributes": {} } }, "total_flos": 1483460788355072.0, "train_batch_size": 1, "trial_name": null, "trial_params": null }