| { |
| "best_global_step": null, |
| "best_metric": null, |
| "best_model_checkpoint": null, |
| "epoch": 7.0, |
| "eval_steps": 500, |
| "global_step": 4361, |
| "is_hyper_param_search": false, |
| "is_local_process_zero": true, |
| "is_world_process_zero": true, |
| "log_history": [ |
| { |
| "epoch": 0.008025682182985553, |
| "grad_norm": 14.646306271075366, |
| "learning_rate": 3.661327231121282e-07, |
| "loss": 0.7867, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.8202405571937561, |
| "step": 5, |
| "valid_targets_mean": 1387.8, |
| "valid_targets_min": 651 |
| }, |
| { |
| "epoch": 0.016051364365971106, |
| "grad_norm": 11.968096269141974, |
| "learning_rate": 8.237986270022884e-07, |
| "loss": 0.7576, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.7305525541305542, |
| "step": 10, |
| "valid_targets_mean": 1799.4, |
| "valid_targets_min": 655 |
| }, |
| { |
| "epoch": 0.024077046548956663, |
| "grad_norm": 11.236420564589006, |
| "learning_rate": 1.2814645308924487e-06, |
| "loss": 0.7727, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.7805347442626953, |
| "step": 15, |
| "valid_targets_mean": 1906.4, |
| "valid_targets_min": 912 |
| }, |
| { |
| "epoch": 0.03210272873194221, |
| "grad_norm": 8.949334311195145, |
| "learning_rate": 1.7391304347826088e-06, |
| "loss": 0.752, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.7785749435424805, |
| "step": 20, |
| "valid_targets_mean": 2390.4, |
| "valid_targets_min": 801 |
| }, |
| { |
| "epoch": 0.04012841091492777, |
| "grad_norm": 5.3497727404284365, |
| "learning_rate": 2.196796338672769e-06, |
| "loss": 0.673, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.6312217712402344, |
| "step": 25, |
| "valid_targets_mean": 2391.2, |
| "valid_targets_min": 658 |
| }, |
| { |
| "epoch": 0.048154093097913325, |
| "grad_norm": 4.580136509374292, |
| "learning_rate": 2.654462242562929e-06, |
| "loss": 0.6483, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.6121365427970886, |
| "step": 30, |
| "valid_targets_mean": 2334.8, |
| "valid_targets_min": 677 |
| }, |
| { |
| "epoch": 0.056179775280898875, |
| "grad_norm": 4.161436647961576, |
| "learning_rate": 3.1121281464530894e-06, |
| "loss": 0.5971, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.592909574508667, |
| "step": 35, |
| "valid_targets_mean": 1784.5, |
| "valid_targets_min": 1077 |
| }, |
| { |
| "epoch": 0.06420545746388442, |
| "grad_norm": 3.212931241614404, |
| "learning_rate": 3.56979405034325e-06, |
| "loss": 0.5523, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.5291016697883606, |
| "step": 40, |
| "valid_targets_mean": 1793.4, |
| "valid_targets_min": 650 |
| }, |
| { |
| "epoch": 0.07223113964686999, |
| "grad_norm": 1.89939583890284, |
| "learning_rate": 4.0274599542334094e-06, |
| "loss": 0.5286, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.5067185759544373, |
| "step": 45, |
| "valid_targets_mean": 1862.8, |
| "valid_targets_min": 656 |
| }, |
| { |
| "epoch": 0.08025682182985554, |
| "grad_norm": 1.4106073213091272, |
| "learning_rate": 4.48512585812357e-06, |
| "loss": 0.4867, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.45846793055534363, |
| "step": 50, |
| "valid_targets_mean": 1882.2, |
| "valid_targets_min": 548 |
| }, |
| { |
| "epoch": 0.08828250401284109, |
| "grad_norm": 1.314092536682443, |
| "learning_rate": 4.94279176201373e-06, |
| "loss": 0.5091, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.5191839933395386, |
| "step": 55, |
| "valid_targets_mean": 1953.6, |
| "valid_targets_min": 573 |
| }, |
| { |
| "epoch": 0.09630818619582665, |
| "grad_norm": 1.22631301037501, |
| "learning_rate": 5.400457665903891e-06, |
| "loss": 0.4681, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.4688069522380829, |
| "step": 60, |
| "valid_targets_mean": 1773.1, |
| "valid_targets_min": 596 |
| }, |
| { |
| "epoch": 0.1043338683788122, |
| "grad_norm": 0.9527209313385111, |
| "learning_rate": 5.858123569794051e-06, |
| "loss": 0.4591, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.43702492117881775, |
| "step": 65, |
| "valid_targets_mean": 2561.0, |
| "valid_targets_min": 612 |
| }, |
| { |
| "epoch": 0.11235955056179775, |
| "grad_norm": 1.000235844903914, |
| "learning_rate": 6.31578947368421e-06, |
| "loss": 0.4309, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.4246852397918701, |
| "step": 70, |
| "valid_targets_mean": 1998.6, |
| "valid_targets_min": 570 |
| }, |
| { |
| "epoch": 0.12038523274478331, |
| "grad_norm": 1.0089319236844694, |
| "learning_rate": 6.773455377574372e-06, |
| "loss": 0.4347, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.43148094415664673, |
| "step": 75, |
| "valid_targets_mean": 1942.4, |
| "valid_targets_min": 806 |
| }, |
| { |
| "epoch": 0.12841091492776885, |
| "grad_norm": 0.8232756236327731, |
| "learning_rate": 7.231121281464531e-06, |
| "loss": 0.4306, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.43262892961502075, |
| "step": 80, |
| "valid_targets_mean": 2726.3, |
| "valid_targets_min": 1188 |
| }, |
| { |
| "epoch": 0.13643659711075443, |
| "grad_norm": 0.9596497429181713, |
| "learning_rate": 7.688787185354691e-06, |
| "loss": 0.4277, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.4384536147117615, |
| "step": 85, |
| "valid_targets_mean": 2762.1, |
| "valid_targets_min": 981 |
| }, |
| { |
| "epoch": 0.14446227929373998, |
| "grad_norm": 0.9854480370415547, |
| "learning_rate": 8.146453089244852e-06, |
| "loss": 0.409, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.4489230513572693, |
| "step": 90, |
| "valid_targets_mean": 2211.6, |
| "valid_targets_min": 836 |
| }, |
| { |
| "epoch": 0.15248796147672553, |
| "grad_norm": 0.8568389517883238, |
| "learning_rate": 8.604118993135013e-06, |
| "loss": 0.3943, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.38258206844329834, |
| "step": 95, |
| "valid_targets_mean": 1985.7, |
| "valid_targets_min": 662 |
| }, |
| { |
| "epoch": 0.16051364365971107, |
| "grad_norm": 0.963371139740054, |
| "learning_rate": 9.061784897025172e-06, |
| "loss": 0.3885, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.39598965644836426, |
| "step": 100, |
| "valid_targets_mean": 1740.9, |
| "valid_targets_min": 850 |
| }, |
| { |
| "epoch": 0.16853932584269662, |
| "grad_norm": 0.7956839523047545, |
| "learning_rate": 9.519450800915333e-06, |
| "loss": 0.3943, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3456423878669739, |
| "step": 105, |
| "valid_targets_mean": 2082.3, |
| "valid_targets_min": 765 |
| }, |
| { |
| "epoch": 0.17656500802568217, |
| "grad_norm": 1.0007550081839145, |
| "learning_rate": 9.977116704805492e-06, |
| "loss": 0.3831, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.386109322309494, |
| "step": 110, |
| "valid_targets_mean": 1802.2, |
| "valid_targets_min": 734 |
| }, |
| { |
| "epoch": 0.18459069020866772, |
| "grad_norm": 1.0875676039705295, |
| "learning_rate": 1.0434782608695653e-05, |
| "loss": 0.3762, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.394925057888031, |
| "step": 115, |
| "valid_targets_mean": 1672.4, |
| "valid_targets_min": 753 |
| }, |
| { |
| "epoch": 0.1926163723916533, |
| "grad_norm": 0.7978089011421273, |
| "learning_rate": 1.0892448512585814e-05, |
| "loss": 0.3906, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.37832242250442505, |
| "step": 120, |
| "valid_targets_mean": 2175.1, |
| "valid_targets_min": 785 |
| }, |
| { |
| "epoch": 0.20064205457463885, |
| "grad_norm": 0.8058045609374141, |
| "learning_rate": 1.1350114416475973e-05, |
| "loss": 0.3619, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.38131511211395264, |
| "step": 125, |
| "valid_targets_mean": 2393.2, |
| "valid_targets_min": 780 |
| }, |
| { |
| "epoch": 0.2086677367576244, |
| "grad_norm": 1.0459248253632374, |
| "learning_rate": 1.1807780320366134e-05, |
| "loss": 0.361, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3370898962020874, |
| "step": 130, |
| "valid_targets_mean": 2067.6, |
| "valid_targets_min": 778 |
| }, |
| { |
| "epoch": 0.21669341894060995, |
| "grad_norm": 0.815390844225969, |
| "learning_rate": 1.2265446224256295e-05, |
| "loss": 0.3776, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.41217032074928284, |
| "step": 135, |
| "valid_targets_mean": 2430.4, |
| "valid_targets_min": 533 |
| }, |
| { |
| "epoch": 0.2247191011235955, |
| "grad_norm": 0.7725880706273025, |
| "learning_rate": 1.2723112128146454e-05, |
| "loss": 0.3671, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3731037378311157, |
| "step": 140, |
| "valid_targets_mean": 2520.3, |
| "valid_targets_min": 965 |
| }, |
| { |
| "epoch": 0.23274478330658105, |
| "grad_norm": 0.9555725515372832, |
| "learning_rate": 1.3180778032036615e-05, |
| "loss": 0.3566, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.37982848286628723, |
| "step": 145, |
| "valid_targets_mean": 1930.0, |
| "valid_targets_min": 705 |
| }, |
| { |
| "epoch": 0.24077046548956663, |
| "grad_norm": 0.9884623923983096, |
| "learning_rate": 1.3638443935926776e-05, |
| "loss": 0.3674, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3775394856929779, |
| "step": 150, |
| "valid_targets_mean": 2116.7, |
| "valid_targets_min": 662 |
| }, |
| { |
| "epoch": 0.24879614767255218, |
| "grad_norm": 1.034002208624198, |
| "learning_rate": 1.4096109839816933e-05, |
| "loss": 0.339, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.28776052594184875, |
| "step": 155, |
| "valid_targets_mean": 1503.6, |
| "valid_targets_min": 695 |
| }, |
| { |
| "epoch": 0.2568218298555377, |
| "grad_norm": 0.6896418675498204, |
| "learning_rate": 1.4553775743707096e-05, |
| "loss": 0.3622, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3446170687675476, |
| "step": 160, |
| "valid_targets_mean": 2950.1, |
| "valid_targets_min": 939 |
| }, |
| { |
| "epoch": 0.26484751203852325, |
| "grad_norm": 1.0577856602046278, |
| "learning_rate": 1.5011441647597256e-05, |
| "loss": 0.3664, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.33905932307243347, |
| "step": 165, |
| "valid_targets_mean": 1820.1, |
| "valid_targets_min": 1114 |
| }, |
| { |
| "epoch": 0.27287319422150885, |
| "grad_norm": 0.9974853998819494, |
| "learning_rate": 1.5469107551487414e-05, |
| "loss": 0.346, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3451690077781677, |
| "step": 170, |
| "valid_targets_mean": 1546.1, |
| "valid_targets_min": 563 |
| }, |
| { |
| "epoch": 0.2808988764044944, |
| "grad_norm": 1.0338258108878557, |
| "learning_rate": 1.5926773455377575e-05, |
| "loss": 0.3351, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.31521838903427124, |
| "step": 175, |
| "valid_targets_mean": 1886.1, |
| "valid_targets_min": 1008 |
| }, |
| { |
| "epoch": 0.28892455858747995, |
| "grad_norm": 0.8727309799049142, |
| "learning_rate": 1.6384439359267736e-05, |
| "loss": 0.3715, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.38526463508605957, |
| "step": 180, |
| "valid_targets_mean": 2234.8, |
| "valid_targets_min": 824 |
| }, |
| { |
| "epoch": 0.2969502407704655, |
| "grad_norm": 1.0474632318062393, |
| "learning_rate": 1.6842105263157896e-05, |
| "loss": 0.3609, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.4184132218360901, |
| "step": 185, |
| "valid_targets_mean": 1813.5, |
| "valid_targets_min": 746 |
| }, |
| { |
| "epoch": 0.30497592295345105, |
| "grad_norm": 0.904562584347718, |
| "learning_rate": 1.7299771167048057e-05, |
| "loss": 0.3305, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2930997908115387, |
| "step": 190, |
| "valid_targets_mean": 1764.8, |
| "valid_targets_min": 1292 |
| }, |
| { |
| "epoch": 0.3130016051364366, |
| "grad_norm": 1.0289326023752954, |
| "learning_rate": 1.7757437070938218e-05, |
| "loss": 0.3533, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3898566663265228, |
| "step": 195, |
| "valid_targets_mean": 1837.3, |
| "valid_targets_min": 834 |
| }, |
| { |
| "epoch": 0.32102728731942215, |
| "grad_norm": 0.7975458356550457, |
| "learning_rate": 1.8215102974828376e-05, |
| "loss": 0.3667, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.41650494933128357, |
| "step": 200, |
| "valid_targets_mean": 2710.9, |
| "valid_targets_min": 631 |
| }, |
| { |
| "epoch": 0.3290529695024077, |
| "grad_norm": 0.8771063421172884, |
| "learning_rate": 1.8672768878718537e-05, |
| "loss": 0.362, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.33713459968566895, |
| "step": 205, |
| "valid_targets_mean": 1893.6, |
| "valid_targets_min": 703 |
| }, |
| { |
| "epoch": 0.33707865168539325, |
| "grad_norm": 0.9698501237808315, |
| "learning_rate": 1.9130434782608697e-05, |
| "loss": 0.327, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.32817181944847107, |
| "step": 210, |
| "valid_targets_mean": 1683.0, |
| "valid_targets_min": 923 |
| }, |
| { |
| "epoch": 0.3451043338683788, |
| "grad_norm": 0.9474489541649586, |
| "learning_rate": 1.9588100686498858e-05, |
| "loss": 0.3341, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2981823682785034, |
| "step": 215, |
| "valid_targets_mean": 1833.7, |
| "valid_targets_min": 688 |
| }, |
| { |
| "epoch": 0.35313001605136435, |
| "grad_norm": 1.181216739010819, |
| "learning_rate": 2.004576659038902e-05, |
| "loss": 0.3472, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3394661247730255, |
| "step": 220, |
| "valid_targets_mean": 1705.2, |
| "valid_targets_min": 762 |
| }, |
| { |
| "epoch": 0.3611556982343499, |
| "grad_norm": 0.8600956132450231, |
| "learning_rate": 2.050343249427918e-05, |
| "loss": 0.3324, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.36123359203338623, |
| "step": 225, |
| "valid_targets_mean": 2096.8, |
| "valid_targets_min": 611 |
| }, |
| { |
| "epoch": 0.36918138041733545, |
| "grad_norm": 0.882945376901777, |
| "learning_rate": 2.0961098398169337e-05, |
| "loss": 0.3306, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.36194247007369995, |
| "step": 230, |
| "valid_targets_mean": 1882.9, |
| "valid_targets_min": 740 |
| }, |
| { |
| "epoch": 0.37720706260032105, |
| "grad_norm": 0.8725076626948183, |
| "learning_rate": 2.14187643020595e-05, |
| "loss": 0.3493, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.38940614461898804, |
| "step": 235, |
| "valid_targets_mean": 2167.7, |
| "valid_targets_min": 827 |
| }, |
| { |
| "epoch": 0.3852327447833066, |
| "grad_norm": 0.7630509783880415, |
| "learning_rate": 2.187643020594966e-05, |
| "loss": 0.3471, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.35910847783088684, |
| "step": 240, |
| "valid_targets_mean": 2668.9, |
| "valid_targets_min": 728 |
| }, |
| { |
| "epoch": 0.39325842696629215, |
| "grad_norm": 0.8495303482377304, |
| "learning_rate": 2.2334096109839817e-05, |
| "loss": 0.328, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2962149977684021, |
| "step": 245, |
| "valid_targets_mean": 1937.8, |
| "valid_targets_min": 692 |
| }, |
| { |
| "epoch": 0.4012841091492777, |
| "grad_norm": 0.7814400087970893, |
| "learning_rate": 2.279176201372998e-05, |
| "loss": 0.3436, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3515506386756897, |
| "step": 250, |
| "valid_targets_mean": 3026.1, |
| "valid_targets_min": 1030 |
| }, |
| { |
| "epoch": 0.40930979133226325, |
| "grad_norm": 0.8463651123622614, |
| "learning_rate": 2.3249427917620138e-05, |
| "loss": 0.3345, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3280409574508667, |
| "step": 255, |
| "valid_targets_mean": 2258.4, |
| "valid_targets_min": 1139 |
| }, |
| { |
| "epoch": 0.4173354735152488, |
| "grad_norm": 0.9681815239196544, |
| "learning_rate": 2.37070938215103e-05, |
| "loss": 0.3405, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.34646350145339966, |
| "step": 260, |
| "valid_targets_mean": 1639.3, |
| "valid_targets_min": 714 |
| }, |
| { |
| "epoch": 0.42536115569823435, |
| "grad_norm": 0.8245899420634851, |
| "learning_rate": 2.4164759725400463e-05, |
| "loss": 0.3234, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.29822391271591187, |
| "step": 265, |
| "valid_targets_mean": 2175.2, |
| "valid_targets_min": 807 |
| }, |
| { |
| "epoch": 0.4333868378812199, |
| "grad_norm": 0.8089617843516632, |
| "learning_rate": 2.462242562929062e-05, |
| "loss": 0.3253, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.33770427107810974, |
| "step": 270, |
| "valid_targets_mean": 2268.4, |
| "valid_targets_min": 694 |
| }, |
| { |
| "epoch": 0.44141252006420545, |
| "grad_norm": 0.9716784399381654, |
| "learning_rate": 2.508009153318078e-05, |
| "loss": 0.3199, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.31351184844970703, |
| "step": 275, |
| "valid_targets_mean": 1710.8, |
| "valid_targets_min": 721 |
| }, |
| { |
| "epoch": 0.449438202247191, |
| "grad_norm": 0.9572310179043315, |
| "learning_rate": 2.5537757437070943e-05, |
| "loss": 0.3171, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.28802695870399475, |
| "step": 280, |
| "valid_targets_mean": 1709.4, |
| "valid_targets_min": 754 |
| }, |
| { |
| "epoch": 0.45746388443017655, |
| "grad_norm": 0.9544189503916952, |
| "learning_rate": 2.59954233409611e-05, |
| "loss": 0.317, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3242787718772888, |
| "step": 285, |
| "valid_targets_mean": 1835.8, |
| "valid_targets_min": 567 |
| }, |
| { |
| "epoch": 0.4654895666131621, |
| "grad_norm": 1.0011493165732186, |
| "learning_rate": 2.645308924485126e-05, |
| "loss": 0.336, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.30623307824134827, |
| "step": 290, |
| "valid_targets_mean": 1786.2, |
| "valid_targets_min": 790 |
| }, |
| { |
| "epoch": 0.47351524879614765, |
| "grad_norm": 0.8661555211405326, |
| "learning_rate": 2.6910755148741422e-05, |
| "loss": 0.3137, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.30924296379089355, |
| "step": 295, |
| "valid_targets_mean": 2096.7, |
| "valid_targets_min": 244 |
| }, |
| { |
| "epoch": 0.48154093097913325, |
| "grad_norm": 1.0988416641746142, |
| "learning_rate": 2.7368421052631583e-05, |
| "loss": 0.3165, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.30219322443008423, |
| "step": 300, |
| "valid_targets_mean": 2274.4, |
| "valid_targets_min": 801 |
| }, |
| { |
| "epoch": 0.4895666131621188, |
| "grad_norm": 1.0111186395980374, |
| "learning_rate": 2.782608695652174e-05, |
| "loss": 0.3342, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.34024935960769653, |
| "step": 305, |
| "valid_targets_mean": 1785.6, |
| "valid_targets_min": 859 |
| }, |
| { |
| "epoch": 0.49759229534510435, |
| "grad_norm": 1.1586792124415861, |
| "learning_rate": 2.8283752860411904e-05, |
| "loss": 0.3107, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.31047970056533813, |
| "step": 310, |
| "valid_targets_mean": 1722.4, |
| "valid_targets_min": 746 |
| }, |
| { |
| "epoch": 0.5056179775280899, |
| "grad_norm": 0.832944021979809, |
| "learning_rate": 2.8741418764302062e-05, |
| "loss": 0.307, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3337301015853882, |
| "step": 315, |
| "valid_targets_mean": 2222.3, |
| "valid_targets_min": 851 |
| }, |
| { |
| "epoch": 0.5136436597110754, |
| "grad_norm": 0.8609636836160994, |
| "learning_rate": 2.9199084668192223e-05, |
| "loss": 0.2979, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.29694342613220215, |
| "step": 320, |
| "valid_targets_mean": 1934.9, |
| "valid_targets_min": 640 |
| }, |
| { |
| "epoch": 0.521669341894061, |
| "grad_norm": 0.8598522131098509, |
| "learning_rate": 2.9656750572082384e-05, |
| "loss": 0.3052, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3284974694252014, |
| "step": 325, |
| "valid_targets_mean": 2044.1, |
| "valid_targets_min": 869 |
| }, |
| { |
| "epoch": 0.5296950240770465, |
| "grad_norm": 0.952951010741885, |
| "learning_rate": 3.0114416475972544e-05, |
| "loss": 0.3276, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.28754106163978577, |
| "step": 330, |
| "valid_targets_mean": 1731.6, |
| "valid_targets_min": 679 |
| }, |
| { |
| "epoch": 0.5377207062600321, |
| "grad_norm": 0.9490678253695298, |
| "learning_rate": 3.05720823798627e-05, |
| "loss": 0.2909, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3454781174659729, |
| "step": 335, |
| "valid_targets_mean": 1781.4, |
| "valid_targets_min": 744 |
| }, |
| { |
| "epoch": 0.5457463884430177, |
| "grad_norm": 1.18873344442354, |
| "learning_rate": 3.102974828375286e-05, |
| "loss": 0.2988, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.29542940855026245, |
| "step": 340, |
| "valid_targets_mean": 1536.3, |
| "valid_targets_min": 621 |
| }, |
| { |
| "epoch": 0.5537720706260032, |
| "grad_norm": 1.1976009299731565, |
| "learning_rate": 3.1487414187643024e-05, |
| "loss": 0.3173, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2791876792907715, |
| "step": 345, |
| "valid_targets_mean": 1599.9, |
| "valid_targets_min": 698 |
| }, |
| { |
| "epoch": 0.5617977528089888, |
| "grad_norm": 0.9101478694060584, |
| "learning_rate": 3.1945080091533184e-05, |
| "loss": 0.2994, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2871367335319519, |
| "step": 350, |
| "valid_targets_mean": 1797.5, |
| "valid_targets_min": 646 |
| }, |
| { |
| "epoch": 0.5698234349919743, |
| "grad_norm": 0.9896692838718341, |
| "learning_rate": 3.240274599542334e-05, |
| "loss": 0.3153, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2911245822906494, |
| "step": 355, |
| "valid_targets_mean": 1839.2, |
| "valid_targets_min": 661 |
| }, |
| { |
| "epoch": 0.5778491171749599, |
| "grad_norm": 0.9509341469647331, |
| "learning_rate": 3.2860411899313506e-05, |
| "loss": 0.3164, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.29795265197753906, |
| "step": 360, |
| "valid_targets_mean": 1844.8, |
| "valid_targets_min": 810 |
| }, |
| { |
| "epoch": 0.5858747993579454, |
| "grad_norm": 0.8552209611893014, |
| "learning_rate": 3.331807780320366e-05, |
| "loss": 0.3174, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.35684460401535034, |
| "step": 365, |
| "valid_targets_mean": 2129.5, |
| "valid_targets_min": 711 |
| }, |
| { |
| "epoch": 0.593900481540931, |
| "grad_norm": 0.8555759703411486, |
| "learning_rate": 3.377574370709382e-05, |
| "loss": 0.3255, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.28512653708457947, |
| "step": 370, |
| "valid_targets_mean": 1772.9, |
| "valid_targets_min": 770 |
| }, |
| { |
| "epoch": 0.6019261637239165, |
| "grad_norm": 0.9269879757302991, |
| "learning_rate": 3.423340961098399e-05, |
| "loss": 0.3077, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.25699400901794434, |
| "step": 375, |
| "valid_targets_mean": 1689.4, |
| "valid_targets_min": 645 |
| }, |
| { |
| "epoch": 0.6099518459069021, |
| "grad_norm": 1.0001088715401525, |
| "learning_rate": 3.469107551487414e-05, |
| "loss": 0.315, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.34773507714271545, |
| "step": 380, |
| "valid_targets_mean": 1948.1, |
| "valid_targets_min": 712 |
| }, |
| { |
| "epoch": 0.6179775280898876, |
| "grad_norm": 1.170913919890504, |
| "learning_rate": 3.5148741418764304e-05, |
| "loss": 0.2916, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.27243420481681824, |
| "step": 385, |
| "valid_targets_mean": 1619.1, |
| "valid_targets_min": 874 |
| }, |
| { |
| "epoch": 0.6260032102728732, |
| "grad_norm": 0.8232018782624154, |
| "learning_rate": 3.5606407322654464e-05, |
| "loss": 0.3072, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.32129108905792236, |
| "step": 390, |
| "valid_targets_mean": 2377.1, |
| "valid_targets_min": 764 |
| }, |
| { |
| "epoch": 0.6340288924558587, |
| "grad_norm": 0.8185543627668448, |
| "learning_rate": 3.6064073226544625e-05, |
| "loss": 0.3273, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3443065881729126, |
| "step": 395, |
| "valid_targets_mean": 2255.8, |
| "valid_targets_min": 856 |
| }, |
| { |
| "epoch": 0.6420545746388443, |
| "grad_norm": 0.9722842463690324, |
| "learning_rate": 3.6521739130434786e-05, |
| "loss": 0.2939, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.30047857761383057, |
| "step": 400, |
| "valid_targets_mean": 1743.6, |
| "valid_targets_min": 822 |
| }, |
| { |
| "epoch": 0.6500802568218299, |
| "grad_norm": 0.7967856246753074, |
| "learning_rate": 3.697940503432495e-05, |
| "loss": 0.3206, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2986922860145569, |
| "step": 405, |
| "valid_targets_mean": 2248.8, |
| "valid_targets_min": 776 |
| }, |
| { |
| "epoch": 0.6581059390048154, |
| "grad_norm": 0.8316226837505692, |
| "learning_rate": 3.743707093821511e-05, |
| "loss": 0.3035, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.28393733501434326, |
| "step": 410, |
| "valid_targets_mean": 1886.7, |
| "valid_targets_min": 668 |
| }, |
| { |
| "epoch": 0.666131621187801, |
| "grad_norm": 1.1649505956487092, |
| "learning_rate": 3.789473684210526e-05, |
| "loss": 0.3091, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3361932039260864, |
| "step": 415, |
| "valid_targets_mean": 2057.5, |
| "valid_targets_min": 649 |
| }, |
| { |
| "epoch": 0.6741573033707865, |
| "grad_norm": 0.8674562998891178, |
| "learning_rate": 3.835240274599543e-05, |
| "loss": 0.2817, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.286508172750473, |
| "step": 420, |
| "valid_targets_mean": 1988.1, |
| "valid_targets_min": 790 |
| }, |
| { |
| "epoch": 0.6821829855537721, |
| "grad_norm": 0.9171965836082356, |
| "learning_rate": 3.8810068649885584e-05, |
| "loss": 0.3252, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3114051818847656, |
| "step": 425, |
| "valid_targets_mean": 1783.7, |
| "valid_targets_min": 940 |
| }, |
| { |
| "epoch": 0.6902086677367576, |
| "grad_norm": 0.8725500087205194, |
| "learning_rate": 3.9267734553775745e-05, |
| "loss": 0.2903, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2869841754436493, |
| "step": 430, |
| "valid_targets_mean": 1863.4, |
| "valid_targets_min": 768 |
| }, |
| { |
| "epoch": 0.6982343499197432, |
| "grad_norm": 0.9441119652995636, |
| "learning_rate": 3.9725400457665905e-05, |
| "loss": 0.3042, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2990264892578125, |
| "step": 435, |
| "valid_targets_mean": 1948.9, |
| "valid_targets_min": 1061 |
| }, |
| { |
| "epoch": 0.7062600321027287, |
| "grad_norm": 0.9405263676842486, |
| "learning_rate": 3.99999743609667e-05, |
| "loss": 0.3121, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.32914310693740845, |
| "step": 440, |
| "valid_targets_mean": 2115.7, |
| "valid_targets_min": 572 |
| }, |
| { |
| "epoch": 0.7142857142857143, |
| "grad_norm": 0.8453482397076572, |
| "learning_rate": 3.999968592259695e-05, |
| "loss": 0.3008, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.30714958906173706, |
| "step": 445, |
| "valid_targets_mean": 2305.3, |
| "valid_targets_min": 1354 |
| }, |
| { |
| "epoch": 0.7223113964686998, |
| "grad_norm": 0.7738975856001973, |
| "learning_rate": 3.9999077001703266e-05, |
| "loss": 0.3068, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.32613644003868103, |
| "step": 450, |
| "valid_targets_mean": 2465.8, |
| "valid_targets_min": 881 |
| }, |
| { |
| "epoch": 0.7303370786516854, |
| "grad_norm": 0.8149570285290635, |
| "learning_rate": 3.999814760804324e-05, |
| "loss": 0.3068, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.30127108097076416, |
| "step": 455, |
| "valid_targets_mean": 1977.8, |
| "valid_targets_min": 747 |
| }, |
| { |
| "epoch": 0.7383627608346709, |
| "grad_norm": 0.9294086272204561, |
| "learning_rate": 3.9996897756509806e-05, |
| "loss": 0.3028, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.27201634645462036, |
| "step": 460, |
| "valid_targets_mean": 1491.2, |
| "valid_targets_min": 647 |
| }, |
| { |
| "epoch": 0.7463884430176565, |
| "grad_norm": 0.8344262631630353, |
| "learning_rate": 3.9995327467131074e-05, |
| "loss": 0.3243, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.33017224073410034, |
| "step": 465, |
| "valid_targets_mean": 1846.1, |
| "valid_targets_min": 790 |
| }, |
| { |
| "epoch": 0.7544141252006421, |
| "grad_norm": 0.7829996456838156, |
| "learning_rate": 3.9993436765069954e-05, |
| "loss": 0.316, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3319680094718933, |
| "step": 470, |
| "valid_targets_mean": 2419.9, |
| "valid_targets_min": 534 |
| }, |
| { |
| "epoch": 0.7624398073836276, |
| "grad_norm": 0.8771047139224807, |
| "learning_rate": 3.999122568062376e-05, |
| "loss": 0.3174, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3266174793243408, |
| "step": 475, |
| "valid_targets_mean": 2624.4, |
| "valid_targets_min": 919 |
| }, |
| { |
| "epoch": 0.7704654895666132, |
| "grad_norm": 0.8858493072216881, |
| "learning_rate": 3.9988694249223747e-05, |
| "loss": 0.305, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.275663822889328, |
| "step": 480, |
| "valid_targets_mean": 1647.2, |
| "valid_targets_min": 684 |
| }, |
| { |
| "epoch": 0.7784911717495987, |
| "grad_norm": 0.7689051739854088, |
| "learning_rate": 3.9985842511434544e-05, |
| "loss": 0.2923, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2797590494155884, |
| "step": 485, |
| "valid_targets_mean": 2174.2, |
| "valid_targets_min": 982 |
| }, |
| { |
| "epoch": 0.7865168539325843, |
| "grad_norm": 0.8020487982931901, |
| "learning_rate": 3.9982670512953446e-05, |
| "loss": 0.3016, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.34576845169067383, |
| "step": 490, |
| "valid_targets_mean": 2432.9, |
| "valid_targets_min": 884 |
| }, |
| { |
| "epoch": 0.7945425361155698, |
| "grad_norm": 0.9730877600468747, |
| "learning_rate": 3.9979178304609777e-05, |
| "loss": 0.2908, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.27685031294822693, |
| "step": 495, |
| "valid_targets_mean": 1754.3, |
| "valid_targets_min": 549 |
| }, |
| { |
| "epoch": 0.8025682182985554, |
| "grad_norm": 0.8427811924307392, |
| "learning_rate": 3.9975365942364e-05, |
| "loss": 0.2916, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.26822972297668457, |
| "step": 500, |
| "valid_targets_mean": 1744.6, |
| "valid_targets_min": 698 |
| }, |
| { |
| "epoch": 0.8105939004815409, |
| "grad_norm": 0.8345994269057178, |
| "learning_rate": 3.997123348730685e-05, |
| "loss": 0.2982, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2742110788822174, |
| "step": 505, |
| "valid_targets_mean": 2118.4, |
| "valid_targets_min": 845 |
| }, |
| { |
| "epoch": 0.8186195826645265, |
| "grad_norm": 0.7394141508614848, |
| "learning_rate": 3.9966781005658336e-05, |
| "loss": 0.3182, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.29566675424575806, |
| "step": 510, |
| "valid_targets_mean": 2393.6, |
| "valid_targets_min": 770 |
| }, |
| { |
| "epoch": 0.826645264847512, |
| "grad_norm": 0.7868169024326342, |
| "learning_rate": 3.996200856876671e-05, |
| "loss": 0.3184, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.31672143936157227, |
| "step": 515, |
| "valid_targets_mean": 2246.7, |
| "valid_targets_min": 659 |
| }, |
| { |
| "epoch": 0.8346709470304976, |
| "grad_norm": 0.8208599603839487, |
| "learning_rate": 3.9956916253107316e-05, |
| "loss": 0.2801, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.23943054676055908, |
| "step": 520, |
| "valid_targets_mean": 1570.6, |
| "valid_targets_min": 836 |
| }, |
| { |
| "epoch": 0.8426966292134831, |
| "grad_norm": 0.8304116707206449, |
| "learning_rate": 3.995150414028134e-05, |
| "loss": 0.2939, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.30285578966140747, |
| "step": 525, |
| "valid_targets_mean": 1989.4, |
| "valid_targets_min": 781 |
| }, |
| { |
| "epoch": 0.8507223113964687, |
| "grad_norm": 1.0277770584511348, |
| "learning_rate": 3.994577231701451e-05, |
| "loss": 0.2891, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.32783007621765137, |
| "step": 530, |
| "valid_targets_mean": 2061.1, |
| "valid_targets_min": 799 |
| }, |
| { |
| "epoch": 0.8587479935794543, |
| "grad_norm": 0.952928563450375, |
| "learning_rate": 3.993972087515574e-05, |
| "loss": 0.3037, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.34268754720687866, |
| "step": 535, |
| "valid_targets_mean": 1843.8, |
| "valid_targets_min": 777 |
| }, |
| { |
| "epoch": 0.8667736757624398, |
| "grad_norm": 0.9308129927095735, |
| "learning_rate": 3.9933349911675615e-05, |
| "loss": 0.3211, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2926996052265167, |
| "step": 540, |
| "valid_targets_mean": 1644.0, |
| "valid_targets_min": 882 |
| }, |
| { |
| "epoch": 0.8747993579454254, |
| "grad_norm": 0.7426138307689881, |
| "learning_rate": 3.9926659528664866e-05, |
| "loss": 0.2915, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2840152978897095, |
| "step": 545, |
| "valid_targets_mean": 2081.6, |
| "valid_targets_min": 668 |
| }, |
| { |
| "epoch": 0.8828250401284109, |
| "grad_norm": 0.7590896177179798, |
| "learning_rate": 3.9919649833332715e-05, |
| "loss": 0.2874, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.30055904388427734, |
| "step": 550, |
| "valid_targets_mean": 2541.2, |
| "valid_targets_min": 982 |
| }, |
| { |
| "epoch": 0.8908507223113965, |
| "grad_norm": 0.9273338134445059, |
| "learning_rate": 3.991232093800517e-05, |
| "loss": 0.2785, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.22772808372974396, |
| "step": 555, |
| "valid_targets_mean": 1515.6, |
| "valid_targets_min": 727 |
| }, |
| { |
| "epoch": 0.898876404494382, |
| "grad_norm": 0.7731132242138054, |
| "learning_rate": 3.990467296012322e-05, |
| "loss": 0.3127, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.31191396713256836, |
| "step": 560, |
| "valid_targets_mean": 2190.2, |
| "valid_targets_min": 757 |
| }, |
| { |
| "epoch": 0.9069020866773676, |
| "grad_norm": 0.8650619758973038, |
| "learning_rate": 3.989670602224094e-05, |
| "loss": 0.2988, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.32659170031547546, |
| "step": 565, |
| "valid_targets_mean": 1817.8, |
| "valid_targets_min": 869 |
| }, |
| { |
| "epoch": 0.9149277688603531, |
| "grad_norm": 0.8114237738910773, |
| "learning_rate": 3.988842025202358e-05, |
| "loss": 0.2936, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2951407730579376, |
| "step": 570, |
| "valid_targets_mean": 2183.2, |
| "valid_targets_min": 1130 |
| }, |
| { |
| "epoch": 0.9229534510433387, |
| "grad_norm": 0.7315127957593782, |
| "learning_rate": 3.987981578224542e-05, |
| "loss": 0.3023, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3168894648551941, |
| "step": 575, |
| "valid_targets_mean": 2335.3, |
| "valid_targets_min": 963 |
| }, |
| { |
| "epoch": 0.9309791332263242, |
| "grad_norm": 0.8198512266606438, |
| "learning_rate": 3.987089275078776e-05, |
| "loss": 0.2992, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3281818628311157, |
| "step": 580, |
| "valid_targets_mean": 1949.1, |
| "valid_targets_min": 926 |
| }, |
| { |
| "epoch": 0.9390048154093098, |
| "grad_norm": 0.9458954789473605, |
| "learning_rate": 3.986165130063662e-05, |
| "loss": 0.2847, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.26376253366470337, |
| "step": 585, |
| "valid_targets_mean": 1493.2, |
| "valid_targets_min": 869 |
| }, |
| { |
| "epoch": 0.9470304975922953, |
| "grad_norm": 0.881632921637052, |
| "learning_rate": 3.985209157988048e-05, |
| "loss": 0.3026, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.31336453557014465, |
| "step": 590, |
| "valid_targets_mean": 1887.2, |
| "valid_targets_min": 803 |
| }, |
| { |
| "epoch": 0.9550561797752809, |
| "grad_norm": 0.8617456541273046, |
| "learning_rate": 3.984221374170793e-05, |
| "loss": 0.2898, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2735736072063446, |
| "step": 595, |
| "valid_targets_mean": 1538.6, |
| "valid_targets_min": 638 |
| }, |
| { |
| "epoch": 0.9630818619582665, |
| "grad_norm": 0.8672485396619697, |
| "learning_rate": 3.983201794440517e-05, |
| "loss": 0.2968, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.30543556809425354, |
| "step": 600, |
| "valid_targets_mean": 2531.9, |
| "valid_targets_min": 699 |
| }, |
| { |
| "epoch": 0.971107544141252, |
| "grad_norm": 0.7590885144559714, |
| "learning_rate": 3.982150435135353e-05, |
| "loss": 0.2922, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2916344702243805, |
| "step": 605, |
| "valid_targets_mean": 2051.1, |
| "valid_targets_min": 783 |
| }, |
| { |
| "epoch": 0.9791332263242376, |
| "grad_norm": 0.7718877500600386, |
| "learning_rate": 3.981067313102677e-05, |
| "loss": 0.2868, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.28497275710105896, |
| "step": 610, |
| "valid_targets_mean": 1904.2, |
| "valid_targets_min": 784 |
| }, |
| { |
| "epoch": 0.9871589085072231, |
| "grad_norm": 0.7608096902947907, |
| "learning_rate": 3.979952445698847e-05, |
| "loss": 0.2909, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.26857396960258484, |
| "step": 615, |
| "valid_targets_mean": 1962.2, |
| "valid_targets_min": 744 |
| }, |
| { |
| "epoch": 0.9951845906902087, |
| "grad_norm": 0.6228654680626398, |
| "learning_rate": 3.978805850788919e-05, |
| "loss": 0.2987, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.23795419931411743, |
| "step": 620, |
| "valid_targets_mean": 2535.7, |
| "valid_targets_min": 892 |
| }, |
| { |
| "epoch": 1.0032102728731942, |
| "grad_norm": 0.8226067743998671, |
| "learning_rate": 3.9776275467463645e-05, |
| "loss": 0.2819, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2510879337787628, |
| "step": 625, |
| "valid_targets_mean": 1790.2, |
| "valid_targets_min": 940 |
| }, |
| { |
| "epoch": 1.0112359550561798, |
| "grad_norm": 0.9254700139665087, |
| "learning_rate": 3.9764175524527713e-05, |
| "loss": 0.2686, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.27632659673690796, |
| "step": 630, |
| "valid_targets_mean": 1515.6, |
| "valid_targets_min": 548 |
| }, |
| { |
| "epoch": 1.0192616372391654, |
| "grad_norm": 0.8465617431259781, |
| "learning_rate": 3.975175887297545e-05, |
| "loss": 0.2817, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.30026766657829285, |
| "step": 635, |
| "valid_targets_mean": 1732.3, |
| "valid_targets_min": 798 |
| }, |
| { |
| "epoch": 1.0272873194221508, |
| "grad_norm": 0.6931817861755858, |
| "learning_rate": 3.9739025711775984e-05, |
| "loss": 0.2677, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.27642396092414856, |
| "step": 640, |
| "valid_targets_mean": 2458.4, |
| "valid_targets_min": 593 |
| }, |
| { |
| "epoch": 1.0353130016051364, |
| "grad_norm": 0.8037354268649257, |
| "learning_rate": 3.972597624497029e-05, |
| "loss": 0.2701, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.27763617038726807, |
| "step": 645, |
| "valid_targets_mean": 1996.9, |
| "valid_targets_min": 916 |
| }, |
| { |
| "epoch": 1.043338683788122, |
| "grad_norm": 0.7384503118506207, |
| "learning_rate": 3.971261068166796e-05, |
| "loss": 0.2676, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.24708183109760284, |
| "step": 650, |
| "valid_targets_mean": 1862.0, |
| "valid_targets_min": 768 |
| }, |
| { |
| "epoch": 1.0513643659711076, |
| "grad_norm": 0.7212274419919188, |
| "learning_rate": 3.969892923604383e-05, |
| "loss": 0.2686, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3036978244781494, |
| "step": 655, |
| "valid_targets_mean": 2355.9, |
| "valid_targets_min": 745 |
| }, |
| { |
| "epoch": 1.0593900481540932, |
| "grad_norm": 0.843707373832904, |
| "learning_rate": 3.9684932127334555e-05, |
| "loss": 0.2824, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.29731786251068115, |
| "step": 660, |
| "valid_targets_mean": 2513.6, |
| "valid_targets_min": 821 |
| }, |
| { |
| "epoch": 1.0674157303370786, |
| "grad_norm": 0.8252091123984003, |
| "learning_rate": 3.967061957983509e-05, |
| "loss": 0.2792, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2805379629135132, |
| "step": 665, |
| "valid_targets_mean": 2306.0, |
| "valid_targets_min": 928 |
| }, |
| { |
| "epoch": 1.0754414125200642, |
| "grad_norm": 0.7679243083152455, |
| "learning_rate": 3.965599182289511e-05, |
| "loss": 0.2555, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2966977655887604, |
| "step": 670, |
| "valid_targets_mean": 2099.9, |
| "valid_targets_min": 703 |
| }, |
| { |
| "epoch": 1.0834670947030498, |
| "grad_norm": 0.7324918129142989, |
| "learning_rate": 3.964104909091531e-05, |
| "loss": 0.2663, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.273954838514328, |
| "step": 675, |
| "valid_targets_mean": 2465.0, |
| "valid_targets_min": 896 |
| }, |
| { |
| "epoch": 1.0914927768860354, |
| "grad_norm": 0.9526343036354475, |
| "learning_rate": 3.962579162334368e-05, |
| "loss": 0.2659, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2664143145084381, |
| "step": 680, |
| "valid_targets_mean": 1999.2, |
| "valid_targets_min": 933 |
| }, |
| { |
| "epoch": 1.0995184590690208, |
| "grad_norm": 0.7991262471661897, |
| "learning_rate": 3.961021966467165e-05, |
| "loss": 0.2738, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.31175559759140015, |
| "step": 685, |
| "valid_targets_mean": 2189.3, |
| "valid_targets_min": 770 |
| }, |
| { |
| "epoch": 1.1075441412520064, |
| "grad_norm": 0.7616807096516526, |
| "learning_rate": 3.9594333464430155e-05, |
| "loss": 0.2769, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2699921429157257, |
| "step": 690, |
| "valid_targets_mean": 2126.8, |
| "valid_targets_min": 868 |
| }, |
| { |
| "epoch": 1.115569823434992, |
| "grad_norm": 0.6893907566892634, |
| "learning_rate": 3.957813327718568e-05, |
| "loss": 0.2536, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2612619996070862, |
| "step": 695, |
| "valid_targets_mean": 2350.4, |
| "valid_targets_min": 1039 |
| }, |
| { |
| "epoch": 1.1235955056179776, |
| "grad_norm": 0.759736214908413, |
| "learning_rate": 3.956161936253615e-05, |
| "loss": 0.2769, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2773323059082031, |
| "step": 700, |
| "valid_targets_mean": 2099.1, |
| "valid_targets_min": 1106 |
| }, |
| { |
| "epoch": 1.131621187800963, |
| "grad_norm": 0.7969447025466453, |
| "learning_rate": 3.954479198510676e-05, |
| "loss": 0.2837, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.284991979598999, |
| "step": 705, |
| "valid_targets_mean": 2341.9, |
| "valid_targets_min": 825 |
| }, |
| { |
| "epoch": 1.1396468699839486, |
| "grad_norm": 0.8759437781132143, |
| "learning_rate": 3.952765141454578e-05, |
| "loss": 0.2598, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2301260232925415, |
| "step": 710, |
| "valid_targets_mean": 1502.1, |
| "valid_targets_min": 802 |
| }, |
| { |
| "epoch": 1.1476725521669342, |
| "grad_norm": 1.5236051002273119, |
| "learning_rate": 3.951019792552018e-05, |
| "loss": 0.2759, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2769410014152527, |
| "step": 715, |
| "valid_targets_mean": 1819.7, |
| "valid_targets_min": 788 |
| }, |
| { |
| "epoch": 1.1556982343499198, |
| "grad_norm": 0.8290152147933497, |
| "learning_rate": 3.949243179771126e-05, |
| "loss": 0.2765, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.26144346594810486, |
| "step": 720, |
| "valid_targets_mean": 1860.0, |
| "valid_targets_min": 634 |
| }, |
| { |
| "epoch": 1.1637239165329052, |
| "grad_norm": 0.8614047618513456, |
| "learning_rate": 3.947435331581017e-05, |
| "loss": 0.264, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2969715893268585, |
| "step": 725, |
| "valid_targets_mean": 1768.7, |
| "valid_targets_min": 660 |
| }, |
| { |
| "epoch": 1.1717495987158908, |
| "grad_norm": 0.8263928626213929, |
| "learning_rate": 3.945596276951333e-05, |
| "loss": 0.2614, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2564338147640228, |
| "step": 730, |
| "valid_targets_mean": 1887.8, |
| "valid_targets_min": 799 |
| }, |
| { |
| "epoch": 1.1797752808988764, |
| "grad_norm": 0.7152475805264833, |
| "learning_rate": 3.943726045351782e-05, |
| "loss": 0.2745, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.28374791145324707, |
| "step": 735, |
| "valid_targets_mean": 2314.3, |
| "valid_targets_min": 666 |
| }, |
| { |
| "epoch": 1.187800963081862, |
| "grad_norm": 0.8571151233033966, |
| "learning_rate": 3.941824666751659e-05, |
| "loss": 0.2709, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.26686954498291016, |
| "step": 740, |
| "valid_targets_mean": 1607.6, |
| "valid_targets_min": 596 |
| }, |
| { |
| "epoch": 1.1958266452648476, |
| "grad_norm": 0.86405780600893, |
| "learning_rate": 3.939892171619375e-05, |
| "loss": 0.2675, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2871187925338745, |
| "step": 745, |
| "valid_targets_mean": 1871.7, |
| "valid_targets_min": 679 |
| }, |
| { |
| "epoch": 1.203852327447833, |
| "grad_norm": 0.717709948229875, |
| "learning_rate": 3.9379285909219616e-05, |
| "loss": 0.2722, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.28010597825050354, |
| "step": 750, |
| "valid_targets_mean": 2421.4, |
| "valid_targets_min": 647 |
| }, |
| { |
| "epoch": 1.2118780096308186, |
| "grad_norm": 0.654139274364583, |
| "learning_rate": 3.935933956124578e-05, |
| "loss": 0.2486, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2108229696750641, |
| "step": 755, |
| "valid_targets_mean": 1986.1, |
| "valid_targets_min": 504 |
| }, |
| { |
| "epoch": 1.2199036918138042, |
| "grad_norm": 0.7787020251350064, |
| "learning_rate": 3.933908299190006e-05, |
| "loss": 0.2538, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.22526943683624268, |
| "step": 760, |
| "valid_targets_mean": 1925.8, |
| "valid_targets_min": 782 |
| }, |
| { |
| "epoch": 1.2279293739967898, |
| "grad_norm": 0.6960673012286028, |
| "learning_rate": 3.931851652578137e-05, |
| "loss": 0.2691, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.28950342535972595, |
| "step": 765, |
| "valid_targets_mean": 2596.1, |
| "valid_targets_min": 715 |
| }, |
| { |
| "epoch": 1.2359550561797752, |
| "grad_norm": 0.7791017658890873, |
| "learning_rate": 3.929764049245454e-05, |
| "loss": 0.2731, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3156774640083313, |
| "step": 770, |
| "valid_targets_mean": 2444.2, |
| "valid_targets_min": 859 |
| }, |
| { |
| "epoch": 1.2439807383627608, |
| "grad_norm": 0.7183503125932852, |
| "learning_rate": 3.9276455226445015e-05, |
| "loss": 0.2643, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3058626055717468, |
| "step": 775, |
| "valid_targets_mean": 2245.4, |
| "valid_targets_min": 850 |
| }, |
| { |
| "epoch": 1.2520064205457464, |
| "grad_norm": 0.6695581705684971, |
| "learning_rate": 3.92549610672335e-05, |
| "loss": 0.2681, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.289934903383255, |
| "step": 780, |
| "valid_targets_mean": 2771.9, |
| "valid_targets_min": 684 |
| }, |
| { |
| "epoch": 1.260032102728732, |
| "grad_norm": 0.6866570176470886, |
| "learning_rate": 3.9233158359250526e-05, |
| "loss": 0.2608, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.23689235746860504, |
| "step": 785, |
| "valid_targets_mean": 1918.2, |
| "valid_targets_min": 607 |
| }, |
| { |
| "epoch": 1.2680577849117176, |
| "grad_norm": 0.7822630337022523, |
| "learning_rate": 3.9211047451870925e-05, |
| "loss": 0.2662, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2988463044166565, |
| "step": 790, |
| "valid_targets_mean": 2311.7, |
| "valid_targets_min": 771 |
| }, |
| { |
| "epoch": 1.276083467094703, |
| "grad_norm": 0.8317062530284344, |
| "learning_rate": 3.9188628699408226e-05, |
| "loss": 0.2749, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.31084558367729187, |
| "step": 795, |
| "valid_targets_mean": 1966.4, |
| "valid_targets_min": 723 |
| }, |
| { |
| "epoch": 1.2841091492776886, |
| "grad_norm": 0.72484686674938, |
| "learning_rate": 3.916590246110899e-05, |
| "loss": 0.2561, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2934309244155884, |
| "step": 800, |
| "valid_targets_mean": 2700.1, |
| "valid_targets_min": 748 |
| }, |
| { |
| "epoch": 1.2921348314606742, |
| "grad_norm": 0.8156555683738264, |
| "learning_rate": 3.914286910114705e-05, |
| "loss": 0.2662, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.29776060581207275, |
| "step": 805, |
| "valid_targets_mean": 2074.9, |
| "valid_targets_min": 705 |
| }, |
| { |
| "epoch": 1.3001605136436596, |
| "grad_norm": 0.8183857431272717, |
| "learning_rate": 3.9119528988617676e-05, |
| "loss": 0.2539, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.25548940896987915, |
| "step": 810, |
| "valid_targets_mean": 1921.6, |
| "valid_targets_min": 718 |
| }, |
| { |
| "epoch": 1.3081861958266452, |
| "grad_norm": 0.7288663029670344, |
| "learning_rate": 3.909588249753164e-05, |
| "loss": 0.2738, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2411450296640396, |
| "step": 815, |
| "valid_targets_mean": 2309.4, |
| "valid_targets_min": 779 |
| }, |
| { |
| "epoch": 1.3162118780096308, |
| "grad_norm": 0.8147197023616638, |
| "learning_rate": 3.907193000680924e-05, |
| "loss": 0.2743, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.29190874099731445, |
| "step": 820, |
| "valid_targets_mean": 1898.1, |
| "valid_targets_min": 700 |
| }, |
| { |
| "epoch": 1.3242375601926164, |
| "grad_norm": 0.8065187260999866, |
| "learning_rate": 3.9047671900274256e-05, |
| "loss": 0.256, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2601572275161743, |
| "step": 825, |
| "valid_targets_mean": 1808.4, |
| "valid_targets_min": 658 |
| }, |
| { |
| "epoch": 1.332263242375602, |
| "grad_norm": 0.8207215518210806, |
| "learning_rate": 3.9023108566647746e-05, |
| "loss": 0.2575, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2769230604171753, |
| "step": 830, |
| "valid_targets_mean": 2078.6, |
| "valid_targets_min": 613 |
| }, |
| { |
| "epoch": 1.3402889245585876, |
| "grad_norm": 0.924972736057203, |
| "learning_rate": 3.899824039954185e-05, |
| "loss": 0.2565, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.24372698366641998, |
| "step": 835, |
| "valid_targets_mean": 1450.0, |
| "valid_targets_min": 648 |
| }, |
| { |
| "epoch": 1.348314606741573, |
| "grad_norm": 0.714092931128622, |
| "learning_rate": 3.897306779745347e-05, |
| "loss": 0.2789, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.271422415971756, |
| "step": 840, |
| "valid_targets_mean": 2285.3, |
| "valid_targets_min": 735 |
| }, |
| { |
| "epoch": 1.3563402889245586, |
| "grad_norm": 0.8417283546200632, |
| "learning_rate": 3.89475911637579e-05, |
| "loss": 0.2758, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2518080770969391, |
| "step": 845, |
| "valid_targets_mean": 1609.2, |
| "valid_targets_min": 621 |
| }, |
| { |
| "epoch": 1.3643659711075442, |
| "grad_norm": 0.7852542096242522, |
| "learning_rate": 3.892181090670233e-05, |
| "loss": 0.2755, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2653108239173889, |
| "step": 850, |
| "valid_targets_mean": 1744.6, |
| "valid_targets_min": 806 |
| }, |
| { |
| "epoch": 1.3723916532905296, |
| "grad_norm": 0.7958802575764924, |
| "learning_rate": 3.8895727439399366e-05, |
| "loss": 0.2567, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2511981129646301, |
| "step": 855, |
| "valid_targets_mean": 1641.1, |
| "valid_targets_min": 1017 |
| }, |
| { |
| "epoch": 1.3804173354735152, |
| "grad_norm": 0.7781458043061429, |
| "learning_rate": 3.8869341179820314e-05, |
| "loss": 0.2689, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2821986973285675, |
| "step": 860, |
| "valid_targets_mean": 2122.4, |
| "valid_targets_min": 882 |
| }, |
| { |
| "epoch": 1.3884430176565008, |
| "grad_norm": 0.9086989564254825, |
| "learning_rate": 3.884265255078859e-05, |
| "loss": 0.2651, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2702217102050781, |
| "step": 865, |
| "valid_targets_mean": 1887.4, |
| "valid_targets_min": 746 |
| }, |
| { |
| "epoch": 1.3964686998394864, |
| "grad_norm": 0.774043855966981, |
| "learning_rate": 3.881566197997286e-05, |
| "loss": 0.2624, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2534475326538086, |
| "step": 870, |
| "valid_targets_mean": 2067.0, |
| "valid_targets_min": 919 |
| }, |
| { |
| "epoch": 1.404494382022472, |
| "grad_norm": 0.7066842171984723, |
| "learning_rate": 3.8788369899880225e-05, |
| "loss": 0.2629, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.28810229897499084, |
| "step": 875, |
| "valid_targets_mean": 2462.9, |
| "valid_targets_min": 762 |
| }, |
| { |
| "epoch": 1.4125200642054574, |
| "grad_norm": 0.7708815207296795, |
| "learning_rate": 3.8760776747849303e-05, |
| "loss": 0.2641, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.26532846689224243, |
| "step": 880, |
| "valid_targets_mean": 1815.2, |
| "valid_targets_min": 764 |
| }, |
| { |
| "epoch": 1.420545746388443, |
| "grad_norm": 0.75205317271865, |
| "learning_rate": 3.873288296604317e-05, |
| "loss": 0.2761, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2786597013473511, |
| "step": 885, |
| "valid_targets_mean": 1939.7, |
| "valid_targets_min": 894 |
| }, |
| { |
| "epoch": 1.4285714285714286, |
| "grad_norm": 0.672307215560877, |
| "learning_rate": 3.870468900144233e-05, |
| "loss": 0.2782, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.28444236516952515, |
| "step": 890, |
| "valid_targets_mean": 2277.8, |
| "valid_targets_min": 836 |
| }, |
| { |
| "epoch": 1.4365971107544142, |
| "grad_norm": 0.6608204156050805, |
| "learning_rate": 3.8676195305837536e-05, |
| "loss": 0.2557, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2395007461309433, |
| "step": 895, |
| "valid_targets_mean": 2169.6, |
| "valid_targets_min": 656 |
| }, |
| { |
| "epoch": 1.4446227929373996, |
| "grad_norm": 0.7138327208605213, |
| "learning_rate": 3.864740233582252e-05, |
| "loss": 0.2817, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2664600908756256, |
| "step": 900, |
| "valid_targets_mean": 2115.5, |
| "valid_targets_min": 467 |
| }, |
| { |
| "epoch": 1.4526484751203852, |
| "grad_norm": 0.6925022486252039, |
| "learning_rate": 3.8618310552786715e-05, |
| "loss": 0.2631, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2339175045490265, |
| "step": 905, |
| "valid_targets_mean": 2044.7, |
| "valid_targets_min": 748 |
| }, |
| { |
| "epoch": 1.4606741573033708, |
| "grad_norm": 0.8534400357923534, |
| "learning_rate": 3.858892042290785e-05, |
| "loss": 0.2625, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.29541435837745667, |
| "step": 910, |
| "valid_targets_mean": 1677.3, |
| "valid_targets_min": 761 |
| }, |
| { |
| "epoch": 1.4686998394863564, |
| "grad_norm": 0.7239107539611367, |
| "learning_rate": 3.855923241714447e-05, |
| "loss": 0.268, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.27571260929107666, |
| "step": 915, |
| "valid_targets_mean": 2073.4, |
| "valid_targets_min": 675 |
| }, |
| { |
| "epoch": 1.476725521669342, |
| "grad_norm": 0.8487942181629813, |
| "learning_rate": 3.852924701122839e-05, |
| "loss": 0.2654, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.29242533445358276, |
| "step": 920, |
| "valid_targets_mean": 1567.2, |
| "valid_targets_min": 713 |
| }, |
| { |
| "epoch": 1.4847512038523274, |
| "grad_norm": 0.7010812875356174, |
| "learning_rate": 3.8498964685657084e-05, |
| "loss": 0.2678, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.28116998076438904, |
| "step": 925, |
| "valid_targets_mean": 2125.7, |
| "valid_targets_min": 797 |
| }, |
| { |
| "epoch": 1.492776886035313, |
| "grad_norm": 0.7241807089136368, |
| "learning_rate": 3.846838592568599e-05, |
| "loss": 0.2684, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.28465375304222107, |
| "step": 930, |
| "valid_targets_mean": 2401.2, |
| "valid_targets_min": 694 |
| }, |
| { |
| "epoch": 1.5008025682182986, |
| "grad_norm": 0.7316004281768466, |
| "learning_rate": 3.84375112213207e-05, |
| "loss": 0.2645, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.25454214215278625, |
| "step": 935, |
| "valid_targets_mean": 1856.4, |
| "valid_targets_min": 764 |
| }, |
| { |
| "epoch": 1.508828250401284, |
| "grad_norm": 0.7770880009110686, |
| "learning_rate": 3.840634106730915e-05, |
| "loss": 0.2577, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.24702686071395874, |
| "step": 940, |
| "valid_targets_mean": 1784.5, |
| "valid_targets_min": 854 |
| }, |
| { |
| "epoch": 1.5168539325842696, |
| "grad_norm": 0.7275439210958472, |
| "learning_rate": 3.837487596313366e-05, |
| "loss": 0.2743, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.28921470046043396, |
| "step": 945, |
| "valid_targets_mean": 1958.6, |
| "valid_targets_min": 1030 |
| }, |
| { |
| "epoch": 1.5248796147672552, |
| "grad_norm": 0.7295956985847399, |
| "learning_rate": 3.834311641300296e-05, |
| "loss": 0.2458, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2506203055381775, |
| "step": 950, |
| "valid_targets_mean": 2109.1, |
| "valid_targets_min": 875 |
| }, |
| { |
| "epoch": 1.5329052969502408, |
| "grad_norm": 0.7788207921479691, |
| "learning_rate": 3.831106292584406e-05, |
| "loss": 0.2625, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2641506493091583, |
| "step": 955, |
| "valid_targets_mean": 1837.2, |
| "valid_targets_min": 635 |
| }, |
| { |
| "epoch": 1.5409309791332264, |
| "grad_norm": 1.0545045402423714, |
| "learning_rate": 3.827871601529417e-05, |
| "loss": 0.2701, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.28296715021133423, |
| "step": 960, |
| "valid_targets_mean": 1895.5, |
| "valid_targets_min": 1085 |
| }, |
| { |
| "epoch": 1.548956661316212, |
| "grad_norm": 0.8057606395413027, |
| "learning_rate": 3.8246076199692395e-05, |
| "loss": 0.2581, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2991617023944855, |
| "step": 965, |
| "valid_targets_mean": 2077.7, |
| "valid_targets_min": 722 |
| }, |
| { |
| "epoch": 1.5569823434991974, |
| "grad_norm": 0.6927010096471385, |
| "learning_rate": 3.821314400207148e-05, |
| "loss": 0.2614, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2451082170009613, |
| "step": 970, |
| "valid_targets_mean": 1981.5, |
| "valid_targets_min": 898 |
| }, |
| { |
| "epoch": 1.565008025682183, |
| "grad_norm": 0.7110441501753103, |
| "learning_rate": 3.817991995014939e-05, |
| "loss": 0.263, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.29124924540519714, |
| "step": 975, |
| "valid_targets_mean": 2240.8, |
| "valid_targets_min": 642 |
| }, |
| { |
| "epoch": 1.5730337078651684, |
| "grad_norm": 0.6885281006909981, |
| "learning_rate": 3.8146404576320894e-05, |
| "loss": 0.2476, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.23632869124412537, |
| "step": 980, |
| "valid_targets_mean": 1979.8, |
| "valid_targets_min": 657 |
| }, |
| { |
| "epoch": 1.581059390048154, |
| "grad_norm": 0.7522169112208279, |
| "learning_rate": 3.8112598417649015e-05, |
| "loss": 0.2664, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2756073772907257, |
| "step": 985, |
| "valid_targets_mean": 2060.7, |
| "valid_targets_min": 663 |
| }, |
| { |
| "epoch": 1.5890850722311396, |
| "grad_norm": 0.8786648311794397, |
| "learning_rate": 3.80785020158564e-05, |
| "loss": 0.2627, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.25147706270217896, |
| "step": 990, |
| "valid_targets_mean": 1561.0, |
| "valid_targets_min": 793 |
| }, |
| { |
| "epoch": 1.5971107544141252, |
| "grad_norm": 0.7195963819191232, |
| "learning_rate": 3.804411591731668e-05, |
| "loss": 0.2649, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2796766459941864, |
| "step": 995, |
| "valid_targets_mean": 2145.2, |
| "valid_targets_min": 892 |
| }, |
| { |
| "epoch": 1.6051364365971108, |
| "grad_norm": 0.8812045734435614, |
| "learning_rate": 3.80094406730457e-05, |
| "loss": 0.2634, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.23850060999393463, |
| "step": 1000, |
| "valid_targets_mean": 2386.0, |
| "valid_targets_min": 732 |
| }, |
| { |
| "epoch": 1.6131621187800964, |
| "grad_norm": 0.7667863911451553, |
| "learning_rate": 3.7974476838692656e-05, |
| "loss": 0.2635, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.268310546875, |
| "step": 1005, |
| "valid_targets_mean": 1975.6, |
| "valid_targets_min": 748 |
| }, |
| { |
| "epoch": 1.621187800963082, |
| "grad_norm": 0.7545530524527456, |
| "learning_rate": 3.793922497453124e-05, |
| "loss": 0.2479, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.234517440199852, |
| "step": 1010, |
| "valid_targets_mean": 1716.2, |
| "valid_targets_min": 649 |
| }, |
| { |
| "epoch": 1.6292134831460674, |
| "grad_norm": 0.7013505596294985, |
| "learning_rate": 3.790368564545067e-05, |
| "loss": 0.2607, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.28479787707328796, |
| "step": 1015, |
| "valid_targets_mean": 2393.4, |
| "valid_targets_min": 684 |
| }, |
| { |
| "epoch": 1.637239165329053, |
| "grad_norm": 0.8351965152529512, |
| "learning_rate": 3.786785942094656e-05, |
| "loss": 0.2544, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2289065718650818, |
| "step": 1020, |
| "valid_targets_mean": 1477.6, |
| "valid_targets_min": 244 |
| }, |
| { |
| "epoch": 1.6452648475120384, |
| "grad_norm": 0.8048989954188138, |
| "learning_rate": 3.783174687511188e-05, |
| "loss": 0.2614, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.24464435875415802, |
| "step": 1025, |
| "valid_targets_mean": 1876.4, |
| "valid_targets_min": 810 |
| }, |
| { |
| "epoch": 1.653290529695024, |
| "grad_norm": 0.6657920575704092, |
| "learning_rate": 3.7795348586627696e-05, |
| "loss": 0.2563, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2421034723520279, |
| "step": 1030, |
| "valid_targets_mean": 2440.4, |
| "valid_targets_min": 704 |
| }, |
| { |
| "epoch": 1.6613162118780096, |
| "grad_norm": 0.6978432635250694, |
| "learning_rate": 3.7758665138753943e-05, |
| "loss": 0.2774, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.25340160727500916, |
| "step": 1035, |
| "valid_targets_mean": 2174.9, |
| "valid_targets_min": 604 |
| }, |
| { |
| "epoch": 1.6693418940609952, |
| "grad_norm": 0.7036409883833363, |
| "learning_rate": 3.7721697119320054e-05, |
| "loss": 0.2734, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2678963541984558, |
| "step": 1040, |
| "valid_targets_mean": 2500.4, |
| "valid_targets_min": 750 |
| }, |
| { |
| "epoch": 1.6773675762439808, |
| "grad_norm": 0.7683015358822927, |
| "learning_rate": 3.768444512071553e-05, |
| "loss": 0.2525, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.24290819466114044, |
| "step": 1045, |
| "valid_targets_mean": 1559.9, |
| "valid_targets_min": 611 |
| }, |
| { |
| "epoch": 1.6853932584269664, |
| "grad_norm": 0.7747543733128794, |
| "learning_rate": 3.7646909739880486e-05, |
| "loss": 0.2688, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3120294213294983, |
| "step": 1050, |
| "valid_targets_mean": 2086.7, |
| "valid_targets_min": 564 |
| }, |
| { |
| "epoch": 1.6934189406099518, |
| "grad_norm": 0.7582150632753363, |
| "learning_rate": 3.760909157829604e-05, |
| "loss": 0.2697, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2633521556854248, |
| "step": 1055, |
| "valid_targets_mean": 1768.8, |
| "valid_targets_min": 700 |
| }, |
| { |
| "epoch": 1.7014446227929374, |
| "grad_norm": 0.782741178401804, |
| "learning_rate": 3.75709912419747e-05, |
| "loss": 0.2615, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2791171669960022, |
| "step": 1060, |
| "valid_targets_mean": 1728.7, |
| "valid_targets_min": 909 |
| }, |
| { |
| "epoch": 1.709470304975923, |
| "grad_norm": 0.8113224135725746, |
| "learning_rate": 3.7532609341450655e-05, |
| "loss": 0.2662, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.257160484790802, |
| "step": 1065, |
| "valid_targets_mean": 2120.3, |
| "valid_targets_min": 773 |
| }, |
| { |
| "epoch": 1.7174959871589084, |
| "grad_norm": 0.7462354824079133, |
| "learning_rate": 3.749394649176998e-05, |
| "loss": 0.2646, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2856426239013672, |
| "step": 1070, |
| "valid_targets_mean": 2123.1, |
| "valid_targets_min": 765 |
| }, |
| { |
| "epoch": 1.725521669341894, |
| "grad_norm": 0.7126762615208581, |
| "learning_rate": 3.745500331248078e-05, |
| "loss": 0.2515, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.24018818140029907, |
| "step": 1075, |
| "valid_targets_mean": 1817.8, |
| "valid_targets_min": 865 |
| }, |
| { |
| "epoch": 1.7335473515248796, |
| "grad_norm": 0.6898127387055668, |
| "learning_rate": 3.741578042762329e-05, |
| "loss": 0.2599, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.26695871353149414, |
| "step": 1080, |
| "valid_targets_mean": 2342.2, |
| "valid_targets_min": 770 |
| }, |
| { |
| "epoch": 1.7415730337078652, |
| "grad_norm": 0.66757954744143, |
| "learning_rate": 3.737627846571982e-05, |
| "loss": 0.2467, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.22607743740081787, |
| "step": 1085, |
| "valid_targets_mean": 2161.1, |
| "valid_targets_min": 856 |
| }, |
| { |
| "epoch": 1.7495987158908508, |
| "grad_norm": 0.6652154306317639, |
| "learning_rate": 3.733649805976474e-05, |
| "loss": 0.2564, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2927885055541992, |
| "step": 1090, |
| "valid_targets_mean": 2548.8, |
| "valid_targets_min": 715 |
| }, |
| { |
| "epoch": 1.7576243980738364, |
| "grad_norm": 0.7237170273830091, |
| "learning_rate": 3.729643984721431e-05, |
| "loss": 0.2477, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2599429190158844, |
| "step": 1095, |
| "valid_targets_mean": 2250.6, |
| "valid_targets_min": 1026 |
| }, |
| { |
| "epoch": 1.7656500802568218, |
| "grad_norm": 0.7141988738983245, |
| "learning_rate": 3.725610446997646e-05, |
| "loss": 0.2667, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2560562193393707, |
| "step": 1100, |
| "valid_targets_mean": 2340.1, |
| "valid_targets_min": 788 |
| }, |
| { |
| "epoch": 1.7736757624398074, |
| "grad_norm": 1.1500842386133312, |
| "learning_rate": 3.7215492574400514e-05, |
| "loss": 0.275, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.30140018463134766, |
| "step": 1105, |
| "valid_targets_mean": 2404.6, |
| "valid_targets_min": 691 |
| }, |
| { |
| "epoch": 1.7817014446227928, |
| "grad_norm": 0.6808585287726022, |
| "learning_rate": 3.717460481126684e-05, |
| "loss": 0.2703, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3125297427177429, |
| "step": 1110, |
| "valid_targets_mean": 2692.1, |
| "valid_targets_min": 912 |
| }, |
| { |
| "epoch": 1.7897271268057784, |
| "grad_norm": 0.7248268534788489, |
| "learning_rate": 3.7133441835776386e-05, |
| "loss": 0.2792, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2808183431625366, |
| "step": 1115, |
| "valid_targets_mean": 2375.7, |
| "valid_targets_min": 878 |
| }, |
| { |
| "epoch": 1.797752808988764, |
| "grad_norm": 0.8633733319106702, |
| "learning_rate": 3.7092004307540235e-05, |
| "loss": 0.2577, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.29408037662506104, |
| "step": 1120, |
| "valid_targets_mean": 1460.2, |
| "valid_targets_min": 750 |
| }, |
| { |
| "epoch": 1.8057784911717496, |
| "grad_norm": 0.7680940895196984, |
| "learning_rate": 3.7050292890568995e-05, |
| "loss": 0.2916, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2827860116958618, |
| "step": 1125, |
| "valid_targets_mean": 2280.7, |
| "valid_targets_min": 699 |
| }, |
| { |
| "epoch": 1.8138041733547352, |
| "grad_norm": 0.7869442484722307, |
| "learning_rate": 3.700830825326218e-05, |
| "loss": 0.2661, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.26617157459259033, |
| "step": 1130, |
| "valid_targets_mean": 1957.4, |
| "valid_targets_min": 824 |
| }, |
| { |
| "epoch": 1.8218298555377208, |
| "grad_norm": 0.7696885298751593, |
| "learning_rate": 3.696605106839747e-05, |
| "loss": 0.2939, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2644560933113098, |
| "step": 1135, |
| "valid_targets_mean": 1796.3, |
| "valid_targets_min": 715 |
| }, |
| { |
| "epoch": 1.8298555377207064, |
| "grad_norm": 0.8922311571098936, |
| "learning_rate": 3.6923522013119964e-05, |
| "loss": 0.2555, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2608848214149475, |
| "step": 1140, |
| "valid_targets_mean": 1475.7, |
| "valid_targets_min": 710 |
| }, |
| { |
| "epoch": 1.8378812199036918, |
| "grad_norm": 0.6335228244683325, |
| "learning_rate": 3.688072176893132e-05, |
| "loss": 0.2682, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.288246750831604, |
| "step": 1145, |
| "valid_targets_mean": 2936.8, |
| "valid_targets_min": 645 |
| }, |
| { |
| "epoch": 1.8459069020866774, |
| "grad_norm": 0.7476777076459231, |
| "learning_rate": 3.683765102167881e-05, |
| "loss": 0.2552, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.27494877576828003, |
| "step": 1150, |
| "valid_targets_mean": 2268.6, |
| "valid_targets_min": 698 |
| }, |
| { |
| "epoch": 1.8539325842696628, |
| "grad_norm": 0.7507784672507724, |
| "learning_rate": 3.679431046154438e-05, |
| "loss": 0.2557, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.27138835191726685, |
| "step": 1155, |
| "valid_targets_mean": 2028.2, |
| "valid_targets_min": 820 |
| }, |
| { |
| "epoch": 1.8619582664526484, |
| "grad_norm": 0.775484617594402, |
| "learning_rate": 3.675070078303352e-05, |
| "loss": 0.2617, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2535039782524109, |
| "step": 1160, |
| "valid_targets_mean": 1500.2, |
| "valid_targets_min": 692 |
| }, |
| { |
| "epoch": 1.869983948635634, |
| "grad_norm": 0.7919636650285514, |
| "learning_rate": 3.670682268496421e-05, |
| "loss": 0.2554, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.28811001777648926, |
| "step": 1165, |
| "valid_targets_mean": 2233.0, |
| "valid_targets_min": 778 |
| }, |
| { |
| "epoch": 1.8780096308186196, |
| "grad_norm": 0.8269276141613667, |
| "learning_rate": 3.6662676870455676e-05, |
| "loss": 0.2575, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.22544220089912415, |
| "step": 1170, |
| "valid_targets_mean": 1450.8, |
| "valid_targets_min": 632 |
| }, |
| { |
| "epoch": 1.8860353130016052, |
| "grad_norm": 0.7176606864299451, |
| "learning_rate": 3.661826404691712e-05, |
| "loss": 0.2548, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2399870753288269, |
| "step": 1175, |
| "valid_targets_mean": 1901.9, |
| "valid_targets_min": 703 |
| }, |
| { |
| "epoch": 1.8940609951845908, |
| "grad_norm": 0.6785006811736799, |
| "learning_rate": 3.657358492603641e-05, |
| "loss": 0.2719, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.28619182109832764, |
| "step": 1180, |
| "valid_targets_mean": 2383.9, |
| "valid_targets_min": 773 |
| }, |
| { |
| "epoch": 1.9020866773675762, |
| "grad_norm": 0.7006806520786782, |
| "learning_rate": 3.652864022376866e-05, |
| "loss": 0.2548, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2502840459346771, |
| "step": 1185, |
| "valid_targets_mean": 2024.3, |
| "valid_targets_min": 744 |
| }, |
| { |
| "epoch": 1.9101123595505618, |
| "grad_norm": 0.7555474304079293, |
| "learning_rate": 3.648343066032476e-05, |
| "loss": 0.2659, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.22855910658836365, |
| "step": 1190, |
| "valid_targets_mean": 1711.2, |
| "valid_targets_min": 641 |
| }, |
| { |
| "epoch": 1.9181380417335474, |
| "grad_norm": 0.7676954013858329, |
| "learning_rate": 3.643795696015985e-05, |
| "loss": 0.2515, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.26554515957832336, |
| "step": 1195, |
| "valid_targets_mean": 1831.3, |
| "valid_targets_min": 675 |
| }, |
| { |
| "epoch": 1.9261637239165328, |
| "grad_norm": 5.5556263099749215, |
| "learning_rate": 3.639221985196166e-05, |
| "loss": 0.2483, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2238149791955948, |
| "step": 1200, |
| "valid_targets_mean": 1427.6, |
| "valid_targets_min": 727 |
| }, |
| { |
| "epoch": 1.9341894060995184, |
| "grad_norm": 0.7081355832362357, |
| "learning_rate": 3.634622006863891e-05, |
| "loss": 0.2597, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2723257541656494, |
| "step": 1205, |
| "valid_targets_mean": 2102.0, |
| "valid_targets_min": 522 |
| }, |
| { |
| "epoch": 1.942215088282504, |
| "grad_norm": 0.7197674750606493, |
| "learning_rate": 3.62999583473095e-05, |
| "loss": 0.272, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2823481857776642, |
| "step": 1210, |
| "valid_targets_mean": 1959.4, |
| "valid_targets_min": 620 |
| }, |
| { |
| "epoch": 1.9502407704654896, |
| "grad_norm": 0.7351267896359547, |
| "learning_rate": 3.625343542928874e-05, |
| "loss": 0.2515, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.23494531214237213, |
| "step": 1215, |
| "valid_targets_mean": 1691.6, |
| "valid_targets_min": 721 |
| }, |
| { |
| "epoch": 1.9582664526484752, |
| "grad_norm": 0.8091637524191202, |
| "learning_rate": 3.620665206007744e-05, |
| "loss": 0.2528, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2615356743335724, |
| "step": 1220, |
| "valid_targets_mean": 1755.5, |
| "valid_targets_min": 625 |
| }, |
| { |
| "epoch": 1.9662921348314608, |
| "grad_norm": 0.630617638795346, |
| "learning_rate": 3.615960898934999e-05, |
| "loss": 0.2705, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2906268835067749, |
| "step": 1225, |
| "valid_targets_mean": 2880.1, |
| "valid_targets_min": 797 |
| }, |
| { |
| "epoch": 1.9743178170144462, |
| "grad_norm": 0.698026717328934, |
| "learning_rate": 3.6112306970942334e-05, |
| "loss": 0.2593, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.24983006715774536, |
| "step": 1230, |
| "valid_targets_mean": 1999.2, |
| "valid_targets_min": 822 |
| }, |
| { |
| "epoch": 1.9823434991974318, |
| "grad_norm": 0.7323645627563731, |
| "learning_rate": 3.606474676283987e-05, |
| "loss": 0.2657, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2904243469238281, |
| "step": 1235, |
| "valid_targets_mean": 2122.1, |
| "valid_targets_min": 707 |
| }, |
| { |
| "epoch": 1.9903691813804172, |
| "grad_norm": 0.6960742489484173, |
| "learning_rate": 3.6016929127165365e-05, |
| "loss": 0.2821, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2649298906326294, |
| "step": 1240, |
| "valid_targets_mean": 2274.1, |
| "valid_targets_min": 917 |
| }, |
| { |
| "epoch": 1.9983948635634028, |
| "grad_norm": 0.7269920662477591, |
| "learning_rate": 3.5968854830166666e-05, |
| "loss": 0.262, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.26873061060905457, |
| "step": 1245, |
| "valid_targets_mean": 2070.6, |
| "valid_targets_min": 677 |
| }, |
| { |
| "epoch": 2.0064205457463884, |
| "grad_norm": 0.6264465786385531, |
| "learning_rate": 3.592052464220447e-05, |
| "loss": 0.2386, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.20619434118270874, |
| "step": 1250, |
| "valid_targets_mean": 2345.5, |
| "valid_targets_min": 623 |
| }, |
| { |
| "epoch": 2.014446227929374, |
| "grad_norm": 0.8060408716572437, |
| "learning_rate": 3.587193933773998e-05, |
| "loss": 0.2143, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.22666709125041962, |
| "step": 1255, |
| "valid_targets_mean": 1974.3, |
| "valid_targets_min": 855 |
| }, |
| { |
| "epoch": 2.0224719101123596, |
| "grad_norm": 0.6893664644285946, |
| "learning_rate": 3.582309969532247e-05, |
| "loss": 0.217, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.21046797931194305, |
| "step": 1260, |
| "valid_targets_mean": 2176.0, |
| "valid_targets_min": 753 |
| }, |
| { |
| "epoch": 2.030497592295345, |
| "grad_norm": 0.7574788853071039, |
| "learning_rate": 3.577400649757682e-05, |
| "loss": 0.219, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18405956029891968, |
| "step": 1265, |
| "valid_targets_mean": 1458.5, |
| "valid_targets_min": 570 |
| }, |
| { |
| "epoch": 2.038523274478331, |
| "grad_norm": 0.7882212386208145, |
| "learning_rate": 3.572466053119099e-05, |
| "loss": 0.2304, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.25198838114738464, |
| "step": 1270, |
| "valid_targets_mean": 1880.4, |
| "valid_targets_min": 753 |
| }, |
| { |
| "epoch": 2.0465489566613164, |
| "grad_norm": 0.8196333002543982, |
| "learning_rate": 3.567506258690338e-05, |
| "loss": 0.2222, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.22230197489261627, |
| "step": 1275, |
| "valid_targets_mean": 1761.6, |
| "valid_targets_min": 819 |
| }, |
| { |
| "epoch": 2.0545746388443016, |
| "grad_norm": 0.848915909008126, |
| "learning_rate": 3.562521345949018e-05, |
| "loss": 0.223, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2496098428964615, |
| "step": 1280, |
| "valid_targets_mean": 2336.7, |
| "valid_targets_min": 627 |
| }, |
| { |
| "epoch": 2.062600321027287, |
| "grad_norm": 0.8863737442776473, |
| "learning_rate": 3.5575113947752666e-05, |
| "loss": 0.2352, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.24262848496437073, |
| "step": 1285, |
| "valid_targets_mean": 1759.6, |
| "valid_targets_min": 695 |
| }, |
| { |
| "epoch": 2.070626003210273, |
| "grad_norm": 0.7589911362614817, |
| "learning_rate": 3.552476485450434e-05, |
| "loss": 0.2256, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.22207708656787872, |
| "step": 1290, |
| "valid_targets_mean": 1856.1, |
| "valid_targets_min": 646 |
| }, |
| { |
| "epoch": 2.0786516853932584, |
| "grad_norm": 0.9495179896994681, |
| "learning_rate": 3.547416698655807e-05, |
| "loss": 0.219, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.25257399678230286, |
| "step": 1295, |
| "valid_targets_mean": 2386.2, |
| "valid_targets_min": 639 |
| }, |
| { |
| "epoch": 2.086677367576244, |
| "grad_norm": 0.7221290673835988, |
| "learning_rate": 3.5423321154713245e-05, |
| "loss": 0.2224, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.22047732770442963, |
| "step": 1300, |
| "valid_targets_mean": 2135.1, |
| "valid_targets_min": 742 |
| }, |
| { |
| "epoch": 2.0947030497592296, |
| "grad_norm": 0.8574890872992614, |
| "learning_rate": 3.537222817374266e-05, |
| "loss": 0.2212, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18799078464508057, |
| "step": 1305, |
| "valid_targets_mean": 1523.1, |
| "valid_targets_min": 785 |
| }, |
| { |
| "epoch": 2.102728731942215, |
| "grad_norm": 0.7745571983724101, |
| "learning_rate": 3.532088886237956e-05, |
| "loss": 0.227, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2367406189441681, |
| "step": 1310, |
| "valid_targets_mean": 1826.2, |
| "valid_targets_min": 819 |
| }, |
| { |
| "epoch": 2.110754414125201, |
| "grad_norm": 0.7807741896820481, |
| "learning_rate": 3.526930404330447e-05, |
| "loss": 0.2226, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2241775095462799, |
| "step": 1315, |
| "valid_targets_mean": 1756.4, |
| "valid_targets_min": 919 |
| }, |
| { |
| "epoch": 2.1187800963081864, |
| "grad_norm": 0.8548618903538644, |
| "learning_rate": 3.521747454313201e-05, |
| "loss": 0.2225, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2160843312740326, |
| "step": 1320, |
| "valid_targets_mean": 1812.9, |
| "valid_targets_min": 1086 |
| }, |
| { |
| "epoch": 2.1268057784911716, |
| "grad_norm": 0.776344012436439, |
| "learning_rate": 3.516540119239769e-05, |
| "loss": 0.2167, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.22034770250320435, |
| "step": 1325, |
| "valid_targets_mean": 1766.5, |
| "valid_targets_min": 801 |
| }, |
| { |
| "epoch": 2.134831460674157, |
| "grad_norm": 1.2889351825397468, |
| "learning_rate": 3.511308482554454e-05, |
| "loss": 0.2266, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.24177859723567963, |
| "step": 1330, |
| "valid_targets_mean": 2334.4, |
| "valid_targets_min": 572 |
| }, |
| { |
| "epoch": 2.142857142857143, |
| "grad_norm": 0.8008461502115394, |
| "learning_rate": 3.506052628090981e-05, |
| "loss": 0.22, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.21476683020591736, |
| "step": 1335, |
| "valid_targets_mean": 2030.2, |
| "valid_targets_min": 661 |
| }, |
| { |
| "epoch": 2.1508828250401284, |
| "grad_norm": 0.810451115473788, |
| "learning_rate": 3.500772640071145e-05, |
| "loss": 0.2349, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.22298628091812134, |
| "step": 1340, |
| "valid_targets_mean": 1712.6, |
| "valid_targets_min": 850 |
| }, |
| { |
| "epoch": 2.158908507223114, |
| "grad_norm": 0.7573148185013651, |
| "learning_rate": 3.495468603103472e-05, |
| "loss": 0.2469, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.24540317058563232, |
| "step": 1345, |
| "valid_targets_mean": 2262.4, |
| "valid_targets_min": 1157 |
| }, |
| { |
| "epoch": 2.1669341894060996, |
| "grad_norm": 0.7168592022709548, |
| "learning_rate": 3.4901406021818526e-05, |
| "loss": 0.2104, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.22075840830802917, |
| "step": 1350, |
| "valid_targets_mean": 2246.2, |
| "valid_targets_min": 776 |
| }, |
| { |
| "epoch": 2.174959871589085, |
| "grad_norm": 0.8065302620751352, |
| "learning_rate": 3.4847887226841874e-05, |
| "loss": 0.2149, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.21199846267700195, |
| "step": 1355, |
| "valid_targets_mean": 1803.8, |
| "valid_targets_min": 740 |
| }, |
| { |
| "epoch": 2.182985553772071, |
| "grad_norm": 0.6668455625016351, |
| "learning_rate": 3.479413050371016e-05, |
| "loss": 0.2101, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.20517484843730927, |
| "step": 1360, |
| "valid_targets_mean": 2204.4, |
| "valid_targets_min": 714 |
| }, |
| { |
| "epoch": 2.191011235955056, |
| "grad_norm": 0.7616659943300983, |
| "learning_rate": 3.4740136713841416e-05, |
| "loss": 0.238, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.22425301373004913, |
| "step": 1365, |
| "valid_targets_mean": 1955.1, |
| "valid_targets_min": 692 |
| }, |
| { |
| "epoch": 2.1990369181380416, |
| "grad_norm": 0.765106380987224, |
| "learning_rate": 3.4685906722452537e-05, |
| "loss": 0.226, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.20790395140647888, |
| "step": 1370, |
| "valid_targets_mean": 2030.4, |
| "valid_targets_min": 873 |
| }, |
| { |
| "epoch": 2.207062600321027, |
| "grad_norm": 0.8408989245850991, |
| "learning_rate": 3.4631441398545394e-05, |
| "loss": 0.2069, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.20086929202079773, |
| "step": 1375, |
| "valid_targets_mean": 1581.3, |
| "valid_targets_min": 635 |
| }, |
| { |
| "epoch": 2.215088282504013, |
| "grad_norm": 0.7954396264203275, |
| "learning_rate": 3.4576741614892925e-05, |
| "loss": 0.2278, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.23235668241977692, |
| "step": 1380, |
| "valid_targets_mean": 2279.1, |
| "valid_targets_min": 950 |
| }, |
| { |
| "epoch": 2.2231139646869984, |
| "grad_norm": 0.7874064449767312, |
| "learning_rate": 3.452180824802512e-05, |
| "loss": 0.2374, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2614269554615021, |
| "step": 1385, |
| "valid_targets_mean": 2237.8, |
| "valid_targets_min": 681 |
| }, |
| { |
| "epoch": 2.231139646869984, |
| "grad_norm": 0.7379527533621459, |
| "learning_rate": 3.4466642178215015e-05, |
| "loss": 0.2221, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.24073539674282074, |
| "step": 1390, |
| "valid_targets_mean": 2265.8, |
| "valid_targets_min": 774 |
| }, |
| { |
| "epoch": 2.2391653290529696, |
| "grad_norm": 0.683724568782726, |
| "learning_rate": 3.441124428946455e-05, |
| "loss": 0.2207, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2088882178068161, |
| "step": 1395, |
| "valid_targets_mean": 2312.8, |
| "valid_targets_min": 661 |
| }, |
| { |
| "epoch": 2.247191011235955, |
| "grad_norm": 0.697858810104743, |
| "learning_rate": 3.435561546949043e-05, |
| "loss": 0.2199, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.25173261761665344, |
| "step": 1400, |
| "valid_targets_mean": 2850.9, |
| "valid_targets_min": 1085 |
| }, |
| { |
| "epoch": 2.255216693418941, |
| "grad_norm": 0.7114309986626526, |
| "learning_rate": 3.429975660970988e-05, |
| "loss": 0.213, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.234367236495018, |
| "step": 1405, |
| "valid_targets_mean": 2420.1, |
| "valid_targets_min": 823 |
| }, |
| { |
| "epoch": 2.263242375601926, |
| "grad_norm": 0.7461264034166555, |
| "learning_rate": 3.424366860522638e-05, |
| "loss": 0.2182, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.23270238935947418, |
| "step": 1410, |
| "valid_targets_mean": 1986.1, |
| "valid_targets_min": 793 |
| }, |
| { |
| "epoch": 2.2712680577849116, |
| "grad_norm": 0.6975362183207242, |
| "learning_rate": 3.41873523548153e-05, |
| "loss": 0.2333, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.19744381308555603, |
| "step": 1415, |
| "valid_targets_mean": 1985.9, |
| "valid_targets_min": 1006 |
| }, |
| { |
| "epoch": 2.279293739967897, |
| "grad_norm": 0.7633475145958678, |
| "learning_rate": 3.413080876090952e-05, |
| "loss": 0.223, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2305845320224762, |
| "step": 1420, |
| "valid_targets_mean": 2110.4, |
| "valid_targets_min": 1051 |
| }, |
| { |
| "epoch": 2.287319422150883, |
| "grad_norm": 0.6987877696053163, |
| "learning_rate": 3.4074038729584955e-05, |
| "loss": 0.2212, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18873882293701172, |
| "step": 1425, |
| "valid_targets_mean": 2079.9, |
| "valid_targets_min": 748 |
| }, |
| { |
| "epoch": 2.2953451043338684, |
| "grad_norm": 0.8229960285752915, |
| "learning_rate": 3.401704317054604e-05, |
| "loss": 0.2279, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.22099998593330383, |
| "step": 1430, |
| "valid_targets_mean": 1742.9, |
| "valid_targets_min": 709 |
| }, |
| { |
| "epoch": 2.303370786516854, |
| "grad_norm": 0.7979213067997468, |
| "learning_rate": 3.395982299711114e-05, |
| "loss": 0.2241, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.23837853968143463, |
| "step": 1435, |
| "valid_targets_mean": 2065.1, |
| "valid_targets_min": 734 |
| }, |
| { |
| "epoch": 2.3113964686998396, |
| "grad_norm": 0.7410217576693533, |
| "learning_rate": 3.390237912619793e-05, |
| "loss": 0.2278, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.19628407061100006, |
| "step": 1440, |
| "valid_targets_mean": 1947.8, |
| "valid_targets_min": 725 |
| }, |
| { |
| "epoch": 2.319422150882825, |
| "grad_norm": 0.725538489703123, |
| "learning_rate": 3.384471247830872e-05, |
| "loss": 0.2319, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.22274473309516907, |
| "step": 1445, |
| "valid_targets_mean": 2046.8, |
| "valid_targets_min": 846 |
| }, |
| { |
| "epoch": 2.3274478330658104, |
| "grad_norm": 0.7718380143410368, |
| "learning_rate": 3.378682397751565e-05, |
| "loss": 0.2265, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2532963156700134, |
| "step": 1450, |
| "valid_targets_mean": 2101.1, |
| "valid_targets_min": 737 |
| }, |
| { |
| "epoch": 2.335473515248796, |
| "grad_norm": 0.8011655529732985, |
| "learning_rate": 3.372871455144593e-05, |
| "loss": 0.2219, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.23601312935352325, |
| "step": 1455, |
| "valid_targets_mean": 1879.2, |
| "valid_targets_min": 822 |
| }, |
| { |
| "epoch": 2.3434991974317816, |
| "grad_norm": 0.9443935694282609, |
| "learning_rate": 3.367038513126697e-05, |
| "loss": 0.2262, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.206557959318161, |
| "step": 1460, |
| "valid_targets_mean": 1639.8, |
| "valid_targets_min": 648 |
| }, |
| { |
| "epoch": 2.351524879614767, |
| "grad_norm": 0.7339382552691981, |
| "learning_rate": 3.3611836651671426e-05, |
| "loss": 0.2255, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.23191966116428375, |
| "step": 1465, |
| "valid_targets_mean": 2068.2, |
| "valid_targets_min": 670 |
| }, |
| { |
| "epoch": 2.359550561797753, |
| "grad_norm": 0.7882153069080308, |
| "learning_rate": 3.355307005086226e-05, |
| "loss": 0.2284, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.20615904033184052, |
| "step": 1470, |
| "valid_targets_mean": 1522.9, |
| "valid_targets_min": 760 |
| }, |
| { |
| "epoch": 2.3675762439807384, |
| "grad_norm": 0.7562840977782597, |
| "learning_rate": 3.34940862705377e-05, |
| "loss": 0.2126, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1904546320438385, |
| "step": 1475, |
| "valid_targets_mean": 1568.2, |
| "valid_targets_min": 696 |
| }, |
| { |
| "epoch": 2.375601926163724, |
| "grad_norm": 0.8538351538237444, |
| "learning_rate": 3.3434886255876106e-05, |
| "loss": 0.2375, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.25030791759490967, |
| "step": 1480, |
| "valid_targets_mean": 2046.1, |
| "valid_targets_min": 790 |
| }, |
| { |
| "epoch": 2.3836276083467096, |
| "grad_norm": 0.7220287827741136, |
| "learning_rate": 3.33754709555209e-05, |
| "loss": 0.23, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2569080591201782, |
| "step": 1485, |
| "valid_targets_mean": 2494.1, |
| "valid_targets_min": 788 |
| }, |
| { |
| "epoch": 2.391653290529695, |
| "grad_norm": 0.7818531275905918, |
| "learning_rate": 3.33158413215653e-05, |
| "loss": 0.2294, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2130444347858429, |
| "step": 1490, |
| "valid_targets_mean": 1575.5, |
| "valid_targets_min": 652 |
| }, |
| { |
| "epoch": 2.399678972712681, |
| "grad_norm": 0.7625675101581627, |
| "learning_rate": 3.325599830953708e-05, |
| "loss": 0.2155, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.21467597782611847, |
| "step": 1495, |
| "valid_targets_mean": 2187.6, |
| "valid_targets_min": 722 |
| }, |
| { |
| "epoch": 2.407704654895666, |
| "grad_norm": 0.7704348694195301, |
| "learning_rate": 3.31959428783833e-05, |
| "loss": 0.2318, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2410392463207245, |
| "step": 1500, |
| "valid_targets_mean": 2143.1, |
| "valid_targets_min": 785 |
| }, |
| { |
| "epoch": 2.4157303370786516, |
| "grad_norm": 0.6834706733838948, |
| "learning_rate": 3.3135675990454856e-05, |
| "loss": 0.2332, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.22266864776611328, |
| "step": 1505, |
| "valid_targets_mean": 2381.1, |
| "valid_targets_min": 671 |
| }, |
| { |
| "epoch": 2.423756019261637, |
| "grad_norm": 0.7632035756467823, |
| "learning_rate": 3.307519861149114e-05, |
| "loss": 0.2259, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.25074198842048645, |
| "step": 1510, |
| "valid_targets_mean": 2307.4, |
| "valid_targets_min": 704 |
| }, |
| { |
| "epoch": 2.431781701444623, |
| "grad_norm": 0.7796558920418386, |
| "learning_rate": 3.3014511710604526e-05, |
| "loss": 0.2185, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2310362160205841, |
| "step": 1515, |
| "valid_targets_mean": 2021.8, |
| "valid_targets_min": 670 |
| }, |
| { |
| "epoch": 2.4398073836276084, |
| "grad_norm": 0.8050959296365663, |
| "learning_rate": 3.295361626026484e-05, |
| "loss": 0.2154, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.22600339353084564, |
| "step": 1520, |
| "valid_targets_mean": 1891.7, |
| "valid_targets_min": 589 |
| }, |
| { |
| "epoch": 2.447833065810594, |
| "grad_norm": 0.7172384753459945, |
| "learning_rate": 3.28925132362838e-05, |
| "loss": 0.223, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.21628597378730774, |
| "step": 1525, |
| "valid_targets_mean": 1877.1, |
| "valid_targets_min": 826 |
| }, |
| { |
| "epoch": 2.4558587479935796, |
| "grad_norm": 0.6974119595402761, |
| "learning_rate": 3.2831203617799316e-05, |
| "loss": 0.2363, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.23294216394424438, |
| "step": 1530, |
| "valid_targets_mean": 2408.9, |
| "valid_targets_min": 875 |
| }, |
| { |
| "epoch": 2.4638844301765648, |
| "grad_norm": 0.7841982652104295, |
| "learning_rate": 3.276968838725992e-05, |
| "loss": 0.2192, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.23504158854484558, |
| "step": 1535, |
| "valid_targets_mean": 1922.0, |
| "valid_targets_min": 856 |
| }, |
| { |
| "epoch": 2.4719101123595504, |
| "grad_norm": 0.7111349004760731, |
| "learning_rate": 3.2707968530408886e-05, |
| "loss": 0.2259, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2083408683538437, |
| "step": 1540, |
| "valid_targets_mean": 2066.4, |
| "valid_targets_min": 714 |
| }, |
| { |
| "epoch": 2.479935794542536, |
| "grad_norm": 0.7365161685746568, |
| "learning_rate": 3.264604503626853e-05, |
| "loss": 0.2174, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.235595241189003, |
| "step": 1545, |
| "valid_targets_mean": 2078.4, |
| "valid_targets_min": 776 |
| }, |
| { |
| "epoch": 2.4879614767255216, |
| "grad_norm": 0.7269740343287259, |
| "learning_rate": 3.2583918897124315e-05, |
| "loss": 0.2163, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2562892735004425, |
| "step": 1550, |
| "valid_targets_mean": 2318.0, |
| "valid_targets_min": 617 |
| }, |
| { |
| "epoch": 2.495987158908507, |
| "grad_norm": 0.758066997386104, |
| "learning_rate": 3.2521591108508965e-05, |
| "loss": 0.2234, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.23280540108680725, |
| "step": 1555, |
| "valid_targets_mean": 1912.3, |
| "valid_targets_min": 892 |
| }, |
| { |
| "epoch": 2.504012841091493, |
| "grad_norm": 0.6629939180933154, |
| "learning_rate": 3.245906266918651e-05, |
| "loss": 0.2249, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.19812926650047302, |
| "step": 1560, |
| "valid_targets_mean": 2150.6, |
| "valid_targets_min": 903 |
| }, |
| { |
| "epoch": 2.5120385232744784, |
| "grad_norm": 0.7017031358542662, |
| "learning_rate": 3.2396334581136315e-05, |
| "loss": 0.2246, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.19861991703510284, |
| "step": 1565, |
| "valid_targets_mean": 1771.2, |
| "valid_targets_min": 797 |
| }, |
| { |
| "epoch": 2.520064205457464, |
| "grad_norm": 0.7456695638200225, |
| "learning_rate": 3.2333407849536936e-05, |
| "loss": 0.2306, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2588405907154083, |
| "step": 1570, |
| "valid_targets_mean": 2140.0, |
| "valid_targets_min": 548 |
| }, |
| { |
| "epoch": 2.5280898876404496, |
| "grad_norm": 0.6842578186040127, |
| "learning_rate": 3.2270283482750106e-05, |
| "loss": 0.2307, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.23806709051132202, |
| "step": 1575, |
| "valid_targets_mean": 2214.6, |
| "valid_targets_min": 780 |
| }, |
| { |
| "epoch": 2.5361155698234352, |
| "grad_norm": 0.7163287836668685, |
| "learning_rate": 3.220696249230453e-05, |
| "loss": 0.2295, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2398744523525238, |
| "step": 1580, |
| "valid_targets_mean": 2410.4, |
| "valid_targets_min": 1246 |
| }, |
| { |
| "epoch": 2.5441412520064204, |
| "grad_norm": 0.7034472910128594, |
| "learning_rate": 3.214344589287969e-05, |
| "loss": 0.2373, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.24632596969604492, |
| "step": 1585, |
| "valid_targets_mean": 2491.1, |
| "valid_targets_min": 875 |
| }, |
| { |
| "epoch": 2.552166934189406, |
| "grad_norm": 0.7470426673989888, |
| "learning_rate": 3.2079734702289555e-05, |
| "loss": 0.2241, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.23413334786891937, |
| "step": 1590, |
| "valid_targets_mean": 2035.4, |
| "valid_targets_min": 1093 |
| }, |
| { |
| "epoch": 2.5601926163723916, |
| "grad_norm": 0.6695700379125197, |
| "learning_rate": 3.201582994146633e-05, |
| "loss": 0.2195, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.220213383436203, |
| "step": 1595, |
| "valid_targets_mean": 2228.4, |
| "valid_targets_min": 832 |
| }, |
| { |
| "epoch": 2.568218298555377, |
| "grad_norm": 0.6398428853902913, |
| "learning_rate": 3.195173263444405e-05, |
| "loss": 0.2253, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2369084358215332, |
| "step": 1600, |
| "valid_targets_mean": 2804.1, |
| "valid_targets_min": 1139 |
| }, |
| { |
| "epoch": 2.576243980738363, |
| "grad_norm": 0.7976580250915132, |
| "learning_rate": 3.188744380834218e-05, |
| "loss": 0.2327, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.25882312655448914, |
| "step": 1605, |
| "valid_targets_mean": 1818.9, |
| "valid_targets_min": 758 |
| }, |
| { |
| "epoch": 2.5842696629213484, |
| "grad_norm": 0.738638803709468, |
| "learning_rate": 3.182296449334916e-05, |
| "loss": 0.2248, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2369651198387146, |
| "step": 1610, |
| "valid_targets_mean": 2066.5, |
| "valid_targets_min": 1206 |
| }, |
| { |
| "epoch": 2.592295345104334, |
| "grad_norm": 0.8660756736906835, |
| "learning_rate": 3.1758295722705895e-05, |
| "loss": 0.2251, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.22791454195976257, |
| "step": 1615, |
| "valid_targets_mean": 1701.2, |
| "valid_targets_min": 787 |
| }, |
| { |
| "epoch": 2.600321027287319, |
| "grad_norm": 0.7304793227556174, |
| "learning_rate": 3.1693438532689196e-05, |
| "loss": 0.2252, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16894668340682983, |
| "step": 1620, |
| "valid_targets_mean": 1490.4, |
| "valid_targets_min": 567 |
| }, |
| { |
| "epoch": 2.608346709470305, |
| "grad_norm": 0.7316882732876415, |
| "learning_rate": 3.162839396259519e-05, |
| "loss": 0.2194, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17454849183559418, |
| "step": 1625, |
| "valid_targets_mean": 1789.1, |
| "valid_targets_min": 734 |
| }, |
| { |
| "epoch": 2.6163723916532904, |
| "grad_norm": 0.8293784310074404, |
| "learning_rate": 3.156316305472263e-05, |
| "loss": 0.2214, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.22549498081207275, |
| "step": 1630, |
| "valid_targets_mean": 1512.9, |
| "valid_targets_min": 713 |
| }, |
| { |
| "epoch": 2.624398073836276, |
| "grad_norm": 0.7732588913978171, |
| "learning_rate": 3.149774685435626e-05, |
| "loss": 0.2293, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.23763619363307953, |
| "step": 1635, |
| "valid_targets_mean": 1928.6, |
| "valid_targets_min": 714 |
| }, |
| { |
| "epoch": 2.6324237560192616, |
| "grad_norm": 0.6863872080427466, |
| "learning_rate": 3.143214640974996e-05, |
| "loss": 0.2135, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.19767194986343384, |
| "step": 1640, |
| "valid_targets_mean": 1965.4, |
| "valid_targets_min": 960 |
| }, |
| { |
| "epoch": 2.640449438202247, |
| "grad_norm": 0.7870511412965953, |
| "learning_rate": 3.136636277211005e-05, |
| "loss": 0.2229, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.23969687521457672, |
| "step": 1645, |
| "valid_targets_mean": 1663.8, |
| "valid_targets_min": 721 |
| }, |
| { |
| "epoch": 2.648475120385233, |
| "grad_norm": 0.7980891149995513, |
| "learning_rate": 3.13003969955784e-05, |
| "loss": 0.2094, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.19080209732055664, |
| "step": 1650, |
| "valid_targets_mean": 1481.9, |
| "valid_targets_min": 731 |
| }, |
| { |
| "epoch": 2.6565008025682184, |
| "grad_norm": 0.7955277559817313, |
| "learning_rate": 3.1234250137215546e-05, |
| "loss": 0.2225, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.21440812945365906, |
| "step": 1655, |
| "valid_targets_mean": 1468.8, |
| "valid_targets_min": 723 |
| }, |
| { |
| "epoch": 2.664526484751204, |
| "grad_norm": 0.7368668559606313, |
| "learning_rate": 3.1167923256983724e-05, |
| "loss": 0.2188, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.19377027451992035, |
| "step": 1660, |
| "valid_targets_mean": 1893.8, |
| "valid_targets_min": 686 |
| }, |
| { |
| "epoch": 2.6725521669341896, |
| "grad_norm": 0.8011351264520532, |
| "learning_rate": 3.110141741772994e-05, |
| "loss": 0.2444, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2542601227760315, |
| "step": 1665, |
| "valid_targets_mean": 1760.2, |
| "valid_targets_min": 667 |
| }, |
| { |
| "epoch": 2.6805778491171752, |
| "grad_norm": 0.6620763926446247, |
| "learning_rate": 3.103473368516887e-05, |
| "loss": 0.2304, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2350524365901947, |
| "step": 1670, |
| "valid_targets_mean": 2464.2, |
| "valid_targets_min": 788 |
| }, |
| { |
| "epoch": 2.6886035313001604, |
| "grad_norm": 0.7931697359506537, |
| "learning_rate": 3.0967873127865856e-05, |
| "loss": 0.2273, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.22060030698776245, |
| "step": 1675, |
| "valid_targets_mean": 1841.6, |
| "valid_targets_min": 700 |
| }, |
| { |
| "epoch": 2.696629213483146, |
| "grad_norm": 0.7023736927777215, |
| "learning_rate": 3.090083681721972e-05, |
| "loss": 0.2323, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.21952059864997864, |
| "step": 1680, |
| "valid_targets_mean": 2159.6, |
| "valid_targets_min": 899 |
| }, |
| { |
| "epoch": 2.7046548956661316, |
| "grad_norm": 0.7025168140845389, |
| "learning_rate": 3.083362582744564e-05, |
| "loss": 0.2272, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2323223054409027, |
| "step": 1685, |
| "valid_targets_mean": 2033.8, |
| "valid_targets_min": 696 |
| }, |
| { |
| "epoch": 2.712680577849117, |
| "grad_norm": 0.6589820080202528, |
| "learning_rate": 3.0766241235557914e-05, |
| "loss": 0.2212, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.20285199582576752, |
| "step": 1690, |
| "valid_targets_mean": 2020.0, |
| "valid_targets_min": 703 |
| }, |
| { |
| "epoch": 2.720706260032103, |
| "grad_norm": 0.6509308612016727, |
| "learning_rate": 3.0698684121352704e-05, |
| "loss": 0.2244, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.20531073212623596, |
| "step": 1695, |
| "valid_targets_mean": 2438.1, |
| "valid_targets_min": 847 |
| }, |
| { |
| "epoch": 2.7287319422150884, |
| "grad_norm": 0.7373126457209139, |
| "learning_rate": 3.0630955567390714e-05, |
| "loss": 0.2288, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.22566135227680206, |
| "step": 1700, |
| "valid_targets_mean": 2027.4, |
| "valid_targets_min": 671 |
| }, |
| { |
| "epoch": 2.7367576243980736, |
| "grad_norm": 0.8219020871621718, |
| "learning_rate": 3.0563056658979915e-05, |
| "loss": 0.248, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2077377736568451, |
| "step": 1705, |
| "valid_targets_mean": 1601.4, |
| "valid_targets_min": 522 |
| }, |
| { |
| "epoch": 2.744783306581059, |
| "grad_norm": 0.6685564666402026, |
| "learning_rate": 3.0494988484158048e-05, |
| "loss": 0.2166, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.21543152630329132, |
| "step": 1710, |
| "valid_targets_mean": 2170.0, |
| "valid_targets_min": 870 |
| }, |
| { |
| "epoch": 2.752808988764045, |
| "grad_norm": 0.8026549087712966, |
| "learning_rate": 3.0426752133675274e-05, |
| "loss": 0.2071, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.22285577654838562, |
| "step": 1715, |
| "valid_targets_mean": 1749.9, |
| "valid_targets_min": 814 |
| }, |
| { |
| "epoch": 2.7608346709470304, |
| "grad_norm": 0.690495095349738, |
| "learning_rate": 3.035834870097665e-05, |
| "loss": 0.2331, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.21550163626670837, |
| "step": 1720, |
| "valid_targets_mean": 2140.2, |
| "valid_targets_min": 662 |
| }, |
| { |
| "epoch": 2.768860353130016, |
| "grad_norm": 0.7360103068007144, |
| "learning_rate": 3.0289779282184627e-05, |
| "loss": 0.222, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.24632824957370758, |
| "step": 1725, |
| "valid_targets_mean": 2156.0, |
| "valid_targets_min": 732 |
| }, |
| { |
| "epoch": 2.7768860353130016, |
| "grad_norm": 0.7527366517311297, |
| "learning_rate": 3.0221044976081484e-05, |
| "loss": 0.237, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2297508716583252, |
| "step": 1730, |
| "valid_targets_mean": 1963.5, |
| "valid_targets_min": 785 |
| }, |
| { |
| "epoch": 2.784911717495987, |
| "grad_norm": 0.7821248977519579, |
| "learning_rate": 3.0152146884091714e-05, |
| "loss": 0.2182, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.22388526797294617, |
| "step": 1735, |
| "valid_targets_mean": 2456.3, |
| "valid_targets_min": 1014 |
| }, |
| { |
| "epoch": 2.792937399678973, |
| "grad_norm": 0.7248411712033483, |
| "learning_rate": 3.0083086110264372e-05, |
| "loss": 0.2188, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.20279636979103088, |
| "step": 1740, |
| "valid_targets_mean": 1725.7, |
| "valid_targets_min": 822 |
| }, |
| { |
| "epoch": 2.8009630818619584, |
| "grad_norm": 0.7719057875204387, |
| "learning_rate": 3.0013863761255394e-05, |
| "loss": 0.226, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.22379055619239807, |
| "step": 1745, |
| "valid_targets_mean": 1751.1, |
| "valid_targets_min": 595 |
| }, |
| { |
| "epoch": 2.808988764044944, |
| "grad_norm": 0.7078438529016131, |
| "learning_rate": 2.9944480946309857e-05, |
| "loss": 0.2099, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2104533314704895, |
| "step": 1750, |
| "valid_targets_mean": 2152.8, |
| "valid_targets_min": 677 |
| }, |
| { |
| "epoch": 2.8170144462279296, |
| "grad_norm": 0.7421779901837455, |
| "learning_rate": 2.9874938777244203e-05, |
| "loss": 0.2209, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2339702844619751, |
| "step": 1755, |
| "valid_targets_mean": 2193.9, |
| "valid_targets_min": 1060 |
| }, |
| { |
| "epoch": 2.825040128410915, |
| "grad_norm": 0.6791983094516799, |
| "learning_rate": 2.9805238368428417e-05, |
| "loss": 0.2323, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.23603284358978271, |
| "step": 1760, |
| "valid_targets_mean": 2690.4, |
| "valid_targets_min": 789 |
| }, |
| { |
| "epoch": 2.8330658105939004, |
| "grad_norm": 0.7641709144274127, |
| "learning_rate": 2.9735380836768194e-05, |
| "loss": 0.2216, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2092696875333786, |
| "step": 1765, |
| "valid_targets_mean": 1717.9, |
| "valid_targets_min": 770 |
| }, |
| { |
| "epoch": 2.841091492776886, |
| "grad_norm": 0.6388373211209032, |
| "learning_rate": 2.966536730168702e-05, |
| "loss": 0.2211, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.23387748003005981, |
| "step": 1770, |
| "valid_targets_mean": 2613.9, |
| "valid_targets_min": 700 |
| }, |
| { |
| "epoch": 2.8491171749598716, |
| "grad_norm": 0.7037310466747174, |
| "learning_rate": 2.9595198885108222e-05, |
| "loss": 0.2351, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.24809247255325317, |
| "step": 1775, |
| "valid_targets_mean": 2320.5, |
| "valid_targets_min": 765 |
| }, |
| { |
| "epoch": 2.857142857142857, |
| "grad_norm": 0.7618055649190782, |
| "learning_rate": 2.9524876711437027e-05, |
| "loss": 0.2283, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.23056885600090027, |
| "step": 1780, |
| "valid_targets_mean": 2268.4, |
| "valid_targets_min": 780 |
| }, |
| { |
| "epoch": 2.865168539325843, |
| "grad_norm": 0.7549506776491252, |
| "learning_rate": 2.945440190754252e-05, |
| "loss": 0.2393, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2515849471092224, |
| "step": 1785, |
| "valid_targets_mean": 2207.3, |
| "valid_targets_min": 837 |
| }, |
| { |
| "epoch": 2.8731942215088284, |
| "grad_norm": 0.7470019603913977, |
| "learning_rate": 2.9383775602739585e-05, |
| "loss": 0.2308, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.23992541432380676, |
| "step": 1790, |
| "valid_targets_mean": 2084.7, |
| "valid_targets_min": 777 |
| }, |
| { |
| "epoch": 2.8812199036918136, |
| "grad_norm": 0.7337045498667797, |
| "learning_rate": 2.931299892877081e-05, |
| "loss": 0.2292, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2097863256931305, |
| "step": 1795, |
| "valid_targets_mean": 1751.9, |
| "valid_targets_min": 760 |
| }, |
| { |
| "epoch": 2.889245585874799, |
| "grad_norm": 0.7475735728231748, |
| "learning_rate": 2.924207301978837e-05, |
| "loss": 0.2208, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.22301986813545227, |
| "step": 1800, |
| "valid_targets_mean": 1816.0, |
| "valid_targets_min": 711 |
| }, |
| { |
| "epoch": 2.897271268057785, |
| "grad_norm": 0.8609335895996135, |
| "learning_rate": 2.917099901233582e-05, |
| "loss": 0.2255, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.24170774221420288, |
| "step": 1805, |
| "valid_targets_mean": 1630.4, |
| "valid_targets_min": 814 |
| }, |
| { |
| "epoch": 2.9052969502407704, |
| "grad_norm": 0.8836714454451741, |
| "learning_rate": 2.9099778045329915e-05, |
| "loss": 0.2112, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2119920253753662, |
| "step": 1810, |
| "valid_targets_mean": 1986.5, |
| "valid_targets_min": 738 |
| }, |
| { |
| "epoch": 2.913322632423756, |
| "grad_norm": 1.3175708087375508, |
| "learning_rate": 2.902841126004234e-05, |
| "loss": 0.2321, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.26432716846466064, |
| "step": 1815, |
| "valid_targets_mean": 2028.9, |
| "valid_targets_min": 874 |
| }, |
| { |
| "epoch": 2.9213483146067416, |
| "grad_norm": 0.7616325494153396, |
| "learning_rate": 2.8956899800081434e-05, |
| "loss": 0.2161, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.22558796405792236, |
| "step": 1820, |
| "valid_targets_mean": 1613.9, |
| "valid_targets_min": 548 |
| }, |
| { |
| "epoch": 2.929373996789727, |
| "grad_norm": 0.7367382610423877, |
| "learning_rate": 2.888524481137384e-05, |
| "loss": 0.2248, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.23133790493011475, |
| "step": 1825, |
| "valid_targets_mean": 2021.1, |
| "valid_targets_min": 777 |
| }, |
| { |
| "epoch": 2.937399678972713, |
| "grad_norm": 0.6844977955140614, |
| "learning_rate": 2.8813447442146177e-05, |
| "loss": 0.2362, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.21383780241012573, |
| "step": 1830, |
| "valid_targets_mean": 1867.3, |
| "valid_targets_min": 504 |
| }, |
| { |
| "epoch": 2.9454253611556984, |
| "grad_norm": 0.7558744597489246, |
| "learning_rate": 2.8741508842906617e-05, |
| "loss": 0.2277, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.21160289645195007, |
| "step": 1835, |
| "valid_targets_mean": 1775.3, |
| "valid_targets_min": 729 |
| }, |
| { |
| "epoch": 2.953451043338684, |
| "grad_norm": 0.7825251274320609, |
| "learning_rate": 2.8669430166426452e-05, |
| "loss": 0.2079, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.22142228484153748, |
| "step": 1840, |
| "valid_targets_mean": 1709.3, |
| "valid_targets_min": 684 |
| }, |
| { |
| "epoch": 2.961476725521669, |
| "grad_norm": 0.8621972624844769, |
| "learning_rate": 2.8597212567721638e-05, |
| "loss": 0.2277, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.20812058448791504, |
| "step": 1845, |
| "valid_targets_mean": 1360.6, |
| "valid_targets_min": 743 |
| }, |
| { |
| "epoch": 2.969502407704655, |
| "grad_norm": 0.716293562577063, |
| "learning_rate": 2.8524857204034256e-05, |
| "loss": 0.2182, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.24998609721660614, |
| "step": 1850, |
| "valid_targets_mean": 1911.3, |
| "valid_targets_min": 885 |
| }, |
| { |
| "epoch": 2.9775280898876404, |
| "grad_norm": 0.6539894083962282, |
| "learning_rate": 2.8452365234813992e-05, |
| "loss": 0.2269, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.24071596562862396, |
| "step": 1855, |
| "valid_targets_mean": 2464.8, |
| "valid_targets_min": 734 |
| }, |
| { |
| "epoch": 2.985553772070626, |
| "grad_norm": 0.7537202116782218, |
| "learning_rate": 2.8379737821699557e-05, |
| "loss": 0.2218, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2464880496263504, |
| "step": 1860, |
| "valid_targets_mean": 2069.2, |
| "valid_targets_min": 714 |
| }, |
| { |
| "epoch": 2.9935794542536116, |
| "grad_norm": 0.7507065541075459, |
| "learning_rate": 2.8306976128500054e-05, |
| "loss": 0.2269, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2356579601764679, |
| "step": 1865, |
| "valid_targets_mean": 2693.5, |
| "valid_targets_min": 725 |
| }, |
| { |
| "epoch": 3.001605136436597, |
| "grad_norm": 0.6923513946863307, |
| "learning_rate": 2.823408132117635e-05, |
| "loss": 0.2151, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.20384138822555542, |
| "step": 1870, |
| "valid_targets_mean": 2270.1, |
| "valid_targets_min": 695 |
| }, |
| { |
| "epoch": 3.009630818619583, |
| "grad_norm": 0.7149443578899167, |
| "learning_rate": 2.8161054567822375e-05, |
| "loss": 0.1878, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18554896116256714, |
| "step": 1875, |
| "valid_targets_mean": 2369.7, |
| "valid_targets_min": 806 |
| }, |
| { |
| "epoch": 3.0176565008025684, |
| "grad_norm": 0.7734688939301865, |
| "learning_rate": 2.8087897038646428e-05, |
| "loss": 0.1891, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.19679996371269226, |
| "step": 1880, |
| "valid_targets_mean": 2192.3, |
| "valid_targets_min": 743 |
| }, |
| { |
| "epoch": 3.0256821829855536, |
| "grad_norm": 0.7653501614317052, |
| "learning_rate": 2.801460990595239e-05, |
| "loss": 0.2005, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.20114630460739136, |
| "step": 1885, |
| "valid_targets_mean": 1874.9, |
| "valid_targets_min": 765 |
| }, |
| { |
| "epoch": 3.033707865168539, |
| "grad_norm": 0.830666272441702, |
| "learning_rate": 2.7941194344120965e-05, |
| "loss": 0.1876, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1925143003463745, |
| "step": 1890, |
| "valid_targets_mean": 1578.1, |
| "valid_targets_min": 727 |
| }, |
| { |
| "epoch": 3.041733547351525, |
| "grad_norm": 1.2399862833715765, |
| "learning_rate": 2.7867651529590864e-05, |
| "loss": 0.1867, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17397508025169373, |
| "step": 1895, |
| "valid_targets_mean": 1400.1, |
| "valid_targets_min": 693 |
| }, |
| { |
| "epoch": 3.0497592295345104, |
| "grad_norm": 0.8087269986100477, |
| "learning_rate": 2.7793982640839933e-05, |
| "loss": 0.1783, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1715751439332962, |
| "step": 1900, |
| "valid_targets_mean": 1782.9, |
| "valid_targets_min": 689 |
| }, |
| { |
| "epoch": 3.057784911717496, |
| "grad_norm": 0.6281749949063277, |
| "learning_rate": 2.7720188858366275e-05, |
| "loss": 0.195, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18476352095603943, |
| "step": 1905, |
| "valid_targets_mean": 2993.0, |
| "valid_targets_min": 740 |
| }, |
| { |
| "epoch": 3.0658105939004816, |
| "grad_norm": 0.635189484478004, |
| "learning_rate": 2.7646271364669338e-05, |
| "loss": 0.1818, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15959222614765167, |
| "step": 1910, |
| "valid_targets_mean": 2513.0, |
| "valid_targets_min": 650 |
| }, |
| { |
| "epoch": 3.073836276083467, |
| "grad_norm": 0.7011950467502195, |
| "learning_rate": 2.7572231344230983e-05, |
| "loss": 0.1967, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1984846293926239, |
| "step": 1915, |
| "valid_targets_mean": 2431.4, |
| "valid_targets_min": 722 |
| }, |
| { |
| "epoch": 3.081861958266453, |
| "grad_norm": 0.8410097906484902, |
| "learning_rate": 2.7498069983496466e-05, |
| "loss": 0.1957, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.20174948871135712, |
| "step": 1920, |
| "valid_targets_mean": 1798.1, |
| "valid_targets_min": 694 |
| }, |
| { |
| "epoch": 3.0898876404494384, |
| "grad_norm": 0.7073569345794174, |
| "learning_rate": 2.7423788470855455e-05, |
| "loss": 0.2015, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.19382837414741516, |
| "step": 1925, |
| "valid_targets_mean": 2452.8, |
| "valid_targets_min": 843 |
| }, |
| { |
| "epoch": 3.0979133226324236, |
| "grad_norm": 0.8179807578648297, |
| "learning_rate": 2.734938799662297e-05, |
| "loss": 0.1936, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16232554614543915, |
| "step": 1930, |
| "valid_targets_mean": 1700.2, |
| "valid_targets_min": 827 |
| }, |
| { |
| "epoch": 3.105939004815409, |
| "grad_norm": 0.7858838266351695, |
| "learning_rate": 2.727486975302032e-05, |
| "loss": 0.1876, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.19014039635658264, |
| "step": 1935, |
| "valid_targets_mean": 1804.1, |
| "valid_targets_min": 730 |
| }, |
| { |
| "epoch": 3.113964686998395, |
| "grad_norm": 0.7209047591018296, |
| "learning_rate": 2.7200234934156012e-05, |
| "loss": 0.1953, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17354069650173187, |
| "step": 1940, |
| "valid_targets_mean": 1919.5, |
| "valid_targets_min": 756 |
| }, |
| { |
| "epoch": 3.1219903691813804, |
| "grad_norm": 0.8428897718911152, |
| "learning_rate": 2.712548473600657e-05, |
| "loss": 0.1995, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.19806596636772156, |
| "step": 1945, |
| "valid_targets_mean": 1813.6, |
| "valid_targets_min": 632 |
| }, |
| { |
| "epoch": 3.130016051364366, |
| "grad_norm": 0.809920682857247, |
| "learning_rate": 2.7050620356397413e-05, |
| "loss": 0.1916, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18115901947021484, |
| "step": 1950, |
| "valid_targets_mean": 1606.6, |
| "valid_targets_min": 819 |
| }, |
| { |
| "epoch": 3.1380417335473516, |
| "grad_norm": 0.893305519656849, |
| "learning_rate": 2.6975642994983658e-05, |
| "loss": 0.1908, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1924627125263214, |
| "step": 1955, |
| "valid_targets_mean": 1423.1, |
| "valid_targets_min": 554 |
| }, |
| { |
| "epoch": 3.146067415730337, |
| "grad_norm": 0.751617349429226, |
| "learning_rate": 2.6900553853230856e-05, |
| "loss": 0.194, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.19373275339603424, |
| "step": 1960, |
| "valid_targets_mean": 2145.9, |
| "valid_targets_min": 912 |
| }, |
| { |
| "epoch": 3.154093097913323, |
| "grad_norm": 0.8000049867410969, |
| "learning_rate": 2.6825354134395804e-05, |
| "loss": 0.195, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18756906688213348, |
| "step": 1965, |
| "valid_targets_mean": 1920.1, |
| "valid_targets_min": 734 |
| }, |
| { |
| "epoch": 3.162118780096308, |
| "grad_norm": 0.7061336594749047, |
| "learning_rate": 2.6750045043507196e-05, |
| "loss": 0.1794, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18700531125068665, |
| "step": 1970, |
| "valid_targets_mean": 1959.3, |
| "valid_targets_min": 869 |
| }, |
| { |
| "epoch": 3.1701444622792936, |
| "grad_norm": 0.6065987384881834, |
| "learning_rate": 2.667462778734637e-05, |
| "loss": 0.1818, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15520010888576508, |
| "step": 1975, |
| "valid_targets_mean": 2880.4, |
| "valid_targets_min": 623 |
| }, |
| { |
| "epoch": 3.178170144462279, |
| "grad_norm": 0.7999447629388277, |
| "learning_rate": 2.6599103574427928e-05, |
| "loss": 0.1758, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1867016702890396, |
| "step": 1980, |
| "valid_targets_mean": 1824.9, |
| "valid_targets_min": 777 |
| }, |
| { |
| "epoch": 3.186195826645265, |
| "grad_norm": 0.797199335886302, |
| "learning_rate": 2.6523473614980395e-05, |
| "loss": 0.1982, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.20053572952747345, |
| "step": 1985, |
| "valid_targets_mean": 1946.2, |
| "valid_targets_min": 725 |
| }, |
| { |
| "epoch": 3.1942215088282504, |
| "grad_norm": 0.7659734706627166, |
| "learning_rate": 2.6447739120926815e-05, |
| "loss": 0.1745, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17469337582588196, |
| "step": 1990, |
| "valid_targets_mean": 1612.2, |
| "valid_targets_min": 684 |
| }, |
| { |
| "epoch": 3.202247191011236, |
| "grad_norm": 0.7701645192834687, |
| "learning_rate": 2.6371901305865346e-05, |
| "loss": 0.1939, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.21454013884067535, |
| "step": 1995, |
| "valid_targets_mean": 2100.4, |
| "valid_targets_min": 835 |
| }, |
| { |
| "epoch": 3.2102728731942216, |
| "grad_norm": 0.8125509864840708, |
| "learning_rate": 2.629596138504978e-05, |
| "loss": 0.2023, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.19029833376407623, |
| "step": 2000, |
| "valid_targets_mean": 1778.3, |
| "valid_targets_min": 648 |
| }, |
| { |
| "epoch": 3.218298555377207, |
| "grad_norm": 0.7175888565554096, |
| "learning_rate": 2.6219920575370115e-05, |
| "loss": 0.1862, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18968114256858826, |
| "step": 2005, |
| "valid_targets_mean": 2400.2, |
| "valid_targets_min": 1284 |
| }, |
| { |
| "epoch": 3.226324237560193, |
| "grad_norm": 0.774431761352013, |
| "learning_rate": 2.6143780095332996e-05, |
| "loss": 0.1995, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.22374089062213898, |
| "step": 2010, |
| "valid_targets_mean": 2418.2, |
| "valid_targets_min": 745 |
| }, |
| { |
| "epoch": 3.234349919743178, |
| "grad_norm": 0.7366934183831256, |
| "learning_rate": 2.6067541165042262e-05, |
| "loss": 0.1891, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1646566092967987, |
| "step": 2015, |
| "valid_targets_mean": 1817.9, |
| "valid_targets_min": 880 |
| }, |
| { |
| "epoch": 3.2423756019261636, |
| "grad_norm": 0.9085528020394846, |
| "learning_rate": 2.5991205006179332e-05, |
| "loss": 0.1866, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2022278755903244, |
| "step": 2020, |
| "valid_targets_mean": 1888.2, |
| "valid_targets_min": 638 |
| }, |
| { |
| "epoch": 3.250401284109149, |
| "grad_norm": 0.8496667981008769, |
| "learning_rate": 2.5914772841983653e-05, |
| "loss": 0.1974, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.20533272624015808, |
| "step": 2025, |
| "valid_targets_mean": 1874.3, |
| "valid_targets_min": 790 |
| }, |
| { |
| "epoch": 3.258426966292135, |
| "grad_norm": 0.7969748922112211, |
| "learning_rate": 2.5838245897233113e-05, |
| "loss": 0.1993, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1906946450471878, |
| "step": 2030, |
| "valid_targets_mean": 1718.5, |
| "valid_targets_min": 549 |
| }, |
| { |
| "epoch": 3.2664526484751204, |
| "grad_norm": 0.6925975178805427, |
| "learning_rate": 2.5761625398224387e-05, |
| "loss": 0.1947, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18433983623981476, |
| "step": 2035, |
| "valid_targets_mean": 2462.9, |
| "valid_targets_min": 686 |
| }, |
| { |
| "epoch": 3.274478330658106, |
| "grad_norm": 0.7245709850282777, |
| "learning_rate": 2.56849125727533e-05, |
| "loss": 0.1907, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16477423906326294, |
| "step": 2040, |
| "valid_targets_mean": 2091.6, |
| "valid_targets_min": 744 |
| }, |
| { |
| "epoch": 3.2825040128410916, |
| "grad_norm": 0.7771087868403446, |
| "learning_rate": 2.560810865009515e-05, |
| "loss": 0.1835, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.193090558052063, |
| "step": 2045, |
| "valid_targets_mean": 1966.6, |
| "valid_targets_min": 631 |
| }, |
| { |
| "epoch": 3.290529695024077, |
| "grad_norm": 0.7254301119297374, |
| "learning_rate": 2.5531214860985015e-05, |
| "loss": 0.1944, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1945345103740692, |
| "step": 2050, |
| "valid_targets_mean": 2402.4, |
| "valid_targets_min": 889 |
| }, |
| { |
| "epoch": 3.2985553772070624, |
| "grad_norm": 0.8027092204852169, |
| "learning_rate": 2.5454232437598032e-05, |
| "loss": 0.1959, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.20133385062217712, |
| "step": 2055, |
| "valid_targets_mean": 1915.6, |
| "valid_targets_min": 739 |
| }, |
| { |
| "epoch": 3.306581059390048, |
| "grad_norm": 0.7363037186006427, |
| "learning_rate": 2.537716261352963e-05, |
| "loss": 0.1923, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2043621689081192, |
| "step": 2060, |
| "valid_targets_mean": 2254.2, |
| "valid_targets_min": 762 |
| }, |
| { |
| "epoch": 3.3146067415730336, |
| "grad_norm": 0.7744385014125538, |
| "learning_rate": 2.53000066237758e-05, |
| "loss": 0.1982, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1948285698890686, |
| "step": 2065, |
| "valid_targets_mean": 1942.2, |
| "valid_targets_min": 607 |
| }, |
| { |
| "epoch": 3.322632423756019, |
| "grad_norm": 0.7687870461284612, |
| "learning_rate": 2.5222765704713265e-05, |
| "loss": 0.1833, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18752048909664154, |
| "step": 2070, |
| "valid_targets_mean": 1865.8, |
| "valid_targets_min": 985 |
| }, |
| { |
| "epoch": 3.330658105939005, |
| "grad_norm": 0.7263395997338279, |
| "learning_rate": 2.5145441094079702e-05, |
| "loss": 0.1907, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.19827114045619965, |
| "step": 2075, |
| "valid_targets_mean": 2504.3, |
| "valid_targets_min": 920 |
| }, |
| { |
| "epoch": 3.3386837881219904, |
| "grad_norm": 0.7381187748986383, |
| "learning_rate": 2.5068034030953888e-05, |
| "loss": 0.1885, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17457011342048645, |
| "step": 2080, |
| "valid_targets_mean": 2321.3, |
| "valid_targets_min": 867 |
| }, |
| { |
| "epoch": 3.346709470304976, |
| "grad_norm": 0.7334484973637228, |
| "learning_rate": 2.499054575573585e-05, |
| "loss": 0.1921, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16836518049240112, |
| "step": 2085, |
| "valid_targets_mean": 2020.1, |
| "valid_targets_min": 662 |
| }, |
| { |
| "epoch": 3.3547351524879616, |
| "grad_norm": 0.8336487761249294, |
| "learning_rate": 2.491297751012699e-05, |
| "loss": 0.1967, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18217214941978455, |
| "step": 2090, |
| "valid_targets_mean": 1471.1, |
| "valid_targets_min": 713 |
| }, |
| { |
| "epoch": 3.362760834670947, |
| "grad_norm": 0.7231447723601349, |
| "learning_rate": 2.483533053711018e-05, |
| "loss": 0.181, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.19125714898109436, |
| "step": 2095, |
| "valid_targets_mean": 2079.2, |
| "valid_targets_min": 818 |
| }, |
| { |
| "epoch": 3.370786516853933, |
| "grad_norm": 0.7871767792479442, |
| "learning_rate": 2.4757606080929856e-05, |
| "loss": 0.1897, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.19560378789901733, |
| "step": 2100, |
| "valid_targets_mean": 1715.2, |
| "valid_targets_min": 722 |
| }, |
| { |
| "epoch": 3.378812199036918, |
| "grad_norm": 0.7353603707138118, |
| "learning_rate": 2.467980538707207e-05, |
| "loss": 0.193, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1874968260526657, |
| "step": 2105, |
| "valid_targets_mean": 2198.7, |
| "valid_targets_min": 995 |
| }, |
| { |
| "epoch": 3.3868378812199036, |
| "grad_norm": 0.8102308981966291, |
| "learning_rate": 2.460192970224454e-05, |
| "loss": 0.2001, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2087075412273407, |
| "step": 2110, |
| "valid_targets_mean": 1647.7, |
| "valid_targets_min": 659 |
| }, |
| { |
| "epoch": 3.394863563402889, |
| "grad_norm": 0.7431520066152951, |
| "learning_rate": 2.4523980274356665e-05, |
| "loss": 0.1914, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.21111366152763367, |
| "step": 2115, |
| "valid_targets_mean": 2318.9, |
| "valid_targets_min": 467 |
| }, |
| { |
| "epoch": 3.402889245585875, |
| "grad_norm": 0.6583964122894566, |
| "learning_rate": 2.444595835249952e-05, |
| "loss": 0.1853, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17443379759788513, |
| "step": 2120, |
| "valid_targets_mean": 2557.6, |
| "valid_targets_min": 923 |
| }, |
| { |
| "epoch": 3.4109149277688604, |
| "grad_norm": 0.9040657902276791, |
| "learning_rate": 2.436786518692587e-05, |
| "loss": 0.1958, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18719065189361572, |
| "step": 2125, |
| "valid_targets_mean": 2413.8, |
| "valid_targets_min": 734 |
| }, |
| { |
| "epoch": 3.418940609951846, |
| "grad_norm": 0.730483546474811, |
| "learning_rate": 2.428970202903011e-05, |
| "loss": 0.1963, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.19034501910209656, |
| "step": 2130, |
| "valid_targets_mean": 2162.1, |
| "valid_targets_min": 825 |
| }, |
| { |
| "epoch": 3.4269662921348316, |
| "grad_norm": 0.8290450345988953, |
| "learning_rate": 2.4211470131328208e-05, |
| "loss": 0.1932, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.20703352987766266, |
| "step": 2135, |
| "valid_targets_mean": 1847.6, |
| "valid_targets_min": 725 |
| }, |
| { |
| "epoch": 3.4349919743178168, |
| "grad_norm": 0.6912484043662559, |
| "learning_rate": 2.4133170747437657e-05, |
| "loss": 0.1943, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2027449905872345, |
| "step": 2140, |
| "valid_targets_mean": 2536.1, |
| "valid_targets_min": 612 |
| }, |
| { |
| "epoch": 3.4430176565008024, |
| "grad_norm": 0.748348272526716, |
| "learning_rate": 2.4054805132057362e-05, |
| "loss": 0.1935, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1785166710615158, |
| "step": 2145, |
| "valid_targets_mean": 1872.3, |
| "valid_targets_min": 750 |
| }, |
| { |
| "epoch": 3.451043338683788, |
| "grad_norm": 0.8392457980303076, |
| "learning_rate": 2.397637454094756e-05, |
| "loss": 0.1857, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.19250713288784027, |
| "step": 2150, |
| "valid_targets_mean": 1665.8, |
| "valid_targets_min": 692 |
| }, |
| { |
| "epoch": 3.4590690208667736, |
| "grad_norm": 0.7956502741744578, |
| "learning_rate": 2.3897880230909678e-05, |
| "loss": 0.1936, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1779821813106537, |
| "step": 2155, |
| "valid_targets_mean": 1863.2, |
| "valid_targets_min": 639 |
| }, |
| { |
| "epoch": 3.467094703049759, |
| "grad_norm": 0.6735272716108055, |
| "learning_rate": 2.3819323459766194e-05, |
| "loss": 0.1911, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18678349256515503, |
| "step": 2160, |
| "valid_targets_mean": 2579.4, |
| "valid_targets_min": 1288 |
| }, |
| { |
| "epoch": 3.475120385232745, |
| "grad_norm": 0.781264193277655, |
| "learning_rate": 2.3740705486340492e-05, |
| "loss": 0.178, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16642053425312042, |
| "step": 2165, |
| "valid_targets_mean": 2064.8, |
| "valid_targets_min": 692 |
| }, |
| { |
| "epoch": 3.4831460674157304, |
| "grad_norm": 0.8509728426922071, |
| "learning_rate": 2.366202757043668e-05, |
| "loss": 0.1814, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1804889738559723, |
| "step": 2170, |
| "valid_targets_mean": 1531.1, |
| "valid_targets_min": 820 |
| }, |
| { |
| "epoch": 3.491171749598716, |
| "grad_norm": 0.7681030716681042, |
| "learning_rate": 2.358329097281942e-05, |
| "loss": 0.2023, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.21239528059959412, |
| "step": 2175, |
| "valid_targets_mean": 2224.4, |
| "valid_targets_min": 734 |
| }, |
| { |
| "epoch": 3.4991974317817016, |
| "grad_norm": 0.6875253594702069, |
| "learning_rate": 2.3504496955193695e-05, |
| "loss": 0.188, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17239797115325928, |
| "step": 2180, |
| "valid_targets_mean": 1882.8, |
| "valid_targets_min": 933 |
| }, |
| { |
| "epoch": 3.5072231139646872, |
| "grad_norm": 0.7423496773042868, |
| "learning_rate": 2.342564678018462e-05, |
| "loss": 0.2018, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.19619911909103394, |
| "step": 2185, |
| "valid_targets_mean": 2109.4, |
| "valid_targets_min": 793 |
| }, |
| { |
| "epoch": 3.515248796147673, |
| "grad_norm": 0.6599800958836226, |
| "learning_rate": 2.3346741711317185e-05, |
| "loss": 0.1857, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1889185905456543, |
| "step": 2190, |
| "valid_targets_mean": 2660.3, |
| "valid_targets_min": 888 |
| }, |
| { |
| "epoch": 3.523274478330658, |
| "grad_norm": 0.8332035412792131, |
| "learning_rate": 2.326778301299603e-05, |
| "loss": 0.1922, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1888495832681656, |
| "step": 2195, |
| "valid_targets_mean": 1617.4, |
| "valid_targets_min": 682 |
| }, |
| { |
| "epoch": 3.5313001605136436, |
| "grad_norm": 0.7422726313573247, |
| "learning_rate": 2.3188771950485172e-05, |
| "loss": 0.1885, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16541287302970886, |
| "step": 2200, |
| "valid_targets_mean": 1771.2, |
| "valid_targets_min": 723 |
| }, |
| { |
| "epoch": 3.539325842696629, |
| "grad_norm": 0.7751086907387414, |
| "learning_rate": 2.3109709789887732e-05, |
| "loss": 0.2092, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2171766757965088, |
| "step": 2205, |
| "valid_targets_mean": 2355.4, |
| "valid_targets_min": 790 |
| }, |
| { |
| "epoch": 3.547351524879615, |
| "grad_norm": 0.7959173282766169, |
| "learning_rate": 2.3030597798125642e-05, |
| "loss": 0.1955, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.20218120515346527, |
| "step": 2210, |
| "valid_targets_mean": 1999.3, |
| "valid_targets_min": 567 |
| }, |
| { |
| "epoch": 3.5553772070626004, |
| "grad_norm": 0.7123208491374362, |
| "learning_rate": 2.295143724291935e-05, |
| "loss": 0.1871, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18248684704303741, |
| "step": 2215, |
| "valid_targets_mean": 1983.6, |
| "valid_targets_min": 861 |
| }, |
| { |
| "epoch": 3.563402889245586, |
| "grad_norm": 0.7239156258883958, |
| "learning_rate": 2.2872229392767497e-05, |
| "loss": 0.1977, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18239015340805054, |
| "step": 2220, |
| "valid_targets_mean": 2137.5, |
| "valid_targets_min": 845 |
| }, |
| { |
| "epoch": 3.571428571428571, |
| "grad_norm": 0.8073709827317045, |
| "learning_rate": 2.2792975516926615e-05, |
| "loss": 0.1908, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.20157527923583984, |
| "step": 2225, |
| "valid_targets_mean": 2178.2, |
| "valid_targets_min": 947 |
| }, |
| { |
| "epoch": 3.579454253611557, |
| "grad_norm": 0.9561614899504988, |
| "learning_rate": 2.271367688539075e-05, |
| "loss": 0.1909, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18683037161827087, |
| "step": 2230, |
| "valid_targets_mean": 2166.1, |
| "valid_targets_min": 720 |
| }, |
| { |
| "epoch": 3.5874799357945424, |
| "grad_norm": 0.7468302593032567, |
| "learning_rate": 2.2634334768871133e-05, |
| "loss": 0.188, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1675512194633484, |
| "step": 2235, |
| "valid_targets_mean": 1832.1, |
| "valid_targets_min": 666 |
| }, |
| { |
| "epoch": 3.595505617977528, |
| "grad_norm": 0.7591043916830319, |
| "learning_rate": 2.2554950438775813e-05, |
| "loss": 0.1904, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.19787640869617462, |
| "step": 2240, |
| "valid_targets_mean": 2119.7, |
| "valid_targets_min": 646 |
| }, |
| { |
| "epoch": 3.6035313001605136, |
| "grad_norm": 0.7812103358035377, |
| "learning_rate": 2.2475525167189298e-05, |
| "loss": 0.1916, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18840080499649048, |
| "step": 2245, |
| "valid_targets_mean": 1717.6, |
| "valid_targets_min": 797 |
| }, |
| { |
| "epoch": 3.611556982343499, |
| "grad_norm": 0.8048037305797138, |
| "learning_rate": 2.2396060226852148e-05, |
| "loss": 0.1911, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17736947536468506, |
| "step": 2250, |
| "valid_targets_mean": 1519.2, |
| "valid_targets_min": 713 |
| }, |
| { |
| "epoch": 3.619582664526485, |
| "grad_norm": 0.7382055576071299, |
| "learning_rate": 2.2316556891140594e-05, |
| "loss": 0.1989, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18542557954788208, |
| "step": 2255, |
| "valid_targets_mean": 1981.1, |
| "valid_targets_min": 658 |
| }, |
| { |
| "epoch": 3.6276083467094704, |
| "grad_norm": 0.8117240899793563, |
| "learning_rate": 2.2237016434046124e-05, |
| "loss": 0.1885, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.199208065867424, |
| "step": 2260, |
| "valid_targets_mean": 2017.4, |
| "valid_targets_min": 694 |
| }, |
| { |
| "epoch": 3.635634028892456, |
| "grad_norm": 0.7814089947481103, |
| "learning_rate": 2.2157440130155084e-05, |
| "loss": 0.1778, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2004736363887787, |
| "step": 2265, |
| "valid_targets_mean": 2167.4, |
| "valid_targets_min": 648 |
| }, |
| { |
| "epoch": 3.6436597110754416, |
| "grad_norm": 0.8313337224306722, |
| "learning_rate": 2.2077829254628224e-05, |
| "loss": 0.205, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.19507341086864471, |
| "step": 2270, |
| "valid_targets_mean": 1738.1, |
| "valid_targets_min": 776 |
| }, |
| { |
| "epoch": 3.6516853932584272, |
| "grad_norm": 0.736982749910831, |
| "learning_rate": 2.1998185083180297e-05, |
| "loss": 0.197, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17966896295547485, |
| "step": 2275, |
| "valid_targets_mean": 1906.8, |
| "valid_targets_min": 676 |
| }, |
| { |
| "epoch": 3.6597110754414124, |
| "grad_norm": 0.7529274800924642, |
| "learning_rate": 2.1918508892059608e-05, |
| "loss": 0.1751, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1658572107553482, |
| "step": 2280, |
| "valid_targets_mean": 1714.2, |
| "valid_targets_min": 667 |
| }, |
| { |
| "epoch": 3.667736757624398, |
| "grad_norm": 0.8232143722363245, |
| "learning_rate": 2.1838801958027533e-05, |
| "loss": 0.1974, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.21375055611133575, |
| "step": 2285, |
| "valid_targets_mean": 1926.2, |
| "valid_targets_min": 723 |
| }, |
| { |
| "epoch": 3.6757624398073836, |
| "grad_norm": 0.7437594523483552, |
| "learning_rate": 2.175906555833811e-05, |
| "loss": 0.1793, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14584185183048248, |
| "step": 2290, |
| "valid_targets_mean": 1485.8, |
| "valid_targets_min": 660 |
| }, |
| { |
| "epoch": 3.683788121990369, |
| "grad_norm": 0.8253400566984553, |
| "learning_rate": 2.1679300970717526e-05, |
| "loss": 0.1862, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.198220357298851, |
| "step": 2295, |
| "valid_targets_mean": 1756.6, |
| "valid_targets_min": 687 |
| }, |
| { |
| "epoch": 3.691813804173355, |
| "grad_norm": 0.7631981257736214, |
| "learning_rate": 2.1599509473343688e-05, |
| "loss": 0.1899, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1921335756778717, |
| "step": 2300, |
| "valid_targets_mean": 1836.2, |
| "valid_targets_min": 809 |
| }, |
| { |
| "epoch": 3.6998394863563404, |
| "grad_norm": 0.8125231968272838, |
| "learning_rate": 2.1519692344825684e-05, |
| "loss": 0.1975, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.19826048612594604, |
| "step": 2305, |
| "valid_targets_mean": 2303.0, |
| "valid_targets_min": 810 |
| }, |
| { |
| "epoch": 3.7078651685393256, |
| "grad_norm": 0.796754649081973, |
| "learning_rate": 2.1439850864183343e-05, |
| "loss": 0.1828, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18836288154125214, |
| "step": 2310, |
| "valid_targets_mean": 1845.9, |
| "valid_targets_min": 682 |
| }, |
| { |
| "epoch": 3.715890850722311, |
| "grad_norm": 0.7011535417327573, |
| "learning_rate": 2.1359986310826723e-05, |
| "loss": 0.1818, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15693524479866028, |
| "step": 2315, |
| "valid_targets_mean": 1808.2, |
| "valid_targets_min": 692 |
| }, |
| { |
| "epoch": 3.723916532905297, |
| "grad_norm": 0.6745982102974377, |
| "learning_rate": 2.1280099964535594e-05, |
| "loss": 0.2062, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.20702672004699707, |
| "step": 2320, |
| "valid_targets_mean": 2588.8, |
| "valid_targets_min": 594 |
| }, |
| { |
| "epoch": 3.7319422150882824, |
| "grad_norm": 0.7036120650208736, |
| "learning_rate": 2.120019310543896e-05, |
| "loss": 0.1977, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2342701256275177, |
| "step": 2325, |
| "valid_targets_mean": 2742.9, |
| "valid_targets_min": 718 |
| }, |
| { |
| "epoch": 3.739967897271268, |
| "grad_norm": 0.6978119100165123, |
| "learning_rate": 2.1120267013994527e-05, |
| "loss": 0.1859, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.19557003676891327, |
| "step": 2330, |
| "valid_targets_mean": 2265.5, |
| "valid_targets_min": 839 |
| }, |
| { |
| "epoch": 3.7479935794542536, |
| "grad_norm": 1.1106527175621144, |
| "learning_rate": 2.104032297096817e-05, |
| "loss": 0.1919, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.19205822050571442, |
| "step": 2335, |
| "valid_targets_mean": 2021.2, |
| "valid_targets_min": 819 |
| }, |
| { |
| "epoch": 3.756019261637239, |
| "grad_norm": 0.6649212142267416, |
| "learning_rate": 2.096036225741346e-05, |
| "loss": 0.1927, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1821729838848114, |
| "step": 2340, |
| "valid_targets_mean": 2483.3, |
| "valid_targets_min": 754 |
| }, |
| { |
| "epoch": 3.764044943820225, |
| "grad_norm": 0.8682584189157655, |
| "learning_rate": 2.088038615465107e-05, |
| "loss": 0.1993, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2323881983757019, |
| "step": 2345, |
| "valid_targets_mean": 2172.1, |
| "valid_targets_min": 914 |
| }, |
| { |
| "epoch": 3.7720706260032104, |
| "grad_norm": 0.7059973626007631, |
| "learning_rate": 2.080039594424829e-05, |
| "loss": 0.194, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.19035211205482483, |
| "step": 2350, |
| "valid_targets_mean": 2238.2, |
| "valid_targets_min": 647 |
| }, |
| { |
| "epoch": 3.780096308186196, |
| "grad_norm": 0.7025817999562849, |
| "learning_rate": 2.0720392907998473e-05, |
| "loss": 0.1838, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16978096961975098, |
| "step": 2355, |
| "valid_targets_mean": 1907.9, |
| "valid_targets_min": 830 |
| }, |
| { |
| "epoch": 3.7881219903691816, |
| "grad_norm": 0.7720895482426217, |
| "learning_rate": 2.0640378327900507e-05, |
| "loss": 0.1831, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18614491820335388, |
| "step": 2360, |
| "valid_targets_mean": 1797.3, |
| "valid_targets_min": 620 |
| }, |
| { |
| "epoch": 3.796147672552167, |
| "grad_norm": 0.7448908723180842, |
| "learning_rate": 2.0560353486138255e-05, |
| "loss": 0.1864, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1888936161994934, |
| "step": 2365, |
| "valid_targets_mean": 2135.0, |
| "valid_targets_min": 651 |
| }, |
| { |
| "epoch": 3.8041733547351524, |
| "grad_norm": 0.7293585089215756, |
| "learning_rate": 2.0480319665060014e-05, |
| "loss": 0.1881, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17815639078617096, |
| "step": 2370, |
| "valid_targets_mean": 1993.8, |
| "valid_targets_min": 916 |
| }, |
| { |
| "epoch": 3.812199036918138, |
| "grad_norm": 0.8436319534001945, |
| "learning_rate": 2.0400278147157973e-05, |
| "loss": 0.1924, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.19632424414157867, |
| "step": 2375, |
| "valid_targets_mean": 1567.9, |
| "valid_targets_min": 700 |
| }, |
| { |
| "epoch": 3.8202247191011236, |
| "grad_norm": 0.762177401689057, |
| "learning_rate": 2.0320230215047667e-05, |
| "loss": 0.1783, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17414651811122894, |
| "step": 2380, |
| "valid_targets_mean": 1993.4, |
| "valid_targets_min": 805 |
| }, |
| { |
| "epoch": 3.828250401284109, |
| "grad_norm": 0.7862690373739996, |
| "learning_rate": 2.0240177151447397e-05, |
| "loss": 0.1902, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1997125893831253, |
| "step": 2385, |
| "valid_targets_mean": 1752.0, |
| "valid_targets_min": 824 |
| }, |
| { |
| "epoch": 3.836276083467095, |
| "grad_norm": 0.7671200606374088, |
| "learning_rate": 2.0160120239157705e-05, |
| "loss": 0.1862, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.19353365898132324, |
| "step": 2390, |
| "valid_targets_mean": 1993.4, |
| "valid_targets_min": 926 |
| }, |
| { |
| "epoch": 3.8443017656500804, |
| "grad_norm": 0.7497960536151272, |
| "learning_rate": 2.0080060761040795e-05, |
| "loss": 0.1923, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18841297924518585, |
| "step": 2395, |
| "valid_targets_mean": 2027.2, |
| "valid_targets_min": 805 |
| }, |
| { |
| "epoch": 3.8523274478330656, |
| "grad_norm": 0.6984086156626323, |
| "learning_rate": 2e-05, |
| "loss": 0.1921, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17640450596809387, |
| "step": 2400, |
| "valid_targets_mean": 2163.6, |
| "valid_targets_min": 731 |
| }, |
| { |
| "epoch": 3.860353130016051, |
| "grad_norm": 0.6985420493366072, |
| "learning_rate": 1.991993923895921e-05, |
| "loss": 0.1912, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1724482774734497, |
| "step": 2405, |
| "valid_targets_mean": 2245.6, |
| "valid_targets_min": 689 |
| }, |
| { |
| "epoch": 3.868378812199037, |
| "grad_norm": 0.7664827628096461, |
| "learning_rate": 1.9839879760842302e-05, |
| "loss": 0.1933, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17965087294578552, |
| "step": 2410, |
| "valid_targets_mean": 1988.3, |
| "valid_targets_min": 669 |
| }, |
| { |
| "epoch": 3.8764044943820224, |
| "grad_norm": 0.8574637628450187, |
| "learning_rate": 1.975982284855261e-05, |
| "loss": 0.1853, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17706872522830963, |
| "step": 2415, |
| "valid_targets_mean": 1429.2, |
| "valid_targets_min": 826 |
| }, |
| { |
| "epoch": 3.884430176565008, |
| "grad_norm": 0.8159684403134524, |
| "learning_rate": 1.967976978495234e-05, |
| "loss": 0.193, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2066316157579422, |
| "step": 2420, |
| "valid_targets_mean": 1944.9, |
| "valid_targets_min": 578 |
| }, |
| { |
| "epoch": 3.8924558587479936, |
| "grad_norm": 0.7653474014396054, |
| "learning_rate": 1.959972185284203e-05, |
| "loss": 0.1873, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.20480495691299438, |
| "step": 2425, |
| "valid_targets_mean": 2137.4, |
| "valid_targets_min": 711 |
| }, |
| { |
| "epoch": 3.900481540930979, |
| "grad_norm": 0.7119154640913655, |
| "learning_rate": 1.951968033493999e-05, |
| "loss": 0.1916, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.22431352734565735, |
| "step": 2430, |
| "valid_targets_mean": 2569.9, |
| "valid_targets_min": 922 |
| }, |
| { |
| "epoch": 3.908507223113965, |
| "grad_norm": 0.6933243254616628, |
| "learning_rate": 1.9439646513861748e-05, |
| "loss": 0.189, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1814383864402771, |
| "step": 2435, |
| "valid_targets_mean": 2834.9, |
| "valid_targets_min": 721 |
| }, |
| { |
| "epoch": 3.9165329052969504, |
| "grad_norm": 0.7003573100002531, |
| "learning_rate": 1.93596216720995e-05, |
| "loss": 0.1975, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1896560937166214, |
| "step": 2440, |
| "valid_targets_mean": 2383.5, |
| "valid_targets_min": 703 |
| }, |
| { |
| "epoch": 3.924558587479936, |
| "grad_norm": 0.7987554233995582, |
| "learning_rate": 1.9279607092001534e-05, |
| "loss": 0.1912, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17562270164489746, |
| "step": 2445, |
| "valid_targets_mean": 1630.9, |
| "valid_targets_min": 812 |
| }, |
| { |
| "epoch": 3.932584269662921, |
| "grad_norm": 0.7727774163624671, |
| "learning_rate": 1.9199604055751718e-05, |
| "loss": 0.1937, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2166813164949417, |
| "step": 2450, |
| "valid_targets_mean": 2261.4, |
| "valid_targets_min": 881 |
| }, |
| { |
| "epoch": 3.940609951845907, |
| "grad_norm": 0.8131949994370706, |
| "learning_rate": 1.9119613845348935e-05, |
| "loss": 0.1931, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1931370496749878, |
| "step": 2455, |
| "valid_targets_mean": 2146.0, |
| "valid_targets_min": 665 |
| }, |
| { |
| "epoch": 3.9486356340288924, |
| "grad_norm": 0.7543765118463652, |
| "learning_rate": 1.9039637742586545e-05, |
| "loss": 0.1935, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18845586478710175, |
| "step": 2460, |
| "valid_targets_mean": 1944.2, |
| "valid_targets_min": 990 |
| }, |
| { |
| "epoch": 3.956661316211878, |
| "grad_norm": 0.8095687971348281, |
| "learning_rate": 1.8959677029031832e-05, |
| "loss": 0.1764, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.19238343834877014, |
| "step": 2465, |
| "valid_targets_mean": 2164.7, |
| "valid_targets_min": 890 |
| }, |
| { |
| "epoch": 3.9646869983948636, |
| "grad_norm": 0.8236185986919573, |
| "learning_rate": 1.8879732986005476e-05, |
| "loss": 0.2015, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.19786785542964935, |
| "step": 2470, |
| "valid_targets_mean": 1725.6, |
| "valid_targets_min": 744 |
| }, |
| { |
| "epoch": 3.972712680577849, |
| "grad_norm": 0.9277927282461786, |
| "learning_rate": 1.8799806894561042e-05, |
| "loss": 0.1974, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2078876495361328, |
| "step": 2475, |
| "valid_targets_mean": 2197.4, |
| "valid_targets_min": 1186 |
| }, |
| { |
| "epoch": 3.980738362760835, |
| "grad_norm": 0.7514885129339864, |
| "learning_rate": 1.8719900035464412e-05, |
| "loss": 0.1936, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16057060658931732, |
| "step": 2480, |
| "valid_targets_mean": 1605.2, |
| "valid_targets_min": 645 |
| }, |
| { |
| "epoch": 3.98876404494382, |
| "grad_norm": 0.6523845582349944, |
| "learning_rate": 1.864001368917328e-05, |
| "loss": 0.1882, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.19543814659118652, |
| "step": 2485, |
| "valid_targets_mean": 2637.5, |
| "valid_targets_min": 689 |
| }, |
| { |
| "epoch": 3.9967897271268056, |
| "grad_norm": 0.7614952279373743, |
| "learning_rate": 1.856014913581666e-05, |
| "loss": 0.1922, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.19684013724327087, |
| "step": 2490, |
| "valid_targets_mean": 2091.9, |
| "valid_targets_min": 786 |
| }, |
| { |
| "epoch": 4.004815409309791, |
| "grad_norm": 0.7598894989729227, |
| "learning_rate": 1.8480307655174322e-05, |
| "loss": 0.1732, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16470491886138916, |
| "step": 2495, |
| "valid_targets_mean": 1833.8, |
| "valid_targets_min": 567 |
| }, |
| { |
| "epoch": 4.012841091492777, |
| "grad_norm": 0.7220917183884463, |
| "learning_rate": 1.8400490526656322e-05, |
| "loss": 0.1642, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1639862060546875, |
| "step": 2500, |
| "valid_targets_mean": 2315.0, |
| "valid_targets_min": 835 |
| }, |
| { |
| "epoch": 4.020866773675762, |
| "grad_norm": 0.7146247317400145, |
| "learning_rate": 1.8320699029282477e-05, |
| "loss": 0.1459, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1569473147392273, |
| "step": 2505, |
| "valid_targets_mean": 2658.7, |
| "valid_targets_min": 617 |
| }, |
| { |
| "epoch": 4.028892455858748, |
| "grad_norm": 0.7357502371403062, |
| "learning_rate": 1.8240934441661898e-05, |
| "loss": 0.1693, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15852639079093933, |
| "step": 2510, |
| "valid_targets_mean": 2141.9, |
| "valid_targets_min": 551 |
| }, |
| { |
| "epoch": 4.036918138041734, |
| "grad_norm": 0.9021773647071464, |
| "learning_rate": 1.8161198041972478e-05, |
| "loss": 0.1611, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15807832777500153, |
| "step": 2515, |
| "valid_targets_mean": 1685.3, |
| "valid_targets_min": 687 |
| }, |
| { |
| "epoch": 4.044943820224719, |
| "grad_norm": 0.8267907751505533, |
| "learning_rate": 1.8081491107940405e-05, |
| "loss": 0.157, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1717631220817566, |
| "step": 2520, |
| "valid_targets_mean": 1869.8, |
| "valid_targets_min": 922 |
| }, |
| { |
| "epoch": 4.052969502407705, |
| "grad_norm": 0.8272280336042476, |
| "learning_rate": 1.8001814916819706e-05, |
| "loss": 0.1633, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15036287903785706, |
| "step": 2525, |
| "valid_targets_mean": 2030.8, |
| "valid_targets_min": 660 |
| }, |
| { |
| "epoch": 4.06099518459069, |
| "grad_norm": 0.750320928818136, |
| "learning_rate": 1.7922170745371782e-05, |
| "loss": 0.1631, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15992726385593414, |
| "step": 2530, |
| "valid_targets_mean": 2341.8, |
| "valid_targets_min": 752 |
| }, |
| { |
| "epoch": 4.069020866773676, |
| "grad_norm": 0.710265161172677, |
| "learning_rate": 1.7842559869844926e-05, |
| "loss": 0.1616, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16481420397758484, |
| "step": 2535, |
| "valid_targets_mean": 2390.8, |
| "valid_targets_min": 879 |
| }, |
| { |
| "epoch": 4.077046548956662, |
| "grad_norm": 0.6932511885249728, |
| "learning_rate": 1.7762983565953882e-05, |
| "loss": 0.1604, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15228337049484253, |
| "step": 2540, |
| "valid_targets_mean": 2558.4, |
| "valid_targets_min": 1005 |
| }, |
| { |
| "epoch": 4.085072231139647, |
| "grad_norm": 0.9665904156345935, |
| "learning_rate": 1.768344310885941e-05, |
| "loss": 0.1585, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1605364829301834, |
| "step": 2545, |
| "valid_targets_mean": 1897.4, |
| "valid_targets_min": 619 |
| }, |
| { |
| "epoch": 4.093097913322633, |
| "grad_norm": 0.8370869748032498, |
| "learning_rate": 1.760393977314786e-05, |
| "loss": 0.1582, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1575726568698883, |
| "step": 2550, |
| "valid_targets_mean": 1763.5, |
| "valid_targets_min": 697 |
| }, |
| { |
| "epoch": 4.101123595505618, |
| "grad_norm": 0.851361799332316, |
| "learning_rate": 1.7524474832810715e-05, |
| "loss": 0.1517, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15234051644802094, |
| "step": 2555, |
| "valid_targets_mean": 1794.1, |
| "valid_targets_min": 759 |
| }, |
| { |
| "epoch": 4.109149277688603, |
| "grad_norm": 0.8670710844035465, |
| "learning_rate": 1.7445049561224197e-05, |
| "loss": 0.158, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18183620274066925, |
| "step": 2560, |
| "valid_targets_mean": 1944.7, |
| "valid_targets_min": 802 |
| }, |
| { |
| "epoch": 4.117174959871589, |
| "grad_norm": 0.8008124802397306, |
| "learning_rate": 1.736566523112888e-05, |
| "loss": 0.1617, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1569271683692932, |
| "step": 2565, |
| "valid_targets_mean": 1758.4, |
| "valid_targets_min": 963 |
| }, |
| { |
| "epoch": 4.125200642054574, |
| "grad_norm": 0.7244247443223619, |
| "learning_rate": 1.7286323114609264e-05, |
| "loss": 0.1652, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16013914346694946, |
| "step": 2570, |
| "valid_targets_mean": 2266.8, |
| "valid_targets_min": 695 |
| }, |
| { |
| "epoch": 4.13322632423756, |
| "grad_norm": 0.7258758426401232, |
| "learning_rate": 1.7207024483073395e-05, |
| "loss": 0.1528, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1507132351398468, |
| "step": 2575, |
| "valid_targets_mean": 2195.1, |
| "valid_targets_min": 797 |
| }, |
| { |
| "epoch": 4.141252006420546, |
| "grad_norm": 0.7747021374459989, |
| "learning_rate": 1.7127770607232506e-05, |
| "loss": 0.165, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16840553283691406, |
| "step": 2580, |
| "valid_targets_mean": 2432.6, |
| "valid_targets_min": 899 |
| }, |
| { |
| "epoch": 4.149277688603531, |
| "grad_norm": 0.8370328803383551, |
| "learning_rate": 1.7048562757080658e-05, |
| "loss": 0.1517, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15022283792495728, |
| "step": 2585, |
| "valid_targets_mean": 2054.2, |
| "valid_targets_min": 1080 |
| }, |
| { |
| "epoch": 4.157303370786517, |
| "grad_norm": 0.863183572527677, |
| "learning_rate": 1.6969402201874358e-05, |
| "loss": 0.1688, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18424132466316223, |
| "step": 2590, |
| "valid_targets_mean": 1905.8, |
| "valid_targets_min": 672 |
| }, |
| { |
| "epoch": 4.165329052969502, |
| "grad_norm": 0.7325225003293633, |
| "learning_rate": 1.6890290210112268e-05, |
| "loss": 0.1648, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16462567448616028, |
| "step": 2595, |
| "valid_targets_mean": 2701.8, |
| "valid_targets_min": 884 |
| }, |
| { |
| "epoch": 4.173354735152488, |
| "grad_norm": 0.8550527776626037, |
| "learning_rate": 1.6811228049514828e-05, |
| "loss": 0.1628, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18417339026927948, |
| "step": 2600, |
| "valid_targets_mean": 2102.4, |
| "valid_targets_min": 801 |
| }, |
| { |
| "epoch": 4.181380417335474, |
| "grad_norm": 0.7738912822273089, |
| "learning_rate": 1.6732216987003972e-05, |
| "loss": 0.1657, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14265528321266174, |
| "step": 2605, |
| "valid_targets_mean": 2429.2, |
| "valid_targets_min": 726 |
| }, |
| { |
| "epoch": 4.189406099518459, |
| "grad_norm": 0.846741833270454, |
| "learning_rate": 1.6653258288682815e-05, |
| "loss": 0.1591, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.165584534406662, |
| "step": 2610, |
| "valid_targets_mean": 2022.3, |
| "valid_targets_min": 682 |
| }, |
| { |
| "epoch": 4.197431781701445, |
| "grad_norm": 0.7860604699119313, |
| "learning_rate": 1.6574353219815383e-05, |
| "loss": 0.1622, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17301838099956512, |
| "step": 2615, |
| "valid_targets_mean": 2509.3, |
| "valid_targets_min": 864 |
| }, |
| { |
| "epoch": 4.20545746388443, |
| "grad_norm": 0.6042094358589516, |
| "learning_rate": 1.6495503044806305e-05, |
| "loss": 0.1597, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1679677814245224, |
| "step": 2620, |
| "valid_targets_mean": 4193.2, |
| "valid_targets_min": 1385 |
| }, |
| { |
| "epoch": 4.213483146067416, |
| "grad_norm": 0.8435205892952795, |
| "learning_rate": 1.641670902718058e-05, |
| "loss": 0.1666, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16670869290828705, |
| "step": 2625, |
| "valid_targets_mean": 1701.4, |
| "valid_targets_min": 750 |
| }, |
| { |
| "epoch": 4.221508828250402, |
| "grad_norm": 0.8069505344707392, |
| "learning_rate": 1.633797242956332e-05, |
| "loss": 0.168, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17490074038505554, |
| "step": 2630, |
| "valid_targets_mean": 2187.9, |
| "valid_targets_min": 808 |
| }, |
| { |
| "epoch": 4.229534510433387, |
| "grad_norm": 0.7681332462758949, |
| "learning_rate": 1.625929451365951e-05, |
| "loss": 0.1565, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.139631450176239, |
| "step": 2635, |
| "valid_targets_mean": 2152.5, |
| "valid_targets_min": 825 |
| }, |
| { |
| "epoch": 4.237560192616373, |
| "grad_norm": 0.7743079695057093, |
| "learning_rate": 1.618067654023381e-05, |
| "loss": 0.1593, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15092188119888306, |
| "step": 2640, |
| "valid_targets_mean": 2007.7, |
| "valid_targets_min": 788 |
| }, |
| { |
| "epoch": 4.245585874799358, |
| "grad_norm": 0.8045522607448906, |
| "learning_rate": 1.6102119769090325e-05, |
| "loss": 0.159, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15477828681468964, |
| "step": 2645, |
| "valid_targets_mean": 2015.0, |
| "valid_targets_min": 1041 |
| }, |
| { |
| "epoch": 4.253611556982343, |
| "grad_norm": 0.7842184804024716, |
| "learning_rate": 1.6023625459052442e-05, |
| "loss": 0.1623, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14832571148872375, |
| "step": 2650, |
| "valid_targets_mean": 1659.8, |
| "valid_targets_min": 739 |
| }, |
| { |
| "epoch": 4.261637239165329, |
| "grad_norm": 0.8453627359844748, |
| "learning_rate": 1.594519486794264e-05, |
| "loss": 0.1634, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17142939567565918, |
| "step": 2655, |
| "valid_targets_mean": 1726.5, |
| "valid_targets_min": 650 |
| }, |
| { |
| "epoch": 4.269662921348314, |
| "grad_norm": 0.68904498722134, |
| "learning_rate": 1.586682925256235e-05, |
| "loss": 0.1541, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1561916470527649, |
| "step": 2660, |
| "valid_targets_mean": 2864.8, |
| "valid_targets_min": 946 |
| }, |
| { |
| "epoch": 4.2776886035313, |
| "grad_norm": 0.7432020014717042, |
| "learning_rate": 1.5788529868671792e-05, |
| "loss": 0.1553, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16694585978984833, |
| "step": 2665, |
| "valid_targets_mean": 2652.6, |
| "valid_targets_min": 724 |
| }, |
| { |
| "epoch": 4.285714285714286, |
| "grad_norm": 0.8573411887216612, |
| "learning_rate": 1.5710297970969893e-05, |
| "loss": 0.1604, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16618192195892334, |
| "step": 2670, |
| "valid_targets_mean": 1786.7, |
| "valid_targets_min": 591 |
| }, |
| { |
| "epoch": 4.293739967897271, |
| "grad_norm": 0.8616537427897845, |
| "learning_rate": 1.563213481307413e-05, |
| "loss": 0.1607, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1844010055065155, |
| "step": 2675, |
| "valid_targets_mean": 2021.8, |
| "valid_targets_min": 859 |
| }, |
| { |
| "epoch": 4.301765650080257, |
| "grad_norm": 0.7980069825955369, |
| "learning_rate": 1.5554041647500485e-05, |
| "loss": 0.1652, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18299910426139832, |
| "step": 2680, |
| "valid_targets_mean": 2434.2, |
| "valid_targets_min": 597 |
| }, |
| { |
| "epoch": 4.309791332263242, |
| "grad_norm": 0.7786630652444673, |
| "learning_rate": 1.5476019725643342e-05, |
| "loss": 0.1631, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17932823300361633, |
| "step": 2685, |
| "valid_targets_mean": 2057.4, |
| "valid_targets_min": 652 |
| }, |
| { |
| "epoch": 4.317817014446228, |
| "grad_norm": 0.8119610141424436, |
| "learning_rate": 1.5398070297755465e-05, |
| "loss": 0.1652, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1823132038116455, |
| "step": 2690, |
| "valid_targets_mean": 2320.1, |
| "valid_targets_min": 633 |
| }, |
| { |
| "epoch": 4.325842696629214, |
| "grad_norm": 0.8571455033898614, |
| "learning_rate": 1.5320194612927935e-05, |
| "loss": 0.1661, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.19664575159549713, |
| "step": 2695, |
| "valid_targets_mean": 2258.8, |
| "valid_targets_min": 826 |
| }, |
| { |
| "epoch": 4.333868378812199, |
| "grad_norm": 0.810464889478973, |
| "learning_rate": 1.5242393919070146e-05, |
| "loss": 0.1665, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16627417504787445, |
| "step": 2700, |
| "valid_targets_mean": 1929.9, |
| "valid_targets_min": 821 |
| }, |
| { |
| "epoch": 4.341894060995185, |
| "grad_norm": 0.8148753400319572, |
| "learning_rate": 1.5164669462889825e-05, |
| "loss": 0.1637, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14969250559806824, |
| "step": 2705, |
| "valid_targets_mean": 1406.3, |
| "valid_targets_min": 760 |
| }, |
| { |
| "epoch": 4.34991974317817, |
| "grad_norm": 0.7742908439387767, |
| "learning_rate": 1.5087022489873016e-05, |
| "loss": 0.1619, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15673664212226868, |
| "step": 2710, |
| "valid_targets_mean": 2016.5, |
| "valid_targets_min": 776 |
| }, |
| { |
| "epoch": 4.357945425361156, |
| "grad_norm": 0.8241151599270962, |
| "learning_rate": 1.5009454244264156e-05, |
| "loss": 0.1627, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16360478103160858, |
| "step": 2715, |
| "valid_targets_mean": 2072.0, |
| "valid_targets_min": 563 |
| }, |
| { |
| "epoch": 4.365971107544142, |
| "grad_norm": 0.7258922171050899, |
| "learning_rate": 1.4931965969046113e-05, |
| "loss": 0.1671, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1603405475616455, |
| "step": 2720, |
| "valid_targets_mean": 2382.3, |
| "valid_targets_min": 1182 |
| }, |
| { |
| "epoch": 4.373996789727126, |
| "grad_norm": 0.746718193097595, |
| "learning_rate": 1.4854558905920303e-05, |
| "loss": 0.1578, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1559460312128067, |
| "step": 2725, |
| "valid_targets_mean": 2081.0, |
| "valid_targets_min": 622 |
| }, |
| { |
| "epoch": 4.382022471910112, |
| "grad_norm": 0.8753737997888681, |
| "learning_rate": 1.4777234295286742e-05, |
| "loss": 0.162, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15468575060367584, |
| "step": 2730, |
| "valid_targets_mean": 1593.1, |
| "valid_targets_min": 634 |
| }, |
| { |
| "epoch": 4.390048154093098, |
| "grad_norm": 0.8037530854979934, |
| "learning_rate": 1.469999337622421e-05, |
| "loss": 0.1671, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16917386651039124, |
| "step": 2735, |
| "valid_targets_mean": 2151.1, |
| "valid_targets_min": 627 |
| }, |
| { |
| "epoch": 4.398073836276083, |
| "grad_norm": 0.8500743057064097, |
| "learning_rate": 1.4622837386470373e-05, |
| "loss": 0.16, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.166961207985878, |
| "step": 2740, |
| "valid_targets_mean": 1751.0, |
| "valid_targets_min": 740 |
| }, |
| { |
| "epoch": 4.406099518459069, |
| "grad_norm": 0.8311068179954831, |
| "learning_rate": 1.4545767562401973e-05, |
| "loss": 0.17, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15660396218299866, |
| "step": 2745, |
| "valid_targets_mean": 1665.8, |
| "valid_targets_min": 728 |
| }, |
| { |
| "epoch": 4.414125200642054, |
| "grad_norm": 0.7888439337676993, |
| "learning_rate": 1.4468785139014986e-05, |
| "loss": 0.1608, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16615541279315948, |
| "step": 2750, |
| "valid_targets_mean": 2020.2, |
| "valid_targets_min": 883 |
| }, |
| { |
| "epoch": 4.42215088282504, |
| "grad_norm": 0.7271702792121916, |
| "learning_rate": 1.4391891349904859e-05, |
| "loss": 0.1507, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1305883228778839, |
| "step": 2755, |
| "valid_targets_mean": 1820.6, |
| "valid_targets_min": 780 |
| }, |
| { |
| "epoch": 4.430176565008026, |
| "grad_norm": 0.8100289776181084, |
| "learning_rate": 1.4315087427246706e-05, |
| "loss": 0.1622, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16775105893611908, |
| "step": 2760, |
| "valid_targets_mean": 2011.5, |
| "valid_targets_min": 772 |
| }, |
| { |
| "epoch": 4.438202247191011, |
| "grad_norm": 0.8341886619638011, |
| "learning_rate": 1.4238374601775617e-05, |
| "loss": 0.1667, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.175085186958313, |
| "step": 2765, |
| "valid_targets_mean": 2030.1, |
| "valid_targets_min": 513 |
| }, |
| { |
| "epoch": 4.446227929373997, |
| "grad_norm": 0.7861876079484966, |
| "learning_rate": 1.4161754102766892e-05, |
| "loss": 0.1644, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16237448155879974, |
| "step": 2770, |
| "valid_targets_mean": 2125.4, |
| "valid_targets_min": 639 |
| }, |
| { |
| "epoch": 4.454253611556982, |
| "grad_norm": 0.7974795438274449, |
| "learning_rate": 1.4085227158016355e-05, |
| "loss": 0.1604, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1793215423822403, |
| "step": 2775, |
| "valid_targets_mean": 2240.8, |
| "valid_targets_min": 888 |
| }, |
| { |
| "epoch": 4.462279293739968, |
| "grad_norm": 0.7610583199711114, |
| "learning_rate": 1.4008794993820676e-05, |
| "loss": 0.1647, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16052846610546112, |
| "step": 2780, |
| "valid_targets_mean": 2020.9, |
| "valid_targets_min": 1038 |
| }, |
| { |
| "epoch": 4.470304975922954, |
| "grad_norm": 0.763307262888446, |
| "learning_rate": 1.3932458834957745e-05, |
| "loss": 0.1744, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16174271702766418, |
| "step": 2785, |
| "valid_targets_mean": 2038.5, |
| "valid_targets_min": 869 |
| }, |
| { |
| "epoch": 4.478330658105939, |
| "grad_norm": 0.7090993165393538, |
| "learning_rate": 1.3856219904667012e-05, |
| "loss": 0.1617, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17628321051597595, |
| "step": 2790, |
| "valid_targets_mean": 2747.6, |
| "valid_targets_min": 1289 |
| }, |
| { |
| "epoch": 4.486356340288925, |
| "grad_norm": 0.7844335568292791, |
| "learning_rate": 1.3780079424629893e-05, |
| "loss": 0.1675, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1669953465461731, |
| "step": 2795, |
| "valid_targets_mean": 2251.4, |
| "valid_targets_min": 792 |
| }, |
| { |
| "epoch": 4.49438202247191, |
| "grad_norm": 0.7237391782540498, |
| "learning_rate": 1.3704038614950221e-05, |
| "loss": 0.1634, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1593700349330902, |
| "step": 2800, |
| "valid_targets_mean": 2246.4, |
| "valid_targets_min": 635 |
| }, |
| { |
| "epoch": 4.502407704654896, |
| "grad_norm": 0.6662862730256653, |
| "learning_rate": 1.362809869413466e-05, |
| "loss": 0.1625, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15161554515361786, |
| "step": 2805, |
| "valid_targets_mean": 3524.4, |
| "valid_targets_min": 656 |
| }, |
| { |
| "epoch": 4.510433386837882, |
| "grad_norm": 0.7261025807643624, |
| "learning_rate": 1.355226087907319e-05, |
| "loss": 0.1699, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16334782540798187, |
| "step": 2810, |
| "valid_targets_mean": 2492.2, |
| "valid_targets_min": 635 |
| }, |
| { |
| "epoch": 4.518459069020867, |
| "grad_norm": 0.6893457421297444, |
| "learning_rate": 1.3476526385019609e-05, |
| "loss": 0.1642, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14589521288871765, |
| "step": 2815, |
| "valid_targets_mean": 2433.6, |
| "valid_targets_min": 996 |
| }, |
| { |
| "epoch": 4.526484751203852, |
| "grad_norm": 0.9075567951066162, |
| "learning_rate": 1.3400896425572078e-05, |
| "loss": 0.1622, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18327827751636505, |
| "step": 2820, |
| "valid_targets_mean": 1756.2, |
| "valid_targets_min": 714 |
| }, |
| { |
| "epoch": 4.534510433386838, |
| "grad_norm": 0.7717323287249781, |
| "learning_rate": 1.3325372212653638e-05, |
| "loss": 0.1586, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17693357169628143, |
| "step": 2825, |
| "valid_targets_mean": 2270.5, |
| "valid_targets_min": 1109 |
| }, |
| { |
| "epoch": 4.542536115569823, |
| "grad_norm": 0.7535197151026929, |
| "learning_rate": 1.324995495649281e-05, |
| "loss": 0.1584, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1388244926929474, |
| "step": 2830, |
| "valid_targets_mean": 2134.2, |
| "valid_targets_min": 704 |
| }, |
| { |
| "epoch": 4.550561797752809, |
| "grad_norm": 0.7741815820615187, |
| "learning_rate": 1.3174645865604201e-05, |
| "loss": 0.1651, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16817861795425415, |
| "step": 2835, |
| "valid_targets_mean": 2520.7, |
| "valid_targets_min": 826 |
| }, |
| { |
| "epoch": 4.558587479935794, |
| "grad_norm": 0.8231972416370127, |
| "learning_rate": 1.3099446146769146e-05, |
| "loss": 0.1629, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17522352933883667, |
| "step": 2840, |
| "valid_targets_mean": 2127.5, |
| "valid_targets_min": 727 |
| }, |
| { |
| "epoch": 4.56661316211878, |
| "grad_norm": 0.797161483789656, |
| "learning_rate": 1.302435700501635e-05, |
| "loss": 0.1728, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16017599403858185, |
| "step": 2845, |
| "valid_targets_mean": 2187.6, |
| "valid_targets_min": 618 |
| }, |
| { |
| "epoch": 4.574638844301766, |
| "grad_norm": 0.830389247613262, |
| "learning_rate": 1.294937964360259e-05, |
| "loss": 0.1592, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17233622074127197, |
| "step": 2850, |
| "valid_targets_mean": 1991.4, |
| "valid_targets_min": 728 |
| }, |
| { |
| "epoch": 4.582664526484751, |
| "grad_norm": 0.8604436677037445, |
| "learning_rate": 1.2874515263993435e-05, |
| "loss": 0.1646, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18079304695129395, |
| "step": 2855, |
| "valid_targets_mean": 1904.0, |
| "valid_targets_min": 738 |
| }, |
| { |
| "epoch": 4.590690208667737, |
| "grad_norm": 0.8182705272129311, |
| "learning_rate": 1.2799765065843994e-05, |
| "loss": 0.1664, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16060321033000946, |
| "step": 2860, |
| "valid_targets_mean": 1708.9, |
| "valid_targets_min": 709 |
| }, |
| { |
| "epoch": 4.598715890850722, |
| "grad_norm": 0.7893789950794092, |
| "learning_rate": 1.2725130246979683e-05, |
| "loss": 0.1602, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15286454558372498, |
| "step": 2865, |
| "valid_targets_mean": 1979.1, |
| "valid_targets_min": 909 |
| }, |
| { |
| "epoch": 4.606741573033708, |
| "grad_norm": 0.6505588257536744, |
| "learning_rate": 1.2650612003377036e-05, |
| "loss": 0.1597, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14304134249687195, |
| "step": 2870, |
| "valid_targets_mean": 2717.9, |
| "valid_targets_min": 1156 |
| }, |
| { |
| "epoch": 4.614767255216694, |
| "grad_norm": 0.78593772720222, |
| "learning_rate": 1.2576211529144554e-05, |
| "loss": 0.16, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15942759811878204, |
| "step": 2875, |
| "valid_targets_mean": 2011.0, |
| "valid_targets_min": 873 |
| }, |
| { |
| "epoch": 4.622792937399679, |
| "grad_norm": 0.8273283308452407, |
| "learning_rate": 1.2501930016503541e-05, |
| "loss": 0.1671, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17127399146556854, |
| "step": 2880, |
| "valid_targets_mean": 1755.8, |
| "valid_targets_min": 774 |
| }, |
| { |
| "epoch": 4.630818619582665, |
| "grad_norm": 0.7348995377336468, |
| "learning_rate": 1.2427768655769024e-05, |
| "loss": 0.1884, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.22157861292362213, |
| "step": 2885, |
| "valid_targets_mean": 2057.2, |
| "valid_targets_min": 675 |
| }, |
| { |
| "epoch": 4.63884430176565, |
| "grad_norm": 0.8505145389671085, |
| "learning_rate": 1.2353728635330667e-05, |
| "loss": 0.1636, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16335329413414001, |
| "step": 2890, |
| "valid_targets_mean": 1816.2, |
| "valid_targets_min": 625 |
| }, |
| { |
| "epoch": 4.646869983948635, |
| "grad_norm": 1.37076025694794, |
| "learning_rate": 1.2279811141633735e-05, |
| "loss": 0.171, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1675649881362915, |
| "step": 2895, |
| "valid_targets_mean": 2360.0, |
| "valid_targets_min": 636 |
| }, |
| { |
| "epoch": 4.654895666131621, |
| "grad_norm": 0.732275170804169, |
| "learning_rate": 1.2206017359160075e-05, |
| "loss": 0.1564, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1485610008239746, |
| "step": 2900, |
| "valid_targets_mean": 1736.9, |
| "valid_targets_min": 700 |
| }, |
| { |
| "epoch": 4.662921348314606, |
| "grad_norm": 0.8216973272949605, |
| "learning_rate": 1.2132348470409143e-05, |
| "loss": 0.1689, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18894213438034058, |
| "step": 2905, |
| "valid_targets_mean": 2240.9, |
| "valid_targets_min": 1017 |
| }, |
| { |
| "epoch": 4.670947030497592, |
| "grad_norm": 0.8075689232117615, |
| "learning_rate": 1.2058805655879038e-05, |
| "loss": 0.1607, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16298025846481323, |
| "step": 2910, |
| "valid_targets_mean": 2005.5, |
| "valid_targets_min": 796 |
| }, |
| { |
| "epoch": 4.678972712680578, |
| "grad_norm": 0.8159417807899707, |
| "learning_rate": 1.198539009404762e-05, |
| "loss": 0.1637, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16406571865081787, |
| "step": 2915, |
| "valid_targets_mean": 1778.8, |
| "valid_targets_min": 727 |
| }, |
| { |
| "epoch": 4.686998394863563, |
| "grad_norm": 0.8256426953405346, |
| "learning_rate": 1.1912102961353584e-05, |
| "loss": 0.1636, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17584344744682312, |
| "step": 2920, |
| "valid_targets_mean": 1622.3, |
| "valid_targets_min": 936 |
| }, |
| { |
| "epoch": 4.695024077046549, |
| "grad_norm": 0.7691107031706801, |
| "learning_rate": 1.1838945432177635e-05, |
| "loss": 0.1699, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18694257736206055, |
| "step": 2925, |
| "valid_targets_mean": 2771.9, |
| "valid_targets_min": 1366 |
| }, |
| { |
| "epoch": 4.703049759229534, |
| "grad_norm": 0.7516487224153081, |
| "learning_rate": 1.1765918678823662e-05, |
| "loss": 0.1643, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15113398432731628, |
| "step": 2930, |
| "valid_targets_mean": 1985.2, |
| "valid_targets_min": 1092 |
| }, |
| { |
| "epoch": 4.71107544141252, |
| "grad_norm": 0.7618974789209155, |
| "learning_rate": 1.1693023871499957e-05, |
| "loss": 0.1659, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.165465846657753, |
| "step": 2935, |
| "valid_targets_mean": 2225.2, |
| "valid_targets_min": 746 |
| }, |
| { |
| "epoch": 4.719101123595506, |
| "grad_norm": 0.8149074036818159, |
| "learning_rate": 1.1620262178300456e-05, |
| "loss": 0.1597, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16010752320289612, |
| "step": 2940, |
| "valid_targets_mean": 1913.2, |
| "valid_targets_min": 715 |
| }, |
| { |
| "epoch": 4.727126805778491, |
| "grad_norm": 0.8197427071898096, |
| "learning_rate": 1.1547634765186016e-05, |
| "loss": 0.1691, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17915387451648712, |
| "step": 2945, |
| "valid_targets_mean": 2063.6, |
| "valid_targets_min": 645 |
| }, |
| { |
| "epoch": 4.735152487961477, |
| "grad_norm": 0.7472007206086239, |
| "learning_rate": 1.1475142795965757e-05, |
| "loss": 0.1592, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14832112193107605, |
| "step": 2950, |
| "valid_targets_mean": 2198.4, |
| "valid_targets_min": 703 |
| }, |
| { |
| "epoch": 4.743178170144462, |
| "grad_norm": 0.716859850891493, |
| "learning_rate": 1.140278743227837e-05, |
| "loss": 0.1763, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1730707287788391, |
| "step": 2955, |
| "valid_targets_mean": 2579.7, |
| "valid_targets_min": 1013 |
| }, |
| { |
| "epoch": 4.751203852327448, |
| "grad_norm": 0.7593041479712695, |
| "learning_rate": 1.1330569833573551e-05, |
| "loss": 0.1582, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16250699758529663, |
| "step": 2960, |
| "valid_targets_mean": 2219.4, |
| "valid_targets_min": 593 |
| }, |
| { |
| "epoch": 4.759229534510434, |
| "grad_norm": 0.7933693825582795, |
| "learning_rate": 1.1258491157093396e-05, |
| "loss": 0.1585, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1603544056415558, |
| "step": 2965, |
| "valid_targets_mean": 2217.6, |
| "valid_targets_min": 954 |
| }, |
| { |
| "epoch": 4.767255216693419, |
| "grad_norm": 0.7743905745905229, |
| "learning_rate": 1.1186552557853825e-05, |
| "loss": 0.1579, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1547103375196457, |
| "step": 2970, |
| "valid_targets_mean": 2139.5, |
| "valid_targets_min": 909 |
| }, |
| { |
| "epoch": 4.775280898876405, |
| "grad_norm": 0.820583631476114, |
| "learning_rate": 1.1114755188626168e-05, |
| "loss": 0.1587, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1643066108226776, |
| "step": 2975, |
| "valid_targets_mean": 2056.4, |
| "valid_targets_min": 1132 |
| }, |
| { |
| "epoch": 4.78330658105939, |
| "grad_norm": 0.8466563247928943, |
| "learning_rate": 1.104310019991857e-05, |
| "loss": 0.1655, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1671457588672638, |
| "step": 2980, |
| "valid_targets_mean": 1896.4, |
| "valid_targets_min": 888 |
| }, |
| { |
| "epoch": 4.791332263242376, |
| "grad_norm": 0.8354506195581702, |
| "learning_rate": 1.0971588739957656e-05, |
| "loss": 0.173, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16162726283073425, |
| "step": 2985, |
| "valid_targets_mean": 2007.1, |
| "valid_targets_min": 591 |
| }, |
| { |
| "epoch": 4.799357945425362, |
| "grad_norm": 1.062465812109398, |
| "learning_rate": 1.0900221954670088e-05, |
| "loss": 0.1657, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17890310287475586, |
| "step": 2990, |
| "valid_targets_mean": 1936.5, |
| "valid_targets_min": 638 |
| }, |
| { |
| "epoch": 4.807383627608346, |
| "grad_norm": 0.8028726047167257, |
| "learning_rate": 1.0829000987664182e-05, |
| "loss": 0.1608, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16547292470932007, |
| "step": 2995, |
| "valid_targets_mean": 2699.4, |
| "valid_targets_min": 683 |
| }, |
| { |
| "epoch": 4.815409309791332, |
| "grad_norm": 0.8256326317127171, |
| "learning_rate": 1.0757926980211631e-05, |
| "loss": 0.1678, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1672663390636444, |
| "step": 3000, |
| "valid_targets_mean": 1877.8, |
| "valid_targets_min": 518 |
| }, |
| { |
| "epoch": 4.823434991974318, |
| "grad_norm": 0.7478820911221347, |
| "learning_rate": 1.0687001071229193e-05, |
| "loss": 0.151, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1408068835735321, |
| "step": 3005, |
| "valid_targets_mean": 1811.9, |
| "valid_targets_min": 959 |
| }, |
| { |
| "epoch": 4.831460674157303, |
| "grad_norm": 0.726272372822568, |
| "learning_rate": 1.0616224397260418e-05, |
| "loss": 0.1585, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15432113409042358, |
| "step": 3010, |
| "valid_targets_mean": 2357.8, |
| "valid_targets_min": 893 |
| }, |
| { |
| "epoch": 4.839486356340289, |
| "grad_norm": 0.7902014084251503, |
| "learning_rate": 1.0545598092457486e-05, |
| "loss": 0.1717, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18471723794937134, |
| "step": 3015, |
| "valid_targets_mean": 2332.9, |
| "valid_targets_min": 1070 |
| }, |
| { |
| "epoch": 4.847512038523274, |
| "grad_norm": 0.7605054462637847, |
| "learning_rate": 1.0475123288562973e-05, |
| "loss": 0.1638, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17729586362838745, |
| "step": 3020, |
| "valid_targets_mean": 2387.9, |
| "valid_targets_min": 1055 |
| }, |
| { |
| "epoch": 4.85553772070626, |
| "grad_norm": 0.7484290704810759, |
| "learning_rate": 1.0404801114891778e-05, |
| "loss": 0.1601, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16589263081550598, |
| "step": 3025, |
| "valid_targets_mean": 2440.9, |
| "valid_targets_min": 662 |
| }, |
| { |
| "epoch": 4.863563402889246, |
| "grad_norm": 0.856515566605694, |
| "learning_rate": 1.033463269831299e-05, |
| "loss": 0.1639, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1638427972793579, |
| "step": 3030, |
| "valid_targets_mean": 1848.2, |
| "valid_targets_min": 818 |
| }, |
| { |
| "epoch": 4.871589085072231, |
| "grad_norm": 0.8236028327289647, |
| "learning_rate": 1.0264619163231806e-05, |
| "loss": 0.1703, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14224272966384888, |
| "step": 3035, |
| "valid_targets_mean": 1927.8, |
| "valid_targets_min": 634 |
| }, |
| { |
| "epoch": 4.879614767255217, |
| "grad_norm": 0.8834260640383598, |
| "learning_rate": 1.0194761631571582e-05, |
| "loss": 0.1659, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1616498827934265, |
| "step": 3040, |
| "valid_targets_mean": 1653.1, |
| "valid_targets_min": 724 |
| }, |
| { |
| "epoch": 4.887640449438202, |
| "grad_norm": 0.884548808230801, |
| "learning_rate": 1.0125061222755803e-05, |
| "loss": 0.1627, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16663256287574768, |
| "step": 3045, |
| "valid_targets_mean": 1720.1, |
| "valid_targets_min": 734 |
| }, |
| { |
| "epoch": 4.895666131621188, |
| "grad_norm": 0.749412699231492, |
| "learning_rate": 1.0055519053690143e-05, |
| "loss": 0.1675, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17901411652565002, |
| "step": 3050, |
| "valid_targets_mean": 2867.6, |
| "valid_targets_min": 957 |
| }, |
| { |
| "epoch": 4.903691813804174, |
| "grad_norm": 0.7064928300374316, |
| "learning_rate": 9.986136238744611e-06, |
| "loss": 0.1566, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14298474788665771, |
| "step": 3055, |
| "valid_targets_mean": 2419.4, |
| "valid_targets_min": 720 |
| }, |
| { |
| "epoch": 4.911717495987159, |
| "grad_norm": 0.775858514439901, |
| "learning_rate": 9.916913889735631e-06, |
| "loss": 0.1604, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1682652235031128, |
| "step": 3060, |
| "valid_targets_mean": 2224.8, |
| "valid_targets_min": 723 |
| }, |
| { |
| "epoch": 4.919743178170145, |
| "grad_norm": 0.7840845068588912, |
| "learning_rate": 9.847853115908287e-06, |
| "loss": 0.1651, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16616985201835632, |
| "step": 3065, |
| "valid_targets_mean": 2093.0, |
| "valid_targets_min": 898 |
| }, |
| { |
| "epoch": 4.9277688603531296, |
| "grad_norm": 0.7358639310688878, |
| "learning_rate": 9.778955023918522e-06, |
| "loss": 0.1631, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16126513481140137, |
| "step": 3070, |
| "valid_targets_mean": 2444.2, |
| "valid_targets_min": 781 |
| }, |
| { |
| "epoch": 4.935794542536115, |
| "grad_norm": 0.7019002418904744, |
| "learning_rate": 9.710220717815378e-06, |
| "loss": 0.1589, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1442476511001587, |
| "step": 3075, |
| "valid_targets_mean": 2195.4, |
| "valid_targets_min": 858 |
| }, |
| { |
| "epoch": 4.943820224719101, |
| "grad_norm": 0.8891523546612572, |
| "learning_rate": 9.641651299023356e-06, |
| "loss": 0.1657, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17019495368003845, |
| "step": 3080, |
| "valid_targets_mean": 1681.1, |
| "valid_targets_min": 613 |
| }, |
| { |
| "epoch": 4.951845906902086, |
| "grad_norm": 0.8057149797037921, |
| "learning_rate": 9.573247866324735e-06, |
| "loss": 0.158, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14473962783813477, |
| "step": 3085, |
| "valid_targets_mean": 1626.6, |
| "valid_targets_min": 704 |
| }, |
| { |
| "epoch": 4.959871589085072, |
| "grad_norm": 0.9372704511945662, |
| "learning_rate": 9.505011515841955e-06, |
| "loss": 0.1738, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16392774879932404, |
| "step": 3090, |
| "valid_targets_mean": 2301.2, |
| "valid_targets_min": 798 |
| }, |
| { |
| "epoch": 4.967897271268058, |
| "grad_norm": 0.8552067075934405, |
| "learning_rate": 9.436943341020086e-06, |
| "loss": 0.1555, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1627275049686432, |
| "step": 3095, |
| "valid_targets_mean": 2126.2, |
| "valid_targets_min": 777 |
| }, |
| { |
| "epoch": 4.975922953451043, |
| "grad_norm": 0.7875758040462811, |
| "learning_rate": 9.369044432609286e-06, |
| "loss": 0.1644, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15442267060279846, |
| "step": 3100, |
| "valid_targets_mean": 1900.0, |
| "valid_targets_min": 790 |
| }, |
| { |
| "epoch": 4.983948635634029, |
| "grad_norm": 0.7598316679466666, |
| "learning_rate": 9.301315878647303e-06, |
| "loss": 0.1578, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1592252254486084, |
| "step": 3105, |
| "valid_targets_mean": 1947.6, |
| "valid_targets_min": 612 |
| }, |
| { |
| "epoch": 4.991974317817014, |
| "grad_norm": 0.8310232291090573, |
| "learning_rate": 9.233758764442093e-06, |
| "loss": 0.1654, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15542343258857727, |
| "step": 3110, |
| "valid_targets_mean": 2550.7, |
| "valid_targets_min": 763 |
| }, |
| { |
| "epoch": 5.0, |
| "grad_norm": 0.812388817451886, |
| "learning_rate": 9.166374172554362e-06, |
| "loss": 0.1549, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14916843175888062, |
| "step": 3115, |
| "valid_targets_mean": 1729.6, |
| "valid_targets_min": 663 |
| }, |
| { |
| "epoch": 5.008025682182986, |
| "grad_norm": 0.7607033094606126, |
| "learning_rate": 9.099163182780284e-06, |
| "loss": 0.1383, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.135885089635849, |
| "step": 3120, |
| "valid_targets_mean": 1814.1, |
| "valid_targets_min": 1124 |
| }, |
| { |
| "epoch": 5.016051364365971, |
| "grad_norm": 0.8736465666549718, |
| "learning_rate": 9.032126872134158e-06, |
| "loss": 0.1433, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.13772378861904144, |
| "step": 3125, |
| "valid_targets_mean": 1659.3, |
| "valid_targets_min": 718 |
| }, |
| { |
| "epoch": 5.024077046548957, |
| "grad_norm": 0.7904249272604563, |
| "learning_rate": 8.965266314831137e-06, |
| "loss": 0.1398, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.13139450550079346, |
| "step": 3130, |
| "valid_targets_mean": 1946.4, |
| "valid_targets_min": 732 |
| }, |
| { |
| "epoch": 5.032102728731942, |
| "grad_norm": 0.7929407682892132, |
| "learning_rate": 8.898582582270068e-06, |
| "loss": 0.1411, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14323486387729645, |
| "step": 3135, |
| "valid_targets_mean": 1973.4, |
| "valid_targets_min": 746 |
| }, |
| { |
| "epoch": 5.040128410914928, |
| "grad_norm": 0.866269311457836, |
| "learning_rate": 8.83207674301628e-06, |
| "loss": 0.1468, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14333856105804443, |
| "step": 3140, |
| "valid_targets_mean": 1734.8, |
| "valid_targets_min": 563 |
| }, |
| { |
| "epoch": 5.048154093097914, |
| "grad_norm": 0.9162778441988956, |
| "learning_rate": 8.765749862784455e-06, |
| "loss": 0.1456, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15251901745796204, |
| "step": 3145, |
| "valid_targets_mean": 1654.0, |
| "valid_targets_min": 591 |
| }, |
| { |
| "epoch": 5.056179775280899, |
| "grad_norm": 0.8407736851023895, |
| "learning_rate": 8.699603004421602e-06, |
| "loss": 0.1383, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.13436079025268555, |
| "step": 3150, |
| "valid_targets_mean": 2126.9, |
| "valid_targets_min": 677 |
| }, |
| { |
| "epoch": 5.064205457463885, |
| "grad_norm": 0.7832463394899054, |
| "learning_rate": 8.633637227889955e-06, |
| "loss": 0.14, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14068548381328583, |
| "step": 3155, |
| "valid_targets_mean": 1925.2, |
| "valid_targets_min": 923 |
| }, |
| { |
| "epoch": 5.07223113964687, |
| "grad_norm": 0.8639774265044126, |
| "learning_rate": 8.567853590250045e-06, |
| "loss": 0.1435, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15971428155899048, |
| "step": 3160, |
| "valid_targets_mean": 1906.4, |
| "valid_targets_min": 802 |
| }, |
| { |
| "epoch": 5.080256821829855, |
| "grad_norm": 0.7906584083707138, |
| "learning_rate": 8.502253145643752e-06, |
| "loss": 0.1384, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14278461039066315, |
| "step": 3165, |
| "valid_targets_mean": 2237.5, |
| "valid_targets_min": 823 |
| }, |
| { |
| "epoch": 5.088282504012841, |
| "grad_norm": 0.7628112750420695, |
| "learning_rate": 8.436836945277368e-06, |
| "loss": 0.1394, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.12936154007911682, |
| "step": 3170, |
| "valid_targets_mean": 2202.6, |
| "valid_targets_min": 704 |
| }, |
| { |
| "epoch": 5.096308186195826, |
| "grad_norm": 0.8267306131640556, |
| "learning_rate": 8.371606037404815e-06, |
| "loss": 0.1405, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14580325782299042, |
| "step": 3175, |
| "valid_targets_mean": 2161.2, |
| "valid_targets_min": 771 |
| }, |
| { |
| "epoch": 5.104333868378812, |
| "grad_norm": 0.6460612310814934, |
| "learning_rate": 8.306561467310812e-06, |
| "loss": 0.1394, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.12587103247642517, |
| "step": 3180, |
| "valid_targets_mean": 3042.2, |
| "valid_targets_min": 1359 |
| }, |
| { |
| "epoch": 5.112359550561798, |
| "grad_norm": 0.8017584928015836, |
| "learning_rate": 8.241704277294111e-06, |
| "loss": 0.1429, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1343742311000824, |
| "step": 3185, |
| "valid_targets_mean": 2129.9, |
| "valid_targets_min": 1002 |
| }, |
| { |
| "epoch": 5.120385232744783, |
| "grad_norm": 0.9038978661911155, |
| "learning_rate": 8.17703550665084e-06, |
| "loss": 0.1453, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15416087210178375, |
| "step": 3190, |
| "valid_targets_mean": 1875.1, |
| "valid_targets_min": 734 |
| }, |
| { |
| "epoch": 5.128410914927769, |
| "grad_norm": 0.8573022613515127, |
| "learning_rate": 8.112556191657824e-06, |
| "loss": 0.1483, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16371378302574158, |
| "step": 3195, |
| "valid_targets_mean": 2166.3, |
| "valid_targets_min": 768 |
| }, |
| { |
| "epoch": 5.136436597110754, |
| "grad_norm": 0.7790246108354407, |
| "learning_rate": 8.04826736555595e-06, |
| "loss": 0.1376, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.13910721242427826, |
| "step": 3200, |
| "valid_targets_mean": 1948.4, |
| "valid_targets_min": 891 |
| }, |
| { |
| "epoch": 5.14446227929374, |
| "grad_norm": 0.7766255832740316, |
| "learning_rate": 7.984170058533675e-06, |
| "loss": 0.1464, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.12751339375972748, |
| "step": 3205, |
| "valid_targets_mean": 2555.9, |
| "valid_targets_min": 638 |
| }, |
| { |
| "epoch": 5.152487961476726, |
| "grad_norm": 0.7917119654505816, |
| "learning_rate": 7.920265297710451e-06, |
| "loss": 0.1389, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1495143473148346, |
| "step": 3210, |
| "valid_targets_mean": 2617.8, |
| "valid_targets_min": 801 |
| }, |
| { |
| "epoch": 5.160513643659711, |
| "grad_norm": 0.7844470449050925, |
| "learning_rate": 7.85655410712032e-06, |
| "loss": 0.1504, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15069085359573364, |
| "step": 3215, |
| "valid_targets_mean": 2413.8, |
| "valid_targets_min": 691 |
| }, |
| { |
| "epoch": 5.168539325842697, |
| "grad_norm": 0.8339048928177408, |
| "learning_rate": 7.793037507695478e-06, |
| "loss": 0.1405, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1523759961128235, |
| "step": 3220, |
| "valid_targets_mean": 1656.4, |
| "valid_targets_min": 818 |
| }, |
| { |
| "epoch": 5.176565008025682, |
| "grad_norm": 0.7967130499731122, |
| "learning_rate": 7.729716517249899e-06, |
| "loss": 0.1468, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14771035313606262, |
| "step": 3225, |
| "valid_targets_mean": 2035.6, |
| "valid_targets_min": 722 |
| }, |
| { |
| "epoch": 5.184590690208668, |
| "grad_norm": 0.7684917293766128, |
| "learning_rate": 7.666592150463069e-06, |
| "loss": 0.1369, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.12404549866914749, |
| "step": 3230, |
| "valid_targets_mean": 2203.1, |
| "valid_targets_min": 713 |
| }, |
| { |
| "epoch": 5.192616372391654, |
| "grad_norm": 0.8176758283630357, |
| "learning_rate": 7.603665418863693e-06, |
| "loss": 0.1373, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1301923543214798, |
| "step": 3235, |
| "valid_targets_mean": 1912.1, |
| "valid_targets_min": 992 |
| }, |
| { |
| "epoch": 5.200642054574639, |
| "grad_norm": 0.838834519570343, |
| "learning_rate": 7.540937330813487e-06, |
| "loss": 0.1493, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1450478732585907, |
| "step": 3240, |
| "valid_targets_mean": 1830.1, |
| "valid_targets_min": 716 |
| }, |
| { |
| "epoch": 5.208667736757624, |
| "grad_norm": 0.85879810687639, |
| "learning_rate": 7.47840889149104e-06, |
| "loss": 0.1478, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1518646478652954, |
| "step": 3245, |
| "valid_targets_mean": 2411.8, |
| "valid_targets_min": 979 |
| }, |
| { |
| "epoch": 5.21669341894061, |
| "grad_norm": 0.9231616255122982, |
| "learning_rate": 7.416081102875696e-06, |
| "loss": 0.1458, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1643749177455902, |
| "step": 3250, |
| "valid_targets_mean": 2091.4, |
| "valid_targets_min": 776 |
| }, |
| { |
| "epoch": 5.224719101123595, |
| "grad_norm": 0.8492677793062714, |
| "learning_rate": 7.353954963731475e-06, |
| "loss": 0.1501, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.13949257135391235, |
| "step": 3255, |
| "valid_targets_mean": 1654.9, |
| "valid_targets_min": 1093 |
| }, |
| { |
| "epoch": 5.232744783306581, |
| "grad_norm": 0.7820953395694332, |
| "learning_rate": 7.292031469591121e-06, |
| "loss": 0.1453, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1359032392501831, |
| "step": 3260, |
| "valid_targets_mean": 1941.2, |
| "valid_targets_min": 787 |
| }, |
| { |
| "epoch": 5.240770465489566, |
| "grad_norm": 0.7968901999980463, |
| "learning_rate": 7.230311612740086e-06, |
| "loss": 0.1358, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14728347957134247, |
| "step": 3265, |
| "valid_targets_mean": 2289.1, |
| "valid_targets_min": 826 |
| }, |
| { |
| "epoch": 5.248796147672552, |
| "grad_norm": 0.8900568965689445, |
| "learning_rate": 7.168796382200682e-06, |
| "loss": 0.1411, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14544740319252014, |
| "step": 3270, |
| "valid_targets_mean": 1736.2, |
| "valid_targets_min": 676 |
| }, |
| { |
| "epoch": 5.256821829855538, |
| "grad_norm": 0.8484989618392149, |
| "learning_rate": 7.1074867637162185e-06, |
| "loss": 0.138, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.13557720184326172, |
| "step": 3275, |
| "valid_targets_mean": 1689.6, |
| "valid_targets_min": 957 |
| }, |
| { |
| "epoch": 5.264847512038523, |
| "grad_norm": 0.7914982828194392, |
| "learning_rate": 7.046383739735166e-06, |
| "loss": 0.1504, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15681229531764984, |
| "step": 3280, |
| "valid_targets_mean": 2608.4, |
| "valid_targets_min": 1052 |
| }, |
| { |
| "epoch": 5.272873194221509, |
| "grad_norm": 0.8523244039078887, |
| "learning_rate": 6.985488289395479e-06, |
| "loss": 0.1404, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.13885071873664856, |
| "step": 3285, |
| "valid_targets_mean": 1940.9, |
| "valid_targets_min": 876 |
| }, |
| { |
| "epoch": 5.280898876404494, |
| "grad_norm": 0.9243935198555188, |
| "learning_rate": 6.924801388508868e-06, |
| "loss": 0.1494, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1328265368938446, |
| "step": 3290, |
| "valid_targets_mean": 1775.9, |
| "valid_targets_min": 641 |
| }, |
| { |
| "epoch": 5.28892455858748, |
| "grad_norm": 1.1133751117817525, |
| "learning_rate": 6.864324009545154e-06, |
| "loss": 0.1392, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14222298562526703, |
| "step": 3295, |
| "valid_targets_mean": 1608.2, |
| "valid_targets_min": 911 |
| }, |
| { |
| "epoch": 5.296950240770466, |
| "grad_norm": 0.7767976367343669, |
| "learning_rate": 6.804057121616714e-06, |
| "loss": 0.1437, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14329108595848083, |
| "step": 3300, |
| "valid_targets_mean": 2415.2, |
| "valid_targets_min": 756 |
| }, |
| { |
| "epoch": 5.304975922953451, |
| "grad_norm": 0.9041112781790765, |
| "learning_rate": 6.744001690462922e-06, |
| "loss": 0.1439, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17742100358009338, |
| "step": 3305, |
| "valid_targets_mean": 2027.3, |
| "valid_targets_min": 658 |
| }, |
| { |
| "epoch": 5.313001605136437, |
| "grad_norm": 0.8736023871852377, |
| "learning_rate": 6.684158678434707e-06, |
| "loss": 0.1406, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14842301607131958, |
| "step": 3310, |
| "valid_targets_mean": 2091.2, |
| "valid_targets_min": 777 |
| }, |
| { |
| "epoch": 5.321027287319422, |
| "grad_norm": 0.7618181166503121, |
| "learning_rate": 6.624529044479109e-06, |
| "loss": 0.1476, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1443331241607666, |
| "step": 3315, |
| "valid_targets_mean": 2625.0, |
| "valid_targets_min": 657 |
| }, |
| { |
| "epoch": 5.329052969502408, |
| "grad_norm": 0.8555745405542319, |
| "learning_rate": 6.565113744123901e-06, |
| "loss": 0.1364, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1390853226184845, |
| "step": 3320, |
| "valid_targets_mean": 2440.4, |
| "valid_targets_min": 679 |
| }, |
| { |
| "epoch": 5.337078651685394, |
| "grad_norm": 0.8485080262580758, |
| "learning_rate": 6.50591372946231e-06, |
| "loss": 0.1467, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15979576110839844, |
| "step": 3325, |
| "valid_targets_mean": 2120.2, |
| "valid_targets_min": 741 |
| }, |
| { |
| "epoch": 5.345104333868379, |
| "grad_norm": 0.9223840058497179, |
| "learning_rate": 6.446929949137748e-06, |
| "loss": 0.1387, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.13735276460647583, |
| "step": 3330, |
| "valid_targets_mean": 1705.1, |
| "valid_targets_min": 890 |
| }, |
| { |
| "epoch": 5.353130016051364, |
| "grad_norm": 0.831007979180398, |
| "learning_rate": 6.388163348328582e-06, |
| "loss": 0.1461, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.13778018951416016, |
| "step": 3335, |
| "valid_targets_mean": 1862.8, |
| "valid_targets_min": 848 |
| }, |
| { |
| "epoch": 5.36115569823435, |
| "grad_norm": 0.8576931373884364, |
| "learning_rate": 6.329614868733038e-06, |
| "loss": 0.1345, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.12894180417060852, |
| "step": 3340, |
| "valid_targets_mean": 1832.2, |
| "valid_targets_min": 504 |
| }, |
| { |
| "epoch": 5.369181380417335, |
| "grad_norm": 0.9081132027537362, |
| "learning_rate": 6.271285448554072e-06, |
| "loss": 0.148, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1540372371673584, |
| "step": 3345, |
| "valid_targets_mean": 2121.2, |
| "valid_targets_min": 827 |
| }, |
| { |
| "epoch": 5.377207062600321, |
| "grad_norm": 0.7729268997973129, |
| "learning_rate": 6.213176022484353e-06, |
| "loss": 0.1397, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.13177214562892914, |
| "step": 3350, |
| "valid_targets_mean": 2114.1, |
| "valid_targets_min": 953 |
| }, |
| { |
| "epoch": 5.385232744783306, |
| "grad_norm": 0.9645437263591448, |
| "learning_rate": 6.1552875216912866e-06, |
| "loss": 0.1399, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14385467767715454, |
| "step": 3355, |
| "valid_targets_mean": 1654.4, |
| "valid_targets_min": 742 |
| }, |
| { |
| "epoch": 5.393258426966292, |
| "grad_norm": 0.8829811829270534, |
| "learning_rate": 6.097620873802068e-06, |
| "loss": 0.1424, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14625263214111328, |
| "step": 3360, |
| "valid_targets_mean": 2065.6, |
| "valid_targets_min": 612 |
| }, |
| { |
| "epoch": 5.401284109149278, |
| "grad_norm": 0.8201170172984508, |
| "learning_rate": 6.0401770028888675e-06, |
| "loss": 0.1441, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.13578824698925018, |
| "step": 3365, |
| "valid_targets_mean": 1911.6, |
| "valid_targets_min": 776 |
| }, |
| { |
| "epoch": 5.409309791332263, |
| "grad_norm": 0.7807754561817747, |
| "learning_rate": 5.982956829453965e-06, |
| "loss": 0.1364, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14298827946186066, |
| "step": 3370, |
| "valid_targets_mean": 2299.7, |
| "valid_targets_min": 826 |
| }, |
| { |
| "epoch": 5.417335473515249, |
| "grad_norm": 0.8242125235152692, |
| "learning_rate": 5.925961270415042e-06, |
| "loss": 0.145, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14364124834537506, |
| "step": 3375, |
| "valid_targets_mean": 1832.5, |
| "valid_targets_min": 734 |
| }, |
| { |
| "epoch": 5.425361155698234, |
| "grad_norm": 0.8447270823261972, |
| "learning_rate": 5.8691912390904815e-06, |
| "loss": 0.1437, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15039601922035217, |
| "step": 3380, |
| "valid_targets_mean": 2066.4, |
| "valid_targets_min": 730 |
| }, |
| { |
| "epoch": 5.43338683788122, |
| "grad_norm": 0.9092987692988171, |
| "learning_rate": 5.812647645184704e-06, |
| "loss": 0.1417, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15466216206550598, |
| "step": 3385, |
| "valid_targets_mean": 1961.2, |
| "valid_targets_min": 933 |
| }, |
| { |
| "epoch": 5.441412520064206, |
| "grad_norm": 0.8683991460939533, |
| "learning_rate": 5.756331394773624e-06, |
| "loss": 0.1462, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15245194733142853, |
| "step": 3390, |
| "valid_targets_mean": 1784.2, |
| "valid_targets_min": 655 |
| }, |
| { |
| "epoch": 5.449438202247191, |
| "grad_norm": 0.892968643755484, |
| "learning_rate": 5.7002433902901276e-06, |
| "loss": 0.1488, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15332868695259094, |
| "step": 3395, |
| "valid_targets_mean": 1742.7, |
| "valid_targets_min": 816 |
| }, |
| { |
| "epoch": 5.457463884430177, |
| "grad_norm": 0.7642059744988553, |
| "learning_rate": 5.644384530509574e-06, |
| "loss": 0.1413, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14609497785568237, |
| "step": 3400, |
| "valid_targets_mean": 2508.6, |
| "valid_targets_min": 1018 |
| }, |
| { |
| "epoch": 5.465489566613162, |
| "grad_norm": 0.8768706215913115, |
| "learning_rate": 5.588755710535452e-06, |
| "loss": 0.1432, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14894311130046844, |
| "step": 3405, |
| "valid_targets_mean": 1854.5, |
| "valid_targets_min": 621 |
| }, |
| { |
| "epoch": 5.473515248796148, |
| "grad_norm": 0.7918482061402888, |
| "learning_rate": 5.533357821784991e-06, |
| "loss": 0.1558, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.20110508799552917, |
| "step": 3410, |
| "valid_targets_mean": 2252.2, |
| "valid_targets_min": 591 |
| }, |
| { |
| "epoch": 5.481540930979134, |
| "grad_norm": 0.6880735681435827, |
| "learning_rate": 5.47819175197488e-06, |
| "loss": 0.1483, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14852222800254822, |
| "step": 3415, |
| "valid_targets_mean": 3205.2, |
| "valid_targets_min": 708 |
| }, |
| { |
| "epoch": 5.489566613162118, |
| "grad_norm": 0.6767067170795432, |
| "learning_rate": 5.42325838510708e-06, |
| "loss": 0.1366, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.11822806298732758, |
| "step": 3420, |
| "valid_targets_mean": 2824.0, |
| "valid_targets_min": 802 |
| }, |
| { |
| "epoch": 5.497592295345104, |
| "grad_norm": 0.8718548056137807, |
| "learning_rate": 5.3685586014546075e-06, |
| "loss": 0.1433, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1538342833518982, |
| "step": 3425, |
| "valid_targets_mean": 1895.7, |
| "valid_targets_min": 658 |
| }, |
| { |
| "epoch": 5.50561797752809, |
| "grad_norm": 0.8040243257756551, |
| "learning_rate": 5.314093277547465e-06, |
| "loss": 0.1411, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.13354749977588654, |
| "step": 3430, |
| "valid_targets_mean": 2219.4, |
| "valid_targets_min": 776 |
| }, |
| { |
| "epoch": 5.513643659711075, |
| "grad_norm": 0.8548517241885055, |
| "learning_rate": 5.259863286158591e-06, |
| "loss": 0.1438, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.13882416486740112, |
| "step": 3435, |
| "valid_targets_mean": 2167.7, |
| "valid_targets_min": 887 |
| }, |
| { |
| "epoch": 5.521669341894061, |
| "grad_norm": 0.8964297825625066, |
| "learning_rate": 5.205869496289846e-06, |
| "loss": 0.1504, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1575285792350769, |
| "step": 3440, |
| "valid_targets_mean": 1769.5, |
| "valid_targets_min": 720 |
| }, |
| { |
| "epoch": 5.529695024077046, |
| "grad_norm": 0.7937327005355985, |
| "learning_rate": 5.152112773158125e-06, |
| "loss": 0.1341, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14235813915729523, |
| "step": 3445, |
| "valid_targets_mean": 2031.9, |
| "valid_targets_min": 851 |
| }, |
| { |
| "epoch": 5.537720706260032, |
| "grad_norm": 0.8719446158769936, |
| "learning_rate": 5.0985939781814765e-06, |
| "loss": 0.1442, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1630193591117859, |
| "step": 3450, |
| "valid_targets_mean": 1731.4, |
| "valid_targets_min": 629 |
| }, |
| { |
| "epoch": 5.545746388443018, |
| "grad_norm": 0.8295730035601938, |
| "learning_rate": 5.045313968965282e-06, |
| "loss": 0.1346, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14717170596122742, |
| "step": 3455, |
| "valid_targets_mean": 1955.8, |
| "valid_targets_min": 950 |
| }, |
| { |
| "epoch": 5.553772070626003, |
| "grad_norm": 0.8964496498020716, |
| "learning_rate": 4.992273599288546e-06, |
| "loss": 0.1451, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14559556543827057, |
| "step": 3460, |
| "valid_targets_mean": 1855.2, |
| "valid_targets_min": 737 |
| }, |
| { |
| "epoch": 5.561797752808989, |
| "grad_norm": 0.8774241059648222, |
| "learning_rate": 4.9394737190902e-06, |
| "loss": 0.1486, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16202348470687866, |
| "step": 3465, |
| "valid_targets_mean": 2333.4, |
| "valid_targets_min": 727 |
| }, |
| { |
| "epoch": 5.569823434991974, |
| "grad_norm": 0.7667078264832548, |
| "learning_rate": 4.88691517445546e-06, |
| "loss": 0.1352, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1312371790409088, |
| "step": 3470, |
| "valid_targets_mean": 1970.1, |
| "valid_targets_min": 1011 |
| }, |
| { |
| "epoch": 5.57784911717496, |
| "grad_norm": 0.8467942832579569, |
| "learning_rate": 4.834598807602317e-06, |
| "loss": 0.1495, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.13902528584003448, |
| "step": 3475, |
| "valid_targets_mean": 1953.3, |
| "valid_targets_min": 728 |
| }, |
| { |
| "epoch": 5.585874799357946, |
| "grad_norm": 1.1418994519461927, |
| "learning_rate": 4.78252545686799e-06, |
| "loss": 0.143, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.13345175981521606, |
| "step": 3480, |
| "valid_targets_mean": 1804.4, |
| "valid_targets_min": 782 |
| }, |
| { |
| "epoch": 5.593900481540931, |
| "grad_norm": 0.829765999744519, |
| "learning_rate": 4.730695956695532e-06, |
| "loss": 0.1474, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14543312788009644, |
| "step": 3485, |
| "valid_targets_mean": 1963.8, |
| "valid_targets_min": 1141 |
| }, |
| { |
| "epoch": 5.601926163723917, |
| "grad_norm": 0.8564170677263149, |
| "learning_rate": 4.679111137620442e-06, |
| "loss": 0.1498, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14116448163986206, |
| "step": 3490, |
| "valid_targets_mean": 1803.9, |
| "valid_targets_min": 837 |
| }, |
| { |
| "epoch": 5.609951845906902, |
| "grad_norm": 0.9258578493411536, |
| "learning_rate": 4.627771826257341e-06, |
| "loss": 0.1444, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15053588151931763, |
| "step": 3495, |
| "valid_targets_mean": 1818.8, |
| "valid_targets_min": 920 |
| }, |
| { |
| "epoch": 5.617977528089888, |
| "grad_norm": 0.7635041251336951, |
| "learning_rate": 4.576678845286757e-06, |
| "loss": 0.1391, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.13723108172416687, |
| "step": 3500, |
| "valid_targets_mean": 2557.6, |
| "valid_targets_min": 679 |
| }, |
| { |
| "epoch": 5.626003210272874, |
| "grad_norm": 0.720755360308493, |
| "learning_rate": 4.525833013441931e-06, |
| "loss": 0.1348, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1270107477903366, |
| "step": 3505, |
| "valid_targets_mean": 2256.1, |
| "valid_targets_min": 716 |
| }, |
| { |
| "epoch": 5.634028892455858, |
| "grad_norm": 0.8869362920498091, |
| "learning_rate": 4.475235145495669e-06, |
| "loss": 0.1374, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1467820107936859, |
| "step": 3510, |
| "valid_targets_mean": 1817.4, |
| "valid_targets_min": 522 |
| }, |
| { |
| "epoch": 5.642054574638844, |
| "grad_norm": 0.8025610722259726, |
| "learning_rate": 4.424886052247339e-06, |
| "loss": 0.1397, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.13881070911884308, |
| "step": 3515, |
| "valid_targets_mean": 1964.7, |
| "valid_targets_min": 721 |
| }, |
| { |
| "epoch": 5.65008025682183, |
| "grad_norm": 0.7037787309221992, |
| "learning_rate": 4.374786540509821e-06, |
| "loss": 0.1404, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.13750547170639038, |
| "step": 3520, |
| "valid_targets_mean": 2488.4, |
| "valid_targets_min": 1306 |
| }, |
| { |
| "epoch": 5.658105939004815, |
| "grad_norm": 0.8339701185276572, |
| "learning_rate": 4.324937413096628e-06, |
| "loss": 0.1471, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14046938717365265, |
| "step": 3525, |
| "valid_targets_mean": 1705.5, |
| "valid_targets_min": 657 |
| }, |
| { |
| "epoch": 5.666131621187801, |
| "grad_norm": 0.7586982214483773, |
| "learning_rate": 4.275339468809019e-06, |
| "loss": 0.138, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.13911622762680054, |
| "step": 3530, |
| "valid_targets_mean": 2551.6, |
| "valid_targets_min": 1126 |
| }, |
| { |
| "epoch": 5.674157303370786, |
| "grad_norm": 0.9119810062418106, |
| "learning_rate": 4.225993502423182e-06, |
| "loss": 0.1477, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1517258733510971, |
| "step": 3535, |
| "valid_targets_mean": 1962.5, |
| "valid_targets_min": 675 |
| }, |
| { |
| "epoch": 5.682182985553772, |
| "grad_norm": 0.8619483579361343, |
| "learning_rate": 4.1769003046775315e-06, |
| "loss": 0.1513, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1552795171737671, |
| "step": 3540, |
| "valid_targets_mean": 1997.1, |
| "valid_targets_min": 950 |
| }, |
| { |
| "epoch": 5.690208667736758, |
| "grad_norm": 0.865824081520984, |
| "learning_rate": 4.128060662260025e-06, |
| "loss": 0.1426, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.13369613885879517, |
| "step": 3545, |
| "valid_targets_mean": 1609.4, |
| "valid_targets_min": 665 |
| }, |
| { |
| "epoch": 5.698234349919743, |
| "grad_norm": 0.7527647909300139, |
| "learning_rate": 4.079475357795535e-06, |
| "loss": 0.1319, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.12556613981723785, |
| "step": 3550, |
| "valid_targets_mean": 2171.1, |
| "valid_targets_min": 960 |
| }, |
| { |
| "epoch": 5.706260032102729, |
| "grad_norm": 1.1716775797352907, |
| "learning_rate": 4.031145169833342e-06, |
| "loss": 0.1429, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.11673303693532944, |
| "step": 3555, |
| "valid_targets_mean": 2320.8, |
| "valid_targets_min": 677 |
| }, |
| { |
| "epoch": 5.714285714285714, |
| "grad_norm": 0.9267941895909233, |
| "learning_rate": 3.9830708728346445e-06, |
| "loss": 0.1409, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15212789177894592, |
| "step": 3560, |
| "valid_targets_mean": 1611.5, |
| "valid_targets_min": 800 |
| }, |
| { |
| "epoch": 5.7223113964687, |
| "grad_norm": 1.0419238252836576, |
| "learning_rate": 3.935253237160132e-06, |
| "loss": 0.1418, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.13419196009635925, |
| "step": 3565, |
| "valid_targets_mean": 1984.1, |
| "valid_targets_min": 794 |
| }, |
| { |
| "epoch": 5.730337078651686, |
| "grad_norm": 0.8798559697698835, |
| "learning_rate": 3.887693029057675e-06, |
| "loss": 0.1396, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1552184522151947, |
| "step": 3570, |
| "valid_targets_mean": 1911.6, |
| "valid_targets_min": 777 |
| }, |
| { |
| "epoch": 5.738362760834671, |
| "grad_norm": 0.8518956486042853, |
| "learning_rate": 3.8403910106500104e-06, |
| "loss": 0.144, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14175641536712646, |
| "step": 3575, |
| "valid_targets_mean": 1880.1, |
| "valid_targets_min": 744 |
| }, |
| { |
| "epoch": 5.746388443017657, |
| "grad_norm": 0.9148318859217006, |
| "learning_rate": 3.7933479399225604e-06, |
| "loss": 0.1481, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1558597981929779, |
| "step": 3580, |
| "valid_targets_mean": 1775.1, |
| "valid_targets_min": 924 |
| }, |
| { |
| "epoch": 5.754414125200642, |
| "grad_norm": 0.8566250351217594, |
| "learning_rate": 3.746564570711266e-06, |
| "loss": 0.1481, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.13671304285526276, |
| "step": 3585, |
| "valid_targets_mean": 1997.3, |
| "valid_targets_min": 662 |
| }, |
| { |
| "epoch": 5.762439807383627, |
| "grad_norm": 0.8092341832129542, |
| "learning_rate": 3.7000416526905026e-06, |
| "loss": 0.1433, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1414514183998108, |
| "step": 3590, |
| "valid_targets_mean": 1647.3, |
| "valid_targets_min": 727 |
| }, |
| { |
| "epoch": 5.770465489566613, |
| "grad_norm": 0.8530070873913949, |
| "learning_rate": 3.6537799313610946e-06, |
| "loss": 0.1427, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.13695083558559418, |
| "step": 3595, |
| "valid_targets_mean": 1496.6, |
| "valid_targets_min": 611 |
| }, |
| { |
| "epoch": 5.778491171749598, |
| "grad_norm": 0.8542613937155389, |
| "learning_rate": 3.607780148038347e-06, |
| "loss": 0.1569, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14914162456989288, |
| "step": 3600, |
| "valid_targets_mean": 2354.6, |
| "valid_targets_min": 933 |
| }, |
| { |
| "epoch": 5.786516853932584, |
| "grad_norm": 0.837623744528209, |
| "learning_rate": 3.5620430398401596e-06, |
| "loss": 0.1437, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.13059459626674652, |
| "step": 3605, |
| "valid_targets_mean": 2035.4, |
| "valid_targets_min": 687 |
| }, |
| { |
| "epoch": 5.79454253611557, |
| "grad_norm": 0.8111804173729541, |
| "learning_rate": 3.5165693396752443e-06, |
| "loss": 0.1361, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1243569403886795, |
| "step": 3610, |
| "valid_targets_mean": 2214.9, |
| "valid_targets_min": 1101 |
| }, |
| { |
| "epoch": 5.802568218298555, |
| "grad_norm": 0.8833303698013306, |
| "learning_rate": 3.471359776231347e-06, |
| "loss": 0.1459, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16278022527694702, |
| "step": 3615, |
| "valid_targets_mean": 1972.5, |
| "valid_targets_min": 882 |
| }, |
| { |
| "epoch": 5.810593900481541, |
| "grad_norm": 0.8415725209000036, |
| "learning_rate": 3.426415073963594e-06, |
| "loss": 0.1447, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1425856500864029, |
| "step": 3620, |
| "valid_targets_mean": 1869.6, |
| "valid_targets_min": 704 |
| }, |
| { |
| "epoch": 5.818619582664526, |
| "grad_norm": 0.9466397913974439, |
| "learning_rate": 3.3817359530828873e-06, |
| "loss": 0.1463, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1392950862646103, |
| "step": 3625, |
| "valid_targets_mean": 1488.4, |
| "valid_targets_min": 670 |
| }, |
| { |
| "epoch": 5.826645264847512, |
| "grad_norm": 0.8152618375051688, |
| "learning_rate": 3.3373231295443277e-06, |
| "loss": 0.1451, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1470872461795807, |
| "step": 3630, |
| "valid_targets_mean": 2061.8, |
| "valid_targets_min": 874 |
| }, |
| { |
| "epoch": 5.834670947030498, |
| "grad_norm": 0.8554361536678649, |
| "learning_rate": 3.2931773150357893e-06, |
| "loss": 0.1382, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1473013013601303, |
| "step": 3635, |
| "valid_targets_mean": 1860.9, |
| "valid_targets_min": 770 |
| }, |
| { |
| "epoch": 5.842696629213483, |
| "grad_norm": 0.8497228090683818, |
| "learning_rate": 3.2492992169664837e-06, |
| "loss": 0.144, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14080603420734406, |
| "step": 3640, |
| "valid_targets_mean": 1779.9, |
| "valid_targets_min": 1141 |
| }, |
| { |
| "epoch": 5.850722311396469, |
| "grad_norm": 0.8236171503439341, |
| "learning_rate": 3.2056895384556275e-06, |
| "loss": 0.1393, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14260318875312805, |
| "step": 3645, |
| "valid_targets_mean": 1947.2, |
| "valid_targets_min": 1110 |
| }, |
| { |
| "epoch": 5.858747993579454, |
| "grad_norm": 0.8212400811046316, |
| "learning_rate": 3.1623489783211904e-06, |
| "loss": 0.1443, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14351606369018555, |
| "step": 3650, |
| "valid_targets_mean": 1747.2, |
| "valid_targets_min": 945 |
| }, |
| { |
| "epoch": 5.86677367576244, |
| "grad_norm": 0.77766697126824, |
| "learning_rate": 3.1192782310686874e-06, |
| "loss": 0.1418, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1273421049118042, |
| "step": 3655, |
| "valid_targets_mean": 2407.2, |
| "valid_targets_min": 1050 |
| }, |
| { |
| "epoch": 5.874799357945426, |
| "grad_norm": 0.8663557165534255, |
| "learning_rate": 3.0764779868800398e-06, |
| "loss": 0.1489, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17279453575611115, |
| "step": 3660, |
| "valid_targets_mean": 2015.9, |
| "valid_targets_min": 533 |
| }, |
| { |
| "epoch": 5.882825040128411, |
| "grad_norm": 0.8558801380283106, |
| "learning_rate": 3.0339489316025394e-06, |
| "loss": 0.1388, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14702408015727997, |
| "step": 3665, |
| "valid_targets_mean": 2130.3, |
| "valid_targets_min": 824 |
| }, |
| { |
| "epoch": 5.890850722311397, |
| "grad_norm": 0.7505646399517081, |
| "learning_rate": 2.991691746737828e-06, |
| "loss": 0.1499, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.13228633999824524, |
| "step": 3670, |
| "valid_targets_mean": 2391.9, |
| "valid_targets_min": 684 |
| }, |
| { |
| "epoch": 5.898876404494382, |
| "grad_norm": 0.8199757285730112, |
| "learning_rate": 2.949707109431006e-06, |
| "loss": 0.141, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14933696389198303, |
| "step": 3675, |
| "valid_targets_mean": 1866.2, |
| "valid_targets_min": 545 |
| }, |
| { |
| "epoch": 5.906902086677368, |
| "grad_norm": 0.8965249228046941, |
| "learning_rate": 2.907995692459773e-06, |
| "loss": 0.136, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15130048990249634, |
| "step": 3680, |
| "valid_targets_mean": 2021.9, |
| "valid_targets_min": 618 |
| }, |
| { |
| "epoch": 5.914927768860353, |
| "grad_norm": 0.8777238241939872, |
| "learning_rate": 2.8665581642236227e-06, |
| "loss": 0.1419, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1442902833223343, |
| "step": 3685, |
| "valid_targets_mean": 1744.5, |
| "valid_targets_min": 677 |
| }, |
| { |
| "epoch": 5.922953451043338, |
| "grad_norm": 0.8252807172148935, |
| "learning_rate": 2.825395188733169e-06, |
| "loss": 0.1393, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1298397034406662, |
| "step": 3690, |
| "valid_targets_mean": 1682.1, |
| "valid_targets_min": 818 |
| }, |
| { |
| "epoch": 5.930979133226324, |
| "grad_norm": 0.7888917751614268, |
| "learning_rate": 2.784507425599492e-06, |
| "loss": 0.1382, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1363508403301239, |
| "step": 3695, |
| "valid_targets_mean": 1906.1, |
| "valid_targets_min": 741 |
| }, |
| { |
| "epoch": 5.93900481540931, |
| "grad_norm": 0.9105325822568995, |
| "learning_rate": 2.743895530023544e-06, |
| "loss": 0.1386, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.13701778650283813, |
| "step": 3700, |
| "valid_targets_mean": 1610.4, |
| "valid_targets_min": 729 |
| }, |
| { |
| "epoch": 5.947030497592295, |
| "grad_norm": 0.8647716265607804, |
| "learning_rate": 2.7035601527856914e-06, |
| "loss": 0.1338, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.12563112378120422, |
| "step": 3705, |
| "valid_targets_mean": 1931.8, |
| "valid_targets_min": 638 |
| }, |
| { |
| "epoch": 5.955056179775281, |
| "grad_norm": 0.9083802247250276, |
| "learning_rate": 2.6635019402352645e-06, |
| "loss": 0.1429, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14448779821395874, |
| "step": 3710, |
| "valid_targets_mean": 1673.9, |
| "valid_targets_min": 849 |
| }, |
| { |
| "epoch": 5.963081861958266, |
| "grad_norm": 0.6538474603186538, |
| "learning_rate": 2.6237215342801857e-06, |
| "loss": 0.1411, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1227862536907196, |
| "step": 3715, |
| "valid_targets_mean": 3093.8, |
| "valid_targets_min": 973 |
| }, |
| { |
| "epoch": 5.971107544141252, |
| "grad_norm": 0.8126909161583662, |
| "learning_rate": 2.5842195723767205e-06, |
| "loss": 0.1391, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14033716917037964, |
| "step": 3720, |
| "valid_targets_mean": 2245.1, |
| "valid_targets_min": 892 |
| }, |
| { |
| "epoch": 5.979133226324238, |
| "grad_norm": 0.8847974712352168, |
| "learning_rate": 2.544996687519219e-06, |
| "loss": 0.1451, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.147241473197937, |
| "step": 3725, |
| "valid_targets_mean": 1698.0, |
| "valid_targets_min": 1055 |
| }, |
| { |
| "epoch": 5.987158908507223, |
| "grad_norm": 0.823026519904926, |
| "learning_rate": 2.5060535082300266e-06, |
| "loss": 0.1451, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15312634408473969, |
| "step": 3730, |
| "valid_targets_mean": 2188.0, |
| "valid_targets_min": 639 |
| }, |
| { |
| "epoch": 5.995184590690209, |
| "grad_norm": 0.8213365844788153, |
| "learning_rate": 2.467390658549349e-06, |
| "loss": 0.141, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.13517561554908752, |
| "step": 3735, |
| "valid_targets_mean": 2128.8, |
| "valid_targets_min": 797 |
| }, |
| { |
| "epoch": 6.003210272873194, |
| "grad_norm": 0.8196675867105674, |
| "learning_rate": 2.429008758025302e-06, |
| "loss": 0.1359, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.13686616718769073, |
| "step": 3740, |
| "valid_targets_mean": 1792.6, |
| "valid_targets_min": 788 |
| }, |
| { |
| "epoch": 6.01123595505618, |
| "grad_norm": 0.7101099418791215, |
| "learning_rate": 2.3909084217039634e-06, |
| "loss": 0.1278, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.12406958639621735, |
| "step": 3745, |
| "valid_targets_mean": 2482.2, |
| "valid_targets_min": 1025 |
| }, |
| { |
| "epoch": 6.019261637239166, |
| "grad_norm": 0.8233493110334807, |
| "learning_rate": 2.353090260119515e-06, |
| "loss": 0.1353, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.13340730965137482, |
| "step": 3750, |
| "valid_targets_mean": 1969.3, |
| "valid_targets_min": 820 |
| }, |
| { |
| "epoch": 6.027287319422151, |
| "grad_norm": 0.9151878902447068, |
| "learning_rate": 2.3155548792844674e-06, |
| "loss": 0.1265, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.11424959450960159, |
| "step": 3755, |
| "valid_targets_mean": 1564.1, |
| "valid_targets_min": 725 |
| }, |
| { |
| "epoch": 6.035313001605137, |
| "grad_norm": 0.8326440606539028, |
| "learning_rate": 2.27830288067995e-06, |
| "loss": 0.1323, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.13482320308685303, |
| "step": 3760, |
| "valid_targets_mean": 1919.4, |
| "valid_targets_min": 1078 |
| }, |
| { |
| "epoch": 6.043338683788122, |
| "grad_norm": 0.8742588018506022, |
| "learning_rate": 2.241334861246058e-06, |
| "loss": 0.1261, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1303100883960724, |
| "step": 3765, |
| "valid_targets_mean": 1689.5, |
| "valid_targets_min": 697 |
| }, |
| { |
| "epoch": 6.051364365971107, |
| "grad_norm": 0.8283773699034884, |
| "learning_rate": 2.2046514133723075e-06, |
| "loss": 0.126, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.11725350469350815, |
| "step": 3770, |
| "valid_targets_mean": 1564.1, |
| "valid_targets_min": 592 |
| }, |
| { |
| "epoch": 6.059390048154093, |
| "grad_norm": 0.9066721433616125, |
| "learning_rate": 2.1682531248881266e-06, |
| "loss": 0.1336, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.13146190345287323, |
| "step": 3775, |
| "valid_targets_mean": 1457.2, |
| "valid_targets_min": 597 |
| }, |
| { |
| "epoch": 6.067415730337078, |
| "grad_norm": 0.7917186831995832, |
| "learning_rate": 2.1321405790534412e-06, |
| "loss": 0.1238, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14324235916137695, |
| "step": 3780, |
| "valid_targets_mean": 2544.8, |
| "valid_targets_min": 792 |
| }, |
| { |
| "epoch": 6.075441412520064, |
| "grad_norm": 0.7995015410713523, |
| "learning_rate": 2.096314354549334e-06, |
| "loss": 0.1352, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.12818962335586548, |
| "step": 3785, |
| "valid_targets_mean": 1735.4, |
| "valid_targets_min": 682 |
| }, |
| { |
| "epoch": 6.08346709470305, |
| "grad_norm": 0.8043412796343894, |
| "learning_rate": 2.0607750254687554e-06, |
| "loss": 0.1289, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.12518352270126343, |
| "step": 3790, |
| "valid_targets_mean": 2304.7, |
| "valid_targets_min": 625 |
| }, |
| { |
| "epoch": 6.091492776886035, |
| "grad_norm": 0.8688221477476388, |
| "learning_rate": 2.025523161307348e-06, |
| "loss": 0.1364, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1296396106481552, |
| "step": 3795, |
| "valid_targets_mean": 1634.8, |
| "valid_targets_min": 667 |
| }, |
| { |
| "epoch": 6.099518459069021, |
| "grad_norm": 0.9117796677606809, |
| "learning_rate": 1.990559326954307e-06, |
| "loss": 0.1355, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.13730370998382568, |
| "step": 3800, |
| "valid_targets_mean": 1711.1, |
| "valid_targets_min": 700 |
| }, |
| { |
| "epoch": 6.107544141252006, |
| "grad_norm": 0.721550972186035, |
| "learning_rate": 1.955884082683317e-06, |
| "loss": 0.13, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1108551174402237, |
| "step": 3805, |
| "valid_targets_mean": 2403.3, |
| "valid_targets_min": 892 |
| }, |
| { |
| "epoch": 6.115569823434992, |
| "grad_norm": 0.8248557024007874, |
| "learning_rate": 1.9214979841435967e-06, |
| "loss": 0.1322, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.13973233103752136, |
| "step": 3810, |
| "valid_targets_mean": 2137.4, |
| "valid_targets_min": 669 |
| }, |
| { |
| "epoch": 6.123595505617978, |
| "grad_norm": 0.8121793695204608, |
| "learning_rate": 1.8874015823509873e-06, |
| "loss": 0.1245, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.12547042965888977, |
| "step": 3815, |
| "valid_targets_mean": 2604.6, |
| "valid_targets_min": 797 |
| }, |
| { |
| "epoch": 6.131621187800963, |
| "grad_norm": 0.7351257868663279, |
| "learning_rate": 1.8535954236791044e-06, |
| "loss": 0.1326, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.12898236513137817, |
| "step": 3820, |
| "valid_targets_mean": 2703.9, |
| "valid_targets_min": 765 |
| }, |
| { |
| "epoch": 6.139646869983949, |
| "grad_norm": 0.8858783243545603, |
| "learning_rate": 1.8200800498506166e-06, |
| "loss": 0.1352, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15943001210689545, |
| "step": 3825, |
| "valid_targets_mean": 1791.6, |
| "valid_targets_min": 891 |
| }, |
| { |
| "epoch": 6.147672552166934, |
| "grad_norm": 0.8144635580836179, |
| "learning_rate": 1.7868559979285293e-06, |
| "loss": 0.1263, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.12163649499416351, |
| "step": 3830, |
| "valid_targets_mean": 1813.3, |
| "valid_targets_min": 796 |
| }, |
| { |
| "epoch": 6.15569823434992, |
| "grad_norm": 0.8011893230062246, |
| "learning_rate": 1.7539238003076087e-06, |
| "loss": 0.1291, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.13179343938827515, |
| "step": 3835, |
| "valid_targets_mean": 2422.9, |
| "valid_targets_min": 1109 |
| }, |
| { |
| "epoch": 6.163723916532906, |
| "grad_norm": 0.9556250644794508, |
| "learning_rate": 1.721283984705835e-06, |
| "loss": 0.1318, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14184167981147766, |
| "step": 3840, |
| "valid_targets_mean": 1440.4, |
| "valid_targets_min": 728 |
| }, |
| { |
| "epoch": 6.171749598715891, |
| "grad_norm": 0.7764479036008669, |
| "learning_rate": 1.6889370741559407e-06, |
| "loss": 0.1274, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1197129637002945, |
| "step": 3845, |
| "valid_targets_mean": 2076.1, |
| "valid_targets_min": 672 |
| }, |
| { |
| "epoch": 6.179775280898877, |
| "grad_norm": 0.7481548950692756, |
| "learning_rate": 1.6568835869970445e-06, |
| "loss": 0.1306, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.13337062299251556, |
| "step": 3850, |
| "valid_targets_mean": 2484.6, |
| "valid_targets_min": 789 |
| }, |
| { |
| "epoch": 6.187800963081862, |
| "grad_norm": 0.821740266972904, |
| "learning_rate": 1.625124036866339e-06, |
| "loss": 0.1337, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14121049642562866, |
| "step": 3855, |
| "valid_targets_mean": 2158.6, |
| "valid_targets_min": 830 |
| }, |
| { |
| "epoch": 6.195826645264847, |
| "grad_norm": 0.8251617106369992, |
| "learning_rate": 1.5936589326908513e-06, |
| "loss": 0.141, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1286158710718155, |
| "step": 3860, |
| "valid_targets_mean": 1933.1, |
| "valid_targets_min": 798 |
| }, |
| { |
| "epoch": 6.203852327447833, |
| "grad_norm": 0.9413267314341657, |
| "learning_rate": 1.5624887786793008e-06, |
| "loss": 0.1339, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.13531285524368286, |
| "step": 3865, |
| "valid_targets_mean": 1385.5, |
| "valid_targets_min": 655 |
| }, |
| { |
| "epoch": 6.211878009630818, |
| "grad_norm": 0.8800324368070407, |
| "learning_rate": 1.531614074314014e-06, |
| "loss": 0.1365, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.13416577875614166, |
| "step": 3870, |
| "valid_targets_mean": 2019.1, |
| "valid_targets_min": 729 |
| }, |
| { |
| "epoch": 6.219903691813804, |
| "grad_norm": 0.9054587413802373, |
| "learning_rate": 1.501035314342918e-06, |
| "loss": 0.1327, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.13169649243354797, |
| "step": 3875, |
| "valid_targets_mean": 1469.8, |
| "valid_targets_min": 715 |
| }, |
| { |
| "epoch": 6.22792937399679, |
| "grad_norm": 0.8324924083699635, |
| "learning_rate": 1.4707529887716177e-06, |
| "loss": 0.1258, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1314225196838379, |
| "step": 3880, |
| "valid_targets_mean": 1870.7, |
| "valid_targets_min": 691 |
| }, |
| { |
| "epoch": 6.235955056179775, |
| "grad_norm": 0.757807099087046, |
| "learning_rate": 1.4407675828555378e-06, |
| "loss": 0.1295, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.13538961112499237, |
| "step": 3885, |
| "valid_targets_mean": 2662.4, |
| "valid_targets_min": 549 |
| }, |
| { |
| "epoch": 6.243980738362761, |
| "grad_norm": 0.9112108378646868, |
| "learning_rate": 1.4110795770921536e-06, |
| "loss": 0.1317, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14746998250484467, |
| "step": 3890, |
| "valid_targets_mean": 1878.4, |
| "valid_targets_min": 629 |
| }, |
| { |
| "epoch": 6.252006420545746, |
| "grad_norm": 0.8130635027374573, |
| "learning_rate": 1.3816894472132903e-06, |
| "loss": 0.1308, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1274118721485138, |
| "step": 3895, |
| "valid_targets_mean": 2159.9, |
| "valid_targets_min": 868 |
| }, |
| { |
| "epoch": 6.260032102728732, |
| "grad_norm": 0.8766350494372456, |
| "learning_rate": 1.3525976641774862e-06, |
| "loss": 0.1268, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.12585480511188507, |
| "step": 3900, |
| "valid_targets_mean": 1828.7, |
| "valid_targets_min": 684 |
| }, |
| { |
| "epoch": 6.268057784911718, |
| "grad_norm": 0.8414903174334402, |
| "learning_rate": 1.3238046941624694e-06, |
| "loss": 0.1343, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1348039209842682, |
| "step": 3905, |
| "valid_targets_mean": 2230.7, |
| "valid_targets_min": 762 |
| }, |
| { |
| "epoch": 6.276083467094703, |
| "grad_norm": 0.8692836229326116, |
| "learning_rate": 1.295310998557673e-06, |
| "loss": 0.1334, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.13138556480407715, |
| "step": 3910, |
| "valid_targets_mean": 1685.2, |
| "valid_targets_min": 693 |
| }, |
| { |
| "epoch": 6.284109149277689, |
| "grad_norm": 0.9927992924551751, |
| "learning_rate": 1.2671170339568372e-06, |
| "loss": 0.1303, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.12924659252166748, |
| "step": 3915, |
| "valid_targets_mean": 1712.9, |
| "valid_targets_min": 768 |
| }, |
| { |
| "epoch": 6.292134831460674, |
| "grad_norm": 0.8708385582623096, |
| "learning_rate": 1.239223252150703e-06, |
| "loss": 0.1375, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1407126933336258, |
| "step": 3920, |
| "valid_targets_mean": 1895.5, |
| "valid_targets_min": 825 |
| }, |
| { |
| "epoch": 6.30016051364366, |
| "grad_norm": 0.9462826534291934, |
| "learning_rate": 1.211630100119776e-06, |
| "loss": 0.1364, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15399542450904846, |
| "step": 3925, |
| "valid_targets_mean": 1808.5, |
| "valid_targets_min": 701 |
| }, |
| { |
| "epoch": 6.308186195826646, |
| "grad_norm": 0.8338027195464212, |
| "learning_rate": 1.1843380200271426e-06, |
| "loss": 0.1328, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.11450174450874329, |
| "step": 3930, |
| "valid_targets_mean": 1831.6, |
| "valid_targets_min": 557 |
| }, |
| { |
| "epoch": 6.31621187800963, |
| "grad_norm": 0.7844532891368925, |
| "learning_rate": 1.1573474492114122e-06, |
| "loss": 0.1269, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.11957096308469772, |
| "step": 3935, |
| "valid_targets_mean": 2298.2, |
| "valid_targets_min": 760 |
| }, |
| { |
| "epoch": 6.324237560192616, |
| "grad_norm": 0.7148468016806782, |
| "learning_rate": 1.1306588201796863e-06, |
| "loss": 0.1237, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.10497011244297028, |
| "step": 3940, |
| "valid_targets_mean": 2023.3, |
| "valid_targets_min": 567 |
| }, |
| { |
| "epoch": 6.332263242375602, |
| "grad_norm": 0.8075062564380106, |
| "learning_rate": 1.1042725606006388e-06, |
| "loss": 0.144, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15959270298480988, |
| "step": 3945, |
| "valid_targets_mean": 2724.1, |
| "valid_targets_min": 1269 |
| }, |
| { |
| "epoch": 6.340288924558587, |
| "grad_norm": 0.8319131176662817, |
| "learning_rate": 1.078189093297668e-06, |
| "loss": 0.1339, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.13696303963661194, |
| "step": 3950, |
| "valid_targets_mean": 2162.0, |
| "valid_targets_min": 735 |
| }, |
| { |
| "epoch": 6.348314606741573, |
| "grad_norm": 0.777206520799545, |
| "learning_rate": 1.0524088362421048e-06, |
| "loss": 0.1237, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.12403260171413422, |
| "step": 3955, |
| "valid_targets_mean": 2233.1, |
| "valid_targets_min": 613 |
| }, |
| { |
| "epoch": 6.356340288924558, |
| "grad_norm": 0.7451807347978312, |
| "learning_rate": 1.0269322025465334e-06, |
| "loss": 0.1308, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.13250204920768738, |
| "step": 3960, |
| "valid_targets_mean": 2690.4, |
| "valid_targets_min": 626 |
| }, |
| { |
| "epoch": 6.364365971107544, |
| "grad_norm": 0.8253339601537156, |
| "learning_rate": 1.0017596004581564e-06, |
| "loss": 0.1295, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1278865784406662, |
| "step": 3965, |
| "valid_targets_mean": 1848.6, |
| "valid_targets_min": 800 |
| }, |
| { |
| "epoch": 6.37239165329053, |
| "grad_norm": 0.8584721668386178, |
| "learning_rate": 9.768914333522584e-07, |
| "loss": 0.1289, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.13879048824310303, |
| "step": 3970, |
| "valid_targets_mean": 1834.6, |
| "valid_targets_min": 926 |
| }, |
| { |
| "epoch": 6.380417335473515, |
| "grad_norm": 0.8283576544061164, |
| "learning_rate": 9.5232809972575e-07, |
| "loss": 0.1309, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.13557694852352142, |
| "step": 3975, |
| "valid_targets_mean": 1815.6, |
| "valid_targets_min": 998 |
| }, |
| { |
| "epoch": 6.388443017656501, |
| "grad_norm": 0.8748562146778729, |
| "learning_rate": 9.280699931907633e-07, |
| "loss": 0.1415, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15249726176261902, |
| "step": 3980, |
| "valid_targets_mean": 2136.6, |
| "valid_targets_min": 657 |
| }, |
| { |
| "epoch": 6.396468699839486, |
| "grad_norm": 0.777927436115682, |
| "learning_rate": 9.04117502468369e-07, |
| "loss": 0.1327, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14238354563713074, |
| "step": 3985, |
| "valid_targets_mean": 2248.8, |
| "valid_targets_min": 689 |
| }, |
| { |
| "epoch": 6.404494382022472, |
| "grad_norm": 0.8043827719833165, |
| "learning_rate": 8.804710113823311e-07, |
| "loss": 0.126, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.12348157912492752, |
| "step": 3990, |
| "valid_targets_mean": 1787.2, |
| "valid_targets_min": 734 |
| }, |
| { |
| "epoch": 6.412520064205458, |
| "grad_norm": 0.9862275060605692, |
| "learning_rate": 8.571308988529492e-07, |
| "loss": 0.1288, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.13508912920951843, |
| "step": 3995, |
| "valid_targets_mean": 1392.4, |
| "valid_targets_min": 696 |
| }, |
| { |
| "epoch": 6.420545746388443, |
| "grad_norm": 0.8431627989023698, |
| "learning_rate": 8.3409753889101e-07, |
| "loss": 0.1318, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.13289272785186768, |
| "step": 4000, |
| "valid_targets_mean": 1806.3, |
| "valid_targets_min": 709 |
| }, |
| { |
| "epoch": 6.428571428571429, |
| "grad_norm": 0.8239565380374946, |
| "learning_rate": 8.11371300591779e-07, |
| "loss": 0.1286, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.13981223106384277, |
| "step": 4005, |
| "valid_targets_mean": 2153.0, |
| "valid_targets_min": 1102 |
| }, |
| { |
| "epoch": 6.436597110754414, |
| "grad_norm": 0.9432509501592777, |
| "learning_rate": 7.889525481290805e-07, |
| "loss": 0.1366, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1455557495355606, |
| "step": 4010, |
| "valid_targets_mean": 1852.8, |
| "valid_targets_min": 819 |
| }, |
| { |
| "epoch": 6.4446227929374, |
| "grad_norm": 0.9014367927531765, |
| "learning_rate": 7.668416407494761e-07, |
| "loss": 0.1351, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.13227035105228424, |
| "step": 4015, |
| "valid_targets_mean": 1789.1, |
| "valid_targets_min": 793 |
| }, |
| { |
| "epoch": 6.452648475120386, |
| "grad_norm": 0.8171835228507035, |
| "learning_rate": 7.450389327665042e-07, |
| "loss": 0.1291, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.13154827058315277, |
| "step": 4020, |
| "valid_targets_mean": 2095.6, |
| "valid_targets_min": 752 |
| }, |
| { |
| "epoch": 6.460674157303371, |
| "grad_norm": 0.7683854828646659, |
| "learning_rate": 7.235447735549895e-07, |
| "loss": 0.132, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.13109341263771057, |
| "step": 4025, |
| "valid_targets_mean": 2461.7, |
| "valid_targets_min": 788 |
| }, |
| { |
| "epoch": 6.468699839486356, |
| "grad_norm": 0.9022184794419694, |
| "learning_rate": 7.02359507545467e-07, |
| "loss": 0.1365, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.13602422177791595, |
| "step": 4030, |
| "valid_targets_mean": 1908.5, |
| "valid_targets_min": 809 |
| }, |
| { |
| "epoch": 6.476725521669342, |
| "grad_norm": 0.8680280298928634, |
| "learning_rate": 6.814834742186361e-07, |
| "loss": 0.1288, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.13595837354660034, |
| "step": 4035, |
| "valid_targets_mean": 1791.1, |
| "valid_targets_min": 708 |
| }, |
| { |
| "epoch": 6.484751203852327, |
| "grad_norm": 0.8624861818881404, |
| "learning_rate": 6.60917008099946e-07, |
| "loss": 0.1384, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.13239216804504395, |
| "step": 4040, |
| "valid_targets_mean": 1472.7, |
| "valid_targets_min": 909 |
| }, |
| { |
| "epoch": 6.492776886035313, |
| "grad_norm": 0.8372254606922392, |
| "learning_rate": 6.406604387542259e-07, |
| "loss": 0.1348, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.12756837904453278, |
| "step": 4045, |
| "valid_targets_mean": 1802.8, |
| "valid_targets_min": 638 |
| }, |
| { |
| "epoch": 6.500802568218298, |
| "grad_norm": 0.8845183639085258, |
| "learning_rate": 6.207140907803877e-07, |
| "loss": 0.1341, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.11851681768894196, |
| "step": 4050, |
| "valid_targets_mean": 1879.1, |
| "valid_targets_min": 687 |
| }, |
| { |
| "epoch": 6.508828250401284, |
| "grad_norm": 0.9939476432578076, |
| "learning_rate": 6.010782838062534e-07, |
| "loss": 0.1363, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16492959856987, |
| "step": 4055, |
| "valid_targets_mean": 1637.2, |
| "valid_targets_min": 680 |
| }, |
| { |
| "epoch": 6.51685393258427, |
| "grad_norm": 0.7876122251990382, |
| "learning_rate": 5.817533324834146e-07, |
| "loss": 0.1364, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1363506019115448, |
| "step": 4060, |
| "valid_targets_mean": 1869.1, |
| "valid_targets_min": 648 |
| }, |
| { |
| "epoch": 6.524879614767255, |
| "grad_norm": 0.8344114489032715, |
| "learning_rate": 5.627395464821894e-07, |
| "loss": 0.1343, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.140853613615036, |
| "step": 4065, |
| "valid_targets_mean": 2610.0, |
| "valid_targets_min": 1355 |
| }, |
| { |
| "epoch": 6.532905296950241, |
| "grad_norm": 0.6902659152306734, |
| "learning_rate": 5.440372304866692e-07, |
| "loss": 0.1336, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.13164812326431274, |
| "step": 4070, |
| "valid_targets_mean": 3041.7, |
| "valid_targets_min": 883 |
| }, |
| { |
| "epoch": 6.540930979133226, |
| "grad_norm": 0.7503481708658517, |
| "learning_rate": 5.256466841898334e-07, |
| "loss": 0.1332, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.13292858004570007, |
| "step": 4075, |
| "valid_targets_mean": 2455.9, |
| "valid_targets_min": 1030 |
| }, |
| { |
| "epoch": 6.548956661316212, |
| "grad_norm": 0.7994462646941594, |
| "learning_rate": 5.075682022887441e-07, |
| "loss": 0.1444, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1420678347349167, |
| "step": 4080, |
| "valid_targets_mean": 2302.2, |
| "valid_targets_min": 823 |
| }, |
| { |
| "epoch": 6.556982343499198, |
| "grad_norm": 0.8804572670066306, |
| "learning_rate": 4.898020744798282e-07, |
| "loss": 0.1324, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14195245504379272, |
| "step": 4085, |
| "valid_targets_mean": 2165.8, |
| "valid_targets_min": 1104 |
| }, |
| { |
| "epoch": 6.565008025682183, |
| "grad_norm": 0.7713249621956143, |
| "learning_rate": 4.7234858545422536e-07, |
| "loss": 0.1336, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.12661638855934143, |
| "step": 4090, |
| "valid_targets_mean": 2549.3, |
| "valid_targets_min": 1000 |
| }, |
| { |
| "epoch": 6.573033707865169, |
| "grad_norm": 0.8013666556551141, |
| "learning_rate": 4.552080148932425e-07, |
| "loss": 0.1351, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1386134922504425, |
| "step": 4095, |
| "valid_targets_mean": 2510.6, |
| "valid_targets_min": 882 |
| }, |
| { |
| "epoch": 6.581059390048154, |
| "grad_norm": 0.9379662069494056, |
| "learning_rate": 4.383806374638555e-07, |
| "loss": 0.1278, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1294247806072235, |
| "step": 4100, |
| "valid_targets_mean": 1812.6, |
| "valid_targets_min": 715 |
| }, |
| { |
| "epoch": 6.589085072231139, |
| "grad_norm": 0.8157148561089532, |
| "learning_rate": 4.2186672281432363e-07, |
| "loss": 0.1343, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.12697714567184448, |
| "step": 4105, |
| "valid_targets_mean": 2067.0, |
| "valid_targets_min": 686 |
| }, |
| { |
| "epoch": 6.597110754414125, |
| "grad_norm": 0.8532772772866162, |
| "learning_rate": 4.056665355698508e-07, |
| "loss": 0.1403, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15566185116767883, |
| "step": 4110, |
| "valid_targets_mean": 1932.4, |
| "valid_targets_min": 765 |
| }, |
| { |
| "epoch": 6.60513643659711, |
| "grad_norm": 0.7347366895405252, |
| "learning_rate": 3.89780335328358e-07, |
| "loss": 0.1256, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1240445151925087, |
| "step": 4115, |
| "valid_targets_mean": 2558.4, |
| "valid_targets_min": 698 |
| }, |
| { |
| "epoch": 6.613162118780096, |
| "grad_norm": 0.7844171389786991, |
| "learning_rate": 3.7420837665632205e-07, |
| "loss": 0.1321, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1311158537864685, |
| "step": 4120, |
| "valid_targets_mean": 2435.1, |
| "valid_targets_min": 993 |
| }, |
| { |
| "epoch": 6.621187800963082, |
| "grad_norm": 1.016494260012105, |
| "learning_rate": 3.5895090908469433e-07, |
| "loss": 0.1365, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.13737598061561584, |
| "step": 4125, |
| "valid_targets_mean": 2182.8, |
| "valid_targets_min": 1001 |
| }, |
| { |
| "epoch": 6.629213483146067, |
| "grad_norm": 0.7662698129244558, |
| "learning_rate": 3.4400817710489754e-07, |
| "loss": 0.1314, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.13481801748275757, |
| "step": 4130, |
| "valid_targets_mean": 2539.6, |
| "valid_targets_min": 650 |
| }, |
| { |
| "epoch": 6.637239165329053, |
| "grad_norm": 0.8804946515187855, |
| "learning_rate": 3.293804201649131e-07, |
| "loss": 0.1363, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14753307402133942, |
| "step": 4135, |
| "valid_targets_mean": 1763.6, |
| "valid_targets_min": 779 |
| }, |
| { |
| "epoch": 6.645264847512038, |
| "grad_norm": 0.8509011624485113, |
| "learning_rate": 3.1506787266545104e-07, |
| "loss": 0.1369, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.13469921052455902, |
| "step": 4140, |
| "valid_targets_mean": 1757.4, |
| "valid_targets_min": 809 |
| }, |
| { |
| "epoch": 6.653290529695024, |
| "grad_norm": 0.7972105200462379, |
| "learning_rate": 3.010707639561727e-07, |
| "loss": 0.1276, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.11612634360790253, |
| "step": 4145, |
| "valid_targets_mean": 2148.2, |
| "valid_targets_min": 612 |
| }, |
| { |
| "epoch": 6.66131621187801, |
| "grad_norm": 0.8607825669685812, |
| "learning_rate": 2.873893183320431e-07, |
| "loss": 0.1368, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1409863531589508, |
| "step": 4150, |
| "valid_targets_mean": 1988.0, |
| "valid_targets_min": 621 |
| }, |
| { |
| "epoch": 6.669341894060995, |
| "grad_norm": 0.8114169187350514, |
| "learning_rate": 2.740237550297131e-07, |
| "loss": 0.1414, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1218997910618782, |
| "step": 4155, |
| "valid_targets_mean": 2225.8, |
| "valid_targets_min": 522 |
| }, |
| { |
| "epoch": 6.677367576243981, |
| "grad_norm": 0.8553063985701393, |
| "learning_rate": 2.609742882240207e-07, |
| "loss": 0.1457, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1512482464313507, |
| "step": 4160, |
| "valid_targets_mean": 2193.6, |
| "valid_targets_min": 705 |
| }, |
| { |
| "epoch": 6.685393258426966, |
| "grad_norm": 0.7842315608676794, |
| "learning_rate": 2.482411270245533e-07, |
| "loss": 0.1316, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.12290303409099579, |
| "step": 4165, |
| "valid_targets_mean": 2215.3, |
| "valid_targets_min": 820 |
| }, |
| { |
| "epoch": 6.693418940609952, |
| "grad_norm": 0.8288014529828364, |
| "learning_rate": 2.358244754722927e-07, |
| "loss": 0.1354, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.13061775267124176, |
| "step": 4170, |
| "valid_targets_mean": 1987.8, |
| "valid_targets_min": 695 |
| }, |
| { |
| "epoch": 6.701444622792938, |
| "grad_norm": 0.7471758228205548, |
| "learning_rate": 2.2372453253635796e-07, |
| "loss": 0.1373, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.12854477763175964, |
| "step": 4175, |
| "valid_targets_mean": 2526.5, |
| "valid_targets_min": 782 |
| }, |
| { |
| "epoch": 6.709470304975923, |
| "grad_norm": 0.9506746700643623, |
| "learning_rate": 2.1194149211080982e-07, |
| "loss": 0.1355, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15296323597431183, |
| "step": 4180, |
| "valid_targets_mean": 1742.1, |
| "valid_targets_min": 765 |
| }, |
| { |
| "epoch": 6.717495987158909, |
| "grad_norm": 0.8755571800580249, |
| "learning_rate": 2.004755430115335e-07, |
| "loss": 0.1353, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14241819083690643, |
| "step": 4185, |
| "valid_targets_mean": 1680.2, |
| "valid_targets_min": 656 |
| }, |
| { |
| "epoch": 6.725521669341894, |
| "grad_norm": 0.8620961091565507, |
| "learning_rate": 1.8932686897323417e-07, |
| "loss": 0.1301, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.12413826584815979, |
| "step": 4190, |
| "valid_targets_mean": 1665.9, |
| "valid_targets_min": 802 |
| }, |
| { |
| "epoch": 6.73354735152488, |
| "grad_norm": 0.8368572454303962, |
| "learning_rate": 1.7849564864647506e-07, |
| "loss": 0.1425, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1286819726228714, |
| "step": 4195, |
| "valid_targets_mean": 2069.0, |
| "valid_targets_min": 1155 |
| }, |
| { |
| "epoch": 6.741573033707866, |
| "grad_norm": 0.8146985305426502, |
| "learning_rate": 1.679820555948264e-07, |
| "loss": 0.1376, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.11927329003810883, |
| "step": 4200, |
| "valid_targets_mean": 1932.9, |
| "valid_targets_min": 661 |
| }, |
| { |
| "epoch": 6.74959871589085, |
| "grad_norm": 0.8866600690370785, |
| "learning_rate": 1.5778625829207196e-07, |
| "loss": 0.1342, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.13215553760528564, |
| "step": 4205, |
| "valid_targets_mean": 1920.4, |
| "valid_targets_min": 635 |
| }, |
| { |
| "epoch": 6.757624398073836, |
| "grad_norm": 0.701924183183066, |
| "learning_rate": 1.4790842011952023e-07, |
| "loss": 0.1314, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.11789841204881668, |
| "step": 4210, |
| "valid_targets_mean": 2835.7, |
| "valid_targets_min": 823 |
| }, |
| { |
| "epoch": 6.765650080256822, |
| "grad_norm": 0.9501322619954992, |
| "learning_rate": 1.3834869936338424e-07, |
| "loss": 0.1312, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1307641565799713, |
| "step": 4215, |
| "valid_targets_mean": 2221.1, |
| "valid_targets_min": 746 |
| }, |
| { |
| "epoch": 6.773675762439807, |
| "grad_norm": 0.8812623724815387, |
| "learning_rate": 1.2910724921224139e-07, |
| "loss": 0.1349, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1285921037197113, |
| "step": 4220, |
| "valid_targets_mean": 1583.2, |
| "valid_targets_min": 788 |
| }, |
| { |
| "epoch": 6.781701444622793, |
| "grad_norm": 0.8385562110933432, |
| "learning_rate": 1.2018421775457978e-07, |
| "loss": 0.1297, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14212295413017273, |
| "step": 4225, |
| "valid_targets_mean": 1936.7, |
| "valid_targets_min": 661 |
| }, |
| { |
| "epoch": 6.789727126805778, |
| "grad_norm": 0.7834916138029038, |
| "learning_rate": 1.115797479764269e-07, |
| "loss": 0.1295, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.12338066846132278, |
| "step": 4230, |
| "valid_targets_mean": 2082.6, |
| "valid_targets_min": 867 |
| }, |
| { |
| "epoch": 6.797752808988764, |
| "grad_norm": 0.8288684199479489, |
| "learning_rate": 1.0329397775905802e-07, |
| "loss": 0.1385, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14609648287296295, |
| "step": 4235, |
| "valid_targets_mean": 2241.5, |
| "valid_targets_min": 611 |
| }, |
| { |
| "epoch": 6.80577849117175, |
| "grad_norm": 0.8404101812550286, |
| "learning_rate": 9.532703987678692e-08, |
| "loss": 0.1322, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15395131707191467, |
| "step": 4240, |
| "valid_targets_mean": 2035.6, |
| "valid_targets_min": 1106 |
| }, |
| { |
| "epoch": 6.813804173354735, |
| "grad_norm": 0.8562736483627456, |
| "learning_rate": 8.767906199483422e-08, |
| "loss": 0.132, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1289074420928955, |
| "step": 4245, |
| "valid_targets_mean": 1866.0, |
| "valid_targets_min": 734 |
| }, |
| { |
| "epoch": 6.821829855537721, |
| "grad_norm": 0.8444371886099169, |
| "learning_rate": 8.0350166667289e-08, |
| "loss": 0.1295, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.12709850072860718, |
| "step": 4250, |
| "valid_targets_mean": 1635.1, |
| "valid_targets_min": 789 |
| }, |
| { |
| "epoch": 6.829855537720706, |
| "grad_norm": 0.7699603449450781, |
| "learning_rate": 7.33404713351371e-08, |
| "loss": 0.1318, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.12732994556427002, |
| "step": 4255, |
| "valid_targets_mean": 2395.6, |
| "valid_targets_min": 1057 |
| }, |
| { |
| "epoch": 6.837881219903692, |
| "grad_norm": 0.8872853267014166, |
| "learning_rate": 6.665008832438923e-08, |
| "loss": 0.1317, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.13180556893348694, |
| "step": 4260, |
| "valid_targets_mean": 2180.7, |
| "valid_targets_min": 551 |
| }, |
| { |
| "epoch": 6.845906902086678, |
| "grad_norm": 0.7725443532887755, |
| "learning_rate": 6.027912484426468e-08, |
| "loss": 0.1385, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.11179924011230469, |
| "step": 4265, |
| "valid_targets_mean": 1924.9, |
| "valid_targets_min": 746 |
| }, |
| { |
| "epoch": 6.853932584269663, |
| "grad_norm": 0.8216166028267735, |
| "learning_rate": 5.4227682985494854e-08, |
| "loss": 0.1257, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.11613370478153229, |
| "step": 4270, |
| "valid_targets_mean": 2039.6, |
| "valid_targets_min": 605 |
| }, |
| { |
| "epoch": 6.861958266452649, |
| "grad_norm": 0.716010306215438, |
| "learning_rate": 4.849585971866688e-08, |
| "loss": 0.141, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.13099314272403717, |
| "step": 4275, |
| "valid_targets_mean": 2827.7, |
| "valid_targets_min": 1177 |
| }, |
| { |
| "epoch": 6.8699839486356336, |
| "grad_norm": 1.008634190990714, |
| "learning_rate": 4.3083746892684796e-08, |
| "loss": 0.1366, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.13648265600204468, |
| "step": 4280, |
| "valid_targets_mean": 2092.2, |
| "valid_targets_min": 750 |
| }, |
| { |
| "epoch": 6.878009630818619, |
| "grad_norm": 0.8050911139139982, |
| "learning_rate": 3.7991431233288525e-08, |
| "loss": 0.1281, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.12041358649730682, |
| "step": 4285, |
| "valid_targets_mean": 2016.8, |
| "valid_targets_min": 694 |
| }, |
| { |
| "epoch": 6.886035313001605, |
| "grad_norm": 0.7538681689851715, |
| "learning_rate": 3.321899434166831e-08, |
| "loss": 0.1315, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.12728962302207947, |
| "step": 4290, |
| "valid_targets_mean": 2348.8, |
| "valid_targets_min": 739 |
| }, |
| { |
| "epoch": 6.89406099518459, |
| "grad_norm": 0.9078340983454675, |
| "learning_rate": 2.876651269315689e-08, |
| "loss": 0.13, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.13924184441566467, |
| "step": 4295, |
| "valid_targets_mean": 1564.9, |
| "valid_targets_min": 973 |
| }, |
| { |
| "epoch": 6.902086677367576, |
| "grad_norm": 0.8322797461761388, |
| "learning_rate": 2.4634057636001573e-08, |
| "loss": 0.1326, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.13911721110343933, |
| "step": 4300, |
| "valid_targets_mean": 1888.2, |
| "valid_targets_min": 841 |
| }, |
| { |
| "epoch": 6.910112359550562, |
| "grad_norm": 0.8873358332613721, |
| "learning_rate": 2.082169539022294e-08, |
| "loss": 0.1383, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1478015035390854, |
| "step": 4305, |
| "valid_targets_mean": 1802.1, |
| "valid_targets_min": 692 |
| }, |
| { |
| "epoch": 6.918138041733547, |
| "grad_norm": 0.8910795462193187, |
| "learning_rate": 1.7329487046555683e-08, |
| "loss": 0.1275, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.13803160190582275, |
| "step": 4310, |
| "valid_targets_mean": 1852.9, |
| "valid_targets_min": 888 |
| }, |
| { |
| "epoch": 6.926163723916533, |
| "grad_norm": 0.7929871067815147, |
| "learning_rate": 1.4157488565464949e-08, |
| "loss": 0.136, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.12524215877056122, |
| "step": 4315, |
| "valid_targets_mean": 2124.4, |
| "valid_targets_min": 652 |
| }, |
| { |
| "epoch": 6.934189406099518, |
| "grad_norm": 0.8321158322797556, |
| "learning_rate": 1.1305750776253733e-08, |
| "loss": 0.1295, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.12520332634449005, |
| "step": 4320, |
| "valid_targets_mean": 2153.6, |
| "valid_targets_min": 692 |
| }, |
| { |
| "epoch": 6.942215088282504, |
| "grad_norm": 0.8721383068519388, |
| "learning_rate": 8.774319376245733e-09, |
| "loss": 0.1336, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.13430440425872803, |
| "step": 4325, |
| "valid_targets_mean": 1598.9, |
| "valid_targets_min": 737 |
| }, |
| { |
| "epoch": 6.95024077046549, |
| "grad_norm": 0.7481357903290494, |
| "learning_rate": 6.56323493005262e-09, |
| "loss": 0.1284, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.11327686160802841, |
| "step": 4330, |
| "valid_targets_mean": 2174.6, |
| "valid_targets_min": 909 |
| }, |
| { |
| "epoch": 6.958266452648475, |
| "grad_norm": 0.8510993038307517, |
| "learning_rate": 4.672532868927882e-09, |
| "loss": 0.1268, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1371006816625595, |
| "step": 4335, |
| "valid_targets_mean": 1838.2, |
| "valid_targets_min": 769 |
| }, |
| { |
| "epoch": 6.966292134831461, |
| "grad_norm": 0.8256184023206394, |
| "learning_rate": 3.102243490196166e-09, |
| "loss": 0.1355, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.12108443677425385, |
| "step": 4340, |
| "valid_targets_mean": 1822.3, |
| "valid_targets_min": 711 |
| }, |
| { |
| "epoch": 6.974317817014446, |
| "grad_norm": 0.6715633485519991, |
| "learning_rate": 1.8523919567692283e-09, |
| "loss": 0.1289, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.11774402111768723, |
| "step": 4345, |
| "valid_targets_mean": 2833.9, |
| "valid_targets_min": 978 |
| }, |
| { |
| "epoch": 6.982343499197432, |
| "grad_norm": 0.7122923788742873, |
| "learning_rate": 9.229982967373652e-10, |
| "loss": 0.127, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.13086260855197906, |
| "step": 4350, |
| "valid_targets_mean": 3114.6, |
| "valid_targets_min": 1397 |
| }, |
| { |
| "epoch": 6.990369181380418, |
| "grad_norm": 0.7497754087372094, |
| "learning_rate": 3.1407740305633425e-10, |
| "loss": 0.1304, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.12377274036407471, |
| "step": 4355, |
| "valid_targets_mean": 2433.6, |
| "valid_targets_min": 855 |
| }, |
| { |
| "epoch": 6.998394863563403, |
| "grad_norm": 0.9056604423294736, |
| "learning_rate": 2.563903330532469e-11, |
| "loss": 0.1313, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.12367966026067734, |
| "step": 4360, |
| "valid_targets_mean": 2186.9, |
| "valid_targets_min": 714 |
| }, |
| { |
| "epoch": 7.0, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.12605062127113342, |
| "step": 4361, |
| "total_flos": 649913807929344.0, |
| "train_loss": 0.21077685282949843, |
| "train_runtime": 19161.6847, |
| "train_samples_per_second": 3.639, |
| "train_steps_per_second": 0.228, |
| "valid_targets_mean": 2205.3, |
| "valid_targets_min": 939 |
| } |
| ], |
| "logging_steps": 5, |
| "max_steps": 4361, |
| "num_input_tokens_seen": 0, |
| "num_train_epochs": 7, |
| "save_steps": 200, |
| "stateful_callbacks": { |
| "TrainerControl": { |
| "args": { |
| "should_epoch_stop": false, |
| "should_evaluate": false, |
| "should_log": false, |
| "should_save": true, |
| "should_training_stop": true |
| }, |
| "attributes": {} |
| } |
| }, |
| "total_flos": 649913807929344.0, |
| "train_batch_size": 1, |
| "trial_name": null, |
| "trial_params": null |
| } |
|
|