| { |
| "best_global_step": null, |
| "best_metric": null, |
| "best_model_checkpoint": null, |
| "epoch": 7.0, |
| "eval_steps": 500, |
| "global_step": 4347, |
| "is_hyper_param_search": false, |
| "is_local_process_zero": true, |
| "is_world_process_zero": true, |
| "log_history": [ |
| { |
| "epoch": 0.008051529790660225, |
| "grad_norm": 18.887031329342683, |
| "learning_rate": 3.6781609195402303e-07, |
| "loss": 0.7617, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.7170521020889282, |
| "step": 5, |
| "valid_targets_mean": 4721.3, |
| "valid_targets_min": 995 |
| }, |
| { |
| "epoch": 0.01610305958132045, |
| "grad_norm": 17.610592482733104, |
| "learning_rate": 8.275862068965518e-07, |
| "loss": 0.7308, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.7500532865524292, |
| "step": 10, |
| "valid_targets_mean": 4560.7, |
| "valid_targets_min": 1282 |
| }, |
| { |
| "epoch": 0.024154589371980676, |
| "grad_norm": 17.389455158716025, |
| "learning_rate": 1.2873563218390806e-06, |
| "loss": 0.719, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.7645566463470459, |
| "step": 15, |
| "valid_targets_mean": 4224.9, |
| "valid_targets_min": 1424 |
| }, |
| { |
| "epoch": 0.0322061191626409, |
| "grad_norm": 12.900467657800844, |
| "learning_rate": 1.7471264367816093e-06, |
| "loss": 0.6498, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.6394810676574707, |
| "step": 20, |
| "valid_targets_mean": 3705.6, |
| "valid_targets_min": 613 |
| }, |
| { |
| "epoch": 0.040257648953301126, |
| "grad_norm": 8.27577785552847, |
| "learning_rate": 2.206896551724138e-06, |
| "loss": 0.6021, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.6195220351219177, |
| "step": 25, |
| "valid_targets_mean": 4815.3, |
| "valid_targets_min": 1591 |
| }, |
| { |
| "epoch": 0.04830917874396135, |
| "grad_norm": 4.570129109709082, |
| "learning_rate": 2.666666666666667e-06, |
| "loss": 0.5337, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.4826958477497101, |
| "step": 30, |
| "valid_targets_mean": 4646.1, |
| "valid_targets_min": 1763 |
| }, |
| { |
| "epoch": 0.05636070853462158, |
| "grad_norm": 2.9815097303289773, |
| "learning_rate": 3.1264367816091956e-06, |
| "loss": 0.5145, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.5005267858505249, |
| "step": 35, |
| "valid_targets_mean": 4164.2, |
| "valid_targets_min": 1256 |
| }, |
| { |
| "epoch": 0.0644122383252818, |
| "grad_norm": 1.6024853481776866, |
| "learning_rate": 3.5862068965517243e-06, |
| "loss": 0.4877, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.43937644362449646, |
| "step": 40, |
| "valid_targets_mean": 4963.1, |
| "valid_targets_min": 1405 |
| }, |
| { |
| "epoch": 0.07246376811594203, |
| "grad_norm": 1.1550666348042289, |
| "learning_rate": 4.0459770114942535e-06, |
| "loss": 0.4836, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.45346975326538086, |
| "step": 45, |
| "valid_targets_mean": 5371.4, |
| "valid_targets_min": 1739 |
| }, |
| { |
| "epoch": 0.08051529790660225, |
| "grad_norm": 1.1056770926806292, |
| "learning_rate": 4.505747126436782e-06, |
| "loss": 0.4879, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.4831688106060028, |
| "step": 50, |
| "valid_targets_mean": 5321.5, |
| "valid_targets_min": 1966 |
| }, |
| { |
| "epoch": 0.08856682769726248, |
| "grad_norm": 0.9520259825035011, |
| "learning_rate": 4.965517241379311e-06, |
| "loss": 0.4173, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.43055927753448486, |
| "step": 55, |
| "valid_targets_mean": 4930.1, |
| "valid_targets_min": 1613 |
| }, |
| { |
| "epoch": 0.0966183574879227, |
| "grad_norm": 0.7379387322001421, |
| "learning_rate": 5.42528735632184e-06, |
| "loss": 0.4301, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.41147735714912415, |
| "step": 60, |
| "valid_targets_mean": 4576.1, |
| "valid_targets_min": 693 |
| }, |
| { |
| "epoch": 0.10466988727858294, |
| "grad_norm": 0.6751399532440802, |
| "learning_rate": 5.8850574712643685e-06, |
| "loss": 0.3953, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.40098029375076294, |
| "step": 65, |
| "valid_targets_mean": 4767.1, |
| "valid_targets_min": 1984 |
| }, |
| { |
| "epoch": 0.11272141706924316, |
| "grad_norm": 0.6451168287397513, |
| "learning_rate": 6.344827586206898e-06, |
| "loss": 0.3955, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.41312819719314575, |
| "step": 70, |
| "valid_targets_mean": 4322.2, |
| "valid_targets_min": 523 |
| }, |
| { |
| "epoch": 0.12077294685990338, |
| "grad_norm": 0.6097646247381094, |
| "learning_rate": 6.804597701149426e-06, |
| "loss": 0.4048, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3773424029350281, |
| "step": 75, |
| "valid_targets_mean": 4922.2, |
| "valid_targets_min": 1736 |
| }, |
| { |
| "epoch": 0.1288244766505636, |
| "grad_norm": 0.6955263869864199, |
| "learning_rate": 7.264367816091955e-06, |
| "loss": 0.386, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3395404815673828, |
| "step": 80, |
| "valid_targets_mean": 4326.2, |
| "valid_targets_min": 822 |
| }, |
| { |
| "epoch": 0.13687600644122383, |
| "grad_norm": 0.6047921080138658, |
| "learning_rate": 7.724137931034483e-06, |
| "loss": 0.373, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.33859458565711975, |
| "step": 85, |
| "valid_targets_mean": 4358.8, |
| "valid_targets_min": 2465 |
| }, |
| { |
| "epoch": 0.14492753623188406, |
| "grad_norm": 0.5884903953581806, |
| "learning_rate": 8.183908045977013e-06, |
| "loss": 0.3308, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.323479026556015, |
| "step": 90, |
| "valid_targets_mean": 4712.4, |
| "valid_targets_min": 2373 |
| }, |
| { |
| "epoch": 0.1529790660225443, |
| "grad_norm": 0.5738600516460006, |
| "learning_rate": 8.643678160919541e-06, |
| "loss": 0.3431, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.33414769172668457, |
| "step": 95, |
| "valid_targets_mean": 4288.1, |
| "valid_targets_min": 1850 |
| }, |
| { |
| "epoch": 0.1610305958132045, |
| "grad_norm": 0.6365501852080249, |
| "learning_rate": 9.10344827586207e-06, |
| "loss": 0.3526, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.41237330436706543, |
| "step": 100, |
| "valid_targets_mean": 4589.5, |
| "valid_targets_min": 617 |
| }, |
| { |
| "epoch": 0.16908212560386474, |
| "grad_norm": 0.5810936825227695, |
| "learning_rate": 9.563218390804598e-06, |
| "loss": 0.3694, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3179246783256531, |
| "step": 105, |
| "valid_targets_mean": 4583.3, |
| "valid_targets_min": 892 |
| }, |
| { |
| "epoch": 0.17713365539452497, |
| "grad_norm": 0.6085982104059682, |
| "learning_rate": 1.0022988505747126e-05, |
| "loss": 0.3688, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3603907823562622, |
| "step": 110, |
| "valid_targets_mean": 3972.6, |
| "valid_targets_min": 529 |
| }, |
| { |
| "epoch": 0.18518518518518517, |
| "grad_norm": 0.6219836430762767, |
| "learning_rate": 1.0482758620689658e-05, |
| "loss": 0.3434, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.36107924580574036, |
| "step": 115, |
| "valid_targets_mean": 3626.8, |
| "valid_targets_min": 784 |
| }, |
| { |
| "epoch": 0.1932367149758454, |
| "grad_norm": 0.5706613275227181, |
| "learning_rate": 1.0942528735632186e-05, |
| "loss": 0.3638, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.35068589448928833, |
| "step": 120, |
| "valid_targets_mean": 4590.1, |
| "valid_targets_min": 708 |
| }, |
| { |
| "epoch": 0.20128824476650564, |
| "grad_norm": 0.5239098489712369, |
| "learning_rate": 1.1402298850574713e-05, |
| "loss": 0.3214, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.31050339341163635, |
| "step": 125, |
| "valid_targets_mean": 4365.3, |
| "valid_targets_min": 919 |
| }, |
| { |
| "epoch": 0.20933977455716588, |
| "grad_norm": 0.5408209063854124, |
| "learning_rate": 1.1862068965517241e-05, |
| "loss": 0.3312, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.343374639749527, |
| "step": 130, |
| "valid_targets_mean": 4735.1, |
| "valid_targets_min": 502 |
| }, |
| { |
| "epoch": 0.21739130434782608, |
| "grad_norm": 0.5429590967253727, |
| "learning_rate": 1.2321839080459773e-05, |
| "loss": 0.3132, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2973455786705017, |
| "step": 135, |
| "valid_targets_mean": 4331.6, |
| "valid_targets_min": 1580 |
| }, |
| { |
| "epoch": 0.22544283413848631, |
| "grad_norm": 0.5564263430607277, |
| "learning_rate": 1.2781609195402301e-05, |
| "loss": 0.3223, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.33352577686309814, |
| "step": 140, |
| "valid_targets_mean": 4605.9, |
| "valid_targets_min": 973 |
| }, |
| { |
| "epoch": 0.23349436392914655, |
| "grad_norm": 0.59405705309966, |
| "learning_rate": 1.324137931034483e-05, |
| "loss": 0.3197, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.31183719635009766, |
| "step": 145, |
| "valid_targets_mean": 3893.1, |
| "valid_targets_min": 1253 |
| }, |
| { |
| "epoch": 0.24154589371980675, |
| "grad_norm": 0.5158909121745847, |
| "learning_rate": 1.3701149425287356e-05, |
| "loss": 0.3199, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2867949604988098, |
| "step": 150, |
| "valid_targets_mean": 4840.7, |
| "valid_targets_min": 1486 |
| }, |
| { |
| "epoch": 0.249597423510467, |
| "grad_norm": 0.6568765520342051, |
| "learning_rate": 1.4160919540229888e-05, |
| "loss": 0.3106, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3462482690811157, |
| "step": 155, |
| "valid_targets_mean": 3947.3, |
| "valid_targets_min": 1429 |
| }, |
| { |
| "epoch": 0.2576489533011272, |
| "grad_norm": 0.6071351268604575, |
| "learning_rate": 1.4620689655172416e-05, |
| "loss": 0.3274, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.33247584104537964, |
| "step": 160, |
| "valid_targets_mean": 4600.6, |
| "valid_targets_min": 1925 |
| }, |
| { |
| "epoch": 0.26570048309178745, |
| "grad_norm": 0.538560909580689, |
| "learning_rate": 1.5080459770114944e-05, |
| "loss": 0.3158, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.31049293279647827, |
| "step": 165, |
| "valid_targets_mean": 5258.5, |
| "valid_targets_min": 1983 |
| }, |
| { |
| "epoch": 0.27375201288244766, |
| "grad_norm": 0.568539391929678, |
| "learning_rate": 1.5540229885057473e-05, |
| "loss": 0.3157, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.30851513147354126, |
| "step": 170, |
| "valid_targets_mean": 4449.2, |
| "valid_targets_min": 453 |
| }, |
| { |
| "epoch": 0.28180354267310787, |
| "grad_norm": 0.6078239781315768, |
| "learning_rate": 1.6000000000000003e-05, |
| "loss": 0.3106, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.302283376455307, |
| "step": 175, |
| "valid_targets_mean": 4618.0, |
| "valid_targets_min": 2377 |
| }, |
| { |
| "epoch": 0.2898550724637681, |
| "grad_norm": 0.5885746435904814, |
| "learning_rate": 1.645977011494253e-05, |
| "loss": 0.3296, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3404327630996704, |
| "step": 180, |
| "valid_targets_mean": 4848.8, |
| "valid_targets_min": 1075 |
| }, |
| { |
| "epoch": 0.29790660225442833, |
| "grad_norm": 0.6287600513879442, |
| "learning_rate": 1.691954022988506e-05, |
| "loss": 0.3086, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.35874509811401367, |
| "step": 185, |
| "valid_targets_mean": 4003.5, |
| "valid_targets_min": 321 |
| }, |
| { |
| "epoch": 0.3059581320450886, |
| "grad_norm": 0.5118887113449945, |
| "learning_rate": 1.7379310344827586e-05, |
| "loss": 0.3036, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3192656636238098, |
| "step": 190, |
| "valid_targets_mean": 5059.1, |
| "valid_targets_min": 2133 |
| }, |
| { |
| "epoch": 0.3140096618357488, |
| "grad_norm": 0.5676499502591437, |
| "learning_rate": 1.7839080459770116e-05, |
| "loss": 0.2746, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2645234167575836, |
| "step": 195, |
| "valid_targets_mean": 4453.4, |
| "valid_targets_min": 1599 |
| }, |
| { |
| "epoch": 0.322061191626409, |
| "grad_norm": 0.5756721398531897, |
| "learning_rate": 1.8298850574712646e-05, |
| "loss": 0.3204, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3237614631652832, |
| "step": 200, |
| "valid_targets_mean": 4916.9, |
| "valid_targets_min": 2747 |
| }, |
| { |
| "epoch": 0.33011272141706927, |
| "grad_norm": 0.661205961638061, |
| "learning_rate": 1.8758620689655173e-05, |
| "loss": 0.2988, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.30946576595306396, |
| "step": 205, |
| "valid_targets_mean": 4202.1, |
| "valid_targets_min": 1793 |
| }, |
| { |
| "epoch": 0.33816425120772947, |
| "grad_norm": 0.5585042067771965, |
| "learning_rate": 1.9218390804597703e-05, |
| "loss": 0.3035, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.30198991298675537, |
| "step": 210, |
| "valid_targets_mean": 4014.8, |
| "valid_targets_min": 1521 |
| }, |
| { |
| "epoch": 0.3462157809983897, |
| "grad_norm": 0.5364392722283728, |
| "learning_rate": 1.9678160919540233e-05, |
| "loss": 0.3032, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3075558841228485, |
| "step": 215, |
| "valid_targets_mean": 4535.4, |
| "valid_targets_min": 736 |
| }, |
| { |
| "epoch": 0.35426731078904994, |
| "grad_norm": 0.5478504018061776, |
| "learning_rate": 2.013793103448276e-05, |
| "loss": 0.293, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.30238276720046997, |
| "step": 220, |
| "valid_targets_mean": 4278.9, |
| "valid_targets_min": 506 |
| }, |
| { |
| "epoch": 0.36231884057971014, |
| "grad_norm": 0.5543366789399233, |
| "learning_rate": 2.059770114942529e-05, |
| "loss": 0.3067, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.31759655475616455, |
| "step": 225, |
| "valid_targets_mean": 5445.6, |
| "valid_targets_min": 1006 |
| }, |
| { |
| "epoch": 0.37037037037037035, |
| "grad_norm": 0.6286539962949731, |
| "learning_rate": 2.1057471264367816e-05, |
| "loss": 0.2964, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.30352896451950073, |
| "step": 230, |
| "valid_targets_mean": 3805.3, |
| "valid_targets_min": 676 |
| }, |
| { |
| "epoch": 0.3784219001610306, |
| "grad_norm": 0.5644783614075699, |
| "learning_rate": 2.1517241379310346e-05, |
| "loss": 0.2967, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3186013102531433, |
| "step": 235, |
| "valid_targets_mean": 4621.7, |
| "valid_targets_min": 1571 |
| }, |
| { |
| "epoch": 0.3864734299516908, |
| "grad_norm": 0.5931980260785429, |
| "learning_rate": 2.1977011494252873e-05, |
| "loss": 0.3034, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.28426745533943176, |
| "step": 240, |
| "valid_targets_mean": 4771.1, |
| "valid_targets_min": 2048 |
| }, |
| { |
| "epoch": 0.394524959742351, |
| "grad_norm": 0.5236909740791719, |
| "learning_rate": 2.2436781609195406e-05, |
| "loss": 0.2915, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2973197102546692, |
| "step": 245, |
| "valid_targets_mean": 4744.9, |
| "valid_targets_min": 1209 |
| }, |
| { |
| "epoch": 0.4025764895330113, |
| "grad_norm": 0.5306243392897267, |
| "learning_rate": 2.2896551724137933e-05, |
| "loss": 0.2952, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3088257312774658, |
| "step": 250, |
| "valid_targets_mean": 5178.1, |
| "valid_targets_min": 1966 |
| }, |
| { |
| "epoch": 0.4106280193236715, |
| "grad_norm": 0.48677773497495813, |
| "learning_rate": 2.3356321839080463e-05, |
| "loss": 0.285, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.26008594036102295, |
| "step": 255, |
| "valid_targets_mean": 5040.2, |
| "valid_targets_min": 1177 |
| }, |
| { |
| "epoch": 0.41867954911433175, |
| "grad_norm": 1.2774083864267622, |
| "learning_rate": 2.381609195402299e-05, |
| "loss": 0.2967, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2775506377220154, |
| "step": 260, |
| "valid_targets_mean": 4319.1, |
| "valid_targets_min": 570 |
| }, |
| { |
| "epoch": 0.42673107890499196, |
| "grad_norm": 0.6457594097564714, |
| "learning_rate": 2.427586206896552e-05, |
| "loss": 0.2886, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2859913408756256, |
| "step": 265, |
| "valid_targets_mean": 3785.8, |
| "valid_targets_min": 284 |
| }, |
| { |
| "epoch": 0.43478260869565216, |
| "grad_norm": 0.5721794133457904, |
| "learning_rate": 2.4735632183908046e-05, |
| "loss": 0.2675, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2737387716770172, |
| "step": 270, |
| "valid_targets_mean": 4904.9, |
| "valid_targets_min": 1197 |
| }, |
| { |
| "epoch": 0.4428341384863124, |
| "grad_norm": 0.6155727873490212, |
| "learning_rate": 2.5195402298850576e-05, |
| "loss": 0.2987, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.317902147769928, |
| "step": 275, |
| "valid_targets_mean": 3661.2, |
| "valid_targets_min": 818 |
| }, |
| { |
| "epoch": 0.45088566827697263, |
| "grad_norm": 0.6349757508130273, |
| "learning_rate": 2.5655172413793103e-05, |
| "loss": 0.282, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2630305290222168, |
| "step": 280, |
| "valid_targets_mean": 3326.7, |
| "valid_targets_min": 941 |
| }, |
| { |
| "epoch": 0.45893719806763283, |
| "grad_norm": 0.6148296415866233, |
| "learning_rate": 2.6114942528735636e-05, |
| "loss": 0.2793, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.27396440505981445, |
| "step": 285, |
| "valid_targets_mean": 4434.6, |
| "valid_targets_min": 1038 |
| }, |
| { |
| "epoch": 0.4669887278582931, |
| "grad_norm": 0.5645172489838126, |
| "learning_rate": 2.6574712643678166e-05, |
| "loss": 0.2686, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.25225305557250977, |
| "step": 290, |
| "valid_targets_mean": 4993.3, |
| "valid_targets_min": 1962 |
| }, |
| { |
| "epoch": 0.4750402576489533, |
| "grad_norm": 0.5739342126572219, |
| "learning_rate": 2.7034482758620693e-05, |
| "loss": 0.2957, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.340742826461792, |
| "step": 295, |
| "valid_targets_mean": 4796.8, |
| "valid_targets_min": 710 |
| }, |
| { |
| "epoch": 0.4830917874396135, |
| "grad_norm": 0.5587075968581772, |
| "learning_rate": 2.749425287356322e-05, |
| "loss": 0.2832, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.27218180894851685, |
| "step": 300, |
| "valid_targets_mean": 4788.8, |
| "valid_targets_min": 882 |
| }, |
| { |
| "epoch": 0.49114331723027377, |
| "grad_norm": 0.7790422573070022, |
| "learning_rate": 2.795402298850575e-05, |
| "loss": 0.2762, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.25361332297325134, |
| "step": 305, |
| "valid_targets_mean": 3807.0, |
| "valid_targets_min": 344 |
| }, |
| { |
| "epoch": 0.499194847020934, |
| "grad_norm": 0.5359108312034309, |
| "learning_rate": 2.8413793103448276e-05, |
| "loss": 0.2899, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.24744702875614166, |
| "step": 310, |
| "valid_targets_mean": 4844.2, |
| "valid_targets_min": 1948 |
| }, |
| { |
| "epoch": 0.5072463768115942, |
| "grad_norm": 0.7694244503734501, |
| "learning_rate": 2.8873563218390806e-05, |
| "loss": 0.2574, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.25962382555007935, |
| "step": 315, |
| "valid_targets_mean": 3957.3, |
| "valid_targets_min": 751 |
| }, |
| { |
| "epoch": 0.5152979066022544, |
| "grad_norm": 0.6998112569580612, |
| "learning_rate": 2.9333333333333333e-05, |
| "loss": 0.2823, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.283919095993042, |
| "step": 320, |
| "valid_targets_mean": 4178.9, |
| "valid_targets_min": 1504 |
| }, |
| { |
| "epoch": 0.5233494363929146, |
| "grad_norm": 0.5572107376686236, |
| "learning_rate": 2.9793103448275866e-05, |
| "loss": 0.299, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3307899236679077, |
| "step": 325, |
| "valid_targets_mean": 4934.9, |
| "valid_targets_min": 860 |
| }, |
| { |
| "epoch": 0.5314009661835749, |
| "grad_norm": 0.5601650228344617, |
| "learning_rate": 3.0252873563218396e-05, |
| "loss": 0.2824, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.26864737272262573, |
| "step": 330, |
| "valid_targets_mean": 3976.2, |
| "valid_targets_min": 1313 |
| }, |
| { |
| "epoch": 0.5394524959742351, |
| "grad_norm": 0.6400241549564539, |
| "learning_rate": 3.071264367816092e-05, |
| "loss": 0.2817, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2869405746459961, |
| "step": 335, |
| "valid_targets_mean": 4011.7, |
| "valid_targets_min": 952 |
| }, |
| { |
| "epoch": 0.5475040257648953, |
| "grad_norm": 0.5021644926973708, |
| "learning_rate": 3.117241379310345e-05, |
| "loss": 0.2568, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2651926279067993, |
| "step": 340, |
| "valid_targets_mean": 5310.1, |
| "valid_targets_min": 692 |
| }, |
| { |
| "epoch": 0.5555555555555556, |
| "grad_norm": 0.819724946601287, |
| "learning_rate": 3.1632183908045976e-05, |
| "loss": 0.2768, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.297665536403656, |
| "step": 345, |
| "valid_targets_mean": 3748.9, |
| "valid_targets_min": 249 |
| }, |
| { |
| "epoch": 0.5636070853462157, |
| "grad_norm": 0.49635945683598137, |
| "learning_rate": 3.2091954022988506e-05, |
| "loss": 0.2736, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.27254384756088257, |
| "step": 350, |
| "valid_targets_mean": 4190.4, |
| "valid_targets_min": 380 |
| }, |
| { |
| "epoch": 0.571658615136876, |
| "grad_norm": 1.1643886506532481, |
| "learning_rate": 3.2551724137931036e-05, |
| "loss": 0.2698, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2615281343460083, |
| "step": 355, |
| "valid_targets_mean": 3684.1, |
| "valid_targets_min": 304 |
| }, |
| { |
| "epoch": 0.5797101449275363, |
| "grad_norm": 0.5045131044975655, |
| "learning_rate": 3.3011494252873566e-05, |
| "loss": 0.2772, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.28446757793426514, |
| "step": 360, |
| "valid_targets_mean": 5213.9, |
| "valid_targets_min": 2518 |
| }, |
| { |
| "epoch": 0.5877616747181964, |
| "grad_norm": 0.5901966768401951, |
| "learning_rate": 3.3471264367816096e-05, |
| "loss": 0.2751, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2504952549934387, |
| "step": 365, |
| "valid_targets_mean": 4182.6, |
| "valid_targets_min": 691 |
| }, |
| { |
| "epoch": 0.5958132045088567, |
| "grad_norm": 0.620399649393727, |
| "learning_rate": 3.3931034482758626e-05, |
| "loss": 0.2721, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2381853461265564, |
| "step": 370, |
| "valid_targets_mean": 4586.0, |
| "valid_targets_min": 1672 |
| }, |
| { |
| "epoch": 0.6038647342995169, |
| "grad_norm": 0.5417315383509183, |
| "learning_rate": 3.4390804597701156e-05, |
| "loss": 0.2635, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2672516405582428, |
| "step": 375, |
| "valid_targets_mean": 4311.4, |
| "valid_targets_min": 1082 |
| }, |
| { |
| "epoch": 0.6119162640901772, |
| "grad_norm": 0.6433514192784039, |
| "learning_rate": 3.485057471264368e-05, |
| "loss": 0.284, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.32015344500541687, |
| "step": 380, |
| "valid_targets_mean": 3902.9, |
| "valid_targets_min": 1623 |
| }, |
| { |
| "epoch": 0.6199677938808373, |
| "grad_norm": 0.4775998328542989, |
| "learning_rate": 3.531034482758621e-05, |
| "loss": 0.2664, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.24788491427898407, |
| "step": 385, |
| "valid_targets_mean": 4189.4, |
| "valid_targets_min": 713 |
| }, |
| { |
| "epoch": 0.6280193236714976, |
| "grad_norm": 0.5122265709609899, |
| "learning_rate": 3.577011494252874e-05, |
| "loss": 0.2738, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.27622339129447937, |
| "step": 390, |
| "valid_targets_mean": 4446.6, |
| "valid_targets_min": 1670 |
| }, |
| { |
| "epoch": 0.6360708534621579, |
| "grad_norm": 0.659466553378636, |
| "learning_rate": 3.622988505747126e-05, |
| "loss": 0.2831, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3116128742694855, |
| "step": 395, |
| "valid_targets_mean": 4667.6, |
| "valid_targets_min": 1070 |
| }, |
| { |
| "epoch": 0.644122383252818, |
| "grad_norm": 0.5849425616180388, |
| "learning_rate": 3.668965517241379e-05, |
| "loss": 0.2548, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.27755099534988403, |
| "step": 400, |
| "valid_targets_mean": 4714.6, |
| "valid_targets_min": 995 |
| }, |
| { |
| "epoch": 0.6521739130434783, |
| "grad_norm": 0.5327108961779472, |
| "learning_rate": 3.714942528735633e-05, |
| "loss": 0.2745, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.27385851740837097, |
| "step": 405, |
| "valid_targets_mean": 5260.8, |
| "valid_targets_min": 2141 |
| }, |
| { |
| "epoch": 0.6602254428341385, |
| "grad_norm": 0.5998643197455865, |
| "learning_rate": 3.760919540229885e-05, |
| "loss": 0.2872, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3069554567337036, |
| "step": 410, |
| "valid_targets_mean": 4323.8, |
| "valid_targets_min": 831 |
| }, |
| { |
| "epoch": 0.6682769726247987, |
| "grad_norm": 0.5690712799581026, |
| "learning_rate": 3.806896551724138e-05, |
| "loss": 0.2731, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.29719623923301697, |
| "step": 415, |
| "valid_targets_mean": 4270.9, |
| "valid_targets_min": 1089 |
| }, |
| { |
| "epoch": 0.6763285024154589, |
| "grad_norm": 0.5754513117973928, |
| "learning_rate": 3.852873563218391e-05, |
| "loss": 0.2721, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.29911819100379944, |
| "step": 420, |
| "valid_targets_mean": 4512.4, |
| "valid_targets_min": 1988 |
| }, |
| { |
| "epoch": 0.6843800322061192, |
| "grad_norm": 0.6061703211904361, |
| "learning_rate": 3.898850574712644e-05, |
| "loss": 0.2673, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.23556432127952576, |
| "step": 425, |
| "valid_targets_mean": 3921.6, |
| "valid_targets_min": 1217 |
| }, |
| { |
| "epoch": 0.6924315619967794, |
| "grad_norm": 0.5391890622955845, |
| "learning_rate": 3.9448275862068966e-05, |
| "loss": 0.2459, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.23832057416439056, |
| "step": 430, |
| "valid_targets_mean": 4345.2, |
| "valid_targets_min": 2090 |
| }, |
| { |
| "epoch": 0.7004830917874396, |
| "grad_norm": 0.6101927641358206, |
| "learning_rate": 3.9908045977011496e-05, |
| "loss": 0.2721, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2649371325969696, |
| "step": 435, |
| "valid_targets_mean": 4433.6, |
| "valid_targets_min": 1317 |
| }, |
| { |
| "epoch": 0.7085346215780999, |
| "grad_norm": 0.5646390271799305, |
| "learning_rate": 3.9999896813789735e-05, |
| "loss": 0.2601, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.27699440717697144, |
| "step": 440, |
| "valid_targets_mean": 4894.1, |
| "valid_targets_min": 731 |
| }, |
| { |
| "epoch": 0.71658615136876, |
| "grad_norm": 0.5718807548846909, |
| "learning_rate": 3.999947762163533e-05, |
| "loss": 0.2623, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.29374945163726807, |
| "step": 445, |
| "valid_targets_mean": 3907.8, |
| "valid_targets_min": 1022 |
| }, |
| { |
| "epoch": 0.7246376811594203, |
| "grad_norm": 0.5614682322405541, |
| "learning_rate": 3.999873598115203e-05, |
| "loss": 0.251, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.257183313369751, |
| "step": 450, |
| "valid_targets_mean": 4987.9, |
| "valid_targets_min": 1860 |
| }, |
| { |
| "epoch": 0.7326892109500805, |
| "grad_norm": 0.5300074790618707, |
| "learning_rate": 3.999767190429718e-05, |
| "loss": 0.2748, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.23682445287704468, |
| "step": 455, |
| "valid_targets_mean": 5225.4, |
| "valid_targets_min": 2450 |
| }, |
| { |
| "epoch": 0.7407407407407407, |
| "grad_norm": 0.6542049865844981, |
| "learning_rate": 3.99962854082267e-05, |
| "loss": 0.2822, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.29080742597579956, |
| "step": 460, |
| "valid_targets_mean": 4597.2, |
| "valid_targets_min": 2222 |
| }, |
| { |
| "epoch": 0.748792270531401, |
| "grad_norm": 0.502946880278254, |
| "learning_rate": 3.9994576515294864e-05, |
| "loss": 0.2668, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.28522011637687683, |
| "step": 465, |
| "valid_targets_mean": 4706.1, |
| "valid_targets_min": 1773 |
| }, |
| { |
| "epoch": 0.7568438003220612, |
| "grad_norm": 0.5050040823394027, |
| "learning_rate": 3.999254525305386e-05, |
| "loss": 0.2704, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2506832480430603, |
| "step": 470, |
| "valid_targets_mean": 5194.9, |
| "valid_targets_min": 715 |
| }, |
| { |
| "epoch": 0.7648953301127214, |
| "grad_norm": 0.8322414020355918, |
| "learning_rate": 3.999019165425341e-05, |
| "loss": 0.2682, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.29580700397491455, |
| "step": 475, |
| "valid_targets_mean": 3748.2, |
| "valid_targets_min": 1077 |
| }, |
| { |
| "epoch": 0.7729468599033816, |
| "grad_norm": 0.5680386432970268, |
| "learning_rate": 3.99875157568402e-05, |
| "loss": 0.2655, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2671373188495636, |
| "step": 480, |
| "valid_targets_mean": 4587.8, |
| "valid_targets_min": 775 |
| }, |
| { |
| "epoch": 0.7809983896940419, |
| "grad_norm": 0.5112203887556883, |
| "learning_rate": 3.998451760395729e-05, |
| "loss": 0.2623, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2868801951408386, |
| "step": 485, |
| "valid_targets_mean": 4774.4, |
| "valid_targets_min": 1792 |
| }, |
| { |
| "epoch": 0.789049919484702, |
| "grad_norm": 0.5606005265672219, |
| "learning_rate": 3.99811972439434e-05, |
| "loss": 0.2643, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2751631736755371, |
| "step": 490, |
| "valid_targets_mean": 4579.5, |
| "valid_targets_min": 1396 |
| }, |
| { |
| "epoch": 0.7971014492753623, |
| "grad_norm": 0.5467905444044749, |
| "learning_rate": 3.997755473033218e-05, |
| "loss": 0.2521, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2562072277069092, |
| "step": 495, |
| "valid_targets_mean": 3827.3, |
| "valid_targets_min": 1348 |
| }, |
| { |
| "epoch": 0.8051529790660226, |
| "grad_norm": 0.5387721194984708, |
| "learning_rate": 3.997359012185127e-05, |
| "loss": 0.2612, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2520545721054077, |
| "step": 500, |
| "valid_targets_mean": 4061.6, |
| "valid_targets_min": 547 |
| }, |
| { |
| "epoch": 0.8132045088566827, |
| "grad_norm": 0.5976518636156888, |
| "learning_rate": 3.996930348242141e-05, |
| "loss": 0.2388, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.23626355826854706, |
| "step": 505, |
| "valid_targets_mean": 4540.9, |
| "valid_targets_min": 1484 |
| }, |
| { |
| "epoch": 0.821256038647343, |
| "grad_norm": 0.6166919816090995, |
| "learning_rate": 3.996469488115539e-05, |
| "loss": 0.2583, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2615845203399658, |
| "step": 510, |
| "valid_targets_mean": 4508.8, |
| "valid_targets_min": 1246 |
| }, |
| { |
| "epoch": 0.8293075684380032, |
| "grad_norm": 0.530813397454018, |
| "learning_rate": 3.995976439235694e-05, |
| "loss": 0.2722, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2612318694591522, |
| "step": 515, |
| "valid_targets_mean": 4225.1, |
| "valid_targets_min": 1044 |
| }, |
| { |
| "epoch": 0.8373590982286635, |
| "grad_norm": 0.6517729260520128, |
| "learning_rate": 3.995451209551953e-05, |
| "loss": 0.2386, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.23576730489730835, |
| "step": 520, |
| "valid_targets_mean": 5023.0, |
| "valid_targets_min": 1701 |
| }, |
| { |
| "epoch": 0.8454106280193237, |
| "grad_norm": 0.4740752251218264, |
| "learning_rate": 3.994893807532509e-05, |
| "loss": 0.2922, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.28204214572906494, |
| "step": 525, |
| "valid_targets_mean": 4959.8, |
| "valid_targets_min": 1081 |
| }, |
| { |
| "epoch": 0.8534621578099839, |
| "grad_norm": 0.5257899294040256, |
| "learning_rate": 3.994304242164265e-05, |
| "loss": 0.2593, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2655045986175537, |
| "step": 530, |
| "valid_targets_mean": 4981.6, |
| "valid_targets_min": 2051 |
| }, |
| { |
| "epoch": 0.8615136876006442, |
| "grad_norm": 0.536523092714892, |
| "learning_rate": 3.9936825229526855e-05, |
| "loss": 0.2861, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.29214853048324585, |
| "step": 535, |
| "valid_targets_mean": 4368.4, |
| "valid_targets_min": 2191 |
| }, |
| { |
| "epoch": 0.8695652173913043, |
| "grad_norm": 0.5028299546325571, |
| "learning_rate": 3.9930286599216506e-05, |
| "loss": 0.2587, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.27183425426483154, |
| "step": 540, |
| "valid_targets_mean": 5098.8, |
| "valid_targets_min": 2186 |
| }, |
| { |
| "epoch": 0.8776167471819646, |
| "grad_norm": 0.5635419055915679, |
| "learning_rate": 3.9923426636132866e-05, |
| "loss": 0.2442, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2873607277870178, |
| "step": 545, |
| "valid_targets_mean": 4578.5, |
| "valid_targets_min": 1671 |
| }, |
| { |
| "epoch": 0.8856682769726248, |
| "grad_norm": 0.5724413640787459, |
| "learning_rate": 3.991624545087801e-05, |
| "loss": 0.2765, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.27895426750183105, |
| "step": 550, |
| "valid_targets_mean": 3958.7, |
| "valid_targets_min": 1181 |
| }, |
| { |
| "epoch": 0.893719806763285, |
| "grad_norm": 0.5024007626126078, |
| "learning_rate": 3.9908743159233016e-05, |
| "loss": 0.2569, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.20082515478134155, |
| "step": 555, |
| "valid_targets_mean": 4550.9, |
| "valid_targets_min": 1029 |
| }, |
| { |
| "epoch": 0.9017713365539453, |
| "grad_norm": 0.5485922659002295, |
| "learning_rate": 3.990091988215612e-05, |
| "loss": 0.2468, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2621651887893677, |
| "step": 560, |
| "valid_targets_mean": 4163.2, |
| "valid_targets_min": 1507 |
| }, |
| { |
| "epoch": 0.9098228663446055, |
| "grad_norm": 0.5184933123196136, |
| "learning_rate": 3.989277574578074e-05, |
| "loss": 0.2692, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.20918220281600952, |
| "step": 565, |
| "valid_targets_mean": 3785.8, |
| "valid_targets_min": 990 |
| }, |
| { |
| "epoch": 0.9178743961352657, |
| "grad_norm": 0.5186343425685319, |
| "learning_rate": 3.9884310881413473e-05, |
| "loss": 0.2637, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2877514362335205, |
| "step": 570, |
| "valid_targets_mean": 5365.6, |
| "valid_targets_min": 956 |
| }, |
| { |
| "epoch": 0.9259259259259259, |
| "grad_norm": 0.5097833267576443, |
| "learning_rate": 3.987552542553194e-05, |
| "loss": 0.2501, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.23448419570922852, |
| "step": 575, |
| "valid_targets_mean": 4300.2, |
| "valid_targets_min": 1615 |
| }, |
| { |
| "epoch": 0.9339774557165862, |
| "grad_norm": 0.5183101791069704, |
| "learning_rate": 3.9866419519782636e-05, |
| "loss": 0.2565, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2744702696800232, |
| "step": 580, |
| "valid_targets_mean": 4674.6, |
| "valid_targets_min": 267 |
| }, |
| { |
| "epoch": 0.9420289855072463, |
| "grad_norm": 0.5621277031078485, |
| "learning_rate": 3.985699331097858e-05, |
| "loss": 0.2678, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2877187728881836, |
| "step": 585, |
| "valid_targets_mean": 4813.2, |
| "valid_targets_min": 720 |
| }, |
| { |
| "epoch": 0.9500805152979066, |
| "grad_norm": 0.6940945000218365, |
| "learning_rate": 3.984724695109702e-05, |
| "loss": 0.2541, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.29620370268821716, |
| "step": 590, |
| "valid_targets_mean": 5132.4, |
| "valid_targets_min": 1631 |
| }, |
| { |
| "epoch": 0.9581320450885669, |
| "grad_norm": 0.6065162564844915, |
| "learning_rate": 3.983718059727693e-05, |
| "loss": 0.2557, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.27759110927581787, |
| "step": 595, |
| "valid_targets_mean": 3982.5, |
| "valid_targets_min": 1549 |
| }, |
| { |
| "epoch": 0.966183574879227, |
| "grad_norm": 0.5059275833472612, |
| "learning_rate": 3.9826794411816495e-05, |
| "loss": 0.2645, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.27101898193359375, |
| "step": 600, |
| "valid_targets_mean": 4788.5, |
| "valid_targets_min": 1713 |
| }, |
| { |
| "epoch": 0.9742351046698873, |
| "grad_norm": 0.4992312775195265, |
| "learning_rate": 3.981608856217049e-05, |
| "loss": 0.2626, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.23076659440994263, |
| "step": 605, |
| "valid_targets_mean": 4342.8, |
| "valid_targets_min": 1263 |
| }, |
| { |
| "epoch": 0.9822866344605475, |
| "grad_norm": 0.5353175524067539, |
| "learning_rate": 3.980506322094761e-05, |
| "loss": 0.2441, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2311723828315735, |
| "step": 610, |
| "valid_targets_mean": 4810.8, |
| "valid_targets_min": 570 |
| }, |
| { |
| "epoch": 0.9903381642512077, |
| "grad_norm": 0.6330855933495575, |
| "learning_rate": 3.979371856590762e-05, |
| "loss": 0.2715, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.28571778535842896, |
| "step": 615, |
| "valid_targets_mean": 4376.3, |
| "valid_targets_min": 2240 |
| }, |
| { |
| "epoch": 0.998389694041868, |
| "grad_norm": 0.5397840170469355, |
| "learning_rate": 3.978205477995856e-05, |
| "loss": 0.2662, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.24998024106025696, |
| "step": 620, |
| "valid_targets_mean": 4034.1, |
| "valid_targets_min": 1638 |
| }, |
| { |
| "epoch": 1.0064412238325282, |
| "grad_norm": 0.5507361899409122, |
| "learning_rate": 3.9770072051153754e-05, |
| "loss": 0.2544, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.252638041973114, |
| "step": 625, |
| "valid_targets_mean": 4238.3, |
| "valid_targets_min": 1021 |
| }, |
| { |
| "epoch": 1.0144927536231885, |
| "grad_norm": 0.5602531648929935, |
| "learning_rate": 3.9757770572688786e-05, |
| "loss": 0.2414, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.23810608685016632, |
| "step": 630, |
| "valid_targets_mean": 3836.5, |
| "valid_targets_min": 1569 |
| }, |
| { |
| "epoch": 1.0225442834138487, |
| "grad_norm": 0.5389828337838378, |
| "learning_rate": 3.9745150542898405e-05, |
| "loss": 0.2349, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.20239052176475525, |
| "step": 635, |
| "valid_targets_mean": 3506.9, |
| "valid_targets_min": 1175 |
| }, |
| { |
| "epoch": 1.0305958132045088, |
| "grad_norm": 0.5471627213957879, |
| "learning_rate": 3.97322121652533e-05, |
| "loss": 0.2466, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.23700180649757385, |
| "step": 640, |
| "valid_targets_mean": 4167.8, |
| "valid_targets_min": 380 |
| }, |
| { |
| "epoch": 1.038647342995169, |
| "grad_norm": 0.5304941534687796, |
| "learning_rate": 3.971895564835683e-05, |
| "loss": 0.2265, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.21442700922489166, |
| "step": 645, |
| "valid_targets_mean": 4103.1, |
| "valid_targets_min": 1034 |
| }, |
| { |
| "epoch": 1.0466988727858293, |
| "grad_norm": 0.5123253191465812, |
| "learning_rate": 3.970538120594166e-05, |
| "loss": 0.2191, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.22118300199508667, |
| "step": 650, |
| "valid_targets_mean": 4709.2, |
| "valid_targets_min": 1225 |
| }, |
| { |
| "epoch": 1.0547504025764896, |
| "grad_norm": 0.5144164225120834, |
| "learning_rate": 3.9691489056866324e-05, |
| "loss": 0.2423, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2365712821483612, |
| "step": 655, |
| "valid_targets_mean": 4630.8, |
| "valid_targets_min": 862 |
| }, |
| { |
| "epoch": 1.0628019323671498, |
| "grad_norm": 0.6461651582671288, |
| "learning_rate": 3.9677279425111684e-05, |
| "loss": 0.2439, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.24799947440624237, |
| "step": 660, |
| "valid_targets_mean": 4166.1, |
| "valid_targets_min": 1309 |
| }, |
| { |
| "epoch": 1.07085346215781, |
| "grad_norm": 0.5024189972964114, |
| "learning_rate": 3.9662752539777314e-05, |
| "loss": 0.2445, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.24382641911506653, |
| "step": 665, |
| "valid_targets_mean": 5176.7, |
| "valid_targets_min": 521 |
| }, |
| { |
| "epoch": 1.0789049919484701, |
| "grad_norm": 0.9391803347175582, |
| "learning_rate": 3.9647908635077845e-05, |
| "loss": 0.2615, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.277189165353775, |
| "step": 670, |
| "valid_targets_mean": 4315.8, |
| "valid_targets_min": 703 |
| }, |
| { |
| "epoch": 1.0869565217391304, |
| "grad_norm": 0.4882832004268316, |
| "learning_rate": 3.963274795033913e-05, |
| "loss": 0.245, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.24163475632667542, |
| "step": 675, |
| "valid_targets_mean": 5134.3, |
| "valid_targets_min": 710 |
| }, |
| { |
| "epoch": 1.0950080515297906, |
| "grad_norm": 0.6167872996926629, |
| "learning_rate": 3.9617270729994436e-05, |
| "loss": 0.2482, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.24507923424243927, |
| "step": 680, |
| "valid_targets_mean": 4063.7, |
| "valid_targets_min": 1058 |
| }, |
| { |
| "epoch": 1.103059581320451, |
| "grad_norm": 0.6232571737295083, |
| "learning_rate": 3.960147722358046e-05, |
| "loss": 0.2504, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.23517994582653046, |
| "step": 685, |
| "valid_targets_mean": 3350.7, |
| "valid_targets_min": 736 |
| }, |
| { |
| "epoch": 1.1111111111111112, |
| "grad_norm": 0.5205417579091651, |
| "learning_rate": 3.958536768573335e-05, |
| "loss": 0.245, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.25678330659866333, |
| "step": 690, |
| "valid_targets_mean": 4774.0, |
| "valid_targets_min": 1681 |
| }, |
| { |
| "epoch": 1.1191626409017714, |
| "grad_norm": 0.5540696760333587, |
| "learning_rate": 3.956894237618456e-05, |
| "loss": 0.2455, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2578514814376831, |
| "step": 695, |
| "valid_targets_mean": 3721.6, |
| "valid_targets_min": 543 |
| }, |
| { |
| "epoch": 1.1272141706924317, |
| "grad_norm": 0.5703134217215095, |
| "learning_rate": 3.955220155975669e-05, |
| "loss": 0.2465, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.27087417244911194, |
| "step": 700, |
| "valid_targets_mean": 4647.0, |
| "valid_targets_min": 1837 |
| }, |
| { |
| "epoch": 1.1352657004830917, |
| "grad_norm": 0.5281006763450222, |
| "learning_rate": 3.9535145506359206e-05, |
| "loss": 0.2431, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2202616184949875, |
| "step": 705, |
| "valid_targets_mean": 4643.4, |
| "valid_targets_min": 548 |
| }, |
| { |
| "epoch": 1.143317230273752, |
| "grad_norm": 0.4639603789841704, |
| "learning_rate": 3.951777449098408e-05, |
| "loss": 0.2377, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2633700966835022, |
| "step": 710, |
| "valid_targets_mean": 5459.8, |
| "valid_targets_min": 2264 |
| }, |
| { |
| "epoch": 1.1513687600644122, |
| "grad_norm": 0.469137374700247, |
| "learning_rate": 3.9500088793701387e-05, |
| "loss": 0.2415, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.19833050668239594, |
| "step": 715, |
| "valid_targets_mean": 4964.5, |
| "valid_targets_min": 2160 |
| }, |
| { |
| "epoch": 1.1594202898550725, |
| "grad_norm": 0.4905202669992282, |
| "learning_rate": 3.948208869965473e-05, |
| "loss": 0.2388, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.24042034149169922, |
| "step": 720, |
| "valid_targets_mean": 4569.5, |
| "valid_targets_min": 776 |
| }, |
| { |
| "epoch": 1.1674718196457328, |
| "grad_norm": 0.5271378070562325, |
| "learning_rate": 3.946377449905672e-05, |
| "loss": 0.2332, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.24370059370994568, |
| "step": 725, |
| "valid_targets_mean": 4409.8, |
| "valid_targets_min": 1705 |
| }, |
| { |
| "epoch": 1.1755233494363928, |
| "grad_norm": 0.48816490928722517, |
| "learning_rate": 3.9445146487184226e-05, |
| "loss": 0.2268, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.23395568132400513, |
| "step": 730, |
| "valid_targets_mean": 4742.6, |
| "valid_targets_min": 1740 |
| }, |
| { |
| "epoch": 1.183574879227053, |
| "grad_norm": 0.508703086089454, |
| "learning_rate": 3.942620496437366e-05, |
| "loss": 0.2398, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2787438929080963, |
| "step": 735, |
| "valid_targets_mean": 5090.3, |
| "valid_targets_min": 720 |
| }, |
| { |
| "epoch": 1.1916264090177133, |
| "grad_norm": 0.5274435230388868, |
| "learning_rate": 3.940695023601612e-05, |
| "loss": 0.2434, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.23083099722862244, |
| "step": 740, |
| "valid_targets_mean": 4942.7, |
| "valid_targets_min": 1747 |
| }, |
| { |
| "epoch": 1.1996779388083736, |
| "grad_norm": 0.48187263788077117, |
| "learning_rate": 3.938738261255247e-05, |
| "loss": 0.2322, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.21453389525413513, |
| "step": 745, |
| "valid_targets_mean": 4564.6, |
| "valid_targets_min": 1401 |
| }, |
| { |
| "epoch": 1.2077294685990339, |
| "grad_norm": 0.7495259641509139, |
| "learning_rate": 3.9367502409468315e-05, |
| "loss": 0.2489, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.21770915389060974, |
| "step": 750, |
| "valid_targets_mean": 4150.0, |
| "valid_targets_min": 848 |
| }, |
| { |
| "epoch": 1.2157809983896941, |
| "grad_norm": 0.513119058591006, |
| "learning_rate": 3.934730994728893e-05, |
| "loss": 0.2449, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2321898341178894, |
| "step": 755, |
| "valid_targets_mean": 3742.6, |
| "valid_targets_min": 1247 |
| }, |
| { |
| "epoch": 1.2238325281803544, |
| "grad_norm": 0.5088681345844467, |
| "learning_rate": 3.932680555157413e-05, |
| "loss": 0.2362, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2543366551399231, |
| "step": 760, |
| "valid_targets_mean": 4571.6, |
| "valid_targets_min": 745 |
| }, |
| { |
| "epoch": 1.2318840579710144, |
| "grad_norm": 0.5212074947311489, |
| "learning_rate": 3.9305989552912936e-05, |
| "loss": 0.2311, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.24161793291568756, |
| "step": 765, |
| "valid_targets_mean": 4267.8, |
| "valid_targets_min": 2059 |
| }, |
| { |
| "epoch": 1.2399355877616747, |
| "grad_norm": 0.6379814909420424, |
| "learning_rate": 3.928486228691831e-05, |
| "loss": 0.2377, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.25767624378204346, |
| "step": 770, |
| "valid_targets_mean": 4049.4, |
| "valid_targets_min": 1596 |
| }, |
| { |
| "epoch": 1.247987117552335, |
| "grad_norm": 0.5355001588932113, |
| "learning_rate": 3.926342409422175e-05, |
| "loss": 0.2504, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.23288603127002716, |
| "step": 775, |
| "valid_targets_mean": 3844.3, |
| "valid_targets_min": 823 |
| }, |
| { |
| "epoch": 1.2560386473429952, |
| "grad_norm": 0.5212100454034752, |
| "learning_rate": 3.924167532046773e-05, |
| "loss": 0.2554, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.24769359827041626, |
| "step": 780, |
| "valid_targets_mean": 4338.0, |
| "valid_targets_min": 1507 |
| }, |
| { |
| "epoch": 1.2640901771336555, |
| "grad_norm": 0.5991969877035959, |
| "learning_rate": 3.9219616316308215e-05, |
| "loss": 0.2391, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.23935574293136597, |
| "step": 785, |
| "valid_targets_mean": 4815.1, |
| "valid_targets_min": 1755 |
| }, |
| { |
| "epoch": 1.2721417069243155, |
| "grad_norm": 0.5852623692737184, |
| "learning_rate": 3.919724743739694e-05, |
| "loss": 0.2462, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2316393107175827, |
| "step": 790, |
| "valid_targets_mean": 4748.1, |
| "valid_targets_min": 1010 |
| }, |
| { |
| "epoch": 1.2801932367149758, |
| "grad_norm": 0.5400353515222852, |
| "learning_rate": 3.91745690443837e-05, |
| "loss": 0.2372, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.24360281229019165, |
| "step": 795, |
| "valid_targets_mean": 4905.1, |
| "valid_targets_min": 1697 |
| }, |
| { |
| "epoch": 1.288244766505636, |
| "grad_norm": 0.5161454582163929, |
| "learning_rate": 3.915158150290855e-05, |
| "loss": 0.2297, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2185833752155304, |
| "step": 800, |
| "valid_targets_mean": 4708.6, |
| "valid_targets_min": 1210 |
| }, |
| { |
| "epoch": 1.2962962962962963, |
| "grad_norm": 0.5421912889681342, |
| "learning_rate": 3.912828518359588e-05, |
| "loss": 0.2361, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.24869637191295624, |
| "step": 805, |
| "valid_targets_mean": 5677.7, |
| "valid_targets_min": 2666 |
| }, |
| { |
| "epoch": 1.3043478260869565, |
| "grad_norm": 0.5587294675034205, |
| "learning_rate": 3.910468046204846e-05, |
| "loss": 0.2255, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.240371972322464, |
| "step": 810, |
| "valid_targets_mean": 3585.4, |
| "valid_targets_min": 677 |
| }, |
| { |
| "epoch": 1.3123993558776168, |
| "grad_norm": 0.5803843717029648, |
| "learning_rate": 3.908076771884139e-05, |
| "loss": 0.2386, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.23448866605758667, |
| "step": 815, |
| "valid_targets_mean": 4076.1, |
| "valid_targets_min": 1353 |
| }, |
| { |
| "epoch": 1.320450885668277, |
| "grad_norm": 0.6615696992092541, |
| "learning_rate": 3.905654733951595e-05, |
| "loss": 0.2366, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.24138154089450836, |
| "step": 820, |
| "valid_targets_mean": 3298.6, |
| "valid_targets_min": 713 |
| }, |
| { |
| "epoch": 1.3285024154589373, |
| "grad_norm": 0.48424332287717764, |
| "learning_rate": 3.9032019714573366e-05, |
| "loss": 0.2274, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2244749665260315, |
| "step": 825, |
| "valid_targets_mean": 4370.7, |
| "valid_targets_min": 1299 |
| }, |
| { |
| "epoch": 1.3365539452495974, |
| "grad_norm": 0.5116233310783836, |
| "learning_rate": 3.9007185239468554e-05, |
| "loss": 0.2523, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2363509237766266, |
| "step": 830, |
| "valid_targets_mean": 4251.2, |
| "valid_targets_min": 1057 |
| }, |
| { |
| "epoch": 1.3446054750402576, |
| "grad_norm": 0.5726251093172268, |
| "learning_rate": 3.8982044314603725e-05, |
| "loss": 0.2382, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.25756919384002686, |
| "step": 835, |
| "valid_targets_mean": 4103.4, |
| "valid_targets_min": 818 |
| }, |
| { |
| "epoch": 1.3526570048309179, |
| "grad_norm": 0.5399551753973628, |
| "learning_rate": 3.8956597345321927e-05, |
| "loss": 0.2403, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.23214933276176453, |
| "step": 840, |
| "valid_targets_mean": 3571.1, |
| "valid_targets_min": 997 |
| }, |
| { |
| "epoch": 1.3607085346215781, |
| "grad_norm": 0.5153551957359142, |
| "learning_rate": 3.893084474190051e-05, |
| "loss": 0.2456, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.24375241994857788, |
| "step": 845, |
| "valid_targets_mean": 4158.2, |
| "valid_targets_min": 952 |
| }, |
| { |
| "epoch": 1.3687600644122382, |
| "grad_norm": 0.48984930240931984, |
| "learning_rate": 3.890478691954452e-05, |
| "loss": 0.2416, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2558751702308655, |
| "step": 850, |
| "valid_targets_mean": 4738.9, |
| "valid_targets_min": 656 |
| }, |
| { |
| "epoch": 1.3768115942028984, |
| "grad_norm": 0.5179307198966028, |
| "learning_rate": 3.8878424298379996e-05, |
| "loss": 0.2445, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.22707146406173706, |
| "step": 855, |
| "valid_targets_mean": 4074.3, |
| "valid_targets_min": 1101 |
| }, |
| { |
| "epoch": 1.3848631239935587, |
| "grad_norm": 0.6293401724856043, |
| "learning_rate": 3.885175730344718e-05, |
| "loss": 0.2487, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.24598611891269684, |
| "step": 860, |
| "valid_targets_mean": 4331.4, |
| "valid_targets_min": 1429 |
| }, |
| { |
| "epoch": 1.392914653784219, |
| "grad_norm": 0.5429776165767362, |
| "learning_rate": 3.882478636469372e-05, |
| "loss": 0.2381, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.25051477551460266, |
| "step": 865, |
| "valid_targets_mean": 4375.6, |
| "valid_targets_min": 1616 |
| }, |
| { |
| "epoch": 1.4009661835748792, |
| "grad_norm": 0.5668228228210831, |
| "learning_rate": 3.879751191696766e-05, |
| "loss": 0.2554, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2403651624917984, |
| "step": 870, |
| "valid_targets_mean": 3847.9, |
| "valid_targets_min": 656 |
| }, |
| { |
| "epoch": 1.4090177133655395, |
| "grad_norm": 0.4916125568229993, |
| "learning_rate": 3.8769934400010506e-05, |
| "loss": 0.2376, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.23794618248939514, |
| "step": 875, |
| "valid_targets_mean": 4820.1, |
| "valid_targets_min": 284 |
| }, |
| { |
| "epoch": 1.4170692431561998, |
| "grad_norm": 0.48401044866312015, |
| "learning_rate": 3.8742054258450085e-05, |
| "loss": 0.2435, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.25705933570861816, |
| "step": 880, |
| "valid_targets_mean": 4531.7, |
| "valid_targets_min": 1442 |
| }, |
| { |
| "epoch": 1.42512077294686, |
| "grad_norm": 0.5305875988771065, |
| "learning_rate": 3.871387194179338e-05, |
| "loss": 0.2428, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.20840579271316528, |
| "step": 885, |
| "valid_targets_mean": 4164.4, |
| "valid_targets_min": 2047 |
| }, |
| { |
| "epoch": 1.43317230273752, |
| "grad_norm": 0.5592288973797526, |
| "learning_rate": 3.868538790441931e-05, |
| "loss": 0.2344, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.24872620403766632, |
| "step": 890, |
| "valid_targets_mean": 4424.3, |
| "valid_targets_min": 1035 |
| }, |
| { |
| "epoch": 1.4412238325281803, |
| "grad_norm": 0.46555566538841864, |
| "learning_rate": 3.865660260557138e-05, |
| "loss": 0.2324, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.21978382766246796, |
| "step": 895, |
| "valid_targets_mean": 4317.1, |
| "valid_targets_min": 2278 |
| }, |
| { |
| "epoch": 1.4492753623188406, |
| "grad_norm": 0.5185263723338586, |
| "learning_rate": 3.8627516509350286e-05, |
| "loss": 0.2379, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2476550042629242, |
| "step": 900, |
| "valid_targets_mean": 3795.6, |
| "valid_targets_min": 1701 |
| }, |
| { |
| "epoch": 1.4573268921095008, |
| "grad_norm": 0.5514262995566678, |
| "learning_rate": 3.859813008470644e-05, |
| "loss": 0.2488, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.24102932214736938, |
| "step": 905, |
| "valid_targets_mean": 3926.9, |
| "valid_targets_min": 1209 |
| }, |
| { |
| "epoch": 1.465378421900161, |
| "grad_norm": 0.4713138062680591, |
| "learning_rate": 3.856844380543239e-05, |
| "loss": 0.2316, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.23857206106185913, |
| "step": 910, |
| "valid_targets_mean": 4829.1, |
| "valid_targets_min": 1822 |
| }, |
| { |
| "epoch": 1.4734299516908211, |
| "grad_norm": 0.46745151947518565, |
| "learning_rate": 3.8538458150155186e-05, |
| "loss": 0.2337, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.21306023001670837, |
| "step": 915, |
| "valid_targets_mean": 5670.3, |
| "valid_targets_min": 1223 |
| }, |
| { |
| "epoch": 1.4814814814814814, |
| "grad_norm": 0.5399378076969245, |
| "learning_rate": 3.850817360232869e-05, |
| "loss": 0.2228, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.23806512355804443, |
| "step": 920, |
| "valid_targets_mean": 5083.9, |
| "valid_targets_min": 2183 |
| }, |
| { |
| "epoch": 1.4895330112721417, |
| "grad_norm": 0.6208023209932018, |
| "learning_rate": 3.8477590650225735e-05, |
| "loss": 0.245, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.26910722255706787, |
| "step": 925, |
| "valid_targets_mean": 4777.4, |
| "valid_targets_min": 1044 |
| }, |
| { |
| "epoch": 1.497584541062802, |
| "grad_norm": 0.5213298121096795, |
| "learning_rate": 3.8446709786930305e-05, |
| "loss": 0.2341, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.24538570642471313, |
| "step": 930, |
| "valid_targets_mean": 4161.3, |
| "valid_targets_min": 1399 |
| }, |
| { |
| "epoch": 1.5056360708534622, |
| "grad_norm": 0.5236314811464815, |
| "learning_rate": 3.841553151032953e-05, |
| "loss": 0.2439, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.23516438901424408, |
| "step": 935, |
| "valid_targets_mean": 5095.7, |
| "valid_targets_min": 1027 |
| }, |
| { |
| "epoch": 1.5136876006441224, |
| "grad_norm": 0.44460197327326756, |
| "learning_rate": 3.8384056323105695e-05, |
| "loss": 0.2441, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.23193703591823578, |
| "step": 940, |
| "valid_targets_mean": 5266.9, |
| "valid_targets_min": 1863 |
| }, |
| { |
| "epoch": 1.5217391304347827, |
| "grad_norm": 0.6021732933768308, |
| "learning_rate": 3.835228473272814e-05, |
| "loss": 0.2202, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2238101363182068, |
| "step": 945, |
| "valid_targets_mean": 4458.2, |
| "valid_targets_min": 751 |
| }, |
| { |
| "epoch": 1.529790660225443, |
| "grad_norm": 0.5548844712586349, |
| "learning_rate": 3.832021725144506e-05, |
| "loss": 0.2345, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2418593019247055, |
| "step": 950, |
| "valid_targets_mean": 4469.2, |
| "valid_targets_min": 1717 |
| }, |
| { |
| "epoch": 1.537842190016103, |
| "grad_norm": 0.46334027352601115, |
| "learning_rate": 3.828785439627523e-05, |
| "loss": 0.2517, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.24094292521476746, |
| "step": 955, |
| "valid_targets_mean": 5478.1, |
| "valid_targets_min": 1745 |
| }, |
| { |
| "epoch": 1.5458937198067633, |
| "grad_norm": 0.5074800565232367, |
| "learning_rate": 3.825519668899972e-05, |
| "loss": 0.2418, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.25097841024398804, |
| "step": 960, |
| "valid_targets_mean": 5015.4, |
| "valid_targets_min": 1369 |
| }, |
| { |
| "epoch": 1.5539452495974235, |
| "grad_norm": 0.5212941157766611, |
| "learning_rate": 3.8222244656153444e-05, |
| "loss": 0.2467, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2439125031232834, |
| "step": 965, |
| "valid_targets_mean": 4481.0, |
| "valid_targets_min": 973 |
| }, |
| { |
| "epoch": 1.5619967793880838, |
| "grad_norm": 0.5111240156665687, |
| "learning_rate": 3.818899882901666e-05, |
| "loss": 0.2359, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.22901548445224762, |
| "step": 970, |
| "valid_targets_mean": 4092.8, |
| "valid_targets_min": 1591 |
| }, |
| { |
| "epoch": 1.5700483091787438, |
| "grad_norm": 0.512770693439504, |
| "learning_rate": 3.815545974360644e-05, |
| "loss": 0.2231, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.23196808993816376, |
| "step": 975, |
| "valid_targets_mean": 4075.3, |
| "valid_targets_min": 1956 |
| }, |
| { |
| "epoch": 1.578099838969404, |
| "grad_norm": 0.5042161332697872, |
| "learning_rate": 3.812162794066802e-05, |
| "loss": 0.236, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.25058242678642273, |
| "step": 980, |
| "valid_targets_mean": 4614.4, |
| "valid_targets_min": 339 |
| }, |
| { |
| "epoch": 1.5861513687600644, |
| "grad_norm": 0.4846950795943882, |
| "learning_rate": 3.8087503965666057e-05, |
| "loss": 0.2359, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2251492440700531, |
| "step": 985, |
| "valid_targets_mean": 4310.9, |
| "valid_targets_min": 1978 |
| }, |
| { |
| "epoch": 1.5942028985507246, |
| "grad_norm": 0.49445825909902524, |
| "learning_rate": 3.805308836877586e-05, |
| "loss": 0.2419, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2309640347957611, |
| "step": 990, |
| "valid_targets_mean": 4083.0, |
| "valid_targets_min": 688 |
| }, |
| { |
| "epoch": 1.6022544283413849, |
| "grad_norm": 0.522939331982219, |
| "learning_rate": 3.80183817048745e-05, |
| "loss": 0.2301, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.23157933354377747, |
| "step": 995, |
| "valid_targets_mean": 3599.1, |
| "valid_targets_min": 358 |
| }, |
| { |
| "epoch": 1.6103059581320451, |
| "grad_norm": 0.5144792659864994, |
| "learning_rate": 3.7983384533531894e-05, |
| "loss": 0.2367, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2594456374645233, |
| "step": 1000, |
| "valid_targets_mean": 4572.1, |
| "valid_targets_min": 1116 |
| }, |
| { |
| "epoch": 1.6183574879227054, |
| "grad_norm": 0.514940069429718, |
| "learning_rate": 3.7948097419001736e-05, |
| "loss": 0.2325, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.23250789940357208, |
| "step": 1005, |
| "valid_targets_mean": 4625.0, |
| "valid_targets_min": 350 |
| }, |
| { |
| "epoch": 1.6264090177133657, |
| "grad_norm": 0.52221869816674, |
| "learning_rate": 3.7912520930212445e-05, |
| "loss": 0.2434, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.21590971946716309, |
| "step": 1010, |
| "valid_targets_mean": 4035.4, |
| "valid_targets_min": 1483 |
| }, |
| { |
| "epoch": 1.634460547504026, |
| "grad_norm": 0.42946813411877144, |
| "learning_rate": 3.7876655640757974e-05, |
| "loss": 0.2439, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.23158404231071472, |
| "step": 1015, |
| "valid_targets_mean": 5336.1, |
| "valid_targets_min": 979 |
| }, |
| { |
| "epoch": 1.642512077294686, |
| "grad_norm": 0.4983259472306404, |
| "learning_rate": 3.784050212888857e-05, |
| "loss": 0.2476, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2527810335159302, |
| "step": 1020, |
| "valid_targets_mean": 5022.8, |
| "valid_targets_min": 2939 |
| }, |
| { |
| "epoch": 1.6505636070853462, |
| "grad_norm": 0.46712880691077496, |
| "learning_rate": 3.780406097750141e-05, |
| "loss": 0.2465, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.22650480270385742, |
| "step": 1025, |
| "valid_targets_mean": 4311.5, |
| "valid_targets_min": 1275 |
| }, |
| { |
| "epoch": 1.6586151368760065, |
| "grad_norm": 0.5417140597671484, |
| "learning_rate": 3.776733277413127e-05, |
| "loss": 0.2176, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.195145845413208, |
| "step": 1030, |
| "valid_targets_mean": 4207.8, |
| "valid_targets_min": 1043 |
| }, |
| { |
| "epoch": 1.6666666666666665, |
| "grad_norm": 0.4883088038596097, |
| "learning_rate": 3.7730318110941004e-05, |
| "loss": 0.224, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.21643765270709991, |
| "step": 1035, |
| "valid_targets_mean": 4391.3, |
| "valid_targets_min": 2660 |
| }, |
| { |
| "epoch": 1.6747181964573268, |
| "grad_norm": 0.5289568127223118, |
| "learning_rate": 3.7693017584712013e-05, |
| "loss": 0.2456, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.23360106348991394, |
| "step": 1040, |
| "valid_targets_mean": 4826.2, |
| "valid_targets_min": 2011 |
| }, |
| { |
| "epoch": 1.682769726247987, |
| "grad_norm": 0.5576792989418248, |
| "learning_rate": 3.765543179683462e-05, |
| "loss": 0.2296, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.24486708641052246, |
| "step": 1045, |
| "valid_targets_mean": 3934.4, |
| "valid_targets_min": 1683 |
| }, |
| { |
| "epoch": 1.6908212560386473, |
| "grad_norm": 0.5017617827412163, |
| "learning_rate": 3.7617561353298395e-05, |
| "loss": 0.2521, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.24896810948848724, |
| "step": 1050, |
| "valid_targets_mean": 4011.8, |
| "valid_targets_min": 321 |
| }, |
| { |
| "epoch": 1.6988727858293076, |
| "grad_norm": 0.4860709875293544, |
| "learning_rate": 3.7579406864682327e-05, |
| "loss": 0.2264, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.24139925837516785, |
| "step": 1055, |
| "valid_targets_mean": 4299.9, |
| "valid_targets_min": 667 |
| }, |
| { |
| "epoch": 1.7069243156199678, |
| "grad_norm": 0.5345894675911452, |
| "learning_rate": 3.7540968946145036e-05, |
| "loss": 0.241, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2598978877067566, |
| "step": 1060, |
| "valid_targets_mean": 4928.6, |
| "valid_targets_min": 1283 |
| }, |
| { |
| "epoch": 1.714975845410628, |
| "grad_norm": 0.5465814570656329, |
| "learning_rate": 3.750224821741486e-05, |
| "loss": 0.2358, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2219647765159607, |
| "step": 1065, |
| "valid_targets_mean": 5155.9, |
| "valid_targets_min": 1303 |
| }, |
| { |
| "epoch": 1.7230273752012883, |
| "grad_norm": 0.5300553470904004, |
| "learning_rate": 3.7463245302779795e-05, |
| "loss": 0.2298, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.28267112374305725, |
| "step": 1070, |
| "valid_targets_mean": 3852.3, |
| "valid_targets_min": 599 |
| }, |
| { |
| "epoch": 1.7310789049919486, |
| "grad_norm": 0.4624218505703108, |
| "learning_rate": 3.742396083107751e-05, |
| "loss": 0.2128, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.21661648154258728, |
| "step": 1075, |
| "valid_targets_mean": 4283.7, |
| "valid_targets_min": 1147 |
| }, |
| { |
| "epoch": 1.7391304347826086, |
| "grad_norm": 0.4993979746767997, |
| "learning_rate": 3.7384395435685166e-05, |
| "loss": 0.2346, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.21909837424755096, |
| "step": 1080, |
| "valid_targets_mean": 4359.1, |
| "valid_targets_min": 2250 |
| }, |
| { |
| "epoch": 1.747181964573269, |
| "grad_norm": 0.5407067040296573, |
| "learning_rate": 3.7344549754509196e-05, |
| "loss": 0.2353, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.22699233889579773, |
| "step": 1085, |
| "valid_targets_mean": 3677.0, |
| "valid_targets_min": 892 |
| }, |
| { |
| "epoch": 1.7552334943639292, |
| "grad_norm": 0.4642737834973646, |
| "learning_rate": 3.7304424429975046e-05, |
| "loss": 0.2318, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.22292137145996094, |
| "step": 1090, |
| "valid_targets_mean": 5690.0, |
| "valid_targets_min": 782 |
| }, |
| { |
| "epoch": 1.7632850241545892, |
| "grad_norm": 0.5671519558623886, |
| "learning_rate": 3.726402010901681e-05, |
| "loss": 0.2353, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.21334418654441833, |
| "step": 1095, |
| "valid_targets_mean": 4616.9, |
| "valid_targets_min": 1898 |
| }, |
| { |
| "epoch": 1.7713365539452495, |
| "grad_norm": 0.5083634785423456, |
| "learning_rate": 3.722333744306678e-05, |
| "loss": 0.2249, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.21738044917583466, |
| "step": 1100, |
| "valid_targets_mean": 5448.9, |
| "valid_targets_min": 1726 |
| }, |
| { |
| "epoch": 1.7793880837359097, |
| "grad_norm": 0.8896163020318464, |
| "learning_rate": 3.7182377088044984e-05, |
| "loss": 0.2286, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.22921855747699738, |
| "step": 1105, |
| "valid_targets_mean": 4703.8, |
| "valid_targets_min": 1508 |
| }, |
| { |
| "epoch": 1.78743961352657, |
| "grad_norm": 0.5450639925225488, |
| "learning_rate": 3.7141139704348576e-05, |
| "loss": 0.228, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.21833300590515137, |
| "step": 1110, |
| "valid_targets_mean": 3445.8, |
| "valid_targets_min": 1099 |
| }, |
| { |
| "epoch": 1.7954911433172303, |
| "grad_norm": 0.6520638172384545, |
| "learning_rate": 3.7099625956841175e-05, |
| "loss": 0.223, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.25272321701049805, |
| "step": 1115, |
| "valid_targets_mean": 3248.3, |
| "valid_targets_min": 617 |
| }, |
| { |
| "epoch": 1.8035426731078905, |
| "grad_norm": 0.4493969588039246, |
| "learning_rate": 3.70578365148422e-05, |
| "loss": 0.2367, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.23505555093288422, |
| "step": 1120, |
| "valid_targets_mean": 5024.8, |
| "valid_targets_min": 1833 |
| }, |
| { |
| "epoch": 1.8115942028985508, |
| "grad_norm": 0.4827090106067237, |
| "learning_rate": 3.701577205211604e-05, |
| "loss": 0.2545, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2535856366157532, |
| "step": 1125, |
| "valid_targets_mean": 4428.5, |
| "valid_targets_min": 990 |
| }, |
| { |
| "epoch": 1.819645732689211, |
| "grad_norm": 0.6263613356926185, |
| "learning_rate": 3.697343324686119e-05, |
| "loss": 0.2272, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.23104625940322876, |
| "step": 1130, |
| "valid_targets_mean": 4673.7, |
| "valid_targets_min": 1449 |
| }, |
| { |
| "epoch": 1.8276972624798713, |
| "grad_norm": 0.5298323694554691, |
| "learning_rate": 3.693082078169933e-05, |
| "loss": 0.2427, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.24033012986183167, |
| "step": 1135, |
| "valid_targets_mean": 4732.1, |
| "valid_targets_min": 1605 |
| }, |
| { |
| "epoch": 1.8357487922705316, |
| "grad_norm": 0.4783853550563579, |
| "learning_rate": 3.68879353436643e-05, |
| "loss": 0.2189, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2028733789920807, |
| "step": 1140, |
| "valid_targets_mean": 4867.9, |
| "valid_targets_min": 2154 |
| }, |
| { |
| "epoch": 1.8438003220611916, |
| "grad_norm": 0.4595078299986765, |
| "learning_rate": 3.684477762419108e-05, |
| "loss": 0.2194, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.215766042470932, |
| "step": 1145, |
| "valid_targets_mean": 4522.2, |
| "valid_targets_min": 2208 |
| }, |
| { |
| "epoch": 1.8518518518518519, |
| "grad_norm": 0.5149239335560051, |
| "learning_rate": 3.6801348319104546e-05, |
| "loss": 0.2319, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2230435311794281, |
| "step": 1150, |
| "valid_targets_mean": 3680.6, |
| "valid_targets_min": 434 |
| }, |
| { |
| "epoch": 1.8599033816425121, |
| "grad_norm": 0.42919344493593076, |
| "learning_rate": 3.675764812860833e-05, |
| "loss": 0.2518, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.20287317037582397, |
| "step": 1155, |
| "valid_targets_mean": 5642.9, |
| "valid_targets_min": 2036 |
| }, |
| { |
| "epoch": 1.8679549114331722, |
| "grad_norm": 0.4884349396198345, |
| "learning_rate": 3.671367775727353e-05, |
| "loss": 0.2463, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.24478939175605774, |
| "step": 1160, |
| "valid_targets_mean": 4762.1, |
| "valid_targets_min": 775 |
| }, |
| { |
| "epoch": 1.8760064412238324, |
| "grad_norm": 0.49953971630838795, |
| "learning_rate": 3.666943791402726e-05, |
| "loss": 0.2527, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2292686104774475, |
| "step": 1165, |
| "valid_targets_mean": 4543.8, |
| "valid_targets_min": 1026 |
| }, |
| { |
| "epoch": 1.8840579710144927, |
| "grad_norm": 0.4644474561197982, |
| "learning_rate": 3.662492931214137e-05, |
| "loss": 0.2492, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2597373127937317, |
| "step": 1170, |
| "valid_targets_mean": 5243.1, |
| "valid_targets_min": 1246 |
| }, |
| { |
| "epoch": 1.892109500805153, |
| "grad_norm": 0.5180686308684069, |
| "learning_rate": 3.6580152669220784e-05, |
| "loss": 0.2365, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2606375813484192, |
| "step": 1175, |
| "valid_targets_mean": 4800.7, |
| "valid_targets_min": 2456 |
| }, |
| { |
| "epoch": 1.9001610305958132, |
| "grad_norm": 0.42092491518373576, |
| "learning_rate": 3.6535108707192053e-05, |
| "loss": 0.2175, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.22271546721458435, |
| "step": 1180, |
| "valid_targets_mean": 5251.3, |
| "valid_targets_min": 1616 |
| }, |
| { |
| "epoch": 1.9082125603864735, |
| "grad_norm": 0.5826394657065203, |
| "learning_rate": 3.648979815229167e-05, |
| "loss": 0.2372, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.20627357065677643, |
| "step": 1185, |
| "valid_targets_mean": 3834.6, |
| "valid_targets_min": 693 |
| }, |
| { |
| "epoch": 1.9162640901771337, |
| "grad_norm": 0.7082935353213954, |
| "learning_rate": 3.644422173505433e-05, |
| "loss": 0.2517, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.24815203249454498, |
| "step": 1190, |
| "valid_targets_mean": 4642.2, |
| "valid_targets_min": 338 |
| }, |
| { |
| "epoch": 1.924315619967794, |
| "grad_norm": 0.5088420525828131, |
| "learning_rate": 3.639838019030123e-05, |
| "loss": 0.2303, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.23133976757526398, |
| "step": 1195, |
| "valid_targets_mean": 4064.8, |
| "valid_targets_min": 1849 |
| }, |
| { |
| "epoch": 1.9323671497584543, |
| "grad_norm": 0.4807696052913685, |
| "learning_rate": 3.635227425712812e-05, |
| "loss": 0.2441, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.24485018849372864, |
| "step": 1200, |
| "valid_targets_mean": 5358.3, |
| "valid_targets_min": 1956 |
| }, |
| { |
| "epoch": 1.9404186795491143, |
| "grad_norm": 0.5374569252336697, |
| "learning_rate": 3.6305904678893504e-05, |
| "loss": 0.2417, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.23684567213058472, |
| "step": 1205, |
| "valid_targets_mean": 4465.9, |
| "valid_targets_min": 2036 |
| }, |
| { |
| "epoch": 1.9484702093397746, |
| "grad_norm": 0.4315082896253737, |
| "learning_rate": 3.6259272203206535e-05, |
| "loss": 0.2397, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.20846745371818542, |
| "step": 1210, |
| "valid_targets_mean": 5167.9, |
| "valid_targets_min": 1434 |
| }, |
| { |
| "epoch": 1.9565217391304348, |
| "grad_norm": 0.5262891588589963, |
| "learning_rate": 3.621237758191505e-05, |
| "loss": 0.2385, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.24596351385116577, |
| "step": 1215, |
| "valid_targets_mean": 3761.8, |
| "valid_targets_min": 1066 |
| }, |
| { |
| "epoch": 1.9645732689210949, |
| "grad_norm": 0.49628184032222405, |
| "learning_rate": 3.616522157109342e-05, |
| "loss": 0.2198, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.21257467567920685, |
| "step": 1220, |
| "valid_targets_mean": 4065.5, |
| "valid_targets_min": 1897 |
| }, |
| { |
| "epoch": 1.9726247987117551, |
| "grad_norm": 0.4787291955056688, |
| "learning_rate": 3.6117804931030324e-05, |
| "loss": 0.2457, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2495032548904419, |
| "step": 1225, |
| "valid_targets_mean": 4767.3, |
| "valid_targets_min": 930 |
| }, |
| { |
| "epoch": 1.9806763285024154, |
| "grad_norm": 0.4952065016883059, |
| "learning_rate": 3.607012842621657e-05, |
| "loss": 0.2273, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.23980122804641724, |
| "step": 1230, |
| "valid_targets_mean": 4069.4, |
| "valid_targets_min": 1260 |
| }, |
| { |
| "epoch": 1.9887278582930756, |
| "grad_norm": 0.5230866628171786, |
| "learning_rate": 3.602219282533269e-05, |
| "loss": 0.2255, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2368500828742981, |
| "step": 1235, |
| "valid_targets_mean": 4682.7, |
| "valid_targets_min": 2343 |
| }, |
| { |
| "epoch": 1.996779388083736, |
| "grad_norm": 0.5246193826991147, |
| "learning_rate": 3.597399890123659e-05, |
| "loss": 0.2329, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.21333156526088715, |
| "step": 1240, |
| "valid_targets_mean": 4692.2, |
| "valid_targets_min": 2047 |
| }, |
| { |
| "epoch": 2.004830917874396, |
| "grad_norm": 0.505863313320365, |
| "learning_rate": 3.5925547430951094e-05, |
| "loss": 0.2099, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.20909734070301056, |
| "step": 1245, |
| "valid_targets_mean": 4637.2, |
| "valid_targets_min": 989 |
| }, |
| { |
| "epoch": 2.0128824476650564, |
| "grad_norm": 0.43133643927265986, |
| "learning_rate": 3.587683919565136e-05, |
| "loss": 0.2156, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.19329163432121277, |
| "step": 1250, |
| "valid_targets_mean": 5283.4, |
| "valid_targets_min": 1835 |
| }, |
| { |
| "epoch": 2.0209339774557167, |
| "grad_norm": 0.4837745442669591, |
| "learning_rate": 3.582787498065237e-05, |
| "loss": 0.2031, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.20409853756427765, |
| "step": 1255, |
| "valid_targets_mean": 4767.1, |
| "valid_targets_min": 1074 |
| }, |
| { |
| "epoch": 2.028985507246377, |
| "grad_norm": 0.6452848255637806, |
| "learning_rate": 3.577865557539621e-05, |
| "loss": 0.1953, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1907821148633957, |
| "step": 1260, |
| "valid_targets_mean": 4763.1, |
| "valid_targets_min": 392 |
| }, |
| { |
| "epoch": 2.037037037037037, |
| "grad_norm": 0.5867010578619666, |
| "learning_rate": 3.572918177343935e-05, |
| "loss": 0.2132, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1922091245651245, |
| "step": 1265, |
| "valid_targets_mean": 4118.4, |
| "valid_targets_min": 631 |
| }, |
| { |
| "epoch": 2.0450885668276975, |
| "grad_norm": 0.48474397713094575, |
| "learning_rate": 3.567945437243987e-05, |
| "loss": 0.222, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.19150424003601074, |
| "step": 1270, |
| "valid_targets_mean": 4600.4, |
| "valid_targets_min": 1066 |
| }, |
| { |
| "epoch": 2.0531400966183573, |
| "grad_norm": 0.5113649508317663, |
| "learning_rate": 3.5629474174144564e-05, |
| "loss": 0.2242, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.253940224647522, |
| "step": 1275, |
| "valid_targets_mean": 5131.0, |
| "valid_targets_min": 2438 |
| }, |
| { |
| "epoch": 2.0611916264090175, |
| "grad_norm": 0.491663340986429, |
| "learning_rate": 3.5579241984376065e-05, |
| "loss": 0.217, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.22499999403953552, |
| "step": 1280, |
| "valid_targets_mean": 3951.9, |
| "valid_targets_min": 1010 |
| }, |
| { |
| "epoch": 2.069243156199678, |
| "grad_norm": 0.520462248826658, |
| "learning_rate": 3.5528758613019804e-05, |
| "loss": 0.2142, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.19735172390937805, |
| "step": 1285, |
| "valid_targets_mean": 3831.2, |
| "valid_targets_min": 1088 |
| }, |
| { |
| "epoch": 2.077294685990338, |
| "grad_norm": 0.5206723700369398, |
| "learning_rate": 3.547802487401097e-05, |
| "loss": 0.2294, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.23212730884552002, |
| "step": 1290, |
| "valid_targets_mean": 5061.6, |
| "valid_targets_min": 2180 |
| }, |
| { |
| "epoch": 2.0853462157809983, |
| "grad_norm": 0.577226384156968, |
| "learning_rate": 3.54270415853214e-05, |
| "loss": 0.22, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.20443934202194214, |
| "step": 1295, |
| "valid_targets_mean": 3395.8, |
| "valid_targets_min": 627 |
| }, |
| { |
| "epoch": 2.0933977455716586, |
| "grad_norm": 0.4423746810496331, |
| "learning_rate": 3.537580956894638e-05, |
| "loss": 0.225, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.21375350654125214, |
| "step": 1300, |
| "valid_targets_mean": 5160.8, |
| "valid_targets_min": 1507 |
| }, |
| { |
| "epoch": 2.101449275362319, |
| "grad_norm": 0.5548629803187833, |
| "learning_rate": 3.532432965089138e-05, |
| "loss": 0.2134, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.22949251532554626, |
| "step": 1305, |
| "valid_targets_mean": 5229.6, |
| "valid_targets_min": 2557 |
| }, |
| { |
| "epoch": 2.109500805152979, |
| "grad_norm": 0.4906711255865245, |
| "learning_rate": 3.527260266115876e-05, |
| "loss": 0.2215, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2087794542312622, |
| "step": 1310, |
| "valid_targets_mean": 5409.4, |
| "valid_targets_min": 2349 |
| }, |
| { |
| "epoch": 2.1175523349436394, |
| "grad_norm": 0.6560805934109221, |
| "learning_rate": 3.522062943373438e-05, |
| "loss": 0.195, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17596739530563354, |
| "step": 1315, |
| "valid_targets_mean": 4226.9, |
| "valid_targets_min": 1025 |
| }, |
| { |
| "epoch": 2.1256038647342996, |
| "grad_norm": 0.7107665752653891, |
| "learning_rate": 3.516841080657413e-05, |
| "loss": 0.22, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.23091405630111694, |
| "step": 1320, |
| "valid_targets_mean": 4053.8, |
| "valid_targets_min": 689 |
| }, |
| { |
| "epoch": 2.13365539452496, |
| "grad_norm": 0.5185713231757747, |
| "learning_rate": 3.511594762159046e-05, |
| "loss": 0.2269, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.20578667521476746, |
| "step": 1325, |
| "valid_targets_mean": 4018.0, |
| "valid_targets_min": 978 |
| }, |
| { |
| "epoch": 2.14170692431562, |
| "grad_norm": 0.463159581350649, |
| "learning_rate": 3.506324072463878e-05, |
| "loss": 0.2049, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1929136961698532, |
| "step": 1330, |
| "valid_targets_mean": 4945.8, |
| "valid_targets_min": 2099 |
| }, |
| { |
| "epoch": 2.14975845410628, |
| "grad_norm": 0.5447005808188629, |
| "learning_rate": 3.5010290965503826e-05, |
| "loss": 0.2194, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.23045824468135834, |
| "step": 1335, |
| "valid_targets_mean": 4698.5, |
| "valid_targets_min": 1716 |
| }, |
| { |
| "epoch": 2.1578099838969402, |
| "grad_norm": 0.4595107321034477, |
| "learning_rate": 3.495709919788597e-05, |
| "loss": 0.2076, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18875578045845032, |
| "step": 1340, |
| "valid_targets_mean": 4457.4, |
| "valid_targets_min": 755 |
| }, |
| { |
| "epoch": 2.1658615136876005, |
| "grad_norm": 0.6481051628858272, |
| "learning_rate": 3.490366627938742e-05, |
| "loss": 0.216, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.22552573680877686, |
| "step": 1345, |
| "valid_targets_mean": 4907.9, |
| "valid_targets_min": 1381 |
| }, |
| { |
| "epoch": 2.1739130434782608, |
| "grad_norm": 0.8255339190022734, |
| "learning_rate": 3.484999307149846e-05, |
| "loss": 0.2202, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.20174431800842285, |
| "step": 1350, |
| "valid_targets_mean": 3897.0, |
| "valid_targets_min": 979 |
| }, |
| { |
| "epoch": 2.181964573268921, |
| "grad_norm": 0.47550594396325907, |
| "learning_rate": 3.47960804395835e-05, |
| "loss": 0.2158, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.21997377276420593, |
| "step": 1355, |
| "valid_targets_mean": 4916.5, |
| "valid_targets_min": 990 |
| }, |
| { |
| "epoch": 2.1900161030595813, |
| "grad_norm": 0.5142914581894688, |
| "learning_rate": 3.474192925286714e-05, |
| "loss": 0.2166, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2234359234571457, |
| "step": 1360, |
| "valid_targets_mean": 4057.0, |
| "valid_targets_min": 554 |
| }, |
| { |
| "epoch": 2.1980676328502415, |
| "grad_norm": 0.5135241141747307, |
| "learning_rate": 3.468754038442017e-05, |
| "loss": 0.2079, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.21173028647899628, |
| "step": 1365, |
| "valid_targets_mean": 4122.8, |
| "valid_targets_min": 963 |
| }, |
| { |
| "epoch": 2.206119162640902, |
| "grad_norm": 0.5281981416757465, |
| "learning_rate": 3.463291471114548e-05, |
| "loss": 0.2135, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2580035328865051, |
| "step": 1370, |
| "valid_targets_mean": 4534.7, |
| "valid_targets_min": 1253 |
| }, |
| { |
| "epoch": 2.214170692431562, |
| "grad_norm": 0.546080448981762, |
| "learning_rate": 3.4578053113763936e-05, |
| "loss": 0.2185, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2357328236103058, |
| "step": 1375, |
| "valid_targets_mean": 4083.2, |
| "valid_targets_min": 1119 |
| }, |
| { |
| "epoch": 2.2222222222222223, |
| "grad_norm": 0.43510725221723323, |
| "learning_rate": 3.452295647680014e-05, |
| "loss": 0.2108, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.210770383477211, |
| "step": 1380, |
| "valid_targets_mean": 5021.1, |
| "valid_targets_min": 1913 |
| }, |
| { |
| "epoch": 2.2302737520128826, |
| "grad_norm": 0.45576706352160945, |
| "learning_rate": 3.4467625688568245e-05, |
| "loss": 0.21, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.20456649363040924, |
| "step": 1385, |
| "valid_targets_mean": 4813.6, |
| "valid_targets_min": 1879 |
| }, |
| { |
| "epoch": 2.238325281803543, |
| "grad_norm": 0.4605011820162796, |
| "learning_rate": 3.4412061641157546e-05, |
| "loss": 0.2026, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1862925887107849, |
| "step": 1390, |
| "valid_targets_mean": 5375.2, |
| "valid_targets_min": 1405 |
| }, |
| { |
| "epoch": 2.246376811594203, |
| "grad_norm": 0.5067717085593049, |
| "learning_rate": 3.435626523041815e-05, |
| "loss": 0.2132, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.20806747674942017, |
| "step": 1395, |
| "valid_targets_mean": 4125.7, |
| "valid_targets_min": 2104 |
| }, |
| { |
| "epoch": 2.2544283413848634, |
| "grad_norm": 0.503211076543084, |
| "learning_rate": 3.430023735594653e-05, |
| "loss": 0.2163, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.23167727887630463, |
| "step": 1400, |
| "valid_targets_mean": 4897.6, |
| "valid_targets_min": 344 |
| }, |
| { |
| "epoch": 2.262479871175523, |
| "grad_norm": 0.5252844399823857, |
| "learning_rate": 3.4243978921071005e-05, |
| "loss": 0.2117, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18407735228538513, |
| "step": 1405, |
| "valid_targets_mean": 4546.8, |
| "valid_targets_min": 1908 |
| }, |
| { |
| "epoch": 2.2705314009661834, |
| "grad_norm": 0.5703046217142366, |
| "learning_rate": 3.418749083283719e-05, |
| "loss": 0.223, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.23428402841091156, |
| "step": 1410, |
| "valid_targets_mean": 4894.1, |
| "valid_targets_min": 1720 |
| }, |
| { |
| "epoch": 2.2785829307568437, |
| "grad_norm": 0.45360806117795466, |
| "learning_rate": 3.413077400199334e-05, |
| "loss": 0.1978, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16744893789291382, |
| "step": 1415, |
| "valid_targets_mean": 4128.2, |
| "valid_targets_min": 1177 |
| }, |
| { |
| "epoch": 2.286634460547504, |
| "grad_norm": 0.48066382062291113, |
| "learning_rate": 3.407382934297571e-05, |
| "loss": 0.2096, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.21223318576812744, |
| "step": 1420, |
| "valid_targets_mean": 4697.8, |
| "valid_targets_min": 1982 |
| }, |
| { |
| "epoch": 2.2946859903381642, |
| "grad_norm": 0.4623146781727566, |
| "learning_rate": 3.4016657773893785e-05, |
| "loss": 0.1946, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.186685249209404, |
| "step": 1425, |
| "valid_targets_mean": 5018.8, |
| "valid_targets_min": 1843 |
| }, |
| { |
| "epoch": 2.3027375201288245, |
| "grad_norm": 0.5051350867881649, |
| "learning_rate": 3.3959260216515495e-05, |
| "loss": 0.2309, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1981533169746399, |
| "step": 1430, |
| "valid_targets_mean": 4461.0, |
| "valid_targets_min": 1264 |
| }, |
| { |
| "epoch": 2.3107890499194848, |
| "grad_norm": 0.547928503478585, |
| "learning_rate": 3.3901637596252325e-05, |
| "loss": 0.2059, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.20269712805747986, |
| "step": 1435, |
| "valid_targets_mean": 4606.9, |
| "valid_targets_min": 216 |
| }, |
| { |
| "epoch": 2.318840579710145, |
| "grad_norm": 0.5050671980985264, |
| "learning_rate": 3.384379084214443e-05, |
| "loss": 0.2157, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.21335461735725403, |
| "step": 1440, |
| "valid_targets_mean": 3892.7, |
| "valid_targets_min": 1209 |
| }, |
| { |
| "epoch": 2.3268921095008053, |
| "grad_norm": 0.48909304735454484, |
| "learning_rate": 3.378572088684562e-05, |
| "loss": 0.2037, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.19523759186267853, |
| "step": 1445, |
| "valid_targets_mean": 4354.8, |
| "valid_targets_min": 1308 |
| }, |
| { |
| "epoch": 2.3349436392914655, |
| "grad_norm": 0.6388146830801954, |
| "learning_rate": 3.372742866660836e-05, |
| "loss": 0.2178, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.198106050491333, |
| "step": 1450, |
| "valid_targets_mean": 4365.9, |
| "valid_targets_min": 713 |
| }, |
| { |
| "epoch": 2.342995169082126, |
| "grad_norm": 0.5410396103360308, |
| "learning_rate": 3.3668915121268636e-05, |
| "loss": 0.212, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.23412463068962097, |
| "step": 1455, |
| "valid_targets_mean": 4374.0, |
| "valid_targets_min": 547 |
| }, |
| { |
| "epoch": 2.3510466988727856, |
| "grad_norm": 0.5291219901130383, |
| "learning_rate": 3.361018119423085e-05, |
| "loss": 0.2084, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2332005500793457, |
| "step": 1460, |
| "valid_targets_mean": 3958.9, |
| "valid_targets_min": 1381 |
| }, |
| { |
| "epoch": 2.359098228663446, |
| "grad_norm": 0.5100995870174685, |
| "learning_rate": 3.3551227832452555e-05, |
| "loss": 0.2113, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2195730209350586, |
| "step": 1465, |
| "valid_targets_mean": 4228.3, |
| "valid_targets_min": 2352 |
| }, |
| { |
| "epoch": 2.367149758454106, |
| "grad_norm": 0.5322099118621038, |
| "learning_rate": 3.3492055986429235e-05, |
| "loss": 0.2227, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.22615352272987366, |
| "step": 1470, |
| "valid_targets_mean": 4539.8, |
| "valid_targets_min": 296 |
| }, |
| { |
| "epoch": 2.3752012882447664, |
| "grad_norm": 0.4656836442072764, |
| "learning_rate": 3.3432666610178936e-05, |
| "loss": 0.2039, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17955255508422852, |
| "step": 1475, |
| "valid_targets_mean": 4149.8, |
| "valid_targets_min": 1631 |
| }, |
| { |
| "epoch": 2.3832528180354267, |
| "grad_norm": 0.5493172940293227, |
| "learning_rate": 3.3373060661226944e-05, |
| "loss": 0.2078, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.23940381407737732, |
| "step": 1480, |
| "valid_targets_mean": 4181.2, |
| "valid_targets_min": 2011 |
| }, |
| { |
| "epoch": 2.391304347826087, |
| "grad_norm": 0.49597904545260957, |
| "learning_rate": 3.331323910059027e-05, |
| "loss": 0.222, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.24300578236579895, |
| "step": 1485, |
| "valid_targets_mean": 3967.4, |
| "valid_targets_min": 677 |
| }, |
| { |
| "epoch": 2.399355877616747, |
| "grad_norm": 0.5003561031279338, |
| "learning_rate": 3.3253202892762244e-05, |
| "loss": 0.2088, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1889512538909912, |
| "step": 1490, |
| "valid_targets_mean": 4254.9, |
| "valid_targets_min": 1570 |
| }, |
| { |
| "epoch": 2.4074074074074074, |
| "grad_norm": 0.4683723297524737, |
| "learning_rate": 3.319295300569686e-05, |
| "loss": 0.2176, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.22197048366069794, |
| "step": 1495, |
| "valid_targets_mean": 5005.4, |
| "valid_targets_min": 857 |
| }, |
| { |
| "epoch": 2.4154589371980677, |
| "grad_norm": 0.5071114785034765, |
| "learning_rate": 3.3132490410793294e-05, |
| "loss": 0.2086, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.20913785696029663, |
| "step": 1500, |
| "valid_targets_mean": 4472.4, |
| "valid_targets_min": 1073 |
| }, |
| { |
| "epoch": 2.423510466988728, |
| "grad_norm": 0.4572009276147089, |
| "learning_rate": 3.3071816082880115e-05, |
| "loss": 0.2038, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.19436806440353394, |
| "step": 1505, |
| "valid_targets_mean": 4905.2, |
| "valid_targets_min": 1404 |
| }, |
| { |
| "epoch": 2.4315619967793882, |
| "grad_norm": 0.5338897691126591, |
| "learning_rate": 3.3010931000199674e-05, |
| "loss": 0.2173, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.22107122838497162, |
| "step": 1510, |
| "valid_targets_mean": 4076.6, |
| "valid_targets_min": 1904 |
| }, |
| { |
| "epoch": 2.4396135265700485, |
| "grad_norm": 0.49724905678619213, |
| "learning_rate": 3.2949836144392256e-05, |
| "loss": 0.2266, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.22516636550426483, |
| "step": 1515, |
| "valid_targets_mean": 5009.3, |
| "valid_targets_min": 1353 |
| }, |
| { |
| "epoch": 2.4476650563607087, |
| "grad_norm": 0.5108239733431804, |
| "learning_rate": 3.28885325004803e-05, |
| "loss": 0.2163, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.23558905720710754, |
| "step": 1520, |
| "valid_targets_mean": 4774.4, |
| "valid_targets_min": 1731 |
| }, |
| { |
| "epoch": 2.455716586151369, |
| "grad_norm": 0.4908585219445986, |
| "learning_rate": 3.282702105685251e-05, |
| "loss": 0.2224, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.22913925349712372, |
| "step": 1525, |
| "valid_targets_mean": 5611.8, |
| "valid_targets_min": 2104 |
| }, |
| { |
| "epoch": 2.463768115942029, |
| "grad_norm": 0.4523927665088012, |
| "learning_rate": 3.2765302805247885e-05, |
| "loss": 0.2063, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.20795124769210815, |
| "step": 1530, |
| "valid_targets_mean": 4889.2, |
| "valid_targets_min": 2184 |
| }, |
| { |
| "epoch": 2.471819645732689, |
| "grad_norm": 0.5485354909981668, |
| "learning_rate": 3.270337874073977e-05, |
| "loss": 0.217, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2317976951599121, |
| "step": 1535, |
| "valid_targets_mean": 5319.1, |
| "valid_targets_min": 1932 |
| }, |
| { |
| "epoch": 2.4798711755233493, |
| "grad_norm": 0.5061836838324374, |
| "learning_rate": 3.264124986171981e-05, |
| "loss": 0.2273, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.25826138257980347, |
| "step": 1540, |
| "valid_targets_mean": 4537.9, |
| "valid_targets_min": 453 |
| }, |
| { |
| "epoch": 2.4879227053140096, |
| "grad_norm": 0.47633311927326305, |
| "learning_rate": 3.2578917169881816e-05, |
| "loss": 0.2185, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.22371219098567963, |
| "step": 1545, |
| "valid_targets_mean": 4426.5, |
| "valid_targets_min": 1435 |
| }, |
| { |
| "epoch": 2.49597423510467, |
| "grad_norm": 0.528382297311333, |
| "learning_rate": 3.2516381670205665e-05, |
| "loss": 0.2309, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.22219571471214294, |
| "step": 1550, |
| "valid_targets_mean": 4377.4, |
| "valid_targets_min": 812 |
| }, |
| { |
| "epoch": 2.50402576489533, |
| "grad_norm": 0.496647756887993, |
| "learning_rate": 3.245364437094105e-05, |
| "loss": 0.2134, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.22214139997959137, |
| "step": 1555, |
| "valid_targets_mean": 4800.2, |
| "valid_targets_min": 1516 |
| }, |
| { |
| "epoch": 2.5120772946859904, |
| "grad_norm": 0.5176776733548973, |
| "learning_rate": 3.239070628359126e-05, |
| "loss": 0.2243, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2536792755126953, |
| "step": 1560, |
| "valid_targets_mean": 4532.4, |
| "valid_targets_min": 420 |
| }, |
| { |
| "epoch": 2.5201288244766507, |
| "grad_norm": 0.4521203535869814, |
| "learning_rate": 3.232756842289685e-05, |
| "loss": 0.209, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1837652325630188, |
| "step": 1565, |
| "valid_targets_mean": 4955.4, |
| "valid_targets_min": 1611 |
| }, |
| { |
| "epoch": 2.528180354267311, |
| "grad_norm": 0.48332269443651105, |
| "learning_rate": 3.2264231806819286e-05, |
| "loss": 0.1944, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18321290612220764, |
| "step": 1570, |
| "valid_targets_mean": 4541.4, |
| "valid_targets_min": 1371 |
| }, |
| { |
| "epoch": 2.536231884057971, |
| "grad_norm": 0.5203474071856915, |
| "learning_rate": 3.220069745652456e-05, |
| "loss": 0.2189, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2053850144147873, |
| "step": 1575, |
| "valid_targets_mean": 4024.7, |
| "valid_targets_min": 380 |
| }, |
| { |
| "epoch": 2.544283413848631, |
| "grad_norm": 0.46470085704874836, |
| "learning_rate": 3.213696639636666e-05, |
| "loss": 0.2233, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.19794431328773499, |
| "step": 1580, |
| "valid_targets_mean": 4241.2, |
| "valid_targets_min": 756 |
| }, |
| { |
| "epoch": 2.5523349436392913, |
| "grad_norm": 0.4921456777251355, |
| "learning_rate": 3.207303965387114e-05, |
| "loss": 0.2195, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2276471108198166, |
| "step": 1585, |
| "valid_targets_mean": 4376.2, |
| "valid_targets_min": 327 |
| }, |
| { |
| "epoch": 2.5603864734299515, |
| "grad_norm": 0.5461925808616269, |
| "learning_rate": 3.200891825971846e-05, |
| "loss": 0.2148, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2170354425907135, |
| "step": 1590, |
| "valid_targets_mean": 4376.3, |
| "valid_targets_min": 1624 |
| }, |
| { |
| "epoch": 2.5684380032206118, |
| "grad_norm": 0.45331868338223147, |
| "learning_rate": 3.194460324772746e-05, |
| "loss": 0.1971, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17769229412078857, |
| "step": 1595, |
| "valid_targets_mean": 4559.6, |
| "valid_targets_min": 1717 |
| }, |
| { |
| "epoch": 2.576489533011272, |
| "grad_norm": 0.5481556666487605, |
| "learning_rate": 3.188009565483861e-05, |
| "loss": 0.2192, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.21930727362632751, |
| "step": 1600, |
| "valid_targets_mean": 3786.7, |
| "valid_targets_min": 627 |
| }, |
| { |
| "epoch": 2.5845410628019323, |
| "grad_norm": 0.5306078402232887, |
| "learning_rate": 3.1815396521097376e-05, |
| "loss": 0.2091, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.22777387499809265, |
| "step": 1605, |
| "valid_targets_mean": 4098.1, |
| "valid_targets_min": 581 |
| }, |
| { |
| "epoch": 2.5925925925925926, |
| "grad_norm": 0.6396015312802733, |
| "learning_rate": 3.1750506889637366e-05, |
| "loss": 0.219, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2606090009212494, |
| "step": 1610, |
| "valid_targets_mean": 4573.8, |
| "valid_targets_min": 513 |
| }, |
| { |
| "epoch": 2.600644122383253, |
| "grad_norm": 0.5139629491463821, |
| "learning_rate": 3.1685427806663574e-05, |
| "loss": 0.213, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.22717058658599854, |
| "step": 1615, |
| "valid_targets_mean": 4616.6, |
| "valid_targets_min": 2109 |
| }, |
| { |
| "epoch": 2.608695652173913, |
| "grad_norm": 0.4896772812229126, |
| "learning_rate": 3.1620160321435475e-05, |
| "loss": 0.2204, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2393844723701477, |
| "step": 1620, |
| "valid_targets_mean": 4748.1, |
| "valid_targets_min": 1671 |
| }, |
| { |
| "epoch": 2.6167471819645733, |
| "grad_norm": 0.5123496934824213, |
| "learning_rate": 3.155470548625014e-05, |
| "loss": 0.2257, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2570544481277466, |
| "step": 1625, |
| "valid_targets_mean": 4746.9, |
| "valid_targets_min": 1642 |
| }, |
| { |
| "epoch": 2.6247987117552336, |
| "grad_norm": 0.5011886008293388, |
| "learning_rate": 3.1489064356425235e-05, |
| "loss": 0.2223, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.21146038174629211, |
| "step": 1630, |
| "valid_targets_mean": 4106.5, |
| "valid_targets_min": 1263 |
| }, |
| { |
| "epoch": 2.632850241545894, |
| "grad_norm": 0.4918629952935143, |
| "learning_rate": 3.142323799028204e-05, |
| "loss": 0.2206, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.205857515335083, |
| "step": 1635, |
| "valid_targets_mean": 4128.4, |
| "valid_targets_min": 713 |
| }, |
| { |
| "epoch": 2.640901771336554, |
| "grad_norm": 0.4975884336977351, |
| "learning_rate": 3.135722744912836e-05, |
| "loss": 0.2067, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.19787558913230896, |
| "step": 1640, |
| "valid_targets_mean": 5678.5, |
| "valid_targets_min": 886 |
| }, |
| { |
| "epoch": 2.6489533011272144, |
| "grad_norm": 0.48481732390442694, |
| "learning_rate": 3.129103379724143e-05, |
| "loss": 0.1994, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1850062608718872, |
| "step": 1645, |
| "valid_targets_mean": 3477.6, |
| "valid_targets_min": 752 |
| }, |
| { |
| "epoch": 2.6570048309178746, |
| "grad_norm": 0.4665528515319807, |
| "learning_rate": 3.122465810185075e-05, |
| "loss": 0.2172, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.21181383728981018, |
| "step": 1650, |
| "valid_targets_mean": 4864.5, |
| "valid_targets_min": 1598 |
| }, |
| { |
| "epoch": 2.6650563607085345, |
| "grad_norm": 0.5077396920276867, |
| "learning_rate": 3.1158101433120863e-05, |
| "loss": 0.2186, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.19636741280555725, |
| "step": 1655, |
| "valid_targets_mean": 3697.4, |
| "valid_targets_min": 339 |
| }, |
| { |
| "epoch": 2.6731078904991947, |
| "grad_norm": 0.5055566499587948, |
| "learning_rate": 3.1091364864134136e-05, |
| "loss": 0.197, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.20249465107917786, |
| "step": 1660, |
| "valid_targets_mean": 4576.9, |
| "valid_targets_min": 543 |
| }, |
| { |
| "epoch": 2.681159420289855, |
| "grad_norm": 0.49702037708190555, |
| "learning_rate": 3.102444947087342e-05, |
| "loss": 0.2007, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17359226942062378, |
| "step": 1665, |
| "valid_targets_mean": 3802.2, |
| "valid_targets_min": 1850 |
| }, |
| { |
| "epoch": 2.6892109500805152, |
| "grad_norm": 0.543548482081646, |
| "learning_rate": 3.0957356332204745e-05, |
| "loss": 0.2364, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.21617215871810913, |
| "step": 1670, |
| "valid_targets_mean": 5324.2, |
| "valid_targets_min": 1401 |
| }, |
| { |
| "epoch": 2.6972624798711755, |
| "grad_norm": 0.473211339207569, |
| "learning_rate": 3.089008652985989e-05, |
| "loss": 0.2, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.20709389448165894, |
| "step": 1675, |
| "valid_targets_mean": 4730.4, |
| "valid_targets_min": 1283 |
| }, |
| { |
| "epoch": 2.7053140096618358, |
| "grad_norm": 0.48495909325226566, |
| "learning_rate": 3.082264114841892e-05, |
| "loss": 0.2152, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.19697055220603943, |
| "step": 1680, |
| "valid_targets_mean": 4703.1, |
| "valid_targets_min": 1393 |
| }, |
| { |
| "epoch": 2.713365539452496, |
| "grad_norm": 0.525234042627054, |
| "learning_rate": 3.07550212752928e-05, |
| "loss": 0.2152, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.21602725982666016, |
| "step": 1685, |
| "valid_targets_mean": 4527.6, |
| "valid_targets_min": 728 |
| }, |
| { |
| "epoch": 2.7214170692431563, |
| "grad_norm": 0.49507933380428965, |
| "learning_rate": 3.068722800070574e-05, |
| "loss": 0.2489, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.23652076721191406, |
| "step": 1690, |
| "valid_targets_mean": 3893.8, |
| "valid_targets_min": 1490 |
| }, |
| { |
| "epoch": 2.7294685990338166, |
| "grad_norm": 0.478229441737468, |
| "learning_rate": 3.0619262417677695e-05, |
| "loss": 0.2065, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.20760485529899597, |
| "step": 1695, |
| "valid_targets_mean": 4375.8, |
| "valid_targets_min": 1930 |
| }, |
| { |
| "epoch": 2.7375201288244764, |
| "grad_norm": 0.4760382784479069, |
| "learning_rate": 3.055112562200673e-05, |
| "loss": 0.2077, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.20306912064552307, |
| "step": 1700, |
| "valid_targets_mean": 4093.1, |
| "valid_targets_min": 892 |
| }, |
| { |
| "epoch": 2.7455716586151366, |
| "grad_norm": 0.567194545288659, |
| "learning_rate": 3.0482818712251318e-05, |
| "loss": 0.2031, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.22697149217128754, |
| "step": 1705, |
| "valid_targets_mean": 5224.9, |
| "valid_targets_min": 679 |
| }, |
| { |
| "epoch": 2.753623188405797, |
| "grad_norm": 0.7966562099200152, |
| "learning_rate": 3.0414342789712675e-05, |
| "loss": 0.2246, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2644144296646118, |
| "step": 1710, |
| "valid_targets_mean": 3641.8, |
| "valid_targets_min": 267 |
| }, |
| { |
| "epoch": 2.761674718196457, |
| "grad_norm": 0.5194781986137333, |
| "learning_rate": 3.034569895841699e-05, |
| "loss": 0.2012, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.20732516050338745, |
| "step": 1715, |
| "valid_targets_mean": 4665.7, |
| "valid_targets_min": 1796 |
| }, |
| { |
| "epoch": 2.7697262479871174, |
| "grad_norm": 0.5139542297559575, |
| "learning_rate": 3.0276888325097583e-05, |
| "loss": 0.2108, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2747165858745575, |
| "step": 1720, |
| "valid_targets_mean": 5593.7, |
| "valid_targets_min": 863 |
| }, |
| { |
| "epoch": 2.7777777777777777, |
| "grad_norm": 0.5017349754200195, |
| "learning_rate": 3.020791199917713e-05, |
| "loss": 0.2097, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.19357708096504211, |
| "step": 1725, |
| "valid_targets_mean": 4411.8, |
| "valid_targets_min": 775 |
| }, |
| { |
| "epoch": 2.785829307568438, |
| "grad_norm": 0.47883623225450245, |
| "learning_rate": 3.0138771092749722e-05, |
| "loss": 0.2158, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.21340464055538177, |
| "step": 1730, |
| "valid_targets_mean": 4259.2, |
| "valid_targets_min": 702 |
| }, |
| { |
| "epoch": 2.793880837359098, |
| "grad_norm": 0.5042451347947459, |
| "learning_rate": 3.006946672056297e-05, |
| "loss": 0.2163, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.20300012826919556, |
| "step": 1735, |
| "valid_targets_mean": 4185.3, |
| "valid_targets_min": 1004 |
| }, |
| { |
| "epoch": 2.8019323671497585, |
| "grad_norm": 0.5599312568052899, |
| "learning_rate": 3.0000000000000004e-05, |
| "loss": 0.2111, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.22356563806533813, |
| "step": 1740, |
| "valid_targets_mean": 4172.1, |
| "valid_targets_min": 1019 |
| }, |
| { |
| "epoch": 2.8099838969404187, |
| "grad_norm": 0.5188094581424917, |
| "learning_rate": 2.993037205106147e-05, |
| "loss": 0.2181, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.21803626418113708, |
| "step": 1745, |
| "valid_targets_mean": 4445.8, |
| "valid_targets_min": 1772 |
| }, |
| { |
| "epoch": 2.818035426731079, |
| "grad_norm": 0.48903765537814037, |
| "learning_rate": 2.9860583996347495e-05, |
| "loss": 0.2093, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.21702814102172852, |
| "step": 1750, |
| "valid_targets_mean": 4806.7, |
| "valid_targets_min": 1671 |
| }, |
| { |
| "epoch": 2.8260869565217392, |
| "grad_norm": 0.48803716906398215, |
| "learning_rate": 2.9790636961039524e-05, |
| "loss": 0.2193, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.22425541281700134, |
| "step": 1755, |
| "valid_targets_mean": 4643.0, |
| "valid_targets_min": 1506 |
| }, |
| { |
| "epoch": 2.8341384863123995, |
| "grad_norm": 0.48749480729575717, |
| "learning_rate": 2.9720532072882268e-05, |
| "loss": 0.2248, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.19417119026184082, |
| "step": 1760, |
| "valid_targets_mean": 4002.8, |
| "valid_targets_min": 1522 |
| }, |
| { |
| "epoch": 2.8421900161030598, |
| "grad_norm": 0.45848716202240636, |
| "learning_rate": 2.965027046216544e-05, |
| "loss": 0.2081, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1857365071773529, |
| "step": 1765, |
| "valid_targets_mean": 4783.7, |
| "valid_targets_min": 1919 |
| }, |
| { |
| "epoch": 2.85024154589372, |
| "grad_norm": 0.6718800164601025, |
| "learning_rate": 2.9579853261705573e-05, |
| "loss": 0.2024, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.23533181846141815, |
| "step": 1770, |
| "valid_targets_mean": 4673.9, |
| "valid_targets_min": 1311 |
| }, |
| { |
| "epoch": 2.8582930756843803, |
| "grad_norm": 0.4660110391421861, |
| "learning_rate": 2.950928160682775e-05, |
| "loss": 0.2089, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.19263693690299988, |
| "step": 1775, |
| "valid_targets_mean": 4255.1, |
| "valid_targets_min": 1076 |
| }, |
| { |
| "epoch": 2.86634460547504, |
| "grad_norm": 0.5145254890484248, |
| "learning_rate": 2.943855663534731e-05, |
| "loss": 0.2183, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.23376551270484924, |
| "step": 1780, |
| "valid_targets_mean": 4397.2, |
| "valid_targets_min": 1787 |
| }, |
| { |
| "epoch": 2.8743961352657004, |
| "grad_norm": 0.4906091551370421, |
| "learning_rate": 2.9367679487551473e-05, |
| "loss": 0.2056, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.20546765625476837, |
| "step": 1785, |
| "valid_targets_mean": 3990.4, |
| "valid_targets_min": 1477 |
| }, |
| { |
| "epoch": 2.8824476650563606, |
| "grad_norm": 0.5093898731159036, |
| "learning_rate": 2.929665130618098e-05, |
| "loss": 0.2037, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.22851824760437012, |
| "step": 1790, |
| "valid_targets_mean": 5522.1, |
| "valid_targets_min": 1762 |
| }, |
| { |
| "epoch": 2.890499194847021, |
| "grad_norm": 0.4518802511006292, |
| "learning_rate": 2.9225473236411655e-05, |
| "loss": 0.2217, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18847951292991638, |
| "step": 1795, |
| "valid_targets_mean": 4818.7, |
| "valid_targets_min": 1111 |
| }, |
| { |
| "epoch": 2.898550724637681, |
| "grad_norm": 0.6937426790422542, |
| "learning_rate": 2.915414642583596e-05, |
| "loss": 0.2148, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.20088736712932587, |
| "step": 1800, |
| "valid_targets_mean": 3600.9, |
| "valid_targets_min": 848 |
| }, |
| { |
| "epoch": 2.9066022544283414, |
| "grad_norm": 0.46521668715049397, |
| "learning_rate": 2.9082672024444485e-05, |
| "loss": 0.2229, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.22432249784469604, |
| "step": 1805, |
| "valid_targets_mean": 4322.0, |
| "valid_targets_min": 1358 |
| }, |
| { |
| "epoch": 2.9146537842190017, |
| "grad_norm": 0.436860595041999, |
| "learning_rate": 2.901105118460737e-05, |
| "loss": 0.2072, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1966436803340912, |
| "step": 1810, |
| "valid_targets_mean": 4940.1, |
| "valid_targets_min": 1944 |
| }, |
| { |
| "epoch": 2.922705314009662, |
| "grad_norm": 0.5361044008606226, |
| "learning_rate": 2.8939285061055807e-05, |
| "loss": 0.2146, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2078220695257187, |
| "step": 1815, |
| "valid_targets_mean": 3302.5, |
| "valid_targets_min": 609 |
| }, |
| { |
| "epoch": 2.930756843800322, |
| "grad_norm": 0.49990872670719105, |
| "learning_rate": 2.8867374810863325e-05, |
| "loss": 0.2136, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2396693229675293, |
| "step": 1820, |
| "valid_targets_mean": 4933.6, |
| "valid_targets_min": 1197 |
| }, |
| { |
| "epoch": 2.938808373590982, |
| "grad_norm": 0.4676050983632418, |
| "learning_rate": 2.8795321593427227e-05, |
| "loss": 0.2105, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.21761463582515717, |
| "step": 1825, |
| "valid_targets_mean": 4473.9, |
| "valid_targets_min": 1740 |
| }, |
| { |
| "epoch": 2.9468599033816423, |
| "grad_norm": 0.4579800892905144, |
| "learning_rate": 2.8723126570449813e-05, |
| "loss": 0.2137, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.22557538747787476, |
| "step": 1830, |
| "valid_targets_mean": 4990.2, |
| "valid_targets_min": 1104 |
| }, |
| { |
| "epoch": 2.9549114331723025, |
| "grad_norm": 0.521039627014324, |
| "learning_rate": 2.8650790905919724e-05, |
| "loss": 0.2127, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.21462702751159668, |
| "step": 1835, |
| "valid_targets_mean": 4125.9, |
| "valid_targets_min": 1187 |
| }, |
| { |
| "epoch": 2.962962962962963, |
| "grad_norm": 0.5446614093095541, |
| "learning_rate": 2.8578315766093133e-05, |
| "loss": 0.2275, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.22720134258270264, |
| "step": 1840, |
| "valid_targets_mean": 4199.9, |
| "valid_targets_min": 379 |
| }, |
| { |
| "epoch": 2.971014492753623, |
| "grad_norm": 0.5085501802829419, |
| "learning_rate": 2.850570231947493e-05, |
| "loss": 0.2086, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.20165984332561493, |
| "step": 1845, |
| "valid_targets_mean": 4610.2, |
| "valid_targets_min": 745 |
| }, |
| { |
| "epoch": 2.9790660225442833, |
| "grad_norm": 0.4995531673717949, |
| "learning_rate": 2.8432951736799933e-05, |
| "loss": 0.2149, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.21701423823833466, |
| "step": 1850, |
| "valid_targets_mean": 4243.4, |
| "valid_targets_min": 1952 |
| }, |
| { |
| "epoch": 2.9871175523349436, |
| "grad_norm": 0.5654118721016965, |
| "learning_rate": 2.8360065191013967e-05, |
| "loss": 0.2189, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.22924692928791046, |
| "step": 1855, |
| "valid_targets_mean": 3948.6, |
| "valid_targets_min": 1818 |
| }, |
| { |
| "epoch": 2.995169082125604, |
| "grad_norm": 0.5368747366497263, |
| "learning_rate": 2.8287043857254957e-05, |
| "loss": 0.2049, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18569841980934143, |
| "step": 1860, |
| "valid_targets_mean": 4243.3, |
| "valid_targets_min": 944 |
| }, |
| { |
| "epoch": 3.003220611916264, |
| "grad_norm": 0.5308612324214572, |
| "learning_rate": 2.8213888912834026e-05, |
| "loss": 0.2026, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.20392943918704987, |
| "step": 1865, |
| "valid_targets_mean": 5240.9, |
| "valid_targets_min": 3176 |
| }, |
| { |
| "epoch": 3.0112721417069244, |
| "grad_norm": 0.5850366317547473, |
| "learning_rate": 2.814060153721644e-05, |
| "loss": 0.1835, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.22741422057151794, |
| "step": 1870, |
| "valid_targets_mean": 4518.1, |
| "valid_targets_min": 1313 |
| }, |
| { |
| "epoch": 3.0193236714975846, |
| "grad_norm": 0.5456534322958014, |
| "learning_rate": 2.8067182912002663e-05, |
| "loss": 0.1929, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.19902676343917847, |
| "step": 1875, |
| "valid_targets_mean": 4697.9, |
| "valid_targets_min": 1401 |
| }, |
| { |
| "epoch": 3.027375201288245, |
| "grad_norm": 0.5866691020588805, |
| "learning_rate": 2.7993634220909254e-05, |
| "loss": 0.1873, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17653107643127441, |
| "step": 1880, |
| "valid_targets_mean": 5312.7, |
| "valid_targets_min": 1668 |
| }, |
| { |
| "epoch": 3.035426731078905, |
| "grad_norm": 0.4839014869325985, |
| "learning_rate": 2.7919956649749826e-05, |
| "loss": 0.2012, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.207495778799057, |
| "step": 1885, |
| "valid_targets_mean": 4792.9, |
| "valid_targets_min": 1475 |
| }, |
| { |
| "epoch": 3.0434782608695654, |
| "grad_norm": 0.5792725572749162, |
| "learning_rate": 2.784615138641588e-05, |
| "loss": 0.2028, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2462862730026245, |
| "step": 1890, |
| "valid_targets_mean": 3582.7, |
| "valid_targets_min": 1264 |
| }, |
| { |
| "epoch": 3.0515297906602252, |
| "grad_norm": 0.5471292037490801, |
| "learning_rate": 2.7772219620857685e-05, |
| "loss": 0.2036, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2000941038131714, |
| "step": 1895, |
| "valid_targets_mean": 4260.8, |
| "valid_targets_min": 1662 |
| }, |
| { |
| "epoch": 3.0595813204508855, |
| "grad_norm": 0.5418789392536902, |
| "learning_rate": 2.769816254506509e-05, |
| "loss": 0.1972, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17109820246696472, |
| "step": 1900, |
| "valid_targets_mean": 4285.0, |
| "valid_targets_min": 688 |
| }, |
| { |
| "epoch": 3.0676328502415457, |
| "grad_norm": 0.5696873068816691, |
| "learning_rate": 2.76239813530483e-05, |
| "loss": 0.1917, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17864085733890533, |
| "step": 1905, |
| "valid_targets_mean": 3839.0, |
| "valid_targets_min": 356 |
| }, |
| { |
| "epoch": 3.075684380032206, |
| "grad_norm": 0.5257872930167539, |
| "learning_rate": 2.7549677240818628e-05, |
| "loss": 0.1918, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.20962268114089966, |
| "step": 1910, |
| "valid_targets_mean": 4587.1, |
| "valid_targets_min": 854 |
| }, |
| { |
| "epoch": 3.0837359098228663, |
| "grad_norm": 0.5648446285032245, |
| "learning_rate": 2.7475251406369197e-05, |
| "loss": 0.1969, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.20219004154205322, |
| "step": 1915, |
| "valid_targets_mean": 4792.9, |
| "valid_targets_min": 1897 |
| }, |
| { |
| "epoch": 3.0917874396135265, |
| "grad_norm": 0.454963234903237, |
| "learning_rate": 2.740070504965565e-05, |
| "loss": 0.1732, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1661757528781891, |
| "step": 1920, |
| "valid_targets_mean": 5107.2, |
| "valid_targets_min": 1842 |
| }, |
| { |
| "epoch": 3.099838969404187, |
| "grad_norm": 0.5802646506856157, |
| "learning_rate": 2.7326039372576782e-05, |
| "loss": 0.2025, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.20974227786064148, |
| "step": 1925, |
| "valid_targets_mean": 4211.8, |
| "valid_targets_min": 1850 |
| }, |
| { |
| "epoch": 3.107890499194847, |
| "grad_norm": 0.5115859872263251, |
| "learning_rate": 2.7251255578955186e-05, |
| "loss": 0.2016, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.191048726439476, |
| "step": 1930, |
| "valid_targets_mean": 4847.3, |
| "valid_targets_min": 2149 |
| }, |
| { |
| "epoch": 3.1159420289855073, |
| "grad_norm": 0.4838092911137751, |
| "learning_rate": 2.7176354874517805e-05, |
| "loss": 0.1915, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18548092246055603, |
| "step": 1935, |
| "valid_targets_mean": 4928.9, |
| "valid_targets_min": 1746 |
| }, |
| { |
| "epoch": 3.1239935587761676, |
| "grad_norm": 0.6716396355587732, |
| "learning_rate": 2.7101338466876542e-05, |
| "loss": 0.1884, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17967697978019714, |
| "step": 1940, |
| "valid_targets_mean": 3838.4, |
| "valid_targets_min": 933 |
| }, |
| { |
| "epoch": 3.132045088566828, |
| "grad_norm": 0.5175526656495621, |
| "learning_rate": 2.702620756550874e-05, |
| "loss": 0.2077, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18851426243782043, |
| "step": 1945, |
| "valid_targets_mean": 4249.6, |
| "valid_targets_min": 1164 |
| }, |
| { |
| "epoch": 3.140096618357488, |
| "grad_norm": 0.5292721987453661, |
| "learning_rate": 2.6950963381737728e-05, |
| "loss": 0.1948, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.20516784489154816, |
| "step": 1950, |
| "valid_targets_mean": 4134.1, |
| "valid_targets_min": 1487 |
| }, |
| { |
| "epoch": 3.148148148148148, |
| "grad_norm": 0.5429459342739271, |
| "learning_rate": 2.687560712871325e-05, |
| "loss": 0.1959, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.19477809965610504, |
| "step": 1955, |
| "valid_targets_mean": 4617.6, |
| "valid_targets_min": 321 |
| }, |
| { |
| "epoch": 3.156199677938808, |
| "grad_norm": 0.5204990053162142, |
| "learning_rate": 2.6800140021391933e-05, |
| "loss": 0.2088, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2121405303478241, |
| "step": 1960, |
| "valid_targets_mean": 5504.8, |
| "valid_targets_min": 2133 |
| }, |
| { |
| "epoch": 3.1642512077294684, |
| "grad_norm": 0.5107603352588185, |
| "learning_rate": 2.6724563276517697e-05, |
| "loss": 0.1903, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.217079758644104, |
| "step": 1965, |
| "valid_targets_mean": 4874.7, |
| "valid_targets_min": 578 |
| }, |
| { |
| "epoch": 3.1723027375201287, |
| "grad_norm": 0.5709422965320798, |
| "learning_rate": 2.6648878112602115e-05, |
| "loss": 0.1865, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.20290029048919678, |
| "step": 1970, |
| "valid_targets_mean": 4168.8, |
| "valid_targets_min": 537 |
| }, |
| { |
| "epoch": 3.180354267310789, |
| "grad_norm": 0.5236384072204857, |
| "learning_rate": 2.6573085749904784e-05, |
| "loss": 0.2089, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18646635115146637, |
| "step": 1975, |
| "valid_targets_mean": 5792.3, |
| "valid_targets_min": 3148 |
| }, |
| { |
| "epoch": 3.1884057971014492, |
| "grad_norm": 0.4931013592583483, |
| "learning_rate": 2.6497187410413676e-05, |
| "loss": 0.191, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16621598601341248, |
| "step": 1980, |
| "valid_targets_mean": 4182.5, |
| "valid_targets_min": 626 |
| }, |
| { |
| "epoch": 3.1964573268921095, |
| "grad_norm": 0.513477571797092, |
| "learning_rate": 2.642118431782537e-05, |
| "loss": 0.2045, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.19758376479148865, |
| "step": 1985, |
| "valid_targets_mean": 4814.4, |
| "valid_targets_min": 841 |
| }, |
| { |
| "epoch": 3.2045088566827697, |
| "grad_norm": 0.5208664241436397, |
| "learning_rate": 2.6345077697525394e-05, |
| "loss": 0.2018, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2036036252975464, |
| "step": 1990, |
| "valid_targets_mean": 4699.8, |
| "valid_targets_min": 1314 |
| }, |
| { |
| "epoch": 3.21256038647343, |
| "grad_norm": 0.48590086014586165, |
| "learning_rate": 2.6268868776568416e-05, |
| "loss": 0.1918, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1840904951095581, |
| "step": 1995, |
| "valid_targets_mean": 4029.8, |
| "valid_targets_min": 2119 |
| }, |
| { |
| "epoch": 3.2206119162640903, |
| "grad_norm": 0.48975245964069325, |
| "learning_rate": 2.619255878365849e-05, |
| "loss": 0.2021, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.19650408625602722, |
| "step": 2000, |
| "valid_targets_mean": 4923.2, |
| "valid_targets_min": 2035 |
| }, |
| { |
| "epoch": 3.2286634460547505, |
| "grad_norm": 0.4730736998762011, |
| "learning_rate": 2.6116148949129237e-05, |
| "loss": 0.2022, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.19848835468292236, |
| "step": 2005, |
| "valid_targets_mean": 5154.9, |
| "valid_targets_min": 862 |
| }, |
| { |
| "epoch": 3.236714975845411, |
| "grad_norm": 0.49293775625702296, |
| "learning_rate": 2.603964050492401e-05, |
| "loss": 0.1845, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1910780966281891, |
| "step": 2010, |
| "valid_targets_mean": 5177.5, |
| "valid_targets_min": 1035 |
| }, |
| { |
| "epoch": 3.244766505636071, |
| "grad_norm": 0.4352279629169526, |
| "learning_rate": 2.5963034684576024e-05, |
| "loss": 0.1833, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1654304563999176, |
| "step": 2015, |
| "valid_targets_mean": 4889.2, |
| "valid_targets_min": 755 |
| }, |
| { |
| "epoch": 3.2528180354267313, |
| "grad_norm": 0.48928557887722884, |
| "learning_rate": 2.5886332723188484e-05, |
| "loss": 0.1874, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17599686980247498, |
| "step": 2020, |
| "valid_targets_mean": 3929.6, |
| "valid_targets_min": 627 |
| }, |
| { |
| "epoch": 3.260869565217391, |
| "grad_norm": 0.4602375034247986, |
| "learning_rate": 2.5809535857414637e-05, |
| "loss": 0.1916, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.19927427172660828, |
| "step": 2025, |
| "valid_targets_mean": 4907.2, |
| "valid_targets_min": 700 |
| }, |
| { |
| "epoch": 3.2689210950080514, |
| "grad_norm": 0.45533522839686313, |
| "learning_rate": 2.573264532543788e-05, |
| "loss": 0.1902, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1822260171175003, |
| "step": 2030, |
| "valid_targets_mean": 4557.0, |
| "valid_targets_min": 2401 |
| }, |
| { |
| "epoch": 3.2769726247987117, |
| "grad_norm": 0.5432317512688624, |
| "learning_rate": 2.5655662366951778e-05, |
| "loss": 0.1966, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1943272203207016, |
| "step": 2035, |
| "valid_targets_mean": 3990.8, |
| "valid_targets_min": 1026 |
| }, |
| { |
| "epoch": 3.285024154589372, |
| "grad_norm": 0.5340485828335133, |
| "learning_rate": 2.557858822314007e-05, |
| "loss": 0.2004, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2411888986825943, |
| "step": 2040, |
| "valid_targets_mean": 4090.6, |
| "valid_targets_min": 1032 |
| }, |
| { |
| "epoch": 3.293075684380032, |
| "grad_norm": 0.5155182145466647, |
| "learning_rate": 2.5501424136656635e-05, |
| "loss": 0.1928, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2276889681816101, |
| "step": 2045, |
| "valid_targets_mean": 4593.6, |
| "valid_targets_min": 574 |
| }, |
| { |
| "epoch": 3.3011272141706924, |
| "grad_norm": 0.5465406153378882, |
| "learning_rate": 2.5424171351605518e-05, |
| "loss": 0.1874, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17450806498527527, |
| "step": 2050, |
| "valid_targets_mean": 4325.6, |
| "valid_targets_min": 1283 |
| }, |
| { |
| "epoch": 3.3091787439613527, |
| "grad_norm": 0.5652814304177497, |
| "learning_rate": 2.5346831113520827e-05, |
| "loss": 0.1961, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.21284984052181244, |
| "step": 2055, |
| "valid_targets_mean": 4811.6, |
| "valid_targets_min": 1066 |
| }, |
| { |
| "epoch": 3.317230273752013, |
| "grad_norm": 0.5717869882020237, |
| "learning_rate": 2.526940466934664e-05, |
| "loss": 0.1937, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.19881507754325867, |
| "step": 2060, |
| "valid_targets_mean": 3001.5, |
| "valid_targets_min": 350 |
| }, |
| { |
| "epoch": 3.325281803542673, |
| "grad_norm": 0.5193991609655757, |
| "learning_rate": 2.5191893267416964e-05, |
| "loss": 0.1913, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.19282767176628113, |
| "step": 2065, |
| "valid_targets_mean": 4379.1, |
| "valid_targets_min": 943 |
| }, |
| { |
| "epoch": 3.3333333333333335, |
| "grad_norm": 0.5087654352874541, |
| "learning_rate": 2.5114298157435526e-05, |
| "loss": 0.2077, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.22454917430877686, |
| "step": 2070, |
| "valid_targets_mean": 5994.5, |
| "valid_targets_min": 1253 |
| }, |
| { |
| "epoch": 3.3413848631239937, |
| "grad_norm": 0.4773374743223842, |
| "learning_rate": 2.503662059045568e-05, |
| "loss": 0.1961, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.19372783601284027, |
| "step": 2075, |
| "valid_targets_mean": 4415.6, |
| "valid_targets_min": 1046 |
| }, |
| { |
| "epoch": 3.3494363929146536, |
| "grad_norm": 0.5211750691881805, |
| "learning_rate": 2.4958861818860217e-05, |
| "loss": 0.1936, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.20317870378494263, |
| "step": 2080, |
| "valid_targets_mean": 4938.8, |
| "valid_targets_min": 1053 |
| }, |
| { |
| "epoch": 3.357487922705314, |
| "grad_norm": 0.580769513908195, |
| "learning_rate": 2.488102309634119e-05, |
| "loss": 0.1918, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17012670636177063, |
| "step": 2085, |
| "valid_targets_mean": 3300.9, |
| "valid_targets_min": 570 |
| }, |
| { |
| "epoch": 3.365539452495974, |
| "grad_norm": 0.4677262023270228, |
| "learning_rate": 2.480310567787967e-05, |
| "loss": 0.1943, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.21143823862075806, |
| "step": 2090, |
| "valid_targets_mean": 4960.4, |
| "valid_targets_min": 1486 |
| }, |
| { |
| "epoch": 3.3735909822866343, |
| "grad_norm": 0.498695274074395, |
| "learning_rate": 2.4725110819725542e-05, |
| "loss": 0.1877, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.19077152013778687, |
| "step": 2095, |
| "valid_targets_mean": 4409.8, |
| "valid_targets_min": 1603 |
| }, |
| { |
| "epoch": 3.3816425120772946, |
| "grad_norm": 0.6606944270313985, |
| "learning_rate": 2.464703977937723e-05, |
| "loss": 0.2122, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2209235429763794, |
| "step": 2100, |
| "valid_targets_mean": 5160.9, |
| "valid_targets_min": 2260 |
| }, |
| { |
| "epoch": 3.389694041867955, |
| "grad_norm": 0.48392843927081547, |
| "learning_rate": 2.456889381556144e-05, |
| "loss": 0.1863, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1707090586423874, |
| "step": 2105, |
| "valid_targets_mean": 4587.8, |
| "valid_targets_min": 1717 |
| }, |
| { |
| "epoch": 3.397745571658615, |
| "grad_norm": 0.4875147573168212, |
| "learning_rate": 2.449067418821285e-05, |
| "loss": 0.1944, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18568046391010284, |
| "step": 2110, |
| "valid_targets_mean": 4881.9, |
| "valid_targets_min": 2069 |
| }, |
| { |
| "epoch": 3.4057971014492754, |
| "grad_norm": 0.5240738697697526, |
| "learning_rate": 2.4412382158453807e-05, |
| "loss": 0.2027, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17656230926513672, |
| "step": 2115, |
| "valid_targets_mean": 4386.1, |
| "valid_targets_min": 1483 |
| }, |
| { |
| "epoch": 3.4138486312399356, |
| "grad_norm": 0.5359424822294189, |
| "learning_rate": 2.4334018988573983e-05, |
| "loss": 0.2071, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.22453176975250244, |
| "step": 2120, |
| "valid_targets_mean": 4363.1, |
| "valid_targets_min": 2099 |
| }, |
| { |
| "epoch": 3.421900161030596, |
| "grad_norm": 0.7044397785288949, |
| "learning_rate": 2.425558594201004e-05, |
| "loss": 0.1963, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17415092885494232, |
| "step": 2125, |
| "valid_targets_mean": 4853.5, |
| "valid_targets_min": 1658 |
| }, |
| { |
| "epoch": 3.429951690821256, |
| "grad_norm": 0.7313542515268883, |
| "learning_rate": 2.417708428332525e-05, |
| "loss": 0.2088, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18305009603500366, |
| "step": 2130, |
| "valid_targets_mean": 4156.8, |
| "valid_targets_min": 317 |
| }, |
| { |
| "epoch": 3.4380032206119164, |
| "grad_norm": 0.4738591164631795, |
| "learning_rate": 2.4098515278189097e-05, |
| "loss": 0.192, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1723197102546692, |
| "step": 2135, |
| "valid_targets_mean": 4533.4, |
| "valid_targets_min": 1353 |
| }, |
| { |
| "epoch": 3.4460547504025767, |
| "grad_norm": 0.5276265701938105, |
| "learning_rate": 2.4019880193356902e-05, |
| "loss": 0.182, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17899435758590698, |
| "step": 2140, |
| "valid_targets_mean": 4434.9, |
| "valid_targets_min": 675 |
| }, |
| { |
| "epoch": 3.454106280193237, |
| "grad_norm": 0.5632489582281142, |
| "learning_rate": 2.3941180296649348e-05, |
| "loss": 0.2035, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.22366738319396973, |
| "step": 2145, |
| "valid_targets_mean": 3995.8, |
| "valid_targets_min": 1400 |
| }, |
| { |
| "epoch": 3.4621578099838968, |
| "grad_norm": 0.5526994009194625, |
| "learning_rate": 2.3862416856932087e-05, |
| "loss": 0.19, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.19457975029945374, |
| "step": 2150, |
| "valid_targets_mean": 3929.9, |
| "valid_targets_min": 1593 |
| }, |
| { |
| "epoch": 3.470209339774557, |
| "grad_norm": 0.5417281294909433, |
| "learning_rate": 2.378359114409527e-05, |
| "loss": 0.2146, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.20209567248821259, |
| "step": 2155, |
| "valid_targets_mean": 4491.2, |
| "valid_targets_min": 1771 |
| }, |
| { |
| "epoch": 3.4782608695652173, |
| "grad_norm": 0.5283860783665116, |
| "learning_rate": 2.370470442903306e-05, |
| "loss": 0.2024, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2074143886566162, |
| "step": 2160, |
| "valid_targets_mean": 3453.6, |
| "valid_targets_min": 656 |
| }, |
| { |
| "epoch": 3.4863123993558776, |
| "grad_norm": 0.5596014550678241, |
| "learning_rate": 2.362575798362315e-05, |
| "loss": 0.2018, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.20553532242774963, |
| "step": 2165, |
| "valid_targets_mean": 3728.8, |
| "valid_targets_min": 1291 |
| }, |
| { |
| "epoch": 3.494363929146538, |
| "grad_norm": 0.47388886907429295, |
| "learning_rate": 2.3546753080706242e-05, |
| "loss": 0.1962, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2011997401714325, |
| "step": 2170, |
| "valid_targets_mean": 4747.0, |
| "valid_targets_min": 1499 |
| }, |
| { |
| "epoch": 3.502415458937198, |
| "grad_norm": 0.5433473628742698, |
| "learning_rate": 2.346769099406557e-05, |
| "loss": 0.2048, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.22939231991767883, |
| "step": 2175, |
| "valid_targets_mean": 3726.4, |
| "valid_targets_min": 824 |
| }, |
| { |
| "epoch": 3.5104669887278583, |
| "grad_norm": 0.4457288216134543, |
| "learning_rate": 2.33885729984063e-05, |
| "loss": 0.2015, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1754472553730011, |
| "step": 2180, |
| "valid_targets_mean": 5101.0, |
| "valid_targets_min": 1832 |
| }, |
| { |
| "epoch": 3.5185185185185186, |
| "grad_norm": 0.511189888500102, |
| "learning_rate": 2.3309400369335033e-05, |
| "loss": 0.1909, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18584825098514557, |
| "step": 2185, |
| "valid_targets_mean": 4445.9, |
| "valid_targets_min": 1920 |
| }, |
| { |
| "epoch": 3.526570048309179, |
| "grad_norm": 0.5632502133321703, |
| "learning_rate": 2.3230174383339196e-05, |
| "loss": 0.2072, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2198297381401062, |
| "step": 2190, |
| "valid_targets_mean": 4171.1, |
| "valid_targets_min": 758 |
| }, |
| { |
| "epoch": 3.534621578099839, |
| "grad_norm": 0.4874975024015211, |
| "learning_rate": 2.3150896317766505e-05, |
| "loss": 0.1896, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1995978057384491, |
| "step": 2195, |
| "valid_targets_mean": 4628.1, |
| "valid_targets_min": 1282 |
| }, |
| { |
| "epoch": 3.542673107890499, |
| "grad_norm": 0.47843928271386893, |
| "learning_rate": 2.3071567450804325e-05, |
| "loss": 0.2053, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1690368950366974, |
| "step": 2200, |
| "valid_targets_mean": 4314.7, |
| "valid_targets_min": 1529 |
| }, |
| { |
| "epoch": 3.550724637681159, |
| "grad_norm": 0.5030690747235215, |
| "learning_rate": 2.299218906145909e-05, |
| "loss": 0.1883, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17591848969459534, |
| "step": 2205, |
| "valid_targets_mean": 4831.5, |
| "valid_targets_min": 1692 |
| }, |
| { |
| "epoch": 3.5587761674718195, |
| "grad_norm": 0.4445594459012944, |
| "learning_rate": 2.2912762429535684e-05, |
| "loss": 0.1974, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2045142650604248, |
| "step": 2210, |
| "valid_targets_mean": 5075.3, |
| "valid_targets_min": 1787 |
| }, |
| { |
| "epoch": 3.5668276972624797, |
| "grad_norm": 0.5066371584429301, |
| "learning_rate": 2.2833288835616784e-05, |
| "loss": 0.1948, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.20660072565078735, |
| "step": 2215, |
| "valid_targets_mean": 4255.6, |
| "valid_targets_min": 978 |
| }, |
| { |
| "epoch": 3.57487922705314, |
| "grad_norm": 0.5314312269324657, |
| "learning_rate": 2.2753769561042235e-05, |
| "loss": 0.2013, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1856955885887146, |
| "step": 2220, |
| "valid_targets_mean": 4382.4, |
| "valid_targets_min": 306 |
| }, |
| { |
| "epoch": 3.5829307568438002, |
| "grad_norm": 0.594664193968932, |
| "learning_rate": 2.2674205887888386e-05, |
| "loss": 0.2093, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.22779573500156403, |
| "step": 2225, |
| "valid_targets_mean": 4177.1, |
| "valid_targets_min": 581 |
| }, |
| { |
| "epoch": 3.5909822866344605, |
| "grad_norm": 0.4922219770303433, |
| "learning_rate": 2.259459909894742e-05, |
| "loss": 0.2071, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.22328010201454163, |
| "step": 2230, |
| "valid_targets_mean": 5152.0, |
| "valid_targets_min": 851 |
| }, |
| { |
| "epoch": 3.5990338164251208, |
| "grad_norm": 0.48869544172575563, |
| "learning_rate": 2.2514950477706657e-05, |
| "loss": 0.1956, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.20914164185523987, |
| "step": 2235, |
| "valid_targets_mean": 5138.6, |
| "valid_targets_min": 1484 |
| }, |
| { |
| "epoch": 3.607085346215781, |
| "grad_norm": 0.6963749789958893, |
| "learning_rate": 2.2435261308327875e-05, |
| "loss": 0.1945, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1746867597103119, |
| "step": 2240, |
| "valid_targets_mean": 4765.4, |
| "valid_targets_min": 1839 |
| }, |
| { |
| "epoch": 3.6151368760064413, |
| "grad_norm": 0.5367886666270889, |
| "learning_rate": 2.2355532875626612e-05, |
| "loss": 0.1794, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18968860805034637, |
| "step": 2245, |
| "valid_targets_mean": 3609.9, |
| "valid_targets_min": 1136 |
| }, |
| { |
| "epoch": 3.6231884057971016, |
| "grad_norm": 0.5074205448750082, |
| "learning_rate": 2.2275766465051444e-05, |
| "loss": 0.1989, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.20984122157096863, |
| "step": 2250, |
| "valid_targets_mean": 4557.3, |
| "valid_targets_min": 818 |
| }, |
| { |
| "epoch": 3.631239935587762, |
| "grad_norm": 0.5328336917497768, |
| "learning_rate": 2.2195963362663236e-05, |
| "loss": 0.196, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1873650997877121, |
| "step": 2255, |
| "valid_targets_mean": 4251.6, |
| "valid_targets_min": 1417 |
| }, |
| { |
| "epoch": 3.639291465378422, |
| "grad_norm": 0.5279031470689559, |
| "learning_rate": 2.211612485511446e-05, |
| "loss": 0.1953, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.19223317503929138, |
| "step": 2260, |
| "valid_targets_mean": 4547.8, |
| "valid_targets_min": 989 |
| }, |
| { |
| "epoch": 3.6473429951690823, |
| "grad_norm": 0.4807142652014487, |
| "learning_rate": 2.2036252229628392e-05, |
| "loss": 0.1855, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17448017001152039, |
| "step": 2265, |
| "valid_targets_mean": 4428.8, |
| "valid_targets_min": 1791 |
| }, |
| { |
| "epoch": 3.6553945249597426, |
| "grad_norm": 0.46162214621632697, |
| "learning_rate": 2.19563467739784e-05, |
| "loss": 0.1923, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15724977850914001, |
| "step": 2270, |
| "valid_targets_mean": 4100.6, |
| "valid_targets_min": 1856 |
| }, |
| { |
| "epoch": 3.6634460547504024, |
| "grad_norm": 0.437259128811763, |
| "learning_rate": 2.1876409776467165e-05, |
| "loss": 0.2014, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.19419334828853607, |
| "step": 2275, |
| "valid_targets_mean": 5604.3, |
| "valid_targets_min": 1799 |
| }, |
| { |
| "epoch": 3.6714975845410627, |
| "grad_norm": 0.509046081849507, |
| "learning_rate": 2.1796442525905923e-05, |
| "loss": 0.19, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1819322556257248, |
| "step": 2280, |
| "valid_targets_mean": 3572.2, |
| "valid_targets_min": 1228 |
| }, |
| { |
| "epoch": 3.679549114331723, |
| "grad_norm": 0.512456182600672, |
| "learning_rate": 2.171644631159366e-05, |
| "loss": 0.2032, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.21677514910697937, |
| "step": 2285, |
| "valid_targets_mean": 4920.6, |
| "valid_targets_min": 720 |
| }, |
| { |
| "epoch": 3.687600644122383, |
| "grad_norm": 3.5749072057598865, |
| "learning_rate": 2.163642242329633e-05, |
| "loss": 0.2007, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1948278695344925, |
| "step": 2290, |
| "valid_targets_mean": 4014.2, |
| "valid_targets_min": 1316 |
| }, |
| { |
| "epoch": 3.6956521739130435, |
| "grad_norm": 0.48865940439627575, |
| "learning_rate": 2.1556372151226097e-05, |
| "loss": 0.1904, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.21440473198890686, |
| "step": 2295, |
| "valid_targets_mean": 4626.4, |
| "valid_targets_min": 1967 |
| }, |
| { |
| "epoch": 3.7037037037037037, |
| "grad_norm": 0.5877525411956264, |
| "learning_rate": 2.1476296786020502e-05, |
| "loss": 0.1881, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.173828125, |
| "step": 2300, |
| "valid_targets_mean": 4059.1, |
| "valid_targets_min": 345 |
| }, |
| { |
| "epoch": 3.711755233494364, |
| "grad_norm": 0.532071939990665, |
| "learning_rate": 2.139619761872163e-05, |
| "loss": 0.2034, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.20449981093406677, |
| "step": 2305, |
| "valid_targets_mean": 3978.1, |
| "valid_targets_min": 987 |
| }, |
| { |
| "epoch": 3.7198067632850242, |
| "grad_norm": 0.5500257667017805, |
| "learning_rate": 2.1316075940755363e-05, |
| "loss": 0.1994, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.19600236415863037, |
| "step": 2310, |
| "valid_targets_mean": 4358.1, |
| "valid_targets_min": 2076 |
| }, |
| { |
| "epoch": 3.7278582930756845, |
| "grad_norm": 0.4910824420542707, |
| "learning_rate": 2.1235933043910488e-05, |
| "loss": 0.2025, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1749979555606842, |
| "step": 2315, |
| "valid_targets_mean": 3997.7, |
| "valid_targets_min": 1403 |
| }, |
| { |
| "epoch": 3.7359098228663448, |
| "grad_norm": 0.49001315022408615, |
| "learning_rate": 2.1155770220317918e-05, |
| "loss": 0.2012, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1976926326751709, |
| "step": 2320, |
| "valid_targets_mean": 4852.8, |
| "valid_targets_min": 506 |
| }, |
| { |
| "epoch": 3.7439613526570046, |
| "grad_norm": 0.6702681948241392, |
| "learning_rate": 2.107558876242983e-05, |
| "loss": 0.1964, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.19468314945697784, |
| "step": 2325, |
| "valid_targets_mean": 3499.4, |
| "valid_targets_min": 1520 |
| }, |
| { |
| "epoch": 3.752012882447665, |
| "grad_norm": 0.4609480240941858, |
| "learning_rate": 2.0995389962998845e-05, |
| "loss": 0.1928, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.19903123378753662, |
| "step": 2330, |
| "valid_targets_mean": 4891.3, |
| "valid_targets_min": 1678 |
| }, |
| { |
| "epoch": 3.760064412238325, |
| "grad_norm": 0.48913542025927365, |
| "learning_rate": 2.091517511505719e-05, |
| "loss": 0.2002, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.21223650872707367, |
| "step": 2335, |
| "valid_targets_mean": 4559.2, |
| "valid_targets_min": 2650 |
| }, |
| { |
| "epoch": 3.7681159420289854, |
| "grad_norm": 0.46883840985224706, |
| "learning_rate": 2.0834945511895816e-05, |
| "loss": 0.1885, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1941649466753006, |
| "step": 2340, |
| "valid_targets_mean": 5603.5, |
| "valid_targets_min": 2498 |
| }, |
| { |
| "epoch": 3.7761674718196456, |
| "grad_norm": 0.4681238690714185, |
| "learning_rate": 2.0754702447043585e-05, |
| "loss": 0.1954, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1943756639957428, |
| "step": 2345, |
| "valid_targets_mean": 4566.8, |
| "valid_targets_min": 677 |
| }, |
| { |
| "epoch": 3.784219001610306, |
| "grad_norm": 0.4482811469832385, |
| "learning_rate": 2.0674447214246394e-05, |
| "loss": 0.2, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1913878321647644, |
| "step": 2350, |
| "valid_targets_mean": 5163.6, |
| "valid_targets_min": 2337 |
| }, |
| { |
| "epoch": 3.792270531400966, |
| "grad_norm": 0.47556405809315727, |
| "learning_rate": 2.059418110744633e-05, |
| "loss": 0.1922, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18677163124084473, |
| "step": 2355, |
| "valid_targets_mean": 4713.3, |
| "valid_targets_min": 933 |
| }, |
| { |
| "epoch": 3.8003220611916264, |
| "grad_norm": 0.4690759790686193, |
| "learning_rate": 2.0513905420760798e-05, |
| "loss": 0.1988, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.19385367631912231, |
| "step": 2360, |
| "valid_targets_mean": 4902.2, |
| "valid_targets_min": 627 |
| }, |
| { |
| "epoch": 3.8083735909822867, |
| "grad_norm": 0.5121675478037654, |
| "learning_rate": 2.043362144846164e-05, |
| "loss": 0.1957, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.19691093266010284, |
| "step": 2365, |
| "valid_targets_mean": 3866.6, |
| "valid_targets_min": 689 |
| }, |
| { |
| "epoch": 3.816425120772947, |
| "grad_norm": 0.52059333383564, |
| "learning_rate": 2.035333048495431e-05, |
| "loss": 0.1864, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16973920166492462, |
| "step": 2370, |
| "valid_targets_mean": 3510.0, |
| "valid_targets_min": 909 |
| }, |
| { |
| "epoch": 3.824476650563607, |
| "grad_norm": 0.5076146647866968, |
| "learning_rate": 2.0273033824756964e-05, |
| "loss": 0.2007, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17860174179077148, |
| "step": 2375, |
| "valid_targets_mean": 3703.1, |
| "valid_targets_min": 506 |
| }, |
| { |
| "epoch": 3.8325281803542675, |
| "grad_norm": 0.6011850519404554, |
| "learning_rate": 2.0192732762479616e-05, |
| "loss": 0.1908, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.20434610545635223, |
| "step": 2380, |
| "valid_targets_mean": 4579.6, |
| "valid_targets_min": 631 |
| }, |
| { |
| "epoch": 3.8405797101449277, |
| "grad_norm": 0.5345131849791486, |
| "learning_rate": 2.011242859280325e-05, |
| "loss": 0.197, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.21205343306064606, |
| "step": 2385, |
| "valid_targets_mean": 4124.2, |
| "valid_targets_min": 823 |
| }, |
| { |
| "epoch": 3.848631239935588, |
| "grad_norm": 0.5114321926687082, |
| "learning_rate": 2.0032122610458947e-05, |
| "loss": 0.1921, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17156703770160675, |
| "step": 2390, |
| "valid_targets_mean": 4274.9, |
| "valid_targets_min": 1740 |
| }, |
| { |
| "epoch": 3.8566827697262482, |
| "grad_norm": 0.6336174608958026, |
| "learning_rate": 1.9951816110207004e-05, |
| "loss": 0.1885, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1964995563030243, |
| "step": 2395, |
| "valid_targets_mean": 4251.1, |
| "valid_targets_min": 1610 |
| }, |
| { |
| "epoch": 3.864734299516908, |
| "grad_norm": 0.49492043165747124, |
| "learning_rate": 1.9871510386816103e-05, |
| "loss": 0.1869, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17603623867034912, |
| "step": 2400, |
| "valid_targets_mean": 4051.9, |
| "valid_targets_min": 1925 |
| }, |
| { |
| "epoch": 3.8727858293075683, |
| "grad_norm": 0.5681035881235681, |
| "learning_rate": 1.979120673504235e-05, |
| "loss": 0.2058, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.20705150067806244, |
| "step": 2405, |
| "valid_targets_mean": 5603.1, |
| "valid_targets_min": 3701 |
| }, |
| { |
| "epoch": 3.8808373590982286, |
| "grad_norm": 1.2929630707396456, |
| "learning_rate": 1.9710906449608498e-05, |
| "loss": 0.1998, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.19122429192066193, |
| "step": 2410, |
| "valid_targets_mean": 4886.8, |
| "valid_targets_min": 1569 |
| }, |
| { |
| "epoch": 3.888888888888889, |
| "grad_norm": 0.47492876907794285, |
| "learning_rate": 1.9630610825182992e-05, |
| "loss": 0.1871, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18603213131427765, |
| "step": 2415, |
| "valid_targets_mean": 4944.1, |
| "valid_targets_min": 1929 |
| }, |
| { |
| "epoch": 3.896940418679549, |
| "grad_norm": 0.5030538323026981, |
| "learning_rate": 1.955032115635915e-05, |
| "loss": 0.2138, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.22285720705986023, |
| "step": 2420, |
| "valid_targets_mean": 4422.1, |
| "valid_targets_min": 1352 |
| }, |
| { |
| "epoch": 3.9049919484702094, |
| "grad_norm": 0.5031818050359901, |
| "learning_rate": 1.9470038737634257e-05, |
| "loss": 0.1991, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.19892553985118866, |
| "step": 2425, |
| "valid_targets_mean": 4099.8, |
| "valid_targets_min": 1262 |
| }, |
| { |
| "epoch": 3.9130434782608696, |
| "grad_norm": 0.5757670497420159, |
| "learning_rate": 1.9389764863388706e-05, |
| "loss": 0.1797, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.19620567560195923, |
| "step": 2430, |
| "valid_targets_mean": 3868.5, |
| "valid_targets_min": 545 |
| }, |
| { |
| "epoch": 3.92109500805153, |
| "grad_norm": 0.48359405966706115, |
| "learning_rate": 1.9309500827865136e-05, |
| "loss": 0.191, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1803748607635498, |
| "step": 2435, |
| "valid_targets_mean": 4338.0, |
| "valid_targets_min": 1348 |
| }, |
| { |
| "epoch": 3.92914653784219, |
| "grad_norm": 0.4640923476833218, |
| "learning_rate": 1.9229247925147553e-05, |
| "loss": 0.1968, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1907849907875061, |
| "step": 2440, |
| "valid_targets_mean": 4583.9, |
| "valid_targets_min": 1771 |
| }, |
| { |
| "epoch": 3.9371980676328504, |
| "grad_norm": 0.5117773057032822, |
| "learning_rate": 1.9149007449140462e-05, |
| "loss": 0.1877, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17059685289859772, |
| "step": 2445, |
| "valid_targets_mean": 4338.1, |
| "valid_targets_min": 1784 |
| }, |
| { |
| "epoch": 3.9452495974235102, |
| "grad_norm": 0.5915049699700269, |
| "learning_rate": 1.906878069354804e-05, |
| "loss": 0.1955, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.21201738715171814, |
| "step": 2450, |
| "valid_targets_mean": 3018.6, |
| "valid_targets_min": 1027 |
| }, |
| { |
| "epoch": 3.9533011272141705, |
| "grad_norm": 0.47160593652811594, |
| "learning_rate": 1.898856895185322e-05, |
| "loss": 0.1862, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16955235600471497, |
| "step": 2455, |
| "valid_targets_mean": 4181.1, |
| "valid_targets_min": 1075 |
| }, |
| { |
| "epoch": 3.9613526570048307, |
| "grad_norm": 0.49702142957897827, |
| "learning_rate": 1.8908373517296888e-05, |
| "loss": 0.1943, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.19719739258289337, |
| "step": 2460, |
| "valid_targets_mean": 4295.4, |
| "valid_targets_min": 249 |
| }, |
| { |
| "epoch": 3.969404186795491, |
| "grad_norm": 0.5129921266484054, |
| "learning_rate": 1.882819568285701e-05, |
| "loss": 0.191, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.19295062124729156, |
| "step": 2465, |
| "valid_targets_mean": 3921.4, |
| "valid_targets_min": 966 |
| }, |
| { |
| "epoch": 3.9774557165861513, |
| "grad_norm": 0.45382648008126336, |
| "learning_rate": 1.874803674122778e-05, |
| "loss": 0.1929, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1945837438106537, |
| "step": 2470, |
| "valid_targets_mean": 5054.1, |
| "valid_targets_min": 1828 |
| }, |
| { |
| "epoch": 3.9855072463768115, |
| "grad_norm": 0.47820396478837407, |
| "learning_rate": 1.8667897984798804e-05, |
| "loss": 0.2066, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.21562841534614563, |
| "step": 2475, |
| "valid_targets_mean": 4692.4, |
| "valid_targets_min": 300 |
| }, |
| { |
| "epoch": 3.993558776167472, |
| "grad_norm": 0.539195337968872, |
| "learning_rate": 1.858778070563422e-05, |
| "loss": 0.1889, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1887316107749939, |
| "step": 2480, |
| "valid_targets_mean": 4306.7, |
| "valid_targets_min": 590 |
| }, |
| { |
| "epoch": 4.001610305958132, |
| "grad_norm": 0.5374780928948082, |
| "learning_rate": 1.8507686195451918e-05, |
| "loss": 0.194, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.25074928998947144, |
| "step": 2485, |
| "valid_targets_mean": 4598.8, |
| "valid_targets_min": 374 |
| }, |
| { |
| "epoch": 4.009661835748792, |
| "grad_norm": 0.4944011317477905, |
| "learning_rate": 1.8427615745602667e-05, |
| "loss": 0.1624, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15997666120529175, |
| "step": 2490, |
| "valid_targets_mean": 4936.9, |
| "valid_targets_min": 1591 |
| }, |
| { |
| "epoch": 4.017713365539453, |
| "grad_norm": 0.4765635224384645, |
| "learning_rate": 1.834757064704933e-05, |
| "loss": 0.1769, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1592136025428772, |
| "step": 2495, |
| "valid_targets_mean": 4652.1, |
| "valid_targets_min": 1149 |
| }, |
| { |
| "epoch": 4.025764895330113, |
| "grad_norm": 0.4956167235108182, |
| "learning_rate": 1.826755219034603e-05, |
| "loss": 0.1939, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.19604167342185974, |
| "step": 2500, |
| "valid_targets_mean": 4386.4, |
| "valid_targets_min": 380 |
| }, |
| { |
| "epoch": 4.033816425120773, |
| "grad_norm": 0.45476926402320006, |
| "learning_rate": 1.818756166561733e-05, |
| "loss": 0.1865, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1637008637189865, |
| "step": 2505, |
| "valid_targets_mean": 4699.8, |
| "valid_targets_min": 1197 |
| }, |
| { |
| "epoch": 4.041867954911433, |
| "grad_norm": 0.43733602489225165, |
| "learning_rate": 1.8107600362537473e-05, |
| "loss": 0.1778, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16251038014888763, |
| "step": 2510, |
| "valid_targets_mean": 4847.2, |
| "valid_targets_min": 1813 |
| }, |
| { |
| "epoch": 4.049919484702094, |
| "grad_norm": 0.49193894405362015, |
| "learning_rate": 1.8027669570309572e-05, |
| "loss": 0.1885, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16793620586395264, |
| "step": 2515, |
| "valid_targets_mean": 4591.9, |
| "valid_targets_min": 506 |
| }, |
| { |
| "epoch": 4.057971014492754, |
| "grad_norm": 0.5075017593056104, |
| "learning_rate": 1.7947770577644787e-05, |
| "loss": 0.1803, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1729605346918106, |
| "step": 2520, |
| "valid_targets_mean": 4395.8, |
| "valid_targets_min": 656 |
| }, |
| { |
| "epoch": 4.066022544283414, |
| "grad_norm": 0.499304090315969, |
| "learning_rate": 1.786790467274161e-05, |
| "loss": 0.1664, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17558912932872772, |
| "step": 2525, |
| "valid_targets_mean": 4637.6, |
| "valid_targets_min": 2011 |
| }, |
| { |
| "epoch": 4.074074074074074, |
| "grad_norm": 0.5559504833423238, |
| "learning_rate": 1.778807314326505e-05, |
| "loss": 0.1784, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18689918518066406, |
| "step": 2530, |
| "valid_targets_mean": 3930.3, |
| "valid_targets_min": 548 |
| }, |
| { |
| "epoch": 4.082125603864735, |
| "grad_norm": 0.47641769475056645, |
| "learning_rate": 1.7708277276325886e-05, |
| "loss": 0.1714, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1637909710407257, |
| "step": 2535, |
| "valid_targets_mean": 5154.6, |
| "valid_targets_min": 1826 |
| }, |
| { |
| "epoch": 4.090177133655395, |
| "grad_norm": 0.5182362997358064, |
| "learning_rate": 1.762851835845992e-05, |
| "loss": 0.1803, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18916486203670502, |
| "step": 2540, |
| "valid_targets_mean": 4544.1, |
| "valid_targets_min": 570 |
| }, |
| { |
| "epoch": 4.098228663446055, |
| "grad_norm": 0.4862343355871757, |
| "learning_rate": 1.754879767560723e-05, |
| "loss": 0.1981, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18593139946460724, |
| "step": 2545, |
| "valid_targets_mean": 4532.4, |
| "valid_targets_min": 1521 |
| }, |
| { |
| "epoch": 4.106280193236715, |
| "grad_norm": 0.527960071470203, |
| "learning_rate": 1.746911651309144e-05, |
| "loss": 0.1788, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.19690777361392975, |
| "step": 2550, |
| "valid_targets_mean": 3843.6, |
| "valid_targets_min": 881 |
| }, |
| { |
| "epoch": 4.114331723027375, |
| "grad_norm": 0.5103425212083436, |
| "learning_rate": 1.7389476155598974e-05, |
| "loss": 0.187, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.21908551454544067, |
| "step": 2555, |
| "valid_targets_mean": 5082.4, |
| "valid_targets_min": 784 |
| }, |
| { |
| "epoch": 4.122383252818035, |
| "grad_norm": 0.7756087805548777, |
| "learning_rate": 1.7309877887158388e-05, |
| "loss": 0.1832, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1794763058423996, |
| "step": 2560, |
| "valid_targets_mean": 2992.2, |
| "valid_targets_min": 467 |
| }, |
| { |
| "epoch": 4.130434782608695, |
| "grad_norm": 0.4567684656881922, |
| "learning_rate": 1.723032299111964e-05, |
| "loss": 0.1688, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15088678896427155, |
| "step": 2565, |
| "valid_targets_mean": 4922.8, |
| "valid_targets_min": 1327 |
| }, |
| { |
| "epoch": 4.138486312399356, |
| "grad_norm": 0.5425918961875108, |
| "learning_rate": 1.7150812750133382e-05, |
| "loss": 0.1775, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1673865020275116, |
| "step": 2570, |
| "valid_targets_mean": 3965.9, |
| "valid_targets_min": 1407 |
| }, |
| { |
| "epoch": 4.146537842190016, |
| "grad_norm": 0.6838407873867918, |
| "learning_rate": 1.707134844613032e-05, |
| "loss": 0.1818, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15312550961971283, |
| "step": 2575, |
| "valid_targets_mean": 4199.9, |
| "valid_targets_min": 1891 |
| }, |
| { |
| "epoch": 4.154589371980676, |
| "grad_norm": 0.5385560587074719, |
| "learning_rate": 1.699193136030052e-05, |
| "loss": 0.1984, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17279349267482758, |
| "step": 2580, |
| "valid_targets_mean": 3938.8, |
| "valid_targets_min": 880 |
| }, |
| { |
| "epoch": 4.162640901771336, |
| "grad_norm": 0.5502968325727028, |
| "learning_rate": 1.6912562773072765e-05, |
| "loss": 0.1787, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18601390719413757, |
| "step": 2585, |
| "valid_targets_mean": 4653.2, |
| "valid_targets_min": 2040 |
| }, |
| { |
| "epoch": 4.170692431561997, |
| "grad_norm": 0.5862578517681709, |
| "learning_rate": 1.6833243964093877e-05, |
| "loss": 0.1952, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2094813883304596, |
| "step": 2590, |
| "valid_targets_mean": 4215.5, |
| "valid_targets_min": 1508 |
| }, |
| { |
| "epoch": 4.178743961352657, |
| "grad_norm": 0.525233464465349, |
| "learning_rate": 1.6753976212208137e-05, |
| "loss": 0.1795, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17922204732894897, |
| "step": 2595, |
| "valid_targets_mean": 3851.4, |
| "valid_targets_min": 667 |
| }, |
| { |
| "epoch": 4.186795491143317, |
| "grad_norm": 0.6610861468502892, |
| "learning_rate": 1.667476079543664e-05, |
| "loss": 0.1907, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17614664137363434, |
| "step": 2600, |
| "valid_targets_mean": 3052.1, |
| "valid_targets_min": 691 |
| }, |
| { |
| "epoch": 4.194847020933977, |
| "grad_norm": 0.5630100784699484, |
| "learning_rate": 1.659559899095667e-05, |
| "loss": 0.1895, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.20966169238090515, |
| "step": 2605, |
| "valid_targets_mean": 5309.3, |
| "valid_targets_min": 1187 |
| }, |
| { |
| "epoch": 4.202898550724638, |
| "grad_norm": 0.6807488645292253, |
| "learning_rate": 1.651649207508114e-05, |
| "loss": 0.1771, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.19908779859542847, |
| "step": 2610, |
| "valid_targets_mean": 4216.5, |
| "valid_targets_min": 1027 |
| }, |
| { |
| "epoch": 4.210950080515298, |
| "grad_norm": 0.49692416499926767, |
| "learning_rate": 1.643744132323801e-05, |
| "loss": 0.1844, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.19740644097328186, |
| "step": 2615, |
| "valid_targets_mean": 4830.8, |
| "valid_targets_min": 1913 |
| }, |
| { |
| "epoch": 4.219001610305958, |
| "grad_norm": 0.6036326467813666, |
| "learning_rate": 1.6358448009949714e-05, |
| "loss": 0.1855, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.22196456789970398, |
| "step": 2620, |
| "valid_targets_mean": 5333.3, |
| "valid_targets_min": 2355 |
| }, |
| { |
| "epoch": 4.2270531400966185, |
| "grad_norm": 0.4829391874239536, |
| "learning_rate": 1.6279513408812603e-05, |
| "loss": 0.17, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1743869185447693, |
| "step": 2625, |
| "valid_targets_mean": 5413.8, |
| "valid_targets_min": 1251 |
| }, |
| { |
| "epoch": 4.235104669887279, |
| "grad_norm": 0.5048080599206834, |
| "learning_rate": 1.620063879247643e-05, |
| "loss": 0.1731, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16595719754695892, |
| "step": 2630, |
| "valid_targets_mean": 3924.2, |
| "valid_targets_min": 443 |
| }, |
| { |
| "epoch": 4.243156199677939, |
| "grad_norm": 0.46752510731782826, |
| "learning_rate": 1.6121825432623827e-05, |
| "loss": 0.1814, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1762651652097702, |
| "step": 2635, |
| "valid_targets_mean": 5055.4, |
| "valid_targets_min": 1403 |
| }, |
| { |
| "epoch": 4.251207729468599, |
| "grad_norm": 0.4797644865040805, |
| "learning_rate": 1.6043074599949785e-05, |
| "loss": 0.1808, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17031241953372955, |
| "step": 2640, |
| "valid_targets_mean": 4893.6, |
| "valid_targets_min": 966 |
| }, |
| { |
| "epoch": 4.2592592592592595, |
| "grad_norm": 1.0165849437996184, |
| "learning_rate": 1.5964387564141192e-05, |
| "loss": 0.1712, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.19583508372306824, |
| "step": 2645, |
| "valid_targets_mean": 4988.9, |
| "valid_targets_min": 1611 |
| }, |
| { |
| "epoch": 4.26731078904992, |
| "grad_norm": 0.6039054133342181, |
| "learning_rate": 1.588576559385635e-05, |
| "loss": 0.1827, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17843933403491974, |
| "step": 2650, |
| "valid_targets_mean": 4234.7, |
| "valid_targets_min": 1211 |
| }, |
| { |
| "epoch": 4.27536231884058, |
| "grad_norm": 0.512856167089867, |
| "learning_rate": 1.5807209956704505e-05, |
| "loss": 0.1945, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1996535062789917, |
| "step": 2655, |
| "valid_targets_mean": 4500.6, |
| "valid_targets_min": 1506 |
| }, |
| { |
| "epoch": 4.28341384863124, |
| "grad_norm": 0.4991515466828228, |
| "learning_rate": 1.5728721919225428e-05, |
| "loss": 0.1629, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14569713175296783, |
| "step": 2660, |
| "valid_targets_mean": 4720.1, |
| "valid_targets_min": 1211 |
| }, |
| { |
| "epoch": 4.291465378421901, |
| "grad_norm": 0.9601831661650259, |
| "learning_rate": 1.5650302746869004e-05, |
| "loss": 0.1857, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1880815625190735, |
| "step": 2665, |
| "valid_targets_mean": 4171.6, |
| "valid_targets_min": 833 |
| }, |
| { |
| "epoch": 4.29951690821256, |
| "grad_norm": 0.4412736536027149, |
| "learning_rate": 1.5571953703974813e-05, |
| "loss": 0.1752, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16794951260089874, |
| "step": 2670, |
| "valid_targets_mean": 5724.5, |
| "valid_targets_min": 2565 |
| }, |
| { |
| "epoch": 4.30756843800322, |
| "grad_norm": 0.49660094639156666, |
| "learning_rate": 1.5493676053751747e-05, |
| "loss": 0.1701, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17535799741744995, |
| "step": 2675, |
| "valid_targets_mean": 4800.3, |
| "valid_targets_min": 1829 |
| }, |
| { |
| "epoch": 4.3156199677938805, |
| "grad_norm": 0.5456531223844872, |
| "learning_rate": 1.5415471058257638e-05, |
| "loss": 0.1783, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17335663735866547, |
| "step": 2680, |
| "valid_targets_mean": 4570.4, |
| "valid_targets_min": 1658 |
| }, |
| { |
| "epoch": 4.323671497584541, |
| "grad_norm": 0.45678206025420953, |
| "learning_rate": 1.533733997837893e-05, |
| "loss": 0.187, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.169780433177948, |
| "step": 2685, |
| "valid_targets_mean": 4216.1, |
| "valid_targets_min": 1449 |
| }, |
| { |
| "epoch": 4.331723027375201, |
| "grad_norm": 0.5415606665772222, |
| "learning_rate": 1.5259284073810333e-05, |
| "loss": 0.1787, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16021227836608887, |
| "step": 2690, |
| "valid_targets_mean": 3275.1, |
| "valid_targets_min": 984 |
| }, |
| { |
| "epoch": 4.339774557165861, |
| "grad_norm": 0.5136691048212793, |
| "learning_rate": 1.5181304603034513e-05, |
| "loss": 0.1914, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1827298104763031, |
| "step": 2695, |
| "valid_targets_mean": 4889.6, |
| "valid_targets_min": 1238 |
| }, |
| { |
| "epoch": 4.3478260869565215, |
| "grad_norm": 1.4914173173538663, |
| "learning_rate": 1.5103402823301819e-05, |
| "loss": 0.1838, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18776141107082367, |
| "step": 2700, |
| "valid_targets_mean": 4532.6, |
| "valid_targets_min": 850 |
| }, |
| { |
| "epoch": 4.355877616747182, |
| "grad_norm": 0.5083803805655037, |
| "learning_rate": 1.5025579990609973e-05, |
| "loss": 0.1821, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16755394637584686, |
| "step": 2705, |
| "valid_targets_mean": 4128.1, |
| "valid_targets_min": 379 |
| }, |
| { |
| "epoch": 4.363929146537842, |
| "grad_norm": 0.500974762279468, |
| "learning_rate": 1.4947837359683882e-05, |
| "loss": 0.1829, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17978541553020477, |
| "step": 2710, |
| "valid_targets_mean": 5342.4, |
| "valid_targets_min": 2152 |
| }, |
| { |
| "epoch": 4.371980676328502, |
| "grad_norm": 0.5603545589277986, |
| "learning_rate": 1.487017618395534e-05, |
| "loss": 0.1781, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.198044091463089, |
| "step": 2715, |
| "valid_targets_mean": 4740.4, |
| "valid_targets_min": 1746 |
| }, |
| { |
| "epoch": 4.3800322061191626, |
| "grad_norm": 0.4771112752411543, |
| "learning_rate": 1.479259771554288e-05, |
| "loss": 0.1931, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1699572205543518, |
| "step": 2720, |
| "valid_targets_mean": 4872.8, |
| "valid_targets_min": 448 |
| }, |
| { |
| "epoch": 4.388083735909823, |
| "grad_norm": 0.521661536652827, |
| "learning_rate": 1.4715103205231545e-05, |
| "loss": 0.1898, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18613924086093903, |
| "step": 2725, |
| "valid_targets_mean": 4061.7, |
| "valid_targets_min": 995 |
| }, |
| { |
| "epoch": 4.396135265700483, |
| "grad_norm": 0.537250383283014, |
| "learning_rate": 1.463769390245273e-05, |
| "loss": 0.1794, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.178946852684021, |
| "step": 2730, |
| "valid_targets_mean": 4061.8, |
| "valid_targets_min": 900 |
| }, |
| { |
| "epoch": 4.404186795491143, |
| "grad_norm": 0.5244437127559632, |
| "learning_rate": 1.4560371055264052e-05, |
| "loss": 0.1787, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18043842911720276, |
| "step": 2735, |
| "valid_targets_mean": 4802.7, |
| "valid_targets_min": 1843 |
| }, |
| { |
| "epoch": 4.412238325281804, |
| "grad_norm": 0.5146870682156327, |
| "learning_rate": 1.448313591032922e-05, |
| "loss": 0.1887, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17479149997234344, |
| "step": 2740, |
| "valid_targets_mean": 5214.2, |
| "valid_targets_min": 1866 |
| }, |
| { |
| "epoch": 4.420289855072464, |
| "grad_norm": 0.4691547439815975, |
| "learning_rate": 1.4405989712897923e-05, |
| "loss": 0.1853, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18224862217903137, |
| "step": 2745, |
| "valid_targets_mean": 5050.6, |
| "valid_targets_min": 1427 |
| }, |
| { |
| "epoch": 4.428341384863124, |
| "grad_norm": 0.5424155500541844, |
| "learning_rate": 1.4328933706785782e-05, |
| "loss": 0.1695, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1883089393377304, |
| "step": 2750, |
| "valid_targets_mean": 4057.4, |
| "valid_targets_min": 854 |
| }, |
| { |
| "epoch": 4.436392914653784, |
| "grad_norm": 0.5100283152717094, |
| "learning_rate": 1.4251969134354247e-05, |
| "loss": 0.1703, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16344183683395386, |
| "step": 2755, |
| "valid_targets_mean": 4199.4, |
| "valid_targets_min": 1557 |
| }, |
| { |
| "epoch": 4.444444444444445, |
| "grad_norm": 0.5071596893081406, |
| "learning_rate": 1.4175097236490627e-05, |
| "loss": 0.1772, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1783141791820526, |
| "step": 2760, |
| "valid_targets_mean": 4905.3, |
| "valid_targets_min": 383 |
| }, |
| { |
| "epoch": 4.452495974235105, |
| "grad_norm": 0.4808405938396642, |
| "learning_rate": 1.409831925258805e-05, |
| "loss": 0.1864, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.19857333600521088, |
| "step": 2765, |
| "valid_targets_mean": 4961.1, |
| "valid_targets_min": 847 |
| }, |
| { |
| "epoch": 4.460547504025765, |
| "grad_norm": 0.48057741594526054, |
| "learning_rate": 1.4021636420525466e-05, |
| "loss": 0.1824, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1644965559244156, |
| "step": 2770, |
| "valid_targets_mean": 4509.1, |
| "valid_targets_min": 1227 |
| }, |
| { |
| "epoch": 4.468599033816425, |
| "grad_norm": 0.5128321881887902, |
| "learning_rate": 1.3945049976647726e-05, |
| "loss": 0.1766, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1749866008758545, |
| "step": 2775, |
| "valid_targets_mean": 4825.0, |
| "valid_targets_min": 1201 |
| }, |
| { |
| "epoch": 4.476650563607086, |
| "grad_norm": 0.6327024505387485, |
| "learning_rate": 1.3868561155745628e-05, |
| "loss": 0.1917, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.19712504744529724, |
| "step": 2780, |
| "valid_targets_mean": 4430.3, |
| "valid_targets_min": 703 |
| }, |
| { |
| "epoch": 4.484702093397746, |
| "grad_norm": 0.4913167577071679, |
| "learning_rate": 1.3792171191036001e-05, |
| "loss": 0.1769, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15714874863624573, |
| "step": 2785, |
| "valid_targets_mean": 4104.7, |
| "valid_targets_min": 1663 |
| }, |
| { |
| "epoch": 4.492753623188406, |
| "grad_norm": 0.5394186960786538, |
| "learning_rate": 1.3715881314141835e-05, |
| "loss": 0.1902, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.19951429963111877, |
| "step": 2790, |
| "valid_targets_mean": 4620.1, |
| "valid_targets_min": 1843 |
| }, |
| { |
| "epoch": 4.500805152979066, |
| "grad_norm": 0.5953737763754138, |
| "learning_rate": 1.3639692755072429e-05, |
| "loss": 0.1882, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2141798585653305, |
| "step": 2795, |
| "valid_targets_mean": 4660.8, |
| "valid_targets_min": 1401 |
| }, |
| { |
| "epoch": 4.508856682769727, |
| "grad_norm": 0.5453366269316137, |
| "learning_rate": 1.3563606742203548e-05, |
| "loss": 0.1969, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.20897048711776733, |
| "step": 2800, |
| "valid_targets_mean": 4447.4, |
| "valid_targets_min": 1113 |
| }, |
| { |
| "epoch": 4.516908212560386, |
| "grad_norm": 0.531617180983723, |
| "learning_rate": 1.3487624502257598e-05, |
| "loss": 0.18, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.20468959212303162, |
| "step": 2805, |
| "valid_targets_mean": 4891.9, |
| "valid_targets_min": 2624 |
| }, |
| { |
| "epoch": 4.524959742351046, |
| "grad_norm": 1.0175978905323302, |
| "learning_rate": 1.3411747260283905e-05, |
| "loss": 0.1882, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1867702454328537, |
| "step": 2810, |
| "valid_targets_mean": 4380.1, |
| "valid_targets_min": 800 |
| }, |
| { |
| "epoch": 4.533011272141707, |
| "grad_norm": 0.5172120222306495, |
| "learning_rate": 1.333597623963892e-05, |
| "loss": 0.178, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17019790410995483, |
| "step": 2815, |
| "valid_targets_mean": 4795.6, |
| "valid_targets_min": 626 |
| }, |
| { |
| "epoch": 4.541062801932367, |
| "grad_norm": 0.6059009807629652, |
| "learning_rate": 1.3260312661966487e-05, |
| "loss": 0.18, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17550814151763916, |
| "step": 2820, |
| "valid_targets_mean": 5061.1, |
| "valid_targets_min": 1263 |
| }, |
| { |
| "epoch": 4.549114331723027, |
| "grad_norm": 0.613180864431363, |
| "learning_rate": 1.3184757747178187e-05, |
| "loss": 0.1758, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.19658298790454865, |
| "step": 2825, |
| "valid_targets_mean": 5041.3, |
| "valid_targets_min": 1795 |
| }, |
| { |
| "epoch": 4.557165861513687, |
| "grad_norm": 0.5633900947396653, |
| "learning_rate": 1.3109312713433642e-05, |
| "loss": 0.1734, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18244323134422302, |
| "step": 2830, |
| "valid_targets_mean": 4282.2, |
| "valid_targets_min": 543 |
| }, |
| { |
| "epoch": 4.565217391304348, |
| "grad_norm": 0.9588780998775635, |
| "learning_rate": 1.3033978777120861e-05, |
| "loss": 0.1718, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1690833568572998, |
| "step": 2835, |
| "valid_targets_mean": 3991.0, |
| "valid_targets_min": 1088 |
| }, |
| { |
| "epoch": 4.573268921095008, |
| "grad_norm": 0.5205077973662069, |
| "learning_rate": 1.2958757152836671e-05, |
| "loss": 0.1842, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.22376713156700134, |
| "step": 2840, |
| "valid_targets_mean": 4458.4, |
| "valid_targets_min": 2143 |
| }, |
| { |
| "epoch": 4.581320450885668, |
| "grad_norm": 0.5253874104264332, |
| "learning_rate": 1.2883649053367106e-05, |
| "loss": 0.1808, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1675848662853241, |
| "step": 2845, |
| "valid_targets_mean": 4003.0, |
| "valid_targets_min": 845 |
| }, |
| { |
| "epoch": 4.5893719806763285, |
| "grad_norm": 0.5452379881212879, |
| "learning_rate": 1.2808655689667846e-05, |
| "loss": 0.1818, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1796257197856903, |
| "step": 2850, |
| "valid_targets_mean": 4152.3, |
| "valid_targets_min": 455 |
| }, |
| { |
| "epoch": 4.597423510466989, |
| "grad_norm": 0.5239905621350787, |
| "learning_rate": 1.2733778270844712e-05, |
| "loss": 0.1889, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18232783675193787, |
| "step": 2855, |
| "valid_targets_mean": 4419.6, |
| "valid_targets_min": 529 |
| }, |
| { |
| "epoch": 4.605475040257649, |
| "grad_norm": 0.5607032815508621, |
| "learning_rate": 1.265901800413416e-05, |
| "loss": 0.1853, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17835384607315063, |
| "step": 2860, |
| "valid_targets_mean": 3395.8, |
| "valid_targets_min": 627 |
| }, |
| { |
| "epoch": 4.613526570048309, |
| "grad_norm": 0.9496967272226038, |
| "learning_rate": 1.2584376094883832e-05, |
| "loss": 0.1845, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17716357111930847, |
| "step": 2865, |
| "valid_targets_mean": 4483.6, |
| "valid_targets_min": 710 |
| }, |
| { |
| "epoch": 4.6215780998389695, |
| "grad_norm": 0.7842117859067653, |
| "learning_rate": 1.250985374653311e-05, |
| "loss": 0.1784, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17786236107349396, |
| "step": 2870, |
| "valid_targets_mean": 4693.0, |
| "valid_targets_min": 1134 |
| }, |
| { |
| "epoch": 4.62962962962963, |
| "grad_norm": 0.5033684151280889, |
| "learning_rate": 1.2435452160593698e-05, |
| "loss": 0.1874, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17148058116436005, |
| "step": 2875, |
| "valid_targets_mean": 4303.3, |
| "valid_targets_min": 1429 |
| }, |
| { |
| "epoch": 4.63768115942029, |
| "grad_norm": 0.5032006756891246, |
| "learning_rate": 1.2361172536630288e-05, |
| "loss": 0.182, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16900071501731873, |
| "step": 2880, |
| "valid_targets_mean": 4471.4, |
| "valid_targets_min": 1507 |
| }, |
| { |
| "epoch": 4.64573268921095, |
| "grad_norm": 0.5449401674057853, |
| "learning_rate": 1.2287016072241195e-05, |
| "loss": 0.2019, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.19873306155204773, |
| "step": 2885, |
| "valid_targets_mean": 4050.9, |
| "valid_targets_min": 321 |
| }, |
| { |
| "epoch": 4.6537842190016105, |
| "grad_norm": 0.5002283792241559, |
| "learning_rate": 1.221298396303904e-05, |
| "loss": 0.1746, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17124618589878082, |
| "step": 2890, |
| "valid_targets_mean": 5187.2, |
| "valid_targets_min": 1399 |
| }, |
| { |
| "epoch": 4.661835748792271, |
| "grad_norm": 0.4706451280493202, |
| "learning_rate": 1.2139077402631495e-05, |
| "loss": 0.1721, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14620235562324524, |
| "step": 2895, |
| "valid_targets_mean": 4477.4, |
| "valid_targets_min": 1454 |
| }, |
| { |
| "epoch": 4.669887278582931, |
| "grad_norm": 0.5330785987823722, |
| "learning_rate": 1.2065297582602037e-05, |
| "loss": 0.1724, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17816966772079468, |
| "step": 2900, |
| "valid_targets_mean": 4355.4, |
| "valid_targets_min": 2065 |
| }, |
| { |
| "epoch": 4.677938808373591, |
| "grad_norm": 0.4942305241126504, |
| "learning_rate": 1.199164569249071e-05, |
| "loss": 0.1832, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18558406829833984, |
| "step": 2905, |
| "valid_targets_mean": 4951.6, |
| "valid_targets_min": 1299 |
| }, |
| { |
| "epoch": 4.685990338164252, |
| "grad_norm": 0.537628904978011, |
| "learning_rate": 1.191812291977497e-05, |
| "loss": 0.1826, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.19403138756752014, |
| "step": 2910, |
| "valid_targets_mean": 4024.0, |
| "valid_targets_min": 1450 |
| }, |
| { |
| "epoch": 4.694041867954912, |
| "grad_norm": 0.5439040484202802, |
| "learning_rate": 1.1844730449850546e-05, |
| "loss": 0.1782, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.19234639406204224, |
| "step": 2915, |
| "valid_targets_mean": 5036.8, |
| "valid_targets_min": 1058 |
| }, |
| { |
| "epoch": 4.702093397745571, |
| "grad_norm": 0.583242909808935, |
| "learning_rate": 1.1771469466012309e-05, |
| "loss": 0.1768, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.20131342113018036, |
| "step": 2920, |
| "valid_targets_mean": 4106.1, |
| "valid_targets_min": 983 |
| }, |
| { |
| "epoch": 4.710144927536232, |
| "grad_norm": 0.5038233636197879, |
| "learning_rate": 1.1698341149435196e-05, |
| "loss": 0.1849, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1684148907661438, |
| "step": 2925, |
| "valid_targets_mean": 4802.6, |
| "valid_targets_min": 1952 |
| }, |
| { |
| "epoch": 4.718196457326892, |
| "grad_norm": 0.4600414999991662, |
| "learning_rate": 1.1625346679155179e-05, |
| "loss": 0.1878, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15985998511314392, |
| "step": 2930, |
| "valid_targets_mean": 4799.9, |
| "valid_targets_min": 1859 |
| }, |
| { |
| "epoch": 4.726247987117552, |
| "grad_norm": 0.4936755991303249, |
| "learning_rate": 1.1552487232050242e-05, |
| "loss": 0.1827, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17861491441726685, |
| "step": 2935, |
| "valid_targets_mean": 4306.8, |
| "valid_targets_min": 1605 |
| }, |
| { |
| "epoch": 4.734299516908212, |
| "grad_norm": 0.44442070244437953, |
| "learning_rate": 1.1479763982821414e-05, |
| "loss": 0.1711, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17784011363983154, |
| "step": 2940, |
| "valid_targets_mean": 5608.9, |
| "valid_targets_min": 1956 |
| }, |
| { |
| "epoch": 4.7423510466988725, |
| "grad_norm": 0.5637401886713175, |
| "learning_rate": 1.1407178103973834e-05, |
| "loss": 0.1983, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18229396641254425, |
| "step": 2945, |
| "valid_targets_mean": 3870.8, |
| "valid_targets_min": 864 |
| }, |
| { |
| "epoch": 4.750402576489533, |
| "grad_norm": 0.45308334583470944, |
| "learning_rate": 1.1334730765797843e-05, |
| "loss": 0.1841, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.19959984719753265, |
| "step": 2950, |
| "valid_targets_mean": 5085.4, |
| "valid_targets_min": 1791 |
| }, |
| { |
| "epoch": 4.758454106280193, |
| "grad_norm": 0.5571182515606663, |
| "learning_rate": 1.1262423136350087e-05, |
| "loss": 0.1956, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.22160165011882782, |
| "step": 2955, |
| "valid_targets_mean": 3792.0, |
| "valid_targets_min": 1099 |
| }, |
| { |
| "epoch": 4.766505636070853, |
| "grad_norm": 0.5901554994508056, |
| "learning_rate": 1.1190256381434738e-05, |
| "loss": 0.186, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17873704433441162, |
| "step": 2960, |
| "valid_targets_mean": 3899.3, |
| "valid_targets_min": 778 |
| }, |
| { |
| "epoch": 4.774557165861514, |
| "grad_norm": 0.5158336477050018, |
| "learning_rate": 1.1118231664584674e-05, |
| "loss": 0.1689, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1886855959892273, |
| "step": 2965, |
| "valid_targets_mean": 4861.4, |
| "valid_targets_min": 1898 |
| }, |
| { |
| "epoch": 4.782608695652174, |
| "grad_norm": 0.4887213717876692, |
| "learning_rate": 1.1046350147042681e-05, |
| "loss": 0.187, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.20001167058944702, |
| "step": 2970, |
| "valid_targets_mean": 4675.2, |
| "valid_targets_min": 952 |
| }, |
| { |
| "epoch": 4.790660225442834, |
| "grad_norm": 0.48768071610571156, |
| "learning_rate": 1.0974612987742807e-05, |
| "loss": 0.1864, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18149898946285248, |
| "step": 2975, |
| "valid_targets_mean": 4411.8, |
| "valid_targets_min": 1129 |
| }, |
| { |
| "epoch": 4.798711755233494, |
| "grad_norm": 0.4873268036344298, |
| "learning_rate": 1.0903021343291613e-05, |
| "loss": 0.1926, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.20546609163284302, |
| "step": 2980, |
| "valid_targets_mean": 4418.5, |
| "valid_targets_min": 608 |
| }, |
| { |
| "epoch": 4.806763285024155, |
| "grad_norm": 0.5054671612514106, |
| "learning_rate": 1.0831576367949555e-05, |
| "loss": 0.1886, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18941310048103333, |
| "step": 2985, |
| "valid_targets_mean": 4868.4, |
| "valid_targets_min": 2311 |
| }, |
| { |
| "epoch": 4.814814814814815, |
| "grad_norm": 0.5242076423511247, |
| "learning_rate": 1.0760279213612362e-05, |
| "loss": 0.1738, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16793029010295868, |
| "step": 2990, |
| "valid_targets_mean": 5404.2, |
| "valid_targets_min": 2117 |
| }, |
| { |
| "epoch": 4.822866344605475, |
| "grad_norm": 0.6828436818331252, |
| "learning_rate": 1.068913102979248e-05, |
| "loss": 0.1858, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.19285649061203003, |
| "step": 2995, |
| "valid_targets_mean": 3826.8, |
| "valid_targets_min": 1070 |
| }, |
| { |
| "epoch": 4.830917874396135, |
| "grad_norm": 0.47219942742537285, |
| "learning_rate": 1.0618132963600507e-05, |
| "loss": 0.1784, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18546539545059204, |
| "step": 3000, |
| "valid_targets_mean": 5087.4, |
| "valid_targets_min": 1959 |
| }, |
| { |
| "epoch": 4.838969404186796, |
| "grad_norm": 0.4457820811603146, |
| "learning_rate": 1.0547286159726743e-05, |
| "loss": 0.1801, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.19360345602035522, |
| "step": 3005, |
| "valid_targets_mean": 5867.6, |
| "valid_targets_min": 1035 |
| }, |
| { |
| "epoch": 4.847020933977456, |
| "grad_norm": 0.5847539672595908, |
| "learning_rate": 1.047659176042268e-05, |
| "loss": 0.1645, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16391941905021667, |
| "step": 3010, |
| "valid_targets_mean": 3891.6, |
| "valid_targets_min": 578 |
| }, |
| { |
| "epoch": 4.855072463768116, |
| "grad_norm": 0.5080943188478495, |
| "learning_rate": 1.0406050905482647e-05, |
| "loss": 0.1756, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1736719310283661, |
| "step": 3015, |
| "valid_targets_mean": 4204.6, |
| "valid_targets_min": 631 |
| }, |
| { |
| "epoch": 4.8631239935587764, |
| "grad_norm": 0.4950021070139557, |
| "learning_rate": 1.033566473222539e-05, |
| "loss": 0.1688, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16896328330039978, |
| "step": 3020, |
| "valid_targets_mean": 5143.3, |
| "valid_targets_min": 2767 |
| }, |
| { |
| "epoch": 4.871175523349437, |
| "grad_norm": 0.5149173904980839, |
| "learning_rate": 1.0265434375475744e-05, |
| "loss": 0.1751, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1894487589597702, |
| "step": 3025, |
| "valid_targets_mean": 4708.5, |
| "valid_targets_min": 656 |
| }, |
| { |
| "epoch": 4.879227053140097, |
| "grad_norm": 0.5128722203180325, |
| "learning_rate": 1.0195360967546342e-05, |
| "loss": 0.1723, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18005244433879852, |
| "step": 3030, |
| "valid_targets_mean": 5025.9, |
| "valid_targets_min": 1716 |
| }, |
| { |
| "epoch": 4.887278582930757, |
| "grad_norm": 0.5010958581493115, |
| "learning_rate": 1.0125445638219369e-05, |
| "loss": 0.1871, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.19406850636005402, |
| "step": 3035, |
| "valid_targets_mean": 4813.1, |
| "valid_targets_min": 908 |
| }, |
| { |
| "epoch": 4.8953301127214175, |
| "grad_norm": 0.5210294803713594, |
| "learning_rate": 1.00556895147283e-05, |
| "loss": 0.1727, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16892248392105103, |
| "step": 3040, |
| "valid_targets_mean": 3893.8, |
| "valid_targets_min": 1273 |
| }, |
| { |
| "epoch": 4.903381642512077, |
| "grad_norm": 0.6293372498483756, |
| "learning_rate": 9.986093721739793e-06, |
| "loss": 0.1872, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1870511919260025, |
| "step": 3045, |
| "valid_targets_mean": 3776.4, |
| "valid_targets_min": 296 |
| }, |
| { |
| "epoch": 4.911433172302738, |
| "grad_norm": 0.5480638562689124, |
| "learning_rate": 9.916659381335524e-06, |
| "loss": 0.1888, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15634512901306152, |
| "step": 3050, |
| "valid_targets_mean": 4189.9, |
| "valid_targets_min": 1195 |
| }, |
| { |
| "epoch": 4.919484702093397, |
| "grad_norm": 0.5734404649785564, |
| "learning_rate": 9.847387612994065e-06, |
| "loss": 0.1648, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1715972125530243, |
| "step": 3055, |
| "valid_targets_mean": 4624.1, |
| "valid_targets_min": 999 |
| }, |
| { |
| "epoch": 4.927536231884058, |
| "grad_norm": 0.4755904568874477, |
| "learning_rate": 9.778279533572894e-06, |
| "loss": 0.1792, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1521787941455841, |
| "step": 3060, |
| "valid_targets_mean": 4754.1, |
| "valid_targets_min": 1047 |
| }, |
| { |
| "epoch": 4.935587761674718, |
| "grad_norm": 0.7122666442809198, |
| "learning_rate": 9.70933625729035e-06, |
| "loss": 0.1822, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17114746570587158, |
| "step": 3065, |
| "valid_targets_mean": 5142.9, |
| "valid_targets_min": 1175 |
| }, |
| { |
| "epoch": 4.943639291465378, |
| "grad_norm": 0.7359607180808936, |
| "learning_rate": 9.640558895707681e-06, |
| "loss": 0.1732, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18806086480617523, |
| "step": 3070, |
| "valid_targets_mean": 4064.7, |
| "valid_targets_min": 1615 |
| }, |
| { |
| "epoch": 4.951690821256038, |
| "grad_norm": 0.5379368590841539, |
| "learning_rate": 9.571948557711104e-06, |
| "loss": 0.1825, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17751240730285645, |
| "step": 3075, |
| "valid_targets_mean": 3381.2, |
| "valid_targets_min": 249 |
| }, |
| { |
| "epoch": 4.959742351046699, |
| "grad_norm": 0.4777499224064591, |
| "learning_rate": 9.503506349493959e-06, |
| "loss": 0.1772, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1592390239238739, |
| "step": 3080, |
| "valid_targets_mean": 4629.0, |
| "valid_targets_min": 1254 |
| }, |
| { |
| "epoch": 4.967793880837359, |
| "grad_norm": 0.5139616446857665, |
| "learning_rate": 9.435233374538848e-06, |
| "loss": 0.1778, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18165704607963562, |
| "step": 3085, |
| "valid_targets_mean": 4665.1, |
| "valid_targets_min": 1736 |
| }, |
| { |
| "epoch": 4.975845410628019, |
| "grad_norm": 0.5162555365137094, |
| "learning_rate": 9.367130733599863e-06, |
| "loss": 0.1706, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.19067494571208954, |
| "step": 3090, |
| "valid_targets_mean": 4688.7, |
| "valid_targets_min": 1872 |
| }, |
| { |
| "epoch": 4.9838969404186795, |
| "grad_norm": 0.569575182274062, |
| "learning_rate": 9.299199524684815e-06, |
| "loss": 0.1671, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16250163316726685, |
| "step": 3095, |
| "valid_targets_mean": 4311.8, |
| "valid_targets_min": 1994 |
| }, |
| { |
| "epoch": 4.99194847020934, |
| "grad_norm": 0.5520222968798817, |
| "learning_rate": 9.23144084303756e-06, |
| "loss": 0.1803, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1921304166316986, |
| "step": 3100, |
| "valid_targets_mean": 4493.3, |
| "valid_targets_min": 2050 |
| }, |
| { |
| "epoch": 5.0, |
| "grad_norm": 0.7884221741023202, |
| "learning_rate": 9.163855781120302e-06, |
| "loss": 0.1794, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.20062533020973206, |
| "step": 3105, |
| "valid_targets_mean": 3796.8, |
| "valid_targets_min": 374 |
| }, |
| { |
| "epoch": 5.00805152979066, |
| "grad_norm": 0.5195634108838502, |
| "learning_rate": 9.096445428596026e-06, |
| "loss": 0.1668, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1869000345468521, |
| "step": 3110, |
| "valid_targets_mean": 4366.8, |
| "valid_targets_min": 1253 |
| }, |
| { |
| "epoch": 5.0161030595813205, |
| "grad_norm": 0.5278497870764118, |
| "learning_rate": 9.029210872310884e-06, |
| "loss": 0.1648, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1439373940229416, |
| "step": 3115, |
| "valid_targets_mean": 4365.9, |
| "valid_targets_min": 554 |
| }, |
| { |
| "epoch": 5.024154589371981, |
| "grad_norm": 0.5284272892101102, |
| "learning_rate": 8.962153196276713e-06, |
| "loss": 0.1692, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14253228902816772, |
| "step": 3120, |
| "valid_targets_mean": 4662.7, |
| "valid_targets_min": 312 |
| }, |
| { |
| "epoch": 5.032206119162641, |
| "grad_norm": 0.5474998021835664, |
| "learning_rate": 8.895273481653527e-06, |
| "loss": 0.1734, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17854666709899902, |
| "step": 3125, |
| "valid_targets_mean": 4428.5, |
| "valid_targets_min": 627 |
| }, |
| { |
| "epoch": 5.040257648953301, |
| "grad_norm": 1.2329548853780503, |
| "learning_rate": 8.828572806732103e-06, |
| "loss": 0.1709, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1708088219165802, |
| "step": 3130, |
| "valid_targets_mean": 4686.6, |
| "valid_targets_min": 1916 |
| }, |
| { |
| "epoch": 5.048309178743962, |
| "grad_norm": 0.5097310950347612, |
| "learning_rate": 8.76205224691659e-06, |
| "loss": 0.1707, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17174428701400757, |
| "step": 3135, |
| "valid_targets_mean": 4785.3, |
| "valid_targets_min": 1860 |
| }, |
| { |
| "epoch": 5.056360708534622, |
| "grad_norm": 0.46008600902359126, |
| "learning_rate": 8.695712874707169e-06, |
| "loss": 0.167, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16250503063201904, |
| "step": 3140, |
| "valid_targets_mean": 4901.8, |
| "valid_targets_min": 402 |
| }, |
| { |
| "epoch": 5.064412238325282, |
| "grad_norm": 0.47656692190311706, |
| "learning_rate": 8.629555759682756e-06, |
| "loss": 0.1676, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15433499217033386, |
| "step": 3145, |
| "valid_targets_mean": 5206.9, |
| "valid_targets_min": 892 |
| }, |
| { |
| "epoch": 5.072463768115942, |
| "grad_norm": 0.46684035634871635, |
| "learning_rate": 8.563581968483774e-06, |
| "loss": 0.1882, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15580695867538452, |
| "step": 3150, |
| "valid_targets_mean": 4968.5, |
| "valid_targets_min": 1514 |
| }, |
| { |
| "epoch": 5.080515297906603, |
| "grad_norm": 0.4817709325187039, |
| "learning_rate": 8.497792564794935e-06, |
| "loss": 0.1742, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1596037745475769, |
| "step": 3155, |
| "valid_targets_mean": 4873.9, |
| "valid_targets_min": 656 |
| }, |
| { |
| "epoch": 5.088566827697263, |
| "grad_norm": 0.49561234768208556, |
| "learning_rate": 8.432188609328112e-06, |
| "loss": 0.1795, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18620729446411133, |
| "step": 3160, |
| "valid_targets_mean": 4277.6, |
| "valid_targets_min": 429 |
| }, |
| { |
| "epoch": 5.096618357487923, |
| "grad_norm": 0.5342689640020111, |
| "learning_rate": 8.366771159805222e-06, |
| "loss": 0.1614, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1623041033744812, |
| "step": 3165, |
| "valid_targets_mean": 3849.9, |
| "valid_targets_min": 1692 |
| }, |
| { |
| "epoch": 5.1046698872785825, |
| "grad_norm": 0.5558864483320473, |
| "learning_rate": 8.301541270941178e-06, |
| "loss": 0.1744, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.19302302598953247, |
| "step": 3170, |
| "valid_targets_mean": 3954.7, |
| "valid_targets_min": 894 |
| }, |
| { |
| "epoch": 5.112721417069243, |
| "grad_norm": 0.5483085784932584, |
| "learning_rate": 8.236499994426886e-06, |
| "loss": 0.1635, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17752034962177277, |
| "step": 3175, |
| "valid_targets_mean": 4114.2, |
| "valid_targets_min": 321 |
| }, |
| { |
| "epoch": 5.120772946859903, |
| "grad_norm": 0.5129349338303597, |
| "learning_rate": 8.171648378912272e-06, |
| "loss": 0.1732, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1786811649799347, |
| "step": 3180, |
| "valid_targets_mean": 5010.1, |
| "valid_targets_min": 1693 |
| }, |
| { |
| "epoch": 5.128824476650563, |
| "grad_norm": 0.47618052790196236, |
| "learning_rate": 8.1069874699894e-06, |
| "loss": 0.1617, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14539986848831177, |
| "step": 3185, |
| "valid_targets_mean": 4915.1, |
| "valid_targets_min": 1295 |
| }, |
| { |
| "epoch": 5.1368760064412236, |
| "grad_norm": 0.5408793562526828, |
| "learning_rate": 8.042518310175607e-06, |
| "loss": 0.1729, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1692083477973938, |
| "step": 3190, |
| "valid_targets_mean": 4689.8, |
| "valid_targets_min": 693 |
| }, |
| { |
| "epoch": 5.144927536231884, |
| "grad_norm": 0.427889087391779, |
| "learning_rate": 7.978241938896679e-06, |
| "loss": 0.1541, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.13784319162368774, |
| "step": 3195, |
| "valid_targets_mean": 4693.8, |
| "valid_targets_min": 2255 |
| }, |
| { |
| "epoch": 5.152979066022544, |
| "grad_norm": 0.5199711838065452, |
| "learning_rate": 7.914159392470118e-06, |
| "loss": 0.1698, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16833321750164032, |
| "step": 3200, |
| "valid_targets_mean": 4362.7, |
| "valid_targets_min": 848 |
| }, |
| { |
| "epoch": 5.161030595813204, |
| "grad_norm": 0.47753654786071936, |
| "learning_rate": 7.850271704088396e-06, |
| "loss": 0.1586, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14919407665729523, |
| "step": 3205, |
| "valid_targets_mean": 4483.1, |
| "valid_targets_min": 2048 |
| }, |
| { |
| "epoch": 5.169082125603865, |
| "grad_norm": 0.47729884629127567, |
| "learning_rate": 7.786579903802342e-06, |
| "loss": 0.1818, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15295487642288208, |
| "step": 3210, |
| "valid_targets_mean": 4766.6, |
| "valid_targets_min": 1817 |
| }, |
| { |
| "epoch": 5.177133655394525, |
| "grad_norm": 0.5186129305793417, |
| "learning_rate": 7.723085018504512e-06, |
| "loss": 0.1688, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1621103286743164, |
| "step": 3215, |
| "valid_targets_mean": 4525.6, |
| "valid_targets_min": 529 |
| }, |
| { |
| "epoch": 5.185185185185185, |
| "grad_norm": 0.562831677149766, |
| "learning_rate": 7.659788071912612e-06, |
| "loss": 0.1709, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16404971480369568, |
| "step": 3220, |
| "valid_targets_mean": 3796.4, |
| "valid_targets_min": 1477 |
| }, |
| { |
| "epoch": 5.193236714975845, |
| "grad_norm": 0.48044538637214657, |
| "learning_rate": 7.59669008455304e-06, |
| "loss": 0.1606, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16649338603019714, |
| "step": 3225, |
| "valid_targets_mean": 5432.8, |
| "valid_targets_min": 1858 |
| }, |
| { |
| "epoch": 5.201288244766506, |
| "grad_norm": 0.5790721887585502, |
| "learning_rate": 7.533792073744395e-06, |
| "loss": 0.1751, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17744669318199158, |
| "step": 3230, |
| "valid_targets_mean": 4592.4, |
| "valid_targets_min": 935 |
| }, |
| { |
| "epoch": 5.209339774557166, |
| "grad_norm": 0.5717495383522813, |
| "learning_rate": 7.471095053581086e-06, |
| "loss": 0.1758, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1721886694431305, |
| "step": 3235, |
| "valid_targets_mean": 4073.8, |
| "valid_targets_min": 823 |
| }, |
| { |
| "epoch": 5.217391304347826, |
| "grad_norm": 0.5319904040215578, |
| "learning_rate": 7.4086000349169864e-06, |
| "loss": 0.1753, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15195900201797485, |
| "step": 3240, |
| "valid_targets_mean": 4558.5, |
| "valid_targets_min": 296 |
| }, |
| { |
| "epoch": 5.225442834138486, |
| "grad_norm": 0.6199276315504786, |
| "learning_rate": 7.346308025349138e-06, |
| "loss": 0.1709, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16166193783283234, |
| "step": 3245, |
| "valid_targets_mean": 3986.2, |
| "valid_targets_min": 848 |
| }, |
| { |
| "epoch": 5.233494363929147, |
| "grad_norm": 0.6244366963899998, |
| "learning_rate": 7.2842200292014805e-06, |
| "loss": 0.188, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17683975398540497, |
| "step": 3250, |
| "valid_targets_mean": 3601.2, |
| "valid_targets_min": 760 |
| }, |
| { |
| "epoch": 5.241545893719807, |
| "grad_norm": 0.5241028588187276, |
| "learning_rate": 7.2223370475086896e-06, |
| "loss": 0.173, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1595272421836853, |
| "step": 3255, |
| "valid_targets_mean": 4269.6, |
| "valid_targets_min": 1279 |
| }, |
| { |
| "epoch": 5.249597423510467, |
| "grad_norm": 0.4473386775088612, |
| "learning_rate": 7.160660078000028e-06, |
| "loss": 0.1621, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16722847521305084, |
| "step": 3260, |
| "valid_targets_mean": 5286.9, |
| "valid_targets_min": 2305 |
| }, |
| { |
| "epoch": 5.2576489533011275, |
| "grad_norm": 0.5009816722230198, |
| "learning_rate": 7.099190115083259e-06, |
| "loss": 0.1615, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17297816276550293, |
| "step": 3265, |
| "valid_targets_mean": 4930.7, |
| "valid_targets_min": 2434 |
| }, |
| { |
| "epoch": 5.265700483091788, |
| "grad_norm": 0.5600085277272723, |
| "learning_rate": 7.037928149828608e-06, |
| "loss": 0.1734, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18866902589797974, |
| "step": 3270, |
| "valid_targets_mean": 4635.0, |
| "valid_targets_min": 1444 |
| }, |
| { |
| "epoch": 5.273752012882448, |
| "grad_norm": 0.5153595033812705, |
| "learning_rate": 6.97687516995279e-06, |
| "loss": 0.1608, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15133386850357056, |
| "step": 3275, |
| "valid_targets_mean": 4087.8, |
| "valid_targets_min": 1111 |
| }, |
| { |
| "epoch": 5.281803542673108, |
| "grad_norm": 0.5588332326443939, |
| "learning_rate": 6.916032159803088e-06, |
| "loss": 0.1838, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.20162728428840637, |
| "step": 3280, |
| "valid_targets_mean": 4709.9, |
| "valid_targets_min": 2151 |
| }, |
| { |
| "epoch": 5.2898550724637685, |
| "grad_norm": 0.5640390114972573, |
| "learning_rate": 6.855400100341458e-06, |
| "loss": 0.1642, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17432144284248352, |
| "step": 3285, |
| "valid_targets_mean": 3788.3, |
| "valid_targets_min": 543 |
| }, |
| { |
| "epoch": 5.297906602254429, |
| "grad_norm": 0.5376565233222369, |
| "learning_rate": 6.794979969128755e-06, |
| "loss": 0.1761, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16141164302825928, |
| "step": 3290, |
| "valid_targets_mean": 4118.3, |
| "valid_targets_min": 1706 |
| }, |
| { |
| "epoch": 5.305958132045088, |
| "grad_norm": 0.5378942356008535, |
| "learning_rate": 6.7347727403089325e-06, |
| "loss": 0.173, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17127177119255066, |
| "step": 3295, |
| "valid_targets_mean": 4600.5, |
| "valid_targets_min": 1136 |
| }, |
| { |
| "epoch": 5.314009661835748, |
| "grad_norm": 0.48776680886655227, |
| "learning_rate": 6.674779384593373e-06, |
| "loss": 0.1591, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.13992200791835785, |
| "step": 3300, |
| "valid_targets_mean": 4386.2, |
| "valid_targets_min": 1725 |
| }, |
| { |
| "epoch": 5.322061191626409, |
| "grad_norm": 0.5329626208836868, |
| "learning_rate": 6.61500086924519e-06, |
| "loss": 0.1657, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17515888810157776, |
| "step": 3305, |
| "valid_targets_mean": 4181.7, |
| "valid_targets_min": 290 |
| }, |
| { |
| "epoch": 5.330112721417069, |
| "grad_norm": 0.46016033498034964, |
| "learning_rate": 6.555438158063683e-06, |
| "loss": 0.1707, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17031973600387573, |
| "step": 3310, |
| "valid_targets_mean": 5609.8, |
| "valid_targets_min": 1475 |
| }, |
| { |
| "epoch": 5.338164251207729, |
| "grad_norm": 0.7890593958793812, |
| "learning_rate": 6.4960922113687695e-06, |
| "loss": 0.1678, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17659761011600494, |
| "step": 3315, |
| "valid_targets_mean": 3941.4, |
| "valid_targets_min": 1450 |
| }, |
| { |
| "epoch": 5.3462157809983895, |
| "grad_norm": 0.5703421349872555, |
| "learning_rate": 6.4369639859855115e-06, |
| "loss": 0.1637, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17057812213897705, |
| "step": 3320, |
| "valid_targets_mean": 4658.4, |
| "valid_targets_min": 1863 |
| }, |
| { |
| "epoch": 5.35426731078905, |
| "grad_norm": 0.564126182226765, |
| "learning_rate": 6.378054435228671e-06, |
| "loss": 0.166, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18041761219501495, |
| "step": 3325, |
| "valid_targets_mean": 4159.0, |
| "valid_targets_min": 759 |
| }, |
| { |
| "epoch": 5.36231884057971, |
| "grad_norm": 0.4973048643598519, |
| "learning_rate": 6.319364508887371e-06, |
| "loss": 0.1719, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1592758297920227, |
| "step": 3330, |
| "valid_targets_mean": 4736.2, |
| "valid_targets_min": 1812 |
| }, |
| { |
| "epoch": 5.37037037037037, |
| "grad_norm": 0.569769342446689, |
| "learning_rate": 6.260895153209763e-06, |
| "loss": 0.1644, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18152937293052673, |
| "step": 3335, |
| "valid_targets_mean": 4268.9, |
| "valid_targets_min": 1431 |
| }, |
| { |
| "epoch": 5.3784219001610305, |
| "grad_norm": 0.5016879405573162, |
| "learning_rate": 6.202647310887764e-06, |
| "loss": 0.1832, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17833814024925232, |
| "step": 3340, |
| "valid_targets_mean": 4741.9, |
| "valid_targets_min": 1679 |
| }, |
| { |
| "epoch": 5.386473429951691, |
| "grad_norm": 0.5247407647892519, |
| "learning_rate": 6.14462192104188e-06, |
| "loss": 0.1691, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.20044955611228943, |
| "step": 3345, |
| "valid_targets_mean": 4656.0, |
| "valid_targets_min": 2099 |
| }, |
| { |
| "epoch": 5.394524959742351, |
| "grad_norm": 0.47014870620352595, |
| "learning_rate": 6.086819919206051e-06, |
| "loss": 0.168, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17010408639907837, |
| "step": 3350, |
| "valid_targets_mean": 5653.4, |
| "valid_targets_min": 2097 |
| }, |
| { |
| "epoch": 5.402576489533011, |
| "grad_norm": 0.6060057637724512, |
| "learning_rate": 6.029242237312554e-06, |
| "loss": 0.1742, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18121179938316345, |
| "step": 3355, |
| "valid_targets_mean": 5222.9, |
| "valid_targets_min": 532 |
| }, |
| { |
| "epoch": 5.4106280193236715, |
| "grad_norm": 0.5270241265183322, |
| "learning_rate": 5.971889803676996e-06, |
| "loss": 0.1648, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16754843294620514, |
| "step": 3360, |
| "valid_targets_mean": 4372.1, |
| "valid_targets_min": 1892 |
| }, |
| { |
| "epoch": 5.418679549114332, |
| "grad_norm": 0.5131324243265083, |
| "learning_rate": 5.914763542983355e-06, |
| "loss": 0.1986, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18260961771011353, |
| "step": 3365, |
| "valid_targets_mean": 5181.3, |
| "valid_targets_min": 1175 |
| }, |
| { |
| "epoch": 5.426731078904992, |
| "grad_norm": 0.5192149826300284, |
| "learning_rate": 5.857864376269051e-06, |
| "loss": 0.1837, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18823757767677307, |
| "step": 3370, |
| "valid_targets_mean": 4809.2, |
| "valid_targets_min": 1171 |
| }, |
| { |
| "epoch": 5.434782608695652, |
| "grad_norm": 0.5980250860155677, |
| "learning_rate": 5.801193220910108e-06, |
| "loss": 0.1539, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16703063249588013, |
| "step": 3375, |
| "valid_targets_mean": 4509.7, |
| "valid_targets_min": 1367 |
| }, |
| { |
| "epoch": 5.442834138486313, |
| "grad_norm": 0.551837937511895, |
| "learning_rate": 5.744750990606356e-06, |
| "loss": 0.1723, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15874727070331573, |
| "step": 3380, |
| "valid_targets_mean": 3712.6, |
| "valid_targets_min": 311 |
| }, |
| { |
| "epoch": 5.450885668276973, |
| "grad_norm": 0.49161398228706626, |
| "learning_rate": 5.688538595366706e-06, |
| "loss": 0.1569, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.155176043510437, |
| "step": 3385, |
| "valid_targets_mean": 4476.1, |
| "valid_targets_min": 1936 |
| }, |
| { |
| "epoch": 5.458937198067633, |
| "grad_norm": 0.5355381631745951, |
| "learning_rate": 5.632556941494482e-06, |
| "loss": 0.1687, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.153697669506073, |
| "step": 3390, |
| "valid_targets_mean": 3974.2, |
| "valid_targets_min": 1569 |
| }, |
| { |
| "epoch": 5.466988727858293, |
| "grad_norm": 0.5115948764108772, |
| "learning_rate": 5.5768069315727895e-06, |
| "loss": 0.1772, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1722053587436676, |
| "step": 3395, |
| "valid_targets_mean": 4293.4, |
| "valid_targets_min": 2260 |
| }, |
| { |
| "epoch": 5.475040257648954, |
| "grad_norm": 0.4799188086454644, |
| "learning_rate": 5.521289464449975e-06, |
| "loss": 0.1784, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17728543281555176, |
| "step": 3400, |
| "valid_targets_mean": 5211.7, |
| "valid_targets_min": 363 |
| }, |
| { |
| "epoch": 5.483091787439614, |
| "grad_norm": 0.5570316610757228, |
| "learning_rate": 5.46600543522515e-06, |
| "loss": 0.1694, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16196802258491516, |
| "step": 3405, |
| "valid_targets_mean": 4058.4, |
| "valid_targets_min": 653 |
| }, |
| { |
| "epoch": 5.491143317230274, |
| "grad_norm": 0.6736055907952796, |
| "learning_rate": 5.410955735233736e-06, |
| "loss": 0.1683, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.171076238155365, |
| "step": 3410, |
| "valid_targets_mean": 5974.8, |
| "valid_targets_min": 2681 |
| }, |
| { |
| "epoch": 5.499194847020934, |
| "grad_norm": 0.5508461582818147, |
| "learning_rate": 5.3561412520331025e-06, |
| "loss": 0.1673, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14637523889541626, |
| "step": 3415, |
| "valid_targets_mean": 4094.3, |
| "valid_targets_min": 904 |
| }, |
| { |
| "epoch": 5.507246376811594, |
| "grad_norm": 0.5142188355081284, |
| "learning_rate": 5.30156286938826e-06, |
| "loss": 0.1655, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1733294427394867, |
| "step": 3420, |
| "valid_targets_mean": 4461.4, |
| "valid_targets_min": 1105 |
| }, |
| { |
| "epoch": 5.515297906602254, |
| "grad_norm": 0.5905481814384393, |
| "learning_rate": 5.24722146725761e-06, |
| "loss": 0.1817, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17892040312290192, |
| "step": 3425, |
| "valid_targets_mean": 4002.8, |
| "valid_targets_min": 1672 |
| }, |
| { |
| "epoch": 5.523349436392914, |
| "grad_norm": 0.45334104473741593, |
| "learning_rate": 5.193117921778743e-06, |
| "loss": 0.1616, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.13965705037117004, |
| "step": 3430, |
| "valid_targets_mean": 4802.2, |
| "valid_targets_min": 1812 |
| }, |
| { |
| "epoch": 5.531400966183575, |
| "grad_norm": 0.742354374585886, |
| "learning_rate": 5.139253105254336e-06, |
| "loss": 0.1795, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18780140578746796, |
| "step": 3435, |
| "valid_targets_mean": 4082.1, |
| "valid_targets_min": 1116 |
| }, |
| { |
| "epoch": 5.539452495974235, |
| "grad_norm": 0.44385771676975855, |
| "learning_rate": 5.085627886138078e-06, |
| "loss": 0.159, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14621910452842712, |
| "step": 3440, |
| "valid_targets_mean": 5131.4, |
| "valid_targets_min": 1610 |
| }, |
| { |
| "epoch": 5.547504025764895, |
| "grad_norm": 0.47820099076305106, |
| "learning_rate": 5.032243129020671e-06, |
| "loss": 0.1734, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16836556792259216, |
| "step": 3445, |
| "valid_targets_mean": 5182.5, |
| "valid_targets_min": 1770 |
| }, |
| { |
| "epoch": 5.555555555555555, |
| "grad_norm": 0.5335135512220336, |
| "learning_rate": 4.9790996946158695e-06, |
| "loss": 0.1688, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18833035230636597, |
| "step": 3450, |
| "valid_targets_mean": 4468.0, |
| "valid_targets_min": 1464 |
| }, |
| { |
| "epoch": 5.563607085346216, |
| "grad_norm": 0.5452849565299809, |
| "learning_rate": 4.926198439746641e-06, |
| "loss": 0.1769, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16549217700958252, |
| "step": 3455, |
| "valid_targets_mean": 3943.1, |
| "valid_targets_min": 1663 |
| }, |
| { |
| "epoch": 5.571658615136876, |
| "grad_norm": 0.47569229716225025, |
| "learning_rate": 4.873540217331325e-06, |
| "loss": 0.1736, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14578670263290405, |
| "step": 3460, |
| "valid_targets_mean": 4942.0, |
| "valid_targets_min": 1587 |
| }, |
| { |
| "epoch": 5.579710144927536, |
| "grad_norm": 0.6257220241925262, |
| "learning_rate": 4.82112587636989e-06, |
| "loss": 0.1653, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14457204937934875, |
| "step": 3465, |
| "valid_targets_mean": 4796.1, |
| "valid_targets_min": 1025 |
| }, |
| { |
| "epoch": 5.587761674718196, |
| "grad_norm": 0.5126249751180715, |
| "learning_rate": 4.768956261930233e-06, |
| "loss": 0.1723, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.21914073824882507, |
| "step": 3470, |
| "valid_targets_mean": 5159.1, |
| "valid_targets_min": 1672 |
| }, |
| { |
| "epoch": 5.595813204508857, |
| "grad_norm": 0.5030438743653675, |
| "learning_rate": 4.717032215134576e-06, |
| "loss": 0.1787, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1816645860671997, |
| "step": 3475, |
| "valid_targets_mean": 5501.6, |
| "valid_targets_min": 1066 |
| }, |
| { |
| "epoch": 5.603864734299517, |
| "grad_norm": 0.7789904581155889, |
| "learning_rate": 4.66535457314589e-06, |
| "loss": 0.1658, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1629607379436493, |
| "step": 3480, |
| "valid_targets_mean": 5301.9, |
| "valid_targets_min": 1650 |
| }, |
| { |
| "epoch": 5.611916264090177, |
| "grad_norm": 0.5094527470833449, |
| "learning_rate": 4.613924169154406e-06, |
| "loss": 0.1747, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16425767540931702, |
| "step": 3485, |
| "valid_targets_mean": 4554.6, |
| "valid_targets_min": 1654 |
| }, |
| { |
| "epoch": 5.6199677938808374, |
| "grad_norm": 0.48660247544704416, |
| "learning_rate": 4.5627418323641705e-06, |
| "loss": 0.1644, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17449656128883362, |
| "step": 3490, |
| "valid_targets_mean": 5440.4, |
| "valid_targets_min": 3305 |
| }, |
| { |
| "epoch": 5.628019323671498, |
| "grad_norm": 0.6588365172160204, |
| "learning_rate": 4.51180838797969e-06, |
| "loss": 0.1768, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16700059175491333, |
| "step": 3495, |
| "valid_targets_mean": 3524.9, |
| "valid_targets_min": 431 |
| }, |
| { |
| "epoch": 5.636070853462158, |
| "grad_norm": 0.5649424861690088, |
| "learning_rate": 4.461124657192612e-06, |
| "loss": 0.1923, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16424767673015594, |
| "step": 3500, |
| "valid_targets_mean": 3976.2, |
| "valid_targets_min": 327 |
| }, |
| { |
| "epoch": 5.644122383252818, |
| "grad_norm": 0.5402856059826509, |
| "learning_rate": 4.410691457168488e-06, |
| "loss": 0.179, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17043063044548035, |
| "step": 3505, |
| "valid_targets_mean": 4236.4, |
| "valid_targets_min": 1605 |
| }, |
| { |
| "epoch": 5.6521739130434785, |
| "grad_norm": 0.6565234736534431, |
| "learning_rate": 4.3605096010336115e-06, |
| "loss": 0.1631, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.19410403072834015, |
| "step": 3510, |
| "valid_targets_mean": 3966.3, |
| "valid_targets_min": 374 |
| }, |
| { |
| "epoch": 5.660225442834139, |
| "grad_norm": 0.46809524453228724, |
| "learning_rate": 4.310579897861902e-06, |
| "loss": 0.167, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14890244603157043, |
| "step": 3515, |
| "valid_targets_mean": 5078.9, |
| "valid_targets_min": 1866 |
| }, |
| { |
| "epoch": 5.668276972624799, |
| "grad_norm": 0.5402583356363803, |
| "learning_rate": 4.26090315266185e-06, |
| "loss": 0.1718, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18138787150382996, |
| "step": 3520, |
| "valid_targets_mean": 4479.4, |
| "valid_targets_min": 1667 |
| }, |
| { |
| "epoch": 5.676328502415459, |
| "grad_norm": 0.5567198301706011, |
| "learning_rate": 4.2114801663635504e-06, |
| "loss": 0.1689, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.19387924671173096, |
| "step": 3525, |
| "valid_targets_mean": 4855.1, |
| "valid_targets_min": 1475 |
| }, |
| { |
| "epoch": 5.6843800322061195, |
| "grad_norm": 0.5076182712626346, |
| "learning_rate": 4.1623117358057865e-06, |
| "loss": 0.169, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16965937614440918, |
| "step": 3530, |
| "valid_targets_mean": 4802.6, |
| "valid_targets_min": 2133 |
| }, |
| { |
| "epoch": 5.692431561996779, |
| "grad_norm": 0.5638233787105313, |
| "learning_rate": 4.113398653723168e-06, |
| "loss": 0.1703, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1688123494386673, |
| "step": 3535, |
| "valid_targets_mean": 4551.8, |
| "valid_targets_min": 590 |
| }, |
| { |
| "epoch": 5.70048309178744, |
| "grad_norm": 0.6026682576927842, |
| "learning_rate": 4.0647417087333776e-06, |
| "loss": 0.1655, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17929375171661377, |
| "step": 3540, |
| "valid_targets_mean": 4203.6, |
| "valid_targets_min": 1303 |
| }, |
| { |
| "epoch": 5.708534621578099, |
| "grad_norm": 0.4840327343136473, |
| "learning_rate": 4.0163416853244385e-06, |
| "loss": 0.1767, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15817004442214966, |
| "step": 3545, |
| "valid_targets_mean": 4813.0, |
| "valid_targets_min": 321 |
| }, |
| { |
| "epoch": 5.71658615136876, |
| "grad_norm": 0.5122311264991213, |
| "learning_rate": 3.968199363842056e-06, |
| "loss": 0.1701, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15911847352981567, |
| "step": 3550, |
| "valid_targets_mean": 4163.8, |
| "valid_targets_min": 2141 |
| }, |
| { |
| "epoch": 5.72463768115942, |
| "grad_norm": 0.5526613981940242, |
| "learning_rate": 3.920315520477065e-06, |
| "loss": 0.1723, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16690890491008759, |
| "step": 3555, |
| "valid_targets_mean": 3781.4, |
| "valid_targets_min": 434 |
| }, |
| { |
| "epoch": 5.73268921095008, |
| "grad_norm": 0.5154673260140975, |
| "learning_rate": 3.872690927252891e-06, |
| "loss": 0.1775, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18027852475643158, |
| "step": 3560, |
| "valid_targets_mean": 4373.6, |
| "valid_targets_min": 1594 |
| }, |
| { |
| "epoch": 5.7407407407407405, |
| "grad_norm": 0.48703994856912225, |
| "learning_rate": 3.825326352013119e-06, |
| "loss": 0.169, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16559578478336334, |
| "step": 3565, |
| "valid_targets_mean": 4382.0, |
| "valid_targets_min": 1603 |
| }, |
| { |
| "epoch": 5.748792270531401, |
| "grad_norm": 0.5472851978165418, |
| "learning_rate": 3.7782225584091016e-06, |
| "loss": 0.1681, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15613017976284027, |
| "step": 3570, |
| "valid_targets_mean": 4052.4, |
| "valid_targets_min": 339 |
| }, |
| { |
| "epoch": 5.756843800322061, |
| "grad_norm": 0.5873806542864478, |
| "learning_rate": 3.731380305887644e-06, |
| "loss": 0.1716, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17352142930030823, |
| "step": 3575, |
| "valid_targets_mean": 4468.3, |
| "valid_targets_min": 860 |
| }, |
| { |
| "epoch": 5.764895330112721, |
| "grad_norm": 0.562715584188104, |
| "learning_rate": 3.684800349678781e-06, |
| "loss": 0.1685, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.19309145212173462, |
| "step": 3580, |
| "valid_targets_mean": 3819.3, |
| "valid_targets_min": 831 |
| }, |
| { |
| "epoch": 5.7729468599033815, |
| "grad_norm": 0.584825018902196, |
| "learning_rate": 3.638483440783576e-06, |
| "loss": 0.1728, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.22266249358654022, |
| "step": 3585, |
| "valid_targets_mean": 4084.6, |
| "valid_targets_min": 1924 |
| }, |
| { |
| "epoch": 5.780998389694042, |
| "grad_norm": 0.5288099238647191, |
| "learning_rate": 3.5924303259620307e-06, |
| "loss": 0.1605, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15193787217140198, |
| "step": 3590, |
| "valid_targets_mean": 4209.9, |
| "valid_targets_min": 963 |
| }, |
| { |
| "epoch": 5.789049919484702, |
| "grad_norm": 0.5275609216950717, |
| "learning_rate": 3.546641747721036e-06, |
| "loss": 0.1892, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16384585201740265, |
| "step": 3595, |
| "valid_targets_mean": 4627.3, |
| "valid_targets_min": 1626 |
| }, |
| { |
| "epoch": 5.797101449275362, |
| "grad_norm": 0.725525221737914, |
| "learning_rate": 3.501118444302394e-06, |
| "loss": 0.1684, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18506191670894623, |
| "step": 3600, |
| "valid_targets_mean": 3873.7, |
| "valid_targets_min": 756 |
| }, |
| { |
| "epoch": 5.805152979066023, |
| "grad_norm": 0.5082224637456563, |
| "learning_rate": 3.4558611496709384e-06, |
| "loss": 0.1633, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.165011465549469, |
| "step": 3605, |
| "valid_targets_mean": 4355.2, |
| "valid_targets_min": 776 |
| }, |
| { |
| "epoch": 5.813204508856683, |
| "grad_norm": 0.8025807922419831, |
| "learning_rate": 3.4108705935026685e-06, |
| "loss": 0.1633, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15931957960128784, |
| "step": 3610, |
| "valid_targets_mean": 3695.9, |
| "valid_targets_min": 1119 |
| }, |
| { |
| "epoch": 5.821256038647343, |
| "grad_norm": 0.5168844656413334, |
| "learning_rate": 3.3661475011730206e-06, |
| "loss": 0.1639, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15300890803337097, |
| "step": 3615, |
| "valid_targets_mean": 4747.3, |
| "valid_targets_min": 1185 |
| }, |
| { |
| "epoch": 5.829307568438003, |
| "grad_norm": 0.5249631418738182, |
| "learning_rate": 3.321692593745147e-06, |
| "loss": 0.1617, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15493711829185486, |
| "step": 3620, |
| "valid_targets_mean": 3726.0, |
| "valid_targets_min": 1610 |
| }, |
| { |
| "epoch": 5.837359098228664, |
| "grad_norm": 0.5331107342319671, |
| "learning_rate": 3.2775065879582948e-06, |
| "loss": 0.1697, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17267771065235138, |
| "step": 3625, |
| "valid_targets_mean": 5503.0, |
| "valid_targets_min": 1978 |
| }, |
| { |
| "epoch": 5.845410628019324, |
| "grad_norm": 0.5222892591386691, |
| "learning_rate": 3.233590196216263e-06, |
| "loss": 0.1659, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1816999316215515, |
| "step": 3630, |
| "valid_targets_mean": 4842.2, |
| "valid_targets_min": 545 |
| }, |
| { |
| "epoch": 5.853462157809984, |
| "grad_norm": 0.5132154525081916, |
| "learning_rate": 3.1899441265759036e-06, |
| "loss": 0.1808, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.19336271286010742, |
| "step": 3635, |
| "valid_targets_mean": 5282.2, |
| "valid_targets_min": 1948 |
| }, |
| { |
| "epoch": 5.861513687600644, |
| "grad_norm": 0.5087976961623909, |
| "learning_rate": 3.1465690827356955e-06, |
| "loss": 0.173, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17752087116241455, |
| "step": 3640, |
| "valid_targets_mean": 4912.0, |
| "valid_targets_min": 1166 |
| }, |
| { |
| "epoch": 5.869565217391305, |
| "grad_norm": 0.5723530802904422, |
| "learning_rate": 3.103465764024438e-06, |
| "loss": 0.1659, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1567440927028656, |
| "step": 3645, |
| "valid_targets_mean": 3882.6, |
| "valid_targets_min": 627 |
| }, |
| { |
| "epoch": 5.877616747181965, |
| "grad_norm": 0.6212444706400745, |
| "learning_rate": 3.0606348653899288e-06, |
| "loss": 0.1777, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16555482149124146, |
| "step": 3650, |
| "valid_targets_mean": 4280.1, |
| "valid_targets_min": 1429 |
| }, |
| { |
| "epoch": 5.885668276972625, |
| "grad_norm": 0.6037643784134114, |
| "learning_rate": 3.0180770773877866e-06, |
| "loss": 0.1767, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1539427787065506, |
| "step": 3655, |
| "valid_targets_mean": 3446.1, |
| "valid_targets_min": 864 |
| }, |
| { |
| "epoch": 5.8937198067632846, |
| "grad_norm": 0.5417204859207484, |
| "learning_rate": 2.9757930861703223e-06, |
| "loss": 0.1546, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1333686113357544, |
| "step": 3660, |
| "valid_targets_mean": 4272.0, |
| "valid_targets_min": 993 |
| }, |
| { |
| "epoch": 5.901771336553946, |
| "grad_norm": 0.545060770024728, |
| "learning_rate": 2.9337835734754504e-06, |
| "loss": 0.1685, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16815856099128723, |
| "step": 3665, |
| "valid_targets_mean": 4364.4, |
| "valid_targets_min": 1968 |
| }, |
| { |
| "epoch": 5.909822866344605, |
| "grad_norm": 0.4807913485701676, |
| "learning_rate": 2.892049216615724e-06, |
| "loss": 0.1705, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16856727004051208, |
| "step": 3670, |
| "valid_targets_mean": 4645.9, |
| "valid_targets_min": 1236 |
| }, |
| { |
| "epoch": 5.917874396135265, |
| "grad_norm": 0.5872896027676431, |
| "learning_rate": 2.850590688467405e-06, |
| "loss": 0.1761, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17276933789253235, |
| "step": 3675, |
| "valid_targets_mean": 4079.1, |
| "valid_targets_min": 758 |
| }, |
| { |
| "epoch": 5.925925925925926, |
| "grad_norm": 0.5081772741434722, |
| "learning_rate": 2.8094086574595934e-06, |
| "loss": 0.1846, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17815062403678894, |
| "step": 3680, |
| "valid_targets_mean": 4622.2, |
| "valid_targets_min": 506 |
| }, |
| { |
| "epoch": 5.933977455716586, |
| "grad_norm": 0.5314566948595292, |
| "learning_rate": 2.768503787563497e-06, |
| "loss": 0.1659, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15440833568572998, |
| "step": 3685, |
| "valid_targets_mean": 4177.4, |
| "valid_targets_min": 1764 |
| }, |
| { |
| "epoch": 5.942028985507246, |
| "grad_norm": 0.5944657537451915, |
| "learning_rate": 2.7278767382816828e-06, |
| "loss": 0.172, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15870711207389832, |
| "step": 3690, |
| "valid_targets_mean": 4034.2, |
| "valid_targets_min": 346 |
| }, |
| { |
| "epoch": 5.950080515297906, |
| "grad_norm": 0.5150609346752764, |
| "learning_rate": 2.687528164637474e-06, |
| "loss": 0.1682, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16893523931503296, |
| "step": 3695, |
| "valid_targets_mean": 4341.7, |
| "valid_targets_min": 544 |
| }, |
| { |
| "epoch": 5.958132045088567, |
| "grad_norm": 0.622800014898735, |
| "learning_rate": 2.647458717164357e-06, |
| "loss": 0.1686, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1420368254184723, |
| "step": 3700, |
| "valid_targets_mean": 4181.0, |
| "valid_targets_min": 930 |
| }, |
| { |
| "epoch": 5.966183574879227, |
| "grad_norm": 0.5118850984097806, |
| "learning_rate": 2.607669041895535e-06, |
| "loss": 0.1689, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17651256918907166, |
| "step": 3705, |
| "valid_targets_mean": 5766.2, |
| "valid_targets_min": 2526 |
| }, |
| { |
| "epoch": 5.974235104669887, |
| "grad_norm": 0.5922490816235029, |
| "learning_rate": 2.568159780353476e-06, |
| "loss": 0.173, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15372015535831451, |
| "step": 3710, |
| "valid_targets_mean": 3693.7, |
| "valid_targets_min": 614 |
| }, |
| { |
| "epoch": 5.982286634460547, |
| "grad_norm": 0.5223810749820793, |
| "learning_rate": 2.5289315695395834e-06, |
| "loss": 0.1709, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17238521575927734, |
| "step": 3715, |
| "valid_targets_mean": 3895.1, |
| "valid_targets_min": 703 |
| }, |
| { |
| "epoch": 5.990338164251208, |
| "grad_norm": 0.6140059891446761, |
| "learning_rate": 2.489985041923928e-06, |
| "loss": 0.1763, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18047456443309784, |
| "step": 3720, |
| "valid_targets_mean": 4203.8, |
| "valid_targets_min": 989 |
| }, |
| { |
| "epoch": 5.998389694041868, |
| "grad_norm": 0.5110659722384324, |
| "learning_rate": 2.4513208254350486e-06, |
| "loss": 0.1749, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1803944855928421, |
| "step": 3725, |
| "valid_targets_mean": 4611.9, |
| "valid_targets_min": 1053 |
| }, |
| { |
| "epoch": 6.006441223832528, |
| "grad_norm": 0.46649632563361154, |
| "learning_rate": 2.412939543449828e-06, |
| "loss": 0.1608, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1679632067680359, |
| "step": 3730, |
| "valid_targets_mean": 4868.8, |
| "valid_targets_min": 1373 |
| }, |
| { |
| "epoch": 6.0144927536231885, |
| "grad_norm": 0.5752464912619374, |
| "learning_rate": 2.3748418147834394e-06, |
| "loss": 0.1728, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14780664443969727, |
| "step": 3735, |
| "valid_targets_mean": 3625.4, |
| "valid_targets_min": 705 |
| }, |
| { |
| "epoch": 6.022544283413849, |
| "grad_norm": 0.4873295942554316, |
| "learning_rate": 2.337028253679381e-06, |
| "loss": 0.1575, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14143216609954834, |
| "step": 3740, |
| "valid_targets_mean": 4609.2, |
| "valid_targets_min": 1716 |
| }, |
| { |
| "epoch": 6.030595813204509, |
| "grad_norm": 0.4572827913243831, |
| "learning_rate": 2.299499469799542e-06, |
| "loss": 0.1715, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1580767184495926, |
| "step": 3745, |
| "valid_targets_mean": 5816.4, |
| "valid_targets_min": 1119 |
| }, |
| { |
| "epoch": 6.038647342995169, |
| "grad_norm": 0.5186439466567816, |
| "learning_rate": 2.262256068214421e-06, |
| "loss": 0.1651, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17476163804531097, |
| "step": 3750, |
| "valid_targets_mean": 4437.0, |
| "valid_targets_min": 757 |
| }, |
| { |
| "epoch": 6.0466988727858295, |
| "grad_norm": 0.5118711095108422, |
| "learning_rate": 2.2252986493933237e-06, |
| "loss": 0.1684, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16541600227355957, |
| "step": 3755, |
| "valid_targets_mean": 4525.7, |
| "valid_targets_min": 2162 |
| }, |
| { |
| "epoch": 6.05475040257649, |
| "grad_norm": 0.5109434582294012, |
| "learning_rate": 2.18862780919471e-06, |
| "loss": 0.1589, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15595577657222748, |
| "step": 3760, |
| "valid_targets_mean": 4511.2, |
| "valid_targets_min": 1010 |
| }, |
| { |
| "epoch": 6.06280193236715, |
| "grad_norm": 0.5324485507591655, |
| "learning_rate": 2.152244138856585e-06, |
| "loss": 0.1559, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1731036901473999, |
| "step": 3765, |
| "valid_targets_mean": 4594.2, |
| "valid_targets_min": 1788 |
| }, |
| { |
| "epoch": 6.07085346215781, |
| "grad_norm": 0.4936303320259845, |
| "learning_rate": 2.1161482249869513e-06, |
| "loss": 0.1499, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14089539647102356, |
| "step": 3770, |
| "valid_targets_mean": 5116.8, |
| "valid_targets_min": 422 |
| }, |
| { |
| "epoch": 6.078904991948471, |
| "grad_norm": 0.5698965758566077, |
| "learning_rate": 2.080340649554369e-06, |
| "loss": 0.1662, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16755038499832153, |
| "step": 3775, |
| "valid_targets_mean": 4225.4, |
| "valid_targets_min": 536 |
| }, |
| { |
| "epoch": 6.086956521739131, |
| "grad_norm": 0.5229210197667631, |
| "learning_rate": 2.044821989878558e-06, |
| "loss": 0.1722, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16623234748840332, |
| "step": 3780, |
| "valid_targets_mean": 4262.9, |
| "valid_targets_min": 1577 |
| }, |
| { |
| "epoch": 6.095008051529791, |
| "grad_norm": 0.5459701049906057, |
| "learning_rate": 2.0095928186210956e-06, |
| "loss": 0.1625, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.147607684135437, |
| "step": 3785, |
| "valid_targets_mean": 4724.4, |
| "valid_targets_min": 1787 |
| }, |
| { |
| "epoch": 6.1030595813204505, |
| "grad_norm": 0.5581543823448861, |
| "learning_rate": 1.974653703776188e-06, |
| "loss": 0.1705, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18220457434654236, |
| "step": 3790, |
| "valid_targets_mean": 5031.3, |
| "valid_targets_min": 392 |
| }, |
| { |
| "epoch": 6.111111111111111, |
| "grad_norm": 0.5197842393741545, |
| "learning_rate": 1.9400052086615153e-06, |
| "loss": 0.175, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1598493456840515, |
| "step": 3795, |
| "valid_targets_mean": 4375.8, |
| "valid_targets_min": 1759 |
| }, |
| { |
| "epoch": 6.119162640901771, |
| "grad_norm": 0.5494186611639191, |
| "learning_rate": 1.9056478919091236e-06, |
| "loss": 0.1735, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.19067052006721497, |
| "step": 3800, |
| "valid_targets_mean": 4341.0, |
| "valid_targets_min": 692 |
| }, |
| { |
| "epoch": 6.127214170692431, |
| "grad_norm": 0.5103976820611801, |
| "learning_rate": 1.8715823074564587e-06, |
| "loss": 0.16, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15958425402641296, |
| "step": 3805, |
| "valid_targets_mean": 4729.6, |
| "valid_targets_min": 362 |
| }, |
| { |
| "epoch": 6.1352657004830915, |
| "grad_norm": 0.5752435508668234, |
| "learning_rate": 1.837809004537401e-06, |
| "loss": 0.1579, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1595839112997055, |
| "step": 3810, |
| "valid_targets_mean": 4986.8, |
| "valid_targets_min": 897 |
| }, |
| { |
| "epoch": 6.143317230273752, |
| "grad_norm": 0.6232969103900382, |
| "learning_rate": 1.8043285276734334e-06, |
| "loss": 0.1663, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17083576321601868, |
| "step": 3815, |
| "valid_targets_mean": 3214.8, |
| "valid_targets_min": 547 |
| }, |
| { |
| "epoch": 6.151368760064412, |
| "grad_norm": 0.5085611865605083, |
| "learning_rate": 1.7711414166648365e-06, |
| "loss": 0.1522, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15489043295383453, |
| "step": 3820, |
| "valid_targets_mean": 4428.2, |
| "valid_targets_min": 1416 |
| }, |
| { |
| "epoch": 6.159420289855072, |
| "grad_norm": 0.5686690339243041, |
| "learning_rate": 1.7382482065820138e-06, |
| "loss": 0.1578, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16790664196014404, |
| "step": 3825, |
| "valid_targets_mean": 4888.5, |
| "valid_targets_min": 1755 |
| }, |
| { |
| "epoch": 6.1674718196457325, |
| "grad_norm": 0.6929429650574811, |
| "learning_rate": 1.7056494277568503e-06, |
| "loss": 0.167, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1905716359615326, |
| "step": 3830, |
| "valid_targets_mean": 3701.2, |
| "valid_targets_min": 1170 |
| }, |
| { |
| "epoch": 6.175523349436393, |
| "grad_norm": 0.6367228356359814, |
| "learning_rate": 1.6733456057741592e-06, |
| "loss": 0.1636, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1782214492559433, |
| "step": 3835, |
| "valid_targets_mean": 3788.4, |
| "valid_targets_min": 1742 |
| }, |
| { |
| "epoch": 6.183574879227053, |
| "grad_norm": 0.532748190271915, |
| "learning_rate": 1.641337261463216e-06, |
| "loss": 0.1691, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18782779574394226, |
| "step": 3840, |
| "valid_targets_mean": 4424.2, |
| "valid_targets_min": 745 |
| }, |
| { |
| "epoch": 6.191626409017713, |
| "grad_norm": 0.5944352055775861, |
| "learning_rate": 1.6096249108893602e-06, |
| "loss": 0.1591, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14986079931259155, |
| "step": 3845, |
| "valid_targets_mean": 4633.4, |
| "valid_targets_min": 817 |
| }, |
| { |
| "epoch": 6.199677938808374, |
| "grad_norm": 0.4718113061336701, |
| "learning_rate": 1.5782090653456616e-06, |
| "loss": 0.1596, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15445095300674438, |
| "step": 3850, |
| "valid_targets_mean": 5366.3, |
| "valid_targets_min": 2465 |
| }, |
| { |
| "epoch": 6.207729468599034, |
| "grad_norm": 0.5299032276018538, |
| "learning_rate": 1.547090231344699e-06, |
| "loss": 0.1761, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1652597188949585, |
| "step": 3855, |
| "valid_targets_mean": 4490.8, |
| "valid_targets_min": 2050 |
| }, |
| { |
| "epoch": 6.215780998389694, |
| "grad_norm": 0.4937926792080132, |
| "learning_rate": 1.5162689106103746e-06, |
| "loss": 0.1571, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16262544691562653, |
| "step": 3860, |
| "valid_targets_mean": 5297.2, |
| "valid_targets_min": 758 |
| }, |
| { |
| "epoch": 6.223832528180354, |
| "grad_norm": 0.5983118290721653, |
| "learning_rate": 1.4857456000698366e-06, |
| "loss": 0.176, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.21267688274383545, |
| "step": 3865, |
| "valid_targets_mean": 5259.9, |
| "valid_targets_min": 1772 |
| }, |
| { |
| "epoch": 6.231884057971015, |
| "grad_norm": 0.5186630493468379, |
| "learning_rate": 1.4555207918454662e-06, |
| "loss": 0.1758, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.20158061385154724, |
| "step": 3870, |
| "valid_targets_mean": 5251.4, |
| "valid_targets_min": 570 |
| }, |
| { |
| "epoch": 6.239935587761675, |
| "grad_norm": 0.5732567692410732, |
| "learning_rate": 1.4255949732469309e-06, |
| "loss": 0.1649, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15088540315628052, |
| "step": 3875, |
| "valid_targets_mean": 3437.3, |
| "valid_targets_min": 1053 |
| }, |
| { |
| "epoch": 6.247987117552335, |
| "grad_norm": 0.5122360577374575, |
| "learning_rate": 1.3959686267633488e-06, |
| "loss": 0.1817, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1651184856891632, |
| "step": 3880, |
| "valid_targets_mean": 5088.6, |
| "valid_targets_min": 1995 |
| }, |
| { |
| "epoch": 6.256038647342995, |
| "grad_norm": 0.48110861215986517, |
| "learning_rate": 1.3666422300554905e-06, |
| "loss": 0.1705, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16647136211395264, |
| "step": 3885, |
| "valid_targets_mean": 5231.4, |
| "valid_targets_min": 2355 |
| }, |
| { |
| "epoch": 6.264090177133656, |
| "grad_norm": 0.582851491108072, |
| "learning_rate": 1.3376162559480822e-06, |
| "loss": 0.1769, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18534335494041443, |
| "step": 3890, |
| "valid_targets_mean": 4512.3, |
| "valid_targets_min": 2039 |
| }, |
| { |
| "epoch": 6.272141706924316, |
| "grad_norm": 0.5404662794082068, |
| "learning_rate": 1.308891172422193e-06, |
| "loss": 0.1737, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1919654756784439, |
| "step": 3895, |
| "valid_targets_mean": 4829.6, |
| "valid_targets_min": 972 |
| }, |
| { |
| "epoch": 6.280193236714976, |
| "grad_norm": 0.628437639331324, |
| "learning_rate": 1.2804674426076757e-06, |
| "loss": 0.174, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.21055009961128235, |
| "step": 3900, |
| "valid_targets_mean": 4256.2, |
| "valid_targets_min": 846 |
| }, |
| { |
| "epoch": 6.2882447665056365, |
| "grad_norm": 0.4797286979992782, |
| "learning_rate": 1.2523455247757088e-06, |
| "loss": 0.1575, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14173908531665802, |
| "step": 3905, |
| "valid_targets_mean": 5012.4, |
| "valid_targets_min": 1956 |
| }, |
| { |
| "epoch": 6.296296296296296, |
| "grad_norm": 0.5914383870555415, |
| "learning_rate": 1.224525872331408e-06, |
| "loss": 0.1672, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17256557941436768, |
| "step": 3910, |
| "valid_targets_mean": 3722.4, |
| "valid_targets_min": 1185 |
| }, |
| { |
| "epoch": 6.304347826086957, |
| "grad_norm": 0.5475160234396864, |
| "learning_rate": 1.1970089338065071e-06, |
| "loss": 0.1651, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16874639689922333, |
| "step": 3915, |
| "valid_targets_mean": 4964.1, |
| "valid_targets_min": 1411 |
| }, |
| { |
| "epoch": 6.312399355877616, |
| "grad_norm": 0.6352630163683538, |
| "learning_rate": 1.1697951528521422e-06, |
| "loss": 0.1722, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16274841129779816, |
| "step": 3920, |
| "valid_targets_mean": 3514.2, |
| "valid_targets_min": 1903 |
| }, |
| { |
| "epoch": 6.320450885668277, |
| "grad_norm": 0.5450852465931986, |
| "learning_rate": 1.1428849682316766e-06, |
| "loss": 0.1545, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16449615359306335, |
| "step": 3925, |
| "valid_targets_mean": 4061.4, |
| "valid_targets_min": 1262 |
| }, |
| { |
| "epoch": 6.328502415458937, |
| "grad_norm": 0.48987328370522754, |
| "learning_rate": 1.116278813813647e-06, |
| "loss": 0.1556, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.13572901487350464, |
| "step": 3930, |
| "valid_targets_mean": 4505.6, |
| "valid_targets_min": 1616 |
| }, |
| { |
| "epoch": 6.336553945249597, |
| "grad_norm": 0.503141267860805, |
| "learning_rate": 1.08997711856476e-06, |
| "loss": 0.1612, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16356249153614044, |
| "step": 3935, |
| "valid_targets_mean": 4598.4, |
| "valid_targets_min": 1028 |
| }, |
| { |
| "epoch": 6.344605475040257, |
| "grad_norm": 0.7893130983095663, |
| "learning_rate": 1.0639803065429755e-06, |
| "loss": 0.1831, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.20338299870491028, |
| "step": 3940, |
| "valid_targets_mean": 5540.6, |
| "valid_targets_min": 2279 |
| }, |
| { |
| "epoch": 6.352657004830918, |
| "grad_norm": 0.5464519825128046, |
| "learning_rate": 1.0382887968906718e-06, |
| "loss": 0.1699, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1746448576450348, |
| "step": 3945, |
| "valid_targets_mean": 3995.6, |
| "valid_targets_min": 1677 |
| }, |
| { |
| "epoch": 6.360708534621578, |
| "grad_norm": 0.5620117079550653, |
| "learning_rate": 1.012903003827883e-06, |
| "loss": 0.1704, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1740240752696991, |
| "step": 3950, |
| "valid_targets_mean": 3910.2, |
| "valid_targets_min": 1147 |
| }, |
| { |
| "epoch": 6.368760064412238, |
| "grad_norm": 0.5014202584177402, |
| "learning_rate": 9.87823336645628e-07, |
| "loss": 0.166, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15709742903709412, |
| "step": 3955, |
| "valid_targets_mean": 4344.8, |
| "valid_targets_min": 2201 |
| }, |
| { |
| "epoch": 6.3768115942028984, |
| "grad_norm": 0.5362938011516779, |
| "learning_rate": 9.630501996993091e-07, |
| "loss": 0.163, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17129208147525787, |
| "step": 3960, |
| "valid_targets_mean": 4717.5, |
| "valid_targets_min": 1989 |
| }, |
| { |
| "epoch": 6.384863123993559, |
| "grad_norm": 0.44355010700619574, |
| "learning_rate": 9.385839924021844e-07, |
| "loss": 0.1773, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14925384521484375, |
| "step": 3965, |
| "valid_targets_mean": 5392.1, |
| "valid_targets_min": 2034 |
| }, |
| { |
| "epoch": 6.392914653784219, |
| "grad_norm": 0.5637410567366077, |
| "learning_rate": 9.144251092189416e-07, |
| "loss": 0.1721, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2033105343580246, |
| "step": 3970, |
| "valid_targets_mean": 4397.6, |
| "valid_targets_min": 529 |
| }, |
| { |
| "epoch": 6.400966183574879, |
| "grad_norm": 0.5246003448080508, |
| "learning_rate": 8.905739396593316e-07, |
| "loss": 0.1636, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16925036907196045, |
| "step": 3975, |
| "valid_targets_mean": 4739.1, |
| "valid_targets_min": 720 |
| }, |
| { |
| "epoch": 6.4090177133655395, |
| "grad_norm": 0.5406121384840578, |
| "learning_rate": 8.670308682718853e-07, |
| "loss": 0.1587, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1594831645488739, |
| "step": 3980, |
| "valid_targets_mean": 4337.4, |
| "valid_targets_min": 800 |
| }, |
| { |
| "epoch": 6.4170692431562, |
| "grad_norm": 0.4785613416301052, |
| "learning_rate": 8.437962746377204e-07, |
| "loss": 0.1668, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1622602641582489, |
| "step": 3985, |
| "valid_targets_mean": 5365.6, |
| "valid_targets_min": 1316 |
| }, |
| { |
| "epoch": 6.42512077294686, |
| "grad_norm": 0.4972685992182721, |
| "learning_rate": 8.208705333644129e-07, |
| "loss": 0.1641, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1673496663570404, |
| "step": 3990, |
| "valid_targets_mean": 4327.2, |
| "valid_targets_min": 873 |
| }, |
| { |
| "epoch": 6.43317230273752, |
| "grad_norm": 0.51768549782515, |
| "learning_rate": 7.982540140799688e-07, |
| "loss": 0.1571, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.161638081073761, |
| "step": 3995, |
| "valid_targets_mean": 4245.7, |
| "valid_targets_min": 1725 |
| }, |
| { |
| "epoch": 6.4412238325281805, |
| "grad_norm": 0.6255107806087558, |
| "learning_rate": 7.759470814268489e-07, |
| "loss": 0.1531, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16319170594215393, |
| "step": 4000, |
| "valid_targets_mean": 3573.4, |
| "valid_targets_min": 216 |
| }, |
| { |
| "epoch": 6.449275362318841, |
| "grad_norm": 0.5117136147623905, |
| "learning_rate": 7.539500950561063e-07, |
| "loss": 0.1649, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18081682920455933, |
| "step": 4005, |
| "valid_targets_mean": 5030.6, |
| "valid_targets_min": 941 |
| }, |
| { |
| "epoch": 6.457326892109501, |
| "grad_norm": 0.5410913172933577, |
| "learning_rate": 7.322634096215831e-07, |
| "loss": 0.1568, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15669681131839752, |
| "step": 4010, |
| "valid_targets_mean": 4348.8, |
| "valid_targets_min": 713 |
| }, |
| { |
| "epoch": 6.465378421900161, |
| "grad_norm": 0.4986868222815654, |
| "learning_rate": 7.108873747741807e-07, |
| "loss": 0.1648, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14274120330810547, |
| "step": 4015, |
| "valid_targets_mean": 4543.1, |
| "valid_targets_min": 1717 |
| }, |
| { |
| "epoch": 6.473429951690822, |
| "grad_norm": 0.469433549650835, |
| "learning_rate": 6.898223351562405e-07, |
| "loss": 0.1686, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15934091806411743, |
| "step": 4020, |
| "valid_targets_mean": 5432.7, |
| "valid_targets_min": 2526 |
| }, |
| { |
| "epoch": 6.481481481481482, |
| "grad_norm": 0.622115989263229, |
| "learning_rate": 6.690686303959748e-07, |
| "loss": 0.1746, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18453718721866608, |
| "step": 4025, |
| "valid_targets_mean": 3467.2, |
| "valid_targets_min": 545 |
| }, |
| { |
| "epoch": 6.489533011272142, |
| "grad_norm": 0.5270621108254152, |
| "learning_rate": 6.48626595101991e-07, |
| "loss": 0.1752, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.19507281482219696, |
| "step": 4030, |
| "valid_targets_mean": 5011.7, |
| "valid_targets_min": 2115 |
| }, |
| { |
| "epoch": 6.4975845410628015, |
| "grad_norm": 0.5614424641002262, |
| "learning_rate": 6.284965588579028e-07, |
| "loss": 0.1683, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1735997200012207, |
| "step": 4035, |
| "valid_targets_mean": 4858.7, |
| "valid_targets_min": 1516 |
| }, |
| { |
| "epoch": 6.505636070853463, |
| "grad_norm": 0.6277678468034912, |
| "learning_rate": 6.08678846217019e-07, |
| "loss": 0.1553, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.173121377825737, |
| "step": 4040, |
| "valid_targets_mean": 4697.3, |
| "valid_targets_min": 434 |
| }, |
| { |
| "epoch": 6.513687600644122, |
| "grad_norm": 0.557886874518275, |
| "learning_rate": 5.891737766970984e-07, |
| "loss": 0.1615, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16518916189670563, |
| "step": 4045, |
| "valid_targets_mean": 4401.9, |
| "valid_targets_min": 596 |
| }, |
| { |
| "epoch": 6.521739130434782, |
| "grad_norm": 0.5026467498773549, |
| "learning_rate": 5.699816647752077e-07, |
| "loss": 0.1601, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16781866550445557, |
| "step": 4050, |
| "valid_targets_mean": 4928.8, |
| "valid_targets_min": 2215 |
| }, |
| { |
| "epoch": 6.5297906602254425, |
| "grad_norm": 0.5451182471548547, |
| "learning_rate": 5.511028198826496e-07, |
| "loss": 0.1679, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17092815041542053, |
| "step": 4055, |
| "valid_targets_mean": 4106.2, |
| "valid_targets_min": 451 |
| }, |
| { |
| "epoch": 6.537842190016103, |
| "grad_norm": 0.5743885198199623, |
| "learning_rate": 5.32537546399976e-07, |
| "loss": 0.1672, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16788442432880402, |
| "step": 4060, |
| "valid_targets_mean": 4289.1, |
| "valid_targets_min": 1684 |
| }, |
| { |
| "epoch": 6.545893719806763, |
| "grad_norm": 0.6037224090967725, |
| "learning_rate": 5.142861436520763e-07, |
| "loss": 0.1685, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.20297744870185852, |
| "step": 4065, |
| "valid_targets_mean": 3997.9, |
| "valid_targets_min": 383 |
| }, |
| { |
| "epoch": 6.553945249597423, |
| "grad_norm": 0.8388825418667704, |
| "learning_rate": 4.963489059033477e-07, |
| "loss": 0.1642, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16553989052772522, |
| "step": 4070, |
| "valid_targets_mean": 4784.5, |
| "valid_targets_min": 2033 |
| }, |
| { |
| "epoch": 6.561996779388084, |
| "grad_norm": 0.5970930999537574, |
| "learning_rate": 4.787261223529616e-07, |
| "loss": 0.165, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17344771325588226, |
| "step": 4075, |
| "valid_targets_mean": 3786.6, |
| "valid_targets_min": 898 |
| }, |
| { |
| "epoch": 6.570048309178744, |
| "grad_norm": 0.471204909767901, |
| "learning_rate": 4.6141807713019793e-07, |
| "loss": 0.155, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.13417160511016846, |
| "step": 4080, |
| "valid_targets_mean": 5032.4, |
| "valid_targets_min": 1912 |
| }, |
| { |
| "epoch": 6.578099838969404, |
| "grad_norm": 0.4884625900862524, |
| "learning_rate": 4.444250492898539e-07, |
| "loss": 0.1746, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16039326786994934, |
| "step": 4085, |
| "valid_targets_mean": 5670.8, |
| "valid_targets_min": 1963 |
| }, |
| { |
| "epoch": 6.586151368760064, |
| "grad_norm": 1.3562926760409872, |
| "learning_rate": 4.277473128077625e-07, |
| "loss": 0.1798, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15605992078781128, |
| "step": 4090, |
| "valid_targets_mean": 5004.9, |
| "valid_targets_min": 390 |
| }, |
| { |
| "epoch": 6.594202898550725, |
| "grad_norm": 0.5293266001333903, |
| "learning_rate": 4.113851365763544e-07, |
| "loss": 0.1626, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1735745668411255, |
| "step": 4095, |
| "valid_targets_mean": 5240.4, |
| "valid_targets_min": 1701 |
| }, |
| { |
| "epoch": 6.602254428341385, |
| "grad_norm": 0.5578624317503144, |
| "learning_rate": 3.953387844003431e-07, |
| "loss": 0.1607, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1669292151927948, |
| "step": 4100, |
| "valid_targets_mean": 4350.2, |
| "valid_targets_min": 2309 |
| }, |
| { |
| "epoch": 6.610305958132045, |
| "grad_norm": 0.604399390427962, |
| "learning_rate": 3.7960851499245554e-07, |
| "loss": 0.1566, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14910921454429626, |
| "step": 4105, |
| "valid_targets_mean": 3900.4, |
| "valid_targets_min": 823 |
| }, |
| { |
| "epoch": 6.618357487922705, |
| "grad_norm": 0.5270613962718504, |
| "learning_rate": 3.6419458196926825e-07, |
| "loss": 0.1713, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1642162799835205, |
| "step": 4110, |
| "valid_targets_mean": 4613.5, |
| "valid_targets_min": 1191 |
| }, |
| { |
| "epoch": 6.626409017713366, |
| "grad_norm": 0.4768249623670376, |
| "learning_rate": 3.4909723384712436e-07, |
| "loss": 0.1647, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15536585450172424, |
| "step": 4115, |
| "valid_targets_mean": 4920.4, |
| "valid_targets_min": 1743 |
| }, |
| { |
| "epoch": 6.634460547504026, |
| "grad_norm": 0.7880877824521434, |
| "learning_rate": 3.3431671403811207e-07, |
| "loss": 0.1651, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14975430071353912, |
| "step": 4120, |
| "valid_targets_mean": 4408.2, |
| "valid_targets_min": 431 |
| }, |
| { |
| "epoch": 6.642512077294686, |
| "grad_norm": 0.5055031311515263, |
| "learning_rate": 3.198532608461524e-07, |
| "loss": 0.1627, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18191225826740265, |
| "step": 4125, |
| "valid_targets_mean": 5325.4, |
| "valid_targets_min": 881 |
| }, |
| { |
| "epoch": 6.650563607085346, |
| "grad_norm": 0.7377711817281254, |
| "learning_rate": 3.0570710746314903e-07, |
| "loss": 0.1785, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1757345199584961, |
| "step": 4130, |
| "valid_targets_mean": 4204.0, |
| "valid_targets_min": 851 |
| }, |
| { |
| "epoch": 6.658615136876007, |
| "grad_norm": 0.49184719888721345, |
| "learning_rate": 2.9187848196524205e-07, |
| "loss": 0.1601, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1542222797870636, |
| "step": 4135, |
| "valid_targets_mean": 4731.2, |
| "valid_targets_min": 429 |
| }, |
| { |
| "epoch": 6.666666666666667, |
| "grad_norm": 0.6105305368391408, |
| "learning_rate": 2.7836760730910464e-07, |
| "loss": 0.1666, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17159178853034973, |
| "step": 4140, |
| "valid_targets_mean": 3496.8, |
| "valid_targets_min": 397 |
| }, |
| { |
| "epoch": 6.674718196457327, |
| "grad_norm": 0.5519746733795567, |
| "learning_rate": 2.6517470132838117e-07, |
| "loss": 0.1536, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1730884313583374, |
| "step": 4145, |
| "valid_targets_mean": 4672.2, |
| "valid_targets_min": 1995 |
| }, |
| { |
| "epoch": 6.6827697262479875, |
| "grad_norm": 0.5635266522753974, |
| "learning_rate": 2.522999767301482e-07, |
| "loss": 0.1652, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15275679528713226, |
| "step": 4150, |
| "valid_targets_mean": 3927.0, |
| "valid_targets_min": 300 |
| }, |
| { |
| "epoch": 6.690821256038648, |
| "grad_norm": 0.5061168238375812, |
| "learning_rate": 2.3974364109149886e-07, |
| "loss": 0.1656, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14958354830741882, |
| "step": 4155, |
| "valid_targets_mean": 3901.1, |
| "valid_targets_min": 1810 |
| }, |
| { |
| "epoch": 6.698872785829307, |
| "grad_norm": 0.5040398527635441, |
| "learning_rate": 2.2750589685619495e-07, |
| "loss": 0.1654, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17061063647270203, |
| "step": 4160, |
| "valid_targets_mean": 4585.4, |
| "valid_targets_min": 1591 |
| }, |
| { |
| "epoch": 6.706924315619968, |
| "grad_norm": 0.5035025471661269, |
| "learning_rate": 2.1558694133139823e-07, |
| "loss": 0.1589, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16706478595733643, |
| "step": 4165, |
| "valid_targets_mean": 4401.9, |
| "valid_targets_min": 310 |
| }, |
| { |
| "epoch": 6.714975845410628, |
| "grad_norm": 0.5623618030459923, |
| "learning_rate": 2.039869666844929e-07, |
| "loss": 0.1697, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1561906784772873, |
| "step": 4170, |
| "valid_targets_mean": 3450.5, |
| "valid_targets_min": 1034 |
| }, |
| { |
| "epoch": 6.723027375201288, |
| "grad_norm": 0.5216795359225037, |
| "learning_rate": 1.9270615993998375e-07, |
| "loss": 0.1618, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1636110544204712, |
| "step": 4175, |
| "valid_targets_mean": 4135.8, |
| "valid_targets_min": 1656 |
| }, |
| { |
| "epoch": 6.731078904991948, |
| "grad_norm": 0.5368469010480501, |
| "learning_rate": 1.817447029764874e-07, |
| "loss": 0.1627, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16674436628818512, |
| "step": 4180, |
| "valid_targets_mean": 4527.6, |
| "valid_targets_min": 1381 |
| }, |
| { |
| "epoch": 6.739130434782608, |
| "grad_norm": 0.6438973279011997, |
| "learning_rate": 1.7110277252379238e-07, |
| "loss": 0.1554, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15082503855228424, |
| "step": 4185, |
| "valid_targets_mean": 4736.3, |
| "valid_targets_min": 1379 |
| }, |
| { |
| "epoch": 6.747181964573269, |
| "grad_norm": 0.4998287056476511, |
| "learning_rate": 1.607805401600149e-07, |
| "loss": 0.167, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17229287326335907, |
| "step": 4190, |
| "valid_targets_mean": 4969.6, |
| "valid_targets_min": 1283 |
| }, |
| { |
| "epoch": 6.755233494363929, |
| "grad_norm": 0.599169633423643, |
| "learning_rate": 1.5077817230883419e-07, |
| "loss": 0.1608, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15904340147972107, |
| "step": 4195, |
| "valid_targets_mean": 4552.9, |
| "valid_targets_min": 1866 |
| }, |
| { |
| "epoch": 6.763285024154589, |
| "grad_norm": 0.570759522637566, |
| "learning_rate": 1.4109583023679706e-07, |
| "loss": 0.1662, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15024811029434204, |
| "step": 4200, |
| "valid_targets_mean": 5746.9, |
| "valid_targets_min": 1892 |
| }, |
| { |
| "epoch": 6.7713365539452495, |
| "grad_norm": 0.5403647002807387, |
| "learning_rate": 1.3173367005073545e-07, |
| "loss": 0.1619, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17785856127738953, |
| "step": 4205, |
| "valid_targets_mean": 4047.6, |
| "valid_targets_min": 2002 |
| }, |
| { |
| "epoch": 6.77938808373591, |
| "grad_norm": 0.5226238218670288, |
| "learning_rate": 1.2269184269523282e-07, |
| "loss": 0.1589, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16204693913459778, |
| "step": 4210, |
| "valid_targets_mean": 4730.7, |
| "valid_targets_min": 1508 |
| }, |
| { |
| "epoch": 6.78743961352657, |
| "grad_norm": 0.5555947999177602, |
| "learning_rate": 1.1397049395020842e-07, |
| "loss": 0.154, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16874821484088898, |
| "step": 4215, |
| "valid_targets_mean": 4100.5, |
| "valid_targets_min": 1171 |
| }, |
| { |
| "epoch": 6.79549114331723, |
| "grad_norm": 0.5473832146836152, |
| "learning_rate": 1.0556976442854805e-07, |
| "loss": 0.1628, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18583595752716064, |
| "step": 4220, |
| "valid_targets_mean": 4135.4, |
| "valid_targets_min": 344 |
| }, |
| { |
| "epoch": 6.8035426731078905, |
| "grad_norm": 0.5690884856327217, |
| "learning_rate": 9.748978957385025e-08, |
| "loss": 0.1629, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1753610521554947, |
| "step": 4225, |
| "valid_targets_mean": 4328.1, |
| "valid_targets_min": 669 |
| }, |
| { |
| "epoch": 6.811594202898551, |
| "grad_norm": 0.5625787536362429, |
| "learning_rate": 8.9730699658237e-08, |
| "loss": 0.1606, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15724310278892517, |
| "step": 4230, |
| "valid_targets_mean": 4711.9, |
| "valid_targets_min": 2299 |
| }, |
| { |
| "epoch": 6.819645732689211, |
| "grad_norm": 0.5162132722455169, |
| "learning_rate": 8.229261978025316e-08, |
| "loss": 0.1611, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17424245178699493, |
| "step": 4235, |
| "valid_targets_mean": 4760.0, |
| "valid_targets_min": 2276 |
| }, |
| { |
| "epoch": 6.827697262479871, |
| "grad_norm": 0.6156039773080834, |
| "learning_rate": 7.517566986285474e-08, |
| "loss": 0.182, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1574200689792633, |
| "step": 4240, |
| "valid_targets_mean": 3681.5, |
| "valid_targets_min": 751 |
| }, |
| { |
| "epoch": 6.835748792270532, |
| "grad_norm": 0.5832771610140742, |
| "learning_rate": 6.837996465146823e-08, |
| "loss": 0.1677, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17290878295898438, |
| "step": 4245, |
| "valid_targets_mean": 3748.6, |
| "valid_targets_min": 284 |
| }, |
| { |
| "epoch": 6.843800322061192, |
| "grad_norm": 0.5576720036336581, |
| "learning_rate": 6.190561371214321e-08, |
| "loss": 0.1672, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16148659586906433, |
| "step": 4250, |
| "valid_targets_mean": 4166.0, |
| "valid_targets_min": 930 |
| }, |
| { |
| "epoch": 6.851851851851852, |
| "grad_norm": 0.5878319666889452, |
| "learning_rate": 5.575272142978927e-08, |
| "loss": 0.1799, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.172722727060318, |
| "step": 4255, |
| "valid_targets_mean": 4018.2, |
| "valid_targets_min": 754 |
| }, |
| { |
| "epoch": 6.859903381642512, |
| "grad_norm": 0.479443149906381, |
| "learning_rate": 4.992138700649074e-08, |
| "loss": 0.1607, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.13948974013328552, |
| "step": 4260, |
| "valid_targets_mean": 4858.1, |
| "valid_targets_min": 1813 |
| }, |
| { |
| "epoch": 6.867954911433173, |
| "grad_norm": 0.5541385500661399, |
| "learning_rate": 4.4411704459903506e-08, |
| "loss": 0.167, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1660829335451126, |
| "step": 4265, |
| "valid_targets_mean": 4232.4, |
| "valid_targets_min": 1054 |
| }, |
| { |
| "epoch": 6.876006441223833, |
| "grad_norm": 0.6179225703483298, |
| "learning_rate": 3.92237626217451e-08, |
| "loss": 0.1713, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16906727850437164, |
| "step": 4270, |
| "valid_targets_mean": 4460.8, |
| "valid_targets_min": 1530 |
| }, |
| { |
| "epoch": 6.884057971014493, |
| "grad_norm": 0.5783966854225258, |
| "learning_rate": 3.435764513635809e-08, |
| "loss": 0.1671, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17848993837833405, |
| "step": 4275, |
| "valid_targets_mean": 4309.5, |
| "valid_targets_min": 1717 |
| }, |
| { |
| "epoch": 6.892109500805153, |
| "grad_norm": 0.5351867682144865, |
| "learning_rate": 2.9813430459364465e-08, |
| "loss": 0.1707, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17882059514522552, |
| "step": 4280, |
| "valid_targets_mean": 4416.9, |
| "valid_targets_min": 1611 |
| }, |
| { |
| "epoch": 6.900161030595813, |
| "grad_norm": 0.573670983161385, |
| "learning_rate": 2.5591191856397802e-08, |
| "loss": 0.1714, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15430384874343872, |
| "step": 4285, |
| "valid_targets_mean": 4570.9, |
| "valid_targets_min": 1407 |
| }, |
| { |
| "epoch": 6.908212560386474, |
| "grad_norm": 0.5344897585917823, |
| "learning_rate": 2.1690997401928593e-08, |
| "loss": 0.1538, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16887977719306946, |
| "step": 4290, |
| "valid_targets_mean": 4439.5, |
| "valid_targets_min": 2172 |
| }, |
| { |
| "epoch": 6.916264090177133, |
| "grad_norm": 0.551697601245166, |
| "learning_rate": 1.811290997815851e-08, |
| "loss": 0.1762, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17137417197227478, |
| "step": 4295, |
| "valid_targets_mean": 4672.2, |
| "valid_targets_min": 590 |
| }, |
| { |
| "epoch": 6.9243156199677935, |
| "grad_norm": 0.5535638309128108, |
| "learning_rate": 1.485698727400564e-08, |
| "loss": 0.1673, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14466409385204315, |
| "step": 4300, |
| "valid_targets_mean": 3469.3, |
| "valid_targets_min": 1197 |
| }, |
| { |
| "epoch": 6.932367149758454, |
| "grad_norm": 0.5119337022576111, |
| "learning_rate": 1.1923281784185226e-08, |
| "loss": 0.1673, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16587556898593903, |
| "step": 4305, |
| "valid_targets_mean": 4396.5, |
| "valid_targets_min": 1299 |
| }, |
| { |
| "epoch": 6.940418679549114, |
| "grad_norm": 0.5923102041383612, |
| "learning_rate": 9.311840808357009e-09, |
| "loss": 0.1712, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1823520064353943, |
| "step": 4310, |
| "valid_targets_mean": 4216.1, |
| "valid_targets_min": 1303 |
| }, |
| { |
| "epoch": 6.948470209339774, |
| "grad_norm": 0.5103445914494756, |
| "learning_rate": 7.022706450354744e-09, |
| "loss": 0.1677, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15162253379821777, |
| "step": 4315, |
| "valid_targets_mean": 5503.6, |
| "valid_targets_min": 2231 |
| }, |
| { |
| "epoch": 6.956521739130435, |
| "grad_norm": 0.533406608295802, |
| "learning_rate": 5.055915617522278e-09, |
| "loss": 0.158, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14400282502174377, |
| "step": 4320, |
| "valid_targets_mean": 4314.7, |
| "valid_targets_min": 1448 |
| }, |
| { |
| "epoch": 6.964573268921095, |
| "grad_norm": 0.6879701190779768, |
| "learning_rate": 3.411500020109593e-09, |
| "loss": 0.161, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1823330670595169, |
| "step": 4325, |
| "valid_targets_mean": 3070.6, |
| "valid_targets_min": 467 |
| }, |
| { |
| "epoch": 6.972624798711755, |
| "grad_norm": 0.6418600229930465, |
| "learning_rate": 2.08948617075988e-09, |
| "loss": 0.1642, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15779449045658112, |
| "step": 4330, |
| "valid_targets_mean": 3922.4, |
| "valid_targets_min": 1291 |
| }, |
| { |
| "epoch": 6.980676328502415, |
| "grad_norm": 0.5848882869027459, |
| "learning_rate": 1.0898953840898786e-09, |
| "loss": 0.1616, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18286889791488647, |
| "step": 4335, |
| "valid_targets_mean": 4633.8, |
| "valid_targets_min": 695 |
| }, |
| { |
| "epoch": 6.988727858293076, |
| "grad_norm": 0.45093430680878505, |
| "learning_rate": 4.127437763390418e-10, |
| "loss": 0.1679, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15890920162200928, |
| "step": 4340, |
| "valid_targets_mean": 5343.4, |
| "valid_targets_min": 2478 |
| }, |
| { |
| "epoch": 6.996779388083736, |
| "grad_norm": 0.5378585489037748, |
| "learning_rate": 5.804226511196831e-11, |
| "loss": 0.1718, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15117883682250977, |
| "step": 4345, |
| "valid_targets_mean": 3975.8, |
| "valid_targets_min": 2081 |
| }, |
| { |
| "epoch": 7.0, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17696434259414673, |
| "step": 4347, |
| "total_flos": 1518375161495552.0, |
| "train_loss": 0.21155054198480733, |
| "train_runtime": 25607.106, |
| "train_samples_per_second": 2.714, |
| "train_steps_per_second": 0.17, |
| "valid_targets_mean": 4512.6, |
| "valid_targets_min": 535 |
| } |
| ], |
| "logging_steps": 5, |
| "max_steps": 4347, |
| "num_input_tokens_seen": 0, |
| "num_train_epochs": 7, |
| "save_steps": 1500, |
| "stateful_callbacks": { |
| "TrainerControl": { |
| "args": { |
| "should_epoch_stop": false, |
| "should_evaluate": false, |
| "should_log": false, |
| "should_save": true, |
| "should_training_stop": true |
| }, |
| "attributes": {} |
| } |
| }, |
| "total_flos": 1518375161495552.0, |
| "train_batch_size": 1, |
| "trial_name": null, |
| "trial_params": null |
| } |
|
|