| { |
| "best_global_step": null, |
| "best_metric": null, |
| "best_model_checkpoint": null, |
| "epoch": 5.0, |
| "eval_steps": 500, |
| "global_step": 3125, |
| "is_hyper_param_search": false, |
| "is_local_process_zero": true, |
| "is_world_process_zero": true, |
| "log_history": [ |
| { |
| "epoch": 0.008, |
| "grad_norm": 8.019209505645138, |
| "learning_rate": 5.111821086261981e-07, |
| "loss": 0.9704, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.9074519872665405, |
| "step": 5, |
| "valid_targets_mean": 4634.1, |
| "valid_targets_min": 769 |
| }, |
| { |
| "epoch": 0.016, |
| "grad_norm": 8.056913572069162, |
| "learning_rate": 1.1501597444089457e-06, |
| "loss": 0.9831, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.9801443815231323, |
| "step": 10, |
| "valid_targets_mean": 3432.8, |
| "valid_targets_min": 888 |
| }, |
| { |
| "epoch": 0.024, |
| "grad_norm": 5.890567315411599, |
| "learning_rate": 1.7891373801916933e-06, |
| "loss": 0.9216, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.9462229609489441, |
| "step": 15, |
| "valid_targets_mean": 3846.5, |
| "valid_targets_min": 622 |
| }, |
| { |
| "epoch": 0.032, |
| "grad_norm": 4.815413753270494, |
| "learning_rate": 2.428115015974441e-06, |
| "loss": 0.9003, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.9328570365905762, |
| "step": 20, |
| "valid_targets_mean": 2826.7, |
| "valid_targets_min": 592 |
| }, |
| { |
| "epoch": 0.04, |
| "grad_norm": 3.2132576974472262, |
| "learning_rate": 3.0670926517571885e-06, |
| "loss": 0.9021, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.9593732357025146, |
| "step": 25, |
| "valid_targets_mean": 5006.8, |
| "valid_targets_min": 602 |
| }, |
| { |
| "epoch": 0.048, |
| "grad_norm": 2.1277286968257494, |
| "learning_rate": 3.7060702875399364e-06, |
| "loss": 0.8146, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.8108715415000916, |
| "step": 30, |
| "valid_targets_mean": 4988.4, |
| "valid_targets_min": 764 |
| }, |
| { |
| "epoch": 0.056, |
| "grad_norm": 1.8316025070705764, |
| "learning_rate": 4.345047923322684e-06, |
| "loss": 0.8371, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.8360515832901001, |
| "step": 35, |
| "valid_targets_mean": 2703.9, |
| "valid_targets_min": 958 |
| }, |
| { |
| "epoch": 0.064, |
| "grad_norm": 0.974656430471622, |
| "learning_rate": 4.984025559105431e-06, |
| "loss": 0.8143, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.738986611366272, |
| "step": 40, |
| "valid_targets_mean": 5619.8, |
| "valid_targets_min": 496 |
| }, |
| { |
| "epoch": 0.072, |
| "grad_norm": 1.2003528549510873, |
| "learning_rate": 5.623003194888179e-06, |
| "loss": 0.8001, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.834333598613739, |
| "step": 45, |
| "valid_targets_mean": 2614.9, |
| "valid_targets_min": 534 |
| }, |
| { |
| "epoch": 0.08, |
| "grad_norm": 0.9375989258322925, |
| "learning_rate": 6.261980830670928e-06, |
| "loss": 0.7226, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.7906558513641357, |
| "step": 50, |
| "valid_targets_mean": 3902.1, |
| "valid_targets_min": 678 |
| }, |
| { |
| "epoch": 0.088, |
| "grad_norm": 0.947503985003781, |
| "learning_rate": 6.900958466453675e-06, |
| "loss": 0.738, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.7608993053436279, |
| "step": 55, |
| "valid_targets_mean": 2622.6, |
| "valid_targets_min": 640 |
| }, |
| { |
| "epoch": 0.096, |
| "grad_norm": 1.062618699465369, |
| "learning_rate": 7.5399361022364225e-06, |
| "loss": 0.7835, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.8355079293251038, |
| "step": 60, |
| "valid_targets_mean": 2038.3, |
| "valid_targets_min": 616 |
| }, |
| { |
| "epoch": 0.104, |
| "grad_norm": 0.6519054791996576, |
| "learning_rate": 8.17891373801917e-06, |
| "loss": 0.7377, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.6525523662567139, |
| "step": 65, |
| "valid_targets_mean": 4931.8, |
| "valid_targets_min": 879 |
| }, |
| { |
| "epoch": 0.112, |
| "grad_norm": 0.8181807803276753, |
| "learning_rate": 8.817891373801917e-06, |
| "loss": 0.7468, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.7478166818618774, |
| "step": 70, |
| "valid_targets_mean": 2875.1, |
| "valid_targets_min": 684 |
| }, |
| { |
| "epoch": 0.12, |
| "grad_norm": 0.8077200310163509, |
| "learning_rate": 9.456869009584665e-06, |
| "loss": 0.7, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.7476080656051636, |
| "step": 75, |
| "valid_targets_mean": 2929.1, |
| "valid_targets_min": 918 |
| }, |
| { |
| "epoch": 0.128, |
| "grad_norm": 0.6645101628172224, |
| "learning_rate": 1.0095846645367413e-05, |
| "loss": 0.6873, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.7070491313934326, |
| "step": 80, |
| "valid_targets_mean": 3938.2, |
| "valid_targets_min": 1116 |
| }, |
| { |
| "epoch": 0.136, |
| "grad_norm": 0.5668806150237382, |
| "learning_rate": 1.073482428115016e-05, |
| "loss": 0.6795, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.6539013385772705, |
| "step": 85, |
| "valid_targets_mean": 4791.0, |
| "valid_targets_min": 575 |
| }, |
| { |
| "epoch": 0.144, |
| "grad_norm": 0.631829978989927, |
| "learning_rate": 1.1373801916932907e-05, |
| "loss": 0.6727, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.6462942957878113, |
| "step": 90, |
| "valid_targets_mean": 4125.3, |
| "valid_targets_min": 746 |
| }, |
| { |
| "epoch": 0.152, |
| "grad_norm": 0.7522145077585198, |
| "learning_rate": 1.2012779552715656e-05, |
| "loss": 0.6913, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.6524339914321899, |
| "step": 95, |
| "valid_targets_mean": 2768.8, |
| "valid_targets_min": 730 |
| }, |
| { |
| "epoch": 0.16, |
| "grad_norm": 0.6436788258939267, |
| "learning_rate": 1.2651757188498404e-05, |
| "loss": 0.6746, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.6656085848808289, |
| "step": 100, |
| "valid_targets_mean": 4070.2, |
| "valid_targets_min": 693 |
| }, |
| { |
| "epoch": 0.168, |
| "grad_norm": 0.6829360551307666, |
| "learning_rate": 1.329073482428115e-05, |
| "loss": 0.6581, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.696590006351471, |
| "step": 105, |
| "valid_targets_mean": 3549.9, |
| "valid_targets_min": 985 |
| }, |
| { |
| "epoch": 0.176, |
| "grad_norm": 0.6518448907533483, |
| "learning_rate": 1.39297124600639e-05, |
| "loss": 0.6693, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.6982806921005249, |
| "step": 110, |
| "valid_targets_mean": 3914.5, |
| "valid_targets_min": 923 |
| }, |
| { |
| "epoch": 0.184, |
| "grad_norm": 0.7108542582881471, |
| "learning_rate": 1.4568690095846648e-05, |
| "loss": 0.6437, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.6319302916526794, |
| "step": 115, |
| "valid_targets_mean": 3878.2, |
| "valid_targets_min": 667 |
| }, |
| { |
| "epoch": 0.192, |
| "grad_norm": 0.6111508324238974, |
| "learning_rate": 1.5207667731629394e-05, |
| "loss": 0.6237, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.6298456788063049, |
| "step": 120, |
| "valid_targets_mean": 4183.7, |
| "valid_targets_min": 831 |
| }, |
| { |
| "epoch": 0.2, |
| "grad_norm": 0.636766820540127, |
| "learning_rate": 1.584664536741214e-05, |
| "loss": 0.6248, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.6381227970123291, |
| "step": 125, |
| "valid_targets_mean": 4150.9, |
| "valid_targets_min": 279 |
| }, |
| { |
| "epoch": 0.208, |
| "grad_norm": 0.7297687830940379, |
| "learning_rate": 1.648562300319489e-05, |
| "loss": 0.6313, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.6899981498718262, |
| "step": 130, |
| "valid_targets_mean": 3481.6, |
| "valid_targets_min": 879 |
| }, |
| { |
| "epoch": 0.216, |
| "grad_norm": 0.6994014106747448, |
| "learning_rate": 1.712460063897764e-05, |
| "loss": 0.6099, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.641595184803009, |
| "step": 135, |
| "valid_targets_mean": 4528.6, |
| "valid_targets_min": 788 |
| }, |
| { |
| "epoch": 0.224, |
| "grad_norm": 0.682372825217958, |
| "learning_rate": 1.7763578274760385e-05, |
| "loss": 0.6255, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.6313050985336304, |
| "step": 140, |
| "valid_targets_mean": 4437.3, |
| "valid_targets_min": 572 |
| }, |
| { |
| "epoch": 0.232, |
| "grad_norm": 0.6870311865242572, |
| "learning_rate": 1.840255591054313e-05, |
| "loss": 0.6237, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.5983741283416748, |
| "step": 145, |
| "valid_targets_mean": 3244.9, |
| "valid_targets_min": 745 |
| }, |
| { |
| "epoch": 0.24, |
| "grad_norm": 0.7883183108248433, |
| "learning_rate": 1.904153354632588e-05, |
| "loss": 0.6184, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.6510107517242432, |
| "step": 150, |
| "valid_targets_mean": 3022.1, |
| "valid_targets_min": 687 |
| }, |
| { |
| "epoch": 0.248, |
| "grad_norm": 0.6559928431572688, |
| "learning_rate": 1.9680511182108627e-05, |
| "loss": 0.6168, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.6277835369110107, |
| "step": 155, |
| "valid_targets_mean": 4691.1, |
| "valid_targets_min": 774 |
| }, |
| { |
| "epoch": 0.256, |
| "grad_norm": 0.7040494425503686, |
| "learning_rate": 2.0319488817891376e-05, |
| "loss": 0.6178, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.5613512992858887, |
| "step": 160, |
| "valid_targets_mean": 3659.9, |
| "valid_targets_min": 691 |
| }, |
| { |
| "epoch": 0.264, |
| "grad_norm": 0.7293885471955911, |
| "learning_rate": 2.0958466453674126e-05, |
| "loss": 0.578, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.546758234500885, |
| "step": 165, |
| "valid_targets_mean": 3741.1, |
| "valid_targets_min": 651 |
| }, |
| { |
| "epoch": 0.272, |
| "grad_norm": 0.772438514428517, |
| "learning_rate": 2.1597444089456872e-05, |
| "loss": 0.5705, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.5695148706436157, |
| "step": 170, |
| "valid_targets_mean": 3372.0, |
| "valid_targets_min": 744 |
| }, |
| { |
| "epoch": 0.28, |
| "grad_norm": 0.8184517511660472, |
| "learning_rate": 2.2236421725239618e-05, |
| "loss": 0.6274, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.6200259923934937, |
| "step": 175, |
| "valid_targets_mean": 2952.8, |
| "valid_targets_min": 919 |
| }, |
| { |
| "epoch": 0.288, |
| "grad_norm": 0.6401835135693486, |
| "learning_rate": 2.2875399361022364e-05, |
| "loss": 0.5871, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.6663122773170471, |
| "step": 180, |
| "valid_targets_mean": 4482.8, |
| "valid_targets_min": 785 |
| }, |
| { |
| "epoch": 0.296, |
| "grad_norm": 0.562579817398789, |
| "learning_rate": 2.3514376996805114e-05, |
| "loss": 0.594, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.5693539977073669, |
| "step": 185, |
| "valid_targets_mean": 5274.5, |
| "valid_targets_min": 669 |
| }, |
| { |
| "epoch": 0.304, |
| "grad_norm": 3.023582033179472, |
| "learning_rate": 2.415335463258786e-05, |
| "loss": 0.5726, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.6133388876914978, |
| "step": 190, |
| "valid_targets_mean": 3461.5, |
| "valid_targets_min": 534 |
| }, |
| { |
| "epoch": 0.312, |
| "grad_norm": 0.63776000505745, |
| "learning_rate": 2.4792332268370606e-05, |
| "loss": 0.6095, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.5332133173942566, |
| "step": 195, |
| "valid_targets_mean": 4770.1, |
| "valid_targets_min": 613 |
| }, |
| { |
| "epoch": 0.32, |
| "grad_norm": 0.6537457497646995, |
| "learning_rate": 2.543130990415336e-05, |
| "loss": 0.5961, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.6032932996749878, |
| "step": 200, |
| "valid_targets_mean": 4235.5, |
| "valid_targets_min": 418 |
| }, |
| { |
| "epoch": 0.328, |
| "grad_norm": 0.679784159844079, |
| "learning_rate": 2.6070287539936105e-05, |
| "loss": 0.5781, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.5432563424110413, |
| "step": 205, |
| "valid_targets_mean": 3482.2, |
| "valid_targets_min": 474 |
| }, |
| { |
| "epoch": 0.336, |
| "grad_norm": 0.6536420335215318, |
| "learning_rate": 2.670926517571885e-05, |
| "loss": 0.5527, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.5386021137237549, |
| "step": 210, |
| "valid_targets_mean": 4072.3, |
| "valid_targets_min": 288 |
| }, |
| { |
| "epoch": 0.344, |
| "grad_norm": 0.7579600175695036, |
| "learning_rate": 2.73482428115016e-05, |
| "loss": 0.5917, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.5911605358123779, |
| "step": 215, |
| "valid_targets_mean": 2998.2, |
| "valid_targets_min": 506 |
| }, |
| { |
| "epoch": 0.352, |
| "grad_norm": 0.8790312000878335, |
| "learning_rate": 2.7987220447284347e-05, |
| "loss": 0.6193, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.5623832941055298, |
| "step": 220, |
| "valid_targets_mean": 2856.6, |
| "valid_targets_min": 660 |
| }, |
| { |
| "epoch": 0.36, |
| "grad_norm": 0.8411714839123007, |
| "learning_rate": 2.8626198083067093e-05, |
| "loss": 0.5871, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.6712679862976074, |
| "step": 225, |
| "valid_targets_mean": 3072.1, |
| "valid_targets_min": 810 |
| }, |
| { |
| "epoch": 0.368, |
| "grad_norm": 0.6480362190445711, |
| "learning_rate": 2.9265175718849843e-05, |
| "loss": 0.5827, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.5256530046463013, |
| "step": 230, |
| "valid_targets_mean": 3665.3, |
| "valid_targets_min": 536 |
| }, |
| { |
| "epoch": 0.376, |
| "grad_norm": 0.6347344055975906, |
| "learning_rate": 2.9904153354632592e-05, |
| "loss": 0.5871, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.6053222417831421, |
| "step": 235, |
| "valid_targets_mean": 4444.1, |
| "valid_targets_min": 850 |
| }, |
| { |
| "epoch": 0.384, |
| "grad_norm": 0.7522140681943507, |
| "learning_rate": 3.054313099041534e-05, |
| "loss": 0.5885, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.6026010513305664, |
| "step": 240, |
| "valid_targets_mean": 3201.2, |
| "valid_targets_min": 447 |
| }, |
| { |
| "epoch": 0.392, |
| "grad_norm": 0.59444256273076, |
| "learning_rate": 3.1182108626198084e-05, |
| "loss": 0.5656, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.5105293989181519, |
| "step": 245, |
| "valid_targets_mean": 4720.0, |
| "valid_targets_min": 511 |
| }, |
| { |
| "epoch": 0.4, |
| "grad_norm": 0.7082748798819095, |
| "learning_rate": 3.1821086261980834e-05, |
| "loss": 0.5715, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.5332015752792358, |
| "step": 250, |
| "valid_targets_mean": 3776.2, |
| "valid_targets_min": 552 |
| }, |
| { |
| "epoch": 0.408, |
| "grad_norm": 0.5935423684362258, |
| "learning_rate": 3.246006389776358e-05, |
| "loss": 0.5579, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.5111772418022156, |
| "step": 255, |
| "valid_targets_mean": 4674.4, |
| "valid_targets_min": 667 |
| }, |
| { |
| "epoch": 0.416, |
| "grad_norm": 0.8490750724860248, |
| "learning_rate": 3.3099041533546326e-05, |
| "loss": 0.5582, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.5234127044677734, |
| "step": 260, |
| "valid_targets_mean": 4834.0, |
| "valid_targets_min": 767 |
| }, |
| { |
| "epoch": 0.424, |
| "grad_norm": 0.6787686121432547, |
| "learning_rate": 3.3738019169329076e-05, |
| "loss": 0.5422, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.5584520101547241, |
| "step": 265, |
| "valid_targets_mean": 3572.9, |
| "valid_targets_min": 739 |
| }, |
| { |
| "epoch": 0.432, |
| "grad_norm": 0.7210865201308775, |
| "learning_rate": 3.4376996805111825e-05, |
| "loss": 0.5439, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.5728445649147034, |
| "step": 270, |
| "valid_targets_mean": 3147.6, |
| "valid_targets_min": 709 |
| }, |
| { |
| "epoch": 0.44, |
| "grad_norm": 0.9390958887116584, |
| "learning_rate": 3.5015974440894575e-05, |
| "loss": 0.572, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.6330382823944092, |
| "step": 275, |
| "valid_targets_mean": 2163.2, |
| "valid_targets_min": 771 |
| }, |
| { |
| "epoch": 0.448, |
| "grad_norm": 0.7172744444294396, |
| "learning_rate": 3.565495207667732e-05, |
| "loss": 0.5708, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.547631561756134, |
| "step": 280, |
| "valid_targets_mean": 3426.3, |
| "valid_targets_min": 492 |
| }, |
| { |
| "epoch": 0.456, |
| "grad_norm": 0.6587837222708766, |
| "learning_rate": 3.629392971246007e-05, |
| "loss": 0.5714, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.5626546144485474, |
| "step": 285, |
| "valid_targets_mean": 4249.6, |
| "valid_targets_min": 615 |
| }, |
| { |
| "epoch": 0.464, |
| "grad_norm": 0.5946489699255438, |
| "learning_rate": 3.6932907348242816e-05, |
| "loss": 0.5554, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.6051210165023804, |
| "step": 290, |
| "valid_targets_mean": 4729.2, |
| "valid_targets_min": 655 |
| }, |
| { |
| "epoch": 0.472, |
| "grad_norm": 0.7892760841457642, |
| "learning_rate": 3.757188498402556e-05, |
| "loss": 0.5811, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.6125881671905518, |
| "step": 295, |
| "valid_targets_mean": 3489.5, |
| "valid_targets_min": 607 |
| }, |
| { |
| "epoch": 0.48, |
| "grad_norm": 0.6623319928800957, |
| "learning_rate": 3.821086261980831e-05, |
| "loss": 0.5852, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.5646267533302307, |
| "step": 300, |
| "valid_targets_mean": 3532.5, |
| "valid_targets_min": 851 |
| }, |
| { |
| "epoch": 0.488, |
| "grad_norm": 0.6226375467862089, |
| "learning_rate": 3.884984025559106e-05, |
| "loss": 0.5714, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.5953035354614258, |
| "step": 305, |
| "valid_targets_mean": 4777.0, |
| "valid_targets_min": 785 |
| }, |
| { |
| "epoch": 0.496, |
| "grad_norm": 0.7584022572749837, |
| "learning_rate": 3.94888178913738e-05, |
| "loss": 0.5374, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.5502133369445801, |
| "step": 310, |
| "valid_targets_mean": 3806.0, |
| "valid_targets_min": 679 |
| }, |
| { |
| "epoch": 0.504, |
| "grad_norm": 0.7226522137453772, |
| "learning_rate": 3.9999987518434296e-05, |
| "loss": 0.5273, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.5224813222885132, |
| "step": 315, |
| "valid_targets_mean": 3150.1, |
| "valid_targets_min": 655 |
| }, |
| { |
| "epoch": 0.512, |
| "grad_norm": 0.6141445710145204, |
| "learning_rate": 3.999955066527015e-05, |
| "loss": 0.5718, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.5544633269309998, |
| "step": 320, |
| "valid_targets_mean": 4412.2, |
| "valid_targets_min": 535 |
| }, |
| { |
| "epoch": 0.52, |
| "grad_norm": 0.8461142526243931, |
| "learning_rate": 3.999848974939926e-05, |
| "loss": 0.5414, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.5990142822265625, |
| "step": 325, |
| "valid_targets_mean": 2348.9, |
| "valid_targets_min": 499 |
| }, |
| { |
| "epoch": 0.528, |
| "grad_norm": 0.8250606491282058, |
| "learning_rate": 3.999680480392626e-05, |
| "loss": 0.5356, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.5679922103881836, |
| "step": 330, |
| "valid_targets_mean": 3415.2, |
| "valid_targets_min": 629 |
| }, |
| { |
| "epoch": 0.536, |
| "grad_norm": 0.637073771711946, |
| "learning_rate": 3.999449588142792e-05, |
| "loss": 0.534, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.4861408770084381, |
| "step": 335, |
| "valid_targets_mean": 3706.7, |
| "valid_targets_min": 631 |
| }, |
| { |
| "epoch": 0.544, |
| "grad_norm": 0.8398228483120712, |
| "learning_rate": 3.9991563053951476e-05, |
| "loss": 0.5715, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.646068811416626, |
| "step": 340, |
| "valid_targets_mean": 2273.1, |
| "valid_targets_min": 433 |
| }, |
| { |
| "epoch": 0.552, |
| "grad_norm": 0.6121671335659467, |
| "learning_rate": 3.99880064130124e-05, |
| "loss": 0.5564, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.5839049816131592, |
| "step": 345, |
| "valid_targets_mean": 4629.9, |
| "valid_targets_min": 878 |
| }, |
| { |
| "epoch": 0.56, |
| "grad_norm": 0.7358980937968385, |
| "learning_rate": 3.9983826069591535e-05, |
| "loss": 0.5492, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.5735797882080078, |
| "step": 350, |
| "valid_targets_mean": 3127.5, |
| "valid_targets_min": 725 |
| }, |
| { |
| "epoch": 0.568, |
| "grad_norm": 0.6083717163603471, |
| "learning_rate": 3.997902215413163e-05, |
| "loss": 0.5249, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.5112648010253906, |
| "step": 355, |
| "valid_targets_mean": 4718.0, |
| "valid_targets_min": 507 |
| }, |
| { |
| "epoch": 0.576, |
| "grad_norm": 0.6072026819837963, |
| "learning_rate": 3.997359481653327e-05, |
| "loss": 0.5393, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.5504653453826904, |
| "step": 360, |
| "valid_targets_mean": 4234.2, |
| "valid_targets_min": 578 |
| }, |
| { |
| "epoch": 0.584, |
| "grad_norm": 0.5970402191237862, |
| "learning_rate": 3.996754422615023e-05, |
| "loss": 0.547, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.5461069345474243, |
| "step": 365, |
| "valid_targets_mean": 4407.4, |
| "valid_targets_min": 606 |
| }, |
| { |
| "epoch": 0.592, |
| "grad_norm": 0.7672984290731282, |
| "learning_rate": 3.996087057178411e-05, |
| "loss": 0.5539, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.6059372425079346, |
| "step": 370, |
| "valid_targets_mean": 3555.2, |
| "valid_targets_min": 599 |
| }, |
| { |
| "epoch": 0.6, |
| "grad_norm": 0.7939676092215848, |
| "learning_rate": 3.995357406167856e-05, |
| "loss": 0.5563, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.5978292226791382, |
| "step": 375, |
| "valid_targets_mean": 2776.0, |
| "valid_targets_min": 734 |
| }, |
| { |
| "epoch": 0.608, |
| "grad_norm": 0.6525335154383021, |
| "learning_rate": 3.994565492351267e-05, |
| "loss": 0.5352, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.5540485382080078, |
| "step": 380, |
| "valid_targets_mean": 4123.6, |
| "valid_targets_min": 583 |
| }, |
| { |
| "epoch": 0.616, |
| "grad_norm": 0.6989698695789527, |
| "learning_rate": 3.993711340439394e-05, |
| "loss": 0.5343, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.6023855209350586, |
| "step": 385, |
| "valid_targets_mean": 3758.4, |
| "valid_targets_min": 463 |
| }, |
| { |
| "epoch": 0.624, |
| "grad_norm": 0.7124652823560258, |
| "learning_rate": 3.9927949770850535e-05, |
| "loss": 0.5326, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.5666008591651917, |
| "step": 390, |
| "valid_targets_mean": 3212.3, |
| "valid_targets_min": 754 |
| }, |
| { |
| "epoch": 0.632, |
| "grad_norm": 0.6842076356533583, |
| "learning_rate": 3.991816430882297e-05, |
| "loss": 0.5375, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.5813860297203064, |
| "step": 395, |
| "valid_targets_mean": 4066.8, |
| "valid_targets_min": 730 |
| }, |
| { |
| "epoch": 0.64, |
| "grad_norm": 0.529144826449527, |
| "learning_rate": 3.9907757323655206e-05, |
| "loss": 0.5396, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.555700957775116, |
| "step": 400, |
| "valid_targets_mean": 7514.6, |
| "valid_targets_min": 874 |
| }, |
| { |
| "epoch": 0.648, |
| "grad_norm": 0.687588424871281, |
| "learning_rate": 3.98967291400851e-05, |
| "loss": 0.5169, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.5300942659378052, |
| "step": 405, |
| "valid_targets_mean": 3809.2, |
| "valid_targets_min": 695 |
| }, |
| { |
| "epoch": 0.656, |
| "grad_norm": 0.6988433600033485, |
| "learning_rate": 3.98850801022343e-05, |
| "loss": 0.5232, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.44089508056640625, |
| "step": 410, |
| "valid_targets_mean": 4746.0, |
| "valid_targets_min": 570 |
| }, |
| { |
| "epoch": 0.664, |
| "grad_norm": 0.6587643148830101, |
| "learning_rate": 3.987281057359746e-05, |
| "loss": 0.5335, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.5711066126823425, |
| "step": 415, |
| "valid_targets_mean": 3932.2, |
| "valid_targets_min": 507 |
| }, |
| { |
| "epoch": 0.672, |
| "grad_norm": 0.6308013522460244, |
| "learning_rate": 3.985992093703096e-05, |
| "loss": 0.5377, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.5582001805305481, |
| "step": 420, |
| "valid_targets_mean": 3887.5, |
| "valid_targets_min": 589 |
| }, |
| { |
| "epoch": 0.68, |
| "grad_norm": 0.5418196566696337, |
| "learning_rate": 3.98464115947409e-05, |
| "loss": 0.5323, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.49433648586273193, |
| "step": 425, |
| "valid_targets_mean": 5441.3, |
| "valid_targets_min": 720 |
| }, |
| { |
| "epoch": 0.688, |
| "grad_norm": 0.7175445202648967, |
| "learning_rate": 3.9832282968270595e-05, |
| "loss": 0.5287, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.552021861076355, |
| "step": 430, |
| "valid_targets_mean": 2823.0, |
| "valid_targets_min": 776 |
| }, |
| { |
| "epoch": 0.696, |
| "grad_norm": 0.6367170247884075, |
| "learning_rate": 3.9817535498487385e-05, |
| "loss": 0.5304, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.5349035263061523, |
| "step": 435, |
| "valid_targets_mean": 4406.4, |
| "valid_targets_min": 761 |
| }, |
| { |
| "epoch": 0.704, |
| "grad_norm": 0.6231922620233467, |
| "learning_rate": 3.980216964556892e-05, |
| "loss": 0.5176, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.5187514424324036, |
| "step": 440, |
| "valid_targets_mean": 4343.2, |
| "valid_targets_min": 724 |
| }, |
| { |
| "epoch": 0.712, |
| "grad_norm": 0.7123358352627772, |
| "learning_rate": 3.978618588898873e-05, |
| "loss": 0.5295, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.5067673921585083, |
| "step": 445, |
| "valid_targets_mean": 3212.3, |
| "valid_targets_min": 872 |
| }, |
| { |
| "epoch": 0.72, |
| "grad_norm": 0.7454664370057654, |
| "learning_rate": 3.976958472750137e-05, |
| "loss": 0.537, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.5686776638031006, |
| "step": 450, |
| "valid_targets_mean": 3169.4, |
| "valid_targets_min": 646 |
| }, |
| { |
| "epoch": 0.728, |
| "grad_norm": 0.5174561677012455, |
| "learning_rate": 3.9752366679126754e-05, |
| "loss": 0.528, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.5228891968727112, |
| "step": 455, |
| "valid_targets_mean": 5854.7, |
| "valid_targets_min": 495 |
| }, |
| { |
| "epoch": 0.736, |
| "grad_norm": 0.7061480122954578, |
| "learning_rate": 3.973453228113405e-05, |
| "loss": 0.5422, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.5699916481971741, |
| "step": 460, |
| "valid_targets_mean": 3457.9, |
| "valid_targets_min": 631 |
| }, |
| { |
| "epoch": 0.744, |
| "grad_norm": 0.6372505538914572, |
| "learning_rate": 3.971608209002489e-05, |
| "loss": 0.5036, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.510094940662384, |
| "step": 465, |
| "valid_targets_mean": 3599.1, |
| "valid_targets_min": 827 |
| }, |
| { |
| "epoch": 0.752, |
| "grad_norm": 0.6192730292845192, |
| "learning_rate": 3.969701668151603e-05, |
| "loss": 0.4938, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.5506471395492554, |
| "step": 470, |
| "valid_targets_mean": 4186.9, |
| "valid_targets_min": 605 |
| }, |
| { |
| "epoch": 0.76, |
| "grad_norm": 0.6458176448811681, |
| "learning_rate": 3.9677336650521336e-05, |
| "loss": 0.51, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.4645317792892456, |
| "step": 475, |
| "valid_targets_mean": 5438.2, |
| "valid_targets_min": 691 |
| }, |
| { |
| "epoch": 0.768, |
| "grad_norm": 0.6877541407077931, |
| "learning_rate": 3.9657042611133294e-05, |
| "loss": 0.5309, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.5832065343856812, |
| "step": 480, |
| "valid_targets_mean": 4794.7, |
| "valid_targets_min": 1011 |
| }, |
| { |
| "epoch": 0.776, |
| "grad_norm": 0.7261934590292777, |
| "learning_rate": 3.963613519660379e-05, |
| "loss": 0.5469, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.5814934968948364, |
| "step": 485, |
| "valid_targets_mean": 3265.4, |
| "valid_targets_min": 814 |
| }, |
| { |
| "epoch": 0.784, |
| "grad_norm": 0.5727199057578912, |
| "learning_rate": 3.961461505932435e-05, |
| "loss": 0.5226, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.5271404385566711, |
| "step": 490, |
| "valid_targets_mean": 5650.6, |
| "valid_targets_min": 795 |
| }, |
| { |
| "epoch": 0.792, |
| "grad_norm": 0.6931137062168018, |
| "learning_rate": 3.959248287080583e-05, |
| "loss": 0.4874, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.5182836055755615, |
| "step": 495, |
| "valid_targets_mean": 2894.6, |
| "valid_targets_min": 634 |
| }, |
| { |
| "epoch": 0.8, |
| "grad_norm": 0.5579037807480154, |
| "learning_rate": 3.9569739321657416e-05, |
| "loss": 0.5329, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.4890630543231964, |
| "step": 500, |
| "valid_targets_mean": 4849.6, |
| "valid_targets_min": 882 |
| }, |
| { |
| "epoch": 0.808, |
| "grad_norm": 0.5278555941049078, |
| "learning_rate": 3.9546385121565095e-05, |
| "loss": 0.5214, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.4740561842918396, |
| "step": 505, |
| "valid_targets_mean": 5560.9, |
| "valid_targets_min": 386 |
| }, |
| { |
| "epoch": 0.816, |
| "grad_norm": 0.7629284256030876, |
| "learning_rate": 3.952242099926951e-05, |
| "loss": 0.5019, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.5348608493804932, |
| "step": 510, |
| "valid_targets_mean": 3005.8, |
| "valid_targets_min": 485 |
| }, |
| { |
| "epoch": 0.824, |
| "grad_norm": 0.5984390769675876, |
| "learning_rate": 3.9497847702543196e-05, |
| "loss": 0.5011, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.49162226915359497, |
| "step": 515, |
| "valid_targets_mean": 4003.1, |
| "valid_targets_min": 864 |
| }, |
| { |
| "epoch": 0.832, |
| "grad_norm": 0.5425603828548777, |
| "learning_rate": 3.94726659981673e-05, |
| "loss": 0.5236, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.4525638222694397, |
| "step": 520, |
| "valid_targets_mean": 4395.4, |
| "valid_targets_min": 617 |
| }, |
| { |
| "epoch": 0.84, |
| "grad_norm": 0.527115667278833, |
| "learning_rate": 3.94468766719076e-05, |
| "loss": 0.5203, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.5383976101875305, |
| "step": 525, |
| "valid_targets_mean": 6022.6, |
| "valid_targets_min": 776 |
| }, |
| { |
| "epoch": 0.848, |
| "grad_norm": 0.48267274772473334, |
| "learning_rate": 3.942048052849001e-05, |
| "loss": 0.4667, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.40104740858078003, |
| "step": 530, |
| "valid_targets_mean": 5891.2, |
| "valid_targets_min": 675 |
| }, |
| { |
| "epoch": 0.856, |
| "grad_norm": 0.7791947549458919, |
| "learning_rate": 3.939347839157548e-05, |
| "loss": 0.5056, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.5501073598861694, |
| "step": 535, |
| "valid_targets_mean": 2821.9, |
| "valid_targets_min": 780 |
| }, |
| { |
| "epoch": 0.864, |
| "grad_norm": 0.7336120776006877, |
| "learning_rate": 3.9365871103734264e-05, |
| "loss": 0.5003, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.5346959829330444, |
| "step": 540, |
| "valid_targets_mean": 3434.2, |
| "valid_targets_min": 733 |
| }, |
| { |
| "epoch": 0.872, |
| "grad_norm": 0.5526825963889843, |
| "learning_rate": 3.933765952641965e-05, |
| "loss": 0.4971, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.4672126770019531, |
| "step": 545, |
| "valid_targets_mean": 4462.4, |
| "valid_targets_min": 904 |
| }, |
| { |
| "epoch": 0.88, |
| "grad_norm": 0.6189947196809612, |
| "learning_rate": 3.930884453994109e-05, |
| "loss": 0.4983, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.4648451507091522, |
| "step": 550, |
| "valid_targets_mean": 3606.6, |
| "valid_targets_min": 624 |
| }, |
| { |
| "epoch": 0.888, |
| "grad_norm": 0.6586170474235856, |
| "learning_rate": 3.9279427043436706e-05, |
| "loss": 0.5388, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.5403224229812622, |
| "step": 555, |
| "valid_targets_mean": 3831.8, |
| "valid_targets_min": 415 |
| }, |
| { |
| "epoch": 0.896, |
| "grad_norm": 0.5313121728145141, |
| "learning_rate": 3.924940795484525e-05, |
| "loss": 0.5063, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.521693766117096, |
| "step": 560, |
| "valid_targets_mean": 5235.8, |
| "valid_targets_min": 828 |
| }, |
| { |
| "epoch": 0.904, |
| "grad_norm": 0.6424391584952766, |
| "learning_rate": 3.9218788210877436e-05, |
| "loss": 0.5359, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.5287529826164246, |
| "step": 565, |
| "valid_targets_mean": 3747.9, |
| "valid_targets_min": 597 |
| }, |
| { |
| "epoch": 0.912, |
| "grad_norm": 0.7979713052864025, |
| "learning_rate": 3.918756876698676e-05, |
| "loss": 0.517, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.5333600640296936, |
| "step": 570, |
| "valid_targets_mean": 4772.2, |
| "valid_targets_min": 426 |
| }, |
| { |
| "epoch": 0.92, |
| "grad_norm": 0.5943189435660875, |
| "learning_rate": 3.9155750597339634e-05, |
| "loss": 0.4952, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.5387169718742371, |
| "step": 575, |
| "valid_targets_mean": 4364.7, |
| "valid_targets_min": 743 |
| }, |
| { |
| "epoch": 0.928, |
| "grad_norm": 0.6520342943163902, |
| "learning_rate": 3.912333469478502e-05, |
| "loss": 0.5197, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.5179246068000793, |
| "step": 580, |
| "valid_targets_mean": 3263.0, |
| "valid_targets_min": 735 |
| }, |
| { |
| "epoch": 0.936, |
| "grad_norm": 0.6103078060063878, |
| "learning_rate": 3.909032207082344e-05, |
| "loss": 0.4996, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.49960577487945557, |
| "step": 585, |
| "valid_targets_mean": 4096.7, |
| "valid_targets_min": 505 |
| }, |
| { |
| "epoch": 0.944, |
| "grad_norm": 0.585543703034473, |
| "learning_rate": 3.90567137555754e-05, |
| "loss": 0.5287, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.5424899458885193, |
| "step": 590, |
| "valid_targets_mean": 4775.8, |
| "valid_targets_min": 857 |
| }, |
| { |
| "epoch": 0.952, |
| "grad_norm": 0.6304193255405047, |
| "learning_rate": 3.9022510797749286e-05, |
| "loss": 0.5087, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.5315080285072327, |
| "step": 595, |
| "valid_targets_mean": 4235.9, |
| "valid_targets_min": 907 |
| }, |
| { |
| "epoch": 0.96, |
| "grad_norm": 0.585015028731908, |
| "learning_rate": 3.898771426460859e-05, |
| "loss": 0.4945, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.4809357523918152, |
| "step": 600, |
| "valid_targets_mean": 3830.8, |
| "valid_targets_min": 628 |
| }, |
| { |
| "epoch": 0.968, |
| "grad_norm": 0.68245860217036, |
| "learning_rate": 3.8952325241938635e-05, |
| "loss": 0.5126, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.5318968296051025, |
| "step": 605, |
| "valid_targets_mean": 4136.1, |
| "valid_targets_min": 635 |
| }, |
| { |
| "epoch": 0.976, |
| "grad_norm": 0.6148876956191819, |
| "learning_rate": 3.8916344834012695e-05, |
| "loss": 0.5311, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.5257702469825745, |
| "step": 610, |
| "valid_targets_mean": 4727.1, |
| "valid_targets_min": 644 |
| }, |
| { |
| "epoch": 0.984, |
| "grad_norm": 0.6143278822542023, |
| "learning_rate": 3.887977416355754e-05, |
| "loss": 0.5224, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.4943949580192566, |
| "step": 615, |
| "valid_targets_mean": 3667.9, |
| "valid_targets_min": 775 |
| }, |
| { |
| "epoch": 0.992, |
| "grad_norm": 0.639756859129058, |
| "learning_rate": 3.884261437171838e-05, |
| "loss": 0.5033, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.5292478799819946, |
| "step": 620, |
| "valid_targets_mean": 3723.4, |
| "valid_targets_min": 588 |
| }, |
| { |
| "epoch": 1.0, |
| "grad_norm": 0.6034626688615775, |
| "learning_rate": 3.8804866618023284e-05, |
| "loss": 0.4778, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.5043004751205444, |
| "step": 625, |
| "valid_targets_mean": 4286.8, |
| "valid_targets_min": 593 |
| }, |
| { |
| "epoch": 1.008, |
| "grad_norm": 0.5749723492360072, |
| "learning_rate": 3.876653208034698e-05, |
| "loss": 0.5212, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.4886097311973572, |
| "step": 630, |
| "valid_targets_mean": 4484.8, |
| "valid_targets_min": 710 |
| }, |
| { |
| "epoch": 1.016, |
| "grad_norm": 0.5975830354439139, |
| "learning_rate": 3.8727611954874114e-05, |
| "loss": 0.4941, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.4872697591781616, |
| "step": 635, |
| "valid_targets_mean": 4030.0, |
| "valid_targets_min": 701 |
| }, |
| { |
| "epoch": 1.024, |
| "grad_norm": 0.6626052135788788, |
| "learning_rate": 3.8688107456061904e-05, |
| "loss": 0.4666, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.48330509662628174, |
| "step": 640, |
| "valid_targets_mean": 3877.7, |
| "valid_targets_min": 751 |
| }, |
| { |
| "epoch": 1.032, |
| "grad_norm": 0.5825477612458702, |
| "learning_rate": 3.864801981660227e-05, |
| "loss": 0.4876, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.50968998670578, |
| "step": 645, |
| "valid_targets_mean": 4582.6, |
| "valid_targets_min": 678 |
| }, |
| { |
| "epoch": 1.04, |
| "grad_norm": 0.5888038935122548, |
| "learning_rate": 3.860735028738337e-05, |
| "loss": 0.4909, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.4983733296394348, |
| "step": 650, |
| "valid_targets_mean": 5661.3, |
| "valid_targets_min": 946 |
| }, |
| { |
| "epoch": 1.048, |
| "grad_norm": 0.7028901777525807, |
| "learning_rate": 3.856610013745051e-05, |
| "loss": 0.4675, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.43987807631492615, |
| "step": 655, |
| "valid_targets_mean": 2972.2, |
| "valid_targets_min": 540 |
| }, |
| { |
| "epoch": 1.056, |
| "grad_norm": 0.6837565819150657, |
| "learning_rate": 3.852427065396665e-05, |
| "loss": 0.5386, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.54156893491745, |
| "step": 660, |
| "valid_targets_mean": 3283.2, |
| "valid_targets_min": 984 |
| }, |
| { |
| "epoch": 1.064, |
| "grad_norm": 0.7103924713439609, |
| "learning_rate": 3.848186314217213e-05, |
| "loss": 0.4915, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.5271738767623901, |
| "step": 665, |
| "valid_targets_mean": 3783.6, |
| "valid_targets_min": 591 |
| }, |
| { |
| "epoch": 1.072, |
| "grad_norm": 0.5777473820322118, |
| "learning_rate": 3.843887892534402e-05, |
| "loss": 0.4949, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.4844241142272949, |
| "step": 670, |
| "valid_targets_mean": 5510.7, |
| "valid_targets_min": 801 |
| }, |
| { |
| "epoch": 1.08, |
| "grad_norm": 0.5592068039838433, |
| "learning_rate": 3.8395319344754776e-05, |
| "loss": 0.4824, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.4355768859386444, |
| "step": 675, |
| "valid_targets_mean": 4872.8, |
| "valid_targets_min": 775 |
| }, |
| { |
| "epoch": 1.088, |
| "grad_norm": 0.5196780282819776, |
| "learning_rate": 3.8351185759630435e-05, |
| "loss": 0.5028, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.4816337525844574, |
| "step": 680, |
| "valid_targets_mean": 6182.8, |
| "valid_targets_min": 689 |
| }, |
| { |
| "epoch": 1.096, |
| "grad_norm": 0.4974070083115012, |
| "learning_rate": 3.830647954710816e-05, |
| "loss": 0.4799, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.4324873685836792, |
| "step": 685, |
| "valid_targets_mean": 5340.4, |
| "valid_targets_min": 622 |
| }, |
| { |
| "epoch": 1.104, |
| "grad_norm": 0.5227557174907695, |
| "learning_rate": 3.826120210219331e-05, |
| "loss": 0.4665, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.4405563771724701, |
| "step": 690, |
| "valid_targets_mean": 5245.5, |
| "valid_targets_min": 822 |
| }, |
| { |
| "epoch": 1.112, |
| "grad_norm": 0.5415434424451512, |
| "learning_rate": 3.8215354837715836e-05, |
| "loss": 0.4753, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.443329781293869, |
| "step": 695, |
| "valid_targets_mean": 6236.1, |
| "valid_targets_min": 756 |
| }, |
| { |
| "epoch": 1.12, |
| "grad_norm": 0.6938512610507073, |
| "learning_rate": 3.816893918428631e-05, |
| "loss": 0.5224, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.5610541701316833, |
| "step": 700, |
| "valid_targets_mean": 3587.6, |
| "valid_targets_min": 975 |
| }, |
| { |
| "epoch": 1.1280000000000001, |
| "grad_norm": 0.7257198661742723, |
| "learning_rate": 3.8121956590251153e-05, |
| "loss": 0.4849, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.511725902557373, |
| "step": 705, |
| "valid_targets_mean": 2714.5, |
| "valid_targets_min": 704 |
| }, |
| { |
| "epoch": 1.1360000000000001, |
| "grad_norm": 0.7628570201199647, |
| "learning_rate": 3.8074408521647576e-05, |
| "loss": 0.4942, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.5041239857673645, |
| "step": 710, |
| "valid_targets_mean": 4192.9, |
| "valid_targets_min": 688 |
| }, |
| { |
| "epoch": 1.144, |
| "grad_norm": 0.7232575314594617, |
| "learning_rate": 3.802629646215771e-05, |
| "loss": 0.5357, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.5536401271820068, |
| "step": 715, |
| "valid_targets_mean": 3258.6, |
| "valid_targets_min": 492 |
| }, |
| { |
| "epoch": 1.152, |
| "grad_norm": 0.5322461206523738, |
| "learning_rate": 3.79776219130624e-05, |
| "loss": 0.5255, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.4725511074066162, |
| "step": 720, |
| "valid_targets_mean": 5086.8, |
| "valid_targets_min": 754 |
| }, |
| { |
| "epoch": 1.16, |
| "grad_norm": 0.5597590750275225, |
| "learning_rate": 3.792838639319431e-05, |
| "loss": 0.4851, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.4070642590522766, |
| "step": 725, |
| "valid_targets_mean": 3765.9, |
| "valid_targets_min": 598 |
| }, |
| { |
| "epoch": 1.168, |
| "grad_norm": 0.5995633156774554, |
| "learning_rate": 3.787859143889054e-05, |
| "loss": 0.4643, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.5027796030044556, |
| "step": 730, |
| "valid_targets_mean": 4211.0, |
| "valid_targets_min": 689 |
| }, |
| { |
| "epoch": 1.176, |
| "grad_norm": 0.7391042973959496, |
| "learning_rate": 3.782823860394469e-05, |
| "loss": 0.535, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.478831022977829, |
| "step": 735, |
| "valid_targets_mean": 3402.7, |
| "valid_targets_min": 428 |
| }, |
| { |
| "epoch": 1.184, |
| "grad_norm": 0.655094019532376, |
| "learning_rate": 3.777732945955841e-05, |
| "loss": 0.4662, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.49596506357192993, |
| "step": 740, |
| "valid_targets_mean": 4551.3, |
| "valid_targets_min": 786 |
| }, |
| { |
| "epoch": 1.192, |
| "grad_norm": 0.6319621366301474, |
| "learning_rate": 3.772586559429229e-05, |
| "loss": 0.4796, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.5001382231712341, |
| "step": 745, |
| "valid_targets_mean": 3626.9, |
| "valid_targets_min": 925 |
| }, |
| { |
| "epoch": 1.2, |
| "grad_norm": 0.5834982530634643, |
| "learning_rate": 3.767384861401636e-05, |
| "loss": 0.4846, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.4496903419494629, |
| "step": 750, |
| "valid_targets_mean": 3643.1, |
| "valid_targets_min": 861 |
| }, |
| { |
| "epoch": 1.208, |
| "grad_norm": 0.7608316000603859, |
| "learning_rate": 3.762128014185998e-05, |
| "loss": 0.5195, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.5569829344749451, |
| "step": 755, |
| "valid_targets_mean": 2473.0, |
| "valid_targets_min": 473 |
| }, |
| { |
| "epoch": 1.216, |
| "grad_norm": 0.5591412298342779, |
| "learning_rate": 3.7568161818161135e-05, |
| "loss": 0.4618, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.49754035472869873, |
| "step": 760, |
| "valid_targets_mean": 6402.6, |
| "valid_targets_min": 1106 |
| }, |
| { |
| "epoch": 1.224, |
| "grad_norm": 0.8123260766469027, |
| "learning_rate": 3.751449530041532e-05, |
| "loss": 0.4975, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.5815908908843994, |
| "step": 765, |
| "valid_targets_mean": 2641.3, |
| "valid_targets_min": 795 |
| }, |
| { |
| "epoch": 1.232, |
| "grad_norm": 0.6101133475673763, |
| "learning_rate": 3.7460282263223764e-05, |
| "loss": 0.4819, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.4854985475540161, |
| "step": 770, |
| "valid_targets_mean": 4249.1, |
| "valid_targets_min": 590 |
| }, |
| { |
| "epoch": 1.24, |
| "grad_norm": 0.5375018128815826, |
| "learning_rate": 3.740552439824122e-05, |
| "loss": 0.486, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.4772304594516754, |
| "step": 775, |
| "valid_targets_mean": 4520.9, |
| "valid_targets_min": 801 |
| }, |
| { |
| "epoch": 1.248, |
| "grad_norm": 0.51139105848858, |
| "learning_rate": 3.735022341412314e-05, |
| "loss": 0.477, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.47216999530792236, |
| "step": 780, |
| "valid_targets_mean": 6126.1, |
| "valid_targets_min": 738 |
| }, |
| { |
| "epoch": 1.256, |
| "grad_norm": 0.5195276484071466, |
| "learning_rate": 3.7294381036472386e-05, |
| "loss": 0.4797, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.46269387006759644, |
| "step": 785, |
| "valid_targets_mean": 4958.2, |
| "valid_targets_min": 667 |
| }, |
| { |
| "epoch": 1.264, |
| "grad_norm": 0.6267531451482399, |
| "learning_rate": 3.723799900778538e-05, |
| "loss": 0.4883, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.4804888665676117, |
| "step": 790, |
| "valid_targets_mean": 3517.1, |
| "valid_targets_min": 578 |
| }, |
| { |
| "epoch": 1.272, |
| "grad_norm": 0.5195057436049215, |
| "learning_rate": 3.7181079087397705e-05, |
| "loss": 0.5087, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.5404967665672302, |
| "step": 795, |
| "valid_targets_mean": 6603.4, |
| "valid_targets_min": 989 |
| }, |
| { |
| "epoch": 1.28, |
| "grad_norm": 0.5398694980743434, |
| "learning_rate": 3.712362305142926e-05, |
| "loss": 0.4393, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.4667036831378937, |
| "step": 800, |
| "valid_targets_mean": 4789.3, |
| "valid_targets_min": 512 |
| }, |
| { |
| "epoch": 1.288, |
| "grad_norm": 0.700472880561129, |
| "learning_rate": 3.706563269272878e-05, |
| "loss": 0.4852, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.45391908288002014, |
| "step": 805, |
| "valid_targets_mean": 2936.9, |
| "valid_targets_min": 646 |
| }, |
| { |
| "epoch": 1.296, |
| "grad_norm": 0.6212205565818121, |
| "learning_rate": 3.700710982081794e-05, |
| "loss": 0.4758, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.4718417823314667, |
| "step": 810, |
| "valid_targets_mean": 3432.1, |
| "valid_targets_min": 782 |
| }, |
| { |
| "epoch": 1.304, |
| "grad_norm": 0.6408053164272295, |
| "learning_rate": 3.694805626183486e-05, |
| "loss": 0.4872, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.5090664625167847, |
| "step": 815, |
| "valid_targets_mean": 4112.0, |
| "valid_targets_min": 860 |
| }, |
| { |
| "epoch": 1.312, |
| "grad_norm": 0.7001179282352733, |
| "learning_rate": 3.688847385847711e-05, |
| "loss": 0.4719, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.427803099155426, |
| "step": 820, |
| "valid_targets_mean": 3749.1, |
| "valid_targets_min": 1009 |
| }, |
| { |
| "epoch": 1.32, |
| "grad_norm": 0.6511396074795565, |
| "learning_rate": 3.682836446994428e-05, |
| "loss": 0.5126, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.4967302083969116, |
| "step": 825, |
| "valid_targets_mean": 3997.8, |
| "valid_targets_min": 718 |
| }, |
| { |
| "epoch": 1.328, |
| "grad_norm": 0.593371544756325, |
| "learning_rate": 3.676772997187989e-05, |
| "loss": 0.4859, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.475099116563797, |
| "step": 830, |
| "valid_targets_mean": 4375.9, |
| "valid_targets_min": 719 |
| }, |
| { |
| "epoch": 1.336, |
| "grad_norm": 0.6550709845667457, |
| "learning_rate": 3.670657225631289e-05, |
| "loss": 0.4717, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.5210568904876709, |
| "step": 835, |
| "valid_targets_mean": 3314.4, |
| "valid_targets_min": 662 |
| }, |
| { |
| "epoch": 1.3439999999999999, |
| "grad_norm": 0.6168115512142734, |
| "learning_rate": 3.6644893231598635e-05, |
| "loss": 0.4695, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.5161671042442322, |
| "step": 840, |
| "valid_targets_mean": 3743.0, |
| "valid_targets_min": 552 |
| }, |
| { |
| "epoch": 1.3519999999999999, |
| "grad_norm": 1.2636079758657017, |
| "learning_rate": 3.658269482235932e-05, |
| "loss": 0.4564, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.433046817779541, |
| "step": 845, |
| "valid_targets_mean": 2702.0, |
| "valid_targets_min": 640 |
| }, |
| { |
| "epoch": 1.3599999999999999, |
| "grad_norm": 0.644979165166496, |
| "learning_rate": 3.651997896942394e-05, |
| "loss": 0.525, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.5414267778396606, |
| "step": 850, |
| "valid_targets_mean": 4083.8, |
| "valid_targets_min": 815 |
| }, |
| { |
| "epoch": 1.3679999999999999, |
| "grad_norm": 0.5287402349737144, |
| "learning_rate": 3.645674762976769e-05, |
| "loss": 0.4819, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.43094199895858765, |
| "step": 855, |
| "valid_targets_mean": 4626.4, |
| "valid_targets_min": 583 |
| }, |
| { |
| "epoch": 1.376, |
| "grad_norm": 0.609279043498901, |
| "learning_rate": 3.639300277645096e-05, |
| "loss": 0.475, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.49126923084259033, |
| "step": 860, |
| "valid_targets_mean": 4487.2, |
| "valid_targets_min": 900 |
| }, |
| { |
| "epoch": 1.384, |
| "grad_norm": 0.645279015628696, |
| "learning_rate": 3.6328746398557715e-05, |
| "loss": 0.4776, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.500410795211792, |
| "step": 865, |
| "valid_targets_mean": 3312.8, |
| "valid_targets_min": 447 |
| }, |
| { |
| "epoch": 1.392, |
| "grad_norm": 0.6099569963138785, |
| "learning_rate": 3.6263980501133466e-05, |
| "loss": 0.4815, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.4480360150337219, |
| "step": 870, |
| "valid_targets_mean": 4288.2, |
| "valid_targets_min": 658 |
| }, |
| { |
| "epoch": 1.4, |
| "grad_norm": 0.5594438345209423, |
| "learning_rate": 3.619870710512268e-05, |
| "loss": 0.4831, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.46603310108184814, |
| "step": 875, |
| "valid_targets_mean": 4127.5, |
| "valid_targets_min": 810 |
| }, |
| { |
| "epoch": 1.408, |
| "grad_norm": 0.7040863724335125, |
| "learning_rate": 3.6132928247305713e-05, |
| "loss": 0.4717, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.4972262978553772, |
| "step": 880, |
| "valid_targets_mean": 4002.6, |
| "valid_targets_min": 811 |
| }, |
| { |
| "epoch": 1.416, |
| "grad_norm": 0.4723530474869513, |
| "learning_rate": 3.60666459802353e-05, |
| "loss": 0.4683, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.45891261100769043, |
| "step": 885, |
| "valid_targets_mean": 6404.6, |
| "valid_targets_min": 860 |
| }, |
| { |
| "epoch": 1.424, |
| "grad_norm": 0.6504389615505566, |
| "learning_rate": 3.599986237217245e-05, |
| "loss": 0.4589, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.49261537194252014, |
| "step": 890, |
| "valid_targets_mean": 3836.1, |
| "valid_targets_min": 597 |
| }, |
| { |
| "epoch": 1.432, |
| "grad_norm": 0.5829046317294024, |
| "learning_rate": 3.593257950702194e-05, |
| "loss": 0.4371, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.41449180245399475, |
| "step": 895, |
| "valid_targets_mean": 4351.4, |
| "valid_targets_min": 373 |
| }, |
| { |
| "epoch": 1.44, |
| "grad_norm": 0.6928805501763816, |
| "learning_rate": 3.586479948426728e-05, |
| "loss": 0.483, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.44609037041664124, |
| "step": 900, |
| "valid_targets_mean": 4319.5, |
| "valid_targets_min": 763 |
| }, |
| { |
| "epoch": 1.448, |
| "grad_norm": 0.6643739326321101, |
| "learning_rate": 3.579652441890523e-05, |
| "loss": 0.4797, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.49757933616638184, |
| "step": 905, |
| "valid_targets_mean": 3803.0, |
| "valid_targets_min": 657 |
| }, |
| { |
| "epoch": 1.456, |
| "grad_norm": 0.6143346831296209, |
| "learning_rate": 3.572775644137974e-05, |
| "loss": 0.4814, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.4909932315349579, |
| "step": 910, |
| "valid_targets_mean": 3776.1, |
| "valid_targets_min": 765 |
| }, |
| { |
| "epoch": 1.464, |
| "grad_norm": 0.529180684369256, |
| "learning_rate": 3.5658497697515534e-05, |
| "loss": 0.4566, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.5000677704811096, |
| "step": 915, |
| "valid_targets_mean": 6069.6, |
| "valid_targets_min": 812 |
| }, |
| { |
| "epoch": 1.472, |
| "grad_norm": 0.6497553129314787, |
| "learning_rate": 3.558875034845113e-05, |
| "loss": 0.4521, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.4506397545337677, |
| "step": 920, |
| "valid_targets_mean": 3804.3, |
| "valid_targets_min": 560 |
| }, |
| { |
| "epoch": 1.48, |
| "grad_norm": 0.4920648541618837, |
| "learning_rate": 3.551851657057139e-05, |
| "loss": 0.4807, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.4525104761123657, |
| "step": 925, |
| "valid_targets_mean": 7107.8, |
| "valid_targets_min": 635 |
| }, |
| { |
| "epoch": 1.488, |
| "grad_norm": 0.7772212863915389, |
| "learning_rate": 3.544779855543963e-05, |
| "loss": 0.4908, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.4923700988292694, |
| "step": 930, |
| "valid_targets_mean": 2380.3, |
| "valid_targets_min": 624 |
| }, |
| { |
| "epoch": 1.496, |
| "grad_norm": 0.5981404469738086, |
| "learning_rate": 3.5376598509729226e-05, |
| "loss": 0.4821, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.4714764952659607, |
| "step": 935, |
| "valid_targets_mean": 4965.3, |
| "valid_targets_min": 563 |
| }, |
| { |
| "epoch": 1.504, |
| "grad_norm": 0.7007792353553981, |
| "learning_rate": 3.5304918655154754e-05, |
| "loss": 0.4921, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.4638800024986267, |
| "step": 940, |
| "valid_targets_mean": 3031.9, |
| "valid_targets_min": 817 |
| }, |
| { |
| "epoch": 1.512, |
| "grad_norm": 0.6097210410936542, |
| "learning_rate": 3.523276122840266e-05, |
| "loss": 0.4893, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.483889102935791, |
| "step": 945, |
| "valid_targets_mean": 3922.5, |
| "valid_targets_min": 767 |
| }, |
| { |
| "epoch": 1.52, |
| "grad_norm": 0.7526194303601134, |
| "learning_rate": 3.516012848106149e-05, |
| "loss": 0.4721, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.5017504692077637, |
| "step": 950, |
| "valid_targets_mean": 2572.9, |
| "valid_targets_min": 755 |
| }, |
| { |
| "epoch": 1.528, |
| "grad_norm": 0.46052003404390657, |
| "learning_rate": 3.5087022679551614e-05, |
| "loss": 0.4661, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.41806378960609436, |
| "step": 955, |
| "valid_targets_mean": 5992.2, |
| "valid_targets_min": 751 |
| }, |
| { |
| "epoch": 1.536, |
| "grad_norm": 0.6989167426008138, |
| "learning_rate": 3.5013446105054486e-05, |
| "loss": 0.4931, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.5233873128890991, |
| "step": 960, |
| "valid_targets_mean": 2915.4, |
| "valid_targets_min": 935 |
| }, |
| { |
| "epoch": 1.544, |
| "grad_norm": 0.7730262333694343, |
| "learning_rate": 3.493940105344152e-05, |
| "loss": 0.4765, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.45950740575790405, |
| "step": 965, |
| "valid_targets_mean": 3003.8, |
| "valid_targets_min": 601 |
| }, |
| { |
| "epoch": 1.552, |
| "grad_norm": 0.6796211235694684, |
| "learning_rate": 3.4864889835202366e-05, |
| "loss": 0.4963, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.4867255389690399, |
| "step": 970, |
| "valid_targets_mean": 5517.5, |
| "valid_targets_min": 1042 |
| }, |
| { |
| "epoch": 1.56, |
| "grad_norm": 0.882468209296317, |
| "learning_rate": 3.4789914775372905e-05, |
| "loss": 0.4956, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.5269094705581665, |
| "step": 975, |
| "valid_targets_mean": 2169.9, |
| "valid_targets_min": 816 |
| }, |
| { |
| "epoch": 1.568, |
| "grad_norm": 0.6427886583581234, |
| "learning_rate": 3.471447821346264e-05, |
| "loss": 0.4946, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.5064438581466675, |
| "step": 980, |
| "valid_targets_mean": 3668.9, |
| "valid_targets_min": 802 |
| }, |
| { |
| "epoch": 1.576, |
| "grad_norm": 0.4751807016740937, |
| "learning_rate": 3.463858250338168e-05, |
| "loss": 0.478, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.4542385935783386, |
| "step": 985, |
| "valid_targets_mean": 7338.5, |
| "valid_targets_min": 371 |
| }, |
| { |
| "epoch": 1.584, |
| "grad_norm": 0.5520255318021472, |
| "learning_rate": 3.4562230013367374e-05, |
| "loss": 0.467, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.47316858172416687, |
| "step": 990, |
| "valid_targets_mean": 4990.0, |
| "valid_targets_min": 786 |
| }, |
| { |
| "epoch": 1.592, |
| "grad_norm": 0.5538940893817148, |
| "learning_rate": 3.448542312591032e-05, |
| "loss": 0.4678, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.43099331855773926, |
| "step": 995, |
| "valid_targets_mean": 4630.3, |
| "valid_targets_min": 766 |
| }, |
| { |
| "epoch": 1.6, |
| "grad_norm": 0.49936258088092805, |
| "learning_rate": 3.440816423768007e-05, |
| "loss": 0.4788, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.4556550085544586, |
| "step": 1000, |
| "valid_targets_mean": 5382.2, |
| "valid_targets_min": 557 |
| }, |
| { |
| "epoch": 1.608, |
| "grad_norm": 0.6836362049629878, |
| "learning_rate": 3.433045575945031e-05, |
| "loss": 0.4665, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.5310341119766235, |
| "step": 1005, |
| "valid_targets_mean": 2997.4, |
| "valid_targets_min": 705 |
| }, |
| { |
| "epoch": 1.616, |
| "grad_norm": 0.5410029620184749, |
| "learning_rate": 3.42523001160237e-05, |
| "loss": 0.4847, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.47429001331329346, |
| "step": 1010, |
| "valid_targets_mean": 4692.7, |
| "valid_targets_min": 418 |
| }, |
| { |
| "epoch": 1.624, |
| "grad_norm": 0.536446225642749, |
| "learning_rate": 3.417369974615615e-05, |
| "loss": 0.4739, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.44192248582839966, |
| "step": 1015, |
| "valid_targets_mean": 4533.6, |
| "valid_targets_min": 748 |
| }, |
| { |
| "epoch": 1.6320000000000001, |
| "grad_norm": 0.654586453788874, |
| "learning_rate": 3.409465710248074e-05, |
| "loss": 0.4511, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.4620225727558136, |
| "step": 1020, |
| "valid_targets_mean": 3155.8, |
| "valid_targets_min": 497 |
| }, |
| { |
| "epoch": 1.6400000000000001, |
| "grad_norm": 0.6885658704413448, |
| "learning_rate": 3.401517465143119e-05, |
| "loss": 0.4594, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.47382691502571106, |
| "step": 1025, |
| "valid_targets_mean": 2903.8, |
| "valid_targets_min": 511 |
| }, |
| { |
| "epoch": 1.6480000000000001, |
| "grad_norm": 0.5838313777450732, |
| "learning_rate": 3.393525487316489e-05, |
| "loss": 0.4802, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.4386270344257355, |
| "step": 1030, |
| "valid_targets_mean": 3802.1, |
| "valid_targets_min": 917 |
| }, |
| { |
| "epoch": 1.6560000000000001, |
| "grad_norm": 0.5475012361833616, |
| "learning_rate": 3.385490026148554e-05, |
| "loss": 0.4882, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.47070324420928955, |
| "step": 1035, |
| "valid_targets_mean": 4426.2, |
| "valid_targets_min": 556 |
| }, |
| { |
| "epoch": 1.6640000000000001, |
| "grad_norm": 0.5825446614405908, |
| "learning_rate": 3.377411332376529e-05, |
| "loss": 0.4871, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.49477773904800415, |
| "step": 1040, |
| "valid_targets_mean": 3675.8, |
| "valid_targets_min": 693 |
| }, |
| { |
| "epoch": 1.6720000000000002, |
| "grad_norm": 0.5522875927498029, |
| "learning_rate": 3.369289658086651e-05, |
| "loss": 0.4774, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.4486830234527588, |
| "step": 1045, |
| "valid_targets_mean": 4307.8, |
| "valid_targets_min": 513 |
| }, |
| { |
| "epoch": 1.6800000000000002, |
| "grad_norm": 0.5439529345170723, |
| "learning_rate": 3.3611252567063184e-05, |
| "loss": 0.4639, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.4867696166038513, |
| "step": 1050, |
| "valid_targets_mean": 4714.7, |
| "valid_targets_min": 860 |
| }, |
| { |
| "epoch": 1.688, |
| "grad_norm": 0.753150960893063, |
| "learning_rate": 3.352918382996174e-05, |
| "loss": 0.4951, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.5364462733268738, |
| "step": 1055, |
| "valid_targets_mean": 3034.1, |
| "valid_targets_min": 622 |
| }, |
| { |
| "epoch": 1.696, |
| "grad_norm": 0.5840969444722356, |
| "learning_rate": 3.344669293042163e-05, |
| "loss": 0.4687, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.5160173177719116, |
| "step": 1060, |
| "valid_targets_mean": 4426.8, |
| "valid_targets_min": 785 |
| }, |
| { |
| "epoch": 1.704, |
| "grad_norm": 0.6291215602430366, |
| "learning_rate": 3.336378244247539e-05, |
| "loss": 0.4774, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.48828327655792236, |
| "step": 1065, |
| "valid_targets_mean": 3159.0, |
| "valid_targets_min": 579 |
| }, |
| { |
| "epoch": 1.712, |
| "grad_norm": 0.7157439156221113, |
| "learning_rate": 3.3280454953248326e-05, |
| "loss": 0.4719, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.46565982699394226, |
| "step": 1070, |
| "valid_targets_mean": 2837.4, |
| "valid_targets_min": 479 |
| }, |
| { |
| "epoch": 1.72, |
| "grad_norm": 0.8834848909249748, |
| "learning_rate": 3.3196713062877765e-05, |
| "loss": 0.4555, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.47797664999961853, |
| "step": 1075, |
| "valid_targets_mean": 2625.6, |
| "valid_targets_min": 588 |
| }, |
| { |
| "epoch": 1.728, |
| "grad_norm": 0.47069533464521623, |
| "learning_rate": 3.311255938443196e-05, |
| "loss": 0.467, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.4377485513687134, |
| "step": 1080, |
| "valid_targets_mean": 5656.1, |
| "valid_targets_min": 735 |
| }, |
| { |
| "epoch": 1.736, |
| "grad_norm": 0.5994529019656026, |
| "learning_rate": 3.3027996543828524e-05, |
| "loss": 0.4708, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.5046743154525757, |
| "step": 1085, |
| "valid_targets_mean": 3614.6, |
| "valid_targets_min": 619 |
| }, |
| { |
| "epoch": 1.744, |
| "grad_norm": 0.6262011025182842, |
| "learning_rate": 3.2943027179752494e-05, |
| "loss": 0.4717, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.4625643789768219, |
| "step": 1090, |
| "valid_targets_mean": 4390.8, |
| "valid_targets_min": 701 |
| }, |
| { |
| "epoch": 1.752, |
| "grad_norm": 0.505027541492022, |
| "learning_rate": 3.285765394357401e-05, |
| "loss": 0.4815, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.46330204606056213, |
| "step": 1095, |
| "valid_targets_mean": 5306.1, |
| "valid_targets_min": 661 |
| }, |
| { |
| "epoch": 1.76, |
| "grad_norm": 0.514752245979312, |
| "learning_rate": 3.277187949926556e-05, |
| "loss": 0.4531, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.41437840461730957, |
| "step": 1100, |
| "valid_targets_mean": 6349.6, |
| "valid_targets_min": 759 |
| }, |
| { |
| "epoch": 1.768, |
| "grad_norm": 0.5757785700580377, |
| "learning_rate": 3.268570652331888e-05, |
| "loss": 0.4744, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.43744391202926636, |
| "step": 1105, |
| "valid_targets_mean": 3915.2, |
| "valid_targets_min": 686 |
| }, |
| { |
| "epoch": 1.776, |
| "grad_norm": 0.5909523847823849, |
| "learning_rate": 3.2599137704661405e-05, |
| "loss": 0.4395, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.46480992436408997, |
| "step": 1110, |
| "valid_targets_mean": 3621.0, |
| "valid_targets_min": 468 |
| }, |
| { |
| "epoch": 1.784, |
| "grad_norm": 0.6522784519010079, |
| "learning_rate": 3.251217574457239e-05, |
| "loss": 0.4716, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.4484942555427551, |
| "step": 1115, |
| "valid_targets_mean": 3802.8, |
| "valid_targets_min": 686 |
| }, |
| { |
| "epoch": 1.792, |
| "grad_norm": 0.6076639765753343, |
| "learning_rate": 3.242482335659861e-05, |
| "loss": 0.4756, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.41383862495422363, |
| "step": 1120, |
| "valid_targets_mean": 3632.5, |
| "valid_targets_min": 737 |
| }, |
| { |
| "epoch": 1.8, |
| "grad_norm": 1.4930741994185592, |
| "learning_rate": 3.2337083266469687e-05, |
| "loss": 0.4672, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.49689725041389465, |
| "step": 1125, |
| "valid_targets_mean": 4094.2, |
| "valid_targets_min": 918 |
| }, |
| { |
| "epoch": 1.808, |
| "grad_norm": 0.5983765842540781, |
| "learning_rate": 3.224895821201304e-05, |
| "loss": 0.4772, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.43095701932907104, |
| "step": 1130, |
| "valid_targets_mean": 3158.9, |
| "valid_targets_min": 505 |
| }, |
| { |
| "epoch": 1.8159999999999998, |
| "grad_norm": 0.7377527167711196, |
| "learning_rate": 3.2160450943068446e-05, |
| "loss": 0.494, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.4552053213119507, |
| "step": 1135, |
| "valid_targets_mean": 3169.7, |
| "valid_targets_min": 615 |
| }, |
| { |
| "epoch": 1.8239999999999998, |
| "grad_norm": 0.48209247220176665, |
| "learning_rate": 3.207156422140225e-05, |
| "loss": 0.4665, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.40306127071380615, |
| "step": 1140, |
| "valid_targets_mean": 5754.3, |
| "valid_targets_min": 633 |
| }, |
| { |
| "epoch": 1.8319999999999999, |
| "grad_norm": 0.6434012245459063, |
| "learning_rate": 3.198230082062115e-05, |
| "loss": 0.4792, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.4668983817100525, |
| "step": 1145, |
| "valid_targets_mean": 3197.2, |
| "valid_targets_min": 538 |
| }, |
| { |
| "epoch": 1.8399999999999999, |
| "grad_norm": 0.6995497102738215, |
| "learning_rate": 3.189266352608574e-05, |
| "loss": 0.4839, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.5054548978805542, |
| "step": 1150, |
| "valid_targets_mean": 2973.6, |
| "valid_targets_min": 614 |
| }, |
| { |
| "epoch": 1.8479999999999999, |
| "grad_norm": 0.569099812286609, |
| "learning_rate": 3.180265513482345e-05, |
| "loss": 0.4843, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.5099635720252991, |
| "step": 1155, |
| "valid_targets_mean": 4445.8, |
| "valid_targets_min": 1057 |
| }, |
| { |
| "epoch": 1.8559999999999999, |
| "grad_norm": 0.7118854281438147, |
| "learning_rate": 3.171227845544143e-05, |
| "loss": 0.5015, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.5411723852157593, |
| "step": 1160, |
| "valid_targets_mean": 3062.9, |
| "valid_targets_min": 1004 |
| }, |
| { |
| "epoch": 1.8639999999999999, |
| "grad_norm": 0.4667067376045219, |
| "learning_rate": 3.162153630803877e-05, |
| "loss": 0.4776, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.42969876527786255, |
| "step": 1165, |
| "valid_targets_mean": 6657.2, |
| "valid_targets_min": 701 |
| }, |
| { |
| "epoch": 1.8719999999999999, |
| "grad_norm": 0.5574951952526179, |
| "learning_rate": 3.153043152411861e-05, |
| "loss": 0.4466, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3883597254753113, |
| "step": 1170, |
| "valid_targets_mean": 3929.1, |
| "valid_targets_min": 714 |
| }, |
| { |
| "epoch": 1.88, |
| "grad_norm": 0.49857166985641654, |
| "learning_rate": 3.14389669464997e-05, |
| "loss": 0.4621, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.4549972712993622, |
| "step": 1175, |
| "valid_targets_mean": 5751.6, |
| "valid_targets_min": 602 |
| }, |
| { |
| "epoch": 1.888, |
| "grad_norm": 0.7211688221308987, |
| "learning_rate": 3.134714542922777e-05, |
| "loss": 0.4731, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.4644148647785187, |
| "step": 1180, |
| "valid_targets_mean": 4079.8, |
| "valid_targets_min": 539 |
| }, |
| { |
| "epoch": 1.896, |
| "grad_norm": 0.5649019306883653, |
| "learning_rate": 3.1254969837486425e-05, |
| "loss": 0.4801, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.47578728199005127, |
| "step": 1185, |
| "valid_targets_mean": 4451.9, |
| "valid_targets_min": 496 |
| }, |
| { |
| "epoch": 1.904, |
| "grad_norm": 0.8113490782507405, |
| "learning_rate": 3.116244304750774e-05, |
| "loss": 0.4841, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.49812304973602295, |
| "step": 1190, |
| "valid_targets_mean": 4256.6, |
| "valid_targets_min": 785 |
| }, |
| { |
| "epoch": 1.912, |
| "grad_norm": 0.6475596871318647, |
| "learning_rate": 3.106956794648254e-05, |
| "loss": 0.4662, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.4609223008155823, |
| "step": 1195, |
| "valid_targets_mean": 3238.9, |
| "valid_targets_min": 746 |
| }, |
| { |
| "epoch": 1.92, |
| "grad_norm": 0.5392636163279259, |
| "learning_rate": 3.097634743247026e-05, |
| "loss": 0.4366, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.4826831519603729, |
| "step": 1200, |
| "valid_targets_mean": 4662.3, |
| "valid_targets_min": 553 |
| }, |
| { |
| "epoch": 1.928, |
| "grad_norm": 0.61215815551841, |
| "learning_rate": 3.08827844143086e-05, |
| "loss": 0.4761, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.5427641868591309, |
| "step": 1205, |
| "valid_targets_mean": 4324.7, |
| "valid_targets_min": 824 |
| }, |
| { |
| "epoch": 1.936, |
| "grad_norm": 0.5987033728383583, |
| "learning_rate": 3.078888181152264e-05, |
| "loss": 0.4722, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.42406606674194336, |
| "step": 1210, |
| "valid_targets_mean": 3636.4, |
| "valid_targets_min": 684 |
| }, |
| { |
| "epoch": 1.944, |
| "grad_norm": 0.6515070925773007, |
| "learning_rate": 3.0694642554233855e-05, |
| "loss": 0.4707, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.47039297223091125, |
| "step": 1215, |
| "valid_targets_mean": 2975.4, |
| "valid_targets_min": 592 |
| }, |
| { |
| "epoch": 1.952, |
| "grad_norm": 0.5388317669629852, |
| "learning_rate": 3.0600069583068594e-05, |
| "loss": 0.4779, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.4415266513824463, |
| "step": 1220, |
| "valid_targets_mean": 4852.2, |
| "valid_targets_min": 347 |
| }, |
| { |
| "epoch": 1.96, |
| "grad_norm": 0.5138321633547656, |
| "learning_rate": 3.0505165849066394e-05, |
| "loss": 0.4681, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.4434703290462494, |
| "step": 1225, |
| "valid_targets_mean": 5056.9, |
| "valid_targets_min": 907 |
| }, |
| { |
| "epoch": 1.968, |
| "grad_norm": 0.7612326702075074, |
| "learning_rate": 3.040993431358782e-05, |
| "loss": 0.4736, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.4785926938056946, |
| "step": 1230, |
| "valid_targets_mean": 2302.5, |
| "valid_targets_min": 845 |
| }, |
| { |
| "epoch": 1.976, |
| "grad_norm": 0.7430168909983449, |
| "learning_rate": 3.031437794822215e-05, |
| "loss": 0.4701, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.46587690711021423, |
| "step": 1235, |
| "valid_targets_mean": 3480.7, |
| "valid_targets_min": 776 |
| }, |
| { |
| "epoch": 1.984, |
| "grad_norm": 0.8871840326954018, |
| "learning_rate": 3.021849973469455e-05, |
| "loss": 0.5202, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.5849260687828064, |
| "step": 1240, |
| "valid_targets_mean": 2373.0, |
| "valid_targets_min": 824 |
| }, |
| { |
| "epoch": 1.992, |
| "grad_norm": 0.8005852985566412, |
| "learning_rate": 3.012230266477313e-05, |
| "loss": 0.4786, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.5191680788993835, |
| "step": 1245, |
| "valid_targets_mean": 2152.9, |
| "valid_targets_min": 834 |
| }, |
| { |
| "epoch": 2.0, |
| "grad_norm": 1.423544343942953, |
| "learning_rate": 3.0025789740175502e-05, |
| "loss": 0.4934, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.5457210540771484, |
| "step": 1250, |
| "valid_targets_mean": 2222.7, |
| "valid_targets_min": 561 |
| }, |
| { |
| "epoch": 2.008, |
| "grad_norm": 0.5955977900794318, |
| "learning_rate": 2.9928963972475186e-05, |
| "loss": 0.4681, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.4416769742965698, |
| "step": 1255, |
| "valid_targets_mean": 4610.1, |
| "valid_targets_min": 615 |
| }, |
| { |
| "epoch": 2.016, |
| "grad_norm": 0.6090260458793183, |
| "learning_rate": 2.9831828383007585e-05, |
| "loss": 0.4479, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.4574715495109558, |
| "step": 1260, |
| "valid_targets_mean": 4182.2, |
| "valid_targets_min": 645 |
| }, |
| { |
| "epoch": 2.024, |
| "grad_norm": 0.7360060643061078, |
| "learning_rate": 2.9734386002775754e-05, |
| "loss": 0.4695, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.5532656908035278, |
| "step": 1265, |
| "valid_targets_mean": 3207.1, |
| "valid_targets_min": 512 |
| }, |
| { |
| "epoch": 2.032, |
| "grad_norm": 0.6687884359084095, |
| "learning_rate": 2.963663987235577e-05, |
| "loss": 0.4552, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.426003634929657, |
| "step": 1270, |
| "valid_targets_mean": 2995.4, |
| "valid_targets_min": 730 |
| }, |
| { |
| "epoch": 2.04, |
| "grad_norm": 0.7116484185211367, |
| "learning_rate": 2.95385930418019e-05, |
| "loss": 0.4567, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.5189186334609985, |
| "step": 1275, |
| "valid_targets_mean": 3110.1, |
| "valid_targets_min": 742 |
| }, |
| { |
| "epoch": 2.048, |
| "grad_norm": 0.7186019588818685, |
| "learning_rate": 2.9440248570551406e-05, |
| "loss": 0.4459, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.41865086555480957, |
| "step": 1280, |
| "valid_targets_mean": 3671.8, |
| "valid_targets_min": 906 |
| }, |
| { |
| "epoch": 2.056, |
| "grad_norm": 1.4747315343165368, |
| "learning_rate": 2.934160952732907e-05, |
| "loss": 0.449, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.4162527322769165, |
| "step": 1285, |
| "valid_targets_mean": 3745.3, |
| "valid_targets_min": 306 |
| }, |
| { |
| "epoch": 2.064, |
| "grad_norm": 0.6471086351380495, |
| "learning_rate": 2.9242678990051462e-05, |
| "loss": 0.4433, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.44822385907173157, |
| "step": 1290, |
| "valid_targets_mean": 4509.1, |
| "valid_targets_min": 576 |
| }, |
| { |
| "epoch": 2.072, |
| "grad_norm": 0.6346182269430595, |
| "learning_rate": 2.9143460045730886e-05, |
| "loss": 0.4487, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.48546066880226135, |
| "step": 1295, |
| "valid_targets_mean": 3940.9, |
| "valid_targets_min": 876 |
| }, |
| { |
| "epoch": 2.08, |
| "grad_norm": 2.031709545540969, |
| "learning_rate": 2.9043955790379035e-05, |
| "loss": 0.4714, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.43055105209350586, |
| "step": 1300, |
| "valid_targets_mean": 3915.9, |
| "valid_targets_min": 635 |
| }, |
| { |
| "epoch": 2.088, |
| "grad_norm": 0.6903051949163922, |
| "learning_rate": 2.8944169328910427e-05, |
| "loss": 0.446, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.48170751333236694, |
| "step": 1305, |
| "valid_targets_mean": 3417.4, |
| "valid_targets_min": 681 |
| }, |
| { |
| "epoch": 2.096, |
| "grad_norm": 0.5332653284325558, |
| "learning_rate": 2.884410377504547e-05, |
| "loss": 0.4159, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.42663711309432983, |
| "step": 1310, |
| "valid_targets_mean": 5080.2, |
| "valid_targets_min": 640 |
| }, |
| { |
| "epoch": 2.104, |
| "grad_norm": 0.602437990002518, |
| "learning_rate": 2.8743762251213333e-05, |
| "loss": 0.4508, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.47259843349456787, |
| "step": 1315, |
| "valid_targets_mean": 4112.4, |
| "valid_targets_min": 646 |
| }, |
| { |
| "epoch": 2.112, |
| "grad_norm": 0.676214101245154, |
| "learning_rate": 2.8643147888454507e-05, |
| "loss": 0.4432, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.4584727883338928, |
| "step": 1320, |
| "valid_targets_mean": 3043.8, |
| "valid_targets_min": 415 |
| }, |
| { |
| "epoch": 2.12, |
| "grad_norm": 0.7428353700968319, |
| "learning_rate": 2.854226382632312e-05, |
| "loss": 0.4713, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.5539952516555786, |
| "step": 1325, |
| "valid_targets_mean": 3083.6, |
| "valid_targets_min": 624 |
| }, |
| { |
| "epoch": 2.128, |
| "grad_norm": 0.5464368058251405, |
| "learning_rate": 2.844111321278893e-05, |
| "loss": 0.4385, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3453948497772217, |
| "step": 1330, |
| "valid_targets_mean": 3928.3, |
| "valid_targets_min": 553 |
| }, |
| { |
| "epoch": 2.136, |
| "grad_norm": 0.5772508201873505, |
| "learning_rate": 2.833969920413913e-05, |
| "loss": 0.4465, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.4165865182876587, |
| "step": 1335, |
| "valid_targets_mean": 3898.2, |
| "valid_targets_min": 480 |
| }, |
| { |
| "epoch": 2.144, |
| "grad_norm": 0.6774356448413013, |
| "learning_rate": 2.8238024964879857e-05, |
| "loss": 0.4465, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.4822053015232086, |
| "step": 1340, |
| "valid_targets_mean": 3180.1, |
| "valid_targets_min": 686 |
| }, |
| { |
| "epoch": 2.152, |
| "grad_norm": 0.654073300893228, |
| "learning_rate": 2.8136093667637438e-05, |
| "loss": 0.4496, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.4197562336921692, |
| "step": 1345, |
| "valid_targets_mean": 2752.7, |
| "valid_targets_min": 518 |
| }, |
| { |
| "epoch": 2.16, |
| "grad_norm": 0.7260228311473961, |
| "learning_rate": 2.8033908493059394e-05, |
| "loss": 0.4643, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.4236224591732025, |
| "step": 1350, |
| "valid_targets_mean": 3862.9, |
| "valid_targets_min": 977 |
| }, |
| { |
| "epoch": 2.168, |
| "grad_norm": 0.5308213424796718, |
| "learning_rate": 2.793147262971519e-05, |
| "loss": 0.4484, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.4658902883529663, |
| "step": 1355, |
| "valid_targets_mean": 5550.6, |
| "valid_targets_min": 763 |
| }, |
| { |
| "epoch": 2.176, |
| "grad_norm": 0.5816937352471572, |
| "learning_rate": 2.7828789273996748e-05, |
| "loss": 0.4431, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.414844274520874, |
| "step": 1360, |
| "valid_targets_mean": 4192.6, |
| "valid_targets_min": 643 |
| }, |
| { |
| "epoch": 2.184, |
| "grad_norm": 0.6690509201863886, |
| "learning_rate": 2.7725861630018703e-05, |
| "loss": 0.4441, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.41888707876205444, |
| "step": 1365, |
| "valid_targets_mean": 3258.7, |
| "valid_targets_min": 857 |
| }, |
| { |
| "epoch": 2.192, |
| "grad_norm": 0.5315576725263342, |
| "learning_rate": 2.7622692909518423e-05, |
| "loss": 0.4088, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.4389989376068115, |
| "step": 1370, |
| "valid_targets_mean": 5194.4, |
| "valid_targets_min": 651 |
| }, |
| { |
| "epoch": 2.2, |
| "grad_norm": 0.43861560505715885, |
| "learning_rate": 2.7519286331755766e-05, |
| "loss": 0.4343, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.36606454849243164, |
| "step": 1375, |
| "valid_targets_mean": 7803.1, |
| "valid_targets_min": 915 |
| }, |
| { |
| "epoch": 2.208, |
| "grad_norm": 0.6860438916170236, |
| "learning_rate": 2.7415645123412672e-05, |
| "loss": 0.4345, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.4727722704410553, |
| "step": 1380, |
| "valid_targets_mean": 3681.9, |
| "valid_targets_min": 354 |
| }, |
| { |
| "epoch": 2.216, |
| "grad_norm": 0.6233752088365587, |
| "learning_rate": 2.731177251849246e-05, |
| "loss": 0.4469, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.45124104619026184, |
| "step": 1385, |
| "valid_targets_mean": 3928.4, |
| "valid_targets_min": 409 |
| }, |
| { |
| "epoch": 2.224, |
| "grad_norm": 0.7054017714889622, |
| "learning_rate": 2.7207671758218884e-05, |
| "loss": 0.4511, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.5190399885177612, |
| "step": 1390, |
| "valid_targets_mean": 3278.7, |
| "valid_targets_min": 668 |
| }, |
| { |
| "epoch": 2.232, |
| "grad_norm": 0.5481452159873532, |
| "learning_rate": 2.710334609093504e-05, |
| "loss": 0.4338, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.40331241488456726, |
| "step": 1395, |
| "valid_targets_mean": 4237.9, |
| "valid_targets_min": 929 |
| }, |
| { |
| "epoch": 2.24, |
| "grad_norm": 0.5209483042162194, |
| "learning_rate": 2.699879877200198e-05, |
| "loss": 0.4247, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.367615282535553, |
| "step": 1400, |
| "valid_targets_mean": 4907.4, |
| "valid_targets_min": 718 |
| }, |
| { |
| "epoch": 2.248, |
| "grad_norm": 0.6180610305765888, |
| "learning_rate": 2.6894033063697143e-05, |
| "loss": 0.4649, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.4836103916168213, |
| "step": 1405, |
| "valid_targets_mean": 4520.9, |
| "valid_targets_min": 778 |
| }, |
| { |
| "epoch": 2.2560000000000002, |
| "grad_norm": 0.624263121954133, |
| "learning_rate": 2.6789052235112554e-05, |
| "loss": 0.4516, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.4151955544948578, |
| "step": 1410, |
| "valid_targets_mean": 3549.2, |
| "valid_targets_min": 739 |
| }, |
| { |
| "epoch": 2.2640000000000002, |
| "grad_norm": 0.5255415368728256, |
| "learning_rate": 2.66838595620528e-05, |
| "loss": 0.4243, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.4413053095340729, |
| "step": 1415, |
| "valid_targets_mean": 5782.1, |
| "valid_targets_min": 655 |
| }, |
| { |
| "epoch": 2.2720000000000002, |
| "grad_norm": 0.6397618135971025, |
| "learning_rate": 2.6578458326932842e-05, |
| "loss": 0.4536, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.44738149642944336, |
| "step": 1420, |
| "valid_targets_mean": 3827.2, |
| "valid_targets_min": 505 |
| }, |
| { |
| "epoch": 2.2800000000000002, |
| "grad_norm": 0.7085382486155277, |
| "learning_rate": 2.6472851818675583e-05, |
| "loss": 0.4633, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.4663681387901306, |
| "step": 1425, |
| "valid_targets_mean": 2644.9, |
| "valid_targets_min": 646 |
| }, |
| { |
| "epoch": 2.288, |
| "grad_norm": 0.9979890243748089, |
| "learning_rate": 2.6367043332609223e-05, |
| "loss": 0.4459, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.4871729016304016, |
| "step": 1430, |
| "valid_targets_mean": 1448.7, |
| "valid_targets_min": 744 |
| }, |
| { |
| "epoch": 2.296, |
| "grad_norm": 0.5174927037809555, |
| "learning_rate": 2.6261036170364448e-05, |
| "loss": 0.4251, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.43367236852645874, |
| "step": 1435, |
| "valid_targets_mean": 5433.6, |
| "valid_targets_min": 783 |
| }, |
| { |
| "epoch": 2.304, |
| "grad_norm": 0.5663046987401196, |
| "learning_rate": 2.6154833639771415e-05, |
| "loss": 0.4422, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.46524518728256226, |
| "step": 1440, |
| "valid_targets_mean": 5141.4, |
| "valid_targets_min": 730 |
| }, |
| { |
| "epoch": 2.312, |
| "grad_norm": 0.5337110127394135, |
| "learning_rate": 2.6048439054756492e-05, |
| "loss": 0.4463, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.4362761676311493, |
| "step": 1445, |
| "valid_targets_mean": 5409.9, |
| "valid_targets_min": 1159 |
| }, |
| { |
| "epoch": 2.32, |
| "grad_norm": 0.5463782845574509, |
| "learning_rate": 2.594185573523892e-05, |
| "loss": 0.4565, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.45417675375938416, |
| "step": 1450, |
| "valid_targets_mean": 4838.8, |
| "valid_targets_min": 619 |
| }, |
| { |
| "epoch": 2.328, |
| "grad_norm": 0.6942365338980392, |
| "learning_rate": 2.583508700702716e-05, |
| "loss": 0.4481, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.4617985486984253, |
| "step": 1455, |
| "valid_targets_mean": 2802.6, |
| "valid_targets_min": 1014 |
| }, |
| { |
| "epoch": 2.336, |
| "grad_norm": 0.6070000633127984, |
| "learning_rate": 2.572813620171513e-05, |
| "loss": 0.4513, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.42797911167144775, |
| "step": 1460, |
| "valid_targets_mean": 3719.3, |
| "valid_targets_min": 635 |
| }, |
| { |
| "epoch": 2.344, |
| "grad_norm": 0.4753849685324334, |
| "learning_rate": 2.5621006656578267e-05, |
| "loss": 0.4213, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3997453451156616, |
| "step": 1465, |
| "valid_targets_mean": 5544.6, |
| "valid_targets_min": 823 |
| }, |
| { |
| "epoch": 2.352, |
| "grad_norm": 0.5989976974737479, |
| "learning_rate": 2.5513701714469373e-05, |
| "loss": 0.4413, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.4619044363498688, |
| "step": 1470, |
| "valid_targets_mean": 4001.4, |
| "valid_targets_min": 672 |
| }, |
| { |
| "epoch": 2.36, |
| "grad_norm": 0.5487842792272467, |
| "learning_rate": 2.540622472371429e-05, |
| "loss": 0.4343, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.4185061454772949, |
| "step": 1475, |
| "valid_targets_mean": 4278.5, |
| "valid_targets_min": 426 |
| }, |
| { |
| "epoch": 2.368, |
| "grad_norm": 0.4402218121898237, |
| "learning_rate": 2.5298579038007478e-05, |
| "loss": 0.4342, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3919063210487366, |
| "step": 1480, |
| "valid_targets_mean": 6910.7, |
| "valid_targets_min": 815 |
| }, |
| { |
| "epoch": 2.376, |
| "grad_norm": 0.7373247521439833, |
| "learning_rate": 2.519076801630727e-05, |
| "loss": 0.4723, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.5013588070869446, |
| "step": 1485, |
| "valid_targets_mean": 2875.9, |
| "valid_targets_min": 658 |
| }, |
| { |
| "epoch": 2.384, |
| "grad_norm": 0.556610693165223, |
| "learning_rate": 2.508279502273117e-05, |
| "loss": 0.4419, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.43320780992507935, |
| "step": 1490, |
| "valid_targets_mean": 5407.4, |
| "valid_targets_min": 836 |
| }, |
| { |
| "epoch": 2.392, |
| "grad_norm": 0.5098627681422288, |
| "learning_rate": 2.4974663426450798e-05, |
| "loss": 0.4392, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.4344981908798218, |
| "step": 1495, |
| "valid_targets_mean": 5123.3, |
| "valid_targets_min": 601 |
| }, |
| { |
| "epoch": 2.4, |
| "grad_norm": 0.5039771982978674, |
| "learning_rate": 2.4866376601586798e-05, |
| "loss": 0.4464, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.4104907810688019, |
| "step": 1500, |
| "valid_targets_mean": 5579.6, |
| "valid_targets_min": 754 |
| }, |
| { |
| "epoch": 2.408, |
| "grad_norm": 0.5096044181569787, |
| "learning_rate": 2.475793792710352e-05, |
| "loss": 0.4174, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.4063170552253723, |
| "step": 1505, |
| "valid_targets_mean": 5081.4, |
| "valid_targets_min": 488 |
| }, |
| { |
| "epoch": 2.416, |
| "grad_norm": 0.7479128529316125, |
| "learning_rate": 2.4649350786703637e-05, |
| "loss": 0.448, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.47363007068634033, |
| "step": 1510, |
| "valid_targets_mean": 2561.8, |
| "valid_targets_min": 708 |
| }, |
| { |
| "epoch": 2.424, |
| "grad_norm": 0.5885671758624585, |
| "learning_rate": 2.45406185687225e-05, |
| "loss": 0.4514, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.44971561431884766, |
| "step": 1515, |
| "valid_targets_mean": 4042.2, |
| "valid_targets_min": 678 |
| }, |
| { |
| "epoch": 2.432, |
| "grad_norm": 0.5915561518938581, |
| "learning_rate": 2.443174466602246e-05, |
| "loss": 0.4559, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.4462353587150574, |
| "step": 1520, |
| "valid_targets_mean": 3938.5, |
| "valid_targets_min": 765 |
| }, |
| { |
| "epoch": 2.44, |
| "grad_norm": 0.663840439463274, |
| "learning_rate": 2.4322732475886953e-05, |
| "loss": 0.4457, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.426447331905365, |
| "step": 1525, |
| "valid_targets_mean": 2940.4, |
| "valid_targets_min": 494 |
| }, |
| { |
| "epoch": 2.448, |
| "grad_norm": 0.5258251709290092, |
| "learning_rate": 2.4213585399914528e-05, |
| "loss": 0.4099, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.4359118640422821, |
| "step": 1530, |
| "valid_targets_mean": 4996.3, |
| "valid_targets_min": 832 |
| }, |
| { |
| "epoch": 2.456, |
| "grad_norm": 0.5279872310300597, |
| "learning_rate": 2.4104306843912687e-05, |
| "loss": 0.4368, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.4399365186691284, |
| "step": 1535, |
| "valid_targets_mean": 5331.9, |
| "valid_targets_min": 521 |
| }, |
| { |
| "epoch": 2.464, |
| "grad_norm": 0.5035482920980331, |
| "learning_rate": 2.3994900217791615e-05, |
| "loss": 0.4564, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.4546802341938019, |
| "step": 1540, |
| "valid_targets_mean": 6091.1, |
| "valid_targets_min": 553 |
| }, |
| { |
| "epoch": 2.472, |
| "grad_norm": 0.5503280071758032, |
| "learning_rate": 2.3885368935457762e-05, |
| "loss": 0.4442, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.38341644406318665, |
| "step": 1545, |
| "valid_targets_mean": 4704.2, |
| "valid_targets_min": 534 |
| }, |
| { |
| "epoch": 2.48, |
| "grad_norm": 0.5122727644758672, |
| "learning_rate": 2.3775716414707355e-05, |
| "loss": 0.4236, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.39771783351898193, |
| "step": 1550, |
| "valid_targets_mean": 5978.4, |
| "valid_targets_min": 737 |
| }, |
| { |
| "epoch": 2.488, |
| "grad_norm": 0.577359891725372, |
| "learning_rate": 2.36659460771197e-05, |
| "loss": 0.4408, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.426598459482193, |
| "step": 1555, |
| "valid_targets_mean": 4298.5, |
| "valid_targets_min": 758 |
| }, |
| { |
| "epoch": 2.496, |
| "grad_norm": 0.534664454111424, |
| "learning_rate": 2.3556061347950455e-05, |
| "loss": 0.422, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.41438737511634827, |
| "step": 1560, |
| "valid_targets_mean": 4637.9, |
| "valid_targets_min": 1024 |
| }, |
| { |
| "epoch": 2.504, |
| "grad_norm": 0.742643154280012, |
| "learning_rate": 2.3446065656024734e-05, |
| "loss": 0.4412, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.45946621894836426, |
| "step": 1565, |
| "valid_targets_mean": 2557.0, |
| "valid_targets_min": 568 |
| }, |
| { |
| "epoch": 2.512, |
| "grad_norm": 0.5946087395842765, |
| "learning_rate": 2.33359624336301e-05, |
| "loss": 0.4429, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.44135582447052, |
| "step": 1570, |
| "valid_targets_mean": 3980.1, |
| "valid_targets_min": 614 |
| }, |
| { |
| "epoch": 2.52, |
| "grad_norm": 0.7692556639202142, |
| "learning_rate": 2.3225755116409497e-05, |
| "loss": 0.4855, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.49565717577934265, |
| "step": 1575, |
| "valid_targets_mean": 2437.8, |
| "valid_targets_min": 702 |
| }, |
| { |
| "epoch": 2.528, |
| "grad_norm": 0.6518050042070153, |
| "learning_rate": 2.311544714325403e-05, |
| "loss": 0.4278, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.4329824149608612, |
| "step": 1580, |
| "valid_targets_mean": 3308.9, |
| "valid_targets_min": 837 |
| }, |
| { |
| "epoch": 2.536, |
| "grad_norm": 0.7001492648412008, |
| "learning_rate": 2.300504195619563e-05, |
| "loss": 0.4865, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.47200626134872437, |
| "step": 1585, |
| "valid_targets_mean": 3019.2, |
| "valid_targets_min": 723 |
| }, |
| { |
| "epoch": 2.544, |
| "grad_norm": 0.5775943044286223, |
| "learning_rate": 2.2894543000299697e-05, |
| "loss": 0.4546, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.4556680917739868, |
| "step": 1590, |
| "valid_targets_mean": 4622.2, |
| "valid_targets_min": 746 |
| }, |
| { |
| "epoch": 2.552, |
| "grad_norm": 0.6300239166139451, |
| "learning_rate": 2.2783953723557572e-05, |
| "loss": 0.4442, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.47904396057128906, |
| "step": 1595, |
| "valid_targets_mean": 3739.5, |
| "valid_targets_min": 691 |
| }, |
| { |
| "epoch": 2.56, |
| "grad_norm": 0.5521871360992379, |
| "learning_rate": 2.2673277576778946e-05, |
| "loss": 0.4353, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.4208674728870392, |
| "step": 1600, |
| "valid_targets_mean": 4564.6, |
| "valid_targets_min": 555 |
| }, |
| { |
| "epoch": 2.568, |
| "grad_norm": 0.6820540018619283, |
| "learning_rate": 2.2562518013484208e-05, |
| "loss": 0.4273, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.40282294154167175, |
| "step": 1605, |
| "valid_targets_mean": 2706.5, |
| "valid_targets_min": 797 |
| }, |
| { |
| "epoch": 2.576, |
| "grad_norm": 0.6077922915119577, |
| "learning_rate": 2.245167848979664e-05, |
| "loss": 0.4142, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.42859092354774475, |
| "step": 1610, |
| "valid_targets_mean": 3625.1, |
| "valid_targets_min": 509 |
| }, |
| { |
| "epoch": 2.584, |
| "grad_norm": 0.5854962148493413, |
| "learning_rate": 2.23407624643346e-05, |
| "loss": 0.4648, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.42316490411758423, |
| "step": 1615, |
| "valid_targets_mean": 4010.8, |
| "valid_targets_min": 713 |
| }, |
| { |
| "epoch": 2.592, |
| "grad_norm": 0.544244197674275, |
| "learning_rate": 2.2229773398103606e-05, |
| "loss": 0.4167, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.40714818239212036, |
| "step": 1620, |
| "valid_targets_mean": 4601.6, |
| "valid_targets_min": 847 |
| }, |
| { |
| "epoch": 2.6, |
| "grad_norm": 0.7315101815116987, |
| "learning_rate": 2.2118714754388323e-05, |
| "loss": 0.4689, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.4557625651359558, |
| "step": 1625, |
| "valid_targets_mean": 2673.6, |
| "valid_targets_min": 627 |
| }, |
| { |
| "epoch": 2.608, |
| "grad_norm": 0.6392348215128343, |
| "learning_rate": 2.200758999864449e-05, |
| "loss": 0.4095, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.41079527139663696, |
| "step": 1630, |
| "valid_targets_mean": 3180.8, |
| "valid_targets_min": 492 |
| }, |
| { |
| "epoch": 2.616, |
| "grad_norm": 0.553837921244433, |
| "learning_rate": 2.1896402598390818e-05, |
| "loss": 0.419, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3827151358127594, |
| "step": 1635, |
| "valid_targets_mean": 4638.4, |
| "valid_targets_min": 616 |
| }, |
| { |
| "epoch": 2.624, |
| "grad_norm": 0.5193517813868557, |
| "learning_rate": 2.178515602310074e-05, |
| "loss": 0.4533, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.40580642223358154, |
| "step": 1640, |
| "valid_targets_mean": 4868.9, |
| "valid_targets_min": 799 |
| }, |
| { |
| "epoch": 2.632, |
| "grad_norm": 0.6317219989613208, |
| "learning_rate": 2.1673853744094193e-05, |
| "loss": 0.4467, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.4618436098098755, |
| "step": 1645, |
| "valid_targets_mean": 3528.4, |
| "valid_targets_min": 583 |
| }, |
| { |
| "epoch": 2.64, |
| "grad_norm": 0.8058706372384056, |
| "learning_rate": 2.1562499234429283e-05, |
| "loss": 0.4757, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.4898325800895691, |
| "step": 1650, |
| "valid_targets_mean": 2231.3, |
| "valid_targets_min": 507 |
| }, |
| { |
| "epoch": 2.648, |
| "grad_norm": 0.7352262306367001, |
| "learning_rate": 2.1451095968793908e-05, |
| "loss": 0.4389, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.46522995829582214, |
| "step": 1655, |
| "valid_targets_mean": 3700.2, |
| "valid_targets_min": 542 |
| }, |
| { |
| "epoch": 2.656, |
| "grad_norm": 0.6500232390169828, |
| "learning_rate": 2.1339647423397337e-05, |
| "loss": 0.4385, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.4323245882987976, |
| "step": 1660, |
| "valid_targets_mean": 3278.4, |
| "valid_targets_min": 774 |
| }, |
| { |
| "epoch": 2.664, |
| "grad_norm": 0.6031196836473796, |
| "learning_rate": 2.122815707586176e-05, |
| "loss": 0.4358, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.4227977991104126, |
| "step": 1665, |
| "valid_targets_mean": 3835.8, |
| "valid_targets_min": 517 |
| }, |
| { |
| "epoch": 2.672, |
| "grad_norm": 0.5631354627031511, |
| "learning_rate": 2.111662840511373e-05, |
| "loss": 0.4372, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.40425512194633484, |
| "step": 1670, |
| "valid_targets_mean": 4473.6, |
| "valid_targets_min": 591 |
| }, |
| { |
| "epoch": 2.68, |
| "grad_norm": 0.6281174285703458, |
| "learning_rate": 2.1005064891275638e-05, |
| "loss": 0.4534, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.4625401496887207, |
| "step": 1675, |
| "valid_targets_mean": 3325.9, |
| "valid_targets_min": 618 |
| }, |
| { |
| "epoch": 2.6879999999999997, |
| "grad_norm": 0.5324007779451334, |
| "learning_rate": 2.0893470015557126e-05, |
| "loss": 0.4137, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3770933151245117, |
| "step": 1680, |
| "valid_targets_mean": 4407.2, |
| "valid_targets_min": 854 |
| }, |
| { |
| "epoch": 2.6959999999999997, |
| "grad_norm": 0.5704221627115216, |
| "learning_rate": 2.078184726014643e-05, |
| "loss": 0.4524, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.4448625445365906, |
| "step": 1685, |
| "valid_targets_mean": 4212.2, |
| "valid_targets_min": 669 |
| }, |
| { |
| "epoch": 2.7039999999999997, |
| "grad_norm": 0.5813144458895672, |
| "learning_rate": 2.0670200108101754e-05, |
| "loss": 0.4548, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.4791436195373535, |
| "step": 1690, |
| "valid_targets_mean": 4126.9, |
| "valid_targets_min": 473 |
| }, |
| { |
| "epoch": 2.7119999999999997, |
| "grad_norm": 0.8782653466918007, |
| "learning_rate": 2.0558532043242557e-05, |
| "loss": 0.464, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.453347384929657, |
| "step": 1695, |
| "valid_targets_mean": 1782.1, |
| "valid_targets_min": 564 |
| }, |
| { |
| "epoch": 2.7199999999999998, |
| "grad_norm": 0.5583160859664104, |
| "learning_rate": 2.0446846550040863e-05, |
| "loss": 0.428, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.4322124719619751, |
| "step": 1700, |
| "valid_targets_mean": 4821.1, |
| "valid_targets_min": 669 |
| }, |
| { |
| "epoch": 2.7279999999999998, |
| "grad_norm": 0.5277977577152152, |
| "learning_rate": 2.033514711351253e-05, |
| "loss": 0.4315, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.42123162746429443, |
| "step": 1705, |
| "valid_targets_mean": 5344.1, |
| "valid_targets_min": 709 |
| }, |
| { |
| "epoch": 2.7359999999999998, |
| "grad_norm": 0.498988724319745, |
| "learning_rate": 2.022343721910851e-05, |
| "loss": 0.4515, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.44440481066703796, |
| "step": 1710, |
| "valid_targets_mean": 6055.7, |
| "valid_targets_min": 701 |
| }, |
| { |
| "epoch": 2.7439999999999998, |
| "grad_norm": 0.5688318880815759, |
| "learning_rate": 2.0111720352606054e-05, |
| "loss": 0.4293, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.4387132227420807, |
| "step": 1715, |
| "valid_targets_mean": 4293.4, |
| "valid_targets_min": 1000 |
| }, |
| { |
| "epoch": 2.752, |
| "grad_norm": 0.5541189383448685, |
| "learning_rate": 2e-05, |
| "loss": 0.4345, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.42854511737823486, |
| "step": 1720, |
| "valid_targets_mean": 4060.4, |
| "valid_targets_min": 1006 |
| }, |
| { |
| "epoch": 2.76, |
| "grad_norm": 0.5636891444562256, |
| "learning_rate": 1.988827964739395e-05, |
| "loss": 0.4569, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.4016704559326172, |
| "step": 1725, |
| "valid_targets_mean": 4026.6, |
| "valid_targets_min": 556 |
| }, |
| { |
| "epoch": 2.768, |
| "grad_norm": 0.5707069098467574, |
| "learning_rate": 1.9776562780891494e-05, |
| "loss": 0.4277, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3943563997745514, |
| "step": 1730, |
| "valid_targets_mean": 3987.3, |
| "valid_targets_min": 769 |
| }, |
| { |
| "epoch": 2.776, |
| "grad_norm": 0.46274734962368136, |
| "learning_rate": 1.966485288648747e-05, |
| "loss": 0.4408, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.38267430663108826, |
| "step": 1735, |
| "valid_targets_mean": 6487.2, |
| "valid_targets_min": 785 |
| }, |
| { |
| "epoch": 2.784, |
| "grad_norm": 0.5235450558438844, |
| "learning_rate": 1.9553153449959144e-05, |
| "loss": 0.4465, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.40462425351142883, |
| "step": 1740, |
| "valid_targets_mean": 4937.6, |
| "valid_targets_min": 741 |
| }, |
| { |
| "epoch": 2.792, |
| "grad_norm": 0.4835906686418437, |
| "learning_rate": 1.9441467956757453e-05, |
| "loss": 0.4716, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.4714353680610657, |
| "step": 1745, |
| "valid_targets_mean": 6360.5, |
| "valid_targets_min": 654 |
| }, |
| { |
| "epoch": 2.8, |
| "grad_norm": 0.5100225254528137, |
| "learning_rate": 1.9329799891898256e-05, |
| "loss": 0.4314, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.4558408260345459, |
| "step": 1750, |
| "valid_targets_mean": 5252.3, |
| "valid_targets_min": 707 |
| }, |
| { |
| "epoch": 2.808, |
| "grad_norm": 0.7039108297346979, |
| "learning_rate": 1.9218152739853576e-05, |
| "loss": 0.4289, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3978843688964844, |
| "step": 1755, |
| "valid_targets_mean": 4321.9, |
| "valid_targets_min": 725 |
| }, |
| { |
| "epoch": 2.816, |
| "grad_norm": 0.5642168770075947, |
| "learning_rate": 1.9106529984442884e-05, |
| "loss": 0.4398, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.45182371139526367, |
| "step": 1760, |
| "valid_targets_mean": 4244.4, |
| "valid_targets_min": 552 |
| }, |
| { |
| "epoch": 2.824, |
| "grad_norm": 0.6525684551205236, |
| "learning_rate": 1.8994935108724366e-05, |
| "loss": 0.4521, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.4625537395477295, |
| "step": 1765, |
| "valid_targets_mean": 3384.4, |
| "valid_targets_min": 838 |
| }, |
| { |
| "epoch": 2.832, |
| "grad_norm": 0.5604654454033197, |
| "learning_rate": 1.8883371594886276e-05, |
| "loss": 0.4497, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.4158444404602051, |
| "step": 1770, |
| "valid_targets_mean": 5318.2, |
| "valid_targets_min": 598 |
| }, |
| { |
| "epoch": 2.84, |
| "grad_norm": 0.7805033021518426, |
| "learning_rate": 1.877184292413824e-05, |
| "loss": 0.4403, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.46476149559020996, |
| "step": 1775, |
| "valid_targets_mean": 2218.4, |
| "valid_targets_min": 762 |
| }, |
| { |
| "epoch": 2.848, |
| "grad_norm": 0.632248312453592, |
| "learning_rate": 1.8660352576602663e-05, |
| "loss": 0.4715, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.4902727007865906, |
| "step": 1780, |
| "valid_targets_mean": 4020.6, |
| "valid_targets_min": 848 |
| }, |
| { |
| "epoch": 2.856, |
| "grad_norm": 0.8500750674610906, |
| "learning_rate": 1.8548904031206102e-05, |
| "loss": 0.4558, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.5282151103019714, |
| "step": 1785, |
| "valid_targets_mean": 2049.2, |
| "valid_targets_min": 489 |
| }, |
| { |
| "epoch": 2.864, |
| "grad_norm": 0.5478175008230401, |
| "learning_rate": 1.843750076557072e-05, |
| "loss": 0.4351, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.4625953137874603, |
| "step": 1790, |
| "valid_targets_mean": 4885.2, |
| "valid_targets_min": 506 |
| }, |
| { |
| "epoch": 2.872, |
| "grad_norm": 0.6244527229546376, |
| "learning_rate": 1.832614625590581e-05, |
| "loss": 0.4246, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.43290358781814575, |
| "step": 1795, |
| "valid_targets_mean": 3414.3, |
| "valid_targets_min": 574 |
| }, |
| { |
| "epoch": 2.88, |
| "grad_norm": 0.8234587446370712, |
| "learning_rate": 1.8214843976899264e-05, |
| "loss": 0.454, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.4970802664756775, |
| "step": 1800, |
| "valid_targets_mean": 2389.6, |
| "valid_targets_min": 511 |
| }, |
| { |
| "epoch": 2.888, |
| "grad_norm": 0.7474318673230876, |
| "learning_rate": 1.810359740160919e-05, |
| "loss": 0.4377, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.44770461320877075, |
| "step": 1805, |
| "valid_targets_mean": 2616.4, |
| "valid_targets_min": 629 |
| }, |
| { |
| "epoch": 2.896, |
| "grad_norm": 0.507392374752142, |
| "learning_rate": 1.7992410001355515e-05, |
| "loss": 0.4388, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.4395235776901245, |
| "step": 1810, |
| "valid_targets_mean": 5488.2, |
| "valid_targets_min": 817 |
| }, |
| { |
| "epoch": 2.904, |
| "grad_norm": 0.7243529623293884, |
| "learning_rate": 1.788128524561168e-05, |
| "loss": 0.4574, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.5047330260276794, |
| "step": 1815, |
| "valid_targets_mean": 3967.6, |
| "valid_targets_min": 812 |
| }, |
| { |
| "epoch": 2.912, |
| "grad_norm": 0.633168445724496, |
| "learning_rate": 1.7770226601896397e-05, |
| "loss": 0.4324, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.47217708826065063, |
| "step": 1820, |
| "valid_targets_mean": 3495.6, |
| "valid_targets_min": 767 |
| }, |
| { |
| "epoch": 2.92, |
| "grad_norm": 0.5327318709010629, |
| "learning_rate": 1.7659237535665404e-05, |
| "loss": 0.4572, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.4306362569332123, |
| "step": 1825, |
| "valid_targets_mean": 4756.9, |
| "valid_targets_min": 754 |
| }, |
| { |
| "epoch": 2.928, |
| "grad_norm": 0.7771946593440502, |
| "learning_rate": 1.754832151020337e-05, |
| "loss": 0.4335, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.48200926184654236, |
| "step": 1830, |
| "valid_targets_mean": 2481.1, |
| "valid_targets_min": 794 |
| }, |
| { |
| "epoch": 2.936, |
| "grad_norm": 0.7503956631971685, |
| "learning_rate": 1.74374819865158e-05, |
| "loss": 0.435, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.43350616097450256, |
| "step": 1835, |
| "valid_targets_mean": 2832.5, |
| "valid_targets_min": 751 |
| }, |
| { |
| "epoch": 2.944, |
| "grad_norm": 0.5813547416857596, |
| "learning_rate": 1.7326722423221057e-05, |
| "loss": 0.4394, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.39921069145202637, |
| "step": 1840, |
| "valid_targets_mean": 3993.1, |
| "valid_targets_min": 597 |
| }, |
| { |
| "epoch": 2.952, |
| "grad_norm": 0.5326305159342818, |
| "learning_rate": 1.7216046276442438e-05, |
| "loss": 0.4184, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.40970325469970703, |
| "step": 1845, |
| "valid_targets_mean": 5141.3, |
| "valid_targets_min": 868 |
| }, |
| { |
| "epoch": 2.96, |
| "grad_norm": 0.5726519569305819, |
| "learning_rate": 1.7105456999700306e-05, |
| "loss": 0.4379, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.4494893550872803, |
| "step": 1850, |
| "valid_targets_mean": 4538.5, |
| "valid_targets_min": 1067 |
| }, |
| { |
| "epoch": 2.968, |
| "grad_norm": 0.5532240290014173, |
| "learning_rate": 1.6994958043804374e-05, |
| "loss": 0.4503, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.41899892687797546, |
| "step": 1855, |
| "valid_targets_mean": 4828.1, |
| "valid_targets_min": 602 |
| }, |
| { |
| "epoch": 2.976, |
| "grad_norm": 0.721900867482457, |
| "learning_rate": 1.6884552856745972e-05, |
| "loss": 0.4625, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.46213817596435547, |
| "step": 1860, |
| "valid_targets_mean": 2615.0, |
| "valid_targets_min": 288 |
| }, |
| { |
| "epoch": 2.984, |
| "grad_norm": 0.7315015103460375, |
| "learning_rate": 1.6774244883590503e-05, |
| "loss": 0.429, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.4381354749202728, |
| "step": 1865, |
| "valid_targets_mean": 2520.1, |
| "valid_targets_min": 626 |
| }, |
| { |
| "epoch": 2.992, |
| "grad_norm": 0.5819438726684737, |
| "learning_rate": 1.6664037566369905e-05, |
| "loss": 0.4362, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.4385232925415039, |
| "step": 1870, |
| "valid_targets_mean": 4100.1, |
| "valid_targets_min": 512 |
| }, |
| { |
| "epoch": 3.0, |
| "grad_norm": 0.6054633776816779, |
| "learning_rate": 1.6553934343975273e-05, |
| "loss": 0.4334, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.390241801738739, |
| "step": 1875, |
| "valid_targets_mean": 3394.1, |
| "valid_targets_min": 613 |
| }, |
| { |
| "epoch": 3.008, |
| "grad_norm": 0.5137093432064929, |
| "learning_rate": 1.644393865204955e-05, |
| "loss": 0.4403, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.4124566316604614, |
| "step": 1880, |
| "valid_targets_mean": 4975.0, |
| "valid_targets_min": 279 |
| }, |
| { |
| "epoch": 3.016, |
| "grad_norm": 0.6040955563332363, |
| "learning_rate": 1.6334053922880304e-05, |
| "loss": 0.4166, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.4080016613006592, |
| "step": 1885, |
| "valid_targets_mean": 4139.9, |
| "valid_targets_min": 1014 |
| }, |
| { |
| "epoch": 3.024, |
| "grad_norm": 0.5643520837040242, |
| "learning_rate": 1.622428358529265e-05, |
| "loss": 0.4374, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.41588467359542847, |
| "step": 1890, |
| "valid_targets_mean": 4808.7, |
| "valid_targets_min": 837 |
| }, |
| { |
| "epoch": 3.032, |
| "grad_norm": 0.5036209628878098, |
| "learning_rate": 1.611463106454224e-05, |
| "loss": 0.4334, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.36360183358192444, |
| "step": 1895, |
| "valid_targets_mean": 5222.1, |
| "valid_targets_min": 899 |
| }, |
| { |
| "epoch": 3.04, |
| "grad_norm": 0.643260239413669, |
| "learning_rate": 1.6005099782208392e-05, |
| "loss": 0.4385, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.4102736711502075, |
| "step": 1900, |
| "valid_targets_mean": 3426.6, |
| "valid_targets_min": 624 |
| }, |
| { |
| "epoch": 3.048, |
| "grad_norm": 0.5073496084996462, |
| "learning_rate": 1.5895693156087317e-05, |
| "loss": 0.4128, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.41783252358436584, |
| "step": 1905, |
| "valid_targets_mean": 6147.1, |
| "valid_targets_min": 912 |
| }, |
| { |
| "epoch": 3.056, |
| "grad_norm": 0.6943111946599407, |
| "learning_rate": 1.578641460008548e-05, |
| "loss": 0.4402, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.5079389214515686, |
| "step": 1910, |
| "valid_targets_mean": 3470.3, |
| "valid_targets_min": 508 |
| }, |
| { |
| "epoch": 3.064, |
| "grad_norm": 0.7091661125569685, |
| "learning_rate": 1.5677267524113054e-05, |
| "loss": 0.4107, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.4140545129776001, |
| "step": 1915, |
| "valid_targets_mean": 3084.1, |
| "valid_targets_min": 626 |
| }, |
| { |
| "epoch": 3.072, |
| "grad_norm": 0.6859858593138877, |
| "learning_rate": 1.5568255333977547e-05, |
| "loss": 0.4185, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.4497836232185364, |
| "step": 1920, |
| "valid_targets_mean": 3122.9, |
| "valid_targets_min": 664 |
| }, |
| { |
| "epoch": 3.08, |
| "grad_norm": 0.7339049628922232, |
| "learning_rate": 1.5459381431277506e-05, |
| "loss": 0.4082, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3879634737968445, |
| "step": 1925, |
| "valid_targets_mean": 2320.3, |
| "valid_targets_min": 447 |
| }, |
| { |
| "epoch": 3.088, |
| "grad_norm": 1.7541410222491485, |
| "learning_rate": 1.5350649213296373e-05, |
| "loss": 0.4249, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.46820366382598877, |
| "step": 1930, |
| "valid_targets_mean": 3518.1, |
| "valid_targets_min": 646 |
| }, |
| { |
| "epoch": 3.096, |
| "grad_norm": 0.6039401909562907, |
| "learning_rate": 1.5242062072896483e-05, |
| "loss": 0.4204, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.4237516522407532, |
| "step": 1935, |
| "valid_targets_mean": 4190.0, |
| "valid_targets_min": 884 |
| }, |
| { |
| "epoch": 3.104, |
| "grad_norm": 0.6053990380451738, |
| "learning_rate": 1.5133623398413209e-05, |
| "loss": 0.3991, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.38883084058761597, |
| "step": 1940, |
| "valid_targets_mean": 3890.1, |
| "valid_targets_min": 621 |
| }, |
| { |
| "epoch": 3.112, |
| "grad_norm": 0.5153567551089437, |
| "learning_rate": 1.50253365735492e-05, |
| "loss": 0.4124, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3877636790275574, |
| "step": 1945, |
| "valid_targets_mean": 4963.4, |
| "valid_targets_min": 519 |
| }, |
| { |
| "epoch": 3.12, |
| "grad_norm": 0.7398879295621316, |
| "learning_rate": 1.4917204977268833e-05, |
| "loss": 0.432, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.4899936318397522, |
| "step": 1950, |
| "valid_targets_mean": 3293.1, |
| "valid_targets_min": 745 |
| }, |
| { |
| "epoch": 3.128, |
| "grad_norm": 0.5271555062833402, |
| "learning_rate": 1.4809231983692733e-05, |
| "loss": 0.4097, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.37848031520843506, |
| "step": 1955, |
| "valid_targets_mean": 4639.6, |
| "valid_targets_min": 826 |
| }, |
| { |
| "epoch": 3.136, |
| "grad_norm": 0.5550015442785227, |
| "learning_rate": 1.4701420961992533e-05, |
| "loss": 0.424, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.4084477126598358, |
| "step": 1960, |
| "valid_targets_mean": 4837.2, |
| "valid_targets_min": 556 |
| }, |
| { |
| "epoch": 3.144, |
| "grad_norm": 0.7096847519468681, |
| "learning_rate": 1.459377527628571e-05, |
| "loss": 0.4275, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.4384467899799347, |
| "step": 1965, |
| "valid_targets_mean": 2920.6, |
| "valid_targets_min": 723 |
| }, |
| { |
| "epoch": 3.152, |
| "grad_norm": 0.7301446675432169, |
| "learning_rate": 1.4486298285530634e-05, |
| "loss": 0.4267, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.41845598816871643, |
| "step": 1970, |
| "valid_targets_mean": 2488.9, |
| "valid_targets_min": 774 |
| }, |
| { |
| "epoch": 3.16, |
| "grad_norm": 0.675361855978539, |
| "learning_rate": 1.4378993343421736e-05, |
| "loss": 0.4293, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.41537049412727356, |
| "step": 1975, |
| "valid_targets_mean": 3094.2, |
| "valid_targets_min": 416 |
| }, |
| { |
| "epoch": 3.168, |
| "grad_norm": 0.5632344378219207, |
| "learning_rate": 1.4271863798284877e-05, |
| "loss": 0.4141, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.4148460030555725, |
| "step": 1980, |
| "valid_targets_mean": 4743.3, |
| "valid_targets_min": 986 |
| }, |
| { |
| "epoch": 3.176, |
| "grad_norm": 0.6386673015303019, |
| "learning_rate": 1.4164912992972846e-05, |
| "loss": 0.4376, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.4006524682044983, |
| "step": 1985, |
| "valid_targets_mean": 3333.8, |
| "valid_targets_min": 523 |
| }, |
| { |
| "epoch": 3.184, |
| "grad_norm": 0.7341708673500656, |
| "learning_rate": 1.4058144264761087e-05, |
| "loss": 0.4131, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.4031445384025574, |
| "step": 1990, |
| "valid_targets_mean": 5348.2, |
| "valid_targets_min": 653 |
| }, |
| { |
| "epoch": 3.192, |
| "grad_norm": 0.6108805400299323, |
| "learning_rate": 1.3951560945243517e-05, |
| "loss": 0.4285, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.39428362250328064, |
| "step": 1995, |
| "valid_targets_mean": 3951.9, |
| "valid_targets_min": 742 |
| }, |
| { |
| "epoch": 3.2, |
| "grad_norm": 0.5744519338390691, |
| "learning_rate": 1.3845166360228597e-05, |
| "loss": 0.4248, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.40177762508392334, |
| "step": 2000, |
| "valid_targets_mean": 4564.3, |
| "valid_targets_min": 684 |
| }, |
| { |
| "epoch": 3.208, |
| "grad_norm": 0.6863671838454662, |
| "learning_rate": 1.3738963829635559e-05, |
| "loss": 0.4504, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.46749067306518555, |
| "step": 2005, |
| "valid_targets_mean": 3531.8, |
| "valid_targets_min": 492 |
| }, |
| { |
| "epoch": 3.216, |
| "grad_norm": 0.6671591173606514, |
| "learning_rate": 1.3632956667390784e-05, |
| "loss": 0.407, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.41678929328918457, |
| "step": 2010, |
| "valid_targets_mean": 3826.6, |
| "valid_targets_min": 561 |
| }, |
| { |
| "epoch": 3.224, |
| "grad_norm": 0.588235248316702, |
| "learning_rate": 1.3527148181324425e-05, |
| "loss": 0.4276, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.4322141706943512, |
| "step": 2015, |
| "valid_targets_mean": 4300.5, |
| "valid_targets_min": 661 |
| }, |
| { |
| "epoch": 3.232, |
| "grad_norm": 0.5254294071213138, |
| "learning_rate": 1.3421541673067168e-05, |
| "loss": 0.4247, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.38688722252845764, |
| "step": 2020, |
| "valid_targets_mean": 4773.9, |
| "valid_targets_min": 1061 |
| }, |
| { |
| "epoch": 3.24, |
| "grad_norm": 0.7778220547959938, |
| "learning_rate": 1.3316140437947207e-05, |
| "loss": 0.4248, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.4182344675064087, |
| "step": 2025, |
| "valid_targets_mean": 4412.4, |
| "valid_targets_min": 572 |
| }, |
| { |
| "epoch": 3.248, |
| "grad_norm": 0.5354024193090587, |
| "learning_rate": 1.321094776488745e-05, |
| "loss": 0.4155, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.38844114542007446, |
| "step": 2030, |
| "valid_targets_mean": 4513.8, |
| "valid_targets_min": 901 |
| }, |
| { |
| "epoch": 3.2560000000000002, |
| "grad_norm": 0.6307442771592611, |
| "learning_rate": 1.3105966936302856e-05, |
| "loss": 0.4213, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3858344554901123, |
| "step": 2035, |
| "valid_targets_mean": 3388.1, |
| "valid_targets_min": 688 |
| }, |
| { |
| "epoch": 3.2640000000000002, |
| "grad_norm": 0.7489956045920521, |
| "learning_rate": 1.3001201227998023e-05, |
| "loss": 0.4295, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.4188210964202881, |
| "step": 2040, |
| "valid_targets_mean": 2661.7, |
| "valid_targets_min": 659 |
| }, |
| { |
| "epoch": 3.2720000000000002, |
| "grad_norm": 0.650505657663387, |
| "learning_rate": 1.2896653909064964e-05, |
| "loss": 0.4111, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.4127410650253296, |
| "step": 2045, |
| "valid_targets_mean": 4998.3, |
| "valid_targets_min": 813 |
| }, |
| { |
| "epoch": 3.2800000000000002, |
| "grad_norm": 0.5978107263413696, |
| "learning_rate": 1.2792328241781124e-05, |
| "loss": 0.4016, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.4069294035434723, |
| "step": 2050, |
| "valid_targets_mean": 4051.4, |
| "valid_targets_min": 744 |
| }, |
| { |
| "epoch": 3.288, |
| "grad_norm": 0.629812123697598, |
| "learning_rate": 1.2688227481507546e-05, |
| "loss": 0.4182, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.4324589669704437, |
| "step": 2055, |
| "valid_targets_mean": 3744.4, |
| "valid_targets_min": 681 |
| }, |
| { |
| "epoch": 3.296, |
| "grad_norm": 0.5549507988646019, |
| "learning_rate": 1.258435487658733e-05, |
| "loss": 0.4164, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.40244030952453613, |
| "step": 2060, |
| "valid_targets_mean": 4940.0, |
| "valid_targets_min": 649 |
| }, |
| { |
| "epoch": 3.304, |
| "grad_norm": 0.5869431749420226, |
| "learning_rate": 1.2480713668244243e-05, |
| "loss": 0.4177, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.41933634877204895, |
| "step": 2065, |
| "valid_targets_mean": 4774.3, |
| "valid_targets_min": 601 |
| }, |
| { |
| "epoch": 3.312, |
| "grad_norm": 0.5560654604661646, |
| "learning_rate": 1.2377307090481586e-05, |
| "loss": 0.4348, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.40384188294410706, |
| "step": 2070, |
| "valid_targets_mean": 4333.8, |
| "valid_targets_min": 629 |
| }, |
| { |
| "epoch": 3.32, |
| "grad_norm": 0.5258484186346938, |
| "learning_rate": 1.2274138369981298e-05, |
| "loss": 0.4312, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.41006770730018616, |
| "step": 2075, |
| "valid_targets_mean": 5825.9, |
| "valid_targets_min": 816 |
| }, |
| { |
| "epoch": 3.328, |
| "grad_norm": 0.721798719675094, |
| "learning_rate": 1.2171210726003256e-05, |
| "loss": 0.4107, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.4058680534362793, |
| "step": 2080, |
| "valid_targets_mean": 3225.6, |
| "valid_targets_min": 823 |
| }, |
| { |
| "epoch": 3.336, |
| "grad_norm": 0.6048643181166588, |
| "learning_rate": 1.2068527370284815e-05, |
| "loss": 0.4163, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.45129895210266113, |
| "step": 2085, |
| "valid_targets_mean": 3978.1, |
| "valid_targets_min": 534 |
| }, |
| { |
| "epoch": 3.344, |
| "grad_norm": 0.6339488417554544, |
| "learning_rate": 1.1966091506940616e-05, |
| "loss": 0.4184, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.43796777725219727, |
| "step": 2090, |
| "valid_targets_mean": 3807.9, |
| "valid_targets_min": 753 |
| }, |
| { |
| "epoch": 3.352, |
| "grad_norm": 0.6016289665121101, |
| "learning_rate": 1.1863906332362569e-05, |
| "loss": 0.4001, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.41488558053970337, |
| "step": 2095, |
| "valid_targets_mean": 3921.8, |
| "valid_targets_min": 687 |
| }, |
| { |
| "epoch": 3.36, |
| "grad_norm": 0.6737156145382773, |
| "learning_rate": 1.176197503512015e-05, |
| "loss": 0.4234, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.46443474292755127, |
| "step": 2100, |
| "valid_targets_mean": 3559.7, |
| "valid_targets_min": 823 |
| }, |
| { |
| "epoch": 3.368, |
| "grad_norm": 0.6983626223742545, |
| "learning_rate": 1.1660300795860877e-05, |
| "loss": 0.427, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.432370662689209, |
| "step": 2105, |
| "valid_targets_mean": 3061.8, |
| "valid_targets_min": 769 |
| }, |
| { |
| "epoch": 3.376, |
| "grad_norm": 0.4979082402374389, |
| "learning_rate": 1.1558886787211071e-05, |
| "loss": 0.4313, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3811950087547302, |
| "step": 2110, |
| "valid_targets_mean": 5262.1, |
| "valid_targets_min": 892 |
| }, |
| { |
| "epoch": 3.384, |
| "grad_norm": 0.5658616278719996, |
| "learning_rate": 1.1457736173676883e-05, |
| "loss": 0.384, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.39314180612564087, |
| "step": 2115, |
| "valid_targets_mean": 5609.1, |
| "valid_targets_min": 701 |
| }, |
| { |
| "epoch": 3.392, |
| "grad_norm": 0.5742144020806174, |
| "learning_rate": 1.1356852111545493e-05, |
| "loss": 0.4091, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3987872302532196, |
| "step": 2120, |
| "valid_targets_mean": 4422.2, |
| "valid_targets_min": 775 |
| }, |
| { |
| "epoch": 3.4, |
| "grad_norm": 0.5596475137152013, |
| "learning_rate": 1.1256237748786675e-05, |
| "loss": 0.3993, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3944924771785736, |
| "step": 2125, |
| "valid_targets_mean": 4539.4, |
| "valid_targets_min": 860 |
| }, |
| { |
| "epoch": 3.408, |
| "grad_norm": 0.6913259682743764, |
| "learning_rate": 1.1155896224954543e-05, |
| "loss": 0.4201, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.46018218994140625, |
| "step": 2130, |
| "valid_targets_mean": 3704.2, |
| "valid_targets_min": 719 |
| }, |
| { |
| "epoch": 3.416, |
| "grad_norm": 0.5521206700287924, |
| "learning_rate": 1.1055830671089578e-05, |
| "loss": 0.4269, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.41626229882240295, |
| "step": 2135, |
| "valid_targets_mean": 5602.0, |
| "valid_targets_min": 737 |
| }, |
| { |
| "epoch": 3.424, |
| "grad_norm": 0.626791492401228, |
| "learning_rate": 1.0956044209620966e-05, |
| "loss": 0.4124, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.435993492603302, |
| "step": 2140, |
| "valid_targets_mean": 3991.2, |
| "valid_targets_min": 496 |
| }, |
| { |
| "epoch": 3.432, |
| "grad_norm": 0.476094171103533, |
| "learning_rate": 1.0856539954269121e-05, |
| "loss": 0.4253, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.377435564994812, |
| "step": 2145, |
| "valid_targets_mean": 5789.9, |
| "valid_targets_min": 884 |
| }, |
| { |
| "epoch": 3.44, |
| "grad_norm": 0.6128716789365134, |
| "learning_rate": 1.0757321009948543e-05, |
| "loss": 0.419, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.40004780888557434, |
| "step": 2150, |
| "valid_targets_mean": 3649.6, |
| "valid_targets_min": 495 |
| }, |
| { |
| "epoch": 3.448, |
| "grad_norm": 0.5575841204894988, |
| "learning_rate": 1.0658390472670938e-05, |
| "loss": 0.3902, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.4247322976589203, |
| "step": 2155, |
| "valid_targets_mean": 6032.9, |
| "valid_targets_min": 985 |
| }, |
| { |
| "epoch": 3.456, |
| "grad_norm": 0.6753891110732698, |
| "learning_rate": 1.0559751429448597e-05, |
| "loss": 0.42, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.4023727774620056, |
| "step": 2160, |
| "valid_targets_mean": 4760.7, |
| "valid_targets_min": 647 |
| }, |
| { |
| "epoch": 3.464, |
| "grad_norm": 0.6369181074836571, |
| "learning_rate": 1.0461406958198101e-05, |
| "loss": 0.4353, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.4552972912788391, |
| "step": 2165, |
| "valid_targets_mean": 4412.8, |
| "valid_targets_min": 600 |
| }, |
| { |
| "epoch": 3.472, |
| "grad_norm": 0.4819966107421562, |
| "learning_rate": 1.0363360127644235e-05, |
| "loss": 0.4066, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.394325315952301, |
| "step": 2170, |
| "valid_targets_mean": 7356.6, |
| "valid_targets_min": 622 |
| }, |
| { |
| "epoch": 3.48, |
| "grad_norm": 0.6128025340406501, |
| "learning_rate": 1.0265613997224255e-05, |
| "loss": 0.4125, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3975856900215149, |
| "step": 2175, |
| "valid_targets_mean": 3477.9, |
| "valid_targets_min": 605 |
| }, |
| { |
| "epoch": 3.488, |
| "grad_norm": 0.6384157096000654, |
| "learning_rate": 1.0168171616992422e-05, |
| "loss": 0.4358, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.4252591133117676, |
| "step": 2180, |
| "valid_targets_mean": 4226.9, |
| "valid_targets_min": 498 |
| }, |
| { |
| "epoch": 3.496, |
| "grad_norm": 0.5767516682589051, |
| "learning_rate": 1.007103602752483e-05, |
| "loss": 0.4353, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.4446565508842468, |
| "step": 2185, |
| "valid_targets_mean": 4517.8, |
| "valid_targets_min": 576 |
| }, |
| { |
| "epoch": 3.504, |
| "grad_norm": 0.5724798059794518, |
| "learning_rate": 9.974210259824505e-06, |
| "loss": 0.4143, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.4005405604839325, |
| "step": 2190, |
| "valid_targets_mean": 4404.2, |
| "valid_targets_min": 678 |
| }, |
| { |
| "epoch": 3.512, |
| "grad_norm": 0.5733569057551399, |
| "learning_rate": 9.877697335226872e-06, |
| "loss": 0.4355, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.4807167053222656, |
| "step": 2195, |
| "valid_targets_mean": 4826.6, |
| "valid_targets_min": 592 |
| }, |
| { |
| "epoch": 3.52, |
| "grad_norm": 1.1802646891503334, |
| "learning_rate": 9.781500265305448e-06, |
| "loss": 0.422, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.43163758516311646, |
| "step": 2200, |
| "valid_targets_mean": 3795.0, |
| "valid_targets_min": 705 |
| }, |
| { |
| "epoch": 3.528, |
| "grad_norm": 0.8845021260253212, |
| "learning_rate": 9.685622051777856e-06, |
| "loss": 0.4302, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.46266594529151917, |
| "step": 2205, |
| "valid_targets_mean": 2079.0, |
| "valid_targets_min": 708 |
| }, |
| { |
| "epoch": 3.536, |
| "grad_norm": 0.5646534622070288, |
| "learning_rate": 9.590065686412182e-06, |
| "loss": 0.3905, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.39034974575042725, |
| "step": 2210, |
| "valid_targets_mean": 4726.2, |
| "valid_targets_min": 376 |
| }, |
| { |
| "epoch": 3.544, |
| "grad_norm": 0.5508012766023374, |
| "learning_rate": 9.494834150933616e-06, |
| "loss": 0.412, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.42684414982795715, |
| "step": 2215, |
| "valid_targets_mean": 5314.9, |
| "valid_targets_min": 552 |
| }, |
| { |
| "epoch": 3.552, |
| "grad_norm": 0.6966622976087259, |
| "learning_rate": 9.399930416931404e-06, |
| "loss": 0.4038, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.38812291622161865, |
| "step": 2220, |
| "valid_targets_mean": 4849.1, |
| "valid_targets_min": 860 |
| }, |
| { |
| "epoch": 3.56, |
| "grad_norm": 0.5793443000507197, |
| "learning_rate": 9.30535744576615e-06, |
| "loss": 0.4427, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.4145427346229553, |
| "step": 2225, |
| "valid_targets_mean": 4751.8, |
| "valid_targets_min": 899 |
| }, |
| { |
| "epoch": 3.568, |
| "grad_norm": 0.5440153611777978, |
| "learning_rate": 9.211118188477362e-06, |
| "loss": 0.4129, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.42668813467025757, |
| "step": 2230, |
| "valid_targets_mean": 4886.1, |
| "valid_targets_min": 825 |
| }, |
| { |
| "epoch": 3.576, |
| "grad_norm": 0.6942559664808036, |
| "learning_rate": 9.117215585691408e-06, |
| "loss": 0.4318, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.408440500497818, |
| "step": 2235, |
| "valid_targets_mean": 2879.3, |
| "valid_targets_min": 575 |
| }, |
| { |
| "epoch": 3.584, |
| "grad_norm": 0.5283718370515997, |
| "learning_rate": 9.023652567529744e-06, |
| "loss": 0.4322, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.39787888526916504, |
| "step": 2240, |
| "valid_targets_mean": 5380.6, |
| "valid_targets_min": 797 |
| }, |
| { |
| "epoch": 3.592, |
| "grad_norm": 0.7189589849266416, |
| "learning_rate": 8.930432053517465e-06, |
| "loss": 0.4315, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.4863574802875519, |
| "step": 2245, |
| "valid_targets_mean": 3135.4, |
| "valid_targets_min": 598 |
| }, |
| { |
| "epoch": 3.6, |
| "grad_norm": 0.5688319197328309, |
| "learning_rate": 8.837556952492264e-06, |
| "loss": 0.427, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.443569153547287, |
| "step": 2250, |
| "valid_targets_mean": 4849.6, |
| "valid_targets_min": 491 |
| }, |
| { |
| "epoch": 3.608, |
| "grad_norm": 0.6372972828422979, |
| "learning_rate": 8.745030162513582e-06, |
| "loss": 0.4112, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.43911778926849365, |
| "step": 2255, |
| "valid_targets_mean": 3977.4, |
| "valid_targets_min": 674 |
| }, |
| { |
| "epoch": 3.616, |
| "grad_norm": 0.646929389349214, |
| "learning_rate": 8.652854570772236e-06, |
| "loss": 0.4331, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.452898770570755, |
| "step": 2260, |
| "valid_targets_mean": 4541.3, |
| "valid_targets_min": 622 |
| }, |
| { |
| "epoch": 3.624, |
| "grad_norm": 0.536120974383535, |
| "learning_rate": 8.561033053500312e-06, |
| "loss": 0.4012, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.39861825108528137, |
| "step": 2265, |
| "valid_targets_mean": 5880.2, |
| "valid_targets_min": 680 |
| }, |
| { |
| "epoch": 3.632, |
| "grad_norm": 0.5883785010261273, |
| "learning_rate": 8.46956847588141e-06, |
| "loss": 0.4105, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.4199955463409424, |
| "step": 2270, |
| "valid_targets_mean": 4599.0, |
| "valid_targets_min": 569 |
| }, |
| { |
| "epoch": 3.64, |
| "grad_norm": 0.43011548249040454, |
| "learning_rate": 8.378463691961237e-06, |
| "loss": 0.4052, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3818497955799103, |
| "step": 2275, |
| "valid_targets_mean": 7853.8, |
| "valid_targets_min": 1082 |
| }, |
| { |
| "epoch": 3.648, |
| "grad_norm": 0.7813234320320073, |
| "learning_rate": 8.287721544558574e-06, |
| "loss": 0.423, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.4120236039161682, |
| "step": 2280, |
| "valid_targets_mean": 2544.3, |
| "valid_targets_min": 777 |
| }, |
| { |
| "epoch": 3.656, |
| "grad_norm": 0.5267738721602246, |
| "learning_rate": 8.197344865176548e-06, |
| "loss": 0.4039, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3992099165916443, |
| "step": 2285, |
| "valid_targets_mean": 4824.1, |
| "valid_targets_min": 421 |
| }, |
| { |
| "epoch": 3.664, |
| "grad_norm": 0.5857399421262088, |
| "learning_rate": 8.10733647391427e-06, |
| "loss": 0.4192, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3996756076812744, |
| "step": 2290, |
| "valid_targets_mean": 4680.4, |
| "valid_targets_min": 573 |
| }, |
| { |
| "epoch": 3.672, |
| "grad_norm": 0.6229880410561257, |
| "learning_rate": 8.017699179378849e-06, |
| "loss": 0.4102, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.4350461959838867, |
| "step": 2295, |
| "valid_targets_mean": 4063.1, |
| "valid_targets_min": 535 |
| }, |
| { |
| "epoch": 3.68, |
| "grad_norm": 0.5935713053030977, |
| "learning_rate": 7.928435778597763e-06, |
| "loss": 0.4112, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.4190603494644165, |
| "step": 2300, |
| "valid_targets_mean": 4264.1, |
| "valid_targets_min": 754 |
| }, |
| { |
| "epoch": 3.6879999999999997, |
| "grad_norm": 0.8421241937446357, |
| "learning_rate": 7.839549056931557e-06, |
| "loss": 0.4345, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.4648500084877014, |
| "step": 2305, |
| "valid_targets_mean": 2191.2, |
| "valid_targets_min": 812 |
| }, |
| { |
| "epoch": 3.6959999999999997, |
| "grad_norm": 0.627712707242927, |
| "learning_rate": 7.751041787986965e-06, |
| "loss": 0.4379, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.43756556510925293, |
| "step": 2310, |
| "valid_targets_mean": 3952.6, |
| "valid_targets_min": 644 |
| }, |
| { |
| "epoch": 3.7039999999999997, |
| "grad_norm": 0.55692187150058, |
| "learning_rate": 7.662916733530317e-06, |
| "loss": 0.4214, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.410952627658844, |
| "step": 2315, |
| "valid_targets_mean": 5188.4, |
| "valid_targets_min": 1013 |
| }, |
| { |
| "epoch": 3.7119999999999997, |
| "grad_norm": 0.5841435249769223, |
| "learning_rate": 7.575176643401394e-06, |
| "loss": 0.3974, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.39622873067855835, |
| "step": 2320, |
| "valid_targets_mean": 4232.2, |
| "valid_targets_min": 691 |
| }, |
| { |
| "epoch": 3.7199999999999998, |
| "grad_norm": 0.6334245660960619, |
| "learning_rate": 7.487824255427616e-06, |
| "loss": 0.4123, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.43315714597702026, |
| "step": 2325, |
| "valid_targets_mean": 3952.1, |
| "valid_targets_min": 679 |
| }, |
| { |
| "epoch": 3.7279999999999998, |
| "grad_norm": 0.7125490272965322, |
| "learning_rate": 7.400862295338595e-06, |
| "loss": 0.4025, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3960513770580292, |
| "step": 2330, |
| "valid_targets_mean": 2979.1, |
| "valid_targets_min": 568 |
| }, |
| { |
| "epoch": 3.7359999999999998, |
| "grad_norm": 0.7047871741832065, |
| "learning_rate": 7.314293476681122e-06, |
| "loss": 0.4278, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.4047684669494629, |
| "step": 2335, |
| "valid_targets_mean": 2885.2, |
| "valid_targets_min": 769 |
| }, |
| { |
| "epoch": 3.7439999999999998, |
| "grad_norm": 0.5235697909405775, |
| "learning_rate": 7.228120500734443e-06, |
| "loss": 0.4066, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.39039039611816406, |
| "step": 2340, |
| "valid_targets_mean": 5031.9, |
| "valid_targets_min": 693 |
| }, |
| { |
| "epoch": 3.752, |
| "grad_norm": 0.6309610439555812, |
| "learning_rate": 7.1423460564259995e-06, |
| "loss": 0.425, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.41119787096977234, |
| "step": 2345, |
| "valid_targets_mean": 3696.8, |
| "valid_targets_min": 615 |
| }, |
| { |
| "epoch": 3.76, |
| "grad_norm": 0.6046248254536285, |
| "learning_rate": 7.056972820247516e-06, |
| "loss": 0.4312, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.44950827956199646, |
| "step": 2350, |
| "valid_targets_mean": 4173.8, |
| "valid_targets_min": 468 |
| }, |
| { |
| "epoch": 3.768, |
| "grad_norm": 0.5813802818171795, |
| "learning_rate": 6.97200345617149e-06, |
| "loss": 0.4251, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.4253307580947876, |
| "step": 2355, |
| "valid_targets_mean": 4188.0, |
| "valid_targets_min": 906 |
| }, |
| { |
| "epoch": 3.776, |
| "grad_norm": 0.6480857251816284, |
| "learning_rate": 6.887440615568044e-06, |
| "loss": 0.4063, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3995557427406311, |
| "step": 2360, |
| "valid_targets_mean": 3368.9, |
| "valid_targets_min": 696 |
| }, |
| { |
| "epoch": 3.784, |
| "grad_norm": 0.5978641746105108, |
| "learning_rate": 6.803286937122233e-06, |
| "loss": 0.4212, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.4335462749004364, |
| "step": 2365, |
| "valid_targets_mean": 4294.8, |
| "valid_targets_min": 717 |
| }, |
| { |
| "epoch": 3.792, |
| "grad_norm": 0.705354339864555, |
| "learning_rate": 6.719545046751674e-06, |
| "loss": 0.4492, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.4486519694328308, |
| "step": 2370, |
| "valid_targets_mean": 3097.3, |
| "valid_targets_min": 667 |
| }, |
| { |
| "epoch": 3.8, |
| "grad_norm": 0.6447197729667318, |
| "learning_rate": 6.636217557524605e-06, |
| "loss": 0.4089, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.4317939281463623, |
| "step": 2375, |
| "valid_targets_mean": 3642.6, |
| "valid_targets_min": 738 |
| }, |
| { |
| "epoch": 3.808, |
| "grad_norm": 0.5784840504063279, |
| "learning_rate": 6.55330706957837e-06, |
| "loss": 0.4183, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.417401522397995, |
| "step": 2380, |
| "valid_targets_mean": 4374.6, |
| "valid_targets_min": 1143 |
| }, |
| { |
| "epoch": 3.816, |
| "grad_norm": 0.5691858028003152, |
| "learning_rate": 6.4708161700382655e-06, |
| "loss": 0.4185, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.4285266101360321, |
| "step": 2385, |
| "valid_targets_mean": 4893.5, |
| "valid_targets_min": 527 |
| }, |
| { |
| "epoch": 3.824, |
| "grad_norm": 0.6509918903676563, |
| "learning_rate": 6.388747432936819e-06, |
| "loss": 0.3843, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.39279234409332275, |
| "step": 2390, |
| "valid_targets_mean": 3421.9, |
| "valid_targets_min": 766 |
| }, |
| { |
| "epoch": 3.832, |
| "grad_norm": 0.5477195713050954, |
| "learning_rate": 6.3071034191334915e-06, |
| "loss": 0.3963, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.4045974612236023, |
| "step": 2395, |
| "valid_targets_mean": 4609.2, |
| "valid_targets_min": 868 |
| }, |
| { |
| "epoch": 3.84, |
| "grad_norm": 0.6280025691309644, |
| "learning_rate": 6.22588667623472e-06, |
| "loss": 0.4238, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.4826744794845581, |
| "step": 2400, |
| "valid_targets_mean": 4032.0, |
| "valid_targets_min": 473 |
| }, |
| { |
| "epoch": 3.848, |
| "grad_norm": 0.7680355117957194, |
| "learning_rate": 6.145099738514466e-06, |
| "loss": 0.4578, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.4926620125770569, |
| "step": 2405, |
| "valid_targets_mean": 2725.4, |
| "valid_targets_min": 615 |
| }, |
| { |
| "epoch": 3.856, |
| "grad_norm": 0.5711966605379848, |
| "learning_rate": 6.064745126835112e-06, |
| "loss": 0.4111, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.4238035976886749, |
| "step": 2410, |
| "valid_targets_mean": 4564.0, |
| "valid_targets_min": 679 |
| }, |
| { |
| "epoch": 3.864, |
| "grad_norm": 0.5326749978154176, |
| "learning_rate": 5.984825348568812e-06, |
| "loss": 0.4065, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.4256637394428253, |
| "step": 2415, |
| "valid_targets_mean": 5087.4, |
| "valid_targets_min": 659 |
| }, |
| { |
| "epoch": 3.872, |
| "grad_norm": 0.7369604952522139, |
| "learning_rate": 5.905342897519262e-06, |
| "loss": 0.405, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.47101157903671265, |
| "step": 2420, |
| "valid_targets_mean": 2868.4, |
| "valid_targets_min": 558 |
| }, |
| { |
| "epoch": 3.88, |
| "grad_norm": 0.7010288266967857, |
| "learning_rate": 5.826300253843851e-06, |
| "loss": 0.421, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3836793005466461, |
| "step": 2425, |
| "valid_targets_mean": 2784.3, |
| "valid_targets_min": 575 |
| }, |
| { |
| "epoch": 3.888, |
| "grad_norm": 0.6824318371192227, |
| "learning_rate": 5.7476998839763035e-06, |
| "loss": 0.4208, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.4819521903991699, |
| "step": 2430, |
| "valid_targets_mean": 3219.2, |
| "valid_targets_min": 660 |
| }, |
| { |
| "epoch": 3.896, |
| "grad_norm": 0.5989642635294622, |
| "learning_rate": 5.669544240549698e-06, |
| "loss": 0.3991, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.40206092596054077, |
| "step": 2435, |
| "valid_targets_mean": 3922.7, |
| "valid_targets_min": 749 |
| }, |
| { |
| "epoch": 3.904, |
| "grad_norm": 0.5819637834251199, |
| "learning_rate": 5.591835762319946e-06, |
| "loss": 0.43, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.4356538653373718, |
| "step": 2440, |
| "valid_targets_mean": 4358.2, |
| "valid_targets_min": 989 |
| }, |
| { |
| "epoch": 3.912, |
| "grad_norm": 0.8093003590748824, |
| "learning_rate": 5.514576874089683e-06, |
| "loss": 0.4171, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.4149336814880371, |
| "step": 2445, |
| "valid_targets_mean": 3634.3, |
| "valid_targets_min": 761 |
| }, |
| { |
| "epoch": 3.92, |
| "grad_norm": 0.5637333714042546, |
| "learning_rate": 5.437769986632622e-06, |
| "loss": 0.4192, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.40535950660705566, |
| "step": 2450, |
| "valid_targets_mean": 5450.6, |
| "valid_targets_min": 842 |
| }, |
| { |
| "epoch": 3.928, |
| "grad_norm": 0.5650303402408413, |
| "learning_rate": 5.361417496618315e-06, |
| "loss": 0.4098, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.4089083969593048, |
| "step": 2455, |
| "valid_targets_mean": 4491.1, |
| "valid_targets_min": 402 |
| }, |
| { |
| "epoch": 3.936, |
| "grad_norm": 0.5862251884278199, |
| "learning_rate": 5.285521786537368e-06, |
| "loss": 0.4296, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.421395480632782, |
| "step": 2460, |
| "valid_targets_mean": 4045.0, |
| "valid_targets_min": 499 |
| }, |
| { |
| "epoch": 3.944, |
| "grad_norm": 0.5911774172256168, |
| "learning_rate": 5.2100852246270975e-06, |
| "loss": 0.4443, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.41850167512893677, |
| "step": 2465, |
| "valid_targets_mean": 4103.7, |
| "valid_targets_min": 1182 |
| }, |
| { |
| "epoch": 3.952, |
| "grad_norm": 0.5488515492585119, |
| "learning_rate": 5.135110164797637e-06, |
| "loss": 0.4105, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.4004397988319397, |
| "step": 2470, |
| "valid_targets_mean": 4585.8, |
| "valid_targets_min": 741 |
| }, |
| { |
| "epoch": 3.96, |
| "grad_norm": 0.638564502319262, |
| "learning_rate": 5.060598946558484e-06, |
| "loss": 0.4295, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.43971341848373413, |
| "step": 2475, |
| "valid_targets_mean": 3582.0, |
| "valid_targets_min": 847 |
| }, |
| { |
| "epoch": 3.968, |
| "grad_norm": 0.5896713751876114, |
| "learning_rate": 4.986553894945512e-06, |
| "loss": 0.3939, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3950134515762329, |
| "step": 2480, |
| "valid_targets_mean": 3773.5, |
| "valid_targets_min": 801 |
| }, |
| { |
| "epoch": 3.976, |
| "grad_norm": 0.7928195363821494, |
| "learning_rate": 4.912977320448391e-06, |
| "loss": 0.4187, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3833604156970978, |
| "step": 2485, |
| "valid_targets_mean": 3785.5, |
| "valid_targets_min": 473 |
| }, |
| { |
| "epoch": 3.984, |
| "grad_norm": 0.59139939976017, |
| "learning_rate": 4.839871518938513e-06, |
| "loss": 0.4383, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.4159795343875885, |
| "step": 2490, |
| "valid_targets_mean": 4217.4, |
| "valid_targets_min": 663 |
| }, |
| { |
| "epoch": 3.992, |
| "grad_norm": 0.550470299025946, |
| "learning_rate": 4.767238771597347e-06, |
| "loss": 0.3958, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3765171766281128, |
| "step": 2495, |
| "valid_targets_mean": 5407.9, |
| "valid_targets_min": 1275 |
| }, |
| { |
| "epoch": 4.0, |
| "grad_norm": 0.6285536655979354, |
| "learning_rate": 4.695081344845254e-06, |
| "loss": 0.4467, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.4390712380409241, |
| "step": 2500, |
| "valid_targets_mean": 3904.6, |
| "valid_targets_min": 767 |
| }, |
| { |
| "epoch": 4.008, |
| "grad_norm": 0.6426613600523003, |
| "learning_rate": 4.623401490270778e-06, |
| "loss": 0.4065, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.4202343821525574, |
| "step": 2505, |
| "valid_targets_mean": 3585.8, |
| "valid_targets_min": 631 |
| }, |
| { |
| "epoch": 4.016, |
| "grad_norm": 0.5585933431067611, |
| "learning_rate": 4.552201444560373e-06, |
| "loss": 0.4059, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.4154893457889557, |
| "step": 2510, |
| "valid_targets_mean": 4587.4, |
| "valid_targets_min": 834 |
| }, |
| { |
| "epoch": 4.024, |
| "grad_norm": 0.5849602135579992, |
| "learning_rate": 4.481483429428615e-06, |
| "loss": 0.4119, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3984353244304657, |
| "step": 2515, |
| "valid_targets_mean": 4275.1, |
| "valid_targets_min": 657 |
| }, |
| { |
| "epoch": 4.032, |
| "grad_norm": 0.5834357553067363, |
| "learning_rate": 4.4112496515488765e-06, |
| "loss": 0.4011, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3702242970466614, |
| "step": 2520, |
| "valid_targets_mean": 4599.9, |
| "valid_targets_min": 608 |
| }, |
| { |
| "epoch": 4.04, |
| "grad_norm": 0.7637639117096291, |
| "learning_rate": 4.341502302484472e-06, |
| "loss": 0.425, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.4776972532272339, |
| "step": 2525, |
| "valid_targets_mean": 2890.7, |
| "valid_targets_min": 695 |
| }, |
| { |
| "epoch": 4.048, |
| "grad_norm": 0.7468745784687151, |
| "learning_rate": 4.272243558620264e-06, |
| "loss": 0.4098, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.4523777961730957, |
| "step": 2530, |
| "valid_targets_mean": 2911.0, |
| "valid_targets_min": 333 |
| }, |
| { |
| "epoch": 4.056, |
| "grad_norm": 0.5802649714021575, |
| "learning_rate": 4.203475581094771e-06, |
| "loss": 0.4373, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.425601601600647, |
| "step": 2535, |
| "valid_targets_mean": 5046.2, |
| "valid_targets_min": 973 |
| }, |
| { |
| "epoch": 4.064, |
| "grad_norm": 0.5447288932891161, |
| "learning_rate": 4.135200515732716e-06, |
| "loss": 0.4005, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3529777526855469, |
| "step": 2540, |
| "valid_targets_mean": 4301.4, |
| "valid_targets_min": 653 |
| }, |
| { |
| "epoch": 4.072, |
| "grad_norm": 0.7333561005546733, |
| "learning_rate": 4.067420492978065e-06, |
| "loss": 0.406, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.4183364808559418, |
| "step": 2545, |
| "valid_targets_mean": 2979.5, |
| "valid_targets_min": 433 |
| }, |
| { |
| "epoch": 4.08, |
| "grad_norm": 0.8448397467709902, |
| "learning_rate": 4.000137627827554e-06, |
| "loss": 0.411, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.4083864092826843, |
| "step": 2550, |
| "valid_targets_mean": 1975.8, |
| "valid_targets_min": 737 |
| }, |
| { |
| "epoch": 4.088, |
| "grad_norm": 0.7039063639446964, |
| "learning_rate": 3.9333540197647035e-06, |
| "loss": 0.3973, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.42661112546920776, |
| "step": 2555, |
| "valid_targets_mean": 2891.6, |
| "valid_targets_min": 744 |
| }, |
| { |
| "epoch": 4.096, |
| "grad_norm": 0.6103368310567368, |
| "learning_rate": 3.867071752694282e-06, |
| "loss": 0.4136, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.39338967204093933, |
| "step": 2560, |
| "valid_targets_mean": 4202.1, |
| "valid_targets_min": 619 |
| }, |
| { |
| "epoch": 4.104, |
| "grad_norm": 0.5609255390428625, |
| "learning_rate": 3.8012928948773243e-06, |
| "loss": 0.4109, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3590124249458313, |
| "step": 2565, |
| "valid_targets_mean": 4673.2, |
| "valid_targets_min": 534 |
| }, |
| { |
| "epoch": 4.112, |
| "grad_norm": 0.7163062681286491, |
| "learning_rate": 3.7360194988665364e-06, |
| "loss": 0.4282, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.4255579113960266, |
| "step": 2570, |
| "valid_targets_mean": 2981.8, |
| "valid_targets_min": 753 |
| }, |
| { |
| "epoch": 4.12, |
| "grad_norm": 0.4784051484306757, |
| "learning_rate": 3.6712536014422885e-06, |
| "loss": 0.405, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.350371778011322, |
| "step": 2575, |
| "valid_targets_mean": 6456.9, |
| "valid_targets_min": 503 |
| }, |
| { |
| "epoch": 4.128, |
| "grad_norm": 0.5438453496849911, |
| "learning_rate": 3.606997223549049e-06, |
| "loss": 0.4131, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.4073692262172699, |
| "step": 2580, |
| "valid_targets_mean": 5279.0, |
| "valid_targets_min": 801 |
| }, |
| { |
| "epoch": 4.136, |
| "grad_norm": 0.5879969117381249, |
| "learning_rate": 3.543252370232313e-06, |
| "loss": 0.3969, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.4108046889305115, |
| "step": 2585, |
| "valid_targets_mean": 4720.8, |
| "valid_targets_min": 959 |
| }, |
| { |
| "epoch": 4.144, |
| "grad_norm": 0.5532047673911502, |
| "learning_rate": 3.4800210305760662e-06, |
| "loss": 0.4201, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.36657533049583435, |
| "step": 2590, |
| "valid_targets_mean": 4700.9, |
| "valid_targets_min": 601 |
| }, |
| { |
| "epoch": 4.152, |
| "grad_norm": 0.5901167864484412, |
| "learning_rate": 3.4173051776406817e-06, |
| "loss": 0.4184, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.4340725541114807, |
| "step": 2595, |
| "valid_targets_mean": 4326.9, |
| "valid_targets_min": 523 |
| }, |
| { |
| "epoch": 4.16, |
| "grad_norm": 0.5475674178491631, |
| "learning_rate": 3.3551067684013706e-06, |
| "loss": 0.4084, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3945809006690979, |
| "step": 2600, |
| "valid_targets_mean": 4706.6, |
| "valid_targets_min": 851 |
| }, |
| { |
| "epoch": 4.168, |
| "grad_norm": 0.5801898131217752, |
| "learning_rate": 3.2934277436871187e-06, |
| "loss": 0.3873, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3601340055465698, |
| "step": 2605, |
| "valid_targets_mean": 4189.4, |
| "valid_targets_min": 534 |
| }, |
| { |
| "epoch": 4.176, |
| "grad_norm": 0.7299558918948404, |
| "learning_rate": 3.232270028120121e-06, |
| "loss": 0.405, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.4364742338657379, |
| "step": 2610, |
| "valid_targets_mean": 2916.7, |
| "valid_targets_min": 703 |
| }, |
| { |
| "epoch": 4.184, |
| "grad_norm": 0.5996399283446768, |
| "learning_rate": 3.1716355300557256e-06, |
| "loss": 0.3937, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.4116308391094208, |
| "step": 2615, |
| "valid_targets_mean": 4109.5, |
| "valid_targets_min": 600 |
| }, |
| { |
| "epoch": 4.192, |
| "grad_norm": 0.5730701668848656, |
| "learning_rate": 3.111526141522896e-06, |
| "loss": 0.4212, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.41376417875289917, |
| "step": 2620, |
| "valid_targets_mean": 4810.4, |
| "valid_targets_min": 691 |
| }, |
| { |
| "epoch": 4.2, |
| "grad_norm": 0.5519404941783179, |
| "learning_rate": 3.0519437381651507e-06, |
| "loss": 0.4072, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.40336206555366516, |
| "step": 2625, |
| "valid_targets_mean": 4866.9, |
| "valid_targets_min": 749 |
| }, |
| { |
| "epoch": 4.208, |
| "grad_norm": 0.5067010081942247, |
| "learning_rate": 2.992890179182062e-06, |
| "loss": 0.3919, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.35615670680999756, |
| "step": 2630, |
| "valid_targets_mean": 5492.4, |
| "valid_targets_min": 631 |
| }, |
| { |
| "epoch": 4.216, |
| "grad_norm": 0.6359749406389089, |
| "learning_rate": 2.93436730727122e-06, |
| "loss": 0.4067, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.402889609336853, |
| "step": 2635, |
| "valid_targets_mean": 3929.4, |
| "valid_targets_min": 912 |
| }, |
| { |
| "epoch": 4.224, |
| "grad_norm": 0.6145949359641839, |
| "learning_rate": 2.8763769485707447e-06, |
| "loss": 0.3904, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.40841296315193176, |
| "step": 2640, |
| "valid_targets_mean": 4276.6, |
| "valid_targets_min": 799 |
| }, |
| { |
| "epoch": 4.232, |
| "grad_norm": 0.7110071687256778, |
| "learning_rate": 2.818920912602294e-06, |
| "loss": 0.405, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.4124786853790283, |
| "step": 2645, |
| "valid_targets_mean": 2939.0, |
| "valid_targets_min": 788 |
| }, |
| { |
| "epoch": 4.24, |
| "grad_norm": 0.5743817768129006, |
| "learning_rate": 2.762000992214626e-06, |
| "loss": 0.4164, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3974683880805969, |
| "step": 2650, |
| "valid_targets_mean": 4447.1, |
| "valid_targets_min": 511 |
| }, |
| { |
| "epoch": 4.248, |
| "grad_norm": 0.5413226643387624, |
| "learning_rate": 2.7056189635276162e-06, |
| "loss": 0.3864, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3866695463657379, |
| "step": 2655, |
| "valid_targets_mean": 5034.9, |
| "valid_targets_min": 677 |
| }, |
| { |
| "epoch": 4.256, |
| "grad_norm": 0.5726347506605515, |
| "learning_rate": 2.6497765858768643e-06, |
| "loss": 0.4024, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.42359739542007446, |
| "step": 2660, |
| "valid_targets_mean": 4637.1, |
| "valid_targets_min": 635 |
| }, |
| { |
| "epoch": 4.264, |
| "grad_norm": 0.4855797229728632, |
| "learning_rate": 2.594475601758786e-06, |
| "loss": 0.3905, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3630528748035431, |
| "step": 2665, |
| "valid_targets_mean": 5871.8, |
| "valid_targets_min": 845 |
| }, |
| { |
| "epoch": 4.272, |
| "grad_norm": 0.6421484551855371, |
| "learning_rate": 2.539717736776237e-06, |
| "loss": 0.3901, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.42318665981292725, |
| "step": 2670, |
| "valid_targets_mean": 4278.5, |
| "valid_targets_min": 624 |
| }, |
| { |
| "epoch": 4.28, |
| "grad_norm": 0.6235765181112626, |
| "learning_rate": 2.4855046995846844e-06, |
| "loss": 0.3848, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.4206055700778961, |
| "step": 2675, |
| "valid_targets_mean": 4279.4, |
| "valid_targets_min": 484 |
| }, |
| { |
| "epoch": 4.288, |
| "grad_norm": 0.5687422916455531, |
| "learning_rate": 2.431838181838868e-06, |
| "loss": 0.4003, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.38011544942855835, |
| "step": 2680, |
| "valid_targets_mean": 4600.6, |
| "valid_targets_min": 931 |
| }, |
| { |
| "epoch": 4.296, |
| "grad_norm": 0.5597281309268304, |
| "learning_rate": 2.3787198581400285e-06, |
| "loss": 0.409, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3837645649909973, |
| "step": 2685, |
| "valid_targets_mean": 4807.3, |
| "valid_targets_min": 852 |
| }, |
| { |
| "epoch": 4.304, |
| "grad_norm": 0.5208997470892812, |
| "learning_rate": 2.3261513859836437e-06, |
| "loss": 0.3891, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.36763709783554077, |
| "step": 2690, |
| "valid_targets_mean": 5476.7, |
| "valid_targets_min": 713 |
| }, |
| { |
| "epoch": 4.312, |
| "grad_norm": 0.729596593306008, |
| "learning_rate": 2.27413440570772e-06, |
| "loss": 0.4192, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.47866132855415344, |
| "step": 2695, |
| "valid_targets_mean": 3093.9, |
| "valid_targets_min": 779 |
| }, |
| { |
| "epoch": 4.32, |
| "grad_norm": 0.5963682532410031, |
| "learning_rate": 2.222670540441596e-06, |
| "loss": 0.3944, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.35257434844970703, |
| "step": 2700, |
| "valid_targets_mean": 5420.8, |
| "valid_targets_min": 776 |
| }, |
| { |
| "epoch": 4.328, |
| "grad_norm": 0.5229520235670004, |
| "learning_rate": 2.17176139605531e-06, |
| "loss": 0.4251, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3816877603530884, |
| "step": 2705, |
| "valid_targets_mean": 5403.9, |
| "valid_targets_min": 725 |
| }, |
| { |
| "epoch": 4.336, |
| "grad_norm": 0.6555810725268437, |
| "learning_rate": 2.121408561109466e-06, |
| "loss": 0.4173, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.38497596979141235, |
| "step": 2710, |
| "valid_targets_mean": 3670.6, |
| "valid_targets_min": 734 |
| }, |
| { |
| "epoch": 4.344, |
| "grad_norm": 0.5360008671439541, |
| "learning_rate": 2.071613606805696e-06, |
| "loss": 0.4179, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.4150103032588959, |
| "step": 2715, |
| "valid_targets_mean": 5754.9, |
| "valid_targets_min": 1023 |
| }, |
| { |
| "epoch": 4.352, |
| "grad_norm": 0.5212551398201117, |
| "learning_rate": 2.0223780869376018e-06, |
| "loss": 0.394, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.40325045585632324, |
| "step": 2720, |
| "valid_targets_mean": 5807.8, |
| "valid_targets_min": 691 |
| }, |
| { |
| "epoch": 4.36, |
| "grad_norm": 0.501570979642165, |
| "learning_rate": 1.9737035378422907e-06, |
| "loss": 0.3989, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.38142967224121094, |
| "step": 2725, |
| "valid_targets_mean": 5602.2, |
| "valid_targets_min": 696 |
| }, |
| { |
| "epoch": 4.368, |
| "grad_norm": 0.6586918366767852, |
| "learning_rate": 1.925591478352424e-06, |
| "loss": 0.3876, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3896998167037964, |
| "step": 2730, |
| "valid_targets_mean": 3427.3, |
| "valid_targets_min": 671 |
| }, |
| { |
| "epoch": 4.376, |
| "grad_norm": 0.5558539980698498, |
| "learning_rate": 1.8780434097488443e-06, |
| "loss": 0.4082, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.4040504992008209, |
| "step": 2735, |
| "valid_targets_mean": 4714.9, |
| "valid_targets_min": 695 |
| }, |
| { |
| "epoch": 4.384, |
| "grad_norm": 0.7867324950433691, |
| "learning_rate": 1.831060815713699e-06, |
| "loss": 0.4048, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.4829801917076111, |
| "step": 2740, |
| "valid_targets_mean": 2988.8, |
| "valid_targets_min": 288 |
| }, |
| { |
| "epoch": 4.392, |
| "grad_norm": 0.6214041417079301, |
| "learning_rate": 1.7846451622841643e-06, |
| "loss": 0.4194, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3955761194229126, |
| "step": 2745, |
| "valid_targets_mean": 3676.2, |
| "valid_targets_min": 489 |
| }, |
| { |
| "epoch": 4.4, |
| "grad_norm": 0.5561873136372868, |
| "learning_rate": 1.7387978978066988e-06, |
| "loss": 0.4089, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3890697956085205, |
| "step": 2750, |
| "valid_targets_mean": 5758.4, |
| "valid_targets_min": 882 |
| }, |
| { |
| "epoch": 4.408, |
| "grad_norm": 0.560721929365539, |
| "learning_rate": 1.6935204528918347e-06, |
| "loss": 0.3973, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.40641331672668457, |
| "step": 2755, |
| "valid_targets_mean": 5017.4, |
| "valid_targets_min": 521 |
| }, |
| { |
| "epoch": 4.416, |
| "grad_norm": 0.6889136427973638, |
| "learning_rate": 1.6488142403695651e-06, |
| "loss": 0.4157, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.4421613812446594, |
| "step": 2760, |
| "valid_targets_mean": 3295.3, |
| "valid_targets_min": 709 |
| }, |
| { |
| "epoch": 4.424, |
| "grad_norm": 0.7902577945988017, |
| "learning_rate": 1.6046806552452254e-06, |
| "loss": 0.4283, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.4924136698246002, |
| "step": 2765, |
| "valid_targets_mean": 3308.9, |
| "valid_targets_min": 751 |
| }, |
| { |
| "epoch": 4.432, |
| "grad_norm": 0.6844284345573052, |
| "learning_rate": 1.5611210746559868e-06, |
| "loss": 0.3938, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.40334612131118774, |
| "step": 2770, |
| "valid_targets_mean": 3122.0, |
| "valid_targets_min": 583 |
| }, |
| { |
| "epoch": 4.44, |
| "grad_norm": 0.6162273196275045, |
| "learning_rate": 1.5181368578278744e-06, |
| "loss": 0.4041, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.35837671160697937, |
| "step": 2775, |
| "valid_targets_mean": 3665.4, |
| "valid_targets_min": 718 |
| }, |
| { |
| "epoch": 4.448, |
| "grad_norm": 0.5974789854549655, |
| "learning_rate": 1.4757293460333566e-06, |
| "loss": 0.4308, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.4109255075454712, |
| "step": 2780, |
| "valid_targets_mean": 4179.9, |
| "valid_targets_min": 793 |
| }, |
| { |
| "epoch": 4.456, |
| "grad_norm": 0.5708600383249177, |
| "learning_rate": 1.4338998625494905e-06, |
| "loss": 0.4075, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3754119277000427, |
| "step": 2785, |
| "valid_targets_mean": 4436.0, |
| "valid_targets_min": 773 |
| }, |
| { |
| "epoch": 4.464, |
| "grad_norm": 0.6313362954432985, |
| "learning_rate": 1.3926497126166405e-06, |
| "loss": 0.4204, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.41806894540786743, |
| "step": 2790, |
| "valid_targets_mean": 4132.2, |
| "valid_targets_min": 624 |
| }, |
| { |
| "epoch": 4.4719999999999995, |
| "grad_norm": 0.5994471438843727, |
| "learning_rate": 1.3519801833977298e-06, |
| "loss": 0.4271, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.43274080753326416, |
| "step": 2795, |
| "valid_targets_mean": 4554.3, |
| "valid_targets_min": 371 |
| }, |
| { |
| "epoch": 4.48, |
| "grad_norm": 0.5410383078069514, |
| "learning_rate": 1.3118925439381003e-06, |
| "loss": 0.4073, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.35545891523361206, |
| "step": 2800, |
| "valid_targets_mean": 5008.1, |
| "valid_targets_min": 563 |
| }, |
| { |
| "epoch": 4.4879999999999995, |
| "grad_norm": 0.7142880244968844, |
| "learning_rate": 1.2723880451258918e-06, |
| "loss": 0.4072, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.4319564998149872, |
| "step": 2805, |
| "valid_targets_mean": 3327.8, |
| "valid_targets_min": 717 |
| }, |
| { |
| "epoch": 4.496, |
| "grad_norm": 0.5901784201564468, |
| "learning_rate": 1.2334679196530219e-06, |
| "loss": 0.4332, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.42878252267837524, |
| "step": 2810, |
| "valid_targets_mean": 4661.2, |
| "valid_targets_min": 669 |
| }, |
| { |
| "epoch": 4.504, |
| "grad_norm": 0.5840631068232639, |
| "learning_rate": 1.1951333819767163e-06, |
| "loss": 0.4096, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.392315149307251, |
| "step": 2815, |
| "valid_targets_mean": 4338.4, |
| "valid_targets_min": 823 |
| }, |
| { |
| "epoch": 4.5120000000000005, |
| "grad_norm": 0.9670608326476431, |
| "learning_rate": 1.157385628281622e-06, |
| "loss": 0.4121, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.409821093082428, |
| "step": 2820, |
| "valid_targets_mean": 2009.2, |
| "valid_targets_min": 725 |
| }, |
| { |
| "epoch": 4.52, |
| "grad_norm": 0.6605390936042161, |
| "learning_rate": 1.1202258364424633e-06, |
| "loss": 0.4025, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.41265183687210083, |
| "step": 2825, |
| "valid_targets_mean": 3653.6, |
| "valid_targets_min": 676 |
| }, |
| { |
| "epoch": 4.5280000000000005, |
| "grad_norm": 0.512314838581097, |
| "learning_rate": 1.0836551659873073e-06, |
| "loss": 0.4052, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3962034583091736, |
| "step": 2830, |
| "valid_targets_mean": 5787.9, |
| "valid_targets_min": 930 |
| }, |
| { |
| "epoch": 4.536, |
| "grad_norm": 0.5526075598864743, |
| "learning_rate": 1.0476747580613723e-06, |
| "loss": 0.4239, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.37799936532974243, |
| "step": 2835, |
| "valid_targets_mean": 4742.4, |
| "valid_targets_min": 616 |
| }, |
| { |
| "epoch": 4.5440000000000005, |
| "grad_norm": 0.5423110924774888, |
| "learning_rate": 1.012285735391416e-06, |
| "loss": 0.4318, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.41332849860191345, |
| "step": 2840, |
| "valid_targets_mean": 5307.6, |
| "valid_targets_min": 598 |
| }, |
| { |
| "epoch": 4.552, |
| "grad_norm": 0.611737571874644, |
| "learning_rate": 9.774892022507166e-07, |
| "loss": 0.4062, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3971940875053406, |
| "step": 2845, |
| "valid_targets_mean": 4247.7, |
| "valid_targets_min": 771 |
| }, |
| { |
| "epoch": 4.5600000000000005, |
| "grad_norm": 0.7135757278290046, |
| "learning_rate": 9.432862444245994e-07, |
| "loss": 0.4359, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.41892296075820923, |
| "step": 2850, |
| "valid_targets_mean": 3975.4, |
| "valid_targets_min": 789 |
| }, |
| { |
| "epoch": 4.568, |
| "grad_norm": 0.7473593705860603, |
| "learning_rate": 9.096779291765667e-07, |
| "loss": 0.4205, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.4587504267692566, |
| "step": 2855, |
| "valid_targets_mean": 2893.6, |
| "valid_targets_min": 813 |
| }, |
| { |
| "epoch": 4.576, |
| "grad_norm": 0.6873974964018028, |
| "learning_rate": 8.766653052149831e-07, |
| "loss": 0.4326, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.44257092475891113, |
| "step": 2860, |
| "valid_targets_mean": 3811.4, |
| "valid_targets_min": 924 |
| }, |
| { |
| "epoch": 4.584, |
| "grad_norm": 0.7683330781359213, |
| "learning_rate": 8.442494026603709e-07, |
| "loss": 0.4131, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.44089746475219727, |
| "step": 2865, |
| "valid_targets_mean": 3014.2, |
| "valid_targets_min": 687 |
| }, |
| { |
| "epoch": 4.592, |
| "grad_norm": 0.5846368499398767, |
| "learning_rate": 8.124312330132423e-07, |
| "loss": 0.3811, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3351588845252991, |
| "step": 2870, |
| "valid_targets_mean": 3851.7, |
| "valid_targets_min": 677 |
| }, |
| { |
| "epoch": 4.6, |
| "grad_norm": 0.5968786949619281, |
| "learning_rate": 7.812117891225667e-07, |
| "loss": 0.405, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3558521866798401, |
| "step": 2875, |
| "valid_targets_mean": 3713.2, |
| "valid_targets_min": 783 |
| }, |
| { |
| "epoch": 4.608, |
| "grad_norm": 0.6212588253374268, |
| "learning_rate": 7.505920451547544e-07, |
| "loss": 0.4055, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3719406723976135, |
| "step": 2880, |
| "valid_targets_mean": 3888.3, |
| "valid_targets_min": 516 |
| }, |
| { |
| "epoch": 4.616, |
| "grad_norm": 0.8263222292237222, |
| "learning_rate": 7.205729565632947e-07, |
| "loss": 0.4107, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.415608674287796, |
| "step": 2885, |
| "valid_targets_mean": 2358.3, |
| "valid_targets_min": 738 |
| }, |
| { |
| "epoch": 4.624, |
| "grad_norm": 1.2742274611700906, |
| "learning_rate": 6.911554600589121e-07, |
| "loss": 0.4135, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3934563398361206, |
| "step": 2890, |
| "valid_targets_mean": 4383.9, |
| "valid_targets_min": 621 |
| }, |
| { |
| "epoch": 4.632, |
| "grad_norm": 0.7165845833648357, |
| "learning_rate": 6.62340473580354e-07, |
| "loss": 0.422, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.46797922253608704, |
| "step": 2895, |
| "valid_targets_mean": 3301.2, |
| "valid_targets_min": 779 |
| }, |
| { |
| "epoch": 4.64, |
| "grad_norm": 0.5652440899945861, |
| "learning_rate": 6.341288962657422e-07, |
| "loss": 0.4163, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.4029410779476166, |
| "step": 2900, |
| "valid_targets_mean": 4548.8, |
| "valid_targets_min": 447 |
| }, |
| { |
| "epoch": 4.648, |
| "grad_norm": 0.6700159540879693, |
| "learning_rate": 6.06521608424524e-07, |
| "loss": 0.4329, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.4570663273334503, |
| "step": 2905, |
| "valid_targets_mean": 4093.9, |
| "valid_targets_min": 597 |
| }, |
| { |
| "epoch": 4.656, |
| "grad_norm": 0.6045546990414774, |
| "learning_rate": 5.795194715099905e-07, |
| "loss": 0.3856, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.4214397966861725, |
| "step": 2910, |
| "valid_targets_mean": 5777.8, |
| "valid_targets_min": 940 |
| }, |
| { |
| "epoch": 4.664, |
| "grad_norm": 0.5952012215364537, |
| "learning_rate": 5.531233280924042e-07, |
| "loss": 0.4219, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3828292787075043, |
| "step": 2915, |
| "valid_targets_mean": 4322.4, |
| "valid_targets_min": 615 |
| }, |
| { |
| "epoch": 4.672, |
| "grad_norm": 0.6450876587783286, |
| "learning_rate": 5.273340018327044e-07, |
| "loss": 0.4067, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.4427468776702881, |
| "step": 2920, |
| "valid_targets_mean": 3636.7, |
| "valid_targets_min": 686 |
| }, |
| { |
| "epoch": 4.68, |
| "grad_norm": 0.8489893578004784, |
| "learning_rate": 5.02152297456806e-07, |
| "loss": 0.4044, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.44238054752349854, |
| "step": 2925, |
| "valid_targets_mean": 2258.9, |
| "valid_targets_min": 535 |
| }, |
| { |
| "epoch": 4.688, |
| "grad_norm": 0.7104670754151398, |
| "learning_rate": 4.775790007304993e-07, |
| "loss": 0.4145, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.43017131090164185, |
| "step": 2930, |
| "valid_targets_mean": 3351.2, |
| "valid_targets_min": 573 |
| }, |
| { |
| "epoch": 4.696, |
| "grad_norm": 0.6357385020238071, |
| "learning_rate": 4.5361487843490924e-07, |
| "loss": 0.4049, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.4254443347454071, |
| "step": 2935, |
| "valid_targets_mean": 4101.7, |
| "valid_targets_min": 683 |
| }, |
| { |
| "epoch": 4.704, |
| "grad_norm": 0.5732449316192012, |
| "learning_rate": 4.3026067834258667e-07, |
| "loss": 0.4204, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.4033844470977783, |
| "step": 2940, |
| "valid_targets_mean": 4472.9, |
| "valid_targets_min": 540 |
| }, |
| { |
| "epoch": 4.712, |
| "grad_norm": 0.48553171918656174, |
| "learning_rate": 4.0751712919417484e-07, |
| "loss": 0.3781, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3926544785499573, |
| "step": 2945, |
| "valid_targets_mean": 6882.5, |
| "valid_targets_min": 682 |
| }, |
| { |
| "epoch": 4.72, |
| "grad_norm": 0.6821340139530365, |
| "learning_rate": 3.853849406756549e-07, |
| "loss": 0.4099, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.42946845293045044, |
| "step": 2950, |
| "valid_targets_mean": 3391.1, |
| "valid_targets_min": 373 |
| }, |
| { |
| "epoch": 4.728, |
| "grad_norm": 0.6654823260184427, |
| "learning_rate": 3.6386480339621886e-07, |
| "loss": 0.3988, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.39326146245002747, |
| "step": 2955, |
| "valid_targets_mean": 3489.5, |
| "valid_targets_min": 652 |
| }, |
| { |
| "epoch": 4.736, |
| "grad_norm": 0.6083477077382592, |
| "learning_rate": 3.4295738886670925e-07, |
| "loss": 0.4034, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3781413435935974, |
| "step": 2960, |
| "valid_targets_mean": 4359.6, |
| "valid_targets_min": 617 |
| }, |
| { |
| "epoch": 4.744, |
| "grad_norm": 0.6597022939202071, |
| "learning_rate": 3.226633494786668e-07, |
| "loss": 0.3878, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3716740012168884, |
| "step": 2965, |
| "valid_targets_mean": 3212.9, |
| "valid_targets_min": 729 |
| }, |
| { |
| "epoch": 4.752, |
| "grad_norm": 0.8113317008052021, |
| "learning_rate": 3.0298331848398033e-07, |
| "loss": 0.4039, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.4363306760787964, |
| "step": 2970, |
| "valid_targets_mean": 3148.3, |
| "valid_targets_min": 715 |
| }, |
| { |
| "epoch": 4.76, |
| "grad_norm": 0.6243007406816568, |
| "learning_rate": 2.839179099751133e-07, |
| "loss": 0.4149, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.4543706178665161, |
| "step": 2975, |
| "valid_targets_mean": 4166.6, |
| "valid_targets_min": 866 |
| }, |
| { |
| "epoch": 4.768, |
| "grad_norm": 0.6224022376593623, |
| "learning_rate": 2.654677188659549e-07, |
| "loss": 0.4168, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.451460063457489, |
| "step": 2980, |
| "valid_targets_mean": 4207.4, |
| "valid_targets_min": 748 |
| }, |
| { |
| "epoch": 4.776, |
| "grad_norm": 0.5374144174742845, |
| "learning_rate": 2.476333208732462e-07, |
| "loss": 0.4053, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.42308709025382996, |
| "step": 2985, |
| "valid_targets_mean": 6995.9, |
| "valid_targets_min": 780 |
| }, |
| { |
| "epoch": 4.784, |
| "grad_norm": 0.6285382216596294, |
| "learning_rate": 2.3041527249863193e-07, |
| "loss": 0.4221, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.42085695266723633, |
| "step": 2990, |
| "valid_targets_mean": 3705.4, |
| "valid_targets_min": 915 |
| }, |
| { |
| "epoch": 4.792, |
| "grad_norm": 0.6313424923207209, |
| "learning_rate": 2.1381411101127013e-07, |
| "loss": 0.4242, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.4452266991138458, |
| "step": 2995, |
| "valid_targets_mean": 4179.6, |
| "valid_targets_min": 654 |
| }, |
| { |
| "epoch": 4.8, |
| "grad_norm": 0.5405302367882336, |
| "learning_rate": 1.9783035443108999e-07, |
| "loss": 0.3761, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3892124891281128, |
| "step": 3000, |
| "valid_targets_mean": 4694.6, |
| "valid_targets_min": 726 |
| }, |
| { |
| "epoch": 4.808, |
| "grad_norm": 0.6499699005097503, |
| "learning_rate": 1.8246450151261362e-07, |
| "loss": 0.4126, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.46307098865509033, |
| "step": 3005, |
| "valid_targets_mean": 4108.7, |
| "valid_targets_min": 734 |
| }, |
| { |
| "epoch": 4.816, |
| "grad_norm": 0.6639498536382377, |
| "learning_rate": 1.6771703172940635e-07, |
| "loss": 0.3848, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.44725149869918823, |
| "step": 3010, |
| "valid_targets_mean": 3558.9, |
| "valid_targets_min": 663 |
| }, |
| { |
| "epoch": 4.824, |
| "grad_norm": 0.549526064647749, |
| "learning_rate": 1.5358840525909967e-07, |
| "loss": 0.3986, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.4009050130844116, |
| "step": 3015, |
| "valid_targets_mean": 4778.8, |
| "valid_targets_min": 671 |
| }, |
| { |
| "epoch": 4.832, |
| "grad_norm": 0.7167556183864082, |
| "learning_rate": 1.4007906296904072e-07, |
| "loss": 0.3943, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.43567198514938354, |
| "step": 3020, |
| "valid_targets_mean": 3120.4, |
| "valid_targets_min": 547 |
| }, |
| { |
| "epoch": 4.84, |
| "grad_norm": 0.7952417316247405, |
| "learning_rate": 1.2718942640254084e-07, |
| "loss": 0.4024, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.4332461953163147, |
| "step": 3025, |
| "valid_targets_mean": 2783.6, |
| "valid_targets_min": 646 |
| }, |
| { |
| "epoch": 4.848, |
| "grad_norm": 0.5604252297788266, |
| "learning_rate": 1.1491989776570623e-07, |
| "loss": 0.4079, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3904341757297516, |
| "step": 3030, |
| "valid_targets_mean": 4534.9, |
| "valid_targets_min": 864 |
| }, |
| { |
| "epoch": 4.856, |
| "grad_norm": 0.6858298477952322, |
| "learning_rate": 1.0327085991490127e-07, |
| "loss": 0.4213, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.4092717170715332, |
| "step": 3035, |
| "valid_targets_mean": 3204.4, |
| "valid_targets_min": 509 |
| }, |
| { |
| "epoch": 4.864, |
| "grad_norm": 0.6401379988844095, |
| "learning_rate": 9.22426763447981e-08, |
| "loss": 0.4118, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.41920021176338196, |
| "step": 3040, |
| "valid_targets_mean": 3930.8, |
| "valid_targets_min": 643 |
| }, |
| { |
| "epoch": 4.872, |
| "grad_norm": 0.5334024885638476, |
| "learning_rate": 8.183569117703461e-08, |
| "loss": 0.3955, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3883068263530731, |
| "step": 3045, |
| "valid_targets_mean": 5270.0, |
| "valid_targets_min": 816 |
| }, |
| { |
| "epoch": 4.88, |
| "grad_norm": 0.5549772986705793, |
| "learning_rate": 7.205022914946957e-08, |
| "loss": 0.4232, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.38646113872528076, |
| "step": 3050, |
| "valid_targets_mean": 4886.3, |
| "valid_targets_min": 707 |
| }, |
| { |
| "epoch": 4.888, |
| "grad_norm": 0.5767956457076785, |
| "learning_rate": 6.288659560606203e-08, |
| "loss": 0.4086, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3830558657646179, |
| "step": 3055, |
| "valid_targets_mean": 4712.8, |
| "valid_targets_min": 727 |
| }, |
| { |
| "epoch": 4.896, |
| "grad_norm": 0.5988889732664718, |
| "learning_rate": 5.4345076487332114e-08, |
| "loss": 0.3863, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.4035729169845581, |
| "step": 3060, |
| "valid_targets_mean": 4299.6, |
| "valid_targets_min": 763 |
| }, |
| { |
| "epoch": 4.904, |
| "grad_norm": 0.5205741542745066, |
| "learning_rate": 4.642593832144382e-08, |
| "loss": 0.4224, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.36331793665885925, |
| "step": 3065, |
| "valid_targets_mean": 4843.8, |
| "valid_targets_min": 939 |
| }, |
| { |
| "epoch": 4.912, |
| "grad_norm": 0.6165591241445428, |
| "learning_rate": 3.912942821589161e-08, |
| "loss": 0.3843, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3959740400314331, |
| "step": 3070, |
| "valid_targets_mean": 4223.8, |
| "valid_targets_min": 912 |
| }, |
| { |
| "epoch": 4.92, |
| "grad_norm": 0.6355765004228577, |
| "learning_rate": 3.2455773849779935e-08, |
| "loss": 0.4104, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.42105889320373535, |
| "step": 3075, |
| "valid_targets_mean": 3869.8, |
| "valid_targets_min": 743 |
| }, |
| { |
| "epoch": 4.928, |
| "grad_norm": 0.7183753779829565, |
| "learning_rate": 2.6405183466731154e-08, |
| "loss": 0.4293, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.46973997354507446, |
| "step": 3080, |
| "valid_targets_mean": 3456.1, |
| "valid_targets_min": 903 |
| }, |
| { |
| "epoch": 4.936, |
| "grad_norm": 0.665925414774037, |
| "learning_rate": 2.0977845868375145e-08, |
| "loss": 0.4192, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.4395608603954315, |
| "step": 3085, |
| "valid_targets_mean": 3503.2, |
| "valid_targets_min": 615 |
| }, |
| { |
| "epoch": 4.944, |
| "grad_norm": 0.6663253811911488, |
| "learning_rate": 1.6173930408467376e-08, |
| "loss": 0.4184, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.4220019578933716, |
| "step": 3090, |
| "valid_targets_mean": 3666.4, |
| "valid_targets_min": 663 |
| }, |
| { |
| "epoch": 4.952, |
| "grad_norm": 0.628895057963846, |
| "learning_rate": 1.199358698759978e-08, |
| "loss": 0.3879, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3834680914878845, |
| "step": 3095, |
| "valid_targets_mean": 3802.9, |
| "valid_targets_min": 468 |
| }, |
| { |
| "epoch": 4.96, |
| "grad_norm": 0.6447997763250441, |
| "learning_rate": 8.436946048522298e-09, |
| "loss": 0.4109, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.4318605065345764, |
| "step": 3100, |
| "valid_targets_mean": 3820.8, |
| "valid_targets_min": 568 |
| }, |
| { |
| "epoch": 4.968, |
| "grad_norm": 0.4941475635121412, |
| "learning_rate": 5.504118572081662e-09, |
| "loss": 0.3983, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3983478844165802, |
| "step": 3105, |
| "valid_targets_mean": 6376.6, |
| "valid_targets_min": 924 |
| }, |
| { |
| "epoch": 4.976, |
| "grad_norm": 0.6289386884950056, |
| "learning_rate": 3.1951960737419686e-09, |
| "loss": 0.4222, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.4331316351890564, |
| "step": 3110, |
| "valid_targets_mean": 4068.7, |
| "valid_targets_min": 763 |
| }, |
| { |
| "epoch": 4.984, |
| "grad_norm": 0.9118066646290699, |
| "learning_rate": 1.5102506007447227e-09, |
| "loss": 0.3988, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.4566645622253418, |
| "step": 3115, |
| "valid_targets_mean": 2408.6, |
| "valid_targets_min": 734 |
| }, |
| { |
| "epoch": 4.992, |
| "grad_norm": 0.5570389322501734, |
| "learning_rate": 4.493347298528683e-10, |
| "loss": 0.4032, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3776412904262543, |
| "step": 3120, |
| "valid_targets_mean": 4442.2, |
| "valid_targets_min": 657 |
| }, |
| { |
| "epoch": 5.0, |
| "grad_norm": 0.6109238323745433, |
| "learning_rate": 1.248156571209691e-11, |
| "loss": 0.3841, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.37494388222694397, |
| "step": 3125, |
| "valid_targets_mean": 3849.6, |
| "valid_targets_min": 730 |
| }, |
| { |
| "epoch": 5.0, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.37494388222694397, |
| "step": 3125, |
| "total_flos": 883823926247424.0, |
| "train_loss": 0.468077876701355, |
| "train_runtime": 22577.6779, |
| "train_samples_per_second": 2.212, |
| "train_steps_per_second": 0.138, |
| "valid_targets_mean": 3849.6, |
| "valid_targets_min": 730 |
| } |
| ], |
| "logging_steps": 5, |
| "max_steps": 3125, |
| "num_input_tokens_seen": 0, |
| "num_train_epochs": 5, |
| "save_steps": 500, |
| "stateful_callbacks": { |
| "TrainerControl": { |
| "args": { |
| "should_epoch_stop": false, |
| "should_evaluate": false, |
| "should_log": false, |
| "should_save": false, |
| "should_training_stop": false |
| }, |
| "attributes": {} |
| } |
| }, |
| "total_flos": 883823926247424.0, |
| "train_batch_size": 1, |
| "trial_name": null, |
| "trial_params": null |
| } |
|
|