neginr commited on
Commit
fdbe797
·
verified ·
1 Parent(s): d380748

Training in progress, epoch 3

Browse files
model-00001-of-00004.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:1391b345ded08ee6dc7c825d87892ba006b33bb1ed96630a90a5359204e5ab32
3
  size 4877660776
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:3986f0b0d935e713823a02fb38365846bed08a78e9e05d9d04ac3ec78fd7f2f5
3
  size 4877660776
model-00002-of-00004.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:40b558538b862eaab0eda4043cf212b2a6ba8ea325976d80ceabd4f1d714ce6d
3
  size 4932751008
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:06cba1a07fd98048a0fbdbf41fe510aa8aef407d0e4c6284490a6a842f5585ef
3
  size 4932751008
model-00003-of-00004.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:1fa98be9ea44a7f3c90832ae17608d2da6c5c6eb1f734681a3e01de8030fc420
3
  size 4330865200
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0c692a5b3c051e0866e5874071e62e64b6933de067735170162f5773202e2a7a
3
  size 4330865200
model-00004-of-00004.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:e218413b9cf864471edbf4efb209c0f35b55097be1b8282f1dcf17dd16d8569e
3
  size 1089994880
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ed8965fb198a58c93104190f49a57f01452048366beee83735e9c30a641f9f4f
3
  size 1089994880
trainer_log.jsonl CHANGED
@@ -741,3 +741,249 @@
741
  {"current_steps": 741, "total_steps": 1230, "loss": 0.2885, "lr": 1.6359475191103958e-05, "epoch": 3.0076026355803345, "percentage": 60.24, "elapsed_time": "9:07:23", "remaining_time": "6:01:14"}
742
  {"current_steps": 742, "total_steps": 1230, "loss": 0.2907, "lr": 1.6303679480270466e-05, "epoch": 3.011657374556513, "percentage": 60.33, "elapsed_time": "9:08:06", "remaining_time": "6:00:28"}
743
  {"current_steps": 743, "total_steps": 1230, "loss": 0.2906, "lr": 1.624791353909428e-05, "epoch": 3.0157121135326914, "percentage": 60.41, "elapsed_time": "9:08:47", "remaining_time": "5:59:42"}
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
741
  {"current_steps": 741, "total_steps": 1230, "loss": 0.2885, "lr": 1.6359475191103958e-05, "epoch": 3.0076026355803345, "percentage": 60.24, "elapsed_time": "9:07:23", "remaining_time": "6:01:14"}
742
  {"current_steps": 742, "total_steps": 1230, "loss": 0.2907, "lr": 1.6303679480270466e-05, "epoch": 3.011657374556513, "percentage": 60.33, "elapsed_time": "9:08:06", "remaining_time": "6:00:28"}
743
  {"current_steps": 743, "total_steps": 1230, "loss": 0.2906, "lr": 1.624791353909428e-05, "epoch": 3.0157121135326914, "percentage": 60.41, "elapsed_time": "9:08:47", "remaining_time": "5:59:42"}
744
+ {"current_steps": 744, "total_steps": 1230, "loss": 0.2822, "lr": 1.619217781670663e-05, "epoch": 3.01976685250887, "percentage": 60.49, "elapsed_time": "9:09:30", "remaining_time": "5:58:57"}
745
+ {"current_steps": 745, "total_steps": 1230, "loss": 0.2958, "lr": 1.6136472761995373e-05, "epoch": 3.0238215914850484, "percentage": 60.57, "elapsed_time": "9:10:16", "remaining_time": "5:58:13"}
746
+ {"current_steps": 746, "total_steps": 1230, "loss": 0.3039, "lr": 1.608079882360134e-05, "epoch": 3.0278763304612264, "percentage": 60.65, "elapsed_time": "9:10:57", "remaining_time": "5:57:27"}
747
+ {"current_steps": 747, "total_steps": 1230, "loss": 0.2845, "lr": 1.60251564499148e-05, "epoch": 3.031931069437405, "percentage": 60.73, "elapsed_time": "9:11:43", "remaining_time": "5:56:44"}
748
+ {"current_steps": 748, "total_steps": 1230, "loss": 0.2799, "lr": 1.596954608907176e-05, "epoch": 3.0359858084135833, "percentage": 60.81, "elapsed_time": "9:12:28", "remaining_time": "5:56:00"}
749
+ {"current_steps": 749, "total_steps": 1230, "loss": 0.2868, "lr": 1.591396818895043e-05, "epoch": 3.040040547389762, "percentage": 60.89, "elapsed_time": "9:13:12", "remaining_time": "5:55:16"}
750
+ {"current_steps": 750, "total_steps": 1230, "loss": 0.283, "lr": 1.585842319716759e-05, "epoch": 3.0440952863659403, "percentage": 60.98, "elapsed_time": "9:13:57", "remaining_time": "5:54:32"}
751
+ {"current_steps": 751, "total_steps": 1230, "loss": 0.2952, "lr": 1.5802911561074944e-05, "epoch": 3.0481500253421188, "percentage": 61.06, "elapsed_time": "9:14:41", "remaining_time": "5:53:47"}
752
+ {"current_steps": 752, "total_steps": 1230, "loss": 0.294, "lr": 1.5747433727755595e-05, "epoch": 3.052204764318297, "percentage": 61.14, "elapsed_time": "9:15:25", "remaining_time": "5:53:02"}
753
+ {"current_steps": 753, "total_steps": 1230, "loss": 0.2852, "lr": 1.5691990144020376e-05, "epoch": 3.0562595032944753, "percentage": 61.22, "elapsed_time": "9:16:05", "remaining_time": "5:52:15"}
754
+ {"current_steps": 754, "total_steps": 1230, "loss": 0.28, "lr": 1.5636581256404297e-05, "epoch": 3.0603142422706537, "percentage": 61.3, "elapsed_time": "9:16:50", "remaining_time": "5:51:32"}
755
+ {"current_steps": 755, "total_steps": 1230, "loss": 0.2779, "lr": 1.558120751116291e-05, "epoch": 3.064368981246832, "percentage": 61.38, "elapsed_time": "9:17:34", "remaining_time": "5:50:47"}
756
+ {"current_steps": 756, "total_steps": 1230, "loss": 0.2952, "lr": 1.552586935426876e-05, "epoch": 3.0684237202230107, "percentage": 61.46, "elapsed_time": "9:18:18", "remaining_time": "5:50:03"}
757
+ {"current_steps": 757, "total_steps": 1230, "loss": 0.3004, "lr": 1.547056723140774e-05, "epoch": 3.072478459199189, "percentage": 61.54, "elapsed_time": "9:19:01", "remaining_time": "5:49:17"}
758
+ {"current_steps": 758, "total_steps": 1230, "loss": 0.2862, "lr": 1.5415301587975565e-05, "epoch": 3.0765331981753676, "percentage": 61.63, "elapsed_time": "9:19:44", "remaining_time": "5:48:32"}
759
+ {"current_steps": 759, "total_steps": 1230, "loss": 0.2935, "lr": 1.536007286907411e-05, "epoch": 3.0805879371515457, "percentage": 61.71, "elapsed_time": "9:20:27", "remaining_time": "5:47:47"}
760
+ {"current_steps": 760, "total_steps": 1230, "loss": 0.2898, "lr": 1.5304881519507896e-05, "epoch": 3.084642676127724, "percentage": 61.79, "elapsed_time": "9:21:11", "remaining_time": "5:47:02"}
761
+ {"current_steps": 761, "total_steps": 1230, "loss": 0.292, "lr": 1.5249727983780453e-05, "epoch": 3.0886974151039026, "percentage": 61.87, "elapsed_time": "9:21:55", "remaining_time": "5:46:18"}
762
+ {"current_steps": 762, "total_steps": 1230, "loss": 0.2862, "lr": 1.5194612706090786e-05, "epoch": 3.092752154080081, "percentage": 61.95, "elapsed_time": "9:22:39", "remaining_time": "5:45:34"}
763
+ {"current_steps": 763, "total_steps": 1230, "loss": 0.2859, "lr": 1.5139536130329771e-05, "epoch": 3.0968068930562596, "percentage": 62.03, "elapsed_time": "9:23:24", "remaining_time": "5:44:50"}
764
+ {"current_steps": 764, "total_steps": 1230, "loss": 0.2916, "lr": 1.508449870007656e-05, "epoch": 3.100861632032438, "percentage": 62.11, "elapsed_time": "9:24:10", "remaining_time": "5:44:07"}
765
+ {"current_steps": 765, "total_steps": 1230, "loss": 0.2877, "lr": 1.5029500858595056e-05, "epoch": 3.1049163710086165, "percentage": 62.2, "elapsed_time": "9:24:55", "remaining_time": "5:43:22"}
766
+ {"current_steps": 766, "total_steps": 1230, "loss": 0.2877, "lr": 1.4974543048830328e-05, "epoch": 3.1089711099847945, "percentage": 62.28, "elapsed_time": "9:25:39", "remaining_time": "5:42:38"}
767
+ {"current_steps": 767, "total_steps": 1230, "loss": 0.2828, "lr": 1.4919625713405e-05, "epoch": 3.113025848960973, "percentage": 62.36, "elapsed_time": "9:26:25", "remaining_time": "5:41:55"}
768
+ {"current_steps": 768, "total_steps": 1230, "loss": 0.2884, "lr": 1.4864749294615756e-05, "epoch": 3.1170805879371515, "percentage": 62.44, "elapsed_time": "9:27:06", "remaining_time": "5:41:09"}
769
+ {"current_steps": 769, "total_steps": 1230, "loss": 0.292, "lr": 1.4809914234429716e-05, "epoch": 3.12113532691333, "percentage": 62.52, "elapsed_time": "9:27:49", "remaining_time": "5:40:24"}
770
+ {"current_steps": 770, "total_steps": 1230, "loss": 0.3002, "lr": 1.4755120974480923e-05, "epoch": 3.1251900658895084, "percentage": 62.6, "elapsed_time": "9:28:33", "remaining_time": "5:39:39"}
771
+ {"current_steps": 771, "total_steps": 1230, "loss": 0.2858, "lr": 1.4700369956066771e-05, "epoch": 3.129244804865687, "percentage": 62.68, "elapsed_time": "9:29:15", "remaining_time": "5:38:53"}
772
+ {"current_steps": 772, "total_steps": 1230, "loss": 0.2827, "lr": 1.4645661620144413e-05, "epoch": 3.1332995438418654, "percentage": 62.76, "elapsed_time": "9:29:57", "remaining_time": "5:38:08"}
773
+ {"current_steps": 773, "total_steps": 1230, "loss": 0.2937, "lr": 1.4590996407327284e-05, "epoch": 3.1373542828180434, "percentage": 62.85, "elapsed_time": "9:30:42", "remaining_time": "5:37:24"}
774
+ {"current_steps": 774, "total_steps": 1230, "loss": 0.2855, "lr": 1.4536374757881487e-05, "epoch": 3.141409021794222, "percentage": 62.93, "elapsed_time": "9:31:26", "remaining_time": "5:36:39"}
775
+ {"current_steps": 775, "total_steps": 1230, "loss": 0.2725, "lr": 1.4481797111722271e-05, "epoch": 3.1454637607704004, "percentage": 63.01, "elapsed_time": "9:32:12", "remaining_time": "5:35:56"}
776
+ {"current_steps": 776, "total_steps": 1230, "loss": 0.2916, "lr": 1.4427263908410507e-05, "epoch": 3.149518499746579, "percentage": 63.09, "elapsed_time": "9:32:56", "remaining_time": "5:35:12"}
777
+ {"current_steps": 777, "total_steps": 1230, "loss": 0.2915, "lr": 1.4372775587149108e-05, "epoch": 3.1535732387227573, "percentage": 63.17, "elapsed_time": "9:33:39", "remaining_time": "5:34:27"}
778
+ {"current_steps": 778, "total_steps": 1230, "loss": 0.2897, "lr": 1.4318332586779522e-05, "epoch": 3.1576279776989358, "percentage": 63.25, "elapsed_time": "9:34:20", "remaining_time": "5:33:40"}
779
+ {"current_steps": 779, "total_steps": 1230, "loss": 0.2835, "lr": 1.4263935345778202e-05, "epoch": 3.1616827166751142, "percentage": 63.33, "elapsed_time": "9:35:03", "remaining_time": "5:32:55"}
780
+ {"current_steps": 780, "total_steps": 1230, "loss": 0.289, "lr": 1.420958430225303e-05, "epoch": 3.1657374556512923, "percentage": 63.41, "elapsed_time": "9:35:46", "remaining_time": "5:32:10"}
781
+ {"current_steps": 781, "total_steps": 1230, "loss": 0.2916, "lr": 1.415527989393985e-05, "epoch": 3.1697921946274707, "percentage": 63.5, "elapsed_time": "9:36:31", "remaining_time": "5:31:26"}
782
+ {"current_steps": 782, "total_steps": 1230, "loss": 0.2952, "lr": 1.410102255819891e-05, "epoch": 3.1738469336036492, "percentage": 63.58, "elapsed_time": "9:37:16", "remaining_time": "5:30:42"}
783
+ {"current_steps": 783, "total_steps": 1230, "loss": 0.2877, "lr": 1.404681273201131e-05, "epoch": 3.1779016725798277, "percentage": 63.66, "elapsed_time": "9:37:58", "remaining_time": "5:29:57"}
784
+ {"current_steps": 784, "total_steps": 1230, "loss": 0.2815, "lr": 1.399265085197556e-05, "epoch": 3.181956411556006, "percentage": 63.74, "elapsed_time": "9:38:41", "remaining_time": "5:29:12"}
785
+ {"current_steps": 785, "total_steps": 1230, "loss": 0.2873, "lr": 1.393853735430398e-05, "epoch": 3.1860111505321846, "percentage": 63.82, "elapsed_time": "9:39:24", "remaining_time": "5:28:27"}
786
+ {"current_steps": 786, "total_steps": 1230, "loss": 0.2979, "lr": 1.3884472674819246e-05, "epoch": 3.1900658895083627, "percentage": 63.9, "elapsed_time": "9:40:05", "remaining_time": "5:27:41"}
787
+ {"current_steps": 787, "total_steps": 1230, "loss": 0.2827, "lr": 1.3830457248950864e-05, "epoch": 3.194120628484541, "percentage": 63.98, "elapsed_time": "9:40:46", "remaining_time": "5:26:55"}
788
+ {"current_steps": 788, "total_steps": 1230, "loss": 0.2876, "lr": 1.377649151173163e-05, "epoch": 3.1981753674607196, "percentage": 64.07, "elapsed_time": "9:41:28", "remaining_time": "5:26:09"}
789
+ {"current_steps": 789, "total_steps": 1230, "loss": 0.2941, "lr": 1.3722575897794181e-05, "epoch": 3.202230106436898, "percentage": 64.15, "elapsed_time": "9:42:09", "remaining_time": "5:25:23"}
790
+ {"current_steps": 790, "total_steps": 1230, "loss": 0.2934, "lr": 1.3668710841367472e-05, "epoch": 3.2062848454130766, "percentage": 64.23, "elapsed_time": "9:42:54", "remaining_time": "5:24:39"}
791
+ {"current_steps": 791, "total_steps": 1230, "loss": 0.2931, "lr": 1.361489677627324e-05, "epoch": 3.210339584389255, "percentage": 64.31, "elapsed_time": "9:43:37", "remaining_time": "5:23:54"}
792
+ {"current_steps": 792, "total_steps": 1230, "loss": 0.2784, "lr": 1.3561134135922585e-05, "epoch": 3.2143943233654335, "percentage": 64.39, "elapsed_time": "9:44:22", "remaining_time": "5:23:10"}
793
+ {"current_steps": 793, "total_steps": 1230, "loss": 0.2878, "lr": 1.350742335331241e-05, "epoch": 3.2184490623416115, "percentage": 64.47, "elapsed_time": "9:45:04", "remaining_time": "5:22:24"}
794
+ {"current_steps": 794, "total_steps": 1230, "loss": 0.2838, "lr": 1.345376486102198e-05, "epoch": 3.22250380131779, "percentage": 64.55, "elapsed_time": "9:45:50", "remaining_time": "5:21:41"}
795
+ {"current_steps": 795, "total_steps": 1230, "loss": 0.2919, "lr": 1.3400159091209414e-05, "epoch": 3.2265585402939685, "percentage": 64.63, "elapsed_time": "9:46:33", "remaining_time": "5:20:56"}
796
+ {"current_steps": 796, "total_steps": 1230, "loss": 0.2968, "lr": 1.3346606475608216e-05, "epoch": 3.230613279270147, "percentage": 64.72, "elapsed_time": "9:47:15", "remaining_time": "5:20:11"}
797
+ {"current_steps": 797, "total_steps": 1230, "loss": 0.296, "lr": 1.3293107445523781e-05, "epoch": 3.2346680182463254, "percentage": 64.8, "elapsed_time": "9:47:57", "remaining_time": "5:19:25"}
798
+ {"current_steps": 798, "total_steps": 1230, "loss": 0.2852, "lr": 1.3239662431829949e-05, "epoch": 3.238722757222504, "percentage": 64.88, "elapsed_time": "9:48:43", "remaining_time": "5:18:42"}
799
+ {"current_steps": 799, "total_steps": 1230, "loss": 0.2899, "lr": 1.3186271864965509e-05, "epoch": 3.2427774961986824, "percentage": 64.96, "elapsed_time": "9:49:26", "remaining_time": "5:17:57"}
800
+ {"current_steps": 800, "total_steps": 1230, "loss": 0.2916, "lr": 1.3132936174930756e-05, "epoch": 3.2468322351748604, "percentage": 65.04, "elapsed_time": "9:50:11", "remaining_time": "5:17:13"}
801
+ {"current_steps": 801, "total_steps": 1230, "loss": 0.2761, "lr": 1.3079655791283995e-05, "epoch": 3.250886974151039, "percentage": 65.12, "elapsed_time": "9:50:53", "remaining_time": "5:16:27"}
802
+ {"current_steps": 802, "total_steps": 1230, "loss": 0.2929, "lr": 1.3026431143138108e-05, "epoch": 3.2549417131272174, "percentage": 65.2, "elapsed_time": "9:51:37", "remaining_time": "5:15:43"}
803
+ {"current_steps": 803, "total_steps": 1230, "loss": 0.2917, "lr": 1.2973262659157114e-05, "epoch": 3.258996452103396, "percentage": 65.28, "elapsed_time": "9:52:17", "remaining_time": "5:14:57"}
804
+ {"current_steps": 804, "total_steps": 1230, "loss": 0.295, "lr": 1.2920150767552651e-05, "epoch": 3.2630511910795743, "percentage": 65.37, "elapsed_time": "9:53:02", "remaining_time": "5:14:13"}
805
+ {"current_steps": 805, "total_steps": 1230, "loss": 0.2919, "lr": 1.2867095896080607e-05, "epoch": 3.267105930055753, "percentage": 65.45, "elapsed_time": "9:53:46", "remaining_time": "5:13:29"}
806
+ {"current_steps": 806, "total_steps": 1230, "loss": 0.2934, "lr": 1.2814098472037612e-05, "epoch": 3.2711606690319313, "percentage": 65.53, "elapsed_time": "9:54:30", "remaining_time": "5:12:44"}
807
+ {"current_steps": 807, "total_steps": 1230, "loss": 0.2723, "lr": 1.276115892225764e-05, "epoch": 3.2752154080081093, "percentage": 65.61, "elapsed_time": "9:55:15", "remaining_time": "5:12:00"}
808
+ {"current_steps": 808, "total_steps": 1230, "loss": 0.296, "lr": 1.2708277673108555e-05, "epoch": 3.2792701469842878, "percentage": 65.69, "elapsed_time": "9:55:58", "remaining_time": "5:11:15"}
809
+ {"current_steps": 809, "total_steps": 1230, "loss": 0.2817, "lr": 1.2655455150488649e-05, "epoch": 3.2833248859604662, "percentage": 65.77, "elapsed_time": "9:56:41", "remaining_time": "5:10:31"}
810
+ {"current_steps": 810, "total_steps": 1230, "loss": 0.2948, "lr": 1.2602691779823272e-05, "epoch": 3.2873796249366447, "percentage": 65.85, "elapsed_time": "9:57:26", "remaining_time": "5:09:46"}
811
+ {"current_steps": 811, "total_steps": 1230, "loss": 0.2826, "lr": 1.2549987986061355e-05, "epoch": 3.291434363912823, "percentage": 65.93, "elapsed_time": "9:58:11", "remaining_time": "5:09:03"}
812
+ {"current_steps": 812, "total_steps": 1230, "loss": 0.2927, "lr": 1.2497344193672005e-05, "epoch": 3.2954891028890017, "percentage": 66.02, "elapsed_time": "9:58:56", "remaining_time": "5:08:19"}
813
+ {"current_steps": 813, "total_steps": 1230, "loss": 0.2916, "lr": 1.2444760826641092e-05, "epoch": 3.29954384186518, "percentage": 66.1, "elapsed_time": "9:59:38", "remaining_time": "5:07:33"}
814
+ {"current_steps": 814, "total_steps": 1230, "loss": 0.2923, "lr": 1.2392238308467817e-05, "epoch": 3.303598580841358, "percentage": 66.18, "elapsed_time": "10:00:25", "remaining_time": "5:06:50"}
815
+ {"current_steps": 815, "total_steps": 1230, "loss": 0.2766, "lr": 1.2339777062161326e-05, "epoch": 3.3076533198175366, "percentage": 66.26, "elapsed_time": "10:01:09", "remaining_time": "5:06:06"}
816
+ {"current_steps": 816, "total_steps": 1230, "loss": 0.298, "lr": 1.2287377510237293e-05, "epoch": 3.311708058793715, "percentage": 66.34, "elapsed_time": "10:01:53", "remaining_time": "5:05:22"}
817
+ {"current_steps": 817, "total_steps": 1230, "loss": 0.2778, "lr": 1.2235040074714488e-05, "epoch": 3.3157627977698936, "percentage": 66.42, "elapsed_time": "10:02:36", "remaining_time": "5:04:37"}
818
+ {"current_steps": 818, "total_steps": 1230, "loss": 0.2891, "lr": 1.2182765177111434e-05, "epoch": 3.319817536746072, "percentage": 66.5, "elapsed_time": "10:03:19", "remaining_time": "5:03:52"}
819
+ {"current_steps": 819, "total_steps": 1230, "loss": 0.286, "lr": 1.213055323844297e-05, "epoch": 3.3238722757222505, "percentage": 66.59, "elapsed_time": "10:04:05", "remaining_time": "5:03:09"}
820
+ {"current_steps": 820, "total_steps": 1230, "loss": 0.2865, "lr": 1.2078404679216864e-05, "epoch": 3.327927014698429, "percentage": 66.67, "elapsed_time": "10:04:48", "remaining_time": "5:02:24"}
821
+ {"current_steps": 821, "total_steps": 1230, "loss": 0.2947, "lr": 1.2026319919430458e-05, "epoch": 3.331981753674607, "percentage": 66.75, "elapsed_time": "10:05:35", "remaining_time": "5:01:41"}
822
+ {"current_steps": 822, "total_steps": 1230, "loss": 0.2921, "lr": 1.1974299378567227e-05, "epoch": 3.3360364926507855, "percentage": 66.83, "elapsed_time": "10:06:19", "remaining_time": "5:00:57"}
823
+ {"current_steps": 823, "total_steps": 1230, "loss": 0.2809, "lr": 1.1922343475593462e-05, "epoch": 3.340091231626964, "percentage": 66.91, "elapsed_time": "10:07:05", "remaining_time": "5:00:13"}
824
+ {"current_steps": 824, "total_steps": 1230, "loss": 0.2997, "lr": 1.187045262895488e-05, "epoch": 3.3441459706031424, "percentage": 66.99, "elapsed_time": "10:07:48", "remaining_time": "4:59:28"}
825
+ {"current_steps": 825, "total_steps": 1230, "loss": 0.2846, "lr": 1.1818627256573203e-05, "epoch": 3.348200709579321, "percentage": 67.07, "elapsed_time": "10:08:31", "remaining_time": "4:58:43"}
826
+ {"current_steps": 826, "total_steps": 1230, "loss": 0.2857, "lr": 1.1766867775842864e-05, "epoch": 3.3522554485554994, "percentage": 67.15, "elapsed_time": "10:09:17", "remaining_time": "4:58:00"}
827
+ {"current_steps": 827, "total_steps": 1230, "loss": 0.2871, "lr": 1.1715174603627615e-05, "epoch": 3.356310187531678, "percentage": 67.24, "elapsed_time": "10:09:58", "remaining_time": "4:57:14"}
828
+ {"current_steps": 828, "total_steps": 1230, "loss": 0.2842, "lr": 1.1663548156257147e-05, "epoch": 3.360364926507856, "percentage": 67.32, "elapsed_time": "10:10:42", "remaining_time": "4:56:30"}
829
+ {"current_steps": 829, "total_steps": 1230, "loss": 0.2762, "lr": 1.161198884952377e-05, "epoch": 3.3644196654840344, "percentage": 67.4, "elapsed_time": "10:11:26", "remaining_time": "4:55:45"}
830
+ {"current_steps": 830, "total_steps": 1230, "loss": 0.2863, "lr": 1.1560497098679056e-05, "epoch": 3.368474404460213, "percentage": 67.48, "elapsed_time": "10:12:11", "remaining_time": "4:55:02"}
831
+ {"current_steps": 831, "total_steps": 1230, "loss": 0.2978, "lr": 1.1509073318430479e-05, "epoch": 3.3725291434363913, "percentage": 67.56, "elapsed_time": "10:12:56", "remaining_time": "4:54:17"}
832
+ {"current_steps": 832, "total_steps": 1230, "loss": 0.2875, "lr": 1.1457717922938116e-05, "epoch": 3.37658388241257, "percentage": 67.64, "elapsed_time": "10:13:42", "remaining_time": "4:53:34"}
833
+ {"current_steps": 833, "total_steps": 1230, "loss": 0.2721, "lr": 1.1406431325811233e-05, "epoch": 3.3806386213887483, "percentage": 67.72, "elapsed_time": "10:14:26", "remaining_time": "4:52:50"}
834
+ {"current_steps": 834, "total_steps": 1230, "loss": 0.2887, "lr": 1.135521394010506e-05, "epoch": 3.3846933603649267, "percentage": 67.8, "elapsed_time": "10:15:09", "remaining_time": "4:52:05"}
835
+ {"current_steps": 835, "total_steps": 1230, "loss": 0.2836, "lr": 1.1304066178317367e-05, "epoch": 3.3887480993411048, "percentage": 67.89, "elapsed_time": "10:15:52", "remaining_time": "4:51:20"}
836
+ {"current_steps": 836, "total_steps": 1230, "loss": 0.2859, "lr": 1.1252988452385199e-05, "epoch": 3.3928028383172832, "percentage": 67.97, "elapsed_time": "10:16:36", "remaining_time": "4:50:36"}
837
+ {"current_steps": 837, "total_steps": 1230, "loss": 0.2931, "lr": 1.1201981173681536e-05, "epoch": 3.3968575772934617, "percentage": 68.05, "elapsed_time": "10:17:23", "remaining_time": "4:49:53"}
838
+ {"current_steps": 838, "total_steps": 1230, "loss": 0.2867, "lr": 1.1151044753011991e-05, "epoch": 3.40091231626964, "percentage": 68.13, "elapsed_time": "10:18:05", "remaining_time": "4:49:08"}
839
+ {"current_steps": 839, "total_steps": 1230, "loss": 0.2895, "lr": 1.1100179600611491e-05, "epoch": 3.4049670552458187, "percentage": 68.21, "elapsed_time": "10:18:48", "remaining_time": "4:48:23"}
840
+ {"current_steps": 840, "total_steps": 1230, "loss": 0.2958, "lr": 1.1049386126140985e-05, "epoch": 3.409021794221997, "percentage": 68.29, "elapsed_time": "10:19:33", "remaining_time": "4:47:38"}
841
+ {"current_steps": 841, "total_steps": 1230, "loss": 0.2841, "lr": 1.0998664738684128e-05, "epoch": 3.4130765331981756, "percentage": 68.37, "elapsed_time": "10:20:16", "remaining_time": "4:46:54"}
842
+ {"current_steps": 842, "total_steps": 1230, "loss": 0.2794, "lr": 1.0948015846744e-05, "epoch": 3.4171312721743536, "percentage": 68.46, "elapsed_time": "10:21:01", "remaining_time": "4:46:10"}
843
+ {"current_steps": 843, "total_steps": 1230, "loss": 0.2881, "lr": 1.0897439858239832e-05, "epoch": 3.421186011150532, "percentage": 68.54, "elapsed_time": "10:21:43", "remaining_time": "4:45:24"}
844
+ {"current_steps": 844, "total_steps": 1230, "loss": 0.2776, "lr": 1.0846937180503652e-05, "epoch": 3.4252407501267106, "percentage": 68.62, "elapsed_time": "10:22:24", "remaining_time": "4:44:39"}
845
+ {"current_steps": 845, "total_steps": 1230, "loss": 0.2924, "lr": 1.0796508220277117e-05, "epoch": 3.429295489102889, "percentage": 68.7, "elapsed_time": "10:23:08", "remaining_time": "4:43:55"}
846
+ {"current_steps": 846, "total_steps": 1230, "loss": 0.2821, "lr": 1.0746153383708107e-05, "epoch": 3.4333502280790675, "percentage": 68.78, "elapsed_time": "10:23:49", "remaining_time": "4:43:09"}
847
+ {"current_steps": 847, "total_steps": 1230, "loss": 0.2858, "lr": 1.0695873076347579e-05, "epoch": 3.437404967055246, "percentage": 68.86, "elapsed_time": "10:24:35", "remaining_time": "4:42:25"}
848
+ {"current_steps": 848, "total_steps": 1230, "loss": 0.2909, "lr": 1.0645667703146205e-05, "epoch": 3.441459706031424, "percentage": 68.94, "elapsed_time": "10:25:19", "remaining_time": "4:41:41"}
849
+ {"current_steps": 849, "total_steps": 1230, "loss": 0.2904, "lr": 1.0595537668451161e-05, "epoch": 3.4455144450076025, "percentage": 69.02, "elapsed_time": "10:26:04", "remaining_time": "4:40:57"}
850
+ {"current_steps": 850, "total_steps": 1230, "loss": 0.2913, "lr": 1.0545483376002854e-05, "epoch": 3.449569183983781, "percentage": 69.11, "elapsed_time": "10:26:50", "remaining_time": "4:40:14"}
851
+ {"current_steps": 851, "total_steps": 1230, "loss": 0.2963, "lr": 1.0495505228931676e-05, "epoch": 3.4536239229599595, "percentage": 69.19, "elapsed_time": "10:27:32", "remaining_time": "4:39:28"}
852
+ {"current_steps": 852, "total_steps": 1230, "loss": 0.2847, "lr": 1.044560362975474e-05, "epoch": 3.457678661936138, "percentage": 69.27, "elapsed_time": "10:28:15", "remaining_time": "4:38:44"}
853
+ {"current_steps": 853, "total_steps": 1230, "loss": 0.2898, "lr": 1.0395778980372695e-05, "epoch": 3.4617334009123164, "percentage": 69.35, "elapsed_time": "10:29:00", "remaining_time": "4:38:00"}
854
+ {"current_steps": 854, "total_steps": 1230, "loss": 0.3095, "lr": 1.0346031682066381e-05, "epoch": 3.4657881398884944, "percentage": 69.43, "elapsed_time": "10:29:44", "remaining_time": "4:37:15"}
855
+ {"current_steps": 855, "total_steps": 1230, "loss": 0.2827, "lr": 1.0296362135493724e-05, "epoch": 3.469842878864673, "percentage": 69.51, "elapsed_time": "10:30:28", "remaining_time": "4:36:31"}
856
+ {"current_steps": 856, "total_steps": 1230, "loss": 0.2989, "lr": 1.0246770740686422e-05, "epoch": 3.4738976178408514, "percentage": 69.59, "elapsed_time": "10:31:12", "remaining_time": "4:35:46"}
857
+ {"current_steps": 857, "total_steps": 1230, "loss": 0.2865, "lr": 1.0197257897046743e-05, "epoch": 3.47795235681703, "percentage": 69.67, "elapsed_time": "10:31:54", "remaining_time": "4:35:01"}
858
+ {"current_steps": 858, "total_steps": 1230, "loss": 0.2885, "lr": 1.014782400334433e-05, "epoch": 3.4820070957932083, "percentage": 69.76, "elapsed_time": "10:32:35", "remaining_time": "4:34:16"}
859
+ {"current_steps": 859, "total_steps": 1230, "loss": 0.2949, "lr": 1.009846945771296e-05, "epoch": 3.486061834769387, "percentage": 69.84, "elapsed_time": "10:33:18", "remaining_time": "4:33:31"}
860
+ {"current_steps": 860, "total_steps": 1230, "loss": 0.2864, "lr": 1.0049194657647363e-05, "epoch": 3.4901165737455653, "percentage": 69.92, "elapsed_time": "10:34:04", "remaining_time": "4:32:48"}
861
+ {"current_steps": 861, "total_steps": 1230, "loss": 0.2891, "lr": 1.0000000000000006e-05, "epoch": 3.4941713127217433, "percentage": 70.0, "elapsed_time": "10:34:50", "remaining_time": "4:32:04"}
862
+ {"current_steps": 862, "total_steps": 1230, "loss": 0.2814, "lr": 9.950885880977891e-06, "epoch": 3.498226051697922, "percentage": 70.08, "elapsed_time": "10:35:33", "remaining_time": "4:31:19"}
863
+ {"current_steps": 863, "total_steps": 1230, "loss": 0.2823, "lr": 9.901852696139382e-06, "epoch": 3.5022807906741003, "percentage": 70.16, "elapsed_time": "10:36:15", "remaining_time": "4:30:34"}
864
+ {"current_steps": 864, "total_steps": 1230, "loss": 0.2871, "lr": 9.852900840391027e-06, "epoch": 3.5063355296502787, "percentage": 70.24, "elapsed_time": "10:36:59", "remaining_time": "4:29:50"}
865
+ {"current_steps": 865, "total_steps": 1230, "loss": 0.2847, "lr": 9.804030707984313e-06, "epoch": 3.510390268626457, "percentage": 70.33, "elapsed_time": "10:37:45", "remaining_time": "4:29:06"}
866
+ {"current_steps": 866, "total_steps": 1230, "loss": 0.2899, "lr": 9.755242692512599e-06, "epoch": 3.5144450076026357, "percentage": 70.41, "elapsed_time": "10:38:28", "remaining_time": "4:28:21"}
867
+ {"current_steps": 867, "total_steps": 1230, "loss": 0.2906, "lr": 9.70653718690782e-06, "epoch": 3.518499746578814, "percentage": 70.49, "elapsed_time": "10:39:11", "remaining_time": "4:27:37"}
868
+ {"current_steps": 868, "total_steps": 1230, "loss": 0.303, "lr": 9.657914583437454e-06, "epoch": 3.522554485554992, "percentage": 70.57, "elapsed_time": "10:39:57", "remaining_time": "4:26:53"}
869
+ {"current_steps": 869, "total_steps": 1230, "loss": 0.2791, "lr": 9.609375273701246e-06, "epoch": 3.5266092245311706, "percentage": 70.65, "elapsed_time": "10:40:39", "remaining_time": "4:26:08"}
870
+ {"current_steps": 870, "total_steps": 1230, "loss": 0.2823, "lr": 9.560919648628133e-06, "epoch": 3.530663963507349, "percentage": 70.73, "elapsed_time": "10:41:23", "remaining_time": "4:25:24"}
871
+ {"current_steps": 871, "total_steps": 1230, "loss": 0.2907, "lr": 9.512548098473047e-06, "epoch": 3.5347187024835276, "percentage": 70.81, "elapsed_time": "10:42:04", "remaining_time": "4:24:38"}
872
+ {"current_steps": 872, "total_steps": 1230, "loss": 0.2941, "lr": 9.464261012813825e-06, "epoch": 3.538773441459706, "percentage": 70.89, "elapsed_time": "10:42:47", "remaining_time": "4:23:53"}
873
+ {"current_steps": 873, "total_steps": 1230, "loss": 0.2828, "lr": 9.416058780547987e-06, "epoch": 3.5428281804358845, "percentage": 70.98, "elapsed_time": "10:43:31", "remaining_time": "4:23:09"}
874
+ {"current_steps": 874, "total_steps": 1230, "loss": 0.2855, "lr": 9.367941789889714e-06, "epoch": 3.546882919412063, "percentage": 71.06, "elapsed_time": "10:44:16", "remaining_time": "4:22:25"}
875
+ {"current_steps": 875, "total_steps": 1230, "loss": 0.294, "lr": 9.319910428366607e-06, "epoch": 3.550937658388241, "percentage": 71.14, "elapsed_time": "10:44:59", "remaining_time": "4:21:41"}
876
+ {"current_steps": 876, "total_steps": 1230, "loss": 0.2909, "lr": 9.271965082816667e-06, "epoch": 3.5549923973644195, "percentage": 71.22, "elapsed_time": "10:45:42", "remaining_time": "4:20:56"}
877
+ {"current_steps": 877, "total_steps": 1230, "loss": 0.289, "lr": 9.224106139385111e-06, "epoch": 3.559047136340598, "percentage": 71.3, "elapsed_time": "10:46:26", "remaining_time": "4:20:11"}
878
+ {"current_steps": 878, "total_steps": 1230, "loss": 0.2955, "lr": 9.176333983521291e-06, "epoch": 3.5631018753167765, "percentage": 71.38, "elapsed_time": "10:47:08", "remaining_time": "4:19:26"}
879
+ {"current_steps": 879, "total_steps": 1230, "loss": 0.2896, "lr": 9.12864899997558e-06, "epoch": 3.567156614292955, "percentage": 71.46, "elapsed_time": "10:47:51", "remaining_time": "4:18:42"}
880
+ {"current_steps": 880, "total_steps": 1230, "loss": 0.2865, "lr": 9.08105157279628e-06, "epoch": 3.5712113532691334, "percentage": 71.54, "elapsed_time": "10:48:37", "remaining_time": "4:17:58"}
881
+ {"current_steps": 881, "total_steps": 1230, "loss": 0.2878, "lr": 9.03354208532653e-06, "epoch": 3.575266092245312, "percentage": 71.63, "elapsed_time": "10:49:21", "remaining_time": "4:17:14"}
882
+ {"current_steps": 882, "total_steps": 1230, "loss": 0.2899, "lr": 8.986120920201205e-06, "epoch": 3.57932083122149, "percentage": 71.71, "elapsed_time": "10:50:05", "remaining_time": "4:16:29"}
883
+ {"current_steps": 883, "total_steps": 1230, "loss": 0.3, "lr": 8.938788459343852e-06, "epoch": 3.5833755701976684, "percentage": 71.79, "elapsed_time": "10:50:52", "remaining_time": "4:15:46"}
884
+ {"current_steps": 884, "total_steps": 1230, "loss": 0.2902, "lr": 8.8915450839636e-06, "epoch": 3.587430309173847, "percentage": 71.87, "elapsed_time": "10:51:33", "remaining_time": "4:15:01"}
885
+ {"current_steps": 885, "total_steps": 1230, "loss": 0.2911, "lr": 8.844391174552116e-06, "epoch": 3.5914850481500253, "percentage": 71.95, "elapsed_time": "10:52:19", "remaining_time": "4:14:17"}
886
+ {"current_steps": 886, "total_steps": 1230, "loss": 0.2816, "lr": 8.797327110880479e-06, "epoch": 3.595539787126204, "percentage": 72.03, "elapsed_time": "10:52:59", "remaining_time": "4:13:31"}
887
+ {"current_steps": 887, "total_steps": 1230, "loss": 0.2919, "lr": 8.750353271996206e-06, "epoch": 3.5995945261023823, "percentage": 72.11, "elapsed_time": "10:53:44", "remaining_time": "4:12:47"}
888
+ {"current_steps": 888, "total_steps": 1230, "loss": 0.2845, "lr": 8.703470036220132e-06, "epoch": 3.6036492650785608, "percentage": 72.2, "elapsed_time": "10:54:28", "remaining_time": "4:12:03"}
889
+ {"current_steps": 889, "total_steps": 1230, "loss": 0.2781, "lr": 8.656677781143394e-06, "epoch": 3.607704004054739, "percentage": 72.28, "elapsed_time": "10:55:14", "remaining_time": "4:11:19"}
890
+ {"current_steps": 890, "total_steps": 1230, "loss": 0.2781, "lr": 8.609976883624377e-06, "epoch": 3.6117587430309173, "percentage": 72.36, "elapsed_time": "10:55:58", "remaining_time": "4:10:35"}
891
+ {"current_steps": 891, "total_steps": 1230, "loss": 0.29, "lr": 8.563367719785698e-06, "epoch": 3.6158134820070957, "percentage": 72.44, "elapsed_time": "10:56:42", "remaining_time": "4:09:51"}
892
+ {"current_steps": 892, "total_steps": 1230, "loss": 0.2896, "lr": 8.516850665011138e-06, "epoch": 3.619868220983274, "percentage": 72.52, "elapsed_time": "10:57:24", "remaining_time": "4:09:06"}
893
+ {"current_steps": 893, "total_steps": 1230, "loss": 0.2935, "lr": 8.47042609394269e-06, "epoch": 3.6239229599594527, "percentage": 72.6, "elapsed_time": "10:58:07", "remaining_time": "4:08:21"}
894
+ {"current_steps": 894, "total_steps": 1230, "loss": 0.2842, "lr": 8.424094380477432e-06, "epoch": 3.627977698935631, "percentage": 72.68, "elapsed_time": "10:58:51", "remaining_time": "4:07:37"}
895
+ {"current_steps": 895, "total_steps": 1230, "loss": 0.2978, "lr": 8.37785589776465e-06, "epoch": 3.6320324379118096, "percentage": 72.76, "elapsed_time": "10:59:36", "remaining_time": "4:06:53"}
896
+ {"current_steps": 896, "total_steps": 1230, "loss": 0.2864, "lr": 8.331711018202694e-06, "epoch": 3.6360871768879877, "percentage": 72.85, "elapsed_time": "11:00:18", "remaining_time": "4:06:08"}
897
+ {"current_steps": 897, "total_steps": 1230, "loss": 0.2931, "lr": 8.285660113436104e-06, "epoch": 3.640141915864166, "percentage": 72.93, "elapsed_time": "11:01:00", "remaining_time": "4:05:23"}
898
+ {"current_steps": 898, "total_steps": 1230, "loss": 0.2957, "lr": 8.239703554352527e-06, "epoch": 3.6441966548403446, "percentage": 73.01, "elapsed_time": "11:01:42", "remaining_time": "4:04:38"}
899
+ {"current_steps": 899, "total_steps": 1230, "loss": 0.2783, "lr": 8.193841711079775e-06, "epoch": 3.648251393816523, "percentage": 73.09, "elapsed_time": "11:02:25", "remaining_time": "4:03:53"}
900
+ {"current_steps": 900, "total_steps": 1230, "loss": 0.295, "lr": 8.148074952982828e-06, "epoch": 3.6523061327927016, "percentage": 73.17, "elapsed_time": "11:03:09", "remaining_time": "4:03:09"}
901
+ {"current_steps": 901, "total_steps": 1230, "loss": 0.2948, "lr": 8.102403648660859e-06, "epoch": 3.65636087176888, "percentage": 73.25, "elapsed_time": "11:03:52", "remaining_time": "4:02:24"}
902
+ {"current_steps": 902, "total_steps": 1230, "loss": 0.2913, "lr": 8.056828165944282e-06, "epoch": 3.6604156107450585, "percentage": 73.33, "elapsed_time": "11:04:36", "remaining_time": "4:01:40"}
903
+ {"current_steps": 903, "total_steps": 1230, "loss": 0.2856, "lr": 8.011348871891762e-06, "epoch": 3.6644703497212365, "percentage": 73.41, "elapsed_time": "11:05:19", "remaining_time": "4:00:55"}
904
+ {"current_steps": 904, "total_steps": 1230, "loss": 0.2895, "lr": 7.965966132787287e-06, "epoch": 3.668525088697415, "percentage": 73.5, "elapsed_time": "11:06:03", "remaining_time": "4:00:11"}
905
+ {"current_steps": 905, "total_steps": 1230, "loss": 0.2836, "lr": 7.920680314137189e-06, "epoch": 3.6725798276735935, "percentage": 73.58, "elapsed_time": "11:06:47", "remaining_time": "3:59:27"}
906
+ {"current_steps": 906, "total_steps": 1230, "loss": 0.2877, "lr": 7.875491780667246e-06, "epoch": 3.676634566649772, "percentage": 73.66, "elapsed_time": "11:07:32", "remaining_time": "3:58:43"}
907
+ {"current_steps": 907, "total_steps": 1230, "loss": 0.2916, "lr": 7.830400896319667e-06, "epoch": 3.6806893056259504, "percentage": 73.74, "elapsed_time": "11:08:13", "remaining_time": "3:57:58"}
908
+ {"current_steps": 908, "total_steps": 1230, "loss": 0.2848, "lr": 7.785408024250259e-06, "epoch": 3.684744044602129, "percentage": 73.82, "elapsed_time": "11:08:55", "remaining_time": "3:57:13"}
909
+ {"current_steps": 909, "total_steps": 1230, "loss": 0.2766, "lr": 7.74051352682542e-06, "epoch": 3.6887987835783074, "percentage": 73.9, "elapsed_time": "11:09:38", "remaining_time": "3:56:28"}
910
+ {"current_steps": 910, "total_steps": 1230, "loss": 0.2966, "lr": 7.695717765619257e-06, "epoch": 3.6928535225544854, "percentage": 73.98, "elapsed_time": "11:10:21", "remaining_time": "3:55:43"}
911
+ {"current_steps": 911, "total_steps": 1230, "loss": 0.2992, "lr": 7.651021101410673e-06, "epoch": 3.696908261530664, "percentage": 74.07, "elapsed_time": "11:11:07", "remaining_time": "3:55:00"}
912
+ {"current_steps": 912, "total_steps": 1230, "loss": 0.2861, "lr": 7.606423894180464e-06, "epoch": 3.7009630005068423, "percentage": 74.15, "elapsed_time": "11:11:49", "remaining_time": "3:54:15"}
913
+ {"current_steps": 913, "total_steps": 1230, "loss": 0.2851, "lr": 7.56192650310839e-06, "epoch": 3.705017739483021, "percentage": 74.23, "elapsed_time": "11:12:33", "remaining_time": "3:53:30"}
914
+ {"current_steps": 914, "total_steps": 1230, "loss": 0.2904, "lr": 7.517529286570349e-06, "epoch": 3.7090724784591993, "percentage": 74.31, "elapsed_time": "11:13:18", "remaining_time": "3:52:47"}
915
+ {"current_steps": 915, "total_steps": 1230, "loss": 0.295, "lr": 7.473232602135387e-06, "epoch": 3.7131272174353773, "percentage": 74.39, "elapsed_time": "11:14:04", "remaining_time": "3:52:03"}
916
+ {"current_steps": 916, "total_steps": 1230, "loss": 0.2853, "lr": 7.429036806562935e-06, "epoch": 3.7171819564115562, "percentage": 74.47, "elapsed_time": "11:14:48", "remaining_time": "3:51:19"}
917
+ {"current_steps": 917, "total_steps": 1230, "loss": 0.2833, "lr": 7.3849422557998455e-06, "epoch": 3.7212366953877343, "percentage": 74.55, "elapsed_time": "11:15:33", "remaining_time": "3:50:35"}
918
+ {"current_steps": 918, "total_steps": 1230, "loss": 0.2914, "lr": 7.340949304977567e-06, "epoch": 3.7252914343639127, "percentage": 74.63, "elapsed_time": "11:16:18", "remaining_time": "3:49:51"}
919
+ {"current_steps": 919, "total_steps": 1230, "loss": 0.2778, "lr": 7.297058308409282e-06, "epoch": 3.729346173340091, "percentage": 74.72, "elapsed_time": "11:17:01", "remaining_time": "3:49:06"}
920
+ {"current_steps": 920, "total_steps": 1230, "loss": 0.2741, "lr": 7.25326961958704e-06, "epoch": 3.7334009123162697, "percentage": 74.8, "elapsed_time": "11:17:43", "remaining_time": "3:48:21"}
921
+ {"current_steps": 921, "total_steps": 1230, "loss": 0.2898, "lr": 7.209583591178921e-06, "epoch": 3.737455651292448, "percentage": 74.88, "elapsed_time": "11:18:26", "remaining_time": "3:47:37"}
922
+ {"current_steps": 922, "total_steps": 1230, "loss": 0.2846, "lr": 7.1660005750261925e-06, "epoch": 3.741510390268626, "percentage": 74.96, "elapsed_time": "11:19:08", "remaining_time": "3:46:52"}
923
+ {"current_steps": 923, "total_steps": 1230, "loss": 0.289, "lr": 7.1225209221404765e-06, "epoch": 3.745565129244805, "percentage": 75.04, "elapsed_time": "11:19:52", "remaining_time": "3:46:08"}
924
+ {"current_steps": 924, "total_steps": 1230, "loss": 0.2878, "lr": 7.079144982700909e-06, "epoch": 3.749619868220983, "percentage": 75.12, "elapsed_time": "11:20:38", "remaining_time": "3:45:24"}
925
+ {"current_steps": 925, "total_steps": 1230, "loss": 0.2816, "lr": 7.0358731060513695e-06, "epoch": 3.7536746071971616, "percentage": 75.2, "elapsed_time": "11:21:21", "remaining_time": "3:44:39"}
926
+ {"current_steps": 926, "total_steps": 1230, "loss": 0.2896, "lr": 6.99270564069757e-06, "epoch": 3.75772934617334, "percentage": 75.28, "elapsed_time": "11:22:05", "remaining_time": "3:43:55"}
927
+ {"current_steps": 927, "total_steps": 1230, "loss": 0.2852, "lr": 6.949642934304375e-06, "epoch": 3.7617840851495186, "percentage": 75.37, "elapsed_time": "11:22:48", "remaining_time": "3:43:10"}
928
+ {"current_steps": 928, "total_steps": 1230, "loss": 0.2872, "lr": 6.906685333692871e-06, "epoch": 3.765838824125697, "percentage": 75.45, "elapsed_time": "11:23:32", "remaining_time": "3:42:26"}
929
+ {"current_steps": 929, "total_steps": 1230, "loss": 0.2879, "lr": 6.86383318483769e-06, "epoch": 3.769893563101875, "percentage": 75.53, "elapsed_time": "11:24:14", "remaining_time": "3:41:41"}
930
+ {"current_steps": 930, "total_steps": 1230, "loss": 0.3329, "lr": 6.821086832864139e-06, "epoch": 3.773948302078054, "percentage": 75.61, "elapsed_time": "11:24:59", "remaining_time": "3:40:58"}
931
+ {"current_steps": 931, "total_steps": 1230, "loss": 0.2864, "lr": 6.77844662204546e-06, "epoch": 3.778003041054232, "percentage": 75.69, "elapsed_time": "11:25:45", "remaining_time": "3:40:14"}
932
+ {"current_steps": 932, "total_steps": 1230, "loss": 0.2918, "lr": 6.7359128958000455e-06, "epoch": 3.7820577800304105, "percentage": 75.77, "elapsed_time": "11:26:29", "remaining_time": "3:39:29"}
933
+ {"current_steps": 933, "total_steps": 1230, "loss": 0.281, "lr": 6.693485996688695e-06, "epoch": 3.786112519006589, "percentage": 75.85, "elapsed_time": "11:27:12", "remaining_time": "3:38:45"}
934
+ {"current_steps": 934, "total_steps": 1230, "loss": 0.292, "lr": 6.651166266411801e-06, "epoch": 3.7901672579827674, "percentage": 75.93, "elapsed_time": "11:27:57", "remaining_time": "3:38:01"}
935
+ {"current_steps": 935, "total_steps": 1230, "loss": 0.2996, "lr": 6.6089540458066725e-06, "epoch": 3.794221996958946, "percentage": 76.02, "elapsed_time": "11:28:42", "remaining_time": "3:37:17"}
936
+ {"current_steps": 936, "total_steps": 1230, "loss": 0.2836, "lr": 6.566849674844711e-06, "epoch": 3.798276735935124, "percentage": 76.1, "elapsed_time": "11:29:28", "remaining_time": "3:36:33"}
937
+ {"current_steps": 937, "total_steps": 1230, "loss": 0.2786, "lr": 6.524853492628747e-06, "epoch": 3.802331474911303, "percentage": 76.18, "elapsed_time": "11:30:12", "remaining_time": "3:35:49"}
938
+ {"current_steps": 938, "total_steps": 1230, "loss": 0.2945, "lr": 6.4829658373902536e-06, "epoch": 3.806386213887481, "percentage": 76.26, "elapsed_time": "11:30:54", "remaining_time": "3:35:04"}
939
+ {"current_steps": 939, "total_steps": 1230, "loss": 0.2703, "lr": 6.441187046486648e-06, "epoch": 3.8104409528636594, "percentage": 76.34, "elapsed_time": "11:31:38", "remaining_time": "3:34:20"}
940
+ {"current_steps": 940, "total_steps": 1230, "loss": 0.2897, "lr": 6.399517456398567e-06, "epoch": 3.814495691839838, "percentage": 76.42, "elapsed_time": "11:32:21", "remaining_time": "3:33:35"}
941
+ {"current_steps": 941, "total_steps": 1230, "loss": 0.2943, "lr": 6.357957402727164e-06, "epoch": 3.8185504308160163, "percentage": 76.5, "elapsed_time": "11:33:02", "remaining_time": "3:32:50"}
942
+ {"current_steps": 942, "total_steps": 1230, "loss": 0.2811, "lr": 6.316507220191395e-06, "epoch": 3.822605169792195, "percentage": 76.59, "elapsed_time": "11:33:42", "remaining_time": "3:32:05"}
943
+ {"current_steps": 943, "total_steps": 1230, "loss": 0.2805, "lr": 6.275167242625331e-06, "epoch": 3.826659908768373, "percentage": 76.67, "elapsed_time": "11:34:25", "remaining_time": "3:31:20"}
944
+ {"current_steps": 944, "total_steps": 1230, "loss": 0.29, "lr": 6.233937802975471e-06, "epoch": 3.8307146477445513, "percentage": 76.75, "elapsed_time": "11:35:09", "remaining_time": "3:30:36"}
945
+ {"current_steps": 945, "total_steps": 1230, "loss": 0.2839, "lr": 6.192819233298046e-06, "epoch": 3.8347693867207298, "percentage": 76.83, "elapsed_time": "11:35:53", "remaining_time": "3:29:52"}
946
+ {"current_steps": 946, "total_steps": 1230, "loss": 0.272, "lr": 6.151811864756383e-06, "epoch": 3.8388241256969082, "percentage": 76.91, "elapsed_time": "11:36:35", "remaining_time": "3:29:07"}
947
+ {"current_steps": 947, "total_steps": 1230, "loss": 0.2947, "lr": 6.1109160276181655e-06, "epoch": 3.8428788646730867, "percentage": 76.99, "elapsed_time": "11:37:16", "remaining_time": "3:28:22"}
948
+ {"current_steps": 948, "total_steps": 1230, "loss": 0.2769, "lr": 6.070132051252868e-06, "epoch": 3.846933603649265, "percentage": 77.07, "elapsed_time": "11:37:59", "remaining_time": "3:27:37"}
949
+ {"current_steps": 949, "total_steps": 1230, "loss": 0.2915, "lr": 6.0294602641290034e-06, "epoch": 3.8509883426254437, "percentage": 77.15, "elapsed_time": "11:38:42", "remaining_time": "3:26:53"}
950
+ {"current_steps": 950, "total_steps": 1230, "loss": 0.2998, "lr": 5.988900993811575e-06, "epoch": 3.8550430816016217, "percentage": 77.24, "elapsed_time": "11:39:26", "remaining_time": "3:26:09"}
951
+ {"current_steps": 951, "total_steps": 1230, "loss": 0.2891, "lr": 5.948454566959363e-06, "epoch": 3.8590978205778, "percentage": 77.32, "elapsed_time": "11:40:11", "remaining_time": "3:25:25"}
952
+ {"current_steps": 952, "total_steps": 1230, "loss": 0.2871, "lr": 5.908121309322328e-06, "epoch": 3.8631525595539786, "percentage": 77.4, "elapsed_time": "11:40:57", "remaining_time": "3:24:41"}
953
+ {"current_steps": 953, "total_steps": 1230, "loss": 0.2886, "lr": 5.867901545738976e-06, "epoch": 3.867207298530157, "percentage": 77.48, "elapsed_time": "11:41:42", "remaining_time": "3:23:57"}
954
+ {"current_steps": 954, "total_steps": 1230, "loss": 0.2915, "lr": 5.827795600133774e-06, "epoch": 3.8712620375063356, "percentage": 77.56, "elapsed_time": "11:42:29", "remaining_time": "3:23:14"}
955
+ {"current_steps": 955, "total_steps": 1230, "loss": 0.2909, "lr": 5.787803795514466e-06, "epoch": 3.875316776482514, "percentage": 77.64, "elapsed_time": "11:43:15", "remaining_time": "3:22:30"}
956
+ {"current_steps": 956, "total_steps": 1230, "loss": 0.2866, "lr": 5.747926453969576e-06, "epoch": 3.8793715154586925, "percentage": 77.72, "elapsed_time": "11:43:58", "remaining_time": "3:21:46"}
957
+ {"current_steps": 957, "total_steps": 1230, "loss": 0.297, "lr": 5.708163896665708e-06, "epoch": 3.8834262544348706, "percentage": 77.8, "elapsed_time": "11:44:42", "remaining_time": "3:21:01"}
958
+ {"current_steps": 958, "total_steps": 1230, "loss": 0.2837, "lr": 5.668516443845047e-06, "epoch": 3.887480993411049, "percentage": 77.89, "elapsed_time": "11:45:26", "remaining_time": "3:20:17"}
959
+ {"current_steps": 959, "total_steps": 1230, "loss": 0.2989, "lr": 5.6289844148227225e-06, "epoch": 3.8915357323872275, "percentage": 77.97, "elapsed_time": "11:46:12", "remaining_time": "3:19:33"}
960
+ {"current_steps": 960, "total_steps": 1230, "loss": 0.281, "lr": 5.5895681279842615e-06, "epoch": 3.895590471363406, "percentage": 78.05, "elapsed_time": "11:46:54", "remaining_time": "3:18:49"}
961
+ {"current_steps": 961, "total_steps": 1230, "loss": 0.2831, "lr": 5.550267900783019e-06, "epoch": 3.8996452103395844, "percentage": 78.13, "elapsed_time": "11:47:40", "remaining_time": "3:18:05"}
962
+ {"current_steps": 962, "total_steps": 1230, "loss": 0.2895, "lr": 5.511084049737623e-06, "epoch": 3.903699949315763, "percentage": 78.21, "elapsed_time": "11:48:20", "remaining_time": "3:17:20"}
963
+ {"current_steps": 963, "total_steps": 1230, "loss": 0.2909, "lr": 5.4720168904294215e-06, "epoch": 3.9077546882919414, "percentage": 78.29, "elapsed_time": "11:49:02", "remaining_time": "3:16:35"}
964
+ {"current_steps": 964, "total_steps": 1230, "loss": 0.2897, "lr": 5.433066737499948e-06, "epoch": 3.9118094272681194, "percentage": 78.37, "elapsed_time": "11:49:48", "remaining_time": "3:15:51"}
965
+ {"current_steps": 965, "total_steps": 1230, "loss": 0.2872, "lr": 5.394233904648376e-06, "epoch": 3.915864166244298, "percentage": 78.46, "elapsed_time": "11:50:29", "remaining_time": "3:15:06"}
966
+ {"current_steps": 966, "total_steps": 1230, "loss": 0.2834, "lr": 5.355518704628997e-06, "epoch": 3.9199189052204764, "percentage": 78.54, "elapsed_time": "11:51:13", "remaining_time": "3:14:22"}
967
+ {"current_steps": 967, "total_steps": 1230, "loss": 0.2766, "lr": 5.316921449248731e-06, "epoch": 3.923973644196655, "percentage": 78.62, "elapsed_time": "11:51:54", "remaining_time": "3:13:37"}
968
+ {"current_steps": 968, "total_steps": 1230, "loss": 0.2907, "lr": 5.278442449364538e-06, "epoch": 3.9280283831728333, "percentage": 78.7, "elapsed_time": "11:52:39", "remaining_time": "3:12:53"}
969
+ {"current_steps": 969, "total_steps": 1230, "loss": 0.2949, "lr": 5.240082014881016e-06, "epoch": 3.932083122149012, "percentage": 78.78, "elapsed_time": "11:53:23", "remaining_time": "3:12:08"}
970
+ {"current_steps": 970, "total_steps": 1230, "loss": 0.2909, "lr": 5.201840454747822e-06, "epoch": 3.9361378611251903, "percentage": 78.86, "elapsed_time": "11:54:06", "remaining_time": "3:11:24"}
971
+ {"current_steps": 971, "total_steps": 1230, "loss": 0.2788, "lr": 5.163718076957223e-06, "epoch": 3.9401926001013683, "percentage": 78.94, "elapsed_time": "11:54:50", "remaining_time": "3:10:40"}
972
+ {"current_steps": 972, "total_steps": 1230, "loss": 0.2954, "lr": 5.125715188541609e-06, "epoch": 3.9442473390775468, "percentage": 79.02, "elapsed_time": "11:55:35", "remaining_time": "3:09:56"}
973
+ {"current_steps": 973, "total_steps": 1230, "loss": 0.2948, "lr": 5.087832095571021e-06, "epoch": 3.9483020780537252, "percentage": 79.11, "elapsed_time": "11:56:21", "remaining_time": "3:09:12"}
974
+ {"current_steps": 974, "total_steps": 1230, "loss": 0.2897, "lr": 5.0500691031506766e-06, "epoch": 3.9523568170299037, "percentage": 79.19, "elapsed_time": "11:57:03", "remaining_time": "3:08:28"}
975
+ {"current_steps": 975, "total_steps": 1230, "loss": 0.2934, "lr": 5.01242651541854e-06, "epoch": 3.956411556006082, "percentage": 79.27, "elapsed_time": "11:57:43", "remaining_time": "3:07:42"}
976
+ {"current_steps": 976, "total_steps": 1230, "loss": 0.279, "lr": 4.974904635542815e-06, "epoch": 3.9604662949822607, "percentage": 79.35, "elapsed_time": "11:58:29", "remaining_time": "3:06:59"}
977
+ {"current_steps": 977, "total_steps": 1230, "loss": 0.2881, "lr": 4.937503765719582e-06, "epoch": 3.964521033958439, "percentage": 79.43, "elapsed_time": "11:59:10", "remaining_time": "3:06:14"}
978
+ {"current_steps": 978, "total_steps": 1230, "loss": 0.2937, "lr": 4.900224207170299e-06, "epoch": 3.968575772934617, "percentage": 79.51, "elapsed_time": "11:59:53", "remaining_time": "3:05:29"}
979
+ {"current_steps": 979, "total_steps": 1230, "loss": 0.2886, "lr": 4.8630662601394065e-06, "epoch": 3.9726305119107956, "percentage": 79.59, "elapsed_time": "12:00:37", "remaining_time": "3:04:45"}
980
+ {"current_steps": 980, "total_steps": 1230, "loss": 0.2813, "lr": 4.8260302238918995e-06, "epoch": 3.976685250886974, "percentage": 79.67, "elapsed_time": "12:01:20", "remaining_time": "3:04:01"}
981
+ {"current_steps": 981, "total_steps": 1230, "loss": 0.281, "lr": 4.789116396710924e-06, "epoch": 3.9807399898631526, "percentage": 79.76, "elapsed_time": "12:02:02", "remaining_time": "3:03:16"}
982
+ {"current_steps": 982, "total_steps": 1230, "loss": 0.2807, "lr": 4.752325075895368e-06, "epoch": 3.984794728839331, "percentage": 79.84, "elapsed_time": "12:02:45", "remaining_time": "3:02:31"}
983
+ {"current_steps": 983, "total_steps": 1230, "loss": 0.279, "lr": 4.715656557757473e-06, "epoch": 3.9888494678155095, "percentage": 79.92, "elapsed_time": "12:03:32", "remaining_time": "3:01:48"}
984
+ {"current_steps": 984, "total_steps": 1230, "loss": 0.2781, "lr": 4.679111137620442e-06, "epoch": 3.992904206791688, "percentage": 80.0, "elapsed_time": "12:04:18", "remaining_time": "3:01:04"}
985
+ {"current_steps": 985, "total_steps": 1230, "loss": 0.2903, "lr": 4.6426891098160585e-06, "epoch": 3.996958945767866, "percentage": 80.08, "elapsed_time": "12:05:02", "remaining_time": "3:00:20"}
986
+ {"current_steps": 986, "total_steps": 1230, "loss": 0.2726, "lr": 4.6063907676823474e-06, "epoch": 4.002027369488089, "percentage": 80.16, "elapsed_time": "12:08:13", "remaining_time": "3:00:12"}
987
+ {"current_steps": 987, "total_steps": 1230, "loss": 0.2563, "lr": 4.570216403561141e-06, "epoch": 4.006082108464268, "percentage": 80.24, "elapsed_time": "12:08:55", "remaining_time": "2:59:27"}
988
+ {"current_steps": 988, "total_steps": 1230, "loss": 0.2601, "lr": 4.534166308795815e-06, "epoch": 4.010136847440446, "percentage": 80.33, "elapsed_time": "12:09:40", "remaining_time": "2:58:43"}
989
+ {"current_steps": 989, "total_steps": 1230, "loss": 0.2613, "lr": 4.498240773728859e-06, "epoch": 4.014191586416624, "percentage": 80.41, "elapsed_time": "12:10:25", "remaining_time": "2:57:59"}