sedrickkeh commited on
Commit
57dd12e
·
verified ·
1 Parent(s): 88d0bea

Training in progress, epoch 3

Browse files
model-00001-of-00004.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:b31fad5dd17c86708030af46d501e807a63177907b5606cae8a22c7f2ea8c968
3
  size 4877660776
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b39859f15065b889aa4637b00d423bcfaefe86a20b07f5c1efe24cc1a72582e6
3
  size 4877660776
model-00002-of-00004.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:653a23bb93cb9282ef9b33a21ecac312c0920d7df0c30f82dd0fdc38e32ab87d
3
  size 4932751008
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:92c8bfe6edb42ef5b2752127c2bd1ee7a008812d1e60be8fe0528fa4f8addffb
3
  size 4932751008
model-00003-of-00004.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:71645cd770e0faff6c5ac5711f75699b60f2ef2a3a256495a80e9344ebdcf636
3
  size 4330865200
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2ae07b17baab99dc6bd8aa394ce6b22802faa5f0e14dafa95dce3daf891d54e4
3
  size 4330865200
model-00004-of-00004.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:82b078fcb8b7cfb331871edcb316e1bc2362ac9250bd2dc6fec3e0eb7a36a34d
3
  size 1089994880
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8b35ae933bc11c02ba0fc4eea598392889ce5052c60985b7da4b5f2358064713
3
  size 1089994880
trainer_log.jsonl CHANGED
@@ -790,3 +790,390 @@
790
  {"current_steps": 790, "total_steps": 1955, "loss": 0.3382, "lr": 2.9761904617142078e-05, "epoch": 2.020460358056266, "percentage": 40.41, "elapsed_time": "4:47:22", "remaining_time": "7:03:46"}
791
  {"current_steps": 791, "total_steps": 1955, "loss": 0.3115, "lr": 2.9730712806844208e-05, "epoch": 2.023017902813299, "percentage": 40.46, "elapsed_time": "4:47:43", "remaining_time": "7:03:23"}
792
  {"current_steps": 792, "total_steps": 1955, "loss": 0.3198, "lr": 2.9699489957197208e-05, "epoch": 2.0255754475703327, "percentage": 40.51, "elapsed_time": "4:48:06", "remaining_time": "7:03:03"}
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
790
  {"current_steps": 790, "total_steps": 1955, "loss": 0.3382, "lr": 2.9761904617142078e-05, "epoch": 2.020460358056266, "percentage": 40.41, "elapsed_time": "4:47:22", "remaining_time": "7:03:46"}
791
  {"current_steps": 791, "total_steps": 1955, "loss": 0.3115, "lr": 2.9730712806844208e-05, "epoch": 2.023017902813299, "percentage": 40.46, "elapsed_time": "4:47:43", "remaining_time": "7:03:23"}
792
  {"current_steps": 792, "total_steps": 1955, "loss": 0.3198, "lr": 2.9699489957197208e-05, "epoch": 2.0255754475703327, "percentage": 40.51, "elapsed_time": "4:48:06", "remaining_time": "7:03:03"}
793
+ {"current_steps": 793, "total_steps": 1955, "loss": 0.3248, "lr": 2.9668236167796746e-05, "epoch": 2.028132992327366, "percentage": 40.56, "elapsed_time": "4:48:29", "remaining_time": "7:02:43"}
794
+ {"current_steps": 794, "total_steps": 1955, "loss": 0.3341, "lr": 2.9636951538337187e-05, "epoch": 2.030690537084399, "percentage": 40.61, "elapsed_time": "4:48:53", "remaining_time": "7:02:25"}
795
+ {"current_steps": 795, "total_steps": 1955, "loss": 0.307, "lr": 2.960563616861129e-05, "epoch": 2.0332480818414322, "percentage": 40.66, "elapsed_time": "4:49:14", "remaining_time": "7:02:01"}
796
+ {"current_steps": 796, "total_steps": 1955, "loss": 0.3321, "lr": 2.957429015850985e-05, "epoch": 2.0358056265984654, "percentage": 40.72, "elapsed_time": "4:49:38", "remaining_time": "7:01:43"}
797
+ {"current_steps": 797, "total_steps": 1955, "loss": 0.3132, "lr": 2.9542913608021405e-05, "epoch": 2.0383631713554986, "percentage": 40.77, "elapsed_time": "4:49:54", "remaining_time": "7:01:13"}
798
+ {"current_steps": 798, "total_steps": 1955, "loss": 0.3234, "lr": 2.9511506617231906e-05, "epoch": 2.040920716112532, "percentage": 40.82, "elapsed_time": "4:50:17", "remaining_time": "7:00:53"}
799
+ {"current_steps": 799, "total_steps": 1955, "loss": 0.2968, "lr": 2.948006928632442e-05, "epoch": 2.0434782608695654, "percentage": 40.87, "elapsed_time": "4:50:39", "remaining_time": "7:00:31"}
800
+ {"current_steps": 800, "total_steps": 1955, "loss": 0.3139, "lr": 2.9448601715578774e-05, "epoch": 2.0460358056265986, "percentage": 40.92, "elapsed_time": "4:50:58", "remaining_time": "7:00:05"}
801
+ {"current_steps": 801, "total_steps": 1955, "loss": 0.3174, "lr": 2.9417104005371267e-05, "epoch": 2.0485933503836318, "percentage": 40.97, "elapsed_time": "4:51:15", "remaining_time": "6:59:37"}
802
+ {"current_steps": 802, "total_steps": 1955, "loss": 0.3044, "lr": 2.9385576256174347e-05, "epoch": 2.051150895140665, "percentage": 41.02, "elapsed_time": "4:51:38", "remaining_time": "6:59:16"}
803
+ {"current_steps": 803, "total_steps": 1955, "loss": 0.3064, "lr": 2.9354018568556256e-05, "epoch": 2.053708439897698, "percentage": 41.07, "elapsed_time": "4:51:56", "remaining_time": "6:58:50"}
804
+ {"current_steps": 804, "total_steps": 1955, "loss": 0.3241, "lr": 2.932243104318075e-05, "epoch": 2.0562659846547313, "percentage": 41.13, "elapsed_time": "4:52:16", "remaining_time": "6:58:25"}
805
+ {"current_steps": 805, "total_steps": 1955, "loss": 0.3277, "lr": 2.9290813780806768e-05, "epoch": 2.0588235294117645, "percentage": 41.18, "elapsed_time": "4:52:37", "remaining_time": "6:58:01"}
806
+ {"current_steps": 806, "total_steps": 1955, "loss": 0.32, "lr": 2.9259166882288088e-05, "epoch": 2.061381074168798, "percentage": 41.23, "elapsed_time": "4:52:59", "remaining_time": "6:57:40"}
807
+ {"current_steps": 807, "total_steps": 1955, "loss": 0.3268, "lr": 2.9227490448573047e-05, "epoch": 2.0639386189258313, "percentage": 41.28, "elapsed_time": "4:53:21", "remaining_time": "6:57:19"}
808
+ {"current_steps": 808, "total_steps": 1955, "loss": 0.3294, "lr": 2.919578458070416e-05, "epoch": 2.0664961636828645, "percentage": 41.33, "elapsed_time": "4:53:45", "remaining_time": "6:56:59"}
809
+ {"current_steps": 809, "total_steps": 1955, "loss": 0.3115, "lr": 2.9164049379817866e-05, "epoch": 2.0690537084398977, "percentage": 41.38, "elapsed_time": "4:54:08", "remaining_time": "6:56:40"}
810
+ {"current_steps": 810, "total_steps": 1955, "loss": 0.3049, "lr": 2.913228494714416e-05, "epoch": 2.071611253196931, "percentage": 41.43, "elapsed_time": "4:54:27", "remaining_time": "6:56:14"}
811
+ {"current_steps": 811, "total_steps": 1955, "loss": 0.3363, "lr": 2.910049138400626e-05, "epoch": 2.074168797953964, "percentage": 41.48, "elapsed_time": "4:54:47", "remaining_time": "6:55:49"}
812
+ {"current_steps": 812, "total_steps": 1955, "loss": 0.358, "lr": 2.9068668791820345e-05, "epoch": 2.0767263427109977, "percentage": 41.53, "elapsed_time": "4:55:06", "remaining_time": "6:55:24"}
813
+ {"current_steps": 813, "total_steps": 1955, "loss": 0.3174, "lr": 2.9036817272095158e-05, "epoch": 2.079283887468031, "percentage": 41.59, "elapsed_time": "4:55:28", "remaining_time": "6:55:02"}
814
+ {"current_steps": 814, "total_steps": 1955, "loss": 0.3239, "lr": 2.900493692643173e-05, "epoch": 2.081841432225064, "percentage": 41.64, "elapsed_time": "4:55:52", "remaining_time": "6:54:43"}
815
+ {"current_steps": 815, "total_steps": 1955, "loss": 0.3282, "lr": 2.897302785652305e-05, "epoch": 2.084398976982097, "percentage": 41.69, "elapsed_time": "4:56:14", "remaining_time": "6:54:22"}
816
+ {"current_steps": 816, "total_steps": 1955, "loss": 0.3249, "lr": 2.894109016415371e-05, "epoch": 2.0869565217391304, "percentage": 41.74, "elapsed_time": "4:56:36", "remaining_time": "6:54:00"}
817
+ {"current_steps": 817, "total_steps": 1955, "loss": 0.3053, "lr": 2.890912395119962e-05, "epoch": 2.0895140664961636, "percentage": 41.79, "elapsed_time": "4:56:59", "remaining_time": "6:53:41"}
818
+ {"current_steps": 818, "total_steps": 1955, "loss": 0.3313, "lr": 2.8877129319627667e-05, "epoch": 2.0920716112531967, "percentage": 41.84, "elapsed_time": "4:57:22", "remaining_time": "6:53:20"}
819
+ {"current_steps": 819, "total_steps": 1955, "loss": 0.3286, "lr": 2.8845106371495385e-05, "epoch": 2.0946291560102304, "percentage": 41.89, "elapsed_time": "4:57:42", "remaining_time": "6:52:57"}
820
+ {"current_steps": 820, "total_steps": 1955, "loss": 0.3053, "lr": 2.8813055208950618e-05, "epoch": 2.0971867007672635, "percentage": 41.94, "elapsed_time": "4:58:05", "remaining_time": "6:52:36"}
821
+ {"current_steps": 821, "total_steps": 1955, "loss": 0.3288, "lr": 2.8780975934231238e-05, "epoch": 2.0997442455242967, "percentage": 41.99, "elapsed_time": "4:58:27", "remaining_time": "6:52:15"}
822
+ {"current_steps": 822, "total_steps": 1955, "loss": 0.34, "lr": 2.874886864966477e-05, "epoch": 2.10230179028133, "percentage": 42.05, "elapsed_time": "4:58:50", "remaining_time": "6:51:54"}
823
+ {"current_steps": 823, "total_steps": 1955, "loss": 0.304, "lr": 2.8716733457668086e-05, "epoch": 2.104859335038363, "percentage": 42.1, "elapsed_time": "4:59:11", "remaining_time": "6:51:31"}
824
+ {"current_steps": 824, "total_steps": 1955, "loss": 0.3421, "lr": 2.86845704607471e-05, "epoch": 2.1074168797953963, "percentage": 42.15, "elapsed_time": "4:59:32", "remaining_time": "6:51:08"}
825
+ {"current_steps": 825, "total_steps": 1955, "loss": 0.3289, "lr": 2.8652379761496375e-05, "epoch": 2.10997442455243, "percentage": 42.2, "elapsed_time": "4:59:55", "remaining_time": "6:50:48"}
826
+ {"current_steps": 826, "total_steps": 1955, "loss": 0.3053, "lr": 2.8620161462598886e-05, "epoch": 2.112531969309463, "percentage": 42.25, "elapsed_time": "5:00:18", "remaining_time": "6:50:28"}
827
+ {"current_steps": 827, "total_steps": 1955, "loss": 0.319, "lr": 2.8587915666825626e-05, "epoch": 2.1150895140664963, "percentage": 42.3, "elapsed_time": "5:00:39", "remaining_time": "6:50:05"}
828
+ {"current_steps": 828, "total_steps": 1955, "loss": 0.3104, "lr": 2.8555642477035288e-05, "epoch": 2.1176470588235294, "percentage": 42.35, "elapsed_time": "5:00:56", "remaining_time": "6:49:37"}
829
+ {"current_steps": 829, "total_steps": 1955, "loss": 0.3424, "lr": 2.8523341996173976e-05, "epoch": 2.1202046035805626, "percentage": 42.4, "elapsed_time": "5:01:19", "remaining_time": "6:49:16"}
830
+ {"current_steps": 830, "total_steps": 1955, "loss": 0.2976, "lr": 2.8491014327274812e-05, "epoch": 2.122762148337596, "percentage": 42.46, "elapsed_time": "5:01:36", "remaining_time": "6:48:48"}
831
+ {"current_steps": 831, "total_steps": 1955, "loss": 0.2949, "lr": 2.8458659573457677e-05, "epoch": 2.125319693094629, "percentage": 42.51, "elapsed_time": "5:01:59", "remaining_time": "6:48:28"}
832
+ {"current_steps": 832, "total_steps": 1955, "loss": 0.3298, "lr": 2.842627783792883e-05, "epoch": 2.1278772378516626, "percentage": 42.56, "elapsed_time": "5:02:23", "remaining_time": "6:48:09"}
833
+ {"current_steps": 833, "total_steps": 1955, "loss": 0.323, "lr": 2.839386922398059e-05, "epoch": 2.130434782608696, "percentage": 42.61, "elapsed_time": "5:02:45", "remaining_time": "6:47:48"}
834
+ {"current_steps": 834, "total_steps": 1955, "loss": 0.3196, "lr": 2.8361433834991042e-05, "epoch": 2.132992327365729, "percentage": 42.66, "elapsed_time": "5:03:05", "remaining_time": "6:47:23"}
835
+ {"current_steps": 835, "total_steps": 1955, "loss": 0.3214, "lr": 2.832897177442365e-05, "epoch": 2.135549872122762, "percentage": 42.71, "elapsed_time": "5:03:26", "remaining_time": "6:47:00"}
836
+ {"current_steps": 836, "total_steps": 1955, "loss": 0.3298, "lr": 2.8296483145826964e-05, "epoch": 2.1381074168797953, "percentage": 42.76, "elapsed_time": "5:03:48", "remaining_time": "6:46:39"}
837
+ {"current_steps": 837, "total_steps": 1955, "loss": 0.3132, "lr": 2.8263968052834295e-05, "epoch": 2.1406649616368285, "percentage": 42.81, "elapsed_time": "5:04:09", "remaining_time": "6:46:15"}
838
+ {"current_steps": 838, "total_steps": 1955, "loss": 0.3151, "lr": 2.8231426599163355e-05, "epoch": 2.1432225063938617, "percentage": 42.86, "elapsed_time": "5:04:32", "remaining_time": "6:45:55"}
839
+ {"current_steps": 839, "total_steps": 1955, "loss": 0.3188, "lr": 2.8198858888615947e-05, "epoch": 2.1457800511508953, "percentage": 42.92, "elapsed_time": "5:04:54", "remaining_time": "6:45:34"}
840
+ {"current_steps": 840, "total_steps": 1955, "loss": 0.3358, "lr": 2.816626502507763e-05, "epoch": 2.1483375959079285, "percentage": 42.97, "elapsed_time": "5:05:14", "remaining_time": "6:45:10"}
841
+ {"current_steps": 841, "total_steps": 1955, "loss": 0.2889, "lr": 2.8133645112517388e-05, "epoch": 2.1508951406649617, "percentage": 43.02, "elapsed_time": "5:05:31", "remaining_time": "6:44:42"}
842
+ {"current_steps": 842, "total_steps": 1955, "loss": 0.3322, "lr": 2.8100999254987297e-05, "epoch": 2.153452685421995, "percentage": 43.07, "elapsed_time": "5:05:51", "remaining_time": "6:44:18"}
843
+ {"current_steps": 843, "total_steps": 1955, "loss": 0.3193, "lr": 2.8068327556622193e-05, "epoch": 2.156010230179028, "percentage": 43.12, "elapsed_time": "5:06:13", "remaining_time": "6:43:56"}
844
+ {"current_steps": 844, "total_steps": 1955, "loss": 0.3214, "lr": 2.8035630121639334e-05, "epoch": 2.1585677749360612, "percentage": 43.17, "elapsed_time": "5:06:34", "remaining_time": "6:43:33"}
845
+ {"current_steps": 845, "total_steps": 1955, "loss": 0.3372, "lr": 2.800290705433807e-05, "epoch": 2.1611253196930944, "percentage": 43.22, "elapsed_time": "5:06:59", "remaining_time": "6:43:16"}
846
+ {"current_steps": 846, "total_steps": 1955, "loss": 0.3294, "lr": 2.7970158459099542e-05, "epoch": 2.163682864450128, "percentage": 43.27, "elapsed_time": "5:07:22", "remaining_time": "6:42:55"}
847
+ {"current_steps": 847, "total_steps": 1955, "loss": 0.3105, "lr": 2.793738444038629e-05, "epoch": 2.166240409207161, "percentage": 43.32, "elapsed_time": "5:07:41", "remaining_time": "6:42:30"}
848
+ {"current_steps": 848, "total_steps": 1955, "loss": 0.3208, "lr": 2.7904585102741955e-05, "epoch": 2.1687979539641944, "percentage": 43.38, "elapsed_time": "5:08:03", "remaining_time": "6:42:08"}
849
+ {"current_steps": 849, "total_steps": 1955, "loss": 0.3354, "lr": 2.7871760550790967e-05, "epoch": 2.1713554987212276, "percentage": 43.43, "elapsed_time": "5:08:23", "remaining_time": "6:41:44"}
850
+ {"current_steps": 850, "total_steps": 1955, "loss": 0.34, "lr": 2.783891088923815e-05, "epoch": 2.1739130434782608, "percentage": 43.48, "elapsed_time": "5:08:44", "remaining_time": "6:41:21"}
851
+ {"current_steps": 851, "total_steps": 1955, "loss": 0.3314, "lr": 2.780603622286844e-05, "epoch": 2.176470588235294, "percentage": 43.53, "elapsed_time": "5:09:07", "remaining_time": "6:41:01"}
852
+ {"current_steps": 852, "total_steps": 1955, "loss": 0.3126, "lr": 2.777313665654654e-05, "epoch": 2.1790281329923276, "percentage": 43.58, "elapsed_time": "5:09:27", "remaining_time": "6:40:37"}
853
+ {"current_steps": 853, "total_steps": 1955, "loss": 0.3409, "lr": 2.7740212295216565e-05, "epoch": 2.1815856777493607, "percentage": 43.63, "elapsed_time": "5:09:49", "remaining_time": "6:40:16"}
854
+ {"current_steps": 854, "total_steps": 1955, "loss": 0.3349, "lr": 2.770726324390174e-05, "epoch": 2.184143222506394, "percentage": 43.68, "elapsed_time": "5:10:13", "remaining_time": "6:39:56"}
855
+ {"current_steps": 855, "total_steps": 1955, "loss": 0.3216, "lr": 2.7674289607704032e-05, "epoch": 2.186700767263427, "percentage": 43.73, "elapsed_time": "5:10:37", "remaining_time": "6:39:38"}
856
+ {"current_steps": 856, "total_steps": 1955, "loss": 0.3196, "lr": 2.7641291491803834e-05, "epoch": 2.1892583120204603, "percentage": 43.79, "elapsed_time": "5:10:58", "remaining_time": "6:39:15"}
857
+ {"current_steps": 857, "total_steps": 1955, "loss": 0.3302, "lr": 2.7608269001459634e-05, "epoch": 2.1918158567774935, "percentage": 43.84, "elapsed_time": "5:11:19", "remaining_time": "6:38:52"}
858
+ {"current_steps": 858, "total_steps": 1955, "loss": 0.327, "lr": 2.757522224200765e-05, "epoch": 2.1943734015345266, "percentage": 43.89, "elapsed_time": "5:11:40", "remaining_time": "6:38:29"}
859
+ {"current_steps": 859, "total_steps": 1955, "loss": 0.3246, "lr": 2.754215131886154e-05, "epoch": 2.1969309462915603, "percentage": 43.94, "elapsed_time": "5:12:03", "remaining_time": "6:38:09"}
860
+ {"current_steps": 860, "total_steps": 1955, "loss": 0.3588, "lr": 2.7509056337512015e-05, "epoch": 2.1994884910485935, "percentage": 43.99, "elapsed_time": "5:12:24", "remaining_time": "6:37:47"}
861
+ {"current_steps": 861, "total_steps": 1955, "loss": 0.3191, "lr": 2.747593740352655e-05, "epoch": 2.2020460358056266, "percentage": 44.04, "elapsed_time": "5:12:48", "remaining_time": "6:37:27"}
862
+ {"current_steps": 862, "total_steps": 1955, "loss": 0.3175, "lr": 2.744279462254901e-05, "epoch": 2.20460358056266, "percentage": 44.09, "elapsed_time": "5:13:10", "remaining_time": "6:37:05"}
863
+ {"current_steps": 863, "total_steps": 1955, "loss": 0.3341, "lr": 2.740962810029933e-05, "epoch": 2.207161125319693, "percentage": 44.14, "elapsed_time": "5:13:31", "remaining_time": "6:36:42"}
864
+ {"current_steps": 864, "total_steps": 1955, "loss": 0.304, "lr": 2.7376437942573177e-05, "epoch": 2.209718670076726, "percentage": 44.19, "elapsed_time": "5:13:53", "remaining_time": "6:36:21"}
865
+ {"current_steps": 865, "total_steps": 1955, "loss": 0.3102, "lr": 2.734322425524162e-05, "epoch": 2.21227621483376, "percentage": 44.25, "elapsed_time": "5:14:14", "remaining_time": "6:35:58"}
866
+ {"current_steps": 866, "total_steps": 1955, "loss": 0.3248, "lr": 2.730998714425077e-05, "epoch": 2.214833759590793, "percentage": 44.3, "elapsed_time": "5:14:33", "remaining_time": "6:35:33"}
867
+ {"current_steps": 867, "total_steps": 1955, "loss": 0.3223, "lr": 2.7276726715621468e-05, "epoch": 2.217391304347826, "percentage": 44.35, "elapsed_time": "5:14:57", "remaining_time": "6:35:15"}
868
+ {"current_steps": 868, "total_steps": 1955, "loss": 0.3453, "lr": 2.724344307544892e-05, "epoch": 2.2199488491048593, "percentage": 44.4, "elapsed_time": "5:15:21", "remaining_time": "6:34:55"}
869
+ {"current_steps": 869, "total_steps": 1955, "loss": 0.3431, "lr": 2.721013632990239e-05, "epoch": 2.2225063938618925, "percentage": 44.45, "elapsed_time": "5:15:42", "remaining_time": "6:34:32"}
870
+ {"current_steps": 870, "total_steps": 1955, "loss": 0.3378, "lr": 2.7176806585224818e-05, "epoch": 2.2250639386189257, "percentage": 44.5, "elapsed_time": "5:16:04", "remaining_time": "6:34:11"}
871
+ {"current_steps": 871, "total_steps": 1955, "loss": 0.2963, "lr": 2.714345394773255e-05, "epoch": 2.227621483375959, "percentage": 44.55, "elapsed_time": "5:16:26", "remaining_time": "6:33:49"}
872
+ {"current_steps": 872, "total_steps": 1955, "loss": 0.315, "lr": 2.7110078523814905e-05, "epoch": 2.2301790281329925, "percentage": 44.6, "elapsed_time": "5:16:44", "remaining_time": "6:33:23"}
873
+ {"current_steps": 873, "total_steps": 1955, "loss": 0.3068, "lr": 2.707668041993393e-05, "epoch": 2.2327365728900257, "percentage": 44.65, "elapsed_time": "5:17:06", "remaining_time": "6:33:00"}
874
+ {"current_steps": 874, "total_steps": 1955, "loss": 0.3044, "lr": 2.7043259742623994e-05, "epoch": 2.235294117647059, "percentage": 44.71, "elapsed_time": "5:17:28", "remaining_time": "6:32:40"}
875
+ {"current_steps": 875, "total_steps": 1955, "loss": 0.3062, "lr": 2.7009816598491475e-05, "epoch": 2.237851662404092, "percentage": 44.76, "elapsed_time": "5:17:50", "remaining_time": "6:32:17"}
876
+ {"current_steps": 876, "total_steps": 1955, "loss": 0.3414, "lr": 2.697635109421443e-05, "epoch": 2.2404092071611252, "percentage": 44.81, "elapsed_time": "5:18:12", "remaining_time": "6:31:57"}
877
+ {"current_steps": 877, "total_steps": 1955, "loss": 0.3275, "lr": 2.694286333654221e-05, "epoch": 2.2429667519181584, "percentage": 44.86, "elapsed_time": "5:18:35", "remaining_time": "6:31:37"}
878
+ {"current_steps": 878, "total_steps": 1955, "loss": 0.334, "lr": 2.690935343229519e-05, "epoch": 2.2455242966751916, "percentage": 44.91, "elapsed_time": "5:18:58", "remaining_time": "6:31:15"}
879
+ {"current_steps": 879, "total_steps": 1955, "loss": 0.3429, "lr": 2.687582148836436e-05, "epoch": 2.2480818414322252, "percentage": 44.96, "elapsed_time": "5:19:19", "remaining_time": "6:30:53"}
880
+ {"current_steps": 880, "total_steps": 1955, "loss": 0.3334, "lr": 2.684226761171102e-05, "epoch": 2.2506393861892584, "percentage": 45.01, "elapsed_time": "5:19:42", "remaining_time": "6:30:32"}
881
+ {"current_steps": 881, "total_steps": 1955, "loss": 0.3094, "lr": 2.6808691909366446e-05, "epoch": 2.2531969309462916, "percentage": 45.06, "elapsed_time": "5:20:03", "remaining_time": "6:30:10"}
882
+ {"current_steps": 882, "total_steps": 1955, "loss": 0.3366, "lr": 2.677509448843151e-05, "epoch": 2.2557544757033248, "percentage": 45.12, "elapsed_time": "5:20:24", "remaining_time": "6:29:47"}
883
+ {"current_steps": 883, "total_steps": 1955, "loss": 0.3363, "lr": 2.674147545607638e-05, "epoch": 2.258312020460358, "percentage": 45.17, "elapsed_time": "5:20:47", "remaining_time": "6:29:27"}
884
+ {"current_steps": 884, "total_steps": 1955, "loss": 0.3012, "lr": 2.6707834919540155e-05, "epoch": 2.260869565217391, "percentage": 45.22, "elapsed_time": "5:21:11", "remaining_time": "6:29:07"}
885
+ {"current_steps": 885, "total_steps": 1955, "loss": 0.333, "lr": 2.6674172986130532e-05, "epoch": 2.2634271099744243, "percentage": 45.27, "elapsed_time": "5:21:34", "remaining_time": "6:28:47"}
886
+ {"current_steps": 886, "total_steps": 1955, "loss": 0.3116, "lr": 2.6640489763223455e-05, "epoch": 2.265984654731458, "percentage": 45.32, "elapsed_time": "5:21:57", "remaining_time": "6:28:28"}
887
+ {"current_steps": 887, "total_steps": 1955, "loss": 0.3119, "lr": 2.6606785358262786e-05, "epoch": 2.268542199488491, "percentage": 45.37, "elapsed_time": "5:22:16", "remaining_time": "6:28:02"}
888
+ {"current_steps": 888, "total_steps": 1955, "loss": 0.3366, "lr": 2.6573059878759938e-05, "epoch": 2.2710997442455243, "percentage": 45.42, "elapsed_time": "5:22:37", "remaining_time": "6:27:39"}
889
+ {"current_steps": 889, "total_steps": 1955, "loss": 0.3092, "lr": 2.6539313432293572e-05, "epoch": 2.2736572890025575, "percentage": 45.47, "elapsed_time": "5:22:58", "remaining_time": "6:27:16"}
890
+ {"current_steps": 890, "total_steps": 1955, "loss": 0.2995, "lr": 2.6505546126509217e-05, "epoch": 2.2762148337595907, "percentage": 45.52, "elapsed_time": "5:23:12", "remaining_time": "6:26:45"}
891
+ {"current_steps": 891, "total_steps": 1955, "loss": 0.3179, "lr": 2.6471758069118933e-05, "epoch": 2.2787723785166243, "percentage": 45.58, "elapsed_time": "5:23:36", "remaining_time": "6:26:25"}
892
+ {"current_steps": 892, "total_steps": 1955, "loss": 0.3497, "lr": 2.643794936790098e-05, "epoch": 2.2813299232736575, "percentage": 45.63, "elapsed_time": "5:23:57", "remaining_time": "6:26:03"}
893
+ {"current_steps": 893, "total_steps": 1955, "loss": 0.3282, "lr": 2.640412013069948e-05, "epoch": 2.2838874680306906, "percentage": 45.68, "elapsed_time": "5:24:20", "remaining_time": "6:25:43"}
894
+ {"current_steps": 894, "total_steps": 1955, "loss": 0.3046, "lr": 2.6370270465424047e-05, "epoch": 2.286445012787724, "percentage": 45.73, "elapsed_time": "5:24:40", "remaining_time": "6:25:19"}
895
+ {"current_steps": 895, "total_steps": 1955, "loss": 0.2953, "lr": 2.633640048004946e-05, "epoch": 2.289002557544757, "percentage": 45.78, "elapsed_time": "5:25:02", "remaining_time": "6:24:58"}
896
+ {"current_steps": 896, "total_steps": 1955, "loss": 0.3436, "lr": 2.6302510282615316e-05, "epoch": 2.29156010230179, "percentage": 45.83, "elapsed_time": "5:25:24", "remaining_time": "6:24:36"}
897
+ {"current_steps": 897, "total_steps": 1955, "loss": 0.3117, "lr": 2.6268599981225685e-05, "epoch": 2.2941176470588234, "percentage": 45.88, "elapsed_time": "5:25:47", "remaining_time": "6:24:16"}
898
+ {"current_steps": 898, "total_steps": 1955, "loss": 0.3051, "lr": 2.623466968404877e-05, "epoch": 2.296675191815857, "percentage": 45.93, "elapsed_time": "5:26:08", "remaining_time": "6:23:53"}
899
+ {"current_steps": 899, "total_steps": 1955, "loss": 0.3172, "lr": 2.620071949931656e-05, "epoch": 2.29923273657289, "percentage": 45.98, "elapsed_time": "5:26:29", "remaining_time": "6:23:30"}
900
+ {"current_steps": 900, "total_steps": 1955, "loss": 0.3393, "lr": 2.616674953532446e-05, "epoch": 2.3017902813299234, "percentage": 46.04, "elapsed_time": "5:26:52", "remaining_time": "6:23:09"}
901
+ {"current_steps": 901, "total_steps": 1955, "loss": 0.3628, "lr": 2.6132759900430998e-05, "epoch": 2.3043478260869565, "percentage": 46.09, "elapsed_time": "5:27:15", "remaining_time": "6:22:49"}
902
+ {"current_steps": 902, "total_steps": 1955, "loss": 0.3245, "lr": 2.6098750703057426e-05, "epoch": 2.3069053708439897, "percentage": 46.14, "elapsed_time": "5:27:39", "remaining_time": "6:22:30"}
903
+ {"current_steps": 903, "total_steps": 1955, "loss": 0.3261, "lr": 2.606472205168741e-05, "epoch": 2.309462915601023, "percentage": 46.19, "elapsed_time": "5:27:57", "remaining_time": "6:22:03"}
904
+ {"current_steps": 904, "total_steps": 1955, "loss": 0.3371, "lr": 2.603067405486666e-05, "epoch": 2.312020460358056, "percentage": 46.24, "elapsed_time": "5:28:17", "remaining_time": "6:21:40"}
905
+ {"current_steps": 905, "total_steps": 1955, "loss": 0.3622, "lr": 2.59966068212026e-05, "epoch": 2.3145780051150897, "percentage": 46.29, "elapsed_time": "5:28:33", "remaining_time": "6:21:11"}
906
+ {"current_steps": 906, "total_steps": 1955, "loss": 0.3458, "lr": 2.5962520459364035e-05, "epoch": 2.317135549872123, "percentage": 46.34, "elapsed_time": "5:28:55", "remaining_time": "6:20:50"}
907
+ {"current_steps": 907, "total_steps": 1955, "loss": 0.2972, "lr": 2.5928415078080746e-05, "epoch": 2.319693094629156, "percentage": 46.39, "elapsed_time": "5:29:15", "remaining_time": "6:20:26"}
908
+ {"current_steps": 908, "total_steps": 1955, "loss": 0.3154, "lr": 2.5894290786143214e-05, "epoch": 2.3222506393861893, "percentage": 46.45, "elapsed_time": "5:29:37", "remaining_time": "6:20:05"}
909
+ {"current_steps": 909, "total_steps": 1955, "loss": 0.3015, "lr": 2.5860147692402233e-05, "epoch": 2.3248081841432224, "percentage": 46.5, "elapsed_time": "5:29:59", "remaining_time": "6:19:43"}
910
+ {"current_steps": 910, "total_steps": 1955, "loss": 0.3105, "lr": 2.5825985905768565e-05, "epoch": 2.3273657289002556, "percentage": 46.55, "elapsed_time": "5:30:19", "remaining_time": "6:19:19"}
911
+ {"current_steps": 911, "total_steps": 1955, "loss": 0.3448, "lr": 2.579180553521262e-05, "epoch": 2.329923273657289, "percentage": 46.6, "elapsed_time": "5:30:43", "remaining_time": "6:19:00"}
912
+ {"current_steps": 912, "total_steps": 1955, "loss": 0.3219, "lr": 2.5757606689764057e-05, "epoch": 2.3324808184143224, "percentage": 46.65, "elapsed_time": "5:31:07", "remaining_time": "6:18:40"}
913
+ {"current_steps": 913, "total_steps": 1955, "loss": 0.3591, "lr": 2.5723389478511492e-05, "epoch": 2.3350383631713556, "percentage": 46.7, "elapsed_time": "5:31:30", "remaining_time": "6:18:20"}
914
+ {"current_steps": 914, "total_steps": 1955, "loss": 0.321, "lr": 2.568915401060211e-05, "epoch": 2.337595907928389, "percentage": 46.75, "elapsed_time": "5:31:51", "remaining_time": "6:17:57"}
915
+ {"current_steps": 915, "total_steps": 1955, "loss": 0.3017, "lr": 2.5654900395241346e-05, "epoch": 2.340153452685422, "percentage": 46.8, "elapsed_time": "5:32:11", "remaining_time": "6:17:34"}
916
+ {"current_steps": 916, "total_steps": 1955, "loss": 0.301, "lr": 2.5620628741692504e-05, "epoch": 2.342710997442455, "percentage": 46.85, "elapsed_time": "5:32:32", "remaining_time": "6:17:11"}
917
+ {"current_steps": 917, "total_steps": 1955, "loss": 0.3132, "lr": 2.5586339159276444e-05, "epoch": 2.3452685421994883, "percentage": 46.91, "elapsed_time": "5:32:52", "remaining_time": "6:16:48"}
918
+ {"current_steps": 918, "total_steps": 1955, "loss": 0.3195, "lr": 2.5552031757371206e-05, "epoch": 2.3478260869565215, "percentage": 46.96, "elapsed_time": "5:33:12", "remaining_time": "6:16:24"}
919
+ {"current_steps": 919, "total_steps": 1955, "loss": 0.3219, "lr": 2.551770664541167e-05, "epoch": 2.350383631713555, "percentage": 47.01, "elapsed_time": "5:33:34", "remaining_time": "6:16:03"}
920
+ {"current_steps": 920, "total_steps": 1955, "loss": 0.325, "lr": 2.5483363932889216e-05, "epoch": 2.3529411764705883, "percentage": 47.06, "elapsed_time": "5:33:58", "remaining_time": "6:15:43"}
921
+ {"current_steps": 921, "total_steps": 1955, "loss": 0.3539, "lr": 2.5449003729351365e-05, "epoch": 2.3554987212276215, "percentage": 47.11, "elapsed_time": "5:34:23", "remaining_time": "6:15:24"}
922
+ {"current_steps": 922, "total_steps": 1955, "loss": 0.3276, "lr": 2.541462614440142e-05, "epoch": 2.3580562659846547, "percentage": 47.16, "elapsed_time": "5:34:42", "remaining_time": "6:15:00"}
923
+ {"current_steps": 923, "total_steps": 1955, "loss": 0.3261, "lr": 2.538023128769816e-05, "epoch": 2.360613810741688, "percentage": 47.21, "elapsed_time": "5:35:04", "remaining_time": "6:14:39"}
924
+ {"current_steps": 924, "total_steps": 1955, "loss": 0.3035, "lr": 2.5345819268955403e-05, "epoch": 2.363171355498721, "percentage": 47.26, "elapsed_time": "5:35:28", "remaining_time": "6:14:18"}
925
+ {"current_steps": 925, "total_steps": 1955, "loss": 0.2997, "lr": 2.5311390197941763e-05, "epoch": 2.3657289002557547, "percentage": 47.31, "elapsed_time": "5:35:51", "remaining_time": "6:13:59"}
926
+ {"current_steps": 926, "total_steps": 1955, "loss": 0.3344, "lr": 2.5276944184480224e-05, "epoch": 2.368286445012788, "percentage": 47.37, "elapsed_time": "5:36:14", "remaining_time": "6:13:39"}
927
+ {"current_steps": 927, "total_steps": 1955, "loss": 0.3241, "lr": 2.5242481338447812e-05, "epoch": 2.370843989769821, "percentage": 47.42, "elapsed_time": "5:36:38", "remaining_time": "6:13:18"}
928
+ {"current_steps": 928, "total_steps": 1955, "loss": 0.3217, "lr": 2.520800176977527e-05, "epoch": 2.373401534526854, "percentage": 47.47, "elapsed_time": "5:36:57", "remaining_time": "6:12:54"}
929
+ {"current_steps": 929, "total_steps": 1955, "loss": 0.3298, "lr": 2.5173505588446642e-05, "epoch": 2.3759590792838874, "percentage": 47.52, "elapsed_time": "5:37:19", "remaining_time": "6:12:32"}
930
+ {"current_steps": 930, "total_steps": 1955, "loss": 0.345, "lr": 2.5138992904499e-05, "epoch": 2.3785166240409206, "percentage": 47.57, "elapsed_time": "5:37:40", "remaining_time": "6:12:10"}
931
+ {"current_steps": 931, "total_steps": 1955, "loss": 0.3381, "lr": 2.5104463828022033e-05, "epoch": 2.381074168797954, "percentage": 47.62, "elapsed_time": "5:38:03", "remaining_time": "6:11:50"}
932
+ {"current_steps": 932, "total_steps": 1955, "loss": 0.329, "lr": 2.5069918469157744e-05, "epoch": 2.3836317135549874, "percentage": 47.67, "elapsed_time": "5:38:26", "remaining_time": "6:11:29"}
933
+ {"current_steps": 933, "total_steps": 1955, "loss": 0.3325, "lr": 2.5035356938100045e-05, "epoch": 2.3861892583120206, "percentage": 47.72, "elapsed_time": "5:38:50", "remaining_time": "6:11:10"}
934
+ {"current_steps": 934, "total_steps": 1955, "loss": 0.3208, "lr": 2.5000779345094466e-05, "epoch": 2.3887468030690537, "percentage": 47.77, "elapsed_time": "5:39:09", "remaining_time": "6:10:45"}
935
+ {"current_steps": 935, "total_steps": 1955, "loss": 0.2977, "lr": 2.4966185800437743e-05, "epoch": 2.391304347826087, "percentage": 47.83, "elapsed_time": "5:39:29", "remaining_time": "6:10:21"}
936
+ {"current_steps": 936, "total_steps": 1955, "loss": 0.2902, "lr": 2.493157641447751e-05, "epoch": 2.39386189258312, "percentage": 47.88, "elapsed_time": "5:39:53", "remaining_time": "6:10:02"}
937
+ {"current_steps": 937, "total_steps": 1955, "loss": 0.3014, "lr": 2.489695129761193e-05, "epoch": 2.3964194373401533, "percentage": 47.93, "elapsed_time": "5:40:12", "remaining_time": "6:09:36"}
938
+ {"current_steps": 938, "total_steps": 1955, "loss": 0.3054, "lr": 2.486231056028934e-05, "epoch": 2.398976982097187, "percentage": 47.98, "elapsed_time": "5:40:34", "remaining_time": "6:09:15"}
939
+ {"current_steps": 939, "total_steps": 1955, "loss": 0.3234, "lr": 2.4827654313007917e-05, "epoch": 2.40153452685422, "percentage": 48.03, "elapsed_time": "5:40:56", "remaining_time": "6:08:53"}
940
+ {"current_steps": 940, "total_steps": 1955, "loss": 0.3125, "lr": 2.4792982666315306e-05, "epoch": 2.4040920716112533, "percentage": 48.08, "elapsed_time": "5:41:18", "remaining_time": "6:08:32"}
941
+ {"current_steps": 941, "total_steps": 1955, "loss": 0.3219, "lr": 2.4758295730808253e-05, "epoch": 2.4066496163682864, "percentage": 48.13, "elapsed_time": "5:41:42", "remaining_time": "6:08:12"}
942
+ {"current_steps": 942, "total_steps": 1955, "loss": 0.316, "lr": 2.4723593617132307e-05, "epoch": 2.4092071611253196, "percentage": 48.18, "elapsed_time": "5:42:03", "remaining_time": "6:07:50"}
943
+ {"current_steps": 943, "total_steps": 1955, "loss": 0.3195, "lr": 2.468887643598141e-05, "epoch": 2.411764705882353, "percentage": 48.24, "elapsed_time": "5:42:24", "remaining_time": "6:07:27"}
944
+ {"current_steps": 944, "total_steps": 1955, "loss": 0.323, "lr": 2.4654144298097574e-05, "epoch": 2.414322250639386, "percentage": 48.29, "elapsed_time": "5:42:44", "remaining_time": "6:07:03"}
945
+ {"current_steps": 945, "total_steps": 1955, "loss": 0.3522, "lr": 2.4619397314270527e-05, "epoch": 2.4168797953964196, "percentage": 48.34, "elapsed_time": "5:43:06", "remaining_time": "6:06:42"}
946
+ {"current_steps": 946, "total_steps": 1955, "loss": 0.3437, "lr": 2.4584635595337328e-05, "epoch": 2.419437340153453, "percentage": 48.39, "elapsed_time": "5:43:29", "remaining_time": "6:06:22"}
947
+ {"current_steps": 947, "total_steps": 1955, "loss": 0.3243, "lr": 2.454985925218207e-05, "epoch": 2.421994884910486, "percentage": 48.44, "elapsed_time": "5:43:52", "remaining_time": "6:06:01"}
948
+ {"current_steps": 948, "total_steps": 1955, "loss": 0.3671, "lr": 2.4515068395735488e-05, "epoch": 2.424552429667519, "percentage": 48.49, "elapsed_time": "5:44:14", "remaining_time": "6:05:39"}
949
+ {"current_steps": 949, "total_steps": 1955, "loss": 0.3531, "lr": 2.4480263136974584e-05, "epoch": 2.4271099744245523, "percentage": 48.54, "elapsed_time": "5:44:35", "remaining_time": "6:05:17"}
950
+ {"current_steps": 950, "total_steps": 1955, "loss": 0.3129, "lr": 2.444544358692234e-05, "epoch": 2.4296675191815855, "percentage": 48.59, "elapsed_time": "5:44:58", "remaining_time": "6:04:56"}
951
+ {"current_steps": 951, "total_steps": 1955, "loss": 0.3579, "lr": 2.4410609856647297e-05, "epoch": 2.4322250639386187, "percentage": 48.64, "elapsed_time": "5:45:21", "remaining_time": "6:04:36"}
952
+ {"current_steps": 952, "total_steps": 1955, "loss": 0.3213, "lr": 2.4375762057263243e-05, "epoch": 2.4347826086956523, "percentage": 48.7, "elapsed_time": "5:45:42", "remaining_time": "6:04:13"}
953
+ {"current_steps": 953, "total_steps": 1955, "loss": 0.3158, "lr": 2.4340900299928843e-05, "epoch": 2.4373401534526855, "percentage": 48.75, "elapsed_time": "5:46:03", "remaining_time": "6:03:50"}
954
+ {"current_steps": 954, "total_steps": 1955, "loss": 0.3413, "lr": 2.430602469584727e-05, "epoch": 2.4398976982097187, "percentage": 48.8, "elapsed_time": "5:46:26", "remaining_time": "6:03:30"}
955
+ {"current_steps": 955, "total_steps": 1955, "loss": 0.3219, "lr": 2.4271135356265884e-05, "epoch": 2.442455242966752, "percentage": 48.85, "elapsed_time": "5:46:48", "remaining_time": "6:03:08"}
956
+ {"current_steps": 956, "total_steps": 1955, "loss": 0.3485, "lr": 2.423623239247586e-05, "epoch": 2.445012787723785, "percentage": 48.9, "elapsed_time": "5:47:11", "remaining_time": "6:02:48"}
957
+ {"current_steps": 957, "total_steps": 1955, "loss": 0.3219, "lr": 2.4201315915811815e-05, "epoch": 2.4475703324808182, "percentage": 48.95, "elapsed_time": "5:47:34", "remaining_time": "6:02:28"}
958
+ {"current_steps": 958, "total_steps": 1955, "loss": 0.33, "lr": 2.416638603765149e-05, "epoch": 2.4501278772378514, "percentage": 49.0, "elapsed_time": "5:47:56", "remaining_time": "6:02:06"}
959
+ {"current_steps": 959, "total_steps": 1955, "loss": 0.302, "lr": 2.4131442869415355e-05, "epoch": 2.452685421994885, "percentage": 49.05, "elapsed_time": "5:48:19", "remaining_time": "6:01:45"}
960
+ {"current_steps": 960, "total_steps": 1955, "loss": 0.3052, "lr": 2.4096486522566288e-05, "epoch": 2.455242966751918, "percentage": 49.1, "elapsed_time": "5:48:39", "remaining_time": "6:01:21"}
961
+ {"current_steps": 961, "total_steps": 1955, "loss": 0.3419, "lr": 2.4061517108609187e-05, "epoch": 2.4578005115089514, "percentage": 49.16, "elapsed_time": "5:48:59", "remaining_time": "6:00:58"}
962
+ {"current_steps": 962, "total_steps": 1955, "loss": 0.3144, "lr": 2.4026534739090657e-05, "epoch": 2.4603580562659846, "percentage": 49.21, "elapsed_time": "5:49:22", "remaining_time": "6:00:38"}
963
+ {"current_steps": 963, "total_steps": 1955, "loss": 0.3656, "lr": 2.3991539525598613e-05, "epoch": 2.4629156010230178, "percentage": 49.26, "elapsed_time": "5:49:45", "remaining_time": "6:00:17"}
964
+ {"current_steps": 964, "total_steps": 1955, "loss": 0.3412, "lr": 2.3956531579761948e-05, "epoch": 2.4654731457800514, "percentage": 49.31, "elapsed_time": "5:50:10", "remaining_time": "5:59:58"}
965
+ {"current_steps": 965, "total_steps": 1955, "loss": 0.3339, "lr": 2.3921511013250155e-05, "epoch": 2.4680306905370846, "percentage": 49.36, "elapsed_time": "5:50:33", "remaining_time": "5:59:38"}
966
+ {"current_steps": 966, "total_steps": 1955, "loss": 0.3225, "lr": 2.3886477937772984e-05, "epoch": 2.4705882352941178, "percentage": 49.41, "elapsed_time": "5:50:52", "remaining_time": "5:59:13"}
967
+ {"current_steps": 967, "total_steps": 1955, "loss": 0.3167, "lr": 2.3851432465080124e-05, "epoch": 2.473145780051151, "percentage": 49.46, "elapsed_time": "5:51:13", "remaining_time": "5:58:51"}
968
+ {"current_steps": 968, "total_steps": 1955, "loss": 0.3129, "lr": 2.3816374706960762e-05, "epoch": 2.475703324808184, "percentage": 49.51, "elapsed_time": "5:51:31", "remaining_time": "5:58:25"}
969
+ {"current_steps": 969, "total_steps": 1955, "loss": 0.3213, "lr": 2.378130477524329e-05, "epoch": 2.4782608695652173, "percentage": 49.57, "elapsed_time": "5:51:50", "remaining_time": "5:58:00"}
970
+ {"current_steps": 970, "total_steps": 1955, "loss": 0.3184, "lr": 2.374622278179495e-05, "epoch": 2.4808184143222505, "percentage": 49.62, "elapsed_time": "5:52:14", "remaining_time": "5:57:41"}
971
+ {"current_steps": 971, "total_steps": 1955, "loss": 0.3465, "lr": 2.371112883852143e-05, "epoch": 2.483375959079284, "percentage": 49.67, "elapsed_time": "5:52:36", "remaining_time": "5:57:20"}
972
+ {"current_steps": 972, "total_steps": 1955, "loss": 0.3098, "lr": 2.3676023057366558e-05, "epoch": 2.4859335038363173, "percentage": 49.72, "elapsed_time": "5:53:00", "remaining_time": "5:57:00"}
973
+ {"current_steps": 973, "total_steps": 1955, "loss": 0.3344, "lr": 2.3640905550311915e-05, "epoch": 2.4884910485933505, "percentage": 49.77, "elapsed_time": "5:53:19", "remaining_time": "5:56:35"}
974
+ {"current_steps": 974, "total_steps": 1955, "loss": 0.3345, "lr": 2.360577642937647e-05, "epoch": 2.4910485933503836, "percentage": 49.82, "elapsed_time": "5:53:43", "remaining_time": "5:56:15"}
975
+ {"current_steps": 975, "total_steps": 1955, "loss": 0.3266, "lr": 2.3570635806616276e-05, "epoch": 2.493606138107417, "percentage": 49.87, "elapsed_time": "5:54:06", "remaining_time": "5:55:55"}
976
+ {"current_steps": 976, "total_steps": 1955, "loss": 0.3137, "lr": 2.3535483794124036e-05, "epoch": 2.49616368286445, "percentage": 49.92, "elapsed_time": "5:54:25", "remaining_time": "5:55:30"}
977
+ {"current_steps": 977, "total_steps": 1955, "loss": 0.351, "lr": 2.3500320504028802e-05, "epoch": 2.498721227621483, "percentage": 49.97, "elapsed_time": "5:54:48", "remaining_time": "5:55:09"}
978
+ {"current_steps": 978, "total_steps": 1955, "loss": 0.3494, "lr": 2.3465146048495607e-05, "epoch": 2.501278772378517, "percentage": 50.03, "elapsed_time": "5:55:09", "remaining_time": "5:54:47"}
979
+ {"current_steps": 979, "total_steps": 1955, "loss": 0.3197, "lr": 2.342996053972508e-05, "epoch": 2.50383631713555, "percentage": 50.08, "elapsed_time": "5:55:30", "remaining_time": "5:54:25"}
980
+ {"current_steps": 980, "total_steps": 1955, "loss": 0.3039, "lr": 2.3394764089953127e-05, "epoch": 2.506393861892583, "percentage": 50.13, "elapsed_time": "5:55:55", "remaining_time": "5:54:06"}
981
+ {"current_steps": 981, "total_steps": 1955, "loss": 0.3518, "lr": 2.335955681145055e-05, "epoch": 2.5089514066496164, "percentage": 50.18, "elapsed_time": "5:56:18", "remaining_time": "5:53:45"}
982
+ {"current_steps": 982, "total_steps": 1955, "loss": 0.3102, "lr": 2.332433881652268e-05, "epoch": 2.5115089514066495, "percentage": 50.23, "elapsed_time": "5:56:39", "remaining_time": "5:53:23"}
983
+ {"current_steps": 983, "total_steps": 1955, "loss": 0.351, "lr": 2.3289110217509036e-05, "epoch": 2.5140664961636827, "percentage": 50.28, "elapsed_time": "5:57:03", "remaining_time": "5:53:04"}
984
+ {"current_steps": 984, "total_steps": 1955, "loss": 0.3389, "lr": 2.3253871126782982e-05, "epoch": 2.516624040920716, "percentage": 50.33, "elapsed_time": "5:57:27", "remaining_time": "5:52:44"}
985
+ {"current_steps": 985, "total_steps": 1955, "loss": 0.3298, "lr": 2.3218621656751325e-05, "epoch": 2.5191815856777495, "percentage": 50.38, "elapsed_time": "5:57:48", "remaining_time": "5:52:21"}
986
+ {"current_steps": 986, "total_steps": 1955, "loss": 0.337, "lr": 2.3183361919853988e-05, "epoch": 2.5217391304347827, "percentage": 50.43, "elapsed_time": "5:58:10", "remaining_time": "5:51:59"}
987
+ {"current_steps": 987, "total_steps": 1955, "loss": 0.3347, "lr": 2.3148092028563646e-05, "epoch": 2.524296675191816, "percentage": 50.49, "elapsed_time": "5:58:28", "remaining_time": "5:51:34"}
988
+ {"current_steps": 988, "total_steps": 1955, "loss": 0.3055, "lr": 2.3112812095385362e-05, "epoch": 2.526854219948849, "percentage": 50.54, "elapsed_time": "5:58:52", "remaining_time": "5:51:15"}
989
+ {"current_steps": 989, "total_steps": 1955, "loss": 0.3085, "lr": 2.307752223285624e-05, "epoch": 2.5294117647058822, "percentage": 50.59, "elapsed_time": "5:59:14", "remaining_time": "5:50:52"}
990
+ {"current_steps": 990, "total_steps": 1955, "loss": 0.3495, "lr": 2.3042222553545038e-05, "epoch": 2.531969309462916, "percentage": 50.64, "elapsed_time": "5:59:37", "remaining_time": "5:50:33"}
991
+ {"current_steps": 991, "total_steps": 1955, "loss": 0.334, "lr": 2.3006913170051836e-05, "epoch": 2.5345268542199486, "percentage": 50.69, "elapsed_time": "6:00:02", "remaining_time": "5:50:13"}
992
+ {"current_steps": 992, "total_steps": 1955, "loss": 0.3295, "lr": 2.2971594195007695e-05, "epoch": 2.5370843989769822, "percentage": 50.74, "elapsed_time": "6:00:25", "remaining_time": "5:49:53"}
993
+ {"current_steps": 993, "total_steps": 1955, "loss": 0.3217, "lr": 2.2936265741074225e-05, "epoch": 2.5396419437340154, "percentage": 50.79, "elapsed_time": "6:00:47", "remaining_time": "5:49:31"}
994
+ {"current_steps": 994, "total_steps": 1955, "loss": 0.3421, "lr": 2.2900927920943304e-05, "epoch": 2.5421994884910486, "percentage": 50.84, "elapsed_time": "6:01:07", "remaining_time": "5:49:08"}
995
+ {"current_steps": 995, "total_steps": 1955, "loss": 0.3025, "lr": 2.286558084733668e-05, "epoch": 2.544757033248082, "percentage": 50.9, "elapsed_time": "6:01:27", "remaining_time": "5:48:44"}
996
+ {"current_steps": 996, "total_steps": 1955, "loss": 0.2954, "lr": 2.2830224633005607e-05, "epoch": 2.547314578005115, "percentage": 50.95, "elapsed_time": "6:01:47", "remaining_time": "5:48:21"}
997
+ {"current_steps": 997, "total_steps": 1955, "loss": 0.2948, "lr": 2.279485939073052e-05, "epoch": 2.5498721227621486, "percentage": 51.0, "elapsed_time": "6:02:09", "remaining_time": "5:47:59"}
998
+ {"current_steps": 998, "total_steps": 1955, "loss": 0.3201, "lr": 2.275948523332062e-05, "epoch": 2.5524296675191813, "percentage": 51.05, "elapsed_time": "6:02:32", "remaining_time": "5:47:38"}
999
+ {"current_steps": 999, "total_steps": 1955, "loss": 0.3102, "lr": 2.2724102273613577e-05, "epoch": 2.554987212276215, "percentage": 51.1, "elapsed_time": "6:02:51", "remaining_time": "5:47:14"}
1000
+ {"current_steps": 1000, "total_steps": 1955, "loss": 0.3748, "lr": 2.268871062447512e-05, "epoch": 2.557544757033248, "percentage": 51.15, "elapsed_time": "6:03:14", "remaining_time": "5:46:54"}
1001
+ {"current_steps": 1001, "total_steps": 1955, "loss": 0.3456, "lr": 2.265331039879869e-05, "epoch": 2.5601023017902813, "percentage": 51.2, "elapsed_time": "6:03:38", "remaining_time": "5:46:34"}
1002
+ {"current_steps": 1002, "total_steps": 1955, "loss": 0.3052, "lr": 2.2617901709505115e-05, "epoch": 2.5626598465473145, "percentage": 51.25, "elapsed_time": "6:04:01", "remaining_time": "5:46:13"}
1003
+ {"current_steps": 1003, "total_steps": 1955, "loss": 0.3488, "lr": 2.258248466954219e-05, "epoch": 2.5652173913043477, "percentage": 51.3, "elapsed_time": "6:04:21", "remaining_time": "5:45:49"}
1004
+ {"current_steps": 1004, "total_steps": 1955, "loss": 0.3031, "lr": 2.2547059391884364e-05, "epoch": 2.5677749360613813, "percentage": 51.36, "elapsed_time": "6:04:43", "remaining_time": "5:45:28"}
1005
+ {"current_steps": 1005, "total_steps": 1955, "loss": 0.3217, "lr": 2.251162598953235e-05, "epoch": 2.5703324808184145, "percentage": 51.41, "elapsed_time": "6:05:05", "remaining_time": "5:45:06"}
1006
+ {"current_steps": 1006, "total_steps": 1955, "loss": 0.3247, "lr": 2.2476184575512795e-05, "epoch": 2.5728900255754477, "percentage": 51.46, "elapsed_time": "6:05:27", "remaining_time": "5:44:44"}
1007
+ {"current_steps": 1007, "total_steps": 1955, "loss": 0.2896, "lr": 2.2440735262877884e-05, "epoch": 2.575447570332481, "percentage": 51.51, "elapsed_time": "6:05:47", "remaining_time": "5:44:21"}
1008
+ {"current_steps": 1008, "total_steps": 1955, "loss": 0.3172, "lr": 2.2405278164705015e-05, "epoch": 2.578005115089514, "percentage": 51.56, "elapsed_time": "6:06:11", "remaining_time": "5:44:01"}
1009
+ {"current_steps": 1009, "total_steps": 1955, "loss": 0.3219, "lr": 2.2369813394096403e-05, "epoch": 2.580562659846547, "percentage": 51.61, "elapsed_time": "6:06:32", "remaining_time": "5:43:39"}
1010
+ {"current_steps": 1010, "total_steps": 1955, "loss": 0.3319, "lr": 2.2334341064178737e-05, "epoch": 2.5831202046035804, "percentage": 51.66, "elapsed_time": "6:06:55", "remaining_time": "5:43:18"}
1011
+ {"current_steps": 1011, "total_steps": 1955, "loss": 0.3419, "lr": 2.229886128810285e-05, "epoch": 2.585677749360614, "percentage": 51.71, "elapsed_time": "6:07:14", "remaining_time": "5:42:54"}
1012
+ {"current_steps": 1012, "total_steps": 1955, "loss": 0.3294, "lr": 2.2263374179043283e-05, "epoch": 2.588235294117647, "percentage": 51.76, "elapsed_time": "6:07:35", "remaining_time": "5:42:31"}
1013
+ {"current_steps": 1013, "total_steps": 1955, "loss": 0.3115, "lr": 2.2227879850197995e-05, "epoch": 2.5907928388746804, "percentage": 51.82, "elapsed_time": "6:07:53", "remaining_time": "5:42:06"}
1014
+ {"current_steps": 1014, "total_steps": 1955, "loss": 0.322, "lr": 2.2192378414787976e-05, "epoch": 2.5933503836317136, "percentage": 51.87, "elapsed_time": "6:08:14", "remaining_time": "5:41:43"}
1015
+ {"current_steps": 1015, "total_steps": 1955, "loss": 0.3253, "lr": 2.215686998605686e-05, "epoch": 2.5959079283887467, "percentage": 51.92, "elapsed_time": "6:08:33", "remaining_time": "5:41:19"}
1016
+ {"current_steps": 1016, "total_steps": 1955, "loss": 0.3672, "lr": 2.212135467727062e-05, "epoch": 2.59846547314578, "percentage": 51.97, "elapsed_time": "6:08:55", "remaining_time": "5:40:57"}
1017
+ {"current_steps": 1017, "total_steps": 1955, "loss": 0.338, "lr": 2.2085832601717168e-05, "epoch": 2.601023017902813, "percentage": 52.02, "elapsed_time": "6:09:19", "remaining_time": "5:40:38"}
1018
+ {"current_steps": 1018, "total_steps": 1955, "loss": 0.3187, "lr": 2.2050303872705973e-05, "epoch": 2.6035805626598467, "percentage": 52.07, "elapsed_time": "6:09:41", "remaining_time": "5:40:16"}
1019
+ {"current_steps": 1019, "total_steps": 1955, "loss": 0.3005, "lr": 2.2014768603567767e-05, "epoch": 2.60613810741688, "percentage": 52.12, "elapsed_time": "6:10:05", "remaining_time": "5:39:56"}
1020
+ {"current_steps": 1020, "total_steps": 1955, "loss": 0.3411, "lr": 2.1979226907654115e-05, "epoch": 2.608695652173913, "percentage": 52.17, "elapsed_time": "6:10:29", "remaining_time": "5:39:36"}
1021
+ {"current_steps": 1021, "total_steps": 1955, "loss": 0.3113, "lr": 2.1943678898337087e-05, "epoch": 2.6112531969309463, "percentage": 52.23, "elapsed_time": "6:10:51", "remaining_time": "5:39:15"}
1022
+ {"current_steps": 1022, "total_steps": 1955, "loss": 0.3354, "lr": 2.190812468900892e-05, "epoch": 2.6138107416879794, "percentage": 52.28, "elapsed_time": "6:11:08", "remaining_time": "5:38:49"}
1023
+ {"current_steps": 1023, "total_steps": 1955, "loss": 0.3068, "lr": 2.1872564393081576e-05, "epoch": 2.6163682864450126, "percentage": 52.33, "elapsed_time": "6:11:31", "remaining_time": "5:38:28"}
1024
+ {"current_steps": 1024, "total_steps": 1955, "loss": 0.3269, "lr": 2.1836998123986483e-05, "epoch": 2.618925831202046, "percentage": 52.38, "elapsed_time": "6:11:51", "remaining_time": "5:38:05"}
1025
+ {"current_steps": 1025, "total_steps": 1955, "loss": 0.2779, "lr": 2.1801425995174096e-05, "epoch": 2.6214833759590794, "percentage": 52.43, "elapsed_time": "6:12:11", "remaining_time": "5:37:41"}
1026
+ {"current_steps": 1026, "total_steps": 1955, "loss": 0.3133, "lr": 2.1765848120113564e-05, "epoch": 2.6240409207161126, "percentage": 52.48, "elapsed_time": "6:12:34", "remaining_time": "5:37:21"}
1027
+ {"current_steps": 1027, "total_steps": 1955, "loss": 0.2822, "lr": 2.1730264612292365e-05, "epoch": 2.626598465473146, "percentage": 52.53, "elapsed_time": "6:12:54", "remaining_time": "5:36:57"}
1028
+ {"current_steps": 1028, "total_steps": 1955, "loss": 0.3406, "lr": 2.1694675585215957e-05, "epoch": 2.629156010230179, "percentage": 52.58, "elapsed_time": "6:13:15", "remaining_time": "5:36:34"}
1029
+ {"current_steps": 1029, "total_steps": 1955, "loss": 0.3552, "lr": 2.165908115240739e-05, "epoch": 2.631713554987212, "percentage": 52.63, "elapsed_time": "6:13:34", "remaining_time": "5:36:10"}
1030
+ {"current_steps": 1030, "total_steps": 1955, "loss": 0.3322, "lr": 2.1623481427406952e-05, "epoch": 2.634271099744246, "percentage": 52.69, "elapsed_time": "6:13:52", "remaining_time": "5:35:45"}
1031
+ {"current_steps": 1031, "total_steps": 1955, "loss": 0.3031, "lr": 2.1587876523771833e-05, "epoch": 2.6368286445012785, "percentage": 52.74, "elapsed_time": "6:14:13", "remaining_time": "5:35:22"}
1032
+ {"current_steps": 1032, "total_steps": 1955, "loss": 0.3256, "lr": 2.155226655507573e-05, "epoch": 2.639386189258312, "percentage": 52.79, "elapsed_time": "6:14:36", "remaining_time": "5:35:02"}
1033
+ {"current_steps": 1033, "total_steps": 1955, "loss": 0.2972, "lr": 2.15166516349085e-05, "epoch": 2.6419437340153453, "percentage": 52.84, "elapsed_time": "6:14:58", "remaining_time": "5:34:41"}
1034
+ {"current_steps": 1034, "total_steps": 1955, "loss": 0.3377, "lr": 2.148103187687578e-05, "epoch": 2.6445012787723785, "percentage": 52.89, "elapsed_time": "6:15:21", "remaining_time": "5:34:20"}
1035
+ {"current_steps": 1035, "total_steps": 1955, "loss": 0.3582, "lr": 2.1445407394598656e-05, "epoch": 2.6470588235294117, "percentage": 52.94, "elapsed_time": "6:15:44", "remaining_time": "5:33:59"}
1036
+ {"current_steps": 1036, "total_steps": 1955, "loss": 0.3039, "lr": 2.140977830171328e-05, "epoch": 2.649616368286445, "percentage": 52.99, "elapsed_time": "6:16:05", "remaining_time": "5:33:36"}
1037
+ {"current_steps": 1037, "total_steps": 1955, "loss": 0.3474, "lr": 2.1374144711870514e-05, "epoch": 2.6521739130434785, "percentage": 53.04, "elapsed_time": "6:16:27", "remaining_time": "5:33:15"}
1038
+ {"current_steps": 1038, "total_steps": 1955, "loss": 0.307, "lr": 2.1338506738735552e-05, "epoch": 2.6547314578005117, "percentage": 53.09, "elapsed_time": "6:16:49", "remaining_time": "5:32:53"}
1039
+ {"current_steps": 1039, "total_steps": 1955, "loss": 0.3272, "lr": 2.1302864495987586e-05, "epoch": 2.657289002557545, "percentage": 53.15, "elapsed_time": "6:17:12", "remaining_time": "5:32:33"}
1040
+ {"current_steps": 1040, "total_steps": 1955, "loss": 0.3461, "lr": 2.126721809731941e-05, "epoch": 2.659846547314578, "percentage": 53.2, "elapsed_time": "6:17:32", "remaining_time": "5:32:10"}
1041
+ {"current_steps": 1041, "total_steps": 1955, "loss": 0.3144, "lr": 2.123156765643709e-05, "epoch": 2.662404092071611, "percentage": 53.25, "elapsed_time": "6:17:53", "remaining_time": "5:31:46"}
1042
+ {"current_steps": 1042, "total_steps": 1955, "loss": 0.3302, "lr": 2.1195913287059578e-05, "epoch": 2.6649616368286444, "percentage": 53.3, "elapsed_time": "6:18:15", "remaining_time": "5:31:26"}
1043
+ {"current_steps": 1043, "total_steps": 1955, "loss": 0.3137, "lr": 2.1160255102918357e-05, "epoch": 2.6675191815856776, "percentage": 53.35, "elapsed_time": "6:18:37", "remaining_time": "5:31:04"}
1044
+ {"current_steps": 1044, "total_steps": 1955, "loss": 0.333, "lr": 2.1124593217757092e-05, "epoch": 2.670076726342711, "percentage": 53.4, "elapsed_time": "6:19:01", "remaining_time": "5:30:44"}
1045
+ {"current_steps": 1045, "total_steps": 1955, "loss": 0.3068, "lr": 2.1088927745331224e-05, "epoch": 2.6726342710997444, "percentage": 53.45, "elapsed_time": "6:19:23", "remaining_time": "5:30:23"}
1046
+ {"current_steps": 1046, "total_steps": 1955, "loss": 0.3276, "lr": 2.1053258799407668e-05, "epoch": 2.6751918158567776, "percentage": 53.5, "elapsed_time": "6:19:44", "remaining_time": "5:29:59"}
1047
+ {"current_steps": 1047, "total_steps": 1955, "loss": 0.3097, "lr": 2.1017586493764404e-05, "epoch": 2.6777493606138107, "percentage": 53.55, "elapsed_time": "6:20:06", "remaining_time": "5:29:38"}
1048
+ {"current_steps": 1048, "total_steps": 1955, "loss": 0.3087, "lr": 2.0981910942190123e-05, "epoch": 2.680306905370844, "percentage": 53.61, "elapsed_time": "6:20:29", "remaining_time": "5:29:17"}
1049
+ {"current_steps": 1049, "total_steps": 1955, "loss": 0.3047, "lr": 2.0946232258483888e-05, "epoch": 2.682864450127877, "percentage": 53.66, "elapsed_time": "6:20:51", "remaining_time": "5:28:56"}
1050
+ {"current_steps": 1050, "total_steps": 1955, "loss": 0.3233, "lr": 2.091055055645474e-05, "epoch": 2.6854219948849103, "percentage": 53.71, "elapsed_time": "6:21:14", "remaining_time": "5:28:35"}
1051
+ {"current_steps": 1051, "total_steps": 1955, "loss": 0.3097, "lr": 2.087486594992135e-05, "epoch": 2.687979539641944, "percentage": 53.76, "elapsed_time": "6:21:34", "remaining_time": "5:28:11"}
1052
+ {"current_steps": 1052, "total_steps": 1955, "loss": 0.326, "lr": 2.0839178552711653e-05, "epoch": 2.690537084398977, "percentage": 53.81, "elapsed_time": "6:21:58", "remaining_time": "5:27:52"}
1053
+ {"current_steps": 1053, "total_steps": 1955, "loss": 0.3007, "lr": 2.0803488478662488e-05, "epoch": 2.6930946291560103, "percentage": 53.86, "elapsed_time": "6:22:23", "remaining_time": "5:27:33"}
1054
+ {"current_steps": 1054, "total_steps": 1955, "loss": 0.324, "lr": 2.0767795841619235e-05, "epoch": 2.6956521739130435, "percentage": 53.91, "elapsed_time": "6:22:44", "remaining_time": "5:27:10"}
1055
+ {"current_steps": 1055, "total_steps": 1955, "loss": 0.3136, "lr": 2.0732100755435446e-05, "epoch": 2.6982097186700766, "percentage": 53.96, "elapsed_time": "6:23:04", "remaining_time": "5:26:47"}
1056
+ {"current_steps": 1056, "total_steps": 1955, "loss": 0.3167, "lr": 2.0696403333972483e-05, "epoch": 2.70076726342711, "percentage": 54.02, "elapsed_time": "6:23:25", "remaining_time": "5:26:25"}
1057
+ {"current_steps": 1057, "total_steps": 1955, "loss": 0.3387, "lr": 2.0660703691099154e-05, "epoch": 2.703324808184143, "percentage": 54.07, "elapsed_time": "6:23:48", "remaining_time": "5:26:04"}
1058
+ {"current_steps": 1058, "total_steps": 1955, "loss": 0.3124, "lr": 2.062500194069138e-05, "epoch": 2.7058823529411766, "percentage": 54.12, "elapsed_time": "6:24:10", "remaining_time": "5:25:42"}
1059
+ {"current_steps": 1059, "total_steps": 1955, "loss": 0.2979, "lr": 2.058929819663176e-05, "epoch": 2.70843989769821, "percentage": 54.17, "elapsed_time": "6:24:31", "remaining_time": "5:25:20"}
1060
+ {"current_steps": 1060, "total_steps": 1955, "loss": 0.3174, "lr": 2.0553592572809287e-05, "epoch": 2.710997442455243, "percentage": 54.22, "elapsed_time": "6:24:52", "remaining_time": "5:24:57"}
1061
+ {"current_steps": 1061, "total_steps": 1955, "loss": 0.3318, "lr": 2.051788518311895e-05, "epoch": 2.713554987212276, "percentage": 54.27, "elapsed_time": "6:25:09", "remaining_time": "5:24:32"}
1062
+ {"current_steps": 1062, "total_steps": 1955, "loss": 0.3285, "lr": 2.048217614146134e-05, "epoch": 2.7161125319693094, "percentage": 54.32, "elapsed_time": "6:25:29", "remaining_time": "5:24:08"}
1063
+ {"current_steps": 1063, "total_steps": 1955, "loss": 0.336, "lr": 2.0446465561742346e-05, "epoch": 2.718670076726343, "percentage": 54.37, "elapsed_time": "6:25:52", "remaining_time": "5:23:48"}
1064
+ {"current_steps": 1064, "total_steps": 1955, "loss": 0.319, "lr": 2.041075355787276e-05, "epoch": 2.7212276214833757, "percentage": 54.42, "elapsed_time": "6:26:14", "remaining_time": "5:23:26"}
1065
+ {"current_steps": 1065, "total_steps": 1955, "loss": 0.3066, "lr": 2.0375040243767903e-05, "epoch": 2.7237851662404093, "percentage": 54.48, "elapsed_time": "6:26:37", "remaining_time": "5:23:05"}
1066
+ {"current_steps": 1066, "total_steps": 1955, "loss": 0.2905, "lr": 2.0339325733347294e-05, "epoch": 2.7263427109974425, "percentage": 54.53, "elapsed_time": "6:26:56", "remaining_time": "5:22:41"}
1067
+ {"current_steps": 1067, "total_steps": 1955, "loss": 0.3346, "lr": 2.0303610140534246e-05, "epoch": 2.7289002557544757, "percentage": 54.58, "elapsed_time": "6:27:20", "remaining_time": "5:22:21"}
1068
+ {"current_steps": 1068, "total_steps": 1955, "loss": 0.3194, "lr": 2.0267893579255547e-05, "epoch": 2.731457800511509, "percentage": 54.63, "elapsed_time": "6:27:41", "remaining_time": "5:21:58"}
1069
+ {"current_steps": 1069, "total_steps": 1955, "loss": 0.3272, "lr": 2.0232176163441055e-05, "epoch": 2.734015345268542, "percentage": 54.68, "elapsed_time": "6:28:00", "remaining_time": "5:21:34"}
1070
+ {"current_steps": 1070, "total_steps": 1955, "loss": 0.3344, "lr": 2.0196458007023367e-05, "epoch": 2.7365728900255757, "percentage": 54.73, "elapsed_time": "6:28:20", "remaining_time": "5:21:12"}
1071
+ {"current_steps": 1071, "total_steps": 1955, "loss": 0.3331, "lr": 2.0160739223937447e-05, "epoch": 2.7391304347826084, "percentage": 54.78, "elapsed_time": "6:28:38", "remaining_time": "5:20:46"}
1072
+ {"current_steps": 1072, "total_steps": 1955, "loss": 0.3395, "lr": 2.0125019928120238e-05, "epoch": 2.741687979539642, "percentage": 54.83, "elapsed_time": "6:29:01", "remaining_time": "5:20:26"}
1073
+ {"current_steps": 1073, "total_steps": 1955, "loss": 0.2995, "lr": 2.0089300233510332e-05, "epoch": 2.7442455242966752, "percentage": 54.88, "elapsed_time": "6:29:19", "remaining_time": "5:20:01"}
1074
+ {"current_steps": 1074, "total_steps": 1955, "loss": 0.318, "lr": 2.0053580254047586e-05, "epoch": 2.7468030690537084, "percentage": 54.94, "elapsed_time": "6:29:38", "remaining_time": "5:19:37"}
1075
+ {"current_steps": 1075, "total_steps": 1955, "loss": 0.3234, "lr": 2.0017860103672778e-05, "epoch": 2.7493606138107416, "percentage": 54.99, "elapsed_time": "6:29:57", "remaining_time": "5:19:13"}
1076
+ {"current_steps": 1076, "total_steps": 1955, "loss": 0.3608, "lr": 1.9982139896327232e-05, "epoch": 2.7519181585677748, "percentage": 55.04, "elapsed_time": "6:30:19", "remaining_time": "5:18:51"}
1077
+ {"current_steps": 1077, "total_steps": 1955, "loss": 0.3273, "lr": 1.994641974595242e-05, "epoch": 2.7544757033248084, "percentage": 55.09, "elapsed_time": "6:30:41", "remaining_time": "5:18:30"}
1078
+ {"current_steps": 1078, "total_steps": 1955, "loss": 0.3286, "lr": 1.9910699766489675e-05, "epoch": 2.7570332480818416, "percentage": 55.14, "elapsed_time": "6:31:02", "remaining_time": "5:18:07"}
1079
+ {"current_steps": 1079, "total_steps": 1955, "loss": 0.3344, "lr": 1.987498007187977e-05, "epoch": 2.7595907928388748, "percentage": 55.19, "elapsed_time": "6:31:21", "remaining_time": "5:17:43"}
1080
+ {"current_steps": 1080, "total_steps": 1955, "loss": 0.3407, "lr": 1.9839260776062556e-05, "epoch": 2.762148337595908, "percentage": 55.24, "elapsed_time": "6:31:45", "remaining_time": "5:17:23"}
1081
+ {"current_steps": 1081, "total_steps": 1955, "loss": 0.3352, "lr": 1.9803541992976632e-05, "epoch": 2.764705882352941, "percentage": 55.29, "elapsed_time": "6:32:07", "remaining_time": "5:17:02"}
1082
+ {"current_steps": 1082, "total_steps": 1955, "loss": 0.3375, "lr": 1.976782383655895e-05, "epoch": 2.7672634271099743, "percentage": 55.35, "elapsed_time": "6:32:32", "remaining_time": "5:16:42"}
1083
+ {"current_steps": 1083, "total_steps": 1955, "loss": 0.345, "lr": 1.973210642074446e-05, "epoch": 2.7698209718670075, "percentage": 55.4, "elapsed_time": "6:32:53", "remaining_time": "5:16:20"}
1084
+ {"current_steps": 1084, "total_steps": 1955, "loss": 0.3572, "lr": 1.969638985946576e-05, "epoch": 2.772378516624041, "percentage": 55.45, "elapsed_time": "6:33:13", "remaining_time": "5:15:57"}
1085
+ {"current_steps": 1085, "total_steps": 1955, "loss": 0.3173, "lr": 1.966067426665271e-05, "epoch": 2.7749360613810743, "percentage": 55.5, "elapsed_time": "6:33:32", "remaining_time": "5:15:33"}
1086
+ {"current_steps": 1086, "total_steps": 1955, "loss": 0.344, "lr": 1.96249597562321e-05, "epoch": 2.7774936061381075, "percentage": 55.55, "elapsed_time": "6:33:55", "remaining_time": "5:15:12"}
1087
+ {"current_steps": 1087, "total_steps": 1955, "loss": 0.3454, "lr": 1.958924644212725e-05, "epoch": 2.7800511508951407, "percentage": 55.6, "elapsed_time": "6:34:17", "remaining_time": "5:14:51"}
1088
+ {"current_steps": 1088, "total_steps": 1955, "loss": 0.3408, "lr": 1.9553534438257657e-05, "epoch": 2.782608695652174, "percentage": 55.65, "elapsed_time": "6:34:34", "remaining_time": "5:14:26"}
1089
+ {"current_steps": 1089, "total_steps": 1955, "loss": 0.3812, "lr": 1.9517823858538668e-05, "epoch": 2.785166240409207, "percentage": 55.7, "elapsed_time": "6:34:59", "remaining_time": "5:14:06"}
1090
+ {"current_steps": 1090, "total_steps": 1955, "loss": 0.31, "lr": 1.9482114816881054e-05, "epoch": 2.78772378516624, "percentage": 55.75, "elapsed_time": "6:35:21", "remaining_time": "5:13:44"}
1091
+ {"current_steps": 1091, "total_steps": 1955, "loss": 0.327, "lr": 1.9446407427190713e-05, "epoch": 2.790281329923274, "percentage": 55.81, "elapsed_time": "6:35:44", "remaining_time": "5:13:24"}
1092
+ {"current_steps": 1092, "total_steps": 1955, "loss": 0.3102, "lr": 1.941070180336824e-05, "epoch": 2.792838874680307, "percentage": 55.86, "elapsed_time": "6:36:05", "remaining_time": "5:13:01"}
1093
+ {"current_steps": 1093, "total_steps": 1955, "loss": 0.3031, "lr": 1.9374998059308628e-05, "epoch": 2.79539641943734, "percentage": 55.91, "elapsed_time": "6:36:28", "remaining_time": "5:12:41"}
1094
+ {"current_steps": 1094, "total_steps": 1955, "loss": 0.3159, "lr": 1.933929630890085e-05, "epoch": 2.7979539641943734, "percentage": 55.96, "elapsed_time": "6:36:52", "remaining_time": "5:12:21"}
1095
+ {"current_steps": 1095, "total_steps": 1955, "loss": 0.3369, "lr": 1.9303596666027524e-05, "epoch": 2.8005115089514065, "percentage": 56.01, "elapsed_time": "6:37:11", "remaining_time": "5:11:57"}
1096
+ {"current_steps": 1096, "total_steps": 1955, "loss": 0.2971, "lr": 1.926789924456456e-05, "epoch": 2.80306905370844, "percentage": 56.06, "elapsed_time": "6:37:32", "remaining_time": "5:11:34"}
1097
+ {"current_steps": 1097, "total_steps": 1955, "loss": 0.3122, "lr": 1.9232204158380765e-05, "epoch": 2.805626598465473, "percentage": 56.11, "elapsed_time": "6:37:55", "remaining_time": "5:11:13"}
1098
+ {"current_steps": 1098, "total_steps": 1955, "loss": 0.3483, "lr": 1.919651152133752e-05, "epoch": 2.8081841432225065, "percentage": 56.16, "elapsed_time": "6:38:17", "remaining_time": "5:10:52"}
1099
+ {"current_steps": 1099, "total_steps": 1955, "loss": 0.3082, "lr": 1.9160821447288354e-05, "epoch": 2.8107416879795397, "percentage": 56.21, "elapsed_time": "6:38:40", "remaining_time": "5:10:31"}
1100
+ {"current_steps": 1100, "total_steps": 1955, "loss": 0.3197, "lr": 1.9125134050078652e-05, "epoch": 2.813299232736573, "percentage": 56.27, "elapsed_time": "6:38:58", "remaining_time": "5:10:07"}
1101
+ {"current_steps": 1101, "total_steps": 1955, "loss": 0.3163, "lr": 1.9089449443545264e-05, "epoch": 2.815856777493606, "percentage": 56.32, "elapsed_time": "6:39:20", "remaining_time": "5:09:45"}
1102
+ {"current_steps": 1102, "total_steps": 1955, "loss": 0.3013, "lr": 1.9053767741516112e-05, "epoch": 2.8184143222506393, "percentage": 56.37, "elapsed_time": "6:39:39", "remaining_time": "5:09:21"}
1103
+ {"current_steps": 1103, "total_steps": 1955, "loss": 0.3204, "lr": 1.901808905780988e-05, "epoch": 2.820971867007673, "percentage": 56.42, "elapsed_time": "6:39:58", "remaining_time": "5:08:57"}
1104
+ {"current_steps": 1104, "total_steps": 1955, "loss": 0.3301, "lr": 1.8982413506235606e-05, "epoch": 2.8235294117647056, "percentage": 56.47, "elapsed_time": "6:40:20", "remaining_time": "5:08:36"}
1105
+ {"current_steps": 1105, "total_steps": 1955, "loss": 0.309, "lr": 1.894674120059234e-05, "epoch": 2.8260869565217392, "percentage": 56.52, "elapsed_time": "6:40:43", "remaining_time": "5:08:14"}
1106
+ {"current_steps": 1106, "total_steps": 1955, "loss": 0.2934, "lr": 1.891107225466878e-05, "epoch": 2.8286445012787724, "percentage": 56.57, "elapsed_time": "6:41:03", "remaining_time": "5:07:51"}
1107
+ {"current_steps": 1107, "total_steps": 1955, "loss": 0.3196, "lr": 1.8875406782242915e-05, "epoch": 2.8312020460358056, "percentage": 56.62, "elapsed_time": "6:41:23", "remaining_time": "5:07:28"}
1108
+ {"current_steps": 1108, "total_steps": 1955, "loss": 0.3031, "lr": 1.8839744897081643e-05, "epoch": 2.833759590792839, "percentage": 56.68, "elapsed_time": "6:41:44", "remaining_time": "5:07:06"}
1109
+ {"current_steps": 1109, "total_steps": 1955, "loss": 0.3005, "lr": 1.880408671294043e-05, "epoch": 2.836317135549872, "percentage": 56.73, "elapsed_time": "6:42:09", "remaining_time": "5:06:47"}
1110
+ {"current_steps": 1110, "total_steps": 1955, "loss": 0.3287, "lr": 1.8768432343562915e-05, "epoch": 2.8388746803069056, "percentage": 56.78, "elapsed_time": "6:42:32", "remaining_time": "5:06:26"}
1111
+ {"current_steps": 1111, "total_steps": 1955, "loss": 0.3434, "lr": 1.8732781902680595e-05, "epoch": 2.8414322250639388, "percentage": 56.83, "elapsed_time": "6:42:54", "remaining_time": "5:06:04"}
1112
+ {"current_steps": 1112, "total_steps": 1955, "loss": 0.2954, "lr": 1.8697135504012417e-05, "epoch": 2.843989769820972, "percentage": 56.88, "elapsed_time": "6:43:15", "remaining_time": "5:05:42"}
1113
+ {"current_steps": 1113, "total_steps": 1955, "loss": 0.3169, "lr": 1.8661493261264448e-05, "epoch": 2.846547314578005, "percentage": 56.93, "elapsed_time": "6:43:36", "remaining_time": "5:05:20"}
1114
+ {"current_steps": 1114, "total_steps": 1955, "loss": 0.3471, "lr": 1.8625855288129483e-05, "epoch": 2.8491048593350383, "percentage": 56.98, "elapsed_time": "6:44:00", "remaining_time": "5:04:59"}
1115
+ {"current_steps": 1115, "total_steps": 1955, "loss": 0.3076, "lr": 1.8590221698286722e-05, "epoch": 2.8516624040920715, "percentage": 57.03, "elapsed_time": "6:44:24", "remaining_time": "5:04:39"}
1116
+ {"current_steps": 1116, "total_steps": 1955, "loss": 0.3291, "lr": 1.855459260540135e-05, "epoch": 2.8542199488491047, "percentage": 57.08, "elapsed_time": "6:44:44", "remaining_time": "5:04:16"}
1117
+ {"current_steps": 1117, "total_steps": 1955, "loss": 0.3094, "lr": 1.8518968123124227e-05, "epoch": 2.8567774936061383, "percentage": 57.14, "elapsed_time": "6:45:07", "remaining_time": "5:03:56"}
1118
+ {"current_steps": 1118, "total_steps": 1955, "loss": 0.3397, "lr": 1.848334836509151e-05, "epoch": 2.8593350383631715, "percentage": 57.19, "elapsed_time": "6:45:28", "remaining_time": "5:03:33"}
1119
+ {"current_steps": 1119, "total_steps": 1955, "loss": 0.2936, "lr": 1.844773344492427e-05, "epoch": 2.8618925831202047, "percentage": 57.24, "elapsed_time": "6:45:49", "remaining_time": "5:03:11"}
1120
+ {"current_steps": 1120, "total_steps": 1955, "loss": 0.3141, "lr": 1.8412123476228173e-05, "epoch": 2.864450127877238, "percentage": 57.29, "elapsed_time": "6:46:12", "remaining_time": "5:02:50"}
1121
+ {"current_steps": 1121, "total_steps": 1955, "loss": 0.3163, "lr": 1.8376518572593055e-05, "epoch": 2.867007672634271, "percentage": 57.34, "elapsed_time": "6:46:33", "remaining_time": "5:02:27"}
1122
+ {"current_steps": 1122, "total_steps": 1955, "loss": 0.3139, "lr": 1.8340918847592618e-05, "epoch": 2.869565217391304, "percentage": 57.39, "elapsed_time": "6:46:53", "remaining_time": "5:02:04"}
1123
+ {"current_steps": 1123, "total_steps": 1955, "loss": 0.3355, "lr": 1.830532441478405e-05, "epoch": 2.8721227621483374, "percentage": 57.44, "elapsed_time": "6:47:15", "remaining_time": "5:01:43"}
1124
+ {"current_steps": 1124, "total_steps": 1955, "loss": 0.3355, "lr": 1.8269735387707635e-05, "epoch": 2.874680306905371, "percentage": 57.49, "elapsed_time": "6:47:39", "remaining_time": "5:01:23"}
1125
+ {"current_steps": 1125, "total_steps": 1955, "loss": 0.336, "lr": 1.823415187988644e-05, "epoch": 2.877237851662404, "percentage": 57.54, "elapsed_time": "6:48:01", "remaining_time": "5:01:01"}
1126
+ {"current_steps": 1126, "total_steps": 1955, "loss": 0.2814, "lr": 1.8198574004825914e-05, "epoch": 2.8797953964194374, "percentage": 57.6, "elapsed_time": "6:48:22", "remaining_time": "5:00:39"}
1127
+ {"current_steps": 1127, "total_steps": 1955, "loss": 0.3422, "lr": 1.816300187601352e-05, "epoch": 2.8823529411764706, "percentage": 57.65, "elapsed_time": "6:48:45", "remaining_time": "5:00:18"}
1128
+ {"current_steps": 1128, "total_steps": 1955, "loss": 0.311, "lr": 1.812743560691843e-05, "epoch": 2.8849104859335037, "percentage": 57.7, "elapsed_time": "6:49:04", "remaining_time": "4:59:55"}
1129
+ {"current_steps": 1129, "total_steps": 1955, "loss": 0.3214, "lr": 1.8091875310991088e-05, "epoch": 2.887468030690537, "percentage": 57.75, "elapsed_time": "6:49:27", "remaining_time": "4:59:34"}
1130
+ {"current_steps": 1130, "total_steps": 1955, "loss": 0.3261, "lr": 1.8056321101662916e-05, "epoch": 2.89002557544757, "percentage": 57.8, "elapsed_time": "6:49:45", "remaining_time": "4:59:09"}
1131
+ {"current_steps": 1131, "total_steps": 1955, "loss": 0.3148, "lr": 1.80207730923459e-05, "epoch": 2.8925831202046037, "percentage": 57.85, "elapsed_time": "6:50:06", "remaining_time": "4:58:46"}
1132
+ {"current_steps": 1132, "total_steps": 1955, "loss": 0.3101, "lr": 1.7985231396432243e-05, "epoch": 2.895140664961637, "percentage": 57.9, "elapsed_time": "6:50:28", "remaining_time": "4:58:25"}
1133
+ {"current_steps": 1133, "total_steps": 1955, "loss": 0.3354, "lr": 1.7949696127294033e-05, "epoch": 2.89769820971867, "percentage": 57.95, "elapsed_time": "6:50:49", "remaining_time": "4:58:03"}
1134
+ {"current_steps": 1134, "total_steps": 1955, "loss": 0.3499, "lr": 1.791416739828284e-05, "epoch": 2.9002557544757033, "percentage": 58.01, "elapsed_time": "6:51:09", "remaining_time": "4:57:40"}
1135
+ {"current_steps": 1135, "total_steps": 1955, "loss": 0.353, "lr": 1.787864532272938e-05, "epoch": 2.9028132992327365, "percentage": 58.06, "elapsed_time": "6:51:32", "remaining_time": "4:57:19"}
1136
+ {"current_steps": 1136, "total_steps": 1955, "loss": 0.3157, "lr": 1.784313001394314e-05, "epoch": 2.90537084398977, "percentage": 58.11, "elapsed_time": "6:51:50", "remaining_time": "4:56:55"}
1137
+ {"current_steps": 1137, "total_steps": 1955, "loss": 0.3105, "lr": 1.7807621585212037e-05, "epoch": 2.907928388746803, "percentage": 58.16, "elapsed_time": "6:52:11", "remaining_time": "4:56:32"}
1138
+ {"current_steps": 1138, "total_steps": 1955, "loss": 0.3263, "lr": 1.7772120149802012e-05, "epoch": 2.9104859335038364, "percentage": 58.21, "elapsed_time": "6:52:33", "remaining_time": "4:56:11"}
1139
+ {"current_steps": 1139, "total_steps": 1955, "loss": 0.3311, "lr": 1.7736625820956724e-05, "epoch": 2.9130434782608696, "percentage": 58.26, "elapsed_time": "6:52:55", "remaining_time": "4:55:49"}
1140
+ {"current_steps": 1140, "total_steps": 1955, "loss": 0.318, "lr": 1.7701138711897158e-05, "epoch": 2.915601023017903, "percentage": 58.31, "elapsed_time": "6:53:18", "remaining_time": "4:55:28"}
1141
+ {"current_steps": 1141, "total_steps": 1955, "loss": 0.3339, "lr": 1.7665658935821263e-05, "epoch": 2.918158567774936, "percentage": 58.36, "elapsed_time": "6:53:43", "remaining_time": "4:55:09"}
1142
+ {"current_steps": 1142, "total_steps": 1955, "loss": 0.3508, "lr": 1.763018660590361e-05, "epoch": 2.920716112531969, "percentage": 58.41, "elapsed_time": "6:54:06", "remaining_time": "4:54:48"}
1143
+ {"current_steps": 1143, "total_steps": 1955, "loss": 0.3179, "lr": 1.7594721835294995e-05, "epoch": 2.923273657289003, "percentage": 58.47, "elapsed_time": "6:54:25", "remaining_time": "4:54:24"}
1144
+ {"current_steps": 1144, "total_steps": 1955, "loss": 0.3059, "lr": 1.755926473712212e-05, "epoch": 2.9258312020460355, "percentage": 58.52, "elapsed_time": "6:54:44", "remaining_time": "4:54:01"}
1145
+ {"current_steps": 1145, "total_steps": 1955, "loss": 0.2786, "lr": 1.752381542448721e-05, "epoch": 2.928388746803069, "percentage": 58.57, "elapsed_time": "6:55:06", "remaining_time": "4:53:39"}
1146
+ {"current_steps": 1146, "total_steps": 1955, "loss": 0.3171, "lr": 1.7488374010467652e-05, "epoch": 2.9309462915601023, "percentage": 58.62, "elapsed_time": "6:55:29", "remaining_time": "4:53:18"}
1147
+ {"current_steps": 1147, "total_steps": 1955, "loss": 0.3163, "lr": 1.7452940608115642e-05, "epoch": 2.9335038363171355, "percentage": 58.67, "elapsed_time": "6:55:52", "remaining_time": "4:52:57"}
1148
+ {"current_steps": 1148, "total_steps": 1955, "loss": 0.3185, "lr": 1.7417515330457817e-05, "epoch": 2.9360613810741687, "percentage": 58.72, "elapsed_time": "6:56:15", "remaining_time": "4:52:36"}
1149
+ {"current_steps": 1149, "total_steps": 1955, "loss": 0.337, "lr": 1.738209829049489e-05, "epoch": 2.938618925831202, "percentage": 58.77, "elapsed_time": "6:56:37", "remaining_time": "4:52:15"}
1150
+ {"current_steps": 1150, "total_steps": 1955, "loss": 0.3091, "lr": 1.7346689601201314e-05, "epoch": 2.9411764705882355, "percentage": 58.82, "elapsed_time": "6:56:58", "remaining_time": "4:51:52"}
1151
+ {"current_steps": 1151, "total_steps": 1955, "loss": 0.3283, "lr": 1.7311289375524886e-05, "epoch": 2.9437340153452687, "percentage": 58.87, "elapsed_time": "6:57:18", "remaining_time": "4:51:30"}
1152
+ {"current_steps": 1152, "total_steps": 1955, "loss": 0.3276, "lr": 1.727589772638643e-05, "epoch": 2.946291560102302, "percentage": 58.93, "elapsed_time": "6:57:39", "remaining_time": "4:51:07"}
1153
+ {"current_steps": 1153, "total_steps": 1955, "loss": 0.304, "lr": 1.7240514766679387e-05, "epoch": 2.948849104859335, "percentage": 58.98, "elapsed_time": "6:58:03", "remaining_time": "4:50:47"}
1154
+ {"current_steps": 1154, "total_steps": 1955, "loss": 0.3216, "lr": 1.720514060926949e-05, "epoch": 2.9514066496163682, "percentage": 59.03, "elapsed_time": "6:58:26", "remaining_time": "4:50:26"}
1155
+ {"current_steps": 1155, "total_steps": 1955, "loss": 0.3282, "lr": 1.71697753669944e-05, "epoch": 2.9539641943734014, "percentage": 59.08, "elapsed_time": "6:58:49", "remaining_time": "4:50:05"}
1156
+ {"current_steps": 1156, "total_steps": 1955, "loss": 0.3632, "lr": 1.7134419152663325e-05, "epoch": 2.9565217391304346, "percentage": 59.13, "elapsed_time": "6:59:12", "remaining_time": "4:49:44"}
1157
+ {"current_steps": 1157, "total_steps": 1955, "loss": 0.3193, "lr": 1.7099072079056702e-05, "epoch": 2.959079283887468, "percentage": 59.18, "elapsed_time": "6:59:32", "remaining_time": "4:49:21"}
1158
+ {"current_steps": 1158, "total_steps": 1955, "loss": 0.327, "lr": 1.706373425892578e-05, "epoch": 2.9616368286445014, "percentage": 59.23, "elapsed_time": "6:59:52", "remaining_time": "4:48:59"}
1159
+ {"current_steps": 1159, "total_steps": 1955, "loss": 0.3274, "lr": 1.7028405804992315e-05, "epoch": 2.9641943734015346, "percentage": 59.28, "elapsed_time": "7:00:14", "remaining_time": "4:48:37"}
1160
+ {"current_steps": 1160, "total_steps": 1955, "loss": 0.3413, "lr": 1.6993086829948167e-05, "epoch": 2.9667519181585678, "percentage": 59.34, "elapsed_time": "7:00:33", "remaining_time": "4:48:13"}
1161
+ {"current_steps": 1161, "total_steps": 1955, "loss": 0.3159, "lr": 1.6957777446454972e-05, "epoch": 2.969309462915601, "percentage": 59.39, "elapsed_time": "7:00:53", "remaining_time": "4:47:50"}
1162
+ {"current_steps": 1162, "total_steps": 1955, "loss": 0.3182, "lr": 1.692247776714377e-05, "epoch": 2.971867007672634, "percentage": 59.44, "elapsed_time": "7:01:14", "remaining_time": "4:47:28"}
1163
+ {"current_steps": 1163, "total_steps": 1955, "loss": 0.3323, "lr": 1.6887187904614638e-05, "epoch": 2.9744245524296673, "percentage": 59.49, "elapsed_time": "7:01:37", "remaining_time": "4:47:07"}
1164
+ {"current_steps": 1164, "total_steps": 1955, "loss": 0.3041, "lr": 1.6851907971436364e-05, "epoch": 2.976982097186701, "percentage": 59.54, "elapsed_time": "7:01:59", "remaining_time": "4:46:45"}
1165
+ {"current_steps": 1165, "total_steps": 1955, "loss": 0.3076, "lr": 1.6816638080146022e-05, "epoch": 2.979539641943734, "percentage": 59.59, "elapsed_time": "7:02:21", "remaining_time": "4:46:24"}
1166
+ {"current_steps": 1166, "total_steps": 1955, "loss": 0.3246, "lr": 1.6781378343248682e-05, "epoch": 2.9820971867007673, "percentage": 59.64, "elapsed_time": "7:02:43", "remaining_time": "4:46:02"}
1167
+ {"current_steps": 1167, "total_steps": 1955, "loss": 0.3437, "lr": 1.6746128873217025e-05, "epoch": 2.9846547314578005, "percentage": 59.69, "elapsed_time": "7:03:07", "remaining_time": "4:45:42"}
1168
+ {"current_steps": 1168, "total_steps": 1955, "loss": 0.2999, "lr": 1.6710889782490964e-05, "epoch": 2.9872122762148337, "percentage": 59.74, "elapsed_time": "7:03:28", "remaining_time": "4:45:20"}
1169
+ {"current_steps": 1169, "total_steps": 1955, "loss": 0.2981, "lr": 1.6675661183477328e-05, "epoch": 2.9897698209718673, "percentage": 59.8, "elapsed_time": "7:03:48", "remaining_time": "4:44:57"}
1170
+ {"current_steps": 1170, "total_steps": 1955, "loss": 0.3322, "lr": 1.664044318854946e-05, "epoch": 2.9923273657289, "percentage": 59.85, "elapsed_time": "7:04:07", "remaining_time": "4:44:33"}
1171
+ {"current_steps": 1171, "total_steps": 1955, "loss": 0.3234, "lr": 1.6605235910046876e-05, "epoch": 2.9948849104859336, "percentage": 59.9, "elapsed_time": "7:04:28", "remaining_time": "4:44:11"}
1172
+ {"current_steps": 1172, "total_steps": 1955, "loss": 0.3306, "lr": 1.6570039460274924e-05, "epoch": 2.997442455242967, "percentage": 59.95, "elapsed_time": "7:04:52", "remaining_time": "4:43:51"}
1173
+ {"current_steps": 1173, "total_steps": 1955, "loss": 0.2791, "lr": 1.65348539515044e-05, "epoch": 3.0, "percentage": 60.0, "elapsed_time": "7:05:13", "remaining_time": "4:43:29"}
1174
+ {"current_steps": 1174, "total_steps": 1955, "loss": 0.2421, "lr": 1.64996794959712e-05, "epoch": 3.002557544757033, "percentage": 60.05, "elapsed_time": "7:06:25", "remaining_time": "4:43:40"}
1175
+ {"current_steps": 1175, "total_steps": 1955, "loss": 0.2452, "lr": 1.6464516205875974e-05, "epoch": 3.0051150895140664, "percentage": 60.1, "elapsed_time": "7:06:49", "remaining_time": "4:43:20"}
1176
+ {"current_steps": 1176, "total_steps": 1955, "loss": 0.2298, "lr": 1.642936419338373e-05, "epoch": 3.0076726342710995, "percentage": 60.15, "elapsed_time": "7:07:08", "remaining_time": "4:42:56"}
1177
+ {"current_steps": 1177, "total_steps": 1955, "loss": 0.2713, "lr": 1.6394223570623534e-05, "epoch": 3.010230179028133, "percentage": 60.2, "elapsed_time": "7:07:32", "remaining_time": "4:42:36"}
1178
+ {"current_steps": 1178, "total_steps": 1955, "loss": 0.2563, "lr": 1.6359094449688092e-05, "epoch": 3.0127877237851663, "percentage": 60.26, "elapsed_time": "7:07:54", "remaining_time": "4:42:14"}
1179
+ {"current_steps": 1179, "total_steps": 1955, "loss": 0.2265, "lr": 1.6323976942633445e-05, "epoch": 3.0153452685421995, "percentage": 60.31, "elapsed_time": "7:08:16", "remaining_time": "4:41:53"}