gsmyrnis commited on
Commit
ad6a1a8
·
verified ·
1 Parent(s): 5051d06

Training in progress, epoch 2

Browse files
model-00001-of-00004.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:ebc84336db90dc1633f94ebc28e0f0d5d8ad00905174728f35c145b3be756686
3
  size 4877660776
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f7dc62bfdc55c3feb1d53dfe52ddbbf97ec832f229c5a176f15fd2d7ea878595
3
  size 4877660776
model-00002-of-00004.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:a79af1892742ca3523f4e15304c3ce85db9716926e4c1ff99475283575086575
3
  size 4932751008
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ad22e53c34eaef6d84ce02a1622508fb2c9fe14a7a97d996e06bf968b7c271e1
3
  size 4932751008
model-00003-of-00004.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:13bd40bed7c53f107e8351390bc47b8ff3689aaa376b8ab4475bb0843af684dd
3
  size 4330865200
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d39e5c4468a777c3ddd384e647067b8e5da851ab8c17183d2da18202c941f49c
3
  size 4330865200
model-00004-of-00004.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:ab8894a8ee2b4b455bc656f6a37857368054704d91160d056166417e77602e13
3
  size 1089994880
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f05626dc0f31afdf1b3b4d24ddff2e3dcac84c444178f6a32b229c191ac1c539
3
  size 1089994880
trainer_log.jsonl CHANGED
@@ -983,3 +983,491 @@
983
  {"current_steps": 983, "total_steps": 2440, "loss": 0.3202, "lr": 2.98260507249244e-05, "epoch": 2.0122824974411464, "percentage": 40.29, "elapsed_time": "5:07:19", "remaining_time": "7:35:31"}
984
  {"current_steps": 984, "total_steps": 2440, "loss": 0.3509, "lr": 2.9801119980682095e-05, "epoch": 2.014329580348004, "percentage": 40.33, "elapsed_time": "5:07:37", "remaining_time": "7:35:11"}
985
  {"current_steps": 985, "total_steps": 2440, "loss": 0.3281, "lr": 2.977616917737388e-05, "epoch": 2.016376663254862, "percentage": 40.37, "elapsed_time": "5:07:53", "remaining_time": "7:34:48"}
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
983
  {"current_steps": 983, "total_steps": 2440, "loss": 0.3202, "lr": 2.98260507249244e-05, "epoch": 2.0122824974411464, "percentage": 40.29, "elapsed_time": "5:07:19", "remaining_time": "7:35:31"}
984
  {"current_steps": 984, "total_steps": 2440, "loss": 0.3509, "lr": 2.9801119980682095e-05, "epoch": 2.014329580348004, "percentage": 40.33, "elapsed_time": "5:07:37", "remaining_time": "7:35:11"}
985
  {"current_steps": 985, "total_steps": 2440, "loss": 0.3281, "lr": 2.977616917737388e-05, "epoch": 2.016376663254862, "percentage": 40.37, "elapsed_time": "5:07:53", "remaining_time": "7:34:48"}
986
+ {"current_steps": 986, "total_steps": 2440, "loss": 0.3161, "lr": 2.9751198366064304e-05, "epoch": 2.0184237461617194, "percentage": 40.41, "elapsed_time": "5:08:12", "remaining_time": "7:34:30"}
987
+ {"current_steps": 987, "total_steps": 2440, "loss": 0.3251, "lr": 2.9726207597858872e-05, "epoch": 2.0204708290685773, "percentage": 40.45, "elapsed_time": "5:08:27", "remaining_time": "7:34:06"}
988
+ {"current_steps": 988, "total_steps": 2440, "loss": 0.3391, "lr": 2.9701196923903927e-05, "epoch": 2.022517911975435, "percentage": 40.49, "elapsed_time": "5:08:48", "remaining_time": "7:33:49"}
989
+ {"current_steps": 989, "total_steps": 2440, "loss": 0.361, "lr": 2.9676166395386553e-05, "epoch": 2.024564994882293, "percentage": 40.53, "elapsed_time": "5:09:09", "remaining_time": "7:33:34"}
990
+ {"current_steps": 990, "total_steps": 2440, "loss": 0.312, "lr": 2.965111606353447e-05, "epoch": 2.0266120777891503, "percentage": 40.57, "elapsed_time": "5:09:24", "remaining_time": "7:33:10"}
991
+ {"current_steps": 991, "total_steps": 2440, "loss": 0.3209, "lr": 2.9626045979615928e-05, "epoch": 2.0286591606960083, "percentage": 40.61, "elapsed_time": "5:09:44", "remaining_time": "7:32:53"}
992
+ {"current_steps": 992, "total_steps": 2440, "loss": 0.3498, "lr": 2.9600956194939598e-05, "epoch": 2.030706243602866, "percentage": 40.66, "elapsed_time": "5:10:01", "remaining_time": "7:32:32"}
993
+ {"current_steps": 993, "total_steps": 2440, "loss": 0.3422, "lr": 2.957584676085447e-05, "epoch": 2.0327533265097237, "percentage": 40.7, "elapsed_time": "5:10:22", "remaining_time": "7:32:16"}
994
+ {"current_steps": 994, "total_steps": 2440, "loss": 0.3199, "lr": 2.9550717728749768e-05, "epoch": 2.0348004094165812, "percentage": 40.74, "elapsed_time": "5:10:39", "remaining_time": "7:31:55"}
995
+ {"current_steps": 995, "total_steps": 2440, "loss": 0.2871, "lr": 2.9525569150054796e-05, "epoch": 2.036847492323439, "percentage": 40.78, "elapsed_time": "5:10:54", "remaining_time": "7:31:31"}
996
+ {"current_steps": 996, "total_steps": 2440, "loss": 0.3268, "lr": 2.950040107623887e-05, "epoch": 2.0388945752302967, "percentage": 40.82, "elapsed_time": "5:11:09", "remaining_time": "7:31:07"}
997
+ {"current_steps": 997, "total_steps": 2440, "loss": 0.3268, "lr": 2.947521355881122e-05, "epoch": 2.0409416581371547, "percentage": 40.86, "elapsed_time": "5:11:30", "remaining_time": "7:30:51"}
998
+ {"current_steps": 998, "total_steps": 2440, "loss": 0.325, "lr": 2.9450006649320862e-05, "epoch": 2.042988741044012, "percentage": 40.9, "elapsed_time": "5:11:48", "remaining_time": "7:30:31"}
999
+ {"current_steps": 999, "total_steps": 2440, "loss": 0.3144, "lr": 2.9424780399356497e-05, "epoch": 2.04503582395087, "percentage": 40.94, "elapsed_time": "5:12:07", "remaining_time": "7:30:12"}
1000
+ {"current_steps": 1000, "total_steps": 2440, "loss": 0.3324, "lr": 2.9399534860546404e-05, "epoch": 2.0470829068577276, "percentage": 40.98, "elapsed_time": "5:12:26", "remaining_time": "7:29:54"}
1001
+ {"current_steps": 1001, "total_steps": 2440, "loss": 0.3458, "lr": 2.937427008455835e-05, "epoch": 2.0491299897645856, "percentage": 41.02, "elapsed_time": "5:12:43", "remaining_time": "7:29:34"}
1002
+ {"current_steps": 1002, "total_steps": 2440, "loss": 0.3638, "lr": 2.9348986123099462e-05, "epoch": 2.051177072671443, "percentage": 41.07, "elapsed_time": "5:13:03", "remaining_time": "7:29:17"}
1003
+ {"current_steps": 1003, "total_steps": 2440, "loss": 0.3596, "lr": 2.932368302791614e-05, "epoch": 2.053224155578301, "percentage": 41.11, "elapsed_time": "5:13:24", "remaining_time": "7:29:01"}
1004
+ {"current_steps": 1004, "total_steps": 2440, "loss": 0.3048, "lr": 2.9298360850793944e-05, "epoch": 2.0552712384851586, "percentage": 41.15, "elapsed_time": "5:13:39", "remaining_time": "7:28:37"}
1005
+ {"current_steps": 1005, "total_steps": 2440, "loss": 0.3154, "lr": 2.9273019643557474e-05, "epoch": 2.0573183213920165, "percentage": 41.19, "elapsed_time": "5:13:59", "remaining_time": "7:28:20"}
1006
+ {"current_steps": 1006, "total_steps": 2440, "loss": 0.3397, "lr": 2.92476594580703e-05, "epoch": 2.059365404298874, "percentage": 41.23, "elapsed_time": "5:14:18", "remaining_time": "7:28:01"}
1007
+ {"current_steps": 1007, "total_steps": 2440, "loss": 0.3315, "lr": 2.9222280346234816e-05, "epoch": 2.061412487205732, "percentage": 41.27, "elapsed_time": "5:14:38", "remaining_time": "7:27:44"}
1008
+ {"current_steps": 1008, "total_steps": 2440, "loss": 0.3334, "lr": 2.919688235999215e-05, "epoch": 2.0634595701125895, "percentage": 41.31, "elapsed_time": "5:15:00", "remaining_time": "7:27:30"}
1009
+ {"current_steps": 1009, "total_steps": 2440, "loss": 0.3386, "lr": 2.917146555132206e-05, "epoch": 2.0655066530194475, "percentage": 41.35, "elapsed_time": "5:15:21", "remaining_time": "7:27:14"}
1010
+ {"current_steps": 1010, "total_steps": 2440, "loss": 0.3199, "lr": 2.914602997224285e-05, "epoch": 2.067553735926305, "percentage": 41.39, "elapsed_time": "5:15:42", "remaining_time": "7:26:59"}
1011
+ {"current_steps": 1011, "total_steps": 2440, "loss": 0.3507, "lr": 2.912057567481119e-05, "epoch": 2.069600818833163, "percentage": 41.43, "elapsed_time": "5:15:59", "remaining_time": "7:26:38"}
1012
+ {"current_steps": 1012, "total_steps": 2440, "loss": 0.3462, "lr": 2.909510271112212e-05, "epoch": 2.0716479017400204, "percentage": 41.48, "elapsed_time": "5:16:16", "remaining_time": "7:26:17"}
1013
+ {"current_steps": 1013, "total_steps": 2440, "loss": 0.3271, "lr": 2.906961113330883e-05, "epoch": 2.0736949846468784, "percentage": 41.52, "elapsed_time": "5:16:37", "remaining_time": "7:26:01"}
1014
+ {"current_steps": 1014, "total_steps": 2440, "loss": 0.311, "lr": 2.904410099354263e-05, "epoch": 2.075742067553736, "percentage": 41.56, "elapsed_time": "5:16:52", "remaining_time": "7:25:37"}
1015
+ {"current_steps": 1015, "total_steps": 2440, "loss": 0.3242, "lr": 2.9018572344032823e-05, "epoch": 2.0777891504605934, "percentage": 41.6, "elapsed_time": "5:17:15", "remaining_time": "7:25:25"}
1016
+ {"current_steps": 1016, "total_steps": 2440, "loss": 0.3472, "lr": 2.8993025237026578e-05, "epoch": 2.0798362333674514, "percentage": 41.64, "elapsed_time": "5:17:31", "remaining_time": "7:25:02"}
1017
+ {"current_steps": 1017, "total_steps": 2440, "loss": 0.3055, "lr": 2.8967459724808856e-05, "epoch": 2.0818833162743093, "percentage": 41.68, "elapsed_time": "5:17:46", "remaining_time": "7:24:38"}
1018
+ {"current_steps": 1018, "total_steps": 2440, "loss": 0.3099, "lr": 2.8941875859702283e-05, "epoch": 2.083930399181167, "percentage": 41.72, "elapsed_time": "5:18:06", "remaining_time": "7:24:20"}
1019
+ {"current_steps": 1019, "total_steps": 2440, "loss": 0.3301, "lr": 2.891627369406703e-05, "epoch": 2.0859774820880244, "percentage": 41.76, "elapsed_time": "5:18:30", "remaining_time": "7:24:09"}
1020
+ {"current_steps": 1020, "total_steps": 2440, "loss": 0.3559, "lr": 2.889065328030074e-05, "epoch": 2.0880245649948823, "percentage": 41.8, "elapsed_time": "5:18:50", "remaining_time": "7:23:52"}
1021
+ {"current_steps": 1021, "total_steps": 2440, "loss": 0.3301, "lr": 2.88650146708384e-05, "epoch": 2.09007164790174, "percentage": 41.84, "elapsed_time": "5:19:08", "remaining_time": "7:23:32"}
1022
+ {"current_steps": 1022, "total_steps": 2440, "loss": 0.3413, "lr": 2.883935791815222e-05, "epoch": 2.092118730808598, "percentage": 41.89, "elapsed_time": "5:19:28", "remaining_time": "7:23:16"}
1023
+ {"current_steps": 1023, "total_steps": 2440, "loss": 0.3469, "lr": 2.8813683074751578e-05, "epoch": 2.0941658137154553, "percentage": 41.93, "elapsed_time": "5:19:44", "remaining_time": "7:22:53"}
1024
+ {"current_steps": 1024, "total_steps": 2440, "loss": 0.3339, "lr": 2.878799019318283e-05, "epoch": 2.0962128966223132, "percentage": 41.97, "elapsed_time": "5:20:00", "remaining_time": "7:22:30"}
1025
+ {"current_steps": 1025, "total_steps": 2440, "loss": 0.3278, "lr": 2.8762279326029293e-05, "epoch": 2.0982599795291708, "percentage": 42.01, "elapsed_time": "5:20:20", "remaining_time": "7:22:13"}
1026
+ {"current_steps": 1026, "total_steps": 2440, "loss": 0.3548, "lr": 2.8736550525911066e-05, "epoch": 2.1003070624360287, "percentage": 42.05, "elapsed_time": "5:20:42", "remaining_time": "7:21:58"}
1027
+ {"current_steps": 1027, "total_steps": 2440, "loss": 0.321, "lr": 2.8710803845484955e-05, "epoch": 2.1023541453428862, "percentage": 42.09, "elapsed_time": "5:21:05", "remaining_time": "7:21:45"}
1028
+ {"current_steps": 1028, "total_steps": 2440, "loss": 0.3174, "lr": 2.8685039337444368e-05, "epoch": 2.104401228249744, "percentage": 42.13, "elapsed_time": "5:21:24", "remaining_time": "7:21:28"}
1029
+ {"current_steps": 1029, "total_steps": 2440, "loss": 0.3046, "lr": 2.8659257054519182e-05, "epoch": 2.1064483111566017, "percentage": 42.17, "elapsed_time": "5:21:44", "remaining_time": "7:21:10"}
1030
+ {"current_steps": 1030, "total_steps": 2440, "loss": 0.3526, "lr": 2.8633457049475678e-05, "epoch": 2.1084953940634596, "percentage": 42.21, "elapsed_time": "5:22:05", "remaining_time": "7:20:55"}
1031
+ {"current_steps": 1031, "total_steps": 2440, "loss": 0.3179, "lr": 2.8607639375116388e-05, "epoch": 2.110542476970317, "percentage": 42.25, "elapsed_time": "5:22:26", "remaining_time": "7:20:39"}
1032
+ {"current_steps": 1032, "total_steps": 2440, "loss": 0.3393, "lr": 2.858180408428001e-05, "epoch": 2.112589559877175, "percentage": 42.3, "elapsed_time": "5:22:45", "remaining_time": "7:20:21"}
1033
+ {"current_steps": 1033, "total_steps": 2440, "loss": 0.3248, "lr": 2.855595122984129e-05, "epoch": 2.1146366427840326, "percentage": 42.34, "elapsed_time": "5:23:03", "remaining_time": "7:20:01"}
1034
+ {"current_steps": 1034, "total_steps": 2440, "loss": 0.3283, "lr": 2.853008086471094e-05, "epoch": 2.1166837256908906, "percentage": 42.38, "elapsed_time": "5:23:23", "remaining_time": "7:19:44"}
1035
+ {"current_steps": 1035, "total_steps": 2440, "loss": 0.3048, "lr": 2.8504193041835497e-05, "epoch": 2.118730808597748, "percentage": 42.42, "elapsed_time": "5:23:40", "remaining_time": "7:19:23"}
1036
+ {"current_steps": 1036, "total_steps": 2440, "loss": 0.3667, "lr": 2.847828781419722e-05, "epoch": 2.120777891504606, "percentage": 42.46, "elapsed_time": "5:23:59", "remaining_time": "7:19:04"}
1037
+ {"current_steps": 1037, "total_steps": 2440, "loss": 0.3601, "lr": 2.8452365234813992e-05, "epoch": 2.1228249744114636, "percentage": 42.5, "elapsed_time": "5:24:20", "remaining_time": "7:18:49"}
1038
+ {"current_steps": 1038, "total_steps": 2440, "loss": 0.3289, "lr": 2.842642535673922e-05, "epoch": 2.1248720573183215, "percentage": 42.54, "elapsed_time": "5:24:41", "remaining_time": "7:18:32"}
1039
+ {"current_steps": 1039, "total_steps": 2440, "loss": 0.3147, "lr": 2.8400468233061708e-05, "epoch": 2.126919140225179, "percentage": 42.58, "elapsed_time": "5:25:01", "remaining_time": "7:18:15"}
1040
+ {"current_steps": 1040, "total_steps": 2440, "loss": 0.3269, "lr": 2.8374493916905544e-05, "epoch": 2.128966223132037, "percentage": 42.62, "elapsed_time": "5:25:23", "remaining_time": "7:18:01"}
1041
+ {"current_steps": 1041, "total_steps": 2440, "loss": 0.3076, "lr": 2.834850246143002e-05, "epoch": 2.1310133060388945, "percentage": 42.66, "elapsed_time": "5:25:42", "remaining_time": "7:17:43"}
1042
+ {"current_steps": 1042, "total_steps": 2440, "loss": 0.3315, "lr": 2.832249391982949e-05, "epoch": 2.1330603889457525, "percentage": 42.7, "elapsed_time": "5:26:06", "remaining_time": "7:17:31"}
1043
+ {"current_steps": 1043, "total_steps": 2440, "loss": 0.2945, "lr": 2.8296468345333298e-05, "epoch": 2.13510747185261, "percentage": 42.75, "elapsed_time": "5:26:25", "remaining_time": "7:17:13"}
1044
+ {"current_steps": 1044, "total_steps": 2440, "loss": 0.3556, "lr": 2.827042579120562e-05, "epoch": 2.137154554759468, "percentage": 42.79, "elapsed_time": "5:26:44", "remaining_time": "7:16:54"}
1045
+ {"current_steps": 1045, "total_steps": 2440, "loss": 0.3301, "lr": 2.8244366310745398e-05, "epoch": 2.1392016376663254, "percentage": 42.83, "elapsed_time": "5:27:01", "remaining_time": "7:16:33"}
1046
+ {"current_steps": 1046, "total_steps": 2440, "loss": 0.3672, "lr": 2.8218289957286226e-05, "epoch": 2.1412487205731834, "percentage": 42.87, "elapsed_time": "5:27:19", "remaining_time": "7:16:13"}
1047
+ {"current_steps": 1047, "total_steps": 2440, "loss": 0.3148, "lr": 2.8192196784196198e-05, "epoch": 2.143295803480041, "percentage": 42.91, "elapsed_time": "5:27:39", "remaining_time": "7:15:56"}
1048
+ {"current_steps": 1048, "total_steps": 2440, "loss": 0.3252, "lr": 2.816608684487787e-05, "epoch": 2.145342886386899, "percentage": 42.95, "elapsed_time": "5:27:58", "remaining_time": "7:15:38"}
1049
+ {"current_steps": 1049, "total_steps": 2440, "loss": 0.3354, "lr": 2.813996019276809e-05, "epoch": 2.1473899692937564, "percentage": 42.99, "elapsed_time": "5:28:18", "remaining_time": "7:15:20"}
1050
+ {"current_steps": 1050, "total_steps": 2440, "loss": 0.3146, "lr": 2.8113816881337902e-05, "epoch": 2.1494370522006143, "percentage": 43.03, "elapsed_time": "5:28:38", "remaining_time": "7:15:04"}
1051
+ {"current_steps": 1051, "total_steps": 2440, "loss": 0.3041, "lr": 2.8087656964092472e-05, "epoch": 2.151484135107472, "percentage": 43.07, "elapsed_time": "5:28:57", "remaining_time": "7:14:45"}
1052
+ {"current_steps": 1052, "total_steps": 2440, "loss": 0.3639, "lr": 2.806148049457093e-05, "epoch": 2.15353121801433, "percentage": 43.11, "elapsed_time": "5:29:15", "remaining_time": "7:14:24"}
1053
+ {"current_steps": 1053, "total_steps": 2440, "loss": 0.3317, "lr": 2.803528752634629e-05, "epoch": 2.1555783009211873, "percentage": 43.16, "elapsed_time": "5:29:36", "remaining_time": "7:14:09"}
1054
+ {"current_steps": 1054, "total_steps": 2440, "loss": 0.3363, "lr": 2.8009078113025335e-05, "epoch": 2.1576253838280453, "percentage": 43.2, "elapsed_time": "5:29:57", "remaining_time": "7:13:53"}
1055
+ {"current_steps": 1055, "total_steps": 2440, "loss": 0.3088, "lr": 2.798285230824849e-05, "epoch": 2.1596724667349028, "percentage": 43.24, "elapsed_time": "5:30:15", "remaining_time": "7:13:34"}
1056
+ {"current_steps": 1056, "total_steps": 2440, "loss": 0.3472, "lr": 2.795661016568975e-05, "epoch": 2.1617195496417603, "percentage": 43.28, "elapsed_time": "5:30:35", "remaining_time": "7:13:16"}
1057
+ {"current_steps": 1057, "total_steps": 2440, "loss": 0.347, "lr": 2.7930351739056533e-05, "epoch": 2.1637666325486182, "percentage": 43.32, "elapsed_time": "5:30:54", "remaining_time": "7:12:57"}
1058
+ {"current_steps": 1058, "total_steps": 2440, "loss": 0.325, "lr": 2.7904077082089574e-05, "epoch": 2.1658137154554757, "percentage": 43.36, "elapsed_time": "5:31:11", "remaining_time": "7:12:37"}
1059
+ {"current_steps": 1059, "total_steps": 2440, "loss": 0.3066, "lr": 2.787778624856286e-05, "epoch": 2.1678607983623337, "percentage": 43.4, "elapsed_time": "5:31:28", "remaining_time": "7:12:16"}
1060
+ {"current_steps": 1060, "total_steps": 2440, "loss": 0.3415, "lr": 2.7851479292283442e-05, "epoch": 2.169907881269191, "percentage": 43.44, "elapsed_time": "5:31:47", "remaining_time": "7:11:56"}
1061
+ {"current_steps": 1061, "total_steps": 2440, "loss": 0.3498, "lr": 2.782515626709139e-05, "epoch": 2.171954964176049, "percentage": 43.48, "elapsed_time": "5:32:08", "remaining_time": "7:11:40"}
1062
+ {"current_steps": 1062, "total_steps": 2440, "loss": 0.3311, "lr": 2.7798817226859678e-05, "epoch": 2.1740020470829067, "percentage": 43.52, "elapsed_time": "5:32:27", "remaining_time": "7:11:23"}
1063
+ {"current_steps": 1063, "total_steps": 2440, "loss": 0.3393, "lr": 2.7772462225494013e-05, "epoch": 2.1760491299897646, "percentage": 43.57, "elapsed_time": "5:32:45", "remaining_time": "7:11:03"}
1064
+ {"current_steps": 1064, "total_steps": 2440, "loss": 0.2938, "lr": 2.7746091316932807e-05, "epoch": 2.178096212896622, "percentage": 43.61, "elapsed_time": "5:33:06", "remaining_time": "7:10:47"}
1065
+ {"current_steps": 1065, "total_steps": 2440, "loss": 0.3176, "lr": 2.7719704555147012e-05, "epoch": 2.18014329580348, "percentage": 43.65, "elapsed_time": "5:33:22", "remaining_time": "7:10:25"}
1066
+ {"current_steps": 1066, "total_steps": 2440, "loss": 0.3369, "lr": 2.7693301994140026e-05, "epoch": 2.1821903787103376, "percentage": 43.69, "elapsed_time": "5:33:45", "remaining_time": "7:10:11"}
1067
+ {"current_steps": 1067, "total_steps": 2440, "loss": 0.308, "lr": 2.7666883687947588e-05, "epoch": 2.1842374616171956, "percentage": 43.73, "elapsed_time": "5:34:04", "remaining_time": "7:09:53"}
1068
+ {"current_steps": 1068, "total_steps": 2440, "loss": 0.335, "lr": 2.7640449690637642e-05, "epoch": 2.186284544524053, "percentage": 43.77, "elapsed_time": "5:34:27", "remaining_time": "7:09:39"}
1069
+ {"current_steps": 1069, "total_steps": 2440, "loss": 0.3339, "lr": 2.761400005631028e-05, "epoch": 2.188331627430911, "percentage": 43.81, "elapsed_time": "5:34:47", "remaining_time": "7:09:21"}
1070
+ {"current_steps": 1070, "total_steps": 2440, "loss": 0.3348, "lr": 2.7587534839097556e-05, "epoch": 2.1903787103377685, "percentage": 43.85, "elapsed_time": "5:35:06", "remaining_time": "7:09:03"}
1071
+ {"current_steps": 1071, "total_steps": 2440, "loss": 0.3042, "lr": 2.756105409316345e-05, "epoch": 2.1924257932446265, "percentage": 43.89, "elapsed_time": "5:35:20", "remaining_time": "7:08:38"}
1072
+ {"current_steps": 1072, "total_steps": 2440, "loss": 0.3286, "lr": 2.7534557872703705e-05, "epoch": 2.194472876151484, "percentage": 43.93, "elapsed_time": "5:35:43", "remaining_time": "7:08:25"}
1073
+ {"current_steps": 1073, "total_steps": 2440, "loss": 0.3202, "lr": 2.750804623194574e-05, "epoch": 2.196519959058342, "percentage": 43.98, "elapsed_time": "5:36:05", "remaining_time": "7:08:10"}
1074
+ {"current_steps": 1074, "total_steps": 2440, "loss": 0.3158, "lr": 2.7481519225148537e-05, "epoch": 2.1985670419651995, "percentage": 44.02, "elapsed_time": "5:36:23", "remaining_time": "7:07:51"}
1075
+ {"current_steps": 1075, "total_steps": 2440, "loss": 0.3635, "lr": 2.7454976906602513e-05, "epoch": 2.2006141248720574, "percentage": 44.06, "elapsed_time": "5:36:41", "remaining_time": "7:07:31"}
1076
+ {"current_steps": 1076, "total_steps": 2440, "loss": 0.3378, "lr": 2.742841933062944e-05, "epoch": 2.202661207778915, "percentage": 44.1, "elapsed_time": "5:37:02", "remaining_time": "7:07:14"}
1077
+ {"current_steps": 1077, "total_steps": 2440, "loss": 0.3078, "lr": 2.7401846551582304e-05, "epoch": 2.204708290685773, "percentage": 44.14, "elapsed_time": "5:37:19", "remaining_time": "7:06:54"}
1078
+ {"current_steps": 1078, "total_steps": 2440, "loss": 0.3429, "lr": 2.7375258623845207e-05, "epoch": 2.2067553735926304, "percentage": 44.18, "elapsed_time": "5:37:40", "remaining_time": "7:06:38"}
1079
+ {"current_steps": 1079, "total_steps": 2440, "loss": 0.3338, "lr": 2.7348655601833255e-05, "epoch": 2.2088024564994884, "percentage": 44.22, "elapsed_time": "5:37:57", "remaining_time": "7:06:17"}
1080
+ {"current_steps": 1080, "total_steps": 2440, "loss": 0.3327, "lr": 2.7322037539992457e-05, "epoch": 2.210849539406346, "percentage": 44.26, "elapsed_time": "5:38:16", "remaining_time": "7:05:57"}
1081
+ {"current_steps": 1081, "total_steps": 2440, "loss": 0.3002, "lr": 2.7295404492799575e-05, "epoch": 2.212896622313204, "percentage": 44.3, "elapsed_time": "5:38:33", "remaining_time": "7:05:37"}
1082
+ {"current_steps": 1082, "total_steps": 2440, "loss": 0.3106, "lr": 2.726875651476207e-05, "epoch": 2.2149437052200613, "percentage": 44.34, "elapsed_time": "5:38:51", "remaining_time": "7:05:17"}
1083
+ {"current_steps": 1083, "total_steps": 2440, "loss": 0.364, "lr": 2.7242093660417954e-05, "epoch": 2.2169907881269193, "percentage": 44.39, "elapsed_time": "5:39:12", "remaining_time": "7:05:01"}
1084
+ {"current_steps": 1084, "total_steps": 2440, "loss": 0.2969, "lr": 2.721541598433567e-05, "epoch": 2.219037871033777, "percentage": 44.43, "elapsed_time": "5:39:26", "remaining_time": "7:04:36"}
1085
+ {"current_steps": 1085, "total_steps": 2440, "loss": 0.3346, "lr": 2.718872354111401e-05, "epoch": 2.2210849539406348, "percentage": 44.47, "elapsed_time": "5:39:47", "remaining_time": "7:04:20"}
1086
+ {"current_steps": 1086, "total_steps": 2440, "loss": 0.3648, "lr": 2.7162016385381975e-05, "epoch": 2.2231320368474923, "percentage": 44.51, "elapsed_time": "5:40:05", "remaining_time": "7:04:01"}
1087
+ {"current_steps": 1087, "total_steps": 2440, "loss": 0.3063, "lr": 2.7135294571798706e-05, "epoch": 2.2251791197543502, "percentage": 44.55, "elapsed_time": "5:40:29", "remaining_time": "7:03:49"}
1088
+ {"current_steps": 1088, "total_steps": 2440, "loss": 0.3403, "lr": 2.7108558155053296e-05, "epoch": 2.2272262026612077, "percentage": 44.59, "elapsed_time": "5:40:49", "remaining_time": "7:03:31"}
1089
+ {"current_steps": 1089, "total_steps": 2440, "loss": 0.3583, "lr": 2.7081807189864764e-05, "epoch": 2.2292732855680657, "percentage": 44.63, "elapsed_time": "5:41:09", "remaining_time": "7:03:14"}
1090
+ {"current_steps": 1090, "total_steps": 2440, "loss": 0.3144, "lr": 2.70550417309819e-05, "epoch": 2.231320368474923, "percentage": 44.67, "elapsed_time": "5:41:28", "remaining_time": "7:02:55"}
1091
+ {"current_steps": 1091, "total_steps": 2440, "loss": 0.3376, "lr": 2.7028261833183132e-05, "epoch": 2.233367451381781, "percentage": 44.71, "elapsed_time": "5:41:42", "remaining_time": "7:02:31"}
1092
+ {"current_steps": 1092, "total_steps": 2440, "loss": 0.2973, "lr": 2.7001467551276464e-05, "epoch": 2.2354145342886387, "percentage": 44.75, "elapsed_time": "5:42:01", "remaining_time": "7:02:12"}
1093
+ {"current_steps": 1093, "total_steps": 2440, "loss": 0.3222, "lr": 2.6974658940099337e-05, "epoch": 2.237461617195496, "percentage": 44.8, "elapsed_time": "5:42:18", "remaining_time": "7:01:51"}
1094
+ {"current_steps": 1094, "total_steps": 2440, "loss": 0.3585, "lr": 2.6947836054518484e-05, "epoch": 2.239508700102354, "percentage": 44.84, "elapsed_time": "5:42:36", "remaining_time": "7:01:31"}
1095
+ {"current_steps": 1095, "total_steps": 2440, "loss": 0.309, "lr": 2.6920998949429913e-05, "epoch": 2.241555783009212, "percentage": 44.88, "elapsed_time": "5:42:53", "remaining_time": "7:01:10"}
1096
+ {"current_steps": 1096, "total_steps": 2440, "loss": 0.332, "lr": 2.6894147679758678e-05, "epoch": 2.2436028659160696, "percentage": 44.92, "elapsed_time": "5:43:14", "remaining_time": "7:00:54"}
1097
+ {"current_steps": 1097, "total_steps": 2440, "loss": 0.3365, "lr": 2.6867282300458853e-05, "epoch": 2.245649948822927, "percentage": 44.96, "elapsed_time": "5:43:34", "remaining_time": "7:00:36"}
1098
+ {"current_steps": 1098, "total_steps": 2440, "loss": 0.3361, "lr": 2.684040286651338e-05, "epoch": 2.247697031729785, "percentage": 45.0, "elapsed_time": "5:43:50", "remaining_time": "7:00:14"}
1099
+ {"current_steps": 1099, "total_steps": 2440, "loss": 0.3142, "lr": 2.6813509432933957e-05, "epoch": 2.2497441146366426, "percentage": 45.04, "elapsed_time": "5:44:03", "remaining_time": "6:59:49"}
1100
+ {"current_steps": 1100, "total_steps": 2440, "loss": 0.3078, "lr": 2.6786602054760952e-05, "epoch": 2.2517911975435005, "percentage": 45.08, "elapsed_time": "5:44:20", "remaining_time": "6:59:28"}
1101
+ {"current_steps": 1101, "total_steps": 2440, "loss": 0.3151, "lr": 2.675968078706326e-05, "epoch": 2.253838280450358, "percentage": 45.12, "elapsed_time": "5:44:36", "remaining_time": "6:59:06"}
1102
+ {"current_steps": 1102, "total_steps": 2440, "loss": 0.3243, "lr": 2.673274568493821e-05, "epoch": 2.255885363357216, "percentage": 45.16, "elapsed_time": "5:44:55", "remaining_time": "6:58:47"}
1103
+ {"current_steps": 1103, "total_steps": 2440, "loss": 0.3284, "lr": 2.670579680351143e-05, "epoch": 2.2579324462640735, "percentage": 45.2, "elapsed_time": "5:45:15", "remaining_time": "6:58:30"}
1104
+ {"current_steps": 1104, "total_steps": 2440, "loss": 0.313, "lr": 2.667883419793676e-05, "epoch": 2.2599795291709315, "percentage": 45.25, "elapsed_time": "5:45:35", "remaining_time": "6:58:12"}
1105
+ {"current_steps": 1105, "total_steps": 2440, "loss": 0.3759, "lr": 2.6651857923396132e-05, "epoch": 2.262026612077789, "percentage": 45.29, "elapsed_time": "5:45:55", "remaining_time": "6:57:56"}
1106
+ {"current_steps": 1106, "total_steps": 2440, "loss": 0.3336, "lr": 2.6624868035099445e-05, "epoch": 2.264073694984647, "percentage": 45.33, "elapsed_time": "5:46:13", "remaining_time": "6:57:36"}
1107
+ {"current_steps": 1107, "total_steps": 2440, "loss": 0.3587, "lr": 2.659786458828446e-05, "epoch": 2.2661207778915045, "percentage": 45.37, "elapsed_time": "5:46:31", "remaining_time": "6:57:16"}
1108
+ {"current_steps": 1108, "total_steps": 2440, "loss": 0.3506, "lr": 2.6570847638216698e-05, "epoch": 2.2681678607983624, "percentage": 45.41, "elapsed_time": "5:46:51", "remaining_time": "6:56:58"}
1109
+ {"current_steps": 1109, "total_steps": 2440, "loss": 0.3451, "lr": 2.65438172401893e-05, "epoch": 2.27021494370522, "percentage": 45.45, "elapsed_time": "5:47:09", "remaining_time": "6:56:38"}
1110
+ {"current_steps": 1110, "total_steps": 2440, "loss": 0.3257, "lr": 2.6516773449522936e-05, "epoch": 2.272262026612078, "percentage": 45.49, "elapsed_time": "5:47:27", "remaining_time": "6:56:19"}
1111
+ {"current_steps": 1111, "total_steps": 2440, "loss": 0.3147, "lr": 2.648971632156569e-05, "epoch": 2.2743091095189354, "percentage": 45.53, "elapsed_time": "5:47:46", "remaining_time": "6:56:00"}
1112
+ {"current_steps": 1112, "total_steps": 2440, "loss": 0.2979, "lr": 2.6462645911692938e-05, "epoch": 2.2763561924257933, "percentage": 45.57, "elapsed_time": "5:48:01", "remaining_time": "6:55:37"}
1113
+ {"current_steps": 1113, "total_steps": 2440, "loss": 0.3065, "lr": 2.643556227530724e-05, "epoch": 2.278403275332651, "percentage": 45.61, "elapsed_time": "5:48:21", "remaining_time": "6:55:19"}
1114
+ {"current_steps": 1114, "total_steps": 2440, "loss": 0.332, "lr": 2.6408465467838225e-05, "epoch": 2.280450358239509, "percentage": 45.66, "elapsed_time": "5:48:39", "remaining_time": "6:55:00"}
1115
+ {"current_steps": 1115, "total_steps": 2440, "loss": 0.3963, "lr": 2.6381355544742482e-05, "epoch": 2.2824974411463663, "percentage": 45.7, "elapsed_time": "5:48:59", "remaining_time": "6:54:43"}
1116
+ {"current_steps": 1116, "total_steps": 2440, "loss": 0.3357, "lr": 2.6354232561503433e-05, "epoch": 2.2845445240532243, "percentage": 45.74, "elapsed_time": "5:49:21", "remaining_time": "6:54:28"}
1117
+ {"current_steps": 1117, "total_steps": 2440, "loss": 0.3089, "lr": 2.632709657363124e-05, "epoch": 2.286591606960082, "percentage": 45.78, "elapsed_time": "5:49:36", "remaining_time": "6:54:05"}
1118
+ {"current_steps": 1118, "total_steps": 2440, "loss": 0.3054, "lr": 2.6299947636662673e-05, "epoch": 2.2886386898669397, "percentage": 45.82, "elapsed_time": "5:49:51", "remaining_time": "6:53:42"}
1119
+ {"current_steps": 1119, "total_steps": 2440, "loss": 0.3278, "lr": 2.6272785806161005e-05, "epoch": 2.2906857727737973, "percentage": 45.86, "elapsed_time": "5:50:12", "remaining_time": "6:53:25"}
1120
+ {"current_steps": 1120, "total_steps": 2440, "loss": 0.3519, "lr": 2.6245611137715897e-05, "epoch": 2.292732855680655, "percentage": 45.9, "elapsed_time": "5:50:29", "remaining_time": "6:53:04"}
1121
+ {"current_steps": 1121, "total_steps": 2440, "loss": 0.3239, "lr": 2.621842368694329e-05, "epoch": 2.2947799385875127, "percentage": 45.94, "elapsed_time": "5:50:52", "remaining_time": "6:52:51"}
1122
+ {"current_steps": 1122, "total_steps": 2440, "loss": 0.3286, "lr": 2.6191223509485273e-05, "epoch": 2.2968270214943707, "percentage": 45.98, "elapsed_time": "5:51:13", "remaining_time": "6:52:34"}
1123
+ {"current_steps": 1123, "total_steps": 2440, "loss": 0.3364, "lr": 2.6164010661010007e-05, "epoch": 2.298874104401228, "percentage": 46.02, "elapsed_time": "5:51:34", "remaining_time": "6:52:19"}
1124
+ {"current_steps": 1124, "total_steps": 2440, "loss": 0.3086, "lr": 2.613678519721155e-05, "epoch": 2.300921187308086, "percentage": 46.07, "elapsed_time": "5:51:54", "remaining_time": "6:52:00"}
1125
+ {"current_steps": 1125, "total_steps": 2440, "loss": 0.3215, "lr": 2.61095471738098e-05, "epoch": 2.3029682702149437, "percentage": 46.11, "elapsed_time": "5:52:11", "remaining_time": "6:51:39"}
1126
+ {"current_steps": 1126, "total_steps": 2440, "loss": 0.3114, "lr": 2.6082296646550364e-05, "epoch": 2.3050153531218016, "percentage": 46.15, "elapsed_time": "5:52:28", "remaining_time": "6:51:19"}
1127
+ {"current_steps": 1127, "total_steps": 2440, "loss": 0.3621, "lr": 2.605503367120442e-05, "epoch": 2.307062436028659, "percentage": 46.19, "elapsed_time": "5:52:49", "remaining_time": "6:51:03"}
1128
+ {"current_steps": 1128, "total_steps": 2440, "loss": 0.3196, "lr": 2.6027758303568643e-05, "epoch": 2.309109518935517, "percentage": 46.23, "elapsed_time": "5:53:08", "remaining_time": "6:50:45"}
1129
+ {"current_steps": 1129, "total_steps": 2440, "loss": 0.3068, "lr": 2.6000470599465065e-05, "epoch": 2.3111566018423746, "percentage": 46.27, "elapsed_time": "5:53:28", "remaining_time": "6:50:27"}
1130
+ {"current_steps": 1130, "total_steps": 2440, "loss": 0.373, "lr": 2.5973170614740946e-05, "epoch": 2.313203684749232, "percentage": 46.31, "elapsed_time": "5:53:50", "remaining_time": "6:50:11"}
1131
+ {"current_steps": 1131, "total_steps": 2440, "loss": 0.3413, "lr": 2.5945858405268714e-05, "epoch": 2.31525076765609, "percentage": 46.35, "elapsed_time": "5:54:09", "remaining_time": "6:49:53"}
1132
+ {"current_steps": 1132, "total_steps": 2440, "loss": 0.3559, "lr": 2.5918534026945787e-05, "epoch": 2.317297850562948, "percentage": 46.39, "elapsed_time": "5:54:26", "remaining_time": "6:49:32"}
1133
+ {"current_steps": 1133, "total_steps": 2440, "loss": 0.3367, "lr": 2.5891197535694507e-05, "epoch": 2.3193449334698055, "percentage": 46.43, "elapsed_time": "5:54:48", "remaining_time": "6:49:17"}
1134
+ {"current_steps": 1134, "total_steps": 2440, "loss": 0.3529, "lr": 2.5863848987461993e-05, "epoch": 2.321392016376663, "percentage": 46.48, "elapsed_time": "5:55:08", "remaining_time": "6:49:00"}
1135
+ {"current_steps": 1135, "total_steps": 2440, "loss": 0.3347, "lr": 2.5836488438220044e-05, "epoch": 2.323439099283521, "percentage": 46.52, "elapsed_time": "5:55:27", "remaining_time": "6:48:41"}
1136
+ {"current_steps": 1136, "total_steps": 2440, "loss": 0.3366, "lr": 2.5809115943965027e-05, "epoch": 2.325486182190379, "percentage": 46.56, "elapsed_time": "5:55:45", "remaining_time": "6:48:22"}
1137
+ {"current_steps": 1137, "total_steps": 2440, "loss": 0.3106, "lr": 2.5781731560717745e-05, "epoch": 2.3275332650972365, "percentage": 46.6, "elapsed_time": "5:56:06", "remaining_time": "6:48:05"}
1138
+ {"current_steps": 1138, "total_steps": 2440, "loss": 0.3396, "lr": 2.575433534452334e-05, "epoch": 2.329580348004094, "percentage": 46.64, "elapsed_time": "5:56:24", "remaining_time": "6:47:46"}
1139
+ {"current_steps": 1139, "total_steps": 2440, "loss": 0.3439, "lr": 2.5726927351451178e-05, "epoch": 2.331627430910952, "percentage": 46.68, "elapsed_time": "5:56:40", "remaining_time": "6:47:24"}
1140
+ {"current_steps": 1140, "total_steps": 2440, "loss": 0.304, "lr": 2.5699507637594706e-05, "epoch": 2.3336745138178094, "percentage": 46.72, "elapsed_time": "5:56:57", "remaining_time": "6:47:03"}
1141
+ {"current_steps": 1141, "total_steps": 2440, "loss": 0.3276, "lr": 2.5672076259071385e-05, "epoch": 2.3357215967246674, "percentage": 46.76, "elapsed_time": "5:57:20", "remaining_time": "6:46:49"}
1142
+ {"current_steps": 1142, "total_steps": 2440, "loss": 0.36, "lr": 2.5644633272022536e-05, "epoch": 2.337768679631525, "percentage": 46.8, "elapsed_time": "5:57:41", "remaining_time": "6:46:32"}
1143
+ {"current_steps": 1143, "total_steps": 2440, "loss": 0.3062, "lr": 2.561717873261323e-05, "epoch": 2.339815762538383, "percentage": 46.84, "elapsed_time": "5:58:03", "remaining_time": "6:46:17"}
1144
+ {"current_steps": 1144, "total_steps": 2440, "loss": 0.3555, "lr": 2.558971269703219e-05, "epoch": 2.3418628454452404, "percentage": 46.89, "elapsed_time": "5:58:21", "remaining_time": "6:45:58"}
1145
+ {"current_steps": 1145, "total_steps": 2440, "loss": 0.3433, "lr": 2.556223522149168e-05, "epoch": 2.3439099283520983, "percentage": 46.93, "elapsed_time": "5:58:41", "remaining_time": "6:45:40"}
1146
+ {"current_steps": 1146, "total_steps": 2440, "loss": 0.3507, "lr": 2.5534746362227355e-05, "epoch": 2.345957011258956, "percentage": 46.97, "elapsed_time": "5:59:01", "remaining_time": "6:45:23"}
1147
+ {"current_steps": 1147, "total_steps": 2440, "loss": 0.3178, "lr": 2.5507246175498174e-05, "epoch": 2.348004094165814, "percentage": 47.01, "elapsed_time": "5:59:19", "remaining_time": "6:45:03"}
1148
+ {"current_steps": 1148, "total_steps": 2440, "loss": 0.3124, "lr": 2.5479734717586285e-05, "epoch": 2.3500511770726713, "percentage": 47.05, "elapsed_time": "5:59:36", "remaining_time": "6:44:43"}
1149
+ {"current_steps": 1149, "total_steps": 2440, "loss": 0.3179, "lr": 2.5452212044796912e-05, "epoch": 2.3520982599795293, "percentage": 47.09, "elapsed_time": "5:59:53", "remaining_time": "6:44:22"}
1150
+ {"current_steps": 1150, "total_steps": 2440, "loss": 0.2982, "lr": 2.5424678213458202e-05, "epoch": 2.3541453428863868, "percentage": 47.13, "elapsed_time": "6:00:08", "remaining_time": "6:43:59"}
1151
+ {"current_steps": 1151, "total_steps": 2440, "loss": 0.329, "lr": 2.539713327992117e-05, "epoch": 2.3561924257932447, "percentage": 47.17, "elapsed_time": "6:00:31", "remaining_time": "6:43:45"}
1152
+ {"current_steps": 1152, "total_steps": 2440, "loss": 0.3495, "lr": 2.5369577300559544e-05, "epoch": 2.3582395087001022, "percentage": 47.21, "elapsed_time": "6:00:47", "remaining_time": "6:43:23"}
1153
+ {"current_steps": 1153, "total_steps": 2440, "loss": 0.3218, "lr": 2.5342010331769635e-05, "epoch": 2.36028659160696, "percentage": 47.25, "elapsed_time": "6:01:06", "remaining_time": "6:43:04"}
1154
+ {"current_steps": 1154, "total_steps": 2440, "loss": 0.3714, "lr": 2.531443242997029e-05, "epoch": 2.3623336745138177, "percentage": 47.3, "elapsed_time": "6:01:25", "remaining_time": "6:42:45"}
1155
+ {"current_steps": 1155, "total_steps": 2440, "loss": 0.33, "lr": 2.5286843651602688e-05, "epoch": 2.3643807574206757, "percentage": 47.34, "elapsed_time": "6:01:43", "remaining_time": "6:42:26"}
1156
+ {"current_steps": 1156, "total_steps": 2440, "loss": 0.3338, "lr": 2.5259244053130295e-05, "epoch": 2.366427840327533, "percentage": 47.38, "elapsed_time": "6:02:04", "remaining_time": "6:42:10"}
1157
+ {"current_steps": 1157, "total_steps": 2440, "loss": 0.3303, "lr": 2.5231633691038716e-05, "epoch": 2.368474923234391, "percentage": 47.42, "elapsed_time": "6:02:21", "remaining_time": "6:41:48"}
1158
+ {"current_steps": 1158, "total_steps": 2440, "loss": 0.3108, "lr": 2.5204012621835575e-05, "epoch": 2.3705220061412486, "percentage": 47.46, "elapsed_time": "6:02:39", "remaining_time": "6:41:28"}
1159
+ {"current_steps": 1159, "total_steps": 2440, "loss": 0.3398, "lr": 2.5176380902050418e-05, "epoch": 2.3725690890481066, "percentage": 47.5, "elapsed_time": "6:02:54", "remaining_time": "6:41:06"}
1160
+ {"current_steps": 1160, "total_steps": 2440, "loss": 0.3199, "lr": 2.5148738588234593e-05, "epoch": 2.374616171954964, "percentage": 47.54, "elapsed_time": "6:03:09", "remaining_time": "6:40:43"}
1161
+ {"current_steps": 1161, "total_steps": 2440, "loss": 0.3288, "lr": 2.5121085736961112e-05, "epoch": 2.376663254861822, "percentage": 47.58, "elapsed_time": "6:03:30", "remaining_time": "6:40:26"}
1162
+ {"current_steps": 1162, "total_steps": 2440, "loss": 0.3483, "lr": 2.5093422404824574e-05, "epoch": 2.3787103377686796, "percentage": 47.62, "elapsed_time": "6:03:50", "remaining_time": "6:40:09"}
1163
+ {"current_steps": 1163, "total_steps": 2440, "loss": 0.3439, "lr": 2.506574864844102e-05, "epoch": 2.3807574206755375, "percentage": 47.66, "elapsed_time": "6:04:08", "remaining_time": "6:39:50"}
1164
+ {"current_steps": 1164, "total_steps": 2440, "loss": 0.3461, "lr": 2.5038064524447827e-05, "epoch": 2.382804503582395, "percentage": 47.7, "elapsed_time": "6:04:30", "remaining_time": "6:39:34"}
1165
+ {"current_steps": 1165, "total_steps": 2440, "loss": 0.3243, "lr": 2.5010370089503578e-05, "epoch": 2.384851586489253, "percentage": 47.75, "elapsed_time": "6:04:48", "remaining_time": "6:39:15"}
1166
+ {"current_steps": 1166, "total_steps": 2440, "loss": 0.3411, "lr": 2.4982665400287972e-05, "epoch": 2.3868986693961105, "percentage": 47.79, "elapsed_time": "6:05:08", "remaining_time": "6:38:57"}
1167
+ {"current_steps": 1167, "total_steps": 2440, "loss": 0.3319, "lr": 2.4954950513501697e-05, "epoch": 2.3889457523029685, "percentage": 47.83, "elapsed_time": "6:05:22", "remaining_time": "6:38:34"}
1168
+ {"current_steps": 1168, "total_steps": 2440, "loss": 0.3479, "lr": 2.4927225485866297e-05, "epoch": 2.390992835209826, "percentage": 47.87, "elapsed_time": "6:05:39", "remaining_time": "6:38:12"}
1169
+ {"current_steps": 1169, "total_steps": 2440, "loss": 0.3429, "lr": 2.4899490374124085e-05, "epoch": 2.393039918116684, "percentage": 47.91, "elapsed_time": "6:06:00", "remaining_time": "6:37:56"}
1170
+ {"current_steps": 1170, "total_steps": 2440, "loss": 0.3472, "lr": 2.4871745235038006e-05, "epoch": 2.3950870010235414, "percentage": 47.95, "elapsed_time": "6:06:19", "remaining_time": "6:37:37"}
1171
+ {"current_steps": 1171, "total_steps": 2440, "loss": 0.328, "lr": 2.4843990125391516e-05, "epoch": 2.397134083930399, "percentage": 47.99, "elapsed_time": "6:06:35", "remaining_time": "6:37:16"}
1172
+ {"current_steps": 1172, "total_steps": 2440, "loss": 0.3391, "lr": 2.4816225101988506e-05, "epoch": 2.399181166837257, "percentage": 48.03, "elapsed_time": "6:06:54", "remaining_time": "6:36:57"}
1173
+ {"current_steps": 1173, "total_steps": 2440, "loss": 0.3667, "lr": 2.478845022165313e-05, "epoch": 2.401228249744115, "percentage": 48.07, "elapsed_time": "6:07:14", "remaining_time": "6:36:39"}
1174
+ {"current_steps": 1174, "total_steps": 2440, "loss": 0.3301, "lr": 2.4760665541229712e-05, "epoch": 2.4032753326509724, "percentage": 48.11, "elapsed_time": "6:07:31", "remaining_time": "6:36:19"}
1175
+ {"current_steps": 1175, "total_steps": 2440, "loss": 0.3401, "lr": 2.473287111758267e-05, "epoch": 2.40532241555783, "percentage": 48.16, "elapsed_time": "6:07:50", "remaining_time": "6:36:01"}
1176
+ {"current_steps": 1176, "total_steps": 2440, "loss": 0.3218, "lr": 2.470506700759631e-05, "epoch": 2.407369498464688, "percentage": 48.2, "elapsed_time": "6:08:09", "remaining_time": "6:35:42"}
1177
+ {"current_steps": 1177, "total_steps": 2440, "loss": 0.3113, "lr": 2.467725326817481e-05, "epoch": 2.409416581371546, "percentage": 48.24, "elapsed_time": "6:08:26", "remaining_time": "6:35:21"}
1178
+ {"current_steps": 1178, "total_steps": 2440, "loss": 0.3269, "lr": 2.464942995624203e-05, "epoch": 2.4114636642784033, "percentage": 48.28, "elapsed_time": "6:08:46", "remaining_time": "6:35:03"}
1179
+ {"current_steps": 1179, "total_steps": 2440, "loss": 0.3411, "lr": 2.462159712874142e-05, "epoch": 2.413510747185261, "percentage": 48.32, "elapsed_time": "6:09:02", "remaining_time": "6:34:42"}
1180
+ {"current_steps": 1180, "total_steps": 2440, "loss": 0.3036, "lr": 2.4593754842635917e-05, "epoch": 2.4155578300921188, "percentage": 48.36, "elapsed_time": "6:09:16", "remaining_time": "6:34:18"}
1181
+ {"current_steps": 1181, "total_steps": 2440, "loss": 0.3898, "lr": 2.4565903154907807e-05, "epoch": 2.4176049129989763, "percentage": 48.4, "elapsed_time": "6:09:37", "remaining_time": "6:34:02"}
1182
+ {"current_steps": 1182, "total_steps": 2440, "loss": 0.3427, "lr": 2.453804212255862e-05, "epoch": 2.4196519959058342, "percentage": 48.44, "elapsed_time": "6:09:56", "remaining_time": "6:33:43"}
1183
+ {"current_steps": 1183, "total_steps": 2440, "loss": 0.3271, "lr": 2.451017180260902e-05, "epoch": 2.4216990788126918, "percentage": 48.48, "elapsed_time": "6:10:08", "remaining_time": "6:33:18"}
1184
+ {"current_steps": 1184, "total_steps": 2440, "loss": 0.3298, "lr": 2.448229225209865e-05, "epoch": 2.4237461617195497, "percentage": 48.52, "elapsed_time": "6:10:23", "remaining_time": "6:32:55"}
1185
+ {"current_steps": 1185, "total_steps": 2440, "loss": 0.3323, "lr": 2.4454403528086088e-05, "epoch": 2.425793244626407, "percentage": 48.57, "elapsed_time": "6:10:41", "remaining_time": "6:32:34"}
1186
+ {"current_steps": 1186, "total_steps": 2440, "loss": 0.3387, "lr": 2.4426505687648653e-05, "epoch": 2.427840327533265, "percentage": 48.61, "elapsed_time": "6:11:01", "remaining_time": "6:32:17"}
1187
+ {"current_steps": 1187, "total_steps": 2440, "loss": 0.3449, "lr": 2.4398598787882334e-05, "epoch": 2.4298874104401227, "percentage": 48.65, "elapsed_time": "6:11:20", "remaining_time": "6:31:58"}
1188
+ {"current_steps": 1188, "total_steps": 2440, "loss": 0.3006, "lr": 2.4370682885901657e-05, "epoch": 2.4319344933469806, "percentage": 48.69, "elapsed_time": "6:11:34", "remaining_time": "6:31:36"}
1189
+ {"current_steps": 1189, "total_steps": 2440, "loss": 0.3354, "lr": 2.4342758038839573e-05, "epoch": 2.433981576253838, "percentage": 48.73, "elapsed_time": "6:11:53", "remaining_time": "6:31:16"}
1190
+ {"current_steps": 1190, "total_steps": 2440, "loss": 0.3273, "lr": 2.4314824303847342e-05, "epoch": 2.436028659160696, "percentage": 48.77, "elapsed_time": "6:12:09", "remaining_time": "6:30:55"}
1191
+ {"current_steps": 1191, "total_steps": 2440, "loss": 0.3334, "lr": 2.4286881738094418e-05, "epoch": 2.4380757420675536, "percentage": 48.81, "elapsed_time": "6:12:28", "remaining_time": "6:30:36"}
1192
+ {"current_steps": 1192, "total_steps": 2440, "loss": 0.3405, "lr": 2.4258930398768317e-05, "epoch": 2.4401228249744116, "percentage": 48.85, "elapsed_time": "6:12:48", "remaining_time": "6:30:19"}
1193
+ {"current_steps": 1193, "total_steps": 2440, "loss": 0.2964, "lr": 2.423097034307452e-05, "epoch": 2.442169907881269, "percentage": 48.89, "elapsed_time": "6:13:01", "remaining_time": "6:29:54"}
1194
+ {"current_steps": 1194, "total_steps": 2440, "loss": 0.3122, "lr": 2.4203001628236346e-05, "epoch": 2.444216990788127, "percentage": 48.93, "elapsed_time": "6:13:18", "remaining_time": "6:29:34"}
1195
+ {"current_steps": 1195, "total_steps": 2440, "loss": 0.37, "lr": 2.4175024311494835e-05, "epoch": 2.4462640736949846, "percentage": 48.98, "elapsed_time": "6:13:38", "remaining_time": "6:29:16"}
1196
+ {"current_steps": 1196, "total_steps": 2440, "loss": 0.3462, "lr": 2.4147038450108627e-05, "epoch": 2.4483111566018425, "percentage": 49.02, "elapsed_time": "6:13:59", "remaining_time": "6:28:59"}
1197
+ {"current_steps": 1197, "total_steps": 2440, "loss": 0.3089, "lr": 2.4119044101353853e-05, "epoch": 2.4503582395087, "percentage": 49.06, "elapsed_time": "6:14:18", "remaining_time": "6:28:41"}
1198
+ {"current_steps": 1198, "total_steps": 2440, "loss": 0.3891, "lr": 2.4091041322524023e-05, "epoch": 2.452405322415558, "percentage": 49.1, "elapsed_time": "6:14:37", "remaining_time": "6:28:23"}
1199
+ {"current_steps": 1199, "total_steps": 2440, "loss": 0.3672, "lr": 2.406303017092988e-05, "epoch": 2.4544524053224155, "percentage": 49.14, "elapsed_time": "6:14:59", "remaining_time": "6:28:08"}
1200
+ {"current_steps": 1200, "total_steps": 2440, "loss": 0.3446, "lr": 2.403501070389932e-05, "epoch": 2.4564994882292734, "percentage": 49.18, "elapsed_time": "6:15:20", "remaining_time": "6:27:50"}
1201
+ {"current_steps": 1201, "total_steps": 2440, "loss": 0.3547, "lr": 2.4006982978777263e-05, "epoch": 2.458546571136131, "percentage": 49.22, "elapsed_time": "6:15:37", "remaining_time": "6:27:30"}
1202
+ {"current_steps": 1202, "total_steps": 2440, "loss": 0.3145, "lr": 2.39789470529255e-05, "epoch": 2.460593654042989, "percentage": 49.26, "elapsed_time": "6:15:59", "remaining_time": "6:27:15"}
1203
+ {"current_steps": 1203, "total_steps": 2440, "loss": 0.3512, "lr": 2.3950902983722645e-05, "epoch": 2.4626407369498464, "percentage": 49.3, "elapsed_time": "6:16:18", "remaining_time": "6:26:56"}
1204
+ {"current_steps": 1204, "total_steps": 2440, "loss": 0.331, "lr": 2.392285082856394e-05, "epoch": 2.4646878198567044, "percentage": 49.34, "elapsed_time": "6:16:33", "remaining_time": "6:26:34"}
1205
+ {"current_steps": 1205, "total_steps": 2440, "loss": 0.3697, "lr": 2.389479064486121e-05, "epoch": 2.466734902763562, "percentage": 49.39, "elapsed_time": "6:16:52", "remaining_time": "6:26:15"}
1206
+ {"current_steps": 1206, "total_steps": 2440, "loss": 0.3606, "lr": 2.3866722490042685e-05, "epoch": 2.46878198567042, "percentage": 49.43, "elapsed_time": "6:17:09", "remaining_time": "6:25:55"}
1207
+ {"current_steps": 1207, "total_steps": 2440, "loss": 0.3377, "lr": 2.3838646421552917e-05, "epoch": 2.4708290685772774, "percentage": 49.47, "elapsed_time": "6:17:26", "remaining_time": "6:25:34"}
1208
+ {"current_steps": 1208, "total_steps": 2440, "loss": 0.3262, "lr": 2.3810562496852666e-05, "epoch": 2.472876151484135, "percentage": 49.51, "elapsed_time": "6:17:46", "remaining_time": "6:25:16"}
1209
+ {"current_steps": 1209, "total_steps": 2440, "loss": 0.339, "lr": 2.3782470773418756e-05, "epoch": 2.474923234390993, "percentage": 49.55, "elapsed_time": "6:18:05", "remaining_time": "6:24:57"}
1210
+ {"current_steps": 1210, "total_steps": 2440, "loss": 0.33, "lr": 2.3754371308743975e-05, "epoch": 2.4769703172978508, "percentage": 49.59, "elapsed_time": "6:18:23", "remaining_time": "6:24:39"}
1211
+ {"current_steps": 1211, "total_steps": 2440, "loss": 0.3209, "lr": 2.372626416033696e-05, "epoch": 2.4790174002047083, "percentage": 49.63, "elapsed_time": "6:18:38", "remaining_time": "6:24:16"}
1212
+ {"current_steps": 1212, "total_steps": 2440, "loss": 0.3376, "lr": 2.3698149385722067e-05, "epoch": 2.481064483111566, "percentage": 49.67, "elapsed_time": "6:18:56", "remaining_time": "6:23:56"}
1213
+ {"current_steps": 1213, "total_steps": 2440, "loss": 0.3198, "lr": 2.367002704243927e-05, "epoch": 2.4831115660184238, "percentage": 49.71, "elapsed_time": "6:19:13", "remaining_time": "6:23:36"}
1214
+ {"current_steps": 1214, "total_steps": 2440, "loss": 0.3442, "lr": 2.3641897188044018e-05, "epoch": 2.4851586489252817, "percentage": 49.75, "elapsed_time": "6:19:32", "remaining_time": "6:23:17"}
1215
+ {"current_steps": 1215, "total_steps": 2440, "loss": 0.343, "lr": 2.3613759880107133e-05, "epoch": 2.487205731832139, "percentage": 49.8, "elapsed_time": "6:19:52", "remaining_time": "6:22:59"}
1216
+ {"current_steps": 1216, "total_steps": 2440, "loss": 0.3066, "lr": 2.3585615176214716e-05, "epoch": 2.4892528147389967, "percentage": 49.84, "elapsed_time": "6:20:07", "remaining_time": "6:22:38"}
1217
+ {"current_steps": 1217, "total_steps": 2440, "loss": 0.3325, "lr": 2.3557463133967976e-05, "epoch": 2.4912998976458547, "percentage": 49.88, "elapsed_time": "6:20:25", "remaining_time": "6:22:18"}
1218
+ {"current_steps": 1218, "total_steps": 2440, "loss": 0.3127, "lr": 2.3529303810983154e-05, "epoch": 2.493346980552712, "percentage": 49.92, "elapsed_time": "6:20:42", "remaining_time": "6:21:57"}
1219
+ {"current_steps": 1219, "total_steps": 2440, "loss": 0.3248, "lr": 2.3501137264891396e-05, "epoch": 2.49539406345957, "percentage": 49.96, "elapsed_time": "6:21:01", "remaining_time": "6:21:39"}
1220
+ {"current_steps": 1220, "total_steps": 2440, "loss": 0.3023, "lr": 2.3472963553338614e-05, "epoch": 2.4974411463664277, "percentage": 50.0, "elapsed_time": "6:21:18", "remaining_time": "6:21:18"}
1221
+ {"current_steps": 1221, "total_steps": 2440, "loss": 0.3252, "lr": 2.3444782733985396e-05, "epoch": 2.4994882292732856, "percentage": 50.04, "elapsed_time": "6:21:36", "remaining_time": "6:20:58"}
1222
+ {"current_steps": 1222, "total_steps": 2440, "loss": 0.3043, "lr": 2.3416594864506887e-05, "epoch": 2.501535312180143, "percentage": 50.08, "elapsed_time": "6:21:51", "remaining_time": "6:20:36"}
1223
+ {"current_steps": 1223, "total_steps": 2440, "loss": 0.3133, "lr": 2.338840000259264e-05, "epoch": 2.503582395087001, "percentage": 50.12, "elapsed_time": "6:22:08", "remaining_time": "6:20:16"}
1224
+ {"current_steps": 1224, "total_steps": 2440, "loss": 0.3141, "lr": 2.3360198205946542e-05, "epoch": 2.5056294779938586, "percentage": 50.16, "elapsed_time": "6:22:21", "remaining_time": "6:19:52"}
1225
+ {"current_steps": 1225, "total_steps": 2440, "loss": 0.3535, "lr": 2.333198953228664e-05, "epoch": 2.5076765609007166, "percentage": 50.2, "elapsed_time": "6:22:39", "remaining_time": "6:19:32"}
1226
+ {"current_steps": 1226, "total_steps": 2440, "loss": 0.3367, "lr": 2.3303774039345098e-05, "epoch": 2.509723643807574, "percentage": 50.25, "elapsed_time": "6:22:56", "remaining_time": "6:19:11"}
1227
+ {"current_steps": 1227, "total_steps": 2440, "loss": 0.3188, "lr": 2.3275551784867997e-05, "epoch": 2.511770726714432, "percentage": 50.29, "elapsed_time": "6:23:15", "remaining_time": "6:18:53"}
1228
+ {"current_steps": 1228, "total_steps": 2440, "loss": 0.3596, "lr": 2.3247322826615276e-05, "epoch": 2.5138178096212895, "percentage": 50.33, "elapsed_time": "6:23:34", "remaining_time": "6:18:34"}
1229
+ {"current_steps": 1229, "total_steps": 2440, "loss": 0.3395, "lr": 2.3219087222360603e-05, "epoch": 2.5158648925281475, "percentage": 50.37, "elapsed_time": "6:23:54", "remaining_time": "6:18:17"}
1230
+ {"current_steps": 1230, "total_steps": 2440, "loss": 0.3326, "lr": 2.3190845029891218e-05, "epoch": 2.517911975435005, "percentage": 50.41, "elapsed_time": "6:24:16", "remaining_time": "6:18:01"}
1231
+ {"current_steps": 1231, "total_steps": 2440, "loss": 0.3344, "lr": 2.316259630700787e-05, "epoch": 2.519959058341863, "percentage": 50.45, "elapsed_time": "6:24:33", "remaining_time": "6:17:40"}
1232
+ {"current_steps": 1232, "total_steps": 2440, "loss": 0.3346, "lr": 2.313434111152467e-05, "epoch": 2.5220061412487205, "percentage": 50.49, "elapsed_time": "6:24:48", "remaining_time": "6:17:18"}
1233
+ {"current_steps": 1233, "total_steps": 2440, "loss": 0.3448, "lr": 2.310607950126896e-05, "epoch": 2.5240532241555784, "percentage": 50.53, "elapsed_time": "6:25:07", "remaining_time": "6:17:00"}
1234
+ {"current_steps": 1234, "total_steps": 2440, "loss": 0.3359, "lr": 2.307781153408124e-05, "epoch": 2.526100307062436, "percentage": 50.57, "elapsed_time": "6:25:23", "remaining_time": "6:16:39"}
1235
+ {"current_steps": 1235, "total_steps": 2440, "loss": 0.3431, "lr": 2.3049537267814984e-05, "epoch": 2.528147389969294, "percentage": 50.61, "elapsed_time": "6:25:40", "remaining_time": "6:16:18"}
1236
+ {"current_steps": 1236, "total_steps": 2440, "loss": 0.3604, "lr": 2.3021256760336583e-05, "epoch": 2.5301944728761514, "percentage": 50.66, "elapsed_time": "6:26:00", "remaining_time": "6:16:01"}
1237
+ {"current_steps": 1237, "total_steps": 2440, "loss": 0.3472, "lr": 2.2992970069525202e-05, "epoch": 2.5322415557830094, "percentage": 50.7, "elapsed_time": "6:26:19", "remaining_time": "6:15:42"}
1238
+ {"current_steps": 1238, "total_steps": 2440, "loss": 0.3174, "lr": 2.296467725327264e-05, "epoch": 2.534288638689867, "percentage": 50.74, "elapsed_time": "6:26:41", "remaining_time": "6:15:26"}
1239
+ {"current_steps": 1239, "total_steps": 2440, "loss": 0.3093, "lr": 2.293637836948325e-05, "epoch": 2.536335721596725, "percentage": 50.78, "elapsed_time": "6:26:59", "remaining_time": "6:15:06"}
1240
+ {"current_steps": 1240, "total_steps": 2440, "loss": 0.3382, "lr": 2.29080734760738e-05, "epoch": 2.5383828045035823, "percentage": 50.82, "elapsed_time": "6:27:14", "remaining_time": "6:14:45"}
1241
+ {"current_steps": 1241, "total_steps": 2440, "loss": 0.3315, "lr": 2.2879762630973355e-05, "epoch": 2.54042988741044, "percentage": 50.86, "elapsed_time": "6:27:31", "remaining_time": "6:14:24"}
1242
+ {"current_steps": 1242, "total_steps": 2440, "loss": 0.3079, "lr": 2.285144589212316e-05, "epoch": 2.542476970317298, "percentage": 50.9, "elapsed_time": "6:27:45", "remaining_time": "6:14:00"}
1243
+ {"current_steps": 1243, "total_steps": 2440, "loss": 0.3422, "lr": 2.2823123317476522e-05, "epoch": 2.5445240532241558, "percentage": 50.94, "elapsed_time": "6:28:02", "remaining_time": "6:13:41"}
1244
+ {"current_steps": 1244, "total_steps": 2440, "loss": 0.3049, "lr": 2.2794794964998705e-05, "epoch": 2.5465711361310133, "percentage": 50.98, "elapsed_time": "6:28:23", "remaining_time": "6:13:24"}
1245
+ {"current_steps": 1245, "total_steps": 2440, "loss": 0.2992, "lr": 2.276646089266677e-05, "epoch": 2.548618219037871, "percentage": 51.02, "elapsed_time": "6:28:36", "remaining_time": "6:13:00"}
1246
+ {"current_steps": 1246, "total_steps": 2440, "loss": 0.3726, "lr": 2.273812115846951e-05, "epoch": 2.5506653019447287, "percentage": 51.07, "elapsed_time": "6:28:55", "remaining_time": "6:12:41"}
1247
+ {"current_steps": 1247, "total_steps": 2440, "loss": 0.2909, "lr": 2.2709775820407292e-05, "epoch": 2.5527123848515867, "percentage": 51.11, "elapsed_time": "6:29:12", "remaining_time": "6:12:20"}
1248
+ {"current_steps": 1248, "total_steps": 2440, "loss": 0.3669, "lr": 2.2681424936491954e-05, "epoch": 2.554759467758444, "percentage": 51.15, "elapsed_time": "6:29:27", "remaining_time": "6:11:58"}
1249
+ {"current_steps": 1249, "total_steps": 2440, "loss": 0.3403, "lr": 2.2653068564746692e-05, "epoch": 2.5568065506653017, "percentage": 51.19, "elapsed_time": "6:29:47", "remaining_time": "6:11:41"}
1250
+ {"current_steps": 1250, "total_steps": 2440, "loss": 0.3603, "lr": 2.2624706763205935e-05, "epoch": 2.5588536335721597, "percentage": 51.23, "elapsed_time": "6:30:05", "remaining_time": "6:11:21"}
1251
+ {"current_steps": 1251, "total_steps": 2440, "loss": 0.3554, "lr": 2.2596339589915197e-05, "epoch": 2.5609007164790176, "percentage": 51.27, "elapsed_time": "6:30:25", "remaining_time": "6:11:04"}
1252
+ {"current_steps": 1252, "total_steps": 2440, "loss": 0.3136, "lr": 2.2567967102931025e-05, "epoch": 2.562947799385875, "percentage": 51.31, "elapsed_time": "6:30:45", "remaining_time": "6:10:47"}
1253
+ {"current_steps": 1253, "total_steps": 2440, "loss": 0.3256, "lr": 2.2539589360320802e-05, "epoch": 2.5649948822927326, "percentage": 51.35, "elapsed_time": "6:31:01", "remaining_time": "6:10:25"}
1254
+ {"current_steps": 1254, "total_steps": 2440, "loss": 0.3414, "lr": 2.2511206420162716e-05, "epoch": 2.5670419651995906, "percentage": 51.39, "elapsed_time": "6:31:23", "remaining_time": "6:10:10"}
1255
+ {"current_steps": 1255, "total_steps": 2440, "loss": 0.3102, "lr": 2.2482818340545534e-05, "epoch": 2.5690890481064486, "percentage": 51.43, "elapsed_time": "6:31:39", "remaining_time": "6:09:49"}
1256
+ {"current_steps": 1256, "total_steps": 2440, "loss": 0.3434, "lr": 2.2454425179568594e-05, "epoch": 2.571136131013306, "percentage": 51.48, "elapsed_time": "6:31:56", "remaining_time": "6:09:28"}
1257
+ {"current_steps": 1257, "total_steps": 2440, "loss": 0.318, "lr": 2.2426026995341602e-05, "epoch": 2.5731832139201636, "percentage": 51.52, "elapsed_time": "6:32:15", "remaining_time": "6:09:10"}
1258
+ {"current_steps": 1258, "total_steps": 2440, "loss": 0.3749, "lr": 2.2397623845984548e-05, "epoch": 2.5752302968270215, "percentage": 51.56, "elapsed_time": "6:32:35", "remaining_time": "6:08:52"}
1259
+ {"current_steps": 1259, "total_steps": 2440, "loss": 0.298, "lr": 2.2369215789627593e-05, "epoch": 2.5772773797338795, "percentage": 51.6, "elapsed_time": "6:32:51", "remaining_time": "6:08:30"}
1260
+ {"current_steps": 1260, "total_steps": 2440, "loss": 0.3419, "lr": 2.234080288441095e-05, "epoch": 2.579324462640737, "percentage": 51.64, "elapsed_time": "6:33:11", "remaining_time": "6:08:13"}
1261
+ {"current_steps": 1261, "total_steps": 2440, "loss": 0.3501, "lr": 2.2312385188484718e-05, "epoch": 2.5813715455475945, "percentage": 51.68, "elapsed_time": "6:33:29", "remaining_time": "6:07:53"}
1262
+ {"current_steps": 1262, "total_steps": 2440, "loss": 0.339, "lr": 2.2283962760008845e-05, "epoch": 2.5834186284544525, "percentage": 51.72, "elapsed_time": "6:33:48", "remaining_time": "6:07:35"}
1263
+ {"current_steps": 1263, "total_steps": 2440, "loss": 0.3334, "lr": 2.225553565715294e-05, "epoch": 2.58546571136131, "percentage": 51.76, "elapsed_time": "6:34:06", "remaining_time": "6:07:16"}
1264
+ {"current_steps": 1264, "total_steps": 2440, "loss": 0.3139, "lr": 2.2227103938096176e-05, "epoch": 2.587512794268168, "percentage": 51.8, "elapsed_time": "6:34:18", "remaining_time": "6:06:50"}
1265
+ {"current_steps": 1265, "total_steps": 2440, "loss": 0.3232, "lr": 2.2198667661027193e-05, "epoch": 2.5895598771750254, "percentage": 51.84, "elapsed_time": "6:34:35", "remaining_time": "6:06:31"}
1266
+ {"current_steps": 1266, "total_steps": 2440, "loss": 0.3089, "lr": 2.2170226884143942e-05, "epoch": 2.5916069600818834, "percentage": 51.89, "elapsed_time": "6:34:55", "remaining_time": "6:06:13"}
1267
+ {"current_steps": 1267, "total_steps": 2440, "loss": 0.3069, "lr": 2.2141781665653584e-05, "epoch": 2.593654042988741, "percentage": 51.93, "elapsed_time": "6:35:16", "remaining_time": "6:05:56"}
1268
+ {"current_steps": 1268, "total_steps": 2440, "loss": 0.3343, "lr": 2.2113332063772387e-05, "epoch": 2.595701125895599, "percentage": 51.97, "elapsed_time": "6:35:36", "remaining_time": "6:05:39"}
1269
+ {"current_steps": 1269, "total_steps": 2440, "loss": 0.3246, "lr": 2.208487813672557e-05, "epoch": 2.5977482088024564, "percentage": 52.01, "elapsed_time": "6:35:51", "remaining_time": "6:05:17"}
1270
+ {"current_steps": 1270, "total_steps": 2440, "loss": 0.3543, "lr": 2.205641994274721e-05, "epoch": 2.5997952917093143, "percentage": 52.05, "elapsed_time": "6:36:11", "remaining_time": "6:04:59"}
1271
+ {"current_steps": 1271, "total_steps": 2440, "loss": 0.3412, "lr": 2.2027957540080125e-05, "epoch": 2.601842374616172, "percentage": 52.09, "elapsed_time": "6:36:26", "remaining_time": "6:04:37"}
1272
+ {"current_steps": 1272, "total_steps": 2440, "loss": 0.321, "lr": 2.199949098697574e-05, "epoch": 2.60388945752303, "percentage": 52.13, "elapsed_time": "6:36:42", "remaining_time": "6:04:16"}
1273
+ {"current_steps": 1273, "total_steps": 2440, "loss": 0.321, "lr": 2.1971020341693973e-05, "epoch": 2.6059365404298873, "percentage": 52.17, "elapsed_time": "6:37:02", "remaining_time": "6:03:59"}
1274
+ {"current_steps": 1274, "total_steps": 2440, "loss": 0.3366, "lr": 2.1942545662503115e-05, "epoch": 2.6079836233367453, "percentage": 52.21, "elapsed_time": "6:37:20", "remaining_time": "6:03:39"}
1275
+ {"current_steps": 1275, "total_steps": 2440, "loss": 0.346, "lr": 2.1914067007679733e-05, "epoch": 2.610030706243603, "percentage": 52.25, "elapsed_time": "6:37:40", "remaining_time": "6:03:21"}
1276
+ {"current_steps": 1276, "total_steps": 2440, "loss": 0.3471, "lr": 2.188558443550849e-05, "epoch": 2.6120777891504607, "percentage": 52.3, "elapsed_time": "6:37:55", "remaining_time": "6:02:59"}
1277
+ {"current_steps": 1277, "total_steps": 2440, "loss": 0.3523, "lr": 2.185709800428211e-05, "epoch": 2.6141248720573182, "percentage": 52.34, "elapsed_time": "6:38:17", "remaining_time": "6:02:44"}
1278
+ {"current_steps": 1278, "total_steps": 2440, "loss": 0.3456, "lr": 2.1828607772301187e-05, "epoch": 2.616171954964176, "percentage": 52.38, "elapsed_time": "6:38:34", "remaining_time": "6:02:23"}
1279
+ {"current_steps": 1279, "total_steps": 2440, "loss": 0.3309, "lr": 2.180011379787411e-05, "epoch": 2.6182190378710337, "percentage": 52.42, "elapsed_time": "6:38:48", "remaining_time": "6:02:00"}
1280
+ {"current_steps": 1280, "total_steps": 2440, "loss": 0.3351, "lr": 2.1771616139316903e-05, "epoch": 2.6202661207778917, "percentage": 52.46, "elapsed_time": "6:39:07", "remaining_time": "6:01:42"}
1281
+ {"current_steps": 1281, "total_steps": 2440, "loss": 0.3046, "lr": 2.174311485495317e-05, "epoch": 2.622313203684749, "percentage": 52.5, "elapsed_time": "6:39:28", "remaining_time": "6:01:26"}
1282
+ {"current_steps": 1282, "total_steps": 2440, "loss": 0.303, "lr": 2.1714610003113887e-05, "epoch": 2.6243602865916067, "percentage": 52.54, "elapsed_time": "6:39:48", "remaining_time": "6:01:08"}
1283
+ {"current_steps": 1283, "total_steps": 2440, "loss": 0.3213, "lr": 2.168610164213738e-05, "epoch": 2.6264073694984647, "percentage": 52.58, "elapsed_time": "6:40:04", "remaining_time": "6:00:47"}
1284
+ {"current_steps": 1284, "total_steps": 2440, "loss": 0.351, "lr": 2.1657589830369113e-05, "epoch": 2.6284544524053226, "percentage": 52.62, "elapsed_time": "6:40:25", "remaining_time": "6:00:30"}
1285
+ {"current_steps": 1285, "total_steps": 2440, "loss": 0.3868, "lr": 2.1629074626161647e-05, "epoch": 2.63050153531218, "percentage": 52.66, "elapsed_time": "6:40:46", "remaining_time": "6:00:14"}
1286
+ {"current_steps": 1286, "total_steps": 2440, "loss": 0.3175, "lr": 2.1600556087874472e-05, "epoch": 2.6325486182190376, "percentage": 52.7, "elapsed_time": "6:41:07", "remaining_time": "5:59:57"}
1287
+ {"current_steps": 1287, "total_steps": 2440, "loss": 0.3262, "lr": 2.1572034273873893e-05, "epoch": 2.6345957011258956, "percentage": 52.75, "elapsed_time": "6:41:25", "remaining_time": "5:59:37"}
1288
+ {"current_steps": 1288, "total_steps": 2440, "loss": 0.3716, "lr": 2.1543509242532932e-05, "epoch": 2.6366427840327535, "percentage": 52.79, "elapsed_time": "6:41:42", "remaining_time": "5:59:17"}
1289
+ {"current_steps": 1289, "total_steps": 2440, "loss": 0.3166, "lr": 2.1514981052231187e-05, "epoch": 2.638689866939611, "percentage": 52.83, "elapsed_time": "6:42:00", "remaining_time": "5:58:57"}
1290
+ {"current_steps": 1290, "total_steps": 2440, "loss": 0.3315, "lr": 2.1486449761354727e-05, "epoch": 2.6407369498464686, "percentage": 52.87, "elapsed_time": "6:42:18", "remaining_time": "5:58:38"}
1291
+ {"current_steps": 1291, "total_steps": 2440, "loss": 0.3225, "lr": 2.145791542829597e-05, "epoch": 2.6427840327533265, "percentage": 52.91, "elapsed_time": "6:42:36", "remaining_time": "5:58:19"}
1292
+ {"current_steps": 1292, "total_steps": 2440, "loss": 0.3839, "lr": 2.142937811145354e-05, "epoch": 2.6448311156601845, "percentage": 52.95, "elapsed_time": "6:42:56", "remaining_time": "5:58:02"}
1293
+ {"current_steps": 1293, "total_steps": 2440, "loss": 0.3277, "lr": 2.140083786923221e-05, "epoch": 2.646878198567042, "percentage": 52.99, "elapsed_time": "6:43:15", "remaining_time": "5:57:43"}
1294
+ {"current_steps": 1294, "total_steps": 2440, "loss": 0.3396, "lr": 2.1372294760042686e-05, "epoch": 2.6489252814738995, "percentage": 53.03, "elapsed_time": "6:43:34", "remaining_time": "5:57:25"}
1295
+ {"current_steps": 1295, "total_steps": 2440, "loss": 0.3199, "lr": 2.1343748842301575e-05, "epoch": 2.6509723643807575, "percentage": 53.07, "elapsed_time": "6:43:51", "remaining_time": "5:57:04"}
1296
+ {"current_steps": 1296, "total_steps": 2440, "loss": 0.3264, "lr": 2.1315200174431235e-05, "epoch": 2.6530194472876154, "percentage": 53.11, "elapsed_time": "6:44:09", "remaining_time": "5:56:45"}
1297
+ {"current_steps": 1297, "total_steps": 2440, "loss": 0.3196, "lr": 2.1286648814859636e-05, "epoch": 2.655066530194473, "percentage": 53.16, "elapsed_time": "6:44:29", "remaining_time": "5:56:27"}
1298
+ {"current_steps": 1298, "total_steps": 2440, "loss": 0.3132, "lr": 2.1258094822020263e-05, "epoch": 2.6571136131013304, "percentage": 53.2, "elapsed_time": "6:44:45", "remaining_time": "5:56:06"}
1299
+ {"current_steps": 1299, "total_steps": 2440, "loss": 0.3238, "lr": 2.1229538254351995e-05, "epoch": 2.6591606960081884, "percentage": 53.24, "elapsed_time": "6:45:01", "remaining_time": "5:55:45"}
1300
+ {"current_steps": 1300, "total_steps": 2440, "loss": 0.3843, "lr": 2.120097917029897e-05, "epoch": 2.661207778915046, "percentage": 53.28, "elapsed_time": "6:45:21", "remaining_time": "5:55:28"}
1301
+ {"current_steps": 1301, "total_steps": 2440, "loss": 0.3292, "lr": 2.1172417628310487e-05, "epoch": 2.663254861821904, "percentage": 53.32, "elapsed_time": "6:45:41", "remaining_time": "5:55:10"}
1302
+ {"current_steps": 1302, "total_steps": 2440, "loss": 0.3102, "lr": 2.1143853686840874e-05, "epoch": 2.6653019447287614, "percentage": 53.36, "elapsed_time": "6:46:00", "remaining_time": "5:54:51"}
1303
+ {"current_steps": 1303, "total_steps": 2440, "loss": 0.3156, "lr": 2.1115287404349357e-05, "epoch": 2.6673490276356193, "percentage": 53.4, "elapsed_time": "6:46:21", "remaining_time": "5:54:35"}
1304
+ {"current_steps": 1304, "total_steps": 2440, "loss": 0.3461, "lr": 2.1086718839299972e-05, "epoch": 2.669396110542477, "percentage": 53.44, "elapsed_time": "6:46:43", "remaining_time": "5:54:19"}
1305
+ {"current_steps": 1305, "total_steps": 2440, "loss": 0.3357, "lr": 2.1058148050161412e-05, "epoch": 2.671443193449335, "percentage": 53.48, "elapsed_time": "6:47:02", "remaining_time": "5:54:01"}
1306
+ {"current_steps": 1306, "total_steps": 2440, "loss": 0.3454, "lr": 2.1029575095406933e-05, "epoch": 2.6734902763561923, "percentage": 53.52, "elapsed_time": "6:47:19", "remaining_time": "5:53:40"}
1307
+ {"current_steps": 1307, "total_steps": 2440, "loss": 0.3403, "lr": 2.1001000033514215e-05, "epoch": 2.6755373592630503, "percentage": 53.57, "elapsed_time": "6:47:42", "remaining_time": "5:53:26"}
1308
+ {"current_steps": 1308, "total_steps": 2440, "loss": 0.3643, "lr": 2.097242292296525e-05, "epoch": 2.6775844421699078, "percentage": 53.61, "elapsed_time": "6:48:02", "remaining_time": "5:53:08"}
1309
+ {"current_steps": 1309, "total_steps": 2440, "loss": 0.3224, "lr": 2.0943843822246234e-05, "epoch": 2.6796315250767657, "percentage": 53.65, "elapsed_time": "6:48:25", "remaining_time": "5:52:53"}
1310
+ {"current_steps": 1310, "total_steps": 2440, "loss": 0.3368, "lr": 2.0915262789847414e-05, "epoch": 2.6816786079836232, "percentage": 53.69, "elapsed_time": "6:48:42", "remaining_time": "5:52:32"}
1311
+ {"current_steps": 1311, "total_steps": 2440, "loss": 0.311, "lr": 2.088667988426302e-05, "epoch": 2.683725690890481, "percentage": 53.73, "elapsed_time": "6:49:01", "remaining_time": "5:52:14"}
1312
+ {"current_steps": 1312, "total_steps": 2440, "loss": 0.3145, "lr": 2.0858095163991094e-05, "epoch": 2.6857727737973387, "percentage": 53.77, "elapsed_time": "6:49:18", "remaining_time": "5:51:54"}
1313
+ {"current_steps": 1313, "total_steps": 2440, "loss": 0.343, "lr": 2.0829508687533387e-05, "epoch": 2.6878198567041967, "percentage": 53.81, "elapsed_time": "6:49:38", "remaining_time": "5:51:36"}
1314
+ {"current_steps": 1314, "total_steps": 2440, "loss": 0.3102, "lr": 2.0800920513395276e-05, "epoch": 2.689866939611054, "percentage": 53.85, "elapsed_time": "6:49:56", "remaining_time": "5:51:17"}
1315
+ {"current_steps": 1315, "total_steps": 2440, "loss": 0.3628, "lr": 2.077233070008557e-05, "epoch": 2.691914022517912, "percentage": 53.89, "elapsed_time": "6:50:15", "remaining_time": "5:50:58"}
1316
+ {"current_steps": 1316, "total_steps": 2440, "loss": 0.3611, "lr": 2.074373930611647e-05, "epoch": 2.6939611054247696, "percentage": 53.93, "elapsed_time": "6:50:38", "remaining_time": "5:50:43"}
1317
+ {"current_steps": 1317, "total_steps": 2440, "loss": 0.4382, "lr": 2.0715146390003395e-05, "epoch": 2.6960081883316276, "percentage": 53.98, "elapsed_time": "6:51:01", "remaining_time": "5:50:28"}
1318
+ {"current_steps": 1318, "total_steps": 2440, "loss": 0.3316, "lr": 2.0686552010264872e-05, "epoch": 2.698055271238485, "percentage": 54.02, "elapsed_time": "6:51:18", "remaining_time": "5:50:08"}
1319
+ {"current_steps": 1319, "total_steps": 2440, "loss": 0.3241, "lr": 2.0657956225422438e-05, "epoch": 2.7001023541453426, "percentage": 54.06, "elapsed_time": "6:51:34", "remaining_time": "5:49:47"}
1320
+ {"current_steps": 1320, "total_steps": 2440, "loss": 0.3634, "lr": 2.0629359094000502e-05, "epoch": 2.7021494370522006, "percentage": 54.1, "elapsed_time": "6:51:52", "remaining_time": "5:49:28"}
1321
+ {"current_steps": 1321, "total_steps": 2440, "loss": 0.3434, "lr": 2.060076067452622e-05, "epoch": 2.7041965199590585, "percentage": 54.14, "elapsed_time": "6:52:14", "remaining_time": "5:49:12"}
1322
+ {"current_steps": 1322, "total_steps": 2440, "loss": 0.3592, "lr": 2.0572161025529396e-05, "epoch": 2.706243602865916, "percentage": 54.18, "elapsed_time": "6:52:34", "remaining_time": "5:48:54"}
1323
+ {"current_steps": 1323, "total_steps": 2440, "loss": 0.3273, "lr": 2.0543560205542338e-05, "epoch": 2.7082906857727735, "percentage": 54.22, "elapsed_time": "6:52:52", "remaining_time": "5:48:35"}
1324
+ {"current_steps": 1324, "total_steps": 2440, "loss": 0.3528, "lr": 2.0514958273099778e-05, "epoch": 2.7103377686796315, "percentage": 54.26, "elapsed_time": "6:53:11", "remaining_time": "5:48:16"}
1325
+ {"current_steps": 1325, "total_steps": 2440, "loss": 0.3279, "lr": 2.0486355286738675e-05, "epoch": 2.7123848515864895, "percentage": 54.3, "elapsed_time": "6:53:29", "remaining_time": "5:47:57"}
1326
+ {"current_steps": 1326, "total_steps": 2440, "loss": 0.3154, "lr": 2.0457751304998196e-05, "epoch": 2.714431934493347, "percentage": 54.34, "elapsed_time": "6:53:49", "remaining_time": "5:47:39"}
1327
+ {"current_steps": 1327, "total_steps": 2440, "loss": 0.3122, "lr": 2.042914638641952e-05, "epoch": 2.7164790174002045, "percentage": 54.39, "elapsed_time": "6:54:07", "remaining_time": "5:47:20"}
1328
+ {"current_steps": 1328, "total_steps": 2440, "loss": 0.2987, "lr": 2.0400540589545738e-05, "epoch": 2.7185261003070624, "percentage": 54.43, "elapsed_time": "6:54:24", "remaining_time": "5:46:59"}
1329
+ {"current_steps": 1329, "total_steps": 2440, "loss": 0.3651, "lr": 2.0371933972921756e-05, "epoch": 2.7205731832139204, "percentage": 54.47, "elapsed_time": "6:54:43", "remaining_time": "5:46:41"}
1330
+ {"current_steps": 1330, "total_steps": 2440, "loss": 0.3056, "lr": 2.0343326595094154e-05, "epoch": 2.722620266120778, "percentage": 54.51, "elapsed_time": "6:55:01", "remaining_time": "5:46:22"}
1331
+ {"current_steps": 1331, "total_steps": 2440, "loss": 0.3078, "lr": 2.031471851461105e-05, "epoch": 2.7246673490276354, "percentage": 54.55, "elapsed_time": "6:55:18", "remaining_time": "5:46:02"}
1332
+ {"current_steps": 1332, "total_steps": 2440, "loss": 0.3019, "lr": 2.0286109790022023e-05, "epoch": 2.7267144319344934, "percentage": 54.59, "elapsed_time": "6:55:35", "remaining_time": "5:45:42"}
1333
+ {"current_steps": 1333, "total_steps": 2440, "loss": 0.3606, "lr": 2.0257500479877965e-05, "epoch": 2.7287615148413513, "percentage": 54.63, "elapsed_time": "6:55:55", "remaining_time": "5:45:24"}
1334
+ {"current_steps": 1334, "total_steps": 2440, "loss": 0.3188, "lr": 2.0228890642730967e-05, "epoch": 2.730808597748209, "percentage": 54.67, "elapsed_time": "6:56:15", "remaining_time": "5:45:07"}
1335
+ {"current_steps": 1335, "total_steps": 2440, "loss": 0.3233, "lr": 2.020028033713418e-05, "epoch": 2.7328556806550663, "percentage": 54.71, "elapsed_time": "6:56:34", "remaining_time": "5:44:48"}
1336
+ {"current_steps": 1336, "total_steps": 2440, "loss": 0.3563, "lr": 2.0171669621641743e-05, "epoch": 2.7349027635619243, "percentage": 54.75, "elapsed_time": "6:56:53", "remaining_time": "5:44:29"}
1337
+ {"current_steps": 1337, "total_steps": 2440, "loss": 0.3107, "lr": 2.0143058554808622e-05, "epoch": 2.7369498464687823, "percentage": 54.8, "elapsed_time": "6:57:12", "remaining_time": "5:44:11"}
1338
+ {"current_steps": 1338, "total_steps": 2440, "loss": 0.3445, "lr": 2.0114447195190486e-05, "epoch": 2.7389969293756398, "percentage": 54.84, "elapsed_time": "6:57:35", "remaining_time": "5:43:55"}
1339
+ {"current_steps": 1339, "total_steps": 2440, "loss": 0.3426, "lr": 2.0085835601343627e-05, "epoch": 2.7410440122824973, "percentage": 54.88, "elapsed_time": "6:57:52", "remaining_time": "5:43:36"}
1340
+ {"current_steps": 1340, "total_steps": 2440, "loss": 0.3216, "lr": 2.005722383182481e-05, "epoch": 2.7430910951893552, "percentage": 54.92, "elapsed_time": "6:58:11", "remaining_time": "5:43:17"}
1341
+ {"current_steps": 1341, "total_steps": 2440, "loss": 0.3888, "lr": 2.002861194519114e-05, "epoch": 2.7451381780962127, "percentage": 54.96, "elapsed_time": "6:58:34", "remaining_time": "5:43:02"}
1342
+ {"current_steps": 1342, "total_steps": 2440, "loss": 0.3448, "lr": 2e-05, "epoch": 2.7471852610030707, "percentage": 55.0, "elapsed_time": "6:58:51", "remaining_time": "5:42:42"}
1343
+ {"current_steps": 1343, "total_steps": 2440, "loss": 0.3303, "lr": 1.9971388054808863e-05, "epoch": 2.749232343909928, "percentage": 55.04, "elapsed_time": "6:59:12", "remaining_time": "5:42:24"}
1344
+ {"current_steps": 1344, "total_steps": 2440, "loss": 0.3378, "lr": 1.99427761681752e-05, "epoch": 2.751279426816786, "percentage": 55.08, "elapsed_time": "6:59:33", "remaining_time": "5:42:08"}
1345
+ {"current_steps": 1345, "total_steps": 2440, "loss": 0.3204, "lr": 1.9914164398656383e-05, "epoch": 2.7533265097236437, "percentage": 55.12, "elapsed_time": "6:59:51", "remaining_time": "5:41:48"}
1346
+ {"current_steps": 1346, "total_steps": 2440, "loss": 0.3245, "lr": 1.988555280480952e-05, "epoch": 2.7553735926305016, "percentage": 55.16, "elapsed_time": "7:00:08", "remaining_time": "5:41:28"}
1347
+ {"current_steps": 1347, "total_steps": 2440, "loss": 0.2973, "lr": 1.9856941445191388e-05, "epoch": 2.757420675537359, "percentage": 55.2, "elapsed_time": "7:00:27", "remaining_time": "5:41:10"}
1348
+ {"current_steps": 1348, "total_steps": 2440, "loss": 0.3462, "lr": 1.9828330378358264e-05, "epoch": 2.759467758444217, "percentage": 55.25, "elapsed_time": "7:00:50", "remaining_time": "5:40:54"}
1349
+ {"current_steps": 1349, "total_steps": 2440, "loss": 0.3348, "lr": 1.9799719662865828e-05, "epoch": 2.7615148413510746, "percentage": 55.29, "elapsed_time": "7:01:07", "remaining_time": "5:40:35"}
1350
+ {"current_steps": 1350, "total_steps": 2440, "loss": 0.3041, "lr": 1.9771109357269047e-05, "epoch": 2.7635619242579326, "percentage": 55.33, "elapsed_time": "7:01:22", "remaining_time": "5:40:13"}
1351
+ {"current_steps": 1351, "total_steps": 2440, "loss": 0.3442, "lr": 1.974249952012204e-05, "epoch": 2.76560900716479, "percentage": 55.37, "elapsed_time": "7:01:42", "remaining_time": "5:39:55"}
1352
+ {"current_steps": 1352, "total_steps": 2440, "loss": 0.3133, "lr": 1.9713890209977977e-05, "epoch": 2.767656090071648, "percentage": 55.41, "elapsed_time": "7:02:01", "remaining_time": "5:39:36"}
1353
+ {"current_steps": 1353, "total_steps": 2440, "loss": 0.3091, "lr": 1.9685281485388955e-05, "epoch": 2.7697031729785055, "percentage": 55.45, "elapsed_time": "7:02:19", "remaining_time": "5:39:17"}
1354
+ {"current_steps": 1354, "total_steps": 2440, "loss": 0.2957, "lr": 1.9656673404905852e-05, "epoch": 2.7717502558853635, "percentage": 55.49, "elapsed_time": "7:02:40", "remaining_time": "5:39:00"}
1355
+ {"current_steps": 1355, "total_steps": 2440, "loss": 0.3413, "lr": 1.9628066027078247e-05, "epoch": 2.773797338792221, "percentage": 55.53, "elapsed_time": "7:03:00", "remaining_time": "5:38:43"}
1356
+ {"current_steps": 1356, "total_steps": 2440, "loss": 0.2997, "lr": 1.9599459410454266e-05, "epoch": 2.775844421699079, "percentage": 55.57, "elapsed_time": "7:03:18", "remaining_time": "5:38:23"}
1357
+ {"current_steps": 1357, "total_steps": 2440, "loss": 0.3397, "lr": 1.957085361358049e-05, "epoch": 2.7778915046059365, "percentage": 55.61, "elapsed_time": "7:03:34", "remaining_time": "5:38:02"}
1358
+ {"current_steps": 1358, "total_steps": 2440, "loss": 0.3269, "lr": 1.9542248695001808e-05, "epoch": 2.7799385875127944, "percentage": 55.66, "elapsed_time": "7:03:51", "remaining_time": "5:37:43"}
1359
+ {"current_steps": 1359, "total_steps": 2440, "loss": 0.3398, "lr": 1.9513644713261328e-05, "epoch": 2.781985670419652, "percentage": 55.7, "elapsed_time": "7:04:14", "remaining_time": "5:37:27"}
1360
+ {"current_steps": 1360, "total_steps": 2440, "loss": 0.3247, "lr": 1.9485041726900232e-05, "epoch": 2.7840327533265095, "percentage": 55.74, "elapsed_time": "7:04:34", "remaining_time": "5:37:09"}
1361
+ {"current_steps": 1361, "total_steps": 2440, "loss": 0.3699, "lr": 1.9456439794457665e-05, "epoch": 2.7860798362333674, "percentage": 55.78, "elapsed_time": "7:04:56", "remaining_time": "5:36:53"}
1362
+ {"current_steps": 1362, "total_steps": 2440, "loss": 0.3315, "lr": 1.942783897447061e-05, "epoch": 2.7881269191402254, "percentage": 55.82, "elapsed_time": "7:05:15", "remaining_time": "5:36:35"}
1363
+ {"current_steps": 1363, "total_steps": 2440, "loss": 0.3325, "lr": 1.939923932547379e-05, "epoch": 2.790174002047083, "percentage": 55.86, "elapsed_time": "7:05:35", "remaining_time": "5:36:17"}
1364
+ {"current_steps": 1364, "total_steps": 2440, "loss": 0.3048, "lr": 1.93706409059995e-05, "epoch": 2.7922210849539404, "percentage": 55.9, "elapsed_time": "7:05:51", "remaining_time": "5:35:56"}
1365
+ {"current_steps": 1365, "total_steps": 2440, "loss": 0.3478, "lr": 1.9342043774577562e-05, "epoch": 2.7942681678607983, "percentage": 55.94, "elapsed_time": "7:06:10", "remaining_time": "5:35:37"}
1366
+ {"current_steps": 1366, "total_steps": 2440, "loss": 0.3428, "lr": 1.931344798973513e-05, "epoch": 2.7963152507676563, "percentage": 55.98, "elapsed_time": "7:06:28", "remaining_time": "5:35:18"}
1367
+ {"current_steps": 1367, "total_steps": 2440, "loss": 0.3641, "lr": 1.928485360999661e-05, "epoch": 2.798362333674514, "percentage": 56.02, "elapsed_time": "7:06:50", "remaining_time": "5:35:02"}
1368
+ {"current_steps": 1368, "total_steps": 2440, "loss": 0.2993, "lr": 1.9256260693883534e-05, "epoch": 2.8004094165813713, "percentage": 56.07, "elapsed_time": "7:07:06", "remaining_time": "5:34:41"}
1369
+ {"current_steps": 1369, "total_steps": 2440, "loss": 0.3298, "lr": 1.922766929991443e-05, "epoch": 2.8024564994882293, "percentage": 56.11, "elapsed_time": "7:07:28", "remaining_time": "5:34:25"}
1370
+ {"current_steps": 1370, "total_steps": 2440, "loss": 0.293, "lr": 1.9199079486604727e-05, "epoch": 2.8045035823950872, "percentage": 56.15, "elapsed_time": "7:07:42", "remaining_time": "5:34:02"}
1371
+ {"current_steps": 1371, "total_steps": 2440, "loss": 0.3239, "lr": 1.9170491312466616e-05, "epoch": 2.8065506653019447, "percentage": 56.19, "elapsed_time": "7:07:59", "remaining_time": "5:33:42"}
1372
+ {"current_steps": 1372, "total_steps": 2440, "loss": 0.3502, "lr": 1.914190483600891e-05, "epoch": 2.8085977482088023, "percentage": 56.23, "elapsed_time": "7:08:16", "remaining_time": "5:33:22"}
1373
+ {"current_steps": 1373, "total_steps": 2440, "loss": 0.3357, "lr": 1.9113320115736986e-05, "epoch": 2.81064483111566, "percentage": 56.27, "elapsed_time": "7:08:34", "remaining_time": "5:33:03"}
1374
+ {"current_steps": 1374, "total_steps": 2440, "loss": 0.3185, "lr": 1.9084737210152593e-05, "epoch": 2.812691914022518, "percentage": 56.31, "elapsed_time": "7:08:51", "remaining_time": "5:32:43"}
1375
+ {"current_steps": 1375, "total_steps": 2440, "loss": 0.3228, "lr": 1.9056156177753776e-05, "epoch": 2.8147389969293757, "percentage": 56.35, "elapsed_time": "7:09:13", "remaining_time": "5:32:26"}
1376
+ {"current_steps": 1376, "total_steps": 2440, "loss": 0.3475, "lr": 1.902757707703475e-05, "epoch": 2.816786079836233, "percentage": 56.39, "elapsed_time": "7:09:30", "remaining_time": "5:32:07"}
1377
+ {"current_steps": 1377, "total_steps": 2440, "loss": 0.3325, "lr": 1.899899996648579e-05, "epoch": 2.818833162743091, "percentage": 56.43, "elapsed_time": "7:09:53", "remaining_time": "5:31:51"}
1378
+ {"current_steps": 1378, "total_steps": 2440, "loss": 0.3301, "lr": 1.897042490459307e-05, "epoch": 2.8208802456499487, "percentage": 56.48, "elapsed_time": "7:10:08", "remaining_time": "5:31:30"}
1379
+ {"current_steps": 1379, "total_steps": 2440, "loss": 0.3261, "lr": 1.8941851949838595e-05, "epoch": 2.8229273285568066, "percentage": 56.52, "elapsed_time": "7:10:27", "remaining_time": "5:31:11"}
1380
+ {"current_steps": 1380, "total_steps": 2440, "loss": 0.3602, "lr": 1.8913281160700038e-05, "epoch": 2.824974411463664, "percentage": 56.56, "elapsed_time": "7:10:46", "remaining_time": "5:30:53"}
1381
+ {"current_steps": 1381, "total_steps": 2440, "loss": 0.3173, "lr": 1.8884712595650653e-05, "epoch": 2.827021494370522, "percentage": 56.6, "elapsed_time": "7:10:59", "remaining_time": "5:30:30"}
1382
+ {"current_steps": 1382, "total_steps": 2440, "loss": 0.3549, "lr": 1.885614631315914e-05, "epoch": 2.8290685772773796, "percentage": 56.64, "elapsed_time": "7:11:16", "remaining_time": "5:30:09"}
1383
+ {"current_steps": 1383, "total_steps": 2440, "loss": 0.3202, "lr": 1.8827582371689516e-05, "epoch": 2.8311156601842375, "percentage": 56.68, "elapsed_time": "7:11:37", "remaining_time": "5:29:52"}
1384
+ {"current_steps": 1384, "total_steps": 2440, "loss": 0.3704, "lr": 1.8799020829701036e-05, "epoch": 2.833162743091095, "percentage": 56.72, "elapsed_time": "7:11:57", "remaining_time": "5:29:35"}
1385
+ {"current_steps": 1385, "total_steps": 2440, "loss": 0.3159, "lr": 1.8770461745648012e-05, "epoch": 2.835209825997953, "percentage": 56.76, "elapsed_time": "7:12:15", "remaining_time": "5:29:15"}
1386
+ {"current_steps": 1386, "total_steps": 2440, "loss": 0.347, "lr": 1.8741905177979743e-05, "epoch": 2.8372569089048105, "percentage": 56.8, "elapsed_time": "7:12:32", "remaining_time": "5:28:56"}
1387
+ {"current_steps": 1387, "total_steps": 2440, "loss": 0.3259, "lr": 1.871335118514037e-05, "epoch": 2.8393039918116685, "percentage": 56.84, "elapsed_time": "7:12:50", "remaining_time": "5:28:36"}
1388
+ {"current_steps": 1388, "total_steps": 2440, "loss": 0.3354, "lr": 1.8684799825568775e-05, "epoch": 2.841351074718526, "percentage": 56.89, "elapsed_time": "7:13:06", "remaining_time": "5:28:15"}
1389
+ {"current_steps": 1389, "total_steps": 2440, "loss": 0.3332, "lr": 1.8656251157698425e-05, "epoch": 2.843398157625384, "percentage": 56.93, "elapsed_time": "7:13:27", "remaining_time": "5:27:58"}
1390
+ {"current_steps": 1390, "total_steps": 2440, "loss": 0.3379, "lr": 1.862770523995732e-05, "epoch": 2.8454452405322415, "percentage": 56.97, "elapsed_time": "7:13:46", "remaining_time": "5:27:40"}
1391
+ {"current_steps": 1391, "total_steps": 2440, "loss": 0.3304, "lr": 1.85991621307678e-05, "epoch": 2.8474923234390994, "percentage": 57.01, "elapsed_time": "7:14:09", "remaining_time": "5:27:25"}
1392
+ {"current_steps": 1392, "total_steps": 2440, "loss": 0.3162, "lr": 1.8570621888546464e-05, "epoch": 2.849539406345957, "percentage": 57.05, "elapsed_time": "7:14:29", "remaining_time": "5:27:06"}
1393
+ {"current_steps": 1393, "total_steps": 2440, "loss": 0.3341, "lr": 1.854208457170404e-05, "epoch": 2.851586489252815, "percentage": 57.09, "elapsed_time": "7:14:48", "remaining_time": "5:26:48"}
1394
+ {"current_steps": 1394, "total_steps": 2440, "loss": 0.3385, "lr": 1.8513550238645283e-05, "epoch": 2.8536335721596724, "percentage": 57.13, "elapsed_time": "7:15:06", "remaining_time": "5:26:29"}
1395
+ {"current_steps": 1395, "total_steps": 2440, "loss": 0.3242, "lr": 1.8485018947768817e-05, "epoch": 2.8556806550665303, "percentage": 57.17, "elapsed_time": "7:15:22", "remaining_time": "5:26:08"}
1396
+ {"current_steps": 1396, "total_steps": 2440, "loss": 0.3172, "lr": 1.8456490757467075e-05, "epoch": 2.857727737973388, "percentage": 57.21, "elapsed_time": "7:15:43", "remaining_time": "5:25:51"}
1397
+ {"current_steps": 1397, "total_steps": 2440, "loss": 0.3256, "lr": 1.8427965726126114e-05, "epoch": 2.859774820880246, "percentage": 57.25, "elapsed_time": "7:16:03", "remaining_time": "5:25:33"}
1398
+ {"current_steps": 1398, "total_steps": 2440, "loss": 0.3375, "lr": 1.839944391212553e-05, "epoch": 2.8618219037871033, "percentage": 57.3, "elapsed_time": "7:16:19", "remaining_time": "5:25:12"}
1399
+ {"current_steps": 1399, "total_steps": 2440, "loss": 0.3388, "lr": 1.8370925373838356e-05, "epoch": 2.8638689866939613, "percentage": 57.34, "elapsed_time": "7:16:43", "remaining_time": "5:24:58"}
1400
+ {"current_steps": 1400, "total_steps": 2440, "loss": 0.361, "lr": 1.834241016963089e-05, "epoch": 2.865916069600819, "percentage": 57.38, "elapsed_time": "7:17:05", "remaining_time": "5:24:41"}
1401
+ {"current_steps": 1401, "total_steps": 2440, "loss": 0.3292, "lr": 1.8313898357862623e-05, "epoch": 2.8679631525076763, "percentage": 57.42, "elapsed_time": "7:17:24", "remaining_time": "5:24:22"}
1402
+ {"current_steps": 1402, "total_steps": 2440, "loss": 0.3239, "lr": 1.8285389996886113e-05, "epoch": 2.8700102354145343, "percentage": 57.46, "elapsed_time": "7:17:44", "remaining_time": "5:24:05"}
1403
+ {"current_steps": 1403, "total_steps": 2440, "loss": 0.3442, "lr": 1.8256885145046837e-05, "epoch": 2.872057318321392, "percentage": 57.5, "elapsed_time": "7:18:05", "remaining_time": "5:23:48"}
1404
+ {"current_steps": 1404, "total_steps": 2440, "loss": 0.3387, "lr": 1.82283838606831e-05, "epoch": 2.8741044012282497, "percentage": 57.54, "elapsed_time": "7:18:26", "remaining_time": "5:23:31"}
1405
+ {"current_steps": 1405, "total_steps": 2440, "loss": 0.364, "lr": 1.8199886202125897e-05, "epoch": 2.8761514841351072, "percentage": 57.58, "elapsed_time": "7:18:46", "remaining_time": "5:23:13"}
1406
+ {"current_steps": 1406, "total_steps": 2440, "loss": 0.3135, "lr": 1.817139222769882e-05, "epoch": 2.878198567041965, "percentage": 57.62, "elapsed_time": "7:19:04", "remaining_time": "5:22:54"}
1407
+ {"current_steps": 1407, "total_steps": 2440, "loss": 0.3293, "lr": 1.8142901995717894e-05, "epoch": 2.880245649948823, "percentage": 57.66, "elapsed_time": "7:19:23", "remaining_time": "5:22:35"}
1408
+ {"current_steps": 1408, "total_steps": 2440, "loss": 0.3382, "lr": 1.8114415564491513e-05, "epoch": 2.8822927328556807, "percentage": 57.7, "elapsed_time": "7:19:42", "remaining_time": "5:22:17"}
1409
+ {"current_steps": 1409, "total_steps": 2440, "loss": 0.3346, "lr": 1.8085932992320273e-05, "epoch": 2.884339815762538, "percentage": 57.75, "elapsed_time": "7:20:03", "remaining_time": "5:22:00"}
1410
+ {"current_steps": 1410, "total_steps": 2440, "loss": 0.3193, "lr": 1.805745433749689e-05, "epoch": 2.886386898669396, "percentage": 57.79, "elapsed_time": "7:20:25", "remaining_time": "5:21:43"}
1411
+ {"current_steps": 1411, "total_steps": 2440, "loss": 0.3352, "lr": 1.8028979658306033e-05, "epoch": 2.888433981576254, "percentage": 57.83, "elapsed_time": "7:20:45", "remaining_time": "5:21:25"}
1412
+ {"current_steps": 1412, "total_steps": 2440, "loss": 0.3704, "lr": 1.8000509013024266e-05, "epoch": 2.8904810644831116, "percentage": 57.87, "elapsed_time": "7:21:02", "remaining_time": "5:21:06"}
1413
+ {"current_steps": 1413, "total_steps": 2440, "loss": 0.3548, "lr": 1.7972042459919878e-05, "epoch": 2.892528147389969, "percentage": 57.91, "elapsed_time": "7:21:22", "remaining_time": "5:20:48"}
1414
+ {"current_steps": 1414, "total_steps": 2440, "loss": 0.3379, "lr": 1.794358005725279e-05, "epoch": 2.894575230296827, "percentage": 57.95, "elapsed_time": "7:21:39", "remaining_time": "5:20:28"}
1415
+ {"current_steps": 1415, "total_steps": 2440, "loss": 0.3685, "lr": 1.791512186327444e-05, "epoch": 2.896622313203685, "percentage": 57.99, "elapsed_time": "7:21:55", "remaining_time": "5:20:07"}
1416
+ {"current_steps": 1416, "total_steps": 2440, "loss": 0.3224, "lr": 1.7886667936227616e-05, "epoch": 2.8986693961105425, "percentage": 58.03, "elapsed_time": "7:22:16", "remaining_time": "5:19:50"}
1417
+ {"current_steps": 1417, "total_steps": 2440, "loss": 0.3234, "lr": 1.785821833434642e-05, "epoch": 2.9007164790174, "percentage": 58.07, "elapsed_time": "7:22:34", "remaining_time": "5:19:30"}
1418
+ {"current_steps": 1418, "total_steps": 2440, "loss": 0.305, "lr": 1.7829773115856065e-05, "epoch": 2.902763561924258, "percentage": 58.11, "elapsed_time": "7:22:50", "remaining_time": "5:19:10"}
1419
+ {"current_steps": 1419, "total_steps": 2440, "loss": 0.3463, "lr": 1.7801332338972813e-05, "epoch": 2.9048106448311155, "percentage": 58.16, "elapsed_time": "7:23:10", "remaining_time": "5:18:52"}
1420
+ {"current_steps": 1420, "total_steps": 2440, "loss": 0.3441, "lr": 1.7772896061903824e-05, "epoch": 2.9068577277379735, "percentage": 58.2, "elapsed_time": "7:23:28", "remaining_time": "5:18:33"}
1421
+ {"current_steps": 1421, "total_steps": 2440, "loss": 0.3243, "lr": 1.7744464342847062e-05, "epoch": 2.908904810644831, "percentage": 58.24, "elapsed_time": "7:23:44", "remaining_time": "5:18:12"}
1422
+ {"current_steps": 1422, "total_steps": 2440, "loss": 0.328, "lr": 1.771603723999116e-05, "epoch": 2.910951893551689, "percentage": 58.28, "elapsed_time": "7:24:01", "remaining_time": "5:17:52"}
1423
+ {"current_steps": 1423, "total_steps": 2440, "loss": 0.3239, "lr": 1.768761481151529e-05, "epoch": 2.9129989764585464, "percentage": 58.32, "elapsed_time": "7:24:19", "remaining_time": "5:17:32"}
1424
+ {"current_steps": 1424, "total_steps": 2440, "loss": 0.3373, "lr": 1.765919711558906e-05, "epoch": 2.9150460593654044, "percentage": 58.36, "elapsed_time": "7:24:35", "remaining_time": "5:17:12"}
1425
+ {"current_steps": 1425, "total_steps": 2440, "loss": 0.3473, "lr": 1.7630784210372413e-05, "epoch": 2.917093142272262, "percentage": 58.4, "elapsed_time": "7:24:54", "remaining_time": "5:16:53"}
1426
+ {"current_steps": 1426, "total_steps": 2440, "loss": 0.3285, "lr": 1.7602376154015456e-05, "epoch": 2.91914022517912, "percentage": 58.44, "elapsed_time": "7:25:12", "remaining_time": "5:16:34"}
1427
+ {"current_steps": 1427, "total_steps": 2440, "loss": 0.3024, "lr": 1.7573973004658404e-05, "epoch": 2.9211873080859774, "percentage": 58.48, "elapsed_time": "7:25:28", "remaining_time": "5:16:13"}
1428
+ {"current_steps": 1428, "total_steps": 2440, "loss": 0.3315, "lr": 1.7545574820431412e-05, "epoch": 2.9232343909928353, "percentage": 58.52, "elapsed_time": "7:25:47", "remaining_time": "5:15:55"}
1429
+ {"current_steps": 1429, "total_steps": 2440, "loss": 0.3519, "lr": 1.751718165945447e-05, "epoch": 2.925281473899693, "percentage": 58.57, "elapsed_time": "7:26:04", "remaining_time": "5:15:35"}
1430
+ {"current_steps": 1430, "total_steps": 2440, "loss": 0.3661, "lr": 1.7488793579837297e-05, "epoch": 2.927328556806551, "percentage": 58.61, "elapsed_time": "7:26:26", "remaining_time": "5:15:18"}
1431
+ {"current_steps": 1431, "total_steps": 2440, "loss": 0.3141, "lr": 1.74604106396792e-05, "epoch": 2.9293756397134083, "percentage": 58.65, "elapsed_time": "7:26:44", "remaining_time": "5:14:59"}
1432
+ {"current_steps": 1432, "total_steps": 2440, "loss": 0.3557, "lr": 1.743203289706898e-05, "epoch": 2.9314227226202663, "percentage": 58.69, "elapsed_time": "7:27:04", "remaining_time": "5:14:42"}
1433
+ {"current_steps": 1433, "total_steps": 2440, "loss": 0.399, "lr": 1.7403660410084806e-05, "epoch": 2.9334698055271238, "percentage": 58.73, "elapsed_time": "7:27:22", "remaining_time": "5:14:23"}
1434
+ {"current_steps": 1434, "total_steps": 2440, "loss": 0.3286, "lr": 1.737529323679407e-05, "epoch": 2.9355168884339817, "percentage": 58.77, "elapsed_time": "7:27:41", "remaining_time": "5:14:04"}
1435
+ {"current_steps": 1435, "total_steps": 2440, "loss": 0.3259, "lr": 1.734693143525331e-05, "epoch": 2.9375639713408392, "percentage": 58.81, "elapsed_time": "7:28:01", "remaining_time": "5:13:46"}
1436
+ {"current_steps": 1436, "total_steps": 2440, "loss": 0.3438, "lr": 1.731857506350805e-05, "epoch": 2.939611054247697, "percentage": 58.85, "elapsed_time": "7:28:18", "remaining_time": "5:13:26"}
1437
+ {"current_steps": 1437, "total_steps": 2440, "loss": 0.3561, "lr": 1.7290224179592718e-05, "epoch": 2.9416581371545547, "percentage": 58.89, "elapsed_time": "7:28:38", "remaining_time": "5:13:08"}
1438
+ {"current_steps": 1438, "total_steps": 2440, "loss": 0.2956, "lr": 1.7261878841530494e-05, "epoch": 2.943705220061412, "percentage": 58.93, "elapsed_time": "7:28:53", "remaining_time": "5:12:47"}
1439
+ {"current_steps": 1439, "total_steps": 2440, "loss": 0.3207, "lr": 1.7233539107333234e-05, "epoch": 2.94575230296827, "percentage": 58.98, "elapsed_time": "7:29:14", "remaining_time": "5:12:30"}
1440
+ {"current_steps": 1440, "total_steps": 2440, "loss": 0.3324, "lr": 1.72052050350013e-05, "epoch": 2.947799385875128, "percentage": 59.02, "elapsed_time": "7:29:31", "remaining_time": "5:12:10"}
1441
+ {"current_steps": 1441, "total_steps": 2440, "loss": 0.3296, "lr": 1.717687668252348e-05, "epoch": 2.9498464687819856, "percentage": 59.06, "elapsed_time": "7:29:50", "remaining_time": "5:11:51"}
1442
+ {"current_steps": 1442, "total_steps": 2440, "loss": 0.3504, "lr": 1.7148554107876847e-05, "epoch": 2.951893551688843, "percentage": 59.1, "elapsed_time": "7:30:06", "remaining_time": "5:11:30"}
1443
+ {"current_steps": 1443, "total_steps": 2440, "loss": 0.378, "lr": 1.7120237369026655e-05, "epoch": 2.953940634595701, "percentage": 59.14, "elapsed_time": "7:30:24", "remaining_time": "5:11:11"}
1444
+ {"current_steps": 1444, "total_steps": 2440, "loss": 0.3437, "lr": 1.7091926523926205e-05, "epoch": 2.955987717502559, "percentage": 59.18, "elapsed_time": "7:30:44", "remaining_time": "5:10:53"}
1445
+ {"current_steps": 1445, "total_steps": 2440, "loss": 0.3289, "lr": 1.7063621630516755e-05, "epoch": 2.9580348004094166, "percentage": 59.22, "elapsed_time": "7:30:59", "remaining_time": "5:10:32"}
1446
+ {"current_steps": 1446, "total_steps": 2440, "loss": 0.3148, "lr": 1.7035322746727366e-05, "epoch": 2.960081883316274, "percentage": 59.26, "elapsed_time": "7:31:19", "remaining_time": "5:10:14"}
1447
+ {"current_steps": 1447, "total_steps": 2440, "loss": 0.3389, "lr": 1.7007029930474804e-05, "epoch": 2.962128966223132, "percentage": 59.3, "elapsed_time": "7:31:41", "remaining_time": "5:09:58"}
1448
+ {"current_steps": 1448, "total_steps": 2440, "loss": 0.3286, "lr": 1.697874323966342e-05, "epoch": 2.96417604912999, "percentage": 59.34, "elapsed_time": "7:32:01", "remaining_time": "5:09:40"}
1449
+ {"current_steps": 1449, "total_steps": 2440, "loss": 0.3197, "lr": 1.6950462732185023e-05, "epoch": 2.9662231320368475, "percentage": 59.39, "elapsed_time": "7:32:19", "remaining_time": "5:09:21"}
1450
+ {"current_steps": 1450, "total_steps": 2440, "loss": 0.3297, "lr": 1.6922188465918763e-05, "epoch": 2.968270214943705, "percentage": 59.43, "elapsed_time": "7:32:38", "remaining_time": "5:09:02"}
1451
+ {"current_steps": 1451, "total_steps": 2440, "loss": 0.3577, "lr": 1.689392049873104e-05, "epoch": 2.970317297850563, "percentage": 59.47, "elapsed_time": "7:32:58", "remaining_time": "5:08:44"}
1452
+ {"current_steps": 1452, "total_steps": 2440, "loss": 0.3252, "lr": 1.6865658888475334e-05, "epoch": 2.972364380757421, "percentage": 59.51, "elapsed_time": "7:33:17", "remaining_time": "5:08:25"}
1453
+ {"current_steps": 1453, "total_steps": 2440, "loss": 0.3267, "lr": 1.6837403692992136e-05, "epoch": 2.9744114636642784, "percentage": 59.55, "elapsed_time": "7:33:32", "remaining_time": "5:08:05"}
1454
+ {"current_steps": 1454, "total_steps": 2440, "loss": 0.362, "lr": 1.680915497010879e-05, "epoch": 2.976458546571136, "percentage": 59.59, "elapsed_time": "7:33:47", "remaining_time": "5:07:43"}
1455
+ {"current_steps": 1455, "total_steps": 2440, "loss": 0.3455, "lr": 1.6780912777639407e-05, "epoch": 2.978505629477994, "percentage": 59.63, "elapsed_time": "7:34:04", "remaining_time": "5:07:24"}
1456
+ {"current_steps": 1456, "total_steps": 2440, "loss": 0.3476, "lr": 1.6752677173384734e-05, "epoch": 2.9805527123848514, "percentage": 59.67, "elapsed_time": "7:34:27", "remaining_time": "5:07:07"}
1457
+ {"current_steps": 1457, "total_steps": 2440, "loss": 0.373, "lr": 1.6724448215132006e-05, "epoch": 2.9825997952917094, "percentage": 59.71, "elapsed_time": "7:34:47", "remaining_time": "5:06:50"}
1458
+ {"current_steps": 1458, "total_steps": 2440, "loss": 0.3416, "lr": 1.669622596065491e-05, "epoch": 2.984646878198567, "percentage": 59.75, "elapsed_time": "7:35:07", "remaining_time": "5:06:32"}
1459
+ {"current_steps": 1459, "total_steps": 2440, "loss": 0.3336, "lr": 1.6668010467713363e-05, "epoch": 2.986693961105425, "percentage": 59.8, "elapsed_time": "7:35:25", "remaining_time": "5:06:13"}
1460
+ {"current_steps": 1460, "total_steps": 2440, "loss": 0.3281, "lr": 1.6639801794053468e-05, "epoch": 2.9887410440122824, "percentage": 59.84, "elapsed_time": "7:35:45", "remaining_time": "5:05:55"}
1461
+ {"current_steps": 1461, "total_steps": 2440, "loss": 0.3219, "lr": 1.6611599997407366e-05, "epoch": 2.9907881269191403, "percentage": 59.88, "elapsed_time": "7:36:05", "remaining_time": "5:05:37"}
1462
+ {"current_steps": 1462, "total_steps": 2440, "loss": 0.3253, "lr": 1.658340513549312e-05, "epoch": 2.992835209825998, "percentage": 59.92, "elapsed_time": "7:36:25", "remaining_time": "5:05:19"}
1463
+ {"current_steps": 1463, "total_steps": 2440, "loss": 0.3679, "lr": 1.6555217266014604e-05, "epoch": 2.9948822927328558, "percentage": 59.96, "elapsed_time": "7:36:42", "remaining_time": "5:04:59"}
1464
+ {"current_steps": 1464, "total_steps": 2440, "loss": 0.3107, "lr": 1.6527036446661396e-05, "epoch": 2.9969293756397133, "percentage": 60.0, "elapsed_time": "7:37:01", "remaining_time": "5:04:41"}
1465
+ {"current_steps": 1465, "total_steps": 2440, "loss": 0.3537, "lr": 1.649886273510861e-05, "epoch": 2.9989764585465712, "percentage": 60.04, "elapsed_time": "7:37:22", "remaining_time": "5:04:23"}
1466
+ {"current_steps": 1466, "total_steps": 2440, "loss": 0.4219, "lr": 1.6470696189016853e-05, "epoch": 3.0010235414534288, "percentage": 60.08, "elapsed_time": "7:38:51", "remaining_time": "5:04:51"}
1467
+ {"current_steps": 1467, "total_steps": 2440, "loss": 0.2489, "lr": 1.6442536866032027e-05, "epoch": 3.0030706243602867, "percentage": 60.12, "elapsed_time": "7:39:08", "remaining_time": "5:04:31"}
1468
+ {"current_steps": 1468, "total_steps": 2440, "loss": 0.2308, "lr": 1.641438482378529e-05, "epoch": 3.0051177072671442, "percentage": 60.16, "elapsed_time": "7:39:25", "remaining_time": "5:04:12"}
1469
+ {"current_steps": 1469, "total_steps": 2440, "loss": 0.2283, "lr": 1.6386240119892867e-05, "epoch": 3.007164790174002, "percentage": 60.2, "elapsed_time": "7:39:44", "remaining_time": "5:03:53"}
1470
+ {"current_steps": 1470, "total_steps": 2440, "loss": 0.2255, "lr": 1.6358102811955985e-05, "epoch": 3.0092118730808597, "percentage": 60.25, "elapsed_time": "7:40:05", "remaining_time": "5:03:35"}
1471
+ {"current_steps": 1471, "total_steps": 2440, "loss": 0.2499, "lr": 1.6329972957560736e-05, "epoch": 3.0112589559877176, "percentage": 60.29, "elapsed_time": "7:40:25", "remaining_time": "5:03:18"}
1472
+ {"current_steps": 1472, "total_steps": 2440, "loss": 0.2899, "lr": 1.6301850614277936e-05, "epoch": 3.013306038894575, "percentage": 60.33, "elapsed_time": "7:40:46", "remaining_time": "5:03:00"}
1473
+ {"current_steps": 1473, "total_steps": 2440, "loss": 0.23, "lr": 1.6273735839663044e-05, "epoch": 3.015353121801433, "percentage": 60.37, "elapsed_time": "7:41:02", "remaining_time": "5:02:39"}