sedrickkeh commited on
Commit
966fb92
·
verified ·
1 Parent(s): c3b3c2b

Training in progress, epoch 2

Browse files
model-00001-of-00004.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:fc45d572185f1162e45b9f419e852e00a259a65aa74ee9696db1fdc7065e6a15
3
  size 4877660776
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:bad07eb2ebee4c1a4357081b11e97d6070ccb120054ccbdb9457a4b1f43623c9
3
  size 4877660776
model-00002-of-00004.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:bda1ffbcfd8027d335a93695f0fc86c85ef14e6917cb7a7be61a72147032a53f
3
  size 4932751008
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2a980e6d8fd700d58d36f03ec901bec58551b5123ba5a22b3acbe918413aac6e
3
  size 4932751008
model-00003-of-00004.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:861b1530d4327d58d2d220b68a03844bd9fe57cb0ddb6073a97a73116c4fc83a
3
  size 4330865200
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:dda8f552337d891f3cf8797f16ccf3ccc7a8ffdf7e35a64c8b4563811173aeec
3
  size 4330865200
model-00004-of-00004.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:7450a591d911170ba7f7c37bac458ece7c35018ce0a03ac631cef293da8af94f
3
  size 1089994880
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f478646a66adb045b4f7dd1826d2e10ccfa3b585f62c2dd5fd5860e5f18e7513
3
  size 1089994880
trainer_log.jsonl CHANGED
@@ -250,3 +250,253 @@
250
  {"current_steps": 250, "total_steps": 750, "loss": 0.87, "lr": 8.43120818934367e-06, "epoch": 1.0, "percentage": 33.33, "elapsed_time": "3:53:09", "remaining_time": "7:46:19"}
251
  {"current_steps": 251, "total_steps": 750, "loss": 0.7984, "lr": 8.414244334398418e-06, "epoch": 1.004, "percentage": 33.47, "elapsed_time": "3:55:01", "remaining_time": "7:47:15"}
252
  {"current_steps": 252, "total_steps": 750, "loss": 0.8299, "lr": 8.397206521307584e-06, "epoch": 1.008, "percentage": 33.6, "elapsed_time": "3:55:59", "remaining_time": "7:46:21"}
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
250
  {"current_steps": 250, "total_steps": 750, "loss": 0.87, "lr": 8.43120818934367e-06, "epoch": 1.0, "percentage": 33.33, "elapsed_time": "3:53:09", "remaining_time": "7:46:19"}
251
  {"current_steps": 251, "total_steps": 750, "loss": 0.7984, "lr": 8.414244334398418e-06, "epoch": 1.004, "percentage": 33.47, "elapsed_time": "3:55:01", "remaining_time": "7:47:15"}
252
  {"current_steps": 252, "total_steps": 750, "loss": 0.8299, "lr": 8.397206521307584e-06, "epoch": 1.008, "percentage": 33.6, "elapsed_time": "3:55:59", "remaining_time": "7:46:21"}
253
+ {"current_steps": 253, "total_steps": 750, "loss": 0.8501, "lr": 8.380095119138209e-06, "epoch": 1.012, "percentage": 33.73, "elapsed_time": "3:56:55", "remaining_time": "7:45:25"}
254
+ {"current_steps": 254, "total_steps": 750, "loss": 0.8452, "lr": 8.362910498551402e-06, "epoch": 1.016, "percentage": 33.87, "elapsed_time": "3:57:49", "remaining_time": "7:44:24"}
255
+ {"current_steps": 255, "total_steps": 750, "loss": 0.8553, "lr": 8.345653031794292e-06, "epoch": 1.02, "percentage": 34.0, "elapsed_time": "3:58:43", "remaining_time": "7:43:24"}
256
+ {"current_steps": 256, "total_steps": 750, "loss": 0.7941, "lr": 8.328323092691985e-06, "epoch": 1.024, "percentage": 34.13, "elapsed_time": "3:59:35", "remaining_time": "7:42:20"}
257
+ {"current_steps": 257, "total_steps": 750, "loss": 0.8211, "lr": 8.310921056639451e-06, "epoch": 1.028, "percentage": 34.27, "elapsed_time": "4:00:31", "remaining_time": "7:41:24"}
258
+ {"current_steps": 258, "total_steps": 750, "loss": 0.8224, "lr": 8.293447300593402e-06, "epoch": 1.032, "percentage": 34.4, "elapsed_time": "4:01:26", "remaining_time": "7:40:25"}
259
+ {"current_steps": 259, "total_steps": 750, "loss": 0.8435, "lr": 8.275902203064125e-06, "epoch": 1.036, "percentage": 34.53, "elapsed_time": "4:02:24", "remaining_time": "7:39:33"}
260
+ {"current_steps": 260, "total_steps": 750, "loss": 0.8238, "lr": 8.258286144107277e-06, "epoch": 1.04, "percentage": 34.67, "elapsed_time": "4:03:20", "remaining_time": "7:38:37"}
261
+ {"current_steps": 261, "total_steps": 750, "loss": 0.8142, "lr": 8.240599505315656e-06, "epoch": 1.044, "percentage": 34.8, "elapsed_time": "4:04:11", "remaining_time": "7:37:29"}
262
+ {"current_steps": 262, "total_steps": 750, "loss": 0.8364, "lr": 8.222842669810936e-06, "epoch": 1.048, "percentage": 34.93, "elapsed_time": "4:05:09", "remaining_time": "7:36:38"}
263
+ {"current_steps": 263, "total_steps": 750, "loss": 0.8271, "lr": 8.205016022235368e-06, "epoch": 1.052, "percentage": 35.07, "elapsed_time": "4:06:00", "remaining_time": "7:35:32"}
264
+ {"current_steps": 264, "total_steps": 750, "loss": 0.8077, "lr": 8.18711994874345e-06, "epoch": 1.056, "percentage": 35.2, "elapsed_time": "4:06:57", "remaining_time": "7:34:37"}
265
+ {"current_steps": 265, "total_steps": 750, "loss": 0.7997, "lr": 8.16915483699355e-06, "epoch": 1.06, "percentage": 35.33, "elapsed_time": "4:07:47", "remaining_time": "7:33:30"}
266
+ {"current_steps": 266, "total_steps": 750, "loss": 0.8704, "lr": 8.151121076139534e-06, "epoch": 1.064, "percentage": 35.47, "elapsed_time": "4:08:47", "remaining_time": "7:32:40"}
267
+ {"current_steps": 267, "total_steps": 750, "loss": 0.8778, "lr": 8.133019056822303e-06, "epoch": 1.068, "percentage": 35.6, "elapsed_time": "4:09:57", "remaining_time": "7:32:09"}
268
+ {"current_steps": 268, "total_steps": 750, "loss": 0.8283, "lr": 8.11484917116136e-06, "epoch": 1.072, "percentage": 35.73, "elapsed_time": "4:11:06", "remaining_time": "7:31:37"}
269
+ {"current_steps": 269, "total_steps": 750, "loss": 0.8078, "lr": 8.096611812746302e-06, "epoch": 1.076, "percentage": 35.87, "elapsed_time": "4:12:08", "remaining_time": "7:30:51"}
270
+ {"current_steps": 270, "total_steps": 750, "loss": 0.8318, "lr": 8.078307376628292e-06, "epoch": 1.08, "percentage": 36.0, "elapsed_time": "4:12:59", "remaining_time": "7:29:46"}
271
+ {"current_steps": 271, "total_steps": 750, "loss": 0.7898, "lr": 8.059936259311514e-06, "epoch": 1.084, "percentage": 36.13, "elapsed_time": "4:13:50", "remaining_time": "7:28:40"}
272
+ {"current_steps": 272, "total_steps": 750, "loss": 0.8512, "lr": 8.041498858744572e-06, "epoch": 1.088, "percentage": 36.27, "elapsed_time": "4:14:52", "remaining_time": "7:27:54"}
273
+ {"current_steps": 273, "total_steps": 750, "loss": 0.8189, "lr": 8.022995574311876e-06, "epoch": 1.092, "percentage": 36.4, "elapsed_time": "4:15:51", "remaining_time": "7:27:02"}
274
+ {"current_steps": 274, "total_steps": 750, "loss": 0.7754, "lr": 8.004426806824985e-06, "epoch": 1.096, "percentage": 36.53, "elapsed_time": "4:16:35", "remaining_time": "7:25:44"}
275
+ {"current_steps": 275, "total_steps": 750, "loss": 0.7863, "lr": 7.985792958513932e-06, "epoch": 1.1, "percentage": 36.67, "elapsed_time": "4:17:15", "remaining_time": "7:24:21"}
276
+ {"current_steps": 276, "total_steps": 750, "loss": 0.8159, "lr": 7.967094433018508e-06, "epoch": 1.104, "percentage": 36.8, "elapsed_time": "4:18:14", "remaining_time": "7:23:30"}
277
+ {"current_steps": 277, "total_steps": 750, "loss": 0.8046, "lr": 7.948331635379517e-06, "epoch": 1.108, "percentage": 36.93, "elapsed_time": "4:19:13", "remaining_time": "7:22:38"}
278
+ {"current_steps": 278, "total_steps": 750, "loss": 0.8191, "lr": 7.929504972030003e-06, "epoch": 1.112, "percentage": 37.07, "elapsed_time": "4:19:54", "remaining_time": "7:21:17"}
279
+ {"current_steps": 279, "total_steps": 750, "loss": 0.8353, "lr": 7.910614850786448e-06, "epoch": 1.116, "percentage": 37.2, "elapsed_time": "4:20:52", "remaining_time": "7:20:24"}
280
+ {"current_steps": 280, "total_steps": 750, "loss": 0.8404, "lr": 7.891661680839932e-06, "epoch": 1.12, "percentage": 37.33, "elapsed_time": "4:21:52", "remaining_time": "7:19:34"}
281
+ {"current_steps": 281, "total_steps": 750, "loss": 0.8151, "lr": 7.872645872747281e-06, "epoch": 1.124, "percentage": 37.47, "elapsed_time": "4:22:46", "remaining_time": "7:18:34"}
282
+ {"current_steps": 282, "total_steps": 750, "loss": 0.8314, "lr": 7.85356783842216e-06, "epoch": 1.1280000000000001, "percentage": 37.6, "elapsed_time": "4:23:34", "remaining_time": "7:17:25"}
283
+ {"current_steps": 283, "total_steps": 750, "loss": 0.7978, "lr": 7.834427991126155e-06, "epoch": 1.1320000000000001, "percentage": 37.73, "elapsed_time": "4:24:25", "remaining_time": "7:16:20"}
284
+ {"current_steps": 284, "total_steps": 750, "loss": 0.8245, "lr": 7.815226745459831e-06, "epoch": 1.1360000000000001, "percentage": 37.87, "elapsed_time": "4:25:28", "remaining_time": "7:15:35"}
285
+ {"current_steps": 285, "total_steps": 750, "loss": 0.8185, "lr": 7.795964517353734e-06, "epoch": 1.1400000000000001, "percentage": 38.0, "elapsed_time": "4:26:22", "remaining_time": "7:14:37"}
286
+ {"current_steps": 286, "total_steps": 750, "loss": 0.8114, "lr": 7.776641724059398e-06, "epoch": 1.144, "percentage": 38.13, "elapsed_time": "4:27:21", "remaining_time": "7:13:44"}
287
+ {"current_steps": 287, "total_steps": 750, "loss": 0.8145, "lr": 7.757258784140286e-06, "epoch": 1.148, "percentage": 38.27, "elapsed_time": "4:28:06", "remaining_time": "7:12:30"}
288
+ {"current_steps": 288, "total_steps": 750, "loss": 0.8004, "lr": 7.737816117462752e-06, "epoch": 1.152, "percentage": 38.4, "elapsed_time": "4:29:07", "remaining_time": "7:11:43"}
289
+ {"current_steps": 289, "total_steps": 750, "loss": 0.8432, "lr": 7.718314145186918e-06, "epoch": 1.156, "percentage": 38.53, "elapsed_time": "4:30:02", "remaining_time": "7:10:46"}
290
+ {"current_steps": 290, "total_steps": 750, "loss": 0.8205, "lr": 7.698753289757565e-06, "epoch": 1.16, "percentage": 38.67, "elapsed_time": "4:31:06", "remaining_time": "7:10:01"}
291
+ {"current_steps": 291, "total_steps": 750, "loss": 0.82, "lr": 7.679133974894984e-06, "epoch": 1.164, "percentage": 38.8, "elapsed_time": "4:31:58", "remaining_time": "7:08:59"}
292
+ {"current_steps": 292, "total_steps": 750, "loss": 0.8316, "lr": 7.65945662558579e-06, "epoch": 1.168, "percentage": 38.93, "elapsed_time": "4:32:48", "remaining_time": "7:07:54"}
293
+ {"current_steps": 293, "total_steps": 750, "loss": 0.8174, "lr": 7.639721668073718e-06, "epoch": 1.172, "percentage": 39.07, "elapsed_time": "4:33:46", "remaining_time": "7:07:00"}
294
+ {"current_steps": 294, "total_steps": 750, "loss": 0.813, "lr": 7.619929529850397e-06, "epoch": 1.176, "percentage": 39.2, "elapsed_time": "4:34:33", "remaining_time": "7:05:50"}
295
+ {"current_steps": 295, "total_steps": 750, "loss": 0.8239, "lr": 7.600080639646077e-06, "epoch": 1.18, "percentage": 39.33, "elapsed_time": "4:35:27", "remaining_time": "7:04:51"}
296
+ {"current_steps": 296, "total_steps": 750, "loss": 0.8434, "lr": 7.580175427420358e-06, "epoch": 1.184, "percentage": 39.47, "elapsed_time": "4:36:27", "remaining_time": "7:04:01"}
297
+ {"current_steps": 297, "total_steps": 750, "loss": 0.8076, "lr": 7.560214324352858e-06, "epoch": 1.188, "percentage": 39.6, "elapsed_time": "4:37:30", "remaining_time": "7:03:15"}
298
+ {"current_steps": 298, "total_steps": 750, "loss": 0.8301, "lr": 7.54019776283389e-06, "epoch": 1.192, "percentage": 39.73, "elapsed_time": "4:38:21", "remaining_time": "7:02:11"}
299
+ {"current_steps": 299, "total_steps": 750, "loss": 0.8249, "lr": 7.520126176455084e-06, "epoch": 1.196, "percentage": 39.87, "elapsed_time": "4:39:15", "remaining_time": "7:01:13"}
300
+ {"current_steps": 300, "total_steps": 750, "loss": 0.7956, "lr": 7.500000000000001e-06, "epoch": 1.2, "percentage": 40.0, "elapsed_time": "4:40:06", "remaining_time": "7:00:10"}
301
+ {"current_steps": 301, "total_steps": 750, "loss": 0.8577, "lr": 7.479819669434712e-06, "epoch": 1.204, "percentage": 40.13, "elapsed_time": "4:40:51", "remaining_time": "6:58:57"}
302
+ {"current_steps": 302, "total_steps": 750, "loss": 0.8661, "lr": 7.459585621898353e-06, "epoch": 1.208, "percentage": 40.27, "elapsed_time": "4:41:53", "remaining_time": "6:58:10"}
303
+ {"current_steps": 303, "total_steps": 750, "loss": 0.8543, "lr": 7.4392982956936644e-06, "epoch": 1.212, "percentage": 40.4, "elapsed_time": "4:42:46", "remaining_time": "6:57:09"}
304
+ {"current_steps": 304, "total_steps": 750, "loss": 0.8148, "lr": 7.418958130277483e-06, "epoch": 1.216, "percentage": 40.53, "elapsed_time": "4:43:42", "remaining_time": "6:56:14"}
305
+ {"current_steps": 305, "total_steps": 750, "loss": 0.8162, "lr": 7.398565566251232e-06, "epoch": 1.22, "percentage": 40.67, "elapsed_time": "4:44:38", "remaining_time": "6:55:18"}
306
+ {"current_steps": 306, "total_steps": 750, "loss": 0.8242, "lr": 7.378121045351378e-06, "epoch": 1.224, "percentage": 40.8, "elapsed_time": "4:45:34", "remaining_time": "6:54:22"}
307
+ {"current_steps": 307, "total_steps": 750, "loss": 0.8429, "lr": 7.357625010439853e-06, "epoch": 1.228, "percentage": 40.93, "elapsed_time": "4:46:42", "remaining_time": "6:53:43"}
308
+ {"current_steps": 308, "total_steps": 750, "loss": 0.8413, "lr": 7.337077905494472e-06, "epoch": 1.232, "percentage": 41.07, "elapsed_time": "4:47:44", "remaining_time": "6:52:55"}
309
+ {"current_steps": 309, "total_steps": 750, "loss": 0.8431, "lr": 7.31648017559931e-06, "epoch": 1.236, "percentage": 41.2, "elapsed_time": "4:48:39", "remaining_time": "6:51:58"}
310
+ {"current_steps": 310, "total_steps": 750, "loss": 0.8634, "lr": 7.295832266935059e-06, "epoch": 1.24, "percentage": 41.33, "elapsed_time": "4:49:41", "remaining_time": "6:51:10"}
311
+ {"current_steps": 311, "total_steps": 750, "loss": 0.8387, "lr": 7.275134626769369e-06, "epoch": 1.244, "percentage": 41.47, "elapsed_time": "4:50:32", "remaining_time": "6:50:07"}
312
+ {"current_steps": 312, "total_steps": 750, "loss": 0.8087, "lr": 7.254387703447154e-06, "epoch": 1.248, "percentage": 41.6, "elapsed_time": "4:51:36", "remaining_time": "6:49:22"}
313
+ {"current_steps": 313, "total_steps": 750, "loss": 0.8138, "lr": 7.233591946380884e-06, "epoch": 1.252, "percentage": 41.73, "elapsed_time": "4:52:19", "remaining_time": "6:48:07"}
314
+ {"current_steps": 314, "total_steps": 750, "loss": 0.8258, "lr": 7.212747806040845e-06, "epoch": 1.256, "percentage": 41.87, "elapsed_time": "4:53:13", "remaining_time": "6:47:09"}
315
+ {"current_steps": 315, "total_steps": 750, "loss": 0.8444, "lr": 7.191855733945388e-06, "epoch": 1.26, "percentage": 42.0, "elapsed_time": "4:54:21", "remaining_time": "6:46:29"}
316
+ {"current_steps": 316, "total_steps": 750, "loss": 0.8155, "lr": 7.170916182651141e-06, "epoch": 1.264, "percentage": 42.13, "elapsed_time": "4:55:16", "remaining_time": "6:45:32"}
317
+ {"current_steps": 317, "total_steps": 750, "loss": 0.7777, "lr": 7.149929605743214e-06, "epoch": 1.268, "percentage": 42.27, "elapsed_time": "4:56:08", "remaining_time": "6:44:29"}
318
+ {"current_steps": 318, "total_steps": 750, "loss": 0.7944, "lr": 7.128896457825364e-06, "epoch": 1.272, "percentage": 42.4, "elapsed_time": "4:56:47", "remaining_time": "6:43:11"}
319
+ {"current_steps": 319, "total_steps": 750, "loss": 0.8503, "lr": 7.107817194510157e-06, "epoch": 1.276, "percentage": 42.53, "elapsed_time": "4:57:45", "remaining_time": "6:42:17"}
320
+ {"current_steps": 320, "total_steps": 750, "loss": 0.8266, "lr": 7.08669227240909e-06, "epoch": 1.28, "percentage": 42.67, "elapsed_time": "4:58:39", "remaining_time": "6:41:19"}
321
+ {"current_steps": 321, "total_steps": 750, "loss": 0.8107, "lr": 7.06552214912271e-06, "epoch": 1.284, "percentage": 42.8, "elapsed_time": "4:59:32", "remaining_time": "6:40:19"}
322
+ {"current_steps": 322, "total_steps": 750, "loss": 0.7889, "lr": 7.04430728323069e-06, "epoch": 1.288, "percentage": 42.93, "elapsed_time": "5:00:23", "remaining_time": "6:39:17"}
323
+ {"current_steps": 323, "total_steps": 750, "loss": 0.814, "lr": 7.023048134281907e-06, "epoch": 1.292, "percentage": 43.07, "elapsed_time": "5:01:21", "remaining_time": "6:38:23"}
324
+ {"current_steps": 324, "total_steps": 750, "loss": 0.8144, "lr": 7.0017451627844765e-06, "epoch": 1.296, "percentage": 43.2, "elapsed_time": "5:02:08", "remaining_time": "6:37:15"}
325
+ {"current_steps": 325, "total_steps": 750, "loss": 0.816, "lr": 6.980398830195785e-06, "epoch": 1.3, "percentage": 43.33, "elapsed_time": "5:03:09", "remaining_time": "6:36:26"}
326
+ {"current_steps": 326, "total_steps": 750, "loss": 0.8439, "lr": 6.959009598912493e-06, "epoch": 1.304, "percentage": 43.47, "elapsed_time": "5:04:04", "remaining_time": "6:35:28"}
327
+ {"current_steps": 327, "total_steps": 750, "loss": 0.8244, "lr": 6.9375779322605154e-06, "epoch": 1.308, "percentage": 43.6, "elapsed_time": "5:04:58", "remaining_time": "6:34:30"}
328
+ {"current_steps": 328, "total_steps": 750, "loss": 0.851, "lr": 6.916104294484988e-06, "epoch": 1.312, "percentage": 43.73, "elapsed_time": "5:05:59", "remaining_time": "6:33:41"}
329
+ {"current_steps": 329, "total_steps": 750, "loss": 0.7992, "lr": 6.8945891507402075e-06, "epoch": 1.316, "percentage": 43.87, "elapsed_time": "5:06:48", "remaining_time": "6:32:36"}
330
+ {"current_steps": 330, "total_steps": 750, "loss": 0.8443, "lr": 6.873032967079562e-06, "epoch": 1.32, "percentage": 44.0, "elapsed_time": "5:07:44", "remaining_time": "6:31:40"}
331
+ {"current_steps": 331, "total_steps": 750, "loss": 0.8277, "lr": 6.851436210445427e-06, "epoch": 1.324, "percentage": 44.13, "elapsed_time": "5:08:41", "remaining_time": "6:30:45"}
332
+ {"current_steps": 332, "total_steps": 750, "loss": 0.8135, "lr": 6.829799348659061e-06, "epoch": 1.328, "percentage": 44.27, "elapsed_time": "5:09:38", "remaining_time": "6:29:51"}
333
+ {"current_steps": 333, "total_steps": 750, "loss": 0.8288, "lr": 6.808122850410461e-06, "epoch": 1.332, "percentage": 44.4, "elapsed_time": "5:10:32", "remaining_time": "6:28:52"}
334
+ {"current_steps": 334, "total_steps": 750, "loss": 0.8283, "lr": 6.7864071852482205e-06, "epoch": 1.336, "percentage": 44.53, "elapsed_time": "5:11:34", "remaining_time": "6:28:03"}
335
+ {"current_steps": 335, "total_steps": 750, "loss": 0.8464, "lr": 6.7646528235693445e-06, "epoch": 1.34, "percentage": 44.67, "elapsed_time": "5:12:37", "remaining_time": "6:27:16"}
336
+ {"current_steps": 336, "total_steps": 750, "loss": 0.8347, "lr": 6.7428602366090764e-06, "epoch": 1.3439999999999999, "percentage": 44.8, "elapsed_time": "5:13:36", "remaining_time": "6:26:24"}
337
+ {"current_steps": 337, "total_steps": 750, "loss": 0.8384, "lr": 6.721029896430678e-06, "epoch": 1.3479999999999999, "percentage": 44.93, "elapsed_time": "5:14:35", "remaining_time": "6:25:32"}
338
+ {"current_steps": 338, "total_steps": 750, "loss": 0.8151, "lr": 6.699162275915208e-06, "epoch": 1.3519999999999999, "percentage": 45.07, "elapsed_time": "5:15:33", "remaining_time": "6:24:38"}
339
+ {"current_steps": 339, "total_steps": 750, "loss": 0.832, "lr": 6.677257848751276e-06, "epoch": 1.3559999999999999, "percentage": 45.2, "elapsed_time": "5:16:36", "remaining_time": "6:23:51"}
340
+ {"current_steps": 340, "total_steps": 750, "loss": 0.7989, "lr": 6.655317089424791e-06, "epoch": 1.3599999999999999, "percentage": 45.33, "elapsed_time": "5:17:29", "remaining_time": "6:22:51"}
341
+ {"current_steps": 341, "total_steps": 750, "loss": 0.8106, "lr": 6.633340473208673e-06, "epoch": 1.3639999999999999, "percentage": 45.47, "elapsed_time": "5:18:27", "remaining_time": "6:21:57"}
342
+ {"current_steps": 342, "total_steps": 750, "loss": 0.8197, "lr": 6.611328476152557e-06, "epoch": 1.3679999999999999, "percentage": 45.6, "elapsed_time": "5:19:25", "remaining_time": "6:21:03"}
343
+ {"current_steps": 343, "total_steps": 750, "loss": 0.836, "lr": 6.58928157507249e-06, "epoch": 1.3719999999999999, "percentage": 45.73, "elapsed_time": "5:20:17", "remaining_time": "6:20:02"}
344
+ {"current_steps": 344, "total_steps": 750, "loss": 0.8207, "lr": 6.567200247540599e-06, "epoch": 1.376, "percentage": 45.87, "elapsed_time": "5:21:17", "remaining_time": "6:19:12"}
345
+ {"current_steps": 345, "total_steps": 750, "loss": 0.8452, "lr": 6.545084971874738e-06, "epoch": 1.38, "percentage": 46.0, "elapsed_time": "5:22:20", "remaining_time": "6:18:23"}
346
+ {"current_steps": 346, "total_steps": 750, "loss": 0.7999, "lr": 6.522936227128139e-06, "epoch": 1.384, "percentage": 46.13, "elapsed_time": "5:23:20", "remaining_time": "6:17:32"}
347
+ {"current_steps": 347, "total_steps": 750, "loss": 0.8387, "lr": 6.500754493079029e-06, "epoch": 1.388, "percentage": 46.27, "elapsed_time": "5:24:23", "remaining_time": "6:16:44"}
348
+ {"current_steps": 348, "total_steps": 750, "loss": 0.8127, "lr": 6.4785402502202345e-06, "epoch": 1.392, "percentage": 46.4, "elapsed_time": "5:25:17", "remaining_time": "6:15:46"}
349
+ {"current_steps": 349, "total_steps": 750, "loss": 0.8312, "lr": 6.456293979748778e-06, "epoch": 1.396, "percentage": 46.53, "elapsed_time": "5:26:08", "remaining_time": "6:14:44"}
350
+ {"current_steps": 350, "total_steps": 750, "loss": 0.818, "lr": 6.434016163555452e-06, "epoch": 1.4, "percentage": 46.67, "elapsed_time": "5:27:03", "remaining_time": "6:13:46"}
351
+ {"current_steps": 351, "total_steps": 750, "loss": 0.8109, "lr": 6.411707284214384e-06, "epoch": 1.404, "percentage": 46.8, "elapsed_time": "5:27:59", "remaining_time": "6:12:50"}
352
+ {"current_steps": 352, "total_steps": 750, "loss": 0.8329, "lr": 6.389367824972575e-06, "epoch": 1.408, "percentage": 46.93, "elapsed_time": "5:28:57", "remaining_time": "6:11:56"}
353
+ {"current_steps": 353, "total_steps": 750, "loss": 0.8209, "lr": 6.366998269739442e-06, "epoch": 1.412, "percentage": 47.07, "elapsed_time": "5:29:53", "remaining_time": "6:11:00"}
354
+ {"current_steps": 354, "total_steps": 750, "loss": 0.8423, "lr": 6.344599103076329e-06, "epoch": 1.416, "percentage": 47.2, "elapsed_time": "5:30:49", "remaining_time": "6:10:04"}
355
+ {"current_steps": 355, "total_steps": 750, "loss": 0.8315, "lr": 6.322170810186013e-06, "epoch": 1.42, "percentage": 47.33, "elapsed_time": "5:31:54", "remaining_time": "6:09:18"}
356
+ {"current_steps": 356, "total_steps": 750, "loss": 0.8397, "lr": 6.299713876902188e-06, "epoch": 1.424, "percentage": 47.47, "elapsed_time": "5:32:46", "remaining_time": "6:08:17"}
357
+ {"current_steps": 357, "total_steps": 750, "loss": 0.8165, "lr": 6.277228789678953e-06, "epoch": 1.428, "percentage": 47.6, "elapsed_time": "5:33:46", "remaining_time": "6:07:25"}
358
+ {"current_steps": 358, "total_steps": 750, "loss": 0.8237, "lr": 6.254716035580264e-06, "epoch": 1.432, "percentage": 47.73, "elapsed_time": "5:34:41", "remaining_time": "6:06:28"}
359
+ {"current_steps": 359, "total_steps": 750, "loss": 0.8345, "lr": 6.23217610226939e-06, "epoch": 1.436, "percentage": 47.87, "elapsed_time": "5:35:28", "remaining_time": "6:05:22"}
360
+ {"current_steps": 360, "total_steps": 750, "loss": 0.7928, "lr": 6.209609477998339e-06, "epoch": 1.44, "percentage": 48.0, "elapsed_time": "5:36:19", "remaining_time": "6:04:21"}
361
+ {"current_steps": 361, "total_steps": 750, "loss": 0.8073, "lr": 6.187016651597299e-06, "epoch": 1.444, "percentage": 48.13, "elapsed_time": "5:37:09", "remaining_time": "6:03:18"}
362
+ {"current_steps": 362, "total_steps": 750, "loss": 0.8672, "lr": 6.16439811246403e-06, "epoch": 1.448, "percentage": 48.27, "elapsed_time": "5:38:11", "remaining_time": "6:02:28"}
363
+ {"current_steps": 363, "total_steps": 750, "loss": 0.8226, "lr": 6.141754350553279e-06, "epoch": 1.452, "percentage": 48.4, "elapsed_time": "5:39:02", "remaining_time": "6:01:27"}
364
+ {"current_steps": 364, "total_steps": 750, "loss": 0.7964, "lr": 6.119085856366158e-06, "epoch": 1.456, "percentage": 48.53, "elapsed_time": "5:39:52", "remaining_time": "6:00:24"}
365
+ {"current_steps": 365, "total_steps": 750, "loss": 0.7774, "lr": 6.0963931209395165e-06, "epoch": 1.46, "percentage": 48.67, "elapsed_time": "5:40:50", "remaining_time": "5:59:30"}
366
+ {"current_steps": 366, "total_steps": 750, "loss": 0.8087, "lr": 6.073676635835317e-06, "epoch": 1.464, "percentage": 48.8, "elapsed_time": "5:41:41", "remaining_time": "5:58:29"}
367
+ {"current_steps": 367, "total_steps": 750, "loss": 0.8159, "lr": 6.05093689312997e-06, "epoch": 1.468, "percentage": 48.93, "elapsed_time": "5:42:37", "remaining_time": "5:57:33"}
368
+ {"current_steps": 368, "total_steps": 750, "loss": 0.8259, "lr": 6.028174385403693e-06, "epoch": 1.472, "percentage": 49.07, "elapsed_time": "5:43:34", "remaining_time": "5:56:39"}
369
+ {"current_steps": 369, "total_steps": 750, "loss": 0.8156, "lr": 6.005389605729824e-06, "epoch": 1.476, "percentage": 49.2, "elapsed_time": "5:44:25", "remaining_time": "5:55:37"}
370
+ {"current_steps": 370, "total_steps": 750, "loss": 0.8131, "lr": 5.982583047664151e-06, "epoch": 1.48, "percentage": 49.33, "elapsed_time": "5:45:11", "remaining_time": "5:54:31"}
371
+ {"current_steps": 371, "total_steps": 750, "loss": 0.8305, "lr": 5.9597552052342174e-06, "epoch": 1.484, "percentage": 49.47, "elapsed_time": "5:46:04", "remaining_time": "5:53:32"}
372
+ {"current_steps": 372, "total_steps": 750, "loss": 0.8154, "lr": 5.936906572928625e-06, "epoch": 1.488, "percentage": 49.6, "elapsed_time": "5:47:01", "remaining_time": "5:52:37"}
373
+ {"current_steps": 373, "total_steps": 750, "loss": 0.8203, "lr": 5.914037645686308e-06, "epoch": 1.492, "percentage": 49.73, "elapsed_time": "5:47:57", "remaining_time": "5:51:41"}
374
+ {"current_steps": 374, "total_steps": 750, "loss": 0.8417, "lr": 5.891148918885834e-06, "epoch": 1.496, "percentage": 49.87, "elapsed_time": "5:48:53", "remaining_time": "5:50:45"}
375
+ {"current_steps": 375, "total_steps": 750, "loss": 0.8497, "lr": 5.8682408883346535e-06, "epoch": 1.5, "percentage": 50.0, "elapsed_time": "5:49:55", "remaining_time": "5:49:55"}
376
+ {"current_steps": 376, "total_steps": 750, "loss": 0.7931, "lr": 5.84531405025837e-06, "epoch": 1.504, "percentage": 50.13, "elapsed_time": "5:50:44", "remaining_time": "5:48:52"}
377
+ {"current_steps": 377, "total_steps": 750, "loss": 0.7777, "lr": 5.8223689012899945e-06, "epoch": 1.508, "percentage": 50.27, "elapsed_time": "5:51:42", "remaining_time": "5:47:58"}
378
+ {"current_steps": 378, "total_steps": 750, "loss": 0.8256, "lr": 5.799405938459175e-06, "epoch": 1.512, "percentage": 50.4, "elapsed_time": "5:52:36", "remaining_time": "5:47:00"}
379
+ {"current_steps": 379, "total_steps": 750, "loss": 0.8315, "lr": 5.776425659181438e-06, "epoch": 1.516, "percentage": 50.53, "elapsed_time": "5:53:31", "remaining_time": "5:46:03"}
380
+ {"current_steps": 380, "total_steps": 750, "loss": 0.8276, "lr": 5.753428561247416e-06, "epoch": 1.52, "percentage": 50.67, "elapsed_time": "5:54:29", "remaining_time": "5:45:09"}
381
+ {"current_steps": 381, "total_steps": 750, "loss": 0.8376, "lr": 5.730415142812059e-06, "epoch": 1.524, "percentage": 50.8, "elapsed_time": "5:55:23", "remaining_time": "5:44:12"}
382
+ {"current_steps": 382, "total_steps": 750, "loss": 0.8344, "lr": 5.707385902383845e-06, "epoch": 1.528, "percentage": 50.93, "elapsed_time": "5:56:19", "remaining_time": "5:43:15"}
383
+ {"current_steps": 383, "total_steps": 750, "loss": 0.8016, "lr": 5.684341338813986e-06, "epoch": 1.532, "percentage": 51.07, "elapsed_time": "5:57:15", "remaining_time": "5:42:19"}
384
+ {"current_steps": 384, "total_steps": 750, "loss": 0.8216, "lr": 5.661281951285613e-06, "epoch": 1.536, "percentage": 51.2, "elapsed_time": "5:58:05", "remaining_time": "5:41:18"}
385
+ {"current_steps": 385, "total_steps": 750, "loss": 0.8302, "lr": 5.638208239302975e-06, "epoch": 1.54, "percentage": 51.33, "elapsed_time": "5:59:02", "remaining_time": "5:40:23"}
386
+ {"current_steps": 386, "total_steps": 750, "loss": 0.8124, "lr": 5.615120702680604e-06, "epoch": 1.544, "percentage": 51.47, "elapsed_time": "5:59:52", "remaining_time": "5:39:21"}
387
+ {"current_steps": 387, "total_steps": 750, "loss": 0.7866, "lr": 5.592019841532507e-06, "epoch": 1.548, "percentage": 51.6, "elapsed_time": "6:00:38", "remaining_time": "5:38:16"}
388
+ {"current_steps": 388, "total_steps": 750, "loss": 0.8453, "lr": 5.568906156261309e-06, "epoch": 1.552, "percentage": 51.73, "elapsed_time": "6:01:30", "remaining_time": "5:37:16"}
389
+ {"current_steps": 389, "total_steps": 750, "loss": 0.8188, "lr": 5.54578014754744e-06, "epoch": 1.556, "percentage": 51.87, "elapsed_time": "6:02:17", "remaining_time": "5:36:13"}
390
+ {"current_steps": 390, "total_steps": 750, "loss": 0.8008, "lr": 5.522642316338268e-06, "epoch": 1.56, "percentage": 52.0, "elapsed_time": "6:03:09", "remaining_time": "5:35:13"}
391
+ {"current_steps": 391, "total_steps": 750, "loss": 0.876, "lr": 5.499493163837258e-06, "epoch": 1.564, "percentage": 52.13, "elapsed_time": "6:04:09", "remaining_time": "5:34:20"}
392
+ {"current_steps": 392, "total_steps": 750, "loss": 0.7961, "lr": 5.476333191493108e-06, "epoch": 1.568, "percentage": 52.27, "elapsed_time": "6:04:54", "remaining_time": "5:33:15"}
393
+ {"current_steps": 393, "total_steps": 750, "loss": 0.8384, "lr": 5.453162900988902e-06, "epoch": 1.572, "percentage": 52.4, "elapsed_time": "6:05:55", "remaining_time": "5:32:23"}
394
+ {"current_steps": 394, "total_steps": 750, "loss": 0.8287, "lr": 5.429982794231221e-06, "epoch": 1.576, "percentage": 52.53, "elapsed_time": "6:06:59", "remaining_time": "5:31:35"}
395
+ {"current_steps": 395, "total_steps": 750, "loss": 0.825, "lr": 5.406793373339292e-06, "epoch": 1.58, "percentage": 52.67, "elapsed_time": "6:07:57", "remaining_time": "5:30:41"}
396
+ {"current_steps": 396, "total_steps": 750, "loss": 0.8195, "lr": 5.383595140634093e-06, "epoch": 1.584, "percentage": 52.8, "elapsed_time": "6:08:53", "remaining_time": "5:29:45"}
397
+ {"current_steps": 397, "total_steps": 750, "loss": 0.7859, "lr": 5.360388598627487e-06, "epoch": 1.588, "percentage": 52.93, "elapsed_time": "6:09:54", "remaining_time": "5:28:54"}
398
+ {"current_steps": 398, "total_steps": 750, "loss": 0.7739, "lr": 5.337174250011326e-06, "epoch": 1.592, "percentage": 53.07, "elapsed_time": "6:10:42", "remaining_time": "5:27:51"}
399
+ {"current_steps": 399, "total_steps": 750, "loss": 0.8241, "lr": 5.3139525976465675e-06, "epoch": 1.596, "percentage": 53.2, "elapsed_time": "6:11:46", "remaining_time": "5:27:03"}
400
+ {"current_steps": 400, "total_steps": 750, "loss": 0.8186, "lr": 5.290724144552379e-06, "epoch": 1.6, "percentage": 53.33, "elapsed_time": "6:12:39", "remaining_time": "5:26:04"}
401
+ {"current_steps": 401, "total_steps": 750, "loss": 0.7989, "lr": 5.267489393895247e-06, "epoch": 1.604, "percentage": 53.47, "elapsed_time": "6:13:32", "remaining_time": "5:25:06"}
402
+ {"current_steps": 402, "total_steps": 750, "loss": 0.8459, "lr": 5.244248848978067e-06, "epoch": 1.608, "percentage": 53.6, "elapsed_time": "6:14:35", "remaining_time": "5:24:16"}
403
+ {"current_steps": 403, "total_steps": 750, "loss": 0.8308, "lr": 5.221003013229253e-06, "epoch": 1.612, "percentage": 53.73, "elapsed_time": "6:15:28", "remaining_time": "5:23:17"}
404
+ {"current_steps": 404, "total_steps": 750, "loss": 0.8204, "lr": 5.197752390191827e-06, "epoch": 1.616, "percentage": 53.87, "elapsed_time": "6:16:26", "remaining_time": "5:22:24"}
405
+ {"current_steps": 405, "total_steps": 750, "loss": 0.8598, "lr": 5.174497483512506e-06, "epoch": 1.62, "percentage": 54.0, "elapsed_time": "6:17:24", "remaining_time": "5:21:30"}
406
+ {"current_steps": 406, "total_steps": 750, "loss": 0.8271, "lr": 5.151238796930804e-06, "epoch": 1.624, "percentage": 54.13, "elapsed_time": "6:18:16", "remaining_time": "5:20:30"}
407
+ {"current_steps": 407, "total_steps": 750, "loss": 0.8019, "lr": 5.127976834268112e-06, "epoch": 1.6280000000000001, "percentage": 54.27, "elapsed_time": "6:19:08", "remaining_time": "5:19:31"}
408
+ {"current_steps": 408, "total_steps": 750, "loss": 0.8342, "lr": 5.1047120994167855e-06, "epoch": 1.6320000000000001, "percentage": 54.4, "elapsed_time": "6:20:01", "remaining_time": "5:18:32"}
409
+ {"current_steps": 409, "total_steps": 750, "loss": 0.8294, "lr": 5.081445096329229e-06, "epoch": 1.6360000000000001, "percentage": 54.53, "elapsed_time": "6:20:49", "remaining_time": "5:17:30"}
410
+ {"current_steps": 410, "total_steps": 750, "loss": 0.797, "lr": 5.0581763290069865e-06, "epoch": 1.6400000000000001, "percentage": 54.67, "elapsed_time": "6:21:40", "remaining_time": "5:16:31"}
411
+ {"current_steps": 411, "total_steps": 750, "loss": 0.7843, "lr": 5.034906301489808e-06, "epoch": 1.6440000000000001, "percentage": 54.8, "elapsed_time": "6:22:37", "remaining_time": "5:15:35"}
412
+ {"current_steps": 412, "total_steps": 750, "loss": 0.7805, "lr": 5.011635517844753e-06, "epoch": 1.6480000000000001, "percentage": 54.93, "elapsed_time": "6:23:19", "remaining_time": "5:14:28"}
413
+ {"current_steps": 413, "total_steps": 750, "loss": 0.8101, "lr": 4.988364482155249e-06, "epoch": 1.6520000000000001, "percentage": 55.07, "elapsed_time": "6:24:13", "remaining_time": "5:13:31"}
414
+ {"current_steps": 414, "total_steps": 750, "loss": 0.7977, "lr": 4.965093698510192e-06, "epoch": 1.6560000000000001, "percentage": 55.2, "elapsed_time": "6:25:11", "remaining_time": "5:12:37"}
415
+ {"current_steps": 415, "total_steps": 750, "loss": 0.8385, "lr": 4.941823670993016e-06, "epoch": 1.6600000000000001, "percentage": 55.33, "elapsed_time": "6:26:08", "remaining_time": "5:11:42"}
416
+ {"current_steps": 416, "total_steps": 750, "loss": 0.8213, "lr": 4.9185549036707715e-06, "epoch": 1.6640000000000001, "percentage": 55.47, "elapsed_time": "6:27:13", "remaining_time": "5:10:53"}
417
+ {"current_steps": 417, "total_steps": 750, "loss": 0.8416, "lr": 4.895287900583216e-06, "epoch": 1.6680000000000001, "percentage": 55.6, "elapsed_time": "6:28:07", "remaining_time": "5:09:56"}
418
+ {"current_steps": 418, "total_steps": 750, "loss": 0.809, "lr": 4.87202316573189e-06, "epoch": 1.6720000000000002, "percentage": 55.73, "elapsed_time": "6:29:00", "remaining_time": "5:08:58"}
419
+ {"current_steps": 419, "total_steps": 750, "loss": 0.8451, "lr": 4.8487612030691975e-06, "epoch": 1.6760000000000002, "percentage": 55.87, "elapsed_time": "6:30:01", "remaining_time": "5:08:06"}
420
+ {"current_steps": 420, "total_steps": 750, "loss": 0.8033, "lr": 4.825502516487497e-06, "epoch": 1.6800000000000002, "percentage": 56.0, "elapsed_time": "6:30:50", "remaining_time": "5:07:05"}
421
+ {"current_steps": 421, "total_steps": 750, "loss": 0.7785, "lr": 4.802247609808175e-06, "epoch": 1.6840000000000002, "percentage": 56.13, "elapsed_time": "6:31:46", "remaining_time": "5:06:09"}
422
+ {"current_steps": 422, "total_steps": 750, "loss": 0.8273, "lr": 4.778996986770747e-06, "epoch": 1.688, "percentage": 56.27, "elapsed_time": "6:32:43", "remaining_time": "5:05:14"}
423
+ {"current_steps": 423, "total_steps": 750, "loss": 0.8136, "lr": 4.755751151021934e-06, "epoch": 1.692, "percentage": 56.4, "elapsed_time": "6:33:39", "remaining_time": "5:04:19"}
424
+ {"current_steps": 424, "total_steps": 750, "loss": 0.7944, "lr": 4.732510606104754e-06, "epoch": 1.696, "percentage": 56.53, "elapsed_time": "6:34:30", "remaining_time": "5:03:19"}
425
+ {"current_steps": 425, "total_steps": 750, "loss": 0.7787, "lr": 4.7092758554476215e-06, "epoch": 1.7, "percentage": 56.67, "elapsed_time": "6:35:17", "remaining_time": "5:02:16"}
426
+ {"current_steps": 426, "total_steps": 750, "loss": 0.8449, "lr": 4.686047402353433e-06, "epoch": 1.704, "percentage": 56.8, "elapsed_time": "6:36:11", "remaining_time": "5:01:19"}
427
+ {"current_steps": 427, "total_steps": 750, "loss": 0.8656, "lr": 4.662825749988675e-06, "epoch": 1.708, "percentage": 56.93, "elapsed_time": "6:37:09", "remaining_time": "5:00:25"}
428
+ {"current_steps": 428, "total_steps": 750, "loss": 0.8263, "lr": 4.639611401372514e-06, "epoch": 1.712, "percentage": 57.07, "elapsed_time": "6:38:00", "remaining_time": "4:59:26"}
429
+ {"current_steps": 429, "total_steps": 750, "loss": 0.7882, "lr": 4.6164048593659076e-06, "epoch": 1.716, "percentage": 57.2, "elapsed_time": "6:38:57", "remaining_time": "4:58:31"}
430
+ {"current_steps": 430, "total_steps": 750, "loss": 0.8271, "lr": 4.59320662666071e-06, "epoch": 1.72, "percentage": 57.33, "elapsed_time": "6:40:07", "remaining_time": "4:57:46"}
431
+ {"current_steps": 431, "total_steps": 750, "loss": 0.8182, "lr": 4.570017205768779e-06, "epoch": 1.724, "percentage": 57.47, "elapsed_time": "6:41:01", "remaining_time": "4:56:48"}
432
+ {"current_steps": 432, "total_steps": 750, "loss": 0.7873, "lr": 4.546837099011101e-06, "epoch": 1.728, "percentage": 57.6, "elapsed_time": "6:41:54", "remaining_time": "4:55:50"}
433
+ {"current_steps": 433, "total_steps": 750, "loss": 0.8012, "lr": 4.523666808506893e-06, "epoch": 1.732, "percentage": 57.73, "elapsed_time": "6:42:51", "remaining_time": "4:54:55"}
434
+ {"current_steps": 434, "total_steps": 750, "loss": 0.8149, "lr": 4.500506836162746e-06, "epoch": 1.736, "percentage": 57.87, "elapsed_time": "6:43:46", "remaining_time": "4:53:59"}
435
+ {"current_steps": 435, "total_steps": 750, "loss": 0.8252, "lr": 4.477357683661734e-06, "epoch": 1.74, "percentage": 58.0, "elapsed_time": "6:44:47", "remaining_time": "4:53:07"}
436
+ {"current_steps": 436, "total_steps": 750, "loss": 0.7868, "lr": 4.45421985245256e-06, "epoch": 1.744, "percentage": 58.13, "elapsed_time": "6:45:40", "remaining_time": "4:52:09"}
437
+ {"current_steps": 437, "total_steps": 750, "loss": 0.8138, "lr": 4.431093843738693e-06, "epoch": 1.748, "percentage": 58.27, "elapsed_time": "6:46:42", "remaining_time": "4:51:18"}
438
+ {"current_steps": 438, "total_steps": 750, "loss": 0.8376, "lr": 4.4079801584674955e-06, "epoch": 1.752, "percentage": 58.4, "elapsed_time": "6:47:39", "remaining_time": "4:50:23"}
439
+ {"current_steps": 439, "total_steps": 750, "loss": 0.8347, "lr": 4.384879297319398e-06, "epoch": 1.756, "percentage": 58.53, "elapsed_time": "6:48:30", "remaining_time": "4:49:23"}
440
+ {"current_steps": 440, "total_steps": 750, "loss": 0.8501, "lr": 4.361791760697027e-06, "epoch": 1.76, "percentage": 58.67, "elapsed_time": "6:49:26", "remaining_time": "4:48:28"}
441
+ {"current_steps": 441, "total_steps": 750, "loss": 0.8194, "lr": 4.3387180487143875e-06, "epoch": 1.764, "percentage": 58.8, "elapsed_time": "6:50:23", "remaining_time": "4:47:33"}
442
+ {"current_steps": 442, "total_steps": 750, "loss": 0.8352, "lr": 4.315658661186016e-06, "epoch": 1.768, "percentage": 58.93, "elapsed_time": "6:51:12", "remaining_time": "4:46:32"}
443
+ {"current_steps": 443, "total_steps": 750, "loss": 0.8033, "lr": 4.2926140976161555e-06, "epoch": 1.772, "percentage": 59.07, "elapsed_time": "6:52:03", "remaining_time": "4:45:33"}
444
+ {"current_steps": 444, "total_steps": 750, "loss": 0.7962, "lr": 4.269584857187942e-06, "epoch": 1.776, "percentage": 59.2, "elapsed_time": "6:53:08", "remaining_time": "4:44:44"}
445
+ {"current_steps": 445, "total_steps": 750, "loss": 0.8152, "lr": 4.246571438752585e-06, "epoch": 1.78, "percentage": 59.33, "elapsed_time": "6:53:59", "remaining_time": "4:43:44"}
446
+ {"current_steps": 446, "total_steps": 750, "loss": 0.8351, "lr": 4.2235743408185635e-06, "epoch": 1.784, "percentage": 59.47, "elapsed_time": "6:54:55", "remaining_time": "4:42:48"}
447
+ {"current_steps": 447, "total_steps": 750, "loss": 0.8292, "lr": 4.200594061540827e-06, "epoch": 1.788, "percentage": 59.6, "elapsed_time": "6:55:53", "remaining_time": "4:41:55"}
448
+ {"current_steps": 448, "total_steps": 750, "loss": 0.8349, "lr": 4.1776310987100054e-06, "epoch": 1.792, "percentage": 59.73, "elapsed_time": "6:56:49", "remaining_time": "4:40:59"}
449
+ {"current_steps": 449, "total_steps": 750, "loss": 0.841, "lr": 4.154685949741631e-06, "epoch": 1.796, "percentage": 59.87, "elapsed_time": "6:57:37", "remaining_time": "4:39:58"}
450
+ {"current_steps": 450, "total_steps": 750, "loss": 0.8478, "lr": 4.131759111665349e-06, "epoch": 1.8, "percentage": 60.0, "elapsed_time": "6:58:41", "remaining_time": "4:39:07"}
451
+ {"current_steps": 451, "total_steps": 750, "loss": 0.842, "lr": 4.108851081114169e-06, "epoch": 1.804, "percentage": 60.13, "elapsed_time": "6:59:32", "remaining_time": "4:38:08"}
452
+ {"current_steps": 452, "total_steps": 750, "loss": 0.8085, "lr": 4.0859623543136935e-06, "epoch": 1.808, "percentage": 60.27, "elapsed_time": "7:00:31", "remaining_time": "4:37:15"}
453
+ {"current_steps": 453, "total_steps": 750, "loss": 0.8226, "lr": 4.063093427071376e-06, "epoch": 1.812, "percentage": 60.4, "elapsed_time": "7:01:28", "remaining_time": "4:36:19"}
454
+ {"current_steps": 454, "total_steps": 750, "loss": 0.7907, "lr": 4.040244794765783e-06, "epoch": 1.8159999999999998, "percentage": 60.53, "elapsed_time": "7:02:18", "remaining_time": "4:35:19"}
455
+ {"current_steps": 455, "total_steps": 750, "loss": 0.8148, "lr": 4.017416952335849e-06, "epoch": 1.8199999999999998, "percentage": 60.67, "elapsed_time": "7:03:17", "remaining_time": "4:34:26"}
456
+ {"current_steps": 456, "total_steps": 750, "loss": 0.8446, "lr": 3.994610394270178e-06, "epoch": 1.8239999999999998, "percentage": 60.8, "elapsed_time": "7:04:18", "remaining_time": "4:33:33"}
457
+ {"current_steps": 457, "total_steps": 750, "loss": 0.8151, "lr": 3.971825614596308e-06, "epoch": 1.8279999999999998, "percentage": 60.93, "elapsed_time": "7:05:17", "remaining_time": "4:32:40"}
458
+ {"current_steps": 458, "total_steps": 750, "loss": 0.8365, "lr": 3.949063106870031e-06, "epoch": 1.8319999999999999, "percentage": 61.07, "elapsed_time": "7:06:20", "remaining_time": "4:31:48"}
459
+ {"current_steps": 459, "total_steps": 750, "loss": 0.8226, "lr": 3.926323364164684e-06, "epoch": 1.8359999999999999, "percentage": 61.2, "elapsed_time": "7:07:28", "remaining_time": "4:31:00"}
460
+ {"current_steps": 460, "total_steps": 750, "loss": 0.7785, "lr": 3.903606879060483e-06, "epoch": 1.8399999999999999, "percentage": 61.33, "elapsed_time": "7:08:23", "remaining_time": "4:30:04"}
461
+ {"current_steps": 461, "total_steps": 750, "loss": 0.7751, "lr": 3.880914143633844e-06, "epoch": 1.8439999999999999, "percentage": 61.47, "elapsed_time": "7:09:08", "remaining_time": "4:29:01"}
462
+ {"current_steps": 462, "total_steps": 750, "loss": 0.8252, "lr": 3.8582456494467214e-06, "epoch": 1.8479999999999999, "percentage": 61.6, "elapsed_time": "7:10:15", "remaining_time": "4:28:12"}
463
+ {"current_steps": 463, "total_steps": 750, "loss": 0.782, "lr": 3.835601887535971e-06, "epoch": 1.8519999999999999, "percentage": 61.73, "elapsed_time": "7:11:11", "remaining_time": "4:27:17"}
464
+ {"current_steps": 464, "total_steps": 750, "loss": 0.7884, "lr": 3.812983348402703e-06, "epoch": 1.8559999999999999, "percentage": 61.87, "elapsed_time": "7:12:04", "remaining_time": "4:26:19"}
465
+ {"current_steps": 465, "total_steps": 750, "loss": 0.8269, "lr": 3.790390522001662e-06, "epoch": 1.8599999999999999, "percentage": 62.0, "elapsed_time": "7:13:01", "remaining_time": "4:25:24"}
466
+ {"current_steps": 466, "total_steps": 750, "loss": 0.8175, "lr": 3.767823897730612e-06, "epoch": 1.8639999999999999, "percentage": 62.13, "elapsed_time": "7:13:57", "remaining_time": "4:24:28"}
467
+ {"current_steps": 467, "total_steps": 750, "loss": 0.8265, "lr": 3.745283964419736e-06, "epoch": 1.8679999999999999, "percentage": 62.27, "elapsed_time": "7:14:53", "remaining_time": "4:23:32"}
468
+ {"current_steps": 468, "total_steps": 750, "loss": 0.8422, "lr": 3.7227712103210485e-06, "epoch": 1.8719999999999999, "percentage": 62.4, "elapsed_time": "7:15:45", "remaining_time": "4:22:34"}
469
+ {"current_steps": 469, "total_steps": 750, "loss": 0.8218, "lr": 3.700286123097814e-06, "epoch": 1.876, "percentage": 62.53, "elapsed_time": "7:16:38", "remaining_time": "4:21:37"}
470
+ {"current_steps": 470, "total_steps": 750, "loss": 0.7906, "lr": 3.6778291898139907e-06, "epoch": 1.88, "percentage": 62.67, "elapsed_time": "7:17:23", "remaining_time": "4:20:34"}
471
+ {"current_steps": 471, "total_steps": 750, "loss": 0.7864, "lr": 3.655400896923672e-06, "epoch": 1.884, "percentage": 62.8, "elapsed_time": "7:18:12", "remaining_time": "4:19:34"}
472
+ {"current_steps": 472, "total_steps": 750, "loss": 0.8228, "lr": 3.633001730260558e-06, "epoch": 1.888, "percentage": 62.93, "elapsed_time": "7:19:13", "remaining_time": "4:18:42"}
473
+ {"current_steps": 473, "total_steps": 750, "loss": 0.816, "lr": 3.6106321750274275e-06, "epoch": 1.892, "percentage": 63.07, "elapsed_time": "7:20:08", "remaining_time": "4:17:45"}
474
+ {"current_steps": 474, "total_steps": 750, "loss": 0.8663, "lr": 3.5882927157856175e-06, "epoch": 1.896, "percentage": 63.2, "elapsed_time": "7:21:15", "remaining_time": "4:16:56"}
475
+ {"current_steps": 475, "total_steps": 750, "loss": 0.8209, "lr": 3.5659838364445505e-06, "epoch": 1.9, "percentage": 63.33, "elapsed_time": "7:22:14", "remaining_time": "4:16:02"}
476
+ {"current_steps": 476, "total_steps": 750, "loss": 0.8279, "lr": 3.543706020251223e-06, "epoch": 1.904, "percentage": 63.47, "elapsed_time": "7:23:07", "remaining_time": "4:15:04"}
477
+ {"current_steps": 477, "total_steps": 750, "loss": 0.8156, "lr": 3.521459749779769e-06, "epoch": 1.908, "percentage": 63.6, "elapsed_time": "7:24:08", "remaining_time": "4:14:11"}
478
+ {"current_steps": 478, "total_steps": 750, "loss": 0.8152, "lr": 3.4992455069209717e-06, "epoch": 1.912, "percentage": 63.73, "elapsed_time": "7:25:00", "remaining_time": "4:13:13"}
479
+ {"current_steps": 479, "total_steps": 750, "loss": 0.832, "lr": 3.4770637728718608e-06, "epoch": 1.916, "percentage": 63.87, "elapsed_time": "7:25:56", "remaining_time": "4:12:17"}
480
+ {"current_steps": 480, "total_steps": 750, "loss": 0.8177, "lr": 3.4549150281252635e-06, "epoch": 1.92, "percentage": 64.0, "elapsed_time": "7:26:59", "remaining_time": "4:11:26"}
481
+ {"current_steps": 481, "total_steps": 750, "loss": 0.8401, "lr": 3.4327997524594026e-06, "epoch": 1.924, "percentage": 64.13, "elapsed_time": "7:27:58", "remaining_time": "4:10:31"}
482
+ {"current_steps": 482, "total_steps": 750, "loss": 0.8577, "lr": 3.4107184249275114e-06, "epoch": 1.928, "percentage": 64.27, "elapsed_time": "7:29:02", "remaining_time": "4:09:40"}
483
+ {"current_steps": 483, "total_steps": 750, "loss": 0.8171, "lr": 3.3886715238474454e-06, "epoch": 1.932, "percentage": 64.4, "elapsed_time": "7:30:02", "remaining_time": "4:08:46"}
484
+ {"current_steps": 484, "total_steps": 750, "loss": 0.8573, "lr": 3.3666595267913293e-06, "epoch": 1.936, "percentage": 64.53, "elapsed_time": "7:31:07", "remaining_time": "4:07:55"}
485
+ {"current_steps": 485, "total_steps": 750, "loss": 0.8174, "lr": 3.3446829105752103e-06, "epoch": 1.94, "percentage": 64.67, "elapsed_time": "7:32:12", "remaining_time": "4:07:04"}
486
+ {"current_steps": 486, "total_steps": 750, "loss": 0.8119, "lr": 3.322742151248726e-06, "epoch": 1.944, "percentage": 64.8, "elapsed_time": "7:33:02", "remaining_time": "4:06:05"}
487
+ {"current_steps": 487, "total_steps": 750, "loss": 0.8051, "lr": 3.3008377240847955e-06, "epoch": 1.948, "percentage": 64.93, "elapsed_time": "7:34:03", "remaining_time": "4:05:12"}
488
+ {"current_steps": 488, "total_steps": 750, "loss": 0.8547, "lr": 3.2789701035693242e-06, "epoch": 1.952, "percentage": 65.07, "elapsed_time": "7:34:56", "remaining_time": "4:04:15"}
489
+ {"current_steps": 489, "total_steps": 750, "loss": 0.8522, "lr": 3.2571397633909252e-06, "epoch": 1.956, "percentage": 65.2, "elapsed_time": "7:35:59", "remaining_time": "4:03:22"}
490
+ {"current_steps": 490, "total_steps": 750, "loss": 0.8417, "lr": 3.2353471764306567e-06, "epoch": 1.96, "percentage": 65.33, "elapsed_time": "7:37:05", "remaining_time": "4:02:32"}
491
+ {"current_steps": 491, "total_steps": 750, "loss": 0.7664, "lr": 3.2135928147517803e-06, "epoch": 1.964, "percentage": 65.47, "elapsed_time": "7:37:52", "remaining_time": "4:01:31"}
492
+ {"current_steps": 492, "total_steps": 750, "loss": 0.8248, "lr": 3.1918771495895395e-06, "epoch": 1.968, "percentage": 65.6, "elapsed_time": "7:38:50", "remaining_time": "4:00:36"}
493
+ {"current_steps": 493, "total_steps": 750, "loss": 0.8189, "lr": 3.1702006513409393e-06, "epoch": 1.972, "percentage": 65.73, "elapsed_time": "7:39:43", "remaining_time": "3:59:39"}
494
+ {"current_steps": 494, "total_steps": 750, "loss": 0.8193, "lr": 3.148563789554575e-06, "epoch": 1.976, "percentage": 65.87, "elapsed_time": "7:40:39", "remaining_time": "3:58:43"}
495
+ {"current_steps": 495, "total_steps": 750, "loss": 0.8297, "lr": 3.12696703292044e-06, "epoch": 1.98, "percentage": 66.0, "elapsed_time": "7:41:30", "remaining_time": "3:57:44"}
496
+ {"current_steps": 496, "total_steps": 750, "loss": 0.7984, "lr": 3.105410849259796e-06, "epoch": 1.984, "percentage": 66.13, "elapsed_time": "7:42:27", "remaining_time": "3:56:49"}
497
+ {"current_steps": 497, "total_steps": 750, "loss": 0.8072, "lr": 3.0838957055150136e-06, "epoch": 1.988, "percentage": 66.27, "elapsed_time": "7:43:16", "remaining_time": "3:55:50"}
498
+ {"current_steps": 498, "total_steps": 750, "loss": 0.7919, "lr": 3.0624220677394854e-06, "epoch": 1.992, "percentage": 66.4, "elapsed_time": "7:44:12", "remaining_time": "3:54:54"}
499
+ {"current_steps": 499, "total_steps": 750, "loss": 0.8406, "lr": 3.040990401087508e-06, "epoch": 1.996, "percentage": 66.53, "elapsed_time": "7:45:14", "remaining_time": "3:54:01"}
500
+ {"current_steps": 500, "total_steps": 750, "loss": 0.7982, "lr": 3.019601169804216e-06, "epoch": 2.0, "percentage": 66.67, "elapsed_time": "7:46:11", "remaining_time": "3:53:05"}
501
+ {"current_steps": 501, "total_steps": 750, "loss": 0.7587, "lr": 2.9982548372155264e-06, "epoch": 2.004, "percentage": 66.8, "elapsed_time": "7:48:10", "remaining_time": "3:52:40"}
502
+ {"current_steps": 502, "total_steps": 750, "loss": 0.7893, "lr": 2.9769518657180953e-06, "epoch": 2.008, "percentage": 66.93, "elapsed_time": "7:49:01", "remaining_time": "3:51:42"}