neginr commited on
Commit
a100655
·
verified ·
1 Parent(s): e502559

Training in progress, epoch 3

Browse files
model-00001-of-00004.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:c0f5a141bdcbd87eaec7f19ed08de21401b5d84fc8adbf141811fe3cc6d84512
3
  size 4877660776
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:90d621352746c1a7b2b72138296d131e167d8c691da627778451b7d3c3cd7033
3
  size 4877660776
model-00002-of-00004.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:837cb881a4501b2164a8cdd444ab6552aafce76bce2c4e65c19201cc88a05782
3
  size 4932751008
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b202fc9c6e180c0204cd02ac9f48791d72878842bc818b91276c33d57d2ba5ce
3
  size 4932751008
model-00003-of-00004.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:8dd107eeb00bc0d474f8d73ec8ac2067e75050dc6bae92f321ce255e47afcfbf
3
  size 4330865200
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ce27d01988836c413c5af10d00ba1e55fa11834cba04936eba152995e73ef23c
3
  size 4330865200
model-00004-of-00004.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:86edd7e08e1690c559e435b6ee165e96b2359b95d74e89b095dd6a4235979492
3
  size 1089994880
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f62013cb7342fc78c6e79398d09ea31cad5da5fb0ef3f79bf4b2abd8078b1357
3
  size 1089994880
trainer_log.jsonl CHANGED
@@ -357,3 +357,113 @@
357
  {"current_steps": 332, "total_steps": 550, "loss": 0.3276, "lr": 3.25546273227348e-05, "epoch": 3.01131221719457, "percentage": 60.36, "elapsed_time": "4:35:56", "remaining_time": "3:01:11"}
358
  {"current_steps": 333, "total_steps": 550, "loss": 0.322, "lr": 3.230534935874958e-05, "epoch": 3.020361990950226, "percentage": 60.55, "elapsed_time": "4:36:44", "remaining_time": "3:00:20"}
359
  {"current_steps": 334, "total_steps": 550, "loss": 0.3247, "lr": 3.205638133417019e-05, "epoch": 3.0294117647058822, "percentage": 60.73, "elapsed_time": "4:37:33", "remaining_time": "2:59:29"}
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
357
  {"current_steps": 332, "total_steps": 550, "loss": 0.3276, "lr": 3.25546273227348e-05, "epoch": 3.01131221719457, "percentage": 60.36, "elapsed_time": "4:35:56", "remaining_time": "3:01:11"}
358
  {"current_steps": 333, "total_steps": 550, "loss": 0.322, "lr": 3.230534935874958e-05, "epoch": 3.020361990950226, "percentage": 60.55, "elapsed_time": "4:36:44", "remaining_time": "3:00:20"}
359
  {"current_steps": 334, "total_steps": 550, "loss": 0.3247, "lr": 3.205638133417019e-05, "epoch": 3.0294117647058822, "percentage": 60.73, "elapsed_time": "4:37:33", "remaining_time": "2:59:29"}
360
+ {"current_steps": 335, "total_steps": 550, "loss": 0.328, "lr": 3.180773327739238e-05, "epoch": 3.0384615384615383, "percentage": 60.91, "elapsed_time": "4:38:22", "remaining_time": "2:58:39"}
361
+ {"current_steps": 336, "total_steps": 550, "loss": 0.3235, "lr": 3.155941520392362e-05, "epoch": 3.0475113122171944, "percentage": 61.09, "elapsed_time": "4:39:10", "remaining_time": "2:57:48"}
362
+ {"current_steps": 337, "total_steps": 550, "loss": 0.3203, "lr": 3.1311437115979696e-05, "epoch": 3.0565610859728505, "percentage": 61.27, "elapsed_time": "4:39:59", "remaining_time": "2:56:58"}
363
+ {"current_steps": 338, "total_steps": 550, "loss": 0.3221, "lr": 3.1063809002081834e-05, "epoch": 3.065610859728507, "percentage": 61.45, "elapsed_time": "4:40:48", "remaining_time": "2:56:07"}
364
+ {"current_steps": 339, "total_steps": 550, "loss": 0.3226, "lr": 3.0816540836654356e-05, "epoch": 3.074660633484163, "percentage": 61.64, "elapsed_time": "4:41:37", "remaining_time": "2:55:17"}
365
+ {"current_steps": 340, "total_steps": 550, "loss": 0.3214, "lr": 3.0569642579622905e-05, "epoch": 3.083710407239819, "percentage": 61.82, "elapsed_time": "4:42:26", "remaining_time": "2:54:26"}
366
+ {"current_steps": 341, "total_steps": 550, "loss": 0.3225, "lr": 3.0323124176013297e-05, "epoch": 3.0927601809954752, "percentage": 62.0, "elapsed_time": "4:43:14", "remaining_time": "2:53:36"}
367
+ {"current_steps": 342, "total_steps": 550, "loss": 0.3183, "lr": 3.007699555555086e-05, "epoch": 3.1018099547511313, "percentage": 62.18, "elapsed_time": "4:44:03", "remaining_time": "2:52:45"}
368
+ {"current_steps": 343, "total_steps": 550, "loss": 0.3221, "lr": 2.9831266632260534e-05, "epoch": 3.1108597285067874, "percentage": 62.36, "elapsed_time": "4:44:52", "remaining_time": "2:51:55"}
369
+ {"current_steps": 344, "total_steps": 550, "loss": 0.3233, "lr": 2.958594730406752e-05, "epoch": 3.1199095022624435, "percentage": 62.55, "elapsed_time": "4:45:41", "remaining_time": "2:51:04"}
370
+ {"current_steps": 345, "total_steps": 550, "loss": 0.3232, "lr": 2.9341047452398607e-05, "epoch": 3.1289592760180995, "percentage": 62.73, "elapsed_time": "4:46:30", "remaining_time": "2:50:14"}
371
+ {"current_steps": 346, "total_steps": 550, "loss": 0.3217, "lr": 2.9096576941784095e-05, "epoch": 3.1380090497737556, "percentage": 62.91, "elapsed_time": "4:47:19", "remaining_time": "2:49:24"}
372
+ {"current_steps": 347, "total_steps": 550, "loss": 0.3294, "lr": 2.8852545619460495e-05, "epoch": 3.1470588235294117, "percentage": 63.09, "elapsed_time": "4:48:07", "remaining_time": "2:48:33"}
373
+ {"current_steps": 348, "total_steps": 550, "loss": 0.3178, "lr": 2.860896331497391e-05, "epoch": 3.1561085972850678, "percentage": 63.27, "elapsed_time": "4:48:56", "remaining_time": "2:47:43"}
374
+ {"current_steps": 349, "total_steps": 550, "loss": 0.3208, "lr": 2.8365839839784038e-05, "epoch": 3.165158371040724, "percentage": 63.45, "elapsed_time": "4:49:44", "remaining_time": "2:46:52"}
375
+ {"current_steps": 350, "total_steps": 550, "loss": 0.3252, "lr": 2.8123184986869022e-05, "epoch": 3.17420814479638, "percentage": 63.64, "elapsed_time": "4:50:33", "remaining_time": "2:46:01"}
376
+ {"current_steps": 351, "total_steps": 550, "loss": 0.3219, "lr": 2.7881008530330914e-05, "epoch": 3.183257918552036, "percentage": 63.82, "elapsed_time": "4:51:21", "remaining_time": "2:45:11"}
377
+ {"current_steps": 352, "total_steps": 550, "loss": 0.3279, "lr": 2.7639320225002108e-05, "epoch": 3.1923076923076925, "percentage": 64.0, "elapsed_time": "4:52:09", "remaining_time": "2:44:20"}
378
+ {"current_steps": 353, "total_steps": 550, "loss": 0.3211, "lr": 2.7398129806052298e-05, "epoch": 3.2013574660633486, "percentage": 64.18, "elapsed_time": "4:52:58", "remaining_time": "2:43:30"}
379
+ {"current_steps": 354, "total_steps": 550, "loss": 0.3264, "lr": 2.715744698859637e-05, "epoch": 3.2104072398190047, "percentage": 64.36, "elapsed_time": "4:53:46", "remaining_time": "2:42:39"}
380
+ {"current_steps": 355, "total_steps": 550, "loss": 0.3247, "lr": 2.691728146730314e-05, "epoch": 3.2194570135746607, "percentage": 64.55, "elapsed_time": "4:54:35", "remaining_time": "2:41:48"}
381
+ {"current_steps": 356, "total_steps": 550, "loss": 0.3219, "lr": 2.6677642916004772e-05, "epoch": 3.228506787330317, "percentage": 64.73, "elapsed_time": "4:55:23", "remaining_time": "2:40:58"}
382
+ {"current_steps": 357, "total_steps": 550, "loss": 0.3224, "lr": 2.6438540987307174e-05, "epoch": 3.237556561085973, "percentage": 64.91, "elapsed_time": "4:56:12", "remaining_time": "2:40:07"}
383
+ {"current_steps": 358, "total_steps": 550, "loss": 0.3287, "lr": 2.6199985312201185e-05, "epoch": 3.246606334841629, "percentage": 65.09, "elapsed_time": "4:57:00", "remaining_time": "2:39:17"}
384
+ {"current_steps": 359, "total_steps": 550, "loss": 0.3195, "lr": 2.5961985499674587e-05, "epoch": 3.255656108597285, "percentage": 65.27, "elapsed_time": "4:57:49", "remaining_time": "2:38:27"}
385
+ {"current_steps": 360, "total_steps": 550, "loss": 0.3155, "lr": 2.5724551136325132e-05, "epoch": 3.264705882352941, "percentage": 65.45, "elapsed_time": "4:58:37", "remaining_time": "2:37:36"}
386
+ {"current_steps": 361, "total_steps": 550, "loss": 0.3245, "lr": 2.5487691785974366e-05, "epoch": 3.273755656108597, "percentage": 65.64, "elapsed_time": "4:59:26", "remaining_time": "2:36:46"}
387
+ {"current_steps": 362, "total_steps": 550, "loss": 0.3244, "lr": 2.5251416989282377e-05, "epoch": 3.2828054298642533, "percentage": 65.82, "elapsed_time": "5:00:14", "remaining_time": "2:35:55"}
388
+ {"current_steps": 363, "total_steps": 550, "loss": 0.3204, "lr": 2.501573626336352e-05, "epoch": 3.2918552036199094, "percentage": 66.0, "elapsed_time": "5:01:03", "remaining_time": "2:35:05"}
389
+ {"current_steps": 364, "total_steps": 550, "loss": 0.319, "lr": 2.478065910140308e-05, "epoch": 3.3009049773755654, "percentage": 66.18, "elapsed_time": "5:01:52", "remaining_time": "2:34:15"}
390
+ {"current_steps": 365, "total_steps": 550, "loss": 0.3234, "lr": 2.4546194972274852e-05, "epoch": 3.3099547511312215, "percentage": 66.36, "elapsed_time": "5:02:40", "remaining_time": "2:33:24"}
391
+ {"current_steps": 366, "total_steps": 550, "loss": 0.3222, "lr": 2.431235332015978e-05, "epoch": 3.3190045248868776, "percentage": 66.55, "elapsed_time": "5:03:29", "remaining_time": "2:32:34"}
392
+ {"current_steps": 367, "total_steps": 550, "loss": 0.3196, "lr": 2.4079143564165524e-05, "epoch": 3.328054298642534, "percentage": 66.73, "elapsed_time": "5:04:17", "remaining_time": "2:31:43"}
393
+ {"current_steps": 368, "total_steps": 550, "loss": 0.3238, "lr": 2.3846575097947015e-05, "epoch": 3.33710407239819, "percentage": 66.91, "elapsed_time": "5:05:05", "remaining_time": "2:30:53"}
394
+ {"current_steps": 369, "total_steps": 550, "loss": 0.3281, "lr": 2.361465728932819e-05, "epoch": 3.3461538461538463, "percentage": 67.09, "elapsed_time": "5:05:53", "remaining_time": "2:30:02"}
395
+ {"current_steps": 370, "total_steps": 550, "loss": 0.3197, "lr": 2.338339947992455e-05, "epoch": 3.3552036199095023, "percentage": 67.27, "elapsed_time": "5:06:42", "remaining_time": "2:29:12"}
396
+ {"current_steps": 371, "total_steps": 550, "loss": 0.3217, "lr": 2.315281098476694e-05, "epoch": 3.3642533936651584, "percentage": 67.45, "elapsed_time": "5:07:30", "remaining_time": "2:28:22"}
397
+ {"current_steps": 372, "total_steps": 550, "loss": 0.3244, "lr": 2.2922901091926334e-05, "epoch": 3.3733031674208145, "percentage": 67.64, "elapsed_time": "5:08:19", "remaining_time": "2:27:31"}
398
+ {"current_steps": 373, "total_steps": 550, "loss": 0.3229, "lr": 2.269367906213966e-05, "epoch": 3.3823529411764706, "percentage": 67.82, "elapsed_time": "5:09:07", "remaining_time": "2:26:41"}
399
+ {"current_steps": 374, "total_steps": 550, "loss": 0.3246, "lr": 2.24651541284369e-05, "epoch": 3.3914027149321266, "percentage": 68.0, "elapsed_time": "5:09:55", "remaining_time": "2:25:50"}
400
+ {"current_steps": 375, "total_steps": 550, "loss": 0.3255, "lr": 2.2237335495769035e-05, "epoch": 3.4004524886877827, "percentage": 68.18, "elapsed_time": "5:10:43", "remaining_time": "2:25:00"}
401
+ {"current_steps": 376, "total_steps": 550, "loss": 0.3222, "lr": 2.2010232340637375e-05, "epoch": 3.409502262443439, "percentage": 68.36, "elapsed_time": "5:11:32", "remaining_time": "2:24:10"}
402
+ {"current_steps": 377, "total_steps": 550, "loss": 0.3188, "lr": 2.1783853810723895e-05, "epoch": 3.418552036199095, "percentage": 68.55, "elapsed_time": "5:12:20", "remaining_time": "2:23:19"}
403
+ {"current_steps": 378, "total_steps": 550, "loss": 0.3233, "lr": 2.155820902452276e-05, "epoch": 3.427601809954751, "percentage": 68.73, "elapsed_time": "5:13:09", "remaining_time": "2:22:29"}
404
+ {"current_steps": 379, "total_steps": 550, "loss": 0.32, "lr": 2.1333307070973054e-05, "epoch": 3.4366515837104075, "percentage": 68.91, "elapsed_time": "5:13:58", "remaining_time": "2:21:39"}
405
+ {"current_steps": 380, "total_steps": 550, "loss": 0.3234, "lr": 2.11091570090927e-05, "epoch": 3.4457013574660635, "percentage": 69.09, "elapsed_time": "5:14:46", "remaining_time": "2:20:49"}
406
+ {"current_steps": 381, "total_steps": 550, "loss": 0.3236, "lr": 2.0885767867613485e-05, "epoch": 3.4547511312217196, "percentage": 69.27, "elapsed_time": "5:15:35", "remaining_time": "2:19:59"}
407
+ {"current_steps": 382, "total_steps": 550, "loss": 0.3193, "lr": 2.0663148644617443e-05, "epoch": 3.4638009049773757, "percentage": 69.45, "elapsed_time": "5:16:23", "remaining_time": "2:19:08"}
408
+ {"current_steps": 383, "total_steps": 550, "loss": 0.3197, "lr": 2.044130830717445e-05, "epoch": 3.4728506787330318, "percentage": 69.64, "elapsed_time": "5:17:11", "remaining_time": "2:18:18"}
409
+ {"current_steps": 384, "total_steps": 550, "loss": 0.3222, "lr": 2.0220255790980935e-05, "epoch": 3.481900452488688, "percentage": 69.82, "elapsed_time": "5:18:00", "remaining_time": "2:17:28"}
410
+ {"current_steps": 385, "total_steps": 550, "loss": 0.323, "lr": 2.0000000000000012e-05, "epoch": 3.490950226244344, "percentage": 70.0, "elapsed_time": "5:18:48", "remaining_time": "2:16:37"}
411
+ {"current_steps": 386, "total_steps": 550, "loss": 0.3233, "lr": 1.9780549806102827e-05, "epoch": 3.5, "percentage": 70.18, "elapsed_time": "5:19:37", "remaining_time": "2:15:47"}
412
+ {"current_steps": 387, "total_steps": 550, "loss": 0.3328, "lr": 1.9561914048711182e-05, "epoch": 3.509049773755656, "percentage": 70.36, "elapsed_time": "5:20:25", "remaining_time": "2:14:57"}
413
+ {"current_steps": 388, "total_steps": 550, "loss": 0.3206, "lr": 1.934410153444153e-05, "epoch": 3.518099547511312, "percentage": 70.55, "elapsed_time": "5:21:14", "remaining_time": "2:14:07"}
414
+ {"current_steps": 389, "total_steps": 550, "loss": 0.3234, "lr": 1.912712103675017e-05, "epoch": 3.5271493212669682, "percentage": 70.73, "elapsed_time": "5:22:02", "remaining_time": "2:13:17"}
415
+ {"current_steps": 390, "total_steps": 550, "loss": 0.326, "lr": 1.8910981295579903e-05, "epoch": 3.5361990950226243, "percentage": 70.91, "elapsed_time": "5:22:51", "remaining_time": "2:12:27"}
416
+ {"current_steps": 391, "total_steps": 550, "loss": 0.328, "lr": 1.8695691017008005e-05, "epoch": 3.5452488687782804, "percentage": 71.09, "elapsed_time": "5:23:40", "remaining_time": "2:11:37"}
417
+ {"current_steps": 392, "total_steps": 550, "loss": 0.3249, "lr": 1.8481258872895503e-05, "epoch": 3.5542986425339365, "percentage": 71.27, "elapsed_time": "5:24:28", "remaining_time": "2:10:47"}
418
+ {"current_steps": 393, "total_steps": 550, "loss": 0.325, "lr": 1.826769350053789e-05, "epoch": 3.5633484162895925, "percentage": 71.45, "elapsed_time": "5:25:17", "remaining_time": "2:09:57"}
419
+ {"current_steps": 394, "total_steps": 550, "loss": 0.3245, "lr": 1.8055003502317213e-05, "epoch": 3.5723981900452486, "percentage": 71.64, "elapsed_time": "5:26:06", "remaining_time": "2:09:06"}
420
+ {"current_steps": 395, "total_steps": 550, "loss": 0.3257, "lr": 1.7843197445355593e-05, "epoch": 3.581447963800905, "percentage": 71.82, "elapsed_time": "5:26:54", "remaining_time": "2:08:16"}
421
+ {"current_steps": 396, "total_steps": 550, "loss": 0.3267, "lr": 1.7632283861170135e-05, "epoch": 3.590497737556561, "percentage": 72.0, "elapsed_time": "5:27:42", "remaining_time": "2:07:26"}
422
+ {"current_steps": 397, "total_steps": 550, "loss": 0.3257, "lr": 1.7422271245329244e-05, "epoch": 3.5995475113122173, "percentage": 72.18, "elapsed_time": "5:28:31", "remaining_time": "2:06:36"}
423
+ {"current_steps": 398, "total_steps": 550, "loss": 0.3211, "lr": 1.721316805711045e-05, "epoch": 3.6085972850678734, "percentage": 72.36, "elapsed_time": "5:29:19", "remaining_time": "2:05:46"}
424
+ {"current_steps": 399, "total_steps": 550, "loss": 0.3201, "lr": 1.7004982719159712e-05, "epoch": 3.6176470588235294, "percentage": 72.55, "elapsed_time": "5:30:07", "remaining_time": "2:04:56"}
425
+ {"current_steps": 400, "total_steps": 550, "loss": 0.3223, "lr": 1.679772361715208e-05, "epoch": 3.6266968325791855, "percentage": 72.73, "elapsed_time": "5:30:55", "remaining_time": "2:04:05"}
426
+ {"current_steps": 401, "total_steps": 550, "loss": 0.3251, "lr": 1.6591399099453952e-05, "epoch": 3.6357466063348416, "percentage": 72.91, "elapsed_time": "5:31:44", "remaining_time": "2:03:15"}
427
+ {"current_steps": 402, "total_steps": 550, "loss": 0.3264, "lr": 1.6386017476786818e-05, "epoch": 3.6447963800904977, "percentage": 73.09, "elapsed_time": "5:32:32", "remaining_time": "2:02:25"}
428
+ {"current_steps": 403, "total_steps": 550, "loss": 0.3252, "lr": 1.6181587021892484e-05, "epoch": 3.6538461538461537, "percentage": 73.27, "elapsed_time": "5:33:21", "remaining_time": "2:01:35"}
429
+ {"current_steps": 404, "total_steps": 550, "loss": 0.3241, "lr": 1.5978115969199882e-05, "epoch": 3.66289592760181, "percentage": 73.45, "elapsed_time": "5:34:09", "remaining_time": "2:00:45"}
430
+ {"current_steps": 405, "total_steps": 550, "loss": 0.3224, "lr": 1.5775612514493343e-05, "epoch": 3.6719457013574663, "percentage": 73.64, "elapsed_time": "5:34:58", "remaining_time": "1:59:55"}
431
+ {"current_steps": 406, "total_steps": 550, "loss": 0.3214, "lr": 1.557408481458247e-05, "epoch": 3.6809954751131224, "percentage": 73.82, "elapsed_time": "5:35:47", "remaining_time": "1:59:05"}
432
+ {"current_steps": 407, "total_steps": 550, "loss": 0.3243, "lr": 1.537354098697367e-05, "epoch": 3.6900452488687785, "percentage": 74.0, "elapsed_time": "5:36:35", "remaining_time": "1:58:15"}
433
+ {"current_steps": 408, "total_steps": 550, "loss": 0.3262, "lr": 1.5173989109543055e-05, "epoch": 3.6990950226244346, "percentage": 74.18, "elapsed_time": "5:37:24", "remaining_time": "1:57:25"}
434
+ {"current_steps": 409, "total_steps": 550, "loss": 0.3248, "lr": 1.497543722021114e-05, "epoch": 3.7081447963800906, "percentage": 74.36, "elapsed_time": "5:38:12", "remaining_time": "1:56:35"}
435
+ {"current_steps": 410, "total_steps": 550, "loss": 0.3203, "lr": 1.4777893316619114e-05, "epoch": 3.7171945701357467, "percentage": 74.55, "elapsed_time": "5:39:00", "remaining_time": "1:55:45"}
436
+ {"current_steps": 411, "total_steps": 550, "loss": 0.3243, "lr": 1.4581365355806555e-05, "epoch": 3.726244343891403, "percentage": 74.73, "elapsed_time": "5:39:49", "remaining_time": "1:54:55"}
437
+ {"current_steps": 412, "total_steps": 550, "loss": 0.327, "lr": 1.4385861253891111e-05, "epoch": 3.735294117647059, "percentage": 74.91, "elapsed_time": "5:40:37", "remaining_time": "1:54:05"}
438
+ {"current_steps": 413, "total_steps": 550, "loss": 0.3237, "lr": 1.4191388885749487e-05, "epoch": 3.744343891402715, "percentage": 75.09, "elapsed_time": "5:41:26", "remaining_time": "1:53:15"}
439
+ {"current_steps": 414, "total_steps": 550, "loss": 0.3223, "lr": 1.3997956084700301e-05, "epoch": 3.753393665158371, "percentage": 75.27, "elapsed_time": "5:42:14", "remaining_time": "1:52:25"}
440
+ {"current_steps": 415, "total_steps": 550, "loss": 0.3258, "lr": 1.3805570642188602e-05, "epoch": 3.762443438914027, "percentage": 75.45, "elapsed_time": "5:43:02", "remaining_time": "1:51:35"}
441
+ {"current_steps": 416, "total_steps": 550, "loss": 0.3248, "lr": 1.3614240307471942e-05, "epoch": 3.771493212669683, "percentage": 75.64, "elapsed_time": "5:43:51", "remaining_time": "1:50:45"}
442
+ {"current_steps": 417, "total_steps": 550, "loss": 0.3223, "lr": 1.34239727873083e-05, "epoch": 3.7805429864253393, "percentage": 75.82, "elapsed_time": "5:44:39", "remaining_time": "1:49:55"}
443
+ {"current_steps": 418, "total_steps": 550, "loss": 0.321, "lr": 1.3234775745645684e-05, "epoch": 3.7895927601809953, "percentage": 76.0, "elapsed_time": "5:45:27", "remaining_time": "1:49:05"}
444
+ {"current_steps": 419, "total_steps": 550, "loss": 0.324, "lr": 1.3046656803313287e-05, "epoch": 3.7986425339366514, "percentage": 76.18, "elapsed_time": "5:46:16", "remaining_time": "1:48:15"}
445
+ {"current_steps": 420, "total_steps": 550, "loss": 0.3227, "lr": 1.2859623537714719e-05, "epoch": 3.8076923076923075, "percentage": 76.36, "elapsed_time": "5:47:04", "remaining_time": "1:47:25"}
446
+ {"current_steps": 421, "total_steps": 550, "loss": 0.3289, "lr": 1.2673683482522629e-05, "epoch": 3.8167420814479636, "percentage": 76.55, "elapsed_time": "5:47:52", "remaining_time": "1:46:35"}
447
+ {"current_steps": 422, "total_steps": 550, "loss": 0.3236, "lr": 1.248884412737532e-05, "epoch": 3.8257918552036196, "percentage": 76.73, "elapsed_time": "5:48:41", "remaining_time": "1:45:45"}
448
+ {"current_steps": 423, "total_steps": 550, "loss": 0.3273, "lr": 1.2305112917575092e-05, "epoch": 3.834841628959276, "percentage": 76.91, "elapsed_time": "5:49:29", "remaining_time": "1:44:55"}
449
+ {"current_steps": 424, "total_steps": 550, "loss": 0.3224, "lr": 1.2122497253788267e-05, "epoch": 3.8438914027149322, "percentage": 77.09, "elapsed_time": "5:50:17", "remaining_time": "1:44:05"}
450
+ {"current_steps": 425, "total_steps": 550, "loss": 0.3174, "lr": 1.1941004491747145e-05, "epoch": 3.8529411764705883, "percentage": 77.27, "elapsed_time": "5:51:05", "remaining_time": "1:43:15"}
451
+ {"current_steps": 426, "total_steps": 550, "loss": 0.3252, "lr": 1.1760641941953744e-05, "epoch": 3.8619909502262444, "percentage": 77.45, "elapsed_time": "5:51:54", "remaining_time": "1:42:26"}
452
+ {"current_steps": 427, "total_steps": 550, "loss": 0.3223, "lr": 1.1581416869385253e-05, "epoch": 3.8710407239819005, "percentage": 77.64, "elapsed_time": "5:52:43", "remaining_time": "1:41:36"}
453
+ {"current_steps": 428, "total_steps": 550, "loss": 0.3215, "lr": 1.1403336493201462e-05, "epoch": 3.8800904977375565, "percentage": 77.82, "elapsed_time": "5:53:31", "remaining_time": "1:40:46"}
454
+ {"current_steps": 429, "total_steps": 550, "loss": 0.3238, "lr": 1.1226407986453963e-05, "epoch": 3.8891402714932126, "percentage": 78.0, "elapsed_time": "5:54:20", "remaining_time": "1:39:56"}
455
+ {"current_steps": 430, "total_steps": 550, "loss": 0.3256, "lr": 1.1050638475797193e-05, "epoch": 3.8981900452488687, "percentage": 78.18, "elapsed_time": "5:55:08", "remaining_time": "1:39:06"}
456
+ {"current_steps": 431, "total_steps": 550, "loss": 0.3221, "lr": 1.0876035041201436e-05, "epoch": 3.9072398190045248, "percentage": 78.36, "elapsed_time": "5:55:57", "remaining_time": "1:38:16"}
457
+ {"current_steps": 432, "total_steps": 550, "loss": 0.3252, "lr": 1.070260471566757e-05, "epoch": 3.916289592760181, "percentage": 78.55, "elapsed_time": "5:56:45", "remaining_time": "1:37:26"}
458
+ {"current_steps": 433, "total_steps": 550, "loss": 0.3185, "lr": 1.0530354484943798e-05, "epoch": 3.9253393665158374, "percentage": 78.73, "elapsed_time": "5:57:33", "remaining_time": "1:36:36"}
459
+ {"current_steps": 434, "total_steps": 550, "loss": 0.3241, "lr": 1.0359291287244334e-05, "epoch": 3.9343891402714934, "percentage": 78.91, "elapsed_time": "5:58:22", "remaining_time": "1:35:47"}
460
+ {"current_steps": 435, "total_steps": 550, "loss": 0.3264, "lr": 1.0189422012969814e-05, "epoch": 3.9434389140271495, "percentage": 79.09, "elapsed_time": "5:59:10", "remaining_time": "1:34:57"}
461
+ {"current_steps": 436, "total_steps": 550, "loss": 0.3184, "lr": 1.0020753504429845e-05, "epoch": 3.9524886877828056, "percentage": 79.27, "elapsed_time": "5:59:59", "remaining_time": "1:34:07"}
462
+ {"current_steps": 437, "total_steps": 550, "loss": 0.3259, "lr": 9.85329255556735e-06, "epoch": 3.9615384615384617, "percentage": 79.45, "elapsed_time": "6:00:47", "remaining_time": "1:33:17"}
463
+ {"current_steps": 438, "total_steps": 550, "loss": 0.3239, "lr": 9.687045911684928e-06, "epoch": 3.9705882352941178, "percentage": 79.64, "elapsed_time": "6:01:36", "remaining_time": "1:32:27"}
464
+ {"current_steps": 439, "total_steps": 550, "loss": 0.323, "lr": 9.522020269173172e-06, "epoch": 3.979638009049774, "percentage": 79.82, "elapsed_time": "6:02:24", "remaining_time": "1:31:37"}
465
+ {"current_steps": 440, "total_steps": 550, "loss": 0.324, "lr": 9.358222275240884e-06, "epoch": 3.98868778280543, "percentage": 80.0, "elapsed_time": "6:03:12", "remaining_time": "1:30:48"}
466
+ {"current_steps": 441, "total_steps": 550, "loss": 0.3264, "lr": 9.195658527647371e-06, "epoch": 3.997737556561086, "percentage": 80.18, "elapsed_time": "6:04:00", "remaining_time": "1:29:58"}
467
+ {"current_steps": 442, "total_steps": 550, "loss": 0.3062, "lr": 9.034335574436701e-06, "epoch": 4.009049773755656, "percentage": 80.36, "elapsed_time": "6:06:45", "remaining_time": "1:29:36"}
468
+ {"current_steps": 443, "total_steps": 550, "loss": 0.3037, "lr": 8.8742599136739e-06, "epoch": 4.018099547511312, "percentage": 80.55, "elapsed_time": "6:07:33", "remaining_time": "1:28:46"}
469
+ {"current_steps": 444, "total_steps": 550, "loss": 0.3071, "lr": 8.715437993183235e-06, "epoch": 4.027149321266968, "percentage": 80.73, "elapsed_time": "6:08:21", "remaining_time": "1:27:56"}