sedrickkeh commited on
Commit
a242fe2
·
verified ·
1 Parent(s): 90ebe8f

Training in progress, step 700

Browse files
model-00001-of-00014.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:95ec6fa7b953a23a5d4bd1ade229cbf3714ce37c1a05b75ebefe4b9288e5af02
3
  size 4891730992
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:898e85c9cde394df0575ff15e3222e9cd63b04a2fc6c1348d769524781722de0
3
  size 4891730992
model-00002-of-00014.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:89797a595d668beed22ad8f1b7f86bee1491bc3a6b733e3f7111e252045d38e9
3
  size 4876059352
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:00a14a6dfdf5b1734948922cc5c7497b2c4c5f9d616725420d207a57985080e8
3
  size 4876059352
model-00003-of-00014.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:d4c70c5134cd97dc7a0406f0c50858bb9e2c6ad1ec68d062aa7eaade8a9a1402
3
  size 4876059384
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b60744a1fe92f196b5a3dbaf6ef8b535857820836a71f375237e5f233213fe8b
3
  size 4876059384
model-00004-of-00014.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:207a5914c70ec966a311382c0dddd0c5fdb2002491da32eb0b7584125dd73b60
3
  size 4876059416
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2dacdf2bf3cd714c5a50fc37b747d21b480231c6b232c0df519761c55cf3bd95
3
  size 4876059416
model-00005-of-00014.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:8a1069b0274e15592efc93acbac94f88ba32f5dd2da69a358af2d65021dd6aa8
3
  size 4876059416
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:dd8b044ac8140c21ccba5c765cec0b6ca07e17afeb700ec20de71d287b665d6f
3
  size 4876059416
model-00006-of-00014.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:d90336395d50d94da7fc4b2f8ce4d261e24f100bf931a75a4536fef439ea8714
3
  size 4876059416
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e6ae6646464aea0a3b00092d5ec2c6d93a7ecde1dbba4d9e64f59f52ca41c087
3
  size 4876059416
model-00007-of-00014.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:4771329b92953079a062f808e3528a4bec7174a3b0cc538077debc920ee7c763
3
  size 4876059416
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:fad20f2a0c4f10ed8fa0f54a684f592ef9296354e45577ada30c41badce20c0a
3
  size 4876059416
model-00008-of-00014.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:0a0b326aa6ae668b2e6cb5f8b51101de760d809e763518a72754df470a919f47
3
  size 4876059416
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:21d786c13694333e62311582ed2aca9fde5a22bbf4e32c739923da9a315f8081
3
  size 4876059416
model-00009-of-00014.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:91a484b2549b44a44ee7f50be69dc049e351ac58460eb9fb0d1169b164bd4311
3
  size 4876059416
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0e449dab4ff6da3820f9ff057fbb666b769ad47c35d927541ba0ecdc9cec7615
3
  size 4876059416
model-00010-of-00014.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:c81db6d30915dfa922393b455eefacd9216bfc969dbe668271ca2f36e4ae920c
3
  size 4876059416
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:65ca38646a49bb3ad27683e7091064c4b40644b74224b50be899fa6fb24b2fc1
3
  size 4876059416
model-00011-of-00014.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:a91c44995df7d05e554238e098c831826f4782211ba421b55e066f1461b1f3c5
3
  size 4876059416
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0caf7e37107503cbaa4e0fb6c9705bba8c62a6aec0f4099a664b4ed4e93a0d36
3
  size 4876059416
model-00012-of-00014.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:252f6f17ce2d2120cbd1dbf21ccc562a96181055f41bc9555f7fefa6bb041edc
3
  size 4876059416
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:39fd114eab418a5a3e66548a4496cb22dd2bf4c65a53a8b90ae98571afd39939
3
  size 4876059416
model-00013-of-00014.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:ce9574e31a33ab81fc8852fae98a30cec91ed46f5374abbd83ca76546c0cf646
3
  size 4876059416
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:03ae65f799804c19f80c8869c22a671b6d4427bdecc82a0ab736e52efb93cdb6
3
  size 4876059416
model-00014-of-00014.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:884446068710a62034131130cf266f69f153826c8a45d6b1633e797aef08bdfd
3
  size 2123397800
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:539e30e6e3d78b4a6faa7e3aea5e292c70912f79dcb9e38bf6d21fced055967c
3
  size 2123397800
trainer_log.jsonl CHANGED
@@ -601,3 +601,103 @@
601
  {"current_steps": 601, "total_steps": 1095, "loss": 0.3645, "lr": 5.0239206649955905e-06, "epoch": 1.6465753424657534, "percentage": 54.89, "elapsed_time": "19:04:36", "remaining_time": "15:40:49"}
602
  {"current_steps": 602, "total_steps": 1095, "loss": 0.3599, "lr": 5.007973582035569e-06, "epoch": 1.6493150684931508, "percentage": 54.98, "elapsed_time": "19:06:22", "remaining_time": "15:38:48"}
603
  {"current_steps": 603, "total_steps": 1095, "loss": 0.3637, "lr": 4.992026417964431e-06, "epoch": 1.652054794520548, "percentage": 55.07, "elapsed_time": "19:08:37", "remaining_time": "15:37:11"}
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
601
  {"current_steps": 601, "total_steps": 1095, "loss": 0.3645, "lr": 5.0239206649955905e-06, "epoch": 1.6465753424657534, "percentage": 54.89, "elapsed_time": "19:04:36", "remaining_time": "15:40:49"}
602
  {"current_steps": 602, "total_steps": 1095, "loss": 0.3599, "lr": 5.007973582035569e-06, "epoch": 1.6493150684931508, "percentage": 54.98, "elapsed_time": "19:06:22", "remaining_time": "15:38:48"}
603
  {"current_steps": 603, "total_steps": 1095, "loss": 0.3637, "lr": 4.992026417964431e-06, "epoch": 1.652054794520548, "percentage": 55.07, "elapsed_time": "19:08:37", "remaining_time": "15:37:11"}
604
+ {"current_steps": 604, "total_steps": 1095, "loss": 0.3701, "lr": 4.976079335004411e-06, "epoch": 1.654794520547945, "percentage": 55.16, "elapsed_time": "19:10:16", "remaining_time": "15:35:04"}
605
+ {"current_steps": 605, "total_steps": 1095, "loss": 0.3484, "lr": 4.960132495376919e-06, "epoch": 1.6575342465753424, "percentage": 55.25, "elapsed_time": "19:11:57", "remaining_time": "15:32:59"}
606
+ {"current_steps": 606, "total_steps": 1095, "loss": 0.3313, "lr": 4.944186061300884e-06, "epoch": 1.6602739726027398, "percentage": 55.34, "elapsed_time": "19:14:02", "remaining_time": "15:31:13"}
607
+ {"current_steps": 607, "total_steps": 1095, "loss": 0.3551, "lr": 4.928240194991119e-06, "epoch": 1.6630136986301371, "percentage": 55.43, "elapsed_time": "19:16:02", "remaining_time": "15:29:24"}
608
+ {"current_steps": 608, "total_steps": 1095, "loss": 0.3546, "lr": 4.912295058656654e-06, "epoch": 1.6657534246575343, "percentage": 55.53, "elapsed_time": "19:17:46", "remaining_time": "15:27:22"}
609
+ {"current_steps": 609, "total_steps": 1095, "loss": 0.3678, "lr": 4.8963508144991e-06, "epoch": 1.6684931506849314, "percentage": 55.62, "elapsed_time": "19:19:50", "remaining_time": "15:25:35"}
610
+ {"current_steps": 610, "total_steps": 1095, "loss": 0.3429, "lr": 4.880407624710986e-06, "epoch": 1.6712328767123288, "percentage": 55.71, "elapsed_time": "19:21:35", "remaining_time": "15:23:33"}
611
+ {"current_steps": 611, "total_steps": 1095, "loss": 0.354, "lr": 4.864465651474118e-06, "epoch": 1.6739726027397261, "percentage": 55.8, "elapsed_time": "19:23:42", "remaining_time": "15:21:49"}
612
+ {"current_steps": 612, "total_steps": 1095, "loss": 0.3912, "lr": 4.848525056957927e-06, "epoch": 1.6767123287671233, "percentage": 55.89, "elapsed_time": "19:25:27", "remaining_time": "15:19:47"}
613
+ {"current_steps": 613, "total_steps": 1095, "loss": 0.348, "lr": 4.832586003317818e-06, "epoch": 1.6794520547945204, "percentage": 55.98, "elapsed_time": "19:27:09", "remaining_time": "15:17:43"}
614
+ {"current_steps": 614, "total_steps": 1095, "loss": 0.3511, "lr": 4.816648652693522e-06, "epoch": 1.6821917808219178, "percentage": 56.07, "elapsed_time": "19:29:08", "remaining_time": "15:15:53"}
615
+ {"current_steps": 615, "total_steps": 1095, "loss": 0.3766, "lr": 4.800713167207449e-06, "epoch": 1.6849315068493151, "percentage": 56.16, "elapsed_time": "19:31:23", "remaining_time": "15:14:15"}
616
+ {"current_steps": 616, "total_steps": 1095, "loss": 0.3499, "lr": 4.784779708963029e-06, "epoch": 1.6876712328767123, "percentage": 56.26, "elapsed_time": "19:33:23", "remaining_time": "15:12:25"}
617
+ {"current_steps": 617, "total_steps": 1095, "loss": 0.3947, "lr": 4.768848440043076e-06, "epoch": 1.6904109589041096, "percentage": 56.35, "elapsed_time": "19:35:36", "remaining_time": "15:10:45"}
618
+ {"current_steps": 618, "total_steps": 1095, "loss": 0.3704, "lr": 4.752919522508133e-06, "epoch": 1.6931506849315068, "percentage": 56.44, "elapsed_time": "19:37:24", "remaining_time": "15:08:46"}
619
+ {"current_steps": 619, "total_steps": 1095, "loss": 0.3608, "lr": 4.736993118394817e-06, "epoch": 1.6958904109589041, "percentage": 56.53, "elapsed_time": "19:39:13", "remaining_time": "15:06:48"}
620
+ {"current_steps": 620, "total_steps": 1095, "loss": 0.3567, "lr": 4.721069389714188e-06, "epoch": 1.6986301369863015, "percentage": 56.62, "elapsed_time": "19:41:04", "remaining_time": "15:04:51"}
621
+ {"current_steps": 621, "total_steps": 1095, "loss": 0.3648, "lr": 4.70514849845008e-06, "epoch": 1.7013698630136986, "percentage": 56.71, "elapsed_time": "19:43:03", "remaining_time": "15:03:00"}
622
+ {"current_steps": 622, "total_steps": 1095, "loss": 0.3702, "lr": 4.689230606557468e-06, "epoch": 1.7041095890410958, "percentage": 56.8, "elapsed_time": "19:45:02", "remaining_time": "15:01:10"}
623
+ {"current_steps": 623, "total_steps": 1095, "loss": 0.3505, "lr": 4.6733158759608165e-06, "epoch": 1.7068493150684931, "percentage": 56.89, "elapsed_time": "19:46:37", "remaining_time": "14:59:01"}
624
+ {"current_steps": 624, "total_steps": 1095, "loss": 0.3666, "lr": 4.657404468552431e-06, "epoch": 1.7095890410958905, "percentage": 56.99, "elapsed_time": "19:48:40", "remaining_time": "14:57:12"}
625
+ {"current_steps": 625, "total_steps": 1095, "loss": 0.3662, "lr": 4.641496546190813e-06, "epoch": 1.7123287671232876, "percentage": 57.08, "elapsed_time": "19:50:50", "remaining_time": "14:55:30"}
626
+ {"current_steps": 626, "total_steps": 1095, "loss": 0.3555, "lr": 4.625592270699008e-06, "epoch": 1.7150684931506848, "percentage": 57.17, "elapsed_time": "19:52:43", "remaining_time": "14:53:35"}
627
+ {"current_steps": 627, "total_steps": 1095, "loss": 0.3507, "lr": 4.609691803862969e-06, "epoch": 1.7178082191780821, "percentage": 57.26, "elapsed_time": "19:54:32", "remaining_time": "14:51:36"}
628
+ {"current_steps": 628, "total_steps": 1095, "loss": 0.3644, "lr": 4.593795307429904e-06, "epoch": 1.7205479452054795, "percentage": 57.35, "elapsed_time": "19:57:01", "remaining_time": "14:50:08"}
629
+ {"current_steps": 629, "total_steps": 1095, "loss": 0.3812, "lr": 4.577902943106632e-06, "epoch": 1.7232876712328768, "percentage": 57.44, "elapsed_time": "19:59:08", "remaining_time": "14:48:23"}
630
+ {"current_steps": 630, "total_steps": 1095, "loss": 0.3563, "lr": 4.562014872557936e-06, "epoch": 1.726027397260274, "percentage": 57.53, "elapsed_time": "20:01:21", "remaining_time": "14:46:43"}
631
+ {"current_steps": 631, "total_steps": 1095, "loss": 0.3663, "lr": 4.546131257404923e-06, "epoch": 1.7287671232876711, "percentage": 57.63, "elapsed_time": "20:03:07", "remaining_time": "14:44:42"}
632
+ {"current_steps": 632, "total_steps": 1095, "loss": 0.3387, "lr": 4.530252259223379e-06, "epoch": 1.7315068493150685, "percentage": 57.72, "elapsed_time": "20:04:42", "remaining_time": "14:42:33"}
633
+ {"current_steps": 633, "total_steps": 1095, "loss": 0.3413, "lr": 4.514378039542118e-06, "epoch": 1.7342465753424658, "percentage": 57.81, "elapsed_time": "20:06:40", "remaining_time": "14:40:42"}
634
+ {"current_steps": 634, "total_steps": 1095, "loss": 0.3785, "lr": 4.498508759841354e-06, "epoch": 1.736986301369863, "percentage": 57.9, "elapsed_time": "20:08:36", "remaining_time": "14:38:49"}
635
+ {"current_steps": 635, "total_steps": 1095, "loss": 0.3627, "lr": 4.48264458155104e-06, "epoch": 1.7397260273972601, "percentage": 57.99, "elapsed_time": "20:10:53", "remaining_time": "14:37:10"}
636
+ {"current_steps": 636, "total_steps": 1095, "loss": 0.3705, "lr": 4.46678566604924e-06, "epoch": 1.7424657534246575, "percentage": 58.08, "elapsed_time": "20:12:59", "remaining_time": "14:35:24"}
637
+ {"current_steps": 637, "total_steps": 1095, "loss": 0.3618, "lr": 4.450932174660484e-06, "epoch": 1.7452054794520548, "percentage": 58.17, "elapsed_time": "20:15:06", "remaining_time": "14:33:39"}
638
+ {"current_steps": 638, "total_steps": 1095, "loss": 0.3602, "lr": 4.435084268654117e-06, "epoch": 1.7479452054794522, "percentage": 58.26, "elapsed_time": "20:16:42", "remaining_time": "14:31:31"}
639
+ {"current_steps": 639, "total_steps": 1095, "loss": 0.401, "lr": 4.419242109242679e-06, "epoch": 1.7506849315068493, "percentage": 58.36, "elapsed_time": "20:18:46", "remaining_time": "14:29:44"}
640
+ {"current_steps": 640, "total_steps": 1095, "loss": 0.366, "lr": 4.403405857580243e-06, "epoch": 1.7534246575342465, "percentage": 58.45, "elapsed_time": "20:20:47", "remaining_time": "14:27:54"}
641
+ {"current_steps": 641, "total_steps": 1095, "loss": 0.3666, "lr": 4.387575674760787e-06, "epoch": 1.7561643835616438, "percentage": 58.54, "elapsed_time": "20:22:32", "remaining_time": "14:25:53"}
642
+ {"current_steps": 642, "total_steps": 1095, "loss": 0.3589, "lr": 4.371751721816559e-06, "epoch": 1.7589041095890412, "percentage": 58.63, "elapsed_time": "20:24:30", "remaining_time": "14:24:01"}
643
+ {"current_steps": 643, "total_steps": 1095, "loss": 0.3654, "lr": 4.355934159716427e-06, "epoch": 1.7616438356164383, "percentage": 58.72, "elapsed_time": "20:26:21", "remaining_time": "14:22:04"}
644
+ {"current_steps": 644, "total_steps": 1095, "loss": 0.3422, "lr": 4.340123149364257e-06, "epoch": 1.7643835616438355, "percentage": 58.81, "elapsed_time": "20:28:16", "remaining_time": "14:20:10"}
645
+ {"current_steps": 645, "total_steps": 1095, "loss": 0.3726, "lr": 4.3243188515972575e-06, "epoch": 1.7671232876712328, "percentage": 58.9, "elapsed_time": "20:30:15", "remaining_time": "14:18:19"}
646
+ {"current_steps": 646, "total_steps": 1095, "loss": 0.3426, "lr": 4.308521427184359e-06, "epoch": 1.7698630136986302, "percentage": 59.0, "elapsed_time": "20:32:07", "remaining_time": "14:16:22"}
647
+ {"current_steps": 647, "total_steps": 1095, "loss": 0.3572, "lr": 4.292731036824574e-06, "epoch": 1.7726027397260276, "percentage": 59.09, "elapsed_time": "20:33:58", "remaining_time": "14:14:25"}
648
+ {"current_steps": 648, "total_steps": 1095, "loss": 0.3336, "lr": 4.276947841145355e-06, "epoch": 1.7753424657534247, "percentage": 59.18, "elapsed_time": "20:36:03", "remaining_time": "14:12:39"}
649
+ {"current_steps": 649, "total_steps": 1095, "loss": 0.3409, "lr": 4.261172000700972e-06, "epoch": 1.7780821917808218, "percentage": 59.27, "elapsed_time": "20:37:56", "remaining_time": "14:10:43"}
650
+ {"current_steps": 650, "total_steps": 1095, "loss": 0.3593, "lr": 4.245403675970877e-06, "epoch": 1.7808219178082192, "percentage": 59.36, "elapsed_time": "20:39:23", "remaining_time": "14:08:30"}
651
+ {"current_steps": 651, "total_steps": 1095, "loss": 0.3564, "lr": 4.229643027358058e-06, "epoch": 1.7835616438356166, "percentage": 59.45, "elapsed_time": "20:41:17", "remaining_time": "14:06:35"}
652
+ {"current_steps": 652, "total_steps": 1095, "loss": 0.3657, "lr": 4.213890215187432e-06, "epoch": 1.7863013698630137, "percentage": 59.54, "elapsed_time": "20:43:25", "remaining_time": "14:04:50"}
653
+ {"current_steps": 653, "total_steps": 1095, "loss": 0.3659, "lr": 4.198145399704185e-06, "epoch": 1.7890410958904108, "percentage": 59.63, "elapsed_time": "20:45:18", "remaining_time": "14:02:55"}
654
+ {"current_steps": 654, "total_steps": 1095, "loss": 0.3495, "lr": 4.182408741072166e-06, "epoch": 1.7917808219178082, "percentage": 59.73, "elapsed_time": "20:46:46", "remaining_time": "14:00:42"}
655
+ {"current_steps": 655, "total_steps": 1095, "loss": 0.3387, "lr": 4.166680399372248e-06, "epoch": 1.7945205479452055, "percentage": 59.82, "elapsed_time": "20:48:48", "remaining_time": "13:58:53"}
656
+ {"current_steps": 656, "total_steps": 1095, "loss": 0.3603, "lr": 4.1509605346007e-06, "epoch": 1.7972602739726027, "percentage": 59.91, "elapsed_time": "20:50:33", "remaining_time": "13:56:53"}
657
+ {"current_steps": 657, "total_steps": 1095, "loss": 0.3855, "lr": 4.135249306667553e-06, "epoch": 1.8, "percentage": 60.0, "elapsed_time": "20:52:40", "remaining_time": "13:55:06"}
658
+ {"current_steps": 658, "total_steps": 1095, "loss": 0.3639, "lr": 4.11954687539499e-06, "epoch": 1.8027397260273972, "percentage": 60.09, "elapsed_time": "20:54:04", "remaining_time": "13:52:52"}
659
+ {"current_steps": 659, "total_steps": 1095, "loss": 0.3755, "lr": 4.1038534005157035e-06, "epoch": 1.8054794520547945, "percentage": 60.18, "elapsed_time": "20:56:14", "remaining_time": "13:51:08"}
660
+ {"current_steps": 660, "total_steps": 1095, "loss": 0.362, "lr": 4.08816904167128e-06, "epoch": 1.808219178082192, "percentage": 60.27, "elapsed_time": "20:58:02", "remaining_time": "13:49:09"}
661
+ {"current_steps": 661, "total_steps": 1095, "loss": 0.3573, "lr": 4.0724939584105745e-06, "epoch": 1.810958904109589, "percentage": 60.37, "elapsed_time": "20:59:39", "remaining_time": "13:47:04"}
662
+ {"current_steps": 662, "total_steps": 1095, "loss": 0.387, "lr": 4.056828310188079e-06, "epoch": 1.8136986301369862, "percentage": 60.46, "elapsed_time": "21:01:54", "remaining_time": "13:45:22"}
663
+ {"current_steps": 663, "total_steps": 1095, "loss": 0.3388, "lr": 4.041172256362317e-06, "epoch": 1.8164383561643835, "percentage": 60.55, "elapsed_time": "21:03:48", "remaining_time": "13:43:28"}
664
+ {"current_steps": 664, "total_steps": 1095, "loss": 0.3801, "lr": 4.025525956194208e-06, "epoch": 1.819178082191781, "percentage": 60.64, "elapsed_time": "21:05:47", "remaining_time": "13:41:37"}
665
+ {"current_steps": 665, "total_steps": 1095, "loss": 0.3728, "lr": 4.009889568845453e-06, "epoch": 1.821917808219178, "percentage": 60.73, "elapsed_time": "21:07:34", "remaining_time": "13:39:38"}
666
+ {"current_steps": 666, "total_steps": 1095, "loss": 0.3596, "lr": 3.994263253376919e-06, "epoch": 1.8246575342465754, "percentage": 60.82, "elapsed_time": "21:09:32", "remaining_time": "13:37:45"}
667
+ {"current_steps": 667, "total_steps": 1095, "loss": 0.366, "lr": 3.978647168747009e-06, "epoch": 1.8273972602739725, "percentage": 60.91, "elapsed_time": "21:11:18", "remaining_time": "13:35:46"}
668
+ {"current_steps": 668, "total_steps": 1095, "loss": 0.3604, "lr": 3.96304147381006e-06, "epoch": 1.83013698630137, "percentage": 61.0, "elapsed_time": "21:13:17", "remaining_time": "13:33:54"}
669
+ {"current_steps": 669, "total_steps": 1095, "loss": 0.3771, "lr": 3.947446327314719e-06, "epoch": 1.8328767123287673, "percentage": 61.1, "elapsed_time": "21:15:01", "remaining_time": "13:31:54"}
670
+ {"current_steps": 670, "total_steps": 1095, "loss": 0.3664, "lr": 3.9318618879023255e-06, "epoch": 1.8356164383561644, "percentage": 61.19, "elapsed_time": "21:16:45", "remaining_time": "13:29:53"}
671
+ {"current_steps": 671, "total_steps": 1095, "loss": 0.3688, "lr": 3.916288314105307e-06, "epoch": 1.8383561643835615, "percentage": 61.28, "elapsed_time": "21:18:31", "remaining_time": "13:27:53"}
672
+ {"current_steps": 672, "total_steps": 1095, "loss": 0.3775, "lr": 3.900725764345557e-06, "epoch": 1.841095890410959, "percentage": 61.37, "elapsed_time": "21:20:19", "remaining_time": "13:25:55"}
673
+ {"current_steps": 673, "total_steps": 1095, "loss": 0.3623, "lr": 3.885174396932823e-06, "epoch": 1.8438356164383563, "percentage": 61.46, "elapsed_time": "21:21:54", "remaining_time": "13:23:48"}
674
+ {"current_steps": 674, "total_steps": 1095, "loss": 0.3575, "lr": 3.869634370063111e-06, "epoch": 1.8465753424657534, "percentage": 61.55, "elapsed_time": "21:23:50", "remaining_time": "13:21:55"}
675
+ {"current_steps": 675, "total_steps": 1095, "loss": 0.3667, "lr": 3.854105841817056e-06, "epoch": 1.8493150684931505, "percentage": 61.64, "elapsed_time": "21:25:41", "remaining_time": "13:19:59"}
676
+ {"current_steps": 676, "total_steps": 1095, "loss": 0.365, "lr": 3.83858897015833e-06, "epoch": 1.8520547945205479, "percentage": 61.74, "elapsed_time": "21:27:30", "remaining_time": "13:18:01"}
677
+ {"current_steps": 677, "total_steps": 1095, "loss": 0.3704, "lr": 3.823083912932023e-06, "epoch": 1.8547945205479452, "percentage": 61.83, "elapsed_time": "21:29:36", "remaining_time": "13:16:14"}
678
+ {"current_steps": 678, "total_steps": 1095, "loss": 0.3614, "lr": 3.8075908278630453e-06, "epoch": 1.8575342465753426, "percentage": 61.92, "elapsed_time": "21:31:21", "remaining_time": "13:14:14"}
679
+ {"current_steps": 679, "total_steps": 1095, "loss": 0.3473, "lr": 3.7921098725545236e-06, "epoch": 1.8602739726027397, "percentage": 62.01, "elapsed_time": "21:32:56", "remaining_time": "13:12:08"}
680
+ {"current_steps": 680, "total_steps": 1095, "loss": 0.3734, "lr": 3.776641204486191e-06, "epoch": 1.8630136986301369, "percentage": 62.1, "elapsed_time": "21:35:05", "remaining_time": "13:10:23"}
681
+ {"current_steps": 681, "total_steps": 1095, "loss": 0.347, "lr": 3.761184981012788e-06, "epoch": 1.8657534246575342, "percentage": 62.19, "elapsed_time": "21:36:51", "remaining_time": "13:08:24"}
682
+ {"current_steps": 682, "total_steps": 1095, "loss": 0.3717, "lr": 3.7457413593624668e-06, "epoch": 1.8684931506849316, "percentage": 62.28, "elapsed_time": "21:38:48", "remaining_time": "13:06:31"}
683
+ {"current_steps": 683, "total_steps": 1095, "loss": 0.3534, "lr": 3.7303104966351863e-06, "epoch": 1.8712328767123287, "percentage": 62.37, "elapsed_time": "21:40:39", "remaining_time": "13:04:35"}
684
+ {"current_steps": 684, "total_steps": 1095, "loss": 0.351, "lr": 3.71489254980111e-06, "epoch": 1.8739726027397259, "percentage": 62.47, "elapsed_time": "21:42:20", "remaining_time": "13:02:32"}
685
+ {"current_steps": 685, "total_steps": 1095, "loss": 0.389, "lr": 3.699487675699027e-06, "epoch": 1.8767123287671232, "percentage": 62.56, "elapsed_time": "21:44:04", "remaining_time": "13:00:32"}
686
+ {"current_steps": 686, "total_steps": 1095, "loss": 0.3692, "lr": 3.68409603103473e-06, "epoch": 1.8794520547945206, "percentage": 62.65, "elapsed_time": "21:46:00", "remaining_time": "12:58:39"}
687
+ {"current_steps": 687, "total_steps": 1095, "loss": 0.3552, "lr": 3.668717772379447e-06, "epoch": 1.882191780821918, "percentage": 62.74, "elapsed_time": "21:47:51", "remaining_time": "12:56:43"}
688
+ {"current_steps": 688, "total_steps": 1095, "loss": 0.3519, "lr": 3.6533530561682318e-06, "epoch": 1.884931506849315, "percentage": 62.83, "elapsed_time": "21:49:55", "remaining_time": "12:54:54"}
689
+ {"current_steps": 689, "total_steps": 1095, "loss": 0.3579, "lr": 3.6380020386983737e-06, "epoch": 1.8876712328767122, "percentage": 62.92, "elapsed_time": "21:51:42", "remaining_time": "12:52:56"}
690
+ {"current_steps": 690, "total_steps": 1095, "loss": 0.3614, "lr": 3.6226648761278238e-06, "epoch": 1.8904109589041096, "percentage": 63.01, "elapsed_time": "21:53:21", "remaining_time": "12:50:52"}
691
+ {"current_steps": 691, "total_steps": 1095, "loss": 0.3783, "lr": 3.6073417244735832e-06, "epoch": 1.893150684931507, "percentage": 63.11, "elapsed_time": "21:55:21", "remaining_time": "12:49:02"}
692
+ {"current_steps": 692, "total_steps": 1095, "loss": 0.3484, "lr": 3.59203273961013e-06, "epoch": 1.895890410958904, "percentage": 63.2, "elapsed_time": "21:57:08", "remaining_time": "12:47:03"}
693
+ {"current_steps": 693, "total_steps": 1095, "loss": 0.3863, "lr": 3.5767380772678373e-06, "epoch": 1.8986301369863012, "percentage": 63.29, "elapsed_time": "21:58:46", "remaining_time": "12:45:00"}
694
+ {"current_steps": 694, "total_steps": 1095, "loss": 0.374, "lr": 3.5614578930313705e-06, "epoch": 1.9013698630136986, "percentage": 63.38, "elapsed_time": "22:00:44", "remaining_time": "12:43:08"}
695
+ {"current_steps": 695, "total_steps": 1095, "loss": 0.3807, "lr": 3.5461923423381313e-06, "epoch": 1.904109589041096, "percentage": 63.47, "elapsed_time": "22:02:40", "remaining_time": "12:41:14"}
696
+ {"current_steps": 696, "total_steps": 1095, "loss": 0.3502, "lr": 3.5309415804766487e-06, "epoch": 1.9068493150684933, "percentage": 63.56, "elapsed_time": "22:04:28", "remaining_time": "12:39:17"}
697
+ {"current_steps": 697, "total_steps": 1095, "loss": 0.339, "lr": 3.515705762585021e-06, "epoch": 1.9095890410958904, "percentage": 63.65, "elapsed_time": "22:05:57", "remaining_time": "12:37:09"}
698
+ {"current_steps": 698, "total_steps": 1095, "loss": 0.3502, "lr": 3.5004850436493264e-06, "epoch": 1.9123287671232876, "percentage": 63.74, "elapsed_time": "22:07:42", "remaining_time": "12:35:09"}
699
+ {"current_steps": 699, "total_steps": 1095, "loss": 0.3599, "lr": 3.485279578502049e-06, "epoch": 1.915068493150685, "percentage": 63.84, "elapsed_time": "22:09:43", "remaining_time": "12:33:19"}
700
+ {"current_steps": 700, "total_steps": 1095, "loss": 0.3455, "lr": 3.4700895218205026e-06, "epoch": 1.9178082191780823, "percentage": 63.93, "elapsed_time": "22:11:30", "remaining_time": "12:31:21"}
701
+ {"current_steps": 701, "total_steps": 1095, "loss": 0.379, "lr": 3.4549150281252635e-06, "epoch": 1.9205479452054794, "percentage": 64.02, "elapsed_time": "22:17:57", "remaining_time": "12:32:00"}
702
+ {"current_steps": 702, "total_steps": 1095, "loss": 0.3508, "lr": 3.4397562517785883e-06, "epoch": 1.9232876712328766, "percentage": 64.11, "elapsed_time": "22:19:29", "remaining_time": "12:29:53"}
703
+ {"current_steps": 703, "total_steps": 1095, "loss": 0.3782, "lr": 3.424613346982855e-06, "epoch": 1.926027397260274, "percentage": 64.2, "elapsed_time": "22:21:22", "remaining_time": "12:27:57"}