Training in progress, epoch 2
Browse files
model-00001-of-00004.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 4877660776
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:32bbd419a0e4a843f7a77685908c3b0d4d82e72ad468e166ce1324fd84063a40
|
| 3 |
size 4877660776
|
model-00002-of-00004.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 4932751008
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:85228fe7970692b7475b7428f1fa44787b27f940ef2329854ee3c94139faa1e7
|
| 3 |
size 4932751008
|
model-00003-of-00004.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 4330865200
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:44226c965d155c742781f1fddfedd47a58622428a760859245bc13a065d481c0
|
| 3 |
size 4330865200
|
model-00004-of-00004.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 1089994880
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:2ee00e4c5ab64b45b2f92ea09f2f54e012e5f3eecb53816dbb27e64b52738f7b
|
| 3 |
size 1089994880
|
trainer_log.jsonl
CHANGED
|
@@ -480,3 +480,243 @@
|
|
| 480 |
{"current_steps": 480, "total_steps": 1195, "loss": 0.4055, "lr": 2.9915518954747038e-05, "epoch": 2.003129890453834, "percentage": 40.17, "elapsed_time": "5:15:50", "remaining_time": "7:50:27"}
|
| 481 |
{"current_steps": 481, "total_steps": 1195, "loss": 0.3777, "lr": 2.9864717288122986e-05, "epoch": 2.007303077725613, "percentage": 40.25, "elapsed_time": "5:16:26", "remaining_time": "7:49:43"}
|
| 482 |
{"current_steps": 482, "total_steps": 1195, "loss": 0.3875, "lr": 2.9813831372034035e-05, "epoch": 2.0114762649973916, "percentage": 40.33, "elapsed_time": "5:17:07", "remaining_time": "7:49:06"}
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 480 |
{"current_steps": 480, "total_steps": 1195, "loss": 0.4055, "lr": 2.9915518954747038e-05, "epoch": 2.003129890453834, "percentage": 40.17, "elapsed_time": "5:15:50", "remaining_time": "7:50:27"}
|
| 481 |
{"current_steps": 481, "total_steps": 1195, "loss": 0.3777, "lr": 2.9864717288122986e-05, "epoch": 2.007303077725613, "percentage": 40.25, "elapsed_time": "5:16:26", "remaining_time": "7:49:43"}
|
| 482 |
{"current_steps": 482, "total_steps": 1195, "loss": 0.3875, "lr": 2.9813831372034035e-05, "epoch": 2.0114762649973916, "percentage": 40.33, "elapsed_time": "5:17:07", "remaining_time": "7:49:06"}
|
| 483 |
+
{"current_steps": 483, "total_steps": 1195, "loss": 0.3846, "lr": 2.976286164107057e-05, "epoch": 2.0156494522691704, "percentage": 40.42, "elapsed_time": "5:17:51", "remaining_time": "7:48:33"}
|
| 484 |
+
{"current_steps": 484, "total_steps": 1195, "loss": 0.3661, "lr": 2.9711808530538776e-05, "epoch": 2.0198226395409495, "percentage": 40.5, "elapsed_time": "5:18:26", "remaining_time": "7:47:47"}
|
| 485 |
+
{"current_steps": 485, "total_steps": 1195, "loss": 0.3692, "lr": 2.966067247645696e-05, "epoch": 2.0239958268127283, "percentage": 40.59, "elapsed_time": "5:19:00", "remaining_time": "7:47:00"}
|
| 486 |
+
{"current_steps": 486, "total_steps": 1195, "loss": 0.3756, "lr": 2.9609453915551793e-05, "epoch": 2.028169014084507, "percentage": 40.67, "elapsed_time": "5:19:43", "remaining_time": "7:46:25"}
|
| 487 |
+
{"current_steps": 487, "total_steps": 1195, "loss": 0.3662, "lr": 2.9558153285254607e-05, "epoch": 2.0323422013562857, "percentage": 40.75, "elapsed_time": "5:20:24", "remaining_time": "7:45:48"}
|
| 488 |
+
{"current_steps": 488, "total_steps": 1195, "loss": 0.3626, "lr": 2.9506771023697628e-05, "epoch": 2.0365153886280645, "percentage": 40.84, "elapsed_time": "5:21:03", "remaining_time": "7:45:08"}
|
| 489 |
+
{"current_steps": 489, "total_steps": 1195, "loss": 0.3631, "lr": 2.9455307569710272e-05, "epoch": 2.0406885758998436, "percentage": 40.92, "elapsed_time": "5:21:38", "remaining_time": "7:44:22"}
|
| 490 |
+
{"current_steps": 490, "total_steps": 1195, "loss": 0.3486, "lr": 2.940376336281537e-05, "epoch": 2.0448617631716224, "percentage": 41.0, "elapsed_time": "5:22:21", "remaining_time": "7:43:48"}
|
| 491 |
+
{"current_steps": 491, "total_steps": 1195, "loss": 0.3528, "lr": 2.9352138843225413e-05, "epoch": 2.049034950443401, "percentage": 41.09, "elapsed_time": "5:22:58", "remaining_time": "7:43:05"}
|
| 492 |
+
{"current_steps": 492, "total_steps": 1195, "loss": 0.3759, "lr": 2.9300434451838814e-05, "epoch": 2.05320813771518, "percentage": 41.17, "elapsed_time": "5:23:38", "remaining_time": "7:42:25"}
|
| 493 |
+
{"current_steps": 493, "total_steps": 1195, "loss": 0.3719, "lr": 2.9248650630236125e-05, "epoch": 2.0573813249869586, "percentage": 41.26, "elapsed_time": "5:24:19", "remaining_time": "7:41:49"}
|
| 494 |
+
{"current_steps": 494, "total_steps": 1195, "loss": 0.3635, "lr": 2.9196787820676273e-05, "epoch": 2.0615545122587378, "percentage": 41.34, "elapsed_time": "5:24:59", "remaining_time": "7:41:11"}
|
| 495 |
+
{"current_steps": 495, "total_steps": 1195, "loss": 0.3664, "lr": 2.9144846466092773e-05, "epoch": 2.0657276995305165, "percentage": 41.42, "elapsed_time": "5:25:38", "remaining_time": "7:40:30"}
|
| 496 |
+
{"current_steps": 496, "total_steps": 1195, "loss": 0.3504, "lr": 2.9092827010089966e-05, "epoch": 2.0699008868022952, "percentage": 41.51, "elapsed_time": "5:26:22", "remaining_time": "7:39:57"}
|
| 497 |
+
{"current_steps": 497, "total_steps": 1195, "loss": 0.3831, "lr": 2.9040729896939194e-05, "epoch": 2.074074074074074, "percentage": 41.59, "elapsed_time": "5:27:01", "remaining_time": "7:39:17"}
|
| 498 |
+
{"current_steps": 498, "total_steps": 1195, "loss": 0.3564, "lr": 2.898855557157506e-05, "epoch": 2.0782472613458527, "percentage": 41.67, "elapsed_time": "5:27:43", "remaining_time": "7:38:41"}
|
| 499 |
+
{"current_steps": 499, "total_steps": 1195, "loss": 0.3699, "lr": 2.8936304479591566e-05, "epoch": 2.082420448617632, "percentage": 41.76, "elapsed_time": "5:28:21", "remaining_time": "7:37:59"}
|
| 500 |
+
{"current_steps": 500, "total_steps": 1195, "loss": 0.3619, "lr": 2.8883977067238363e-05, "epoch": 2.0865936358894106, "percentage": 41.84, "elapsed_time": "5:29:00", "remaining_time": "7:37:19"}
|
| 501 |
+
{"current_steps": 501, "total_steps": 1195, "loss": 0.3499, "lr": 2.8831573781416896e-05, "epoch": 2.0907668231611893, "percentage": 41.92, "elapsed_time": "5:29:36", "remaining_time": "7:36:35"}
|
| 502 |
+
{"current_steps": 502, "total_steps": 1195, "loss": 0.3781, "lr": 2.8779095069676622e-05, "epoch": 2.094940010432968, "percentage": 42.01, "elapsed_time": "5:30:12", "remaining_time": "7:35:50"}
|
| 503 |
+
{"current_steps": 503, "total_steps": 1195, "loss": 0.3577, "lr": 2.8726541380211154e-05, "epoch": 2.099113197704747, "percentage": 42.09, "elapsed_time": "5:30:52", "remaining_time": "7:35:12"}
|
| 504 |
+
{"current_steps": 504, "total_steps": 1195, "loss": 0.3412, "lr": 2.867391316185447e-05, "epoch": 2.103286384976526, "percentage": 42.18, "elapsed_time": "5:31:27", "remaining_time": "7:34:26"}
|
| 505 |
+
{"current_steps": 505, "total_steps": 1195, "loss": 0.3504, "lr": 2.8621210864077053e-05, "epoch": 2.1074595722483047, "percentage": 42.26, "elapsed_time": "5:32:09", "remaining_time": "7:33:50"}
|
| 506 |
+
{"current_steps": 506, "total_steps": 1195, "loss": 0.3482, "lr": 2.8568434936982048e-05, "epoch": 2.1116327595200834, "percentage": 42.34, "elapsed_time": "5:32:50", "remaining_time": "7:33:12"}
|
| 507 |
+
{"current_steps": 507, "total_steps": 1195, "loss": 0.3572, "lr": 2.8515585831301456e-05, "epoch": 2.115805946791862, "percentage": 42.43, "elapsed_time": "5:33:33", "remaining_time": "7:32:38"}
|
| 508 |
+
{"current_steps": 508, "total_steps": 1195, "loss": 0.3546, "lr": 2.8462663998392232e-05, "epoch": 2.119979134063641, "percentage": 42.51, "elapsed_time": "5:34:04", "remaining_time": "7:31:47"}
|
| 509 |
+
{"current_steps": 509, "total_steps": 1195, "loss": 0.3587, "lr": 2.840966989023248e-05, "epoch": 2.12415232133542, "percentage": 42.59, "elapsed_time": "5:34:45", "remaining_time": "7:31:10"}
|
| 510 |
+
{"current_steps": 510, "total_steps": 1195, "loss": 0.3809, "lr": 2.835660395941754e-05, "epoch": 2.128325508607199, "percentage": 42.68, "elapsed_time": "5:35:26", "remaining_time": "7:30:32"}
|
| 511 |
+
{"current_steps": 511, "total_steps": 1195, "loss": 0.3651, "lr": 2.830346665915619e-05, "epoch": 2.1324986958789776, "percentage": 42.76, "elapsed_time": "5:36:08", "remaining_time": "7:29:57"}
|
| 512 |
+
{"current_steps": 512, "total_steps": 1195, "loss": 0.3551, "lr": 2.8250258443266712e-05, "epoch": 2.1366718831507563, "percentage": 42.85, "elapsed_time": "5:36:46", "remaining_time": "7:29:15"}
|
| 513 |
+
{"current_steps": 513, "total_steps": 1195, "loss": 0.3522, "lr": 2.8196979766173034e-05, "epoch": 2.140845070422535, "percentage": 42.93, "elapsed_time": "5:37:29", "remaining_time": "7:28:39"}
|
| 514 |
+
{"current_steps": 514, "total_steps": 1195, "loss": 0.3717, "lr": 2.8143631082900894e-05, "epoch": 2.145018257694314, "percentage": 43.01, "elapsed_time": "5:38:00", "remaining_time": "7:27:49"}
|
| 515 |
+
{"current_steps": 515, "total_steps": 1195, "loss": 0.3369, "lr": 2.8090212849073877e-05, "epoch": 2.149191444966093, "percentage": 43.1, "elapsed_time": "5:38:38", "remaining_time": "7:27:07"}
|
| 516 |
+
{"current_steps": 516, "total_steps": 1195, "loss": 0.3725, "lr": 2.8036725520909586e-05, "epoch": 2.1533646322378717, "percentage": 43.18, "elapsed_time": "5:39:16", "remaining_time": "7:26:26"}
|
| 517 |
+
{"current_steps": 517, "total_steps": 1195, "loss": 0.3665, "lr": 2.7983169555215716e-05, "epoch": 2.1575378195096504, "percentage": 43.26, "elapsed_time": "5:40:04", "remaining_time": "7:25:58"}
|
| 518 |
+
{"current_steps": 518, "total_steps": 1195, "loss": 0.3509, "lr": 2.7929545409386162e-05, "epoch": 2.161711006781429, "percentage": 43.35, "elapsed_time": "5:40:42", "remaining_time": "7:25:16"}
|
| 519 |
+
{"current_steps": 519, "total_steps": 1195, "loss": 0.3727, "lr": 2.7875853541397107e-05, "epoch": 2.1658841940532083, "percentage": 43.43, "elapsed_time": "5:41:22", "remaining_time": "7:24:38"}
|
| 520 |
+
{"current_steps": 520, "total_steps": 1195, "loss": 0.3512, "lr": 2.782209440980312e-05, "epoch": 2.170057381324987, "percentage": 43.51, "elapsed_time": "5:42:02", "remaining_time": "7:23:59"}
|
| 521 |
+
{"current_steps": 521, "total_steps": 1195, "loss": 0.3463, "lr": 2.776826847373323e-05, "epoch": 2.174230568596766, "percentage": 43.6, "elapsed_time": "5:42:38", "remaining_time": "7:23:15"}
|
| 522 |
+
{"current_steps": 522, "total_steps": 1195, "loss": 0.3591, "lr": 2.7714376192887e-05, "epoch": 2.1784037558685445, "percentage": 43.68, "elapsed_time": "5:43:19", "remaining_time": "7:22:38"}
|
| 523 |
+
{"current_steps": 523, "total_steps": 1195, "loss": 0.3517, "lr": 2.7660418027530634e-05, "epoch": 2.1825769431403232, "percentage": 43.77, "elapsed_time": "5:43:53", "remaining_time": "7:21:51"}
|
| 524 |
+
{"current_steps": 524, "total_steps": 1195, "loss": 0.3743, "lr": 2.7606394438492986e-05, "epoch": 2.1867501304121024, "percentage": 43.85, "elapsed_time": "5:44:32", "remaining_time": "7:21:12"}
|
| 525 |
+
{"current_steps": 525, "total_steps": 1195, "loss": 0.3677, "lr": 2.7552305887161693e-05, "epoch": 2.190923317683881, "percentage": 43.93, "elapsed_time": "5:45:04", "remaining_time": "7:20:22"}
|
| 526 |
+
{"current_steps": 526, "total_steps": 1195, "loss": 0.3552, "lr": 2.7498152835479187e-05, "epoch": 2.19509650495566, "percentage": 44.02, "elapsed_time": "5:45:43", "remaining_time": "7:19:42"}
|
| 527 |
+
{"current_steps": 527, "total_steps": 1195, "loss": 0.3694, "lr": 2.7443935745938758e-05, "epoch": 2.1992696922274386, "percentage": 44.1, "elapsed_time": "5:46:17", "remaining_time": "7:18:56"}
|
| 528 |
+
{"current_steps": 528, "total_steps": 1195, "loss": 0.3511, "lr": 2.738965508158063e-05, "epoch": 2.2034428794992174, "percentage": 44.18, "elapsed_time": "5:46:51", "remaining_time": "7:18:10"}
|
| 529 |
+
{"current_steps": 529, "total_steps": 1195, "loss": 0.37, "lr": 2.733531130598796e-05, "epoch": 2.2076160667709965, "percentage": 44.27, "elapsed_time": "5:47:33", "remaining_time": "7:17:33"}
|
| 530 |
+
{"current_steps": 530, "total_steps": 1195, "loss": 0.3703, "lr": 2.728090488328293e-05, "epoch": 2.2117892540427753, "percentage": 44.35, "elapsed_time": "5:48:13", "remaining_time": "7:16:55"}
|
| 531 |
+
{"current_steps": 531, "total_steps": 1195, "loss": 0.3564, "lr": 2.722643627812275e-05, "epoch": 2.215962441314554, "percentage": 44.44, "elapsed_time": "5:48:53", "remaining_time": "7:16:16"}
|
| 532 |
+
{"current_steps": 532, "total_steps": 1195, "loss": 0.3498, "lr": 2.7171905955695694e-05, "epoch": 2.2201356285863327, "percentage": 44.52, "elapsed_time": "5:49:32", "remaining_time": "7:15:37"}
|
| 533 |
+
{"current_steps": 533, "total_steps": 1195, "loss": 0.3597, "lr": 2.711731438171713e-05, "epoch": 2.2243088158581115, "percentage": 44.6, "elapsed_time": "5:50:07", "remaining_time": "7:14:51"}
|
| 534 |
+
{"current_steps": 534, "total_steps": 1195, "loss": 0.3884, "lr": 2.7062662022425557e-05, "epoch": 2.2284820031298906, "percentage": 44.69, "elapsed_time": "5:50:45", "remaining_time": "7:14:10"}
|
| 535 |
+
{"current_steps": 535, "total_steps": 1195, "loss": 0.3715, "lr": 2.700794934457859e-05, "epoch": 2.2326551904016694, "percentage": 44.77, "elapsed_time": "5:51:21", "remaining_time": "7:13:26"}
|
| 536 |
+
{"current_steps": 536, "total_steps": 1195, "loss": 0.3776, "lr": 2.695317681544902e-05, "epoch": 2.236828377673448, "percentage": 44.85, "elapsed_time": "5:52:00", "remaining_time": "7:12:47"}
|
| 537 |
+
{"current_steps": 537, "total_steps": 1195, "loss": 0.3736, "lr": 2.6898344902820763e-05, "epoch": 2.241001564945227, "percentage": 44.94, "elapsed_time": "5:52:46", "remaining_time": "7:12:15"}
|
| 538 |
+
{"current_steps": 538, "total_steps": 1195, "loss": 0.3874, "lr": 2.6843454074984932e-05, "epoch": 2.2451747522170056, "percentage": 45.02, "elapsed_time": "5:53:26", "remaining_time": "7:11:37"}
|
| 539 |
+
{"current_steps": 539, "total_steps": 1195, "loss": 0.3701, "lr": 2.678850480073578e-05, "epoch": 2.2493479394887848, "percentage": 45.1, "elapsed_time": "5:54:08", "remaining_time": "7:11:01"}
|
| 540 |
+
{"current_steps": 540, "total_steps": 1195, "loss": 0.3605, "lr": 2.673349754936675e-05, "epoch": 2.2535211267605635, "percentage": 45.19, "elapsed_time": "5:54:46", "remaining_time": "7:10:19"}
|
| 541 |
+
{"current_steps": 541, "total_steps": 1195, "loss": 0.3594, "lr": 2.6678432790666397e-05, "epoch": 2.257694314032342, "percentage": 45.27, "elapsed_time": "5:55:23", "remaining_time": "7:09:36"}
|
| 542 |
+
{"current_steps": 542, "total_steps": 1195, "loss": 0.3568, "lr": 2.662331099491445e-05, "epoch": 2.261867501304121, "percentage": 45.36, "elapsed_time": "5:56:04", "remaining_time": "7:08:59"}
|
| 543 |
+
{"current_steps": 543, "total_steps": 1195, "loss": 0.3738, "lr": 2.6568132632877744e-05, "epoch": 2.2660406885758997, "percentage": 45.44, "elapsed_time": "5:56:44", "remaining_time": "7:08:21"}
|
| 544 |
+
{"current_steps": 544, "total_steps": 1195, "loss": 0.3656, "lr": 2.651289817580623e-05, "epoch": 2.270213875847679, "percentage": 45.52, "elapsed_time": "5:57:24", "remaining_time": "7:07:42"}
|
| 545 |
+
{"current_steps": 545, "total_steps": 1195, "loss": 0.3655, "lr": 2.6457608095428925e-05, "epoch": 2.2743870631194576, "percentage": 45.61, "elapsed_time": "5:58:03", "remaining_time": "7:07:03"}
|
| 546 |
+
{"current_steps": 546, "total_steps": 1195, "loss": 0.397, "lr": 2.640226286394991e-05, "epoch": 2.2785602503912363, "percentage": 45.69, "elapsed_time": "5:58:49", "remaining_time": "7:06:31"}
|
| 547 |
+
{"current_steps": 547, "total_steps": 1195, "loss": 0.3505, "lr": 2.6346862954044267e-05, "epoch": 2.282733437663015, "percentage": 45.77, "elapsed_time": "5:59:28", "remaining_time": "7:05:51"}
|
| 548 |
+
{"current_steps": 548, "total_steps": 1195, "loss": 0.3503, "lr": 2.6291408838854074e-05, "epoch": 2.286906624934794, "percentage": 45.86, "elapsed_time": "6:00:07", "remaining_time": "7:05:11"}
|
| 549 |
+
{"current_steps": 549, "total_steps": 1195, "loss": 0.3714, "lr": 2.6235900991984327e-05, "epoch": 2.291079812206573, "percentage": 45.94, "elapsed_time": "6:00:47", "remaining_time": "7:04:31"}
|
| 550 |
+
{"current_steps": 550, "total_steps": 1195, "loss": 0.3684, "lr": 2.618033988749895e-05, "epoch": 2.2952529994783517, "percentage": 46.03, "elapsed_time": "6:01:30", "remaining_time": "7:03:57"}
|
| 551 |
+
{"current_steps": 551, "total_steps": 1195, "loss": 0.3681, "lr": 2.6124725999916684e-05, "epoch": 2.2994261867501304, "percentage": 46.11, "elapsed_time": "6:02:08", "remaining_time": "7:03:15"}
|
| 552 |
+
{"current_steps": 552, "total_steps": 1195, "loss": 0.3607, "lr": 2.6069059804207072e-05, "epoch": 2.303599374021909, "percentage": 46.19, "elapsed_time": "6:02:47", "remaining_time": "7:02:35"}
|
| 553 |
+
{"current_steps": 553, "total_steps": 1195, "loss": 0.3961, "lr": 2.6013341775786396e-05, "epoch": 2.307772561293688, "percentage": 46.28, "elapsed_time": "6:03:26", "remaining_time": "7:01:56"}
|
| 554 |
+
{"current_steps": 554, "total_steps": 1195, "loss": 0.3553, "lr": 2.5957572390513617e-05, "epoch": 2.311945748565467, "percentage": 46.36, "elapsed_time": "6:04:01", "remaining_time": "7:01:12"}
|
| 555 |
+
{"current_steps": 555, "total_steps": 1195, "loss": 0.3487, "lr": 2.5901752124686294e-05, "epoch": 2.316118935837246, "percentage": 46.44, "elapsed_time": "6:04:40", "remaining_time": "7:00:31"}
|
| 556 |
+
{"current_steps": 556, "total_steps": 1195, "loss": 0.3648, "lr": 2.5845881455036552e-05, "epoch": 2.3202921231090246, "percentage": 46.53, "elapsed_time": "6:05:18", "remaining_time": "6:59:50"}
|
| 557 |
+
{"current_steps": 557, "total_steps": 1195, "loss": 0.3675, "lr": 2.5789960858726968e-05, "epoch": 2.3244653103808033, "percentage": 46.61, "elapsed_time": "6:05:56", "remaining_time": "6:59:09"}
|
| 558 |
+
{"current_steps": 558, "total_steps": 1195, "loss": 0.376, "lr": 2.5733990813346536e-05, "epoch": 2.328638497652582, "percentage": 46.69, "elapsed_time": "6:06:36", "remaining_time": "6:58:30"}
|
| 559 |
+
{"current_steps": 559, "total_steps": 1195, "loss": 0.3871, "lr": 2.5677971796906555e-05, "epoch": 2.332811684924361, "percentage": 46.78, "elapsed_time": "6:07:18", "remaining_time": "6:57:53"}
|
| 560 |
+
{"current_steps": 560, "total_steps": 1195, "loss": 0.3663, "lr": 2.5621904287836568e-05, "epoch": 2.33698487219614, "percentage": 46.86, "elapsed_time": "6:08:01", "remaining_time": "6:57:18"}
|
| 561 |
+
{"current_steps": 561, "total_steps": 1195, "loss": 0.3615, "lr": 2.5565788764980265e-05, "epoch": 2.3411580594679187, "percentage": 46.95, "elapsed_time": "6:08:41", "remaining_time": "6:56:39"}
|
| 562 |
+
{"current_steps": 562, "total_steps": 1195, "loss": 0.3658, "lr": 2.5509625707591394e-05, "epoch": 2.3453312467396974, "percentage": 47.03, "elapsed_time": "6:09:15", "remaining_time": "6:55:54"}
|
| 563 |
+
{"current_steps": 563, "total_steps": 1195, "loss": 0.3728, "lr": 2.5453415595329684e-05, "epoch": 2.349504434011476, "percentage": 47.11, "elapsed_time": "6:09:52", "remaining_time": "6:55:12"}
|
| 564 |
+
{"current_steps": 564, "total_steps": 1195, "loss": 0.3612, "lr": 2.539715890825672e-05, "epoch": 2.3536776212832553, "percentage": 47.2, "elapsed_time": "6:10:32", "remaining_time": "6:54:33"}
|
| 565 |
+
{"current_steps": 565, "total_steps": 1195, "loss": 0.3643, "lr": 2.5340856126831864e-05, "epoch": 2.357850808555034, "percentage": 47.28, "elapsed_time": "6:11:13", "remaining_time": "6:53:55"}
|
| 566 |
+
{"current_steps": 566, "total_steps": 1195, "loss": 0.3567, "lr": 2.528450773190814e-05, "epoch": 2.3620239958268128, "percentage": 47.36, "elapsed_time": "6:11:54", "remaining_time": "6:53:18"}
|
| 567 |
+
{"current_steps": 567, "total_steps": 1195, "loss": 0.3621, "lr": 2.5228114204728163e-05, "epoch": 2.3661971830985915, "percentage": 47.45, "elapsed_time": "6:12:33", "remaining_time": "6:52:38"}
|
| 568 |
+
{"current_steps": 568, "total_steps": 1195, "loss": 0.3713, "lr": 2.5171676026919953e-05, "epoch": 2.3703703703703702, "percentage": 47.53, "elapsed_time": "6:13:10", "remaining_time": "6:51:56"}
|
| 569 |
+
{"current_steps": 569, "total_steps": 1195, "loss": 0.3673, "lr": 2.5115193680492908e-05, "epoch": 2.3745435576421494, "percentage": 47.62, "elapsed_time": "6:13:49", "remaining_time": "6:51:16"}
|
| 570 |
+
{"current_steps": 570, "total_steps": 1195, "loss": 0.3452, "lr": 2.5058667647833615e-05, "epoch": 2.378716744913928, "percentage": 47.7, "elapsed_time": "6:14:30", "remaining_time": "6:50:38"}
|
| 571 |
+
{"current_steps": 571, "total_steps": 1195, "loss": 0.372, "lr": 2.5002098411701797e-05, "epoch": 2.382889932185707, "percentage": 47.78, "elapsed_time": "6:15:13", "remaining_time": "6:50:03"}
|
| 572 |
+
{"current_steps": 572, "total_steps": 1195, "loss": 0.363, "lr": 2.494548645522612e-05, "epoch": 2.3870631194574856, "percentage": 47.87, "elapsed_time": "6:16:06", "remaining_time": "6:49:38"}
|
| 573 |
+
{"current_steps": 573, "total_steps": 1195, "loss": 0.3545, "lr": 2.4888832261900136e-05, "epoch": 2.3912363067292643, "percentage": 47.95, "elapsed_time": "6:16:44", "remaining_time": "6:48:57"}
|
| 574 |
+
{"current_steps": 574, "total_steps": 1195, "loss": 0.3398, "lr": 2.4832136315578094e-05, "epoch": 2.3954094940010435, "percentage": 48.03, "elapsed_time": "6:17:19", "remaining_time": "6:48:13"}
|
| 575 |
+
{"current_steps": 575, "total_steps": 1195, "loss": 0.3722, "lr": 2.4775399100470837e-05, "epoch": 2.3995826812728223, "percentage": 48.12, "elapsed_time": "6:17:57", "remaining_time": "6:47:32"}
|
| 576 |
+
{"current_steps": 576, "total_steps": 1195, "loss": 0.3617, "lr": 2.471862110114169e-05, "epoch": 2.403755868544601, "percentage": 48.2, "elapsed_time": "6:18:34", "remaining_time": "6:46:50"}
|
| 577 |
+
{"current_steps": 577, "total_steps": 1195, "loss": 0.3577, "lr": 2.466180280250226e-05, "epoch": 2.4079290558163797, "percentage": 48.28, "elapsed_time": "6:19:13", "remaining_time": "6:46:10"}
|
| 578 |
+
{"current_steps": 578, "total_steps": 1195, "loss": 0.3712, "lr": 2.4604944689808344e-05, "epoch": 2.4121022430881585, "percentage": 48.37, "elapsed_time": "6:19:45", "remaining_time": "6:45:23"}
|
| 579 |
+
{"current_steps": 579, "total_steps": 1195, "loss": 0.3585, "lr": 2.4548047248655773e-05, "epoch": 2.4162754303599376, "percentage": 48.45, "elapsed_time": "6:20:21", "remaining_time": "6:44:40"}
|
| 580 |
+
{"current_steps": 580, "total_steps": 1195, "loss": 0.3696, "lr": 2.449111096497627e-05, "epoch": 2.4204486176317164, "percentage": 48.54, "elapsed_time": "6:21:03", "remaining_time": "6:44:03"}
|
| 581 |
+
{"current_steps": 581, "total_steps": 1195, "loss": 0.3674, "lr": 2.443413632503327e-05, "epoch": 2.424621804903495, "percentage": 48.62, "elapsed_time": "6:21:43", "remaining_time": "6:43:24"}
|
| 582 |
+
{"current_steps": 582, "total_steps": 1195, "loss": 0.3861, "lr": 2.4377123815417805e-05, "epoch": 2.428794992175274, "percentage": 48.7, "elapsed_time": "6:22:25", "remaining_time": "6:42:47"}
|
| 583 |
+
{"current_steps": 583, "total_steps": 1195, "loss": 0.3831, "lr": 2.4320073923044326e-05, "epoch": 2.4329681794470526, "percentage": 48.79, "elapsed_time": "6:23:05", "remaining_time": "6:42:08"}
|
| 584 |
+
{"current_steps": 584, "total_steps": 1195, "loss": 0.3711, "lr": 2.4262987135146555e-05, "epoch": 2.4371413667188317, "percentage": 48.87, "elapsed_time": "6:23:41", "remaining_time": "6:41:26"}
|
| 585 |
+
{"current_steps": 585, "total_steps": 1195, "loss": 0.3674, "lr": 2.4205863939273328e-05, "epoch": 2.4413145539906105, "percentage": 48.95, "elapsed_time": "6:24:18", "remaining_time": "6:40:43"}
|
| 586 |
+
{"current_steps": 586, "total_steps": 1195, "loss": 0.3594, "lr": 2.4148704823284395e-05, "epoch": 2.445487741262389, "percentage": 49.04, "elapsed_time": "6:24:58", "remaining_time": "6:40:05"}
|
| 587 |
+
{"current_steps": 587, "total_steps": 1195, "loss": 0.3766, "lr": 2.4091510275346317e-05, "epoch": 2.449660928534168, "percentage": 49.12, "elapsed_time": "6:25:39", "remaining_time": "6:39:27"}
|
| 588 |
+
{"current_steps": 588, "total_steps": 1195, "loss": 0.3567, "lr": 2.4034280783928227e-05, "epoch": 2.4538341158059467, "percentage": 49.21, "elapsed_time": "6:26:22", "remaining_time": "6:38:51"}
|
| 589 |
+
{"current_steps": 589, "total_steps": 1195, "loss": 0.3589, "lr": 2.3977016837797718e-05, "epoch": 2.458007303077726, "percentage": 49.29, "elapsed_time": "6:27:01", "remaining_time": "6:38:11"}
|
| 590 |
+
{"current_steps": 590, "total_steps": 1195, "loss": 0.3679, "lr": 2.391971892601663e-05, "epoch": 2.4621804903495046, "percentage": 49.37, "elapsed_time": "6:27:42", "remaining_time": "6:37:34"}
|
| 591 |
+
{"current_steps": 591, "total_steps": 1195, "loss": 0.3605, "lr": 2.3862387537936894e-05, "epoch": 2.4663536776212833, "percentage": 49.46, "elapsed_time": "6:28:20", "remaining_time": "6:36:52"}
|
| 592 |
+
{"current_steps": 592, "total_steps": 1195, "loss": 0.3657, "lr": 2.3805023163196326e-05, "epoch": 2.470526864893062, "percentage": 49.54, "elapsed_time": "6:28:56", "remaining_time": "6:36:10"}
|
| 593 |
+
{"current_steps": 593, "total_steps": 1195, "loss": 0.377, "lr": 2.37476262917145e-05, "epoch": 2.474700052164841, "percentage": 49.62, "elapsed_time": "6:29:37", "remaining_time": "6:35:32"}
|
| 594 |
+
{"current_steps": 594, "total_steps": 1195, "loss": 0.3769, "lr": 2.3690197413688483e-05, "epoch": 2.4788732394366195, "percentage": 49.71, "elapsed_time": "6:30:12", "remaining_time": "6:34:48"}
|
| 595 |
+
{"current_steps": 595, "total_steps": 1195, "loss": 0.3656, "lr": 2.363273701958873e-05, "epoch": 2.4830464267083987, "percentage": 49.79, "elapsed_time": "6:30:51", "remaining_time": "6:34:08"}
|
| 596 |
+
{"current_steps": 596, "total_steps": 1195, "loss": 0.3846, "lr": 2.3575245600154845e-05, "epoch": 2.4872196139801774, "percentage": 49.87, "elapsed_time": "6:31:29", "remaining_time": "6:33:28"}
|
| 597 |
+
{"current_steps": 597, "total_steps": 1195, "loss": 0.3856, "lr": 2.35177236463914e-05, "epoch": 2.491392801251956, "percentage": 49.96, "elapsed_time": "6:32:13", "remaining_time": "6:32:52"}
|
| 598 |
+
{"current_steps": 598, "total_steps": 1195, "loss": 0.3525, "lr": 2.3460171649563753e-05, "epoch": 2.495565988523735, "percentage": 50.04, "elapsed_time": "6:32:49", "remaining_time": "6:32:10"}
|
| 599 |
+
{"current_steps": 599, "total_steps": 1195, "loss": 0.3507, "lr": 2.3402590101193828e-05, "epoch": 2.4997391757955136, "percentage": 50.13, "elapsed_time": "6:33:28", "remaining_time": "6:31:29"}
|
| 600 |
+
{"current_steps": 600, "total_steps": 1195, "loss": 0.3781, "lr": 2.3344979493055958e-05, "epoch": 2.5039123630672924, "percentage": 50.21, "elapsed_time": "6:34:06", "remaining_time": "6:30:49"}
|
| 601 |
+
{"current_steps": 601, "total_steps": 1195, "loss": 0.363, "lr": 2.3287340317172638e-05, "epoch": 2.5080855503390715, "percentage": 50.29, "elapsed_time": "6:34:40", "remaining_time": "6:30:04"}
|
| 602 |
+
{"current_steps": 602, "total_steps": 1195, "loss": 0.3691, "lr": 2.3229673065810365e-05, "epoch": 2.5122587376108503, "percentage": 50.38, "elapsed_time": "6:35:16", "remaining_time": "6:29:21"}
|
| 603 |
+
{"current_steps": 603, "total_steps": 1195, "loss": 0.3542, "lr": 2.3171978231475403e-05, "epoch": 2.516431924882629, "percentage": 50.46, "elapsed_time": "6:35:55", "remaining_time": "6:28:42"}
|
| 604 |
+
{"current_steps": 604, "total_steps": 1195, "loss": 0.3614, "lr": 2.311425630690958e-05, "epoch": 2.520605112154408, "percentage": 50.54, "elapsed_time": "6:36:36", "remaining_time": "6:28:04"}
|
| 605 |
+
{"current_steps": 605, "total_steps": 1195, "loss": 0.3586, "lr": 2.3056507785086105e-05, "epoch": 2.5247782994261865, "percentage": 50.63, "elapsed_time": "6:37:10", "remaining_time": "6:27:19"}
|
| 606 |
+
{"current_steps": 606, "total_steps": 1195, "loss": 0.3637, "lr": 2.2998733159205325e-05, "epoch": 2.5289514866979657, "percentage": 50.71, "elapsed_time": "6:37:50", "remaining_time": "6:26:40"}
|
| 607 |
+
{"current_steps": 607, "total_steps": 1195, "loss": 0.3615, "lr": 2.2940932922690543e-05, "epoch": 2.5331246739697444, "percentage": 50.79, "elapsed_time": "6:38:31", "remaining_time": "6:26:03"}
|
| 608 |
+
{"current_steps": 608, "total_steps": 1195, "loss": 0.3735, "lr": 2.2883107569183776e-05, "epoch": 2.537297861241523, "percentage": 50.88, "elapsed_time": "6:39:09", "remaining_time": "6:25:22"}
|
| 609 |
+
{"current_steps": 609, "total_steps": 1195, "loss": 0.3903, "lr": 2.282525759254156e-05, "epoch": 2.5414710485133023, "percentage": 50.96, "elapsed_time": "6:39:46", "remaining_time": "6:24:40"}
|
| 610 |
+
{"current_steps": 610, "total_steps": 1195, "loss": 0.3665, "lr": 2.2767383486830728e-05, "epoch": 2.5456442357850806, "percentage": 51.05, "elapsed_time": "6:40:25", "remaining_time": "6:24:00"}
|
| 611 |
+
{"current_steps": 611, "total_steps": 1195, "loss": 0.3587, "lr": 2.2709485746324175e-05, "epoch": 2.5498174230568598, "percentage": 51.13, "elapsed_time": "6:41:04", "remaining_time": "6:23:20"}
|
| 612 |
+
{"current_steps": 612, "total_steps": 1195, "loss": 0.3786, "lr": 2.265156486549666e-05, "epoch": 2.5539906103286385, "percentage": 51.21, "elapsed_time": "6:41:45", "remaining_time": "6:22:43"}
|
| 613 |
+
{"current_steps": 613, "total_steps": 1195, "loss": 0.3837, "lr": 2.259362133902056e-05, "epoch": 2.5581637976004172, "percentage": 51.3, "elapsed_time": "6:42:25", "remaining_time": "6:22:04"}
|
| 614 |
+
{"current_steps": 614, "total_steps": 1195, "loss": 0.3735, "lr": 2.2535655661761677e-05, "epoch": 2.5623369848721964, "percentage": 51.38, "elapsed_time": "6:43:08", "remaining_time": "6:21:28"}
|
| 615 |
+
{"current_steps": 615, "total_steps": 1195, "loss": 0.3667, "lr": 2.247766832877496e-05, "epoch": 2.5665101721439747, "percentage": 51.46, "elapsed_time": "6:43:45", "remaining_time": "6:20:47"}
|
| 616 |
+
{"current_steps": 616, "total_steps": 1195, "loss": 0.3567, "lr": 2.241965983530034e-05, "epoch": 2.570683359415754, "percentage": 51.55, "elapsed_time": "6:44:21", "remaining_time": "6:20:04"}
|
| 617 |
+
{"current_steps": 617, "total_steps": 1195, "loss": 0.3624, "lr": 2.236163067675845e-05, "epoch": 2.5748565466875326, "percentage": 51.63, "elapsed_time": "6:45:00", "remaining_time": "6:19:24"}
|
| 618 |
+
{"current_steps": 618, "total_steps": 1195, "loss": 0.3683, "lr": 2.230358134874642e-05, "epoch": 2.5790297339593113, "percentage": 51.72, "elapsed_time": "6:45:40", "remaining_time": "6:18:45"}
|
| 619 |
+
{"current_steps": 619, "total_steps": 1195, "loss": 0.3703, "lr": 2.2245512347033625e-05, "epoch": 2.5832029212310905, "percentage": 51.8, "elapsed_time": "6:46:22", "remaining_time": "6:18:08"}
|
| 620 |
+
{"current_steps": 620, "total_steps": 1195, "loss": 0.3799, "lr": 2.2187424167557496e-05, "epoch": 2.587376108502869, "percentage": 51.88, "elapsed_time": "6:47:00", "remaining_time": "6:17:28"}
|
| 621 |
+
{"current_steps": 621, "total_steps": 1195, "loss": 0.3555, "lr": 2.2129317306419198e-05, "epoch": 2.591549295774648, "percentage": 51.97, "elapsed_time": "6:47:41", "remaining_time": "6:16:49"}
|
| 622 |
+
{"current_steps": 622, "total_steps": 1195, "loss": 0.3683, "lr": 2.2071192259879498e-05, "epoch": 2.5957224830464267, "percentage": 52.05, "elapsed_time": "6:48:12", "remaining_time": "6:16:03"}
|
| 623 |
+
{"current_steps": 623, "total_steps": 1195, "loss": 0.3528, "lr": 2.2013049524354453e-05, "epoch": 2.5998956703182055, "percentage": 52.13, "elapsed_time": "6:48:44", "remaining_time": "6:15:17"}
|
| 624 |
+
{"current_steps": 624, "total_steps": 1195, "loss": 0.353, "lr": 2.1954889596411184e-05, "epoch": 2.604068857589984, "percentage": 52.22, "elapsed_time": "6:49:22", "remaining_time": "6:14:36"}
|
| 625 |
+
{"current_steps": 625, "total_steps": 1195, "loss": 0.3759, "lr": 2.1896712972763658e-05, "epoch": 2.608242044861763, "percentage": 52.3, "elapsed_time": "6:50:04", "remaining_time": "6:13:59"}
|
| 626 |
+
{"current_steps": 626, "total_steps": 1195, "loss": 0.3767, "lr": 2.183852015026842e-05, "epoch": 2.612415232133542, "percentage": 52.38, "elapsed_time": "6:50:45", "remaining_time": "6:13:21"}
|
| 627 |
+
{"current_steps": 627, "total_steps": 1195, "loss": 0.3745, "lr": 2.178031162592038e-05, "epoch": 2.616588419405321, "percentage": 52.47, "elapsed_time": "6:51:21", "remaining_time": "6:12:39"}
|
| 628 |
+
{"current_steps": 628, "total_steps": 1195, "loss": 0.3686, "lr": 2.1722087896848528e-05, "epoch": 2.6207616066770996, "percentage": 52.55, "elapsed_time": "6:51:58", "remaining_time": "6:11:57"}
|
| 629 |
+
{"current_steps": 629, "total_steps": 1195, "loss": 0.3708, "lr": 2.1663849460311722e-05, "epoch": 2.6249347939488783, "percentage": 52.64, "elapsed_time": "6:52:38", "remaining_time": "6:11:18"}
|
| 630 |
+
{"current_steps": 630, "total_steps": 1195, "loss": 0.3804, "lr": 2.1605596813694426e-05, "epoch": 2.629107981220657, "percentage": 52.72, "elapsed_time": "6:53:20", "remaining_time": "6:10:41"}
|
| 631 |
+
{"current_steps": 631, "total_steps": 1195, "loss": 0.365, "lr": 2.154733045450246e-05, "epoch": 2.633281168492436, "percentage": 52.8, "elapsed_time": "6:53:57", "remaining_time": "6:10:00"}
|
| 632 |
+
{"current_steps": 632, "total_steps": 1195, "loss": 0.3648, "lr": 2.1489050880358758e-05, "epoch": 2.637454355764215, "percentage": 52.89, "elapsed_time": "6:54:37", "remaining_time": "6:09:21"}
|
| 633 |
+
{"current_steps": 633, "total_steps": 1195, "loss": 0.3677, "lr": 2.143075858899913e-05, "epoch": 2.6416275430359937, "percentage": 52.97, "elapsed_time": "6:55:14", "remaining_time": "6:08:39"}
|
| 634 |
+
{"current_steps": 634, "total_steps": 1195, "loss": 0.3706, "lr": 2.1372454078267975e-05, "epoch": 2.6458007303077724, "percentage": 53.05, "elapsed_time": "6:55:55", "remaining_time": "6:08:02"}
|
| 635 |
+
{"current_steps": 635, "total_steps": 1195, "loss": 0.3731, "lr": 2.131413784611406e-05, "epoch": 2.649973917579551, "percentage": 53.14, "elapsed_time": "6:56:35", "remaining_time": "6:07:23"}
|
| 636 |
+
{"current_steps": 636, "total_steps": 1195, "loss": 0.3605, "lr": 2.125581039058627e-05, "epoch": 2.6541471048513303, "percentage": 53.22, "elapsed_time": "6:57:13", "remaining_time": "6:06:42"}
|
| 637 |
+
{"current_steps": 637, "total_steps": 1195, "loss": 0.3825, "lr": 2.1197472209829328e-05, "epoch": 2.658320292123109, "percentage": 53.31, "elapsed_time": "6:57:49", "remaining_time": "6:06:00"}
|
| 638 |
+
{"current_steps": 638, "total_steps": 1195, "loss": 0.3502, "lr": 2.113912380207957e-05, "epoch": 2.662493479394888, "percentage": 53.39, "elapsed_time": "6:58:28", "remaining_time": "6:05:20"}
|
| 639 |
+
{"current_steps": 639, "total_steps": 1195, "loss": 0.3689, "lr": 2.1080765665660653e-05, "epoch": 2.6666666666666665, "percentage": 53.47, "elapsed_time": "6:59:05", "remaining_time": "6:04:39"}
|
| 640 |
+
{"current_steps": 640, "total_steps": 1195, "loss": 0.3642, "lr": 2.1022398298979345e-05, "epoch": 2.6708398539384453, "percentage": 53.56, "elapsed_time": "6:59:46", "remaining_time": "6:04:01"}
|
| 641 |
+
{"current_steps": 641, "total_steps": 1195, "loss": 0.376, "lr": 2.096402220052123e-05, "epoch": 2.6750130412102244, "percentage": 53.64, "elapsed_time": "7:00:30", "remaining_time": "6:03:26"}
|
| 642 |
+
{"current_steps": 642, "total_steps": 1195, "loss": 0.3478, "lr": 2.0905637868846478e-05, "epoch": 2.679186228482003, "percentage": 53.72, "elapsed_time": "7:01:06", "remaining_time": "6:02:43"}
|
| 643 |
+
{"current_steps": 643, "total_steps": 1195, "loss": 0.3612, "lr": 2.0847245802585567e-05, "epoch": 2.683359415753782, "percentage": 53.81, "elapsed_time": "7:01:46", "remaining_time": "6:02:04"}
|
| 644 |
+
{"current_steps": 644, "total_steps": 1195, "loss": 0.3716, "lr": 2.078884650043502e-05, "epoch": 2.6875326030255606, "percentage": 53.89, "elapsed_time": "7:02:24", "remaining_time": "6:01:24"}
|
| 645 |
+
{"current_steps": 645, "total_steps": 1195, "loss": 0.3714, "lr": 2.0730440461153183e-05, "epoch": 2.6917057902973394, "percentage": 53.97, "elapsed_time": "7:02:59", "remaining_time": "6:00:41"}
|
| 646 |
+
{"current_steps": 646, "total_steps": 1195, "loss": 0.3787, "lr": 2.067202818355592e-05, "epoch": 2.6958789775691185, "percentage": 54.06, "elapsed_time": "7:03:32", "remaining_time": "5:59:57"}
|
| 647 |
+
{"current_steps": 647, "total_steps": 1195, "loss": 0.3675, "lr": 2.061361016651239e-05, "epoch": 2.7000521648408973, "percentage": 54.14, "elapsed_time": "7:04:13", "remaining_time": "5:59:18"}
|
| 648 |
+
{"current_steps": 648, "total_steps": 1195, "loss": 0.3504, "lr": 2.0555186908940753e-05, "epoch": 2.704225352112676, "percentage": 54.23, "elapsed_time": "7:04:56", "remaining_time": "5:58:42"}
|
| 649 |
+
{"current_steps": 649, "total_steps": 1195, "loss": 0.3602, "lr": 2.049675890980394e-05, "epoch": 2.7083985393844547, "percentage": 54.31, "elapsed_time": "7:05:34", "remaining_time": "5:58:01"}
|
| 650 |
+
{"current_steps": 650, "total_steps": 1195, "loss": 0.3644, "lr": 2.0438326668105364e-05, "epoch": 2.7125717266562335, "percentage": 54.39, "elapsed_time": "7:06:09", "remaining_time": "5:57:18"}
|
| 651 |
+
{"current_steps": 651, "total_steps": 1195, "loss": 0.3846, "lr": 2.0379890682884685e-05, "epoch": 2.7167449139280127, "percentage": 54.48, "elapsed_time": "7:06:48", "remaining_time": "5:56:39"}
|
| 652 |
+
{"current_steps": 652, "total_steps": 1195, "loss": 0.3659, "lr": 2.0321451453213518e-05, "epoch": 2.7209181011997914, "percentage": 54.56, "elapsed_time": "7:07:34", "remaining_time": "5:56:05"}
|
| 653 |
+
{"current_steps": 653, "total_steps": 1195, "loss": 0.368, "lr": 2.026300947819121e-05, "epoch": 2.72509128847157, "percentage": 54.64, "elapsed_time": "7:08:14", "remaining_time": "5:55:27"}
|
| 654 |
+
{"current_steps": 654, "total_steps": 1195, "loss": 0.3633, "lr": 2.020456525694054e-05, "epoch": 2.729264475743349, "percentage": 54.73, "elapsed_time": "7:08:59", "remaining_time": "5:54:52"}
|
| 655 |
+
{"current_steps": 655, "total_steps": 1195, "loss": 0.3644, "lr": 2.014611928860346e-05, "epoch": 2.7334376630151276, "percentage": 54.81, "elapsed_time": "7:09:30", "remaining_time": "5:54:06"}
|
| 656 |
+
{"current_steps": 656, "total_steps": 1195, "loss": 0.3714, "lr": 2.008767207233687e-05, "epoch": 2.7376108502869068, "percentage": 54.9, "elapsed_time": "7:10:12", "remaining_time": "5:53:28"}
|
| 657 |
+
{"current_steps": 657, "total_steps": 1195, "loss": 0.3675, "lr": 2.0029224107308304e-05, "epoch": 2.7417840375586855, "percentage": 54.98, "elapsed_time": "7:10:49", "remaining_time": "5:52:47"}
|
| 658 |
+
{"current_steps": 658, "total_steps": 1195, "loss": 0.3531, "lr": 1.99707758926917e-05, "epoch": 2.7459572248304642, "percentage": 55.06, "elapsed_time": "7:11:29", "remaining_time": "5:52:08"}
|
| 659 |
+
{"current_steps": 659, "total_steps": 1195, "loss": 0.361, "lr": 1.9912327927663135e-05, "epoch": 2.750130412102243, "percentage": 55.15, "elapsed_time": "7:12:09", "remaining_time": "5:51:30"}
|
| 660 |
+
{"current_steps": 660, "total_steps": 1195, "loss": 0.3716, "lr": 1.985388071139654e-05, "epoch": 2.7543035993740217, "percentage": 55.23, "elapsed_time": "7:12:47", "remaining_time": "5:50:49"}
|
| 661 |
+
{"current_steps": 661, "total_steps": 1195, "loss": 0.3685, "lr": 1.9795434743059467e-05, "epoch": 2.758476786645801, "percentage": 55.31, "elapsed_time": "7:13:24", "remaining_time": "5:50:07"}
|
| 662 |
+
{"current_steps": 662, "total_steps": 1195, "loss": 0.3776, "lr": 1.9736990521808793e-05, "epoch": 2.7626499739175796, "percentage": 55.4, "elapsed_time": "7:14:04", "remaining_time": "5:49:29"}
|
| 663 |
+
{"current_steps": 663, "total_steps": 1195, "loss": 0.3726, "lr": 1.9678548546786486e-05, "epoch": 2.7668231611893583, "percentage": 55.48, "elapsed_time": "7:14:45", "remaining_time": "5:48:51"}
|
| 664 |
+
{"current_steps": 664, "total_steps": 1195, "loss": 0.3765, "lr": 1.9620109317115325e-05, "epoch": 2.770996348461137, "percentage": 55.56, "elapsed_time": "7:15:23", "remaining_time": "5:48:11"}
|
| 665 |
+
{"current_steps": 665, "total_steps": 1195, "loss": 0.3514, "lr": 1.956167333189464e-05, "epoch": 2.775169535732916, "percentage": 55.65, "elapsed_time": "7:16:07", "remaining_time": "5:47:35"}
|
| 666 |
+
{"current_steps": 666, "total_steps": 1195, "loss": 0.3549, "lr": 1.9503241090196068e-05, "epoch": 2.779342723004695, "percentage": 55.73, "elapsed_time": "7:16:48", "remaining_time": "5:46:57"}
|
| 667 |
+
{"current_steps": 667, "total_steps": 1195, "loss": 0.3677, "lr": 1.9444813091059253e-05, "epoch": 2.7835159102764737, "percentage": 55.82, "elapsed_time": "7:17:28", "remaining_time": "5:46:18"}
|
| 668 |
+
{"current_steps": 668, "total_steps": 1195, "loss": 0.3659, "lr": 1.938638983348762e-05, "epoch": 2.7876890975482524, "percentage": 55.9, "elapsed_time": "7:18:07", "remaining_time": "5:45:38"}
|
| 669 |
+
{"current_steps": 669, "total_steps": 1195, "loss": 0.3549, "lr": 1.9327971816444086e-05, "epoch": 2.791862284820031, "percentage": 55.98, "elapsed_time": "7:18:43", "remaining_time": "5:44:56"}
|
| 670 |
+
{"current_steps": 670, "total_steps": 1195, "loss": 0.3911, "lr": 1.9269559538846823e-05, "epoch": 2.79603547209181, "percentage": 56.07, "elapsed_time": "7:19:26", "remaining_time": "5:44:20"}
|
| 671 |
+
{"current_steps": 671, "total_steps": 1195, "loss": 0.3703, "lr": 1.9211153499564984e-05, "epoch": 2.800208659363589, "percentage": 56.15, "elapsed_time": "7:20:02", "remaining_time": "5:43:38"}
|
| 672 |
+
{"current_steps": 672, "total_steps": 1195, "loss": 0.3608, "lr": 1.9152754197414443e-05, "epoch": 2.804381846635368, "percentage": 56.23, "elapsed_time": "7:20:44", "remaining_time": "5:43:00"}
|
| 673 |
+
{"current_steps": 673, "total_steps": 1195, "loss": 0.3588, "lr": 1.909436213115353e-05, "epoch": 2.8085550339071466, "percentage": 56.32, "elapsed_time": "7:21:22", "remaining_time": "5:42:20"}
|
| 674 |
+
{"current_steps": 674, "total_steps": 1195, "loss": 0.3501, "lr": 1.9035977799478772e-05, "epoch": 2.8127282211789253, "percentage": 56.4, "elapsed_time": "7:21:58", "remaining_time": "5:41:39"}
|
| 675 |
+
{"current_steps": 675, "total_steps": 1195, "loss": 0.3597, "lr": 1.897760170102066e-05, "epoch": 2.816901408450704, "percentage": 56.49, "elapsed_time": "7:22:42", "remaining_time": "5:41:02"}
|
| 676 |
+
{"current_steps": 676, "total_steps": 1195, "loss": 0.3765, "lr": 1.8919234334339354e-05, "epoch": 2.821074595722483, "percentage": 56.57, "elapsed_time": "7:23:25", "remaining_time": "5:40:26"}
|
| 677 |
+
{"current_steps": 677, "total_steps": 1195, "loss": 0.3657, "lr": 1.886087619792044e-05, "epoch": 2.825247782994262, "percentage": 56.65, "elapsed_time": "7:24:03", "remaining_time": "5:39:46"}
|
| 678 |
+
{"current_steps": 678, "total_steps": 1195, "loss": 0.3554, "lr": 1.880252779017067e-05, "epoch": 2.8294209702660407, "percentage": 56.74, "elapsed_time": "7:24:45", "remaining_time": "5:39:08"}
|
| 679 |
+
{"current_steps": 679, "total_steps": 1195, "loss": 0.3747, "lr": 1.8744189609413733e-05, "epoch": 2.8335941575378194, "percentage": 56.82, "elapsed_time": "7:25:22", "remaining_time": "5:38:27"}
|
| 680 |
+
{"current_steps": 680, "total_steps": 1195, "loss": 0.362, "lr": 1.8685862153885947e-05, "epoch": 2.837767344809598, "percentage": 56.9, "elapsed_time": "7:26:05", "remaining_time": "5:37:50"}
|
| 681 |
+
{"current_steps": 681, "total_steps": 1195, "loss": 0.3533, "lr": 1.8627545921732038e-05, "epoch": 2.8419405320813773, "percentage": 56.99, "elapsed_time": "7:26:46", "remaining_time": "5:37:12"}
|
| 682 |
+
{"current_steps": 682, "total_steps": 1195, "loss": 0.3753, "lr": 1.856924141100088e-05, "epoch": 2.846113719353156, "percentage": 57.07, "elapsed_time": "7:27:24", "remaining_time": "5:36:32"}
|
| 683 |
+
{"current_steps": 683, "total_steps": 1195, "loss": 0.3808, "lr": 1.8510949119641246e-05, "epoch": 2.850286906624935, "percentage": 57.15, "elapsed_time": "7:28:04", "remaining_time": "5:35:53"}
|
| 684 |
+
{"current_steps": 684, "total_steps": 1195, "loss": 0.3543, "lr": 1.8452669545497545e-05, "epoch": 2.8544600938967135, "percentage": 57.24, "elapsed_time": "7:28:46", "remaining_time": "5:35:16"}
|
| 685 |
+
{"current_steps": 685, "total_steps": 1195, "loss": 0.3643, "lr": 1.839440318630558e-05, "epoch": 2.8586332811684922, "percentage": 57.32, "elapsed_time": "7:29:25", "remaining_time": "5:34:36"}
|
| 686 |
+
{"current_steps": 686, "total_steps": 1195, "loss": 0.3532, "lr": 1.833615053968828e-05, "epoch": 2.8628064684402714, "percentage": 57.41, "elapsed_time": "7:30:03", "remaining_time": "5:33:55"}
|
| 687 |
+
{"current_steps": 687, "total_steps": 1195, "loss": 0.3432, "lr": 1.8277912103151475e-05, "epoch": 2.86697965571205, "percentage": 57.49, "elapsed_time": "7:30:41", "remaining_time": "5:33:16"}
|
| 688 |
+
{"current_steps": 688, "total_steps": 1195, "loss": 0.3678, "lr": 1.8219688374079624e-05, "epoch": 2.871152842983829, "percentage": 57.57, "elapsed_time": "7:31:19", "remaining_time": "5:32:35"}
|
| 689 |
+
{"current_steps": 689, "total_steps": 1195, "loss": 0.3822, "lr": 1.8161479849731582e-05, "epoch": 2.8753260302556076, "percentage": 57.66, "elapsed_time": "7:32:02", "remaining_time": "5:31:59"}
|
| 690 |
+
{"current_steps": 690, "total_steps": 1195, "loss": 0.3508, "lr": 1.8103287027236352e-05, "epoch": 2.8794992175273864, "percentage": 57.74, "elapsed_time": "7:32:43", "remaining_time": "5:31:20"}
|
| 691 |
+
{"current_steps": 691, "total_steps": 1195, "loss": 0.3697, "lr": 1.804511040358882e-05, "epoch": 2.8836724047991655, "percentage": 57.82, "elapsed_time": "7:33:21", "remaining_time": "5:30:39"}
|
| 692 |
+
{"current_steps": 692, "total_steps": 1195, "loss": 0.3695, "lr": 1.7986950475645553e-05, "epoch": 2.8878455920709443, "percentage": 57.91, "elapsed_time": "7:33:59", "remaining_time": "5:29:59"}
|
| 693 |
+
{"current_steps": 693, "total_steps": 1195, "loss": 0.3755, "lr": 1.7928807740120506e-05, "epoch": 2.892018779342723, "percentage": 57.99, "elapsed_time": "7:34:42", "remaining_time": "5:29:22"}
|
| 694 |
+
{"current_steps": 694, "total_steps": 1195, "loss": 0.3754, "lr": 1.787068269358081e-05, "epoch": 2.8961919666145017, "percentage": 58.08, "elapsed_time": "7:35:20", "remaining_time": "5:28:42"}
|
| 695 |
+
{"current_steps": 695, "total_steps": 1195, "loss": 0.3685, "lr": 1.7812575832442518e-05, "epoch": 2.9003651538862805, "percentage": 58.16, "elapsed_time": "7:36:02", "remaining_time": "5:28:05"}
|
| 696 |
+
{"current_steps": 696, "total_steps": 1195, "loss": 0.3689, "lr": 1.775448765296637e-05, "epoch": 2.9045383411580596, "percentage": 58.24, "elapsed_time": "7:36:47", "remaining_time": "5:27:29"}
|
| 697 |
+
{"current_steps": 697, "total_steps": 1195, "loss": 0.3607, "lr": 1.7696418651253585e-05, "epoch": 2.9087115284298384, "percentage": 58.33, "elapsed_time": "7:37:21", "remaining_time": "5:26:46"}
|
| 698 |
+
{"current_steps": 698, "total_steps": 1195, "loss": 0.3642, "lr": 1.7638369323241554e-05, "epoch": 2.912884715701617, "percentage": 58.41, "elapsed_time": "7:37:59", "remaining_time": "5:26:06"}
|
| 699 |
+
{"current_steps": 699, "total_steps": 1195, "loss": 0.376, "lr": 1.7580340164699666e-05, "epoch": 2.917057902973396, "percentage": 58.49, "elapsed_time": "7:38:38", "remaining_time": "5:25:27"}
|
| 700 |
+
{"current_steps": 700, "total_steps": 1195, "loss": 0.3567, "lr": 1.752233167122504e-05, "epoch": 2.9212310902451746, "percentage": 58.58, "elapsed_time": "7:39:20", "remaining_time": "5:24:49"}
|
| 701 |
+
{"current_steps": 701, "total_steps": 1195, "loss": 0.3507, "lr": 1.7464344338238327e-05, "epoch": 2.9254042775169538, "percentage": 58.66, "elapsed_time": "7:39:59", "remaining_time": "5:24:09"}
|
| 702 |
+
{"current_steps": 702, "total_steps": 1195, "loss": 0.3552, "lr": 1.7406378660979443e-05, "epoch": 2.9295774647887325, "percentage": 58.74, "elapsed_time": "7:40:37", "remaining_time": "5:23:29"}
|
| 703 |
+
{"current_steps": 703, "total_steps": 1195, "loss": 0.363, "lr": 1.7348435134503347e-05, "epoch": 2.933750652060511, "percentage": 58.83, "elapsed_time": "7:41:19", "remaining_time": "5:22:51"}
|
| 704 |
+
{"current_steps": 704, "total_steps": 1195, "loss": 0.3727, "lr": 1.7290514253675832e-05, "epoch": 2.93792383933229, "percentage": 58.91, "elapsed_time": "7:42:00", "remaining_time": "5:22:13"}
|
| 705 |
+
{"current_steps": 705, "total_steps": 1195, "loss": 0.3595, "lr": 1.7232616513169272e-05, "epoch": 2.9420970266040687, "percentage": 59.0, "elapsed_time": "7:42:37", "remaining_time": "5:21:32"}
|
| 706 |
+
{"current_steps": 706, "total_steps": 1195, "loss": 0.3703, "lr": 1.717474240745844e-05, "epoch": 2.946270213875848, "percentage": 59.08, "elapsed_time": "7:43:23", "remaining_time": "5:20:57"}
|
| 707 |
+
{"current_steps": 707, "total_steps": 1195, "loss": 0.3595, "lr": 1.711689243081623e-05, "epoch": 2.9504434011476266, "percentage": 59.16, "elapsed_time": "7:44:01", "remaining_time": "5:20:17"}
|
| 708 |
+
{"current_steps": 708, "total_steps": 1195, "loss": 0.3702, "lr": 1.7059067077309467e-05, "epoch": 2.9546165884194053, "percentage": 59.25, "elapsed_time": "7:44:34", "remaining_time": "5:19:33"}
|
| 709 |
+
{"current_steps": 709, "total_steps": 1195, "loss": 0.3605, "lr": 1.7001266840794678e-05, "epoch": 2.958789775691184, "percentage": 59.33, "elapsed_time": "7:45:12", "remaining_time": "5:18:53"}
|
| 710 |
+
{"current_steps": 710, "total_steps": 1195, "loss": 0.3624, "lr": 1.69434922149139e-05, "epoch": 2.962962962962963, "percentage": 59.41, "elapsed_time": "7:45:50", "remaining_time": "5:18:12"}
|
| 711 |
+
{"current_steps": 711, "total_steps": 1195, "loss": 0.351, "lr": 1.6885743693090422e-05, "epoch": 2.967136150234742, "percentage": 59.5, "elapsed_time": "7:46:26", "remaining_time": "5:17:31"}
|
| 712 |
+
{"current_steps": 712, "total_steps": 1195, "loss": 0.3717, "lr": 1.6828021768524604e-05, "epoch": 2.9713093375065207, "percentage": 59.58, "elapsed_time": "7:47:00", "remaining_time": "5:16:48"}
|
| 713 |
+
{"current_steps": 713, "total_steps": 1195, "loss": 0.3679, "lr": 1.6770326934189638e-05, "epoch": 2.9754825247782994, "percentage": 59.67, "elapsed_time": "7:47:39", "remaining_time": "5:16:08"}
|
| 714 |
+
{"current_steps": 714, "total_steps": 1195, "loss": 0.3863, "lr": 1.671265968282736e-05, "epoch": 2.979655712050078, "percentage": 59.75, "elapsed_time": "7:48:21", "remaining_time": "5:15:31"}
|
| 715 |
+
{"current_steps": 715, "total_steps": 1195, "loss": 0.3602, "lr": 1.6655020506944046e-05, "epoch": 2.983828899321857, "percentage": 59.83, "elapsed_time": "7:49:02", "remaining_time": "5:14:52"}
|
| 716 |
+
{"current_steps": 716, "total_steps": 1195, "loss": 0.3538, "lr": 1.659740989880618e-05, "epoch": 2.988002086593636, "percentage": 59.92, "elapsed_time": "7:49:41", "remaining_time": "5:14:13"}
|
| 717 |
+
{"current_steps": 717, "total_steps": 1195, "loss": 0.3561, "lr": 1.653982835043626e-05, "epoch": 2.992175273865415, "percentage": 60.0, "elapsed_time": "7:50:24", "remaining_time": "5:13:36"}
|
| 718 |
+
{"current_steps": 718, "total_steps": 1195, "loss": 0.383, "lr": 1.6482276353608602e-05, "epoch": 2.9963484611371936, "percentage": 60.08, "elapsed_time": "7:51:00", "remaining_time": "5:12:54"}
|
| 719 |
+
{"current_steps": 719, "total_steps": 1195, "loss": 0.335, "lr": 1.642475439984516e-05, "epoch": 3.0005216484089723, "percentage": 60.17, "elapsed_time": "7:52:25", "remaining_time": "5:12:45"}
|
| 720 |
+
{"current_steps": 720, "total_steps": 1195, "loss": 0.2541, "lr": 1.6367262980411273e-05, "epoch": 3.004694835680751, "percentage": 60.25, "elapsed_time": "7:53:07", "remaining_time": "5:12:07"}
|
| 721 |
+
{"current_steps": 721, "total_steps": 1195, "loss": 0.2596, "lr": 1.6309802586311523e-05, "epoch": 3.00886802295253, "percentage": 60.33, "elapsed_time": "7:53:48", "remaining_time": "5:11:29"}
|
| 722 |
+
{"current_steps": 722, "total_steps": 1195, "loss": 0.2529, "lr": 1.6252373708285505e-05, "epoch": 3.013041210224309, "percentage": 60.42, "elapsed_time": "7:54:28", "remaining_time": "5:10:50"}
|