Training in progress, epoch 2
Browse files
model-00001-of-00004.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 4877660776
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:a7740818ede47e97dd8a223218e54e0b6d5c310fde7829c94f53457af3486753
|
| 3 |
size 4877660776
|
model-00002-of-00004.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 4932751008
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:443abd09b3279781d2d57b06aaf3ce071224782e45a7bcb09fcdd0fa585518dc
|
| 3 |
size 4932751008
|
model-00003-of-00004.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 4330865200
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:a674629e0f6cdb428d28e82566bc30a783308227a38785d63afde68a5f59f0df
|
| 3 |
size 4330865200
|
model-00004-of-00004.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 1089994880
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:8850041214617904fa29c66fac0654e5ac580ee4b1a8dfdef56a8f5fdcc1e808
|
| 3 |
size 1089994880
|
trainer_log.jsonl
CHANGED
|
@@ -443,3 +443,225 @@
|
|
| 443 |
{"current_steps": 443, "total_steps": 666, "loss": 0.4393, "lr": 8.619017900700374e-06, "epoch": 1.9912970241437393, "percentage": 66.52, "elapsed_time": "20:13:42", "remaining_time": "10:10:58"}
|
| 444 |
{"current_steps": 444, "total_steps": 666, "loss": 0.4239, "lr": 8.550812888872337e-06, "epoch": 1.9957888826501966, "percentage": 66.67, "elapsed_time": "20:16:30", "remaining_time": "10:08:15"}
|
| 445 |
{"current_steps": 445, "total_steps": 666, "loss": 0.6928, "lr": 8.48276167820656e-06, "epoch": 2.0016844469399215, "percentage": 66.82, "elapsed_time": "20:19:57", "remaining_time": "10:05:51"}
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 443 |
{"current_steps": 443, "total_steps": 666, "loss": 0.4393, "lr": 8.619017900700374e-06, "epoch": 1.9912970241437393, "percentage": 66.52, "elapsed_time": "20:13:42", "remaining_time": "10:10:58"}
|
| 444 |
{"current_steps": 444, "total_steps": 666, "loss": 0.4239, "lr": 8.550812888872337e-06, "epoch": 1.9957888826501966, "percentage": 66.67, "elapsed_time": "20:16:30", "remaining_time": "10:08:15"}
|
| 445 |
{"current_steps": 445, "total_steps": 666, "loss": 0.6928, "lr": 8.48276167820656e-06, "epoch": 2.0016844469399215, "percentage": 66.82, "elapsed_time": "20:19:57", "remaining_time": "10:05:51"}
|
| 446 |
+
{"current_steps": 446, "total_steps": 666, "loss": 0.4081, "lr": 8.414866140595784e-06, "epoch": 2.0061763054463784, "percentage": 66.97, "elapsed_time": "20:22:41", "remaining_time": "10:03:07"}
|
| 447 |
+
{"current_steps": 447, "total_steps": 666, "loss": 0.4048, "lr": 8.347128143650638e-06, "epoch": 2.0106681639528357, "percentage": 67.12, "elapsed_time": "20:25:21", "remaining_time": "10:00:20"}
|
| 448 |
+
{"current_steps": 448, "total_steps": 666, "loss": 0.3931, "lr": 8.279549550648262e-06, "epoch": 2.0151600224592925, "percentage": 67.27, "elapsed_time": "20:28:06", "remaining_time": "9:57:36"}
|
| 449 |
+
{"current_steps": 449, "total_steps": 666, "loss": 0.4008, "lr": 8.212132220481046e-06, "epoch": 2.0196518809657498, "percentage": 67.42, "elapsed_time": "20:30:55", "remaining_time": "9:54:53"}
|
| 450 |
+
{"current_steps": 450, "total_steps": 666, "loss": 0.4154, "lr": 8.144878007605514e-06, "epoch": 2.0241437394722066, "percentage": 67.57, "elapsed_time": "20:33:50", "remaining_time": "9:52:14"}
|
| 451 |
+
{"current_steps": 451, "total_steps": 666, "loss": 0.4162, "lr": 8.077788761991291e-06, "epoch": 2.028635597978664, "percentage": 67.72, "elapsed_time": "20:36:36", "remaining_time": "9:49:30"}
|
| 452 |
+
{"current_steps": 452, "total_steps": 666, "loss": 0.4003, "lr": 8.01086632907024e-06, "epoch": 2.0331274564851207, "percentage": 67.87, "elapsed_time": "20:39:20", "remaining_time": "9:46:45"}
|
| 453 |
+
{"current_steps": 453, "total_steps": 666, "loss": 0.3955, "lr": 7.944112549685684e-06, "epoch": 2.0376193149915776, "percentage": 68.02, "elapsed_time": "20:42:11", "remaining_time": "9:44:04"}
|
| 454 |
+
{"current_steps": 454, "total_steps": 666, "loss": 0.4102, "lr": 7.877529260041764e-06, "epoch": 2.042111173498035, "percentage": 68.17, "elapsed_time": "20:45:02", "remaining_time": "9:41:22"}
|
| 455 |
+
{"current_steps": 455, "total_steps": 666, "loss": 0.4138, "lr": 7.811118291652952e-06, "epoch": 2.0466030320044917, "percentage": 68.32, "elapsed_time": "20:47:44", "remaining_time": "9:38:37"}
|
| 456 |
+
{"current_steps": 456, "total_steps": 666, "loss": 0.3935, "lr": 7.744881471293649e-06, "epoch": 2.051094890510949, "percentage": 68.47, "elapsed_time": "20:50:35", "remaining_time": "9:35:55"}
|
| 457 |
+
{"current_steps": 457, "total_steps": 666, "loss": 0.4042, "lr": 7.678820620947954e-06, "epoch": 2.055586749017406, "percentage": 68.62, "elapsed_time": "20:53:21", "remaining_time": "9:33:11"}
|
| 458 |
+
{"current_steps": 458, "total_steps": 666, "loss": 0.4161, "lr": 7.612937557759534e-06, "epoch": 2.060078607523863, "percentage": 68.77, "elapsed_time": "20:56:00", "remaining_time": "9:30:24"}
|
| 459 |
+
{"current_steps": 459, "total_steps": 666, "loss": 0.421, "lr": 7.54723409398164e-06, "epoch": 2.06457046603032, "percentage": 68.92, "elapsed_time": "20:58:42", "remaining_time": "9:27:39"}
|
| 460 |
+
{"current_steps": 460, "total_steps": 666, "loss": 0.3861, "lr": 7.481712036927267e-06, "epoch": 2.069062324536777, "percentage": 69.07, "elapsed_time": "21:01:29", "remaining_time": "9:24:55"}
|
| 461 |
+
{"current_steps": 461, "total_steps": 666, "loss": 0.3922, "lr": 7.416373188919427e-06, "epoch": 2.073554183043234, "percentage": 69.22, "elapsed_time": "21:04:20", "remaining_time": "9:22:14"}
|
| 462 |
+
{"current_steps": 462, "total_steps": 666, "loss": 0.4049, "lr": 7.351219347241587e-06, "epoch": 2.0780460415496913, "percentage": 69.37, "elapsed_time": "21:07:13", "remaining_time": "9:19:33"}
|
| 463 |
+
{"current_steps": 463, "total_steps": 666, "loss": 0.4038, "lr": 7.286252304088215e-06, "epoch": 2.082537900056148, "percentage": 69.52, "elapsed_time": "21:10:01", "remaining_time": "9:16:50"}
|
| 464 |
+
{"current_steps": 464, "total_steps": 666, "loss": 0.402, "lr": 7.221473846515494e-06, "epoch": 2.0870297585626054, "percentage": 69.67, "elapsed_time": "21:12:43", "remaining_time": "9:14:04"}
|
| 465 |
+
{"current_steps": 465, "total_steps": 666, "loss": 0.3956, "lr": 7.156885756392161e-06, "epoch": 2.0915216170690623, "percentage": 69.82, "elapsed_time": "21:15:26", "remaining_time": "9:11:19"}
|
| 466 |
+
{"current_steps": 466, "total_steps": 666, "loss": 0.3912, "lr": 7.092489810350491e-06, "epoch": 2.0960134755755195, "percentage": 69.97, "elapsed_time": "21:18:19", "remaining_time": "9:08:38"}
|
| 467 |
+
{"current_steps": 467, "total_steps": 666, "loss": 0.4066, "lr": 7.028287779737433e-06, "epoch": 2.1005053340819764, "percentage": 70.12, "elapsed_time": "21:20:49", "remaining_time": "9:05:47"}
|
| 468 |
+
{"current_steps": 468, "total_steps": 666, "loss": 0.4048, "lr": 6.964281430565874e-06, "epoch": 2.1049971925884337, "percentage": 70.27, "elapsed_time": "21:23:31", "remaining_time": "9:03:01"}
|
| 469 |
+
{"current_steps": 469, "total_steps": 666, "loss": 0.3929, "lr": 6.9004725234660754e-06, "epoch": 2.1094890510948905, "percentage": 70.42, "elapsed_time": "21:26:17", "remaining_time": "9:00:17"}
|
| 470 |
+
{"current_steps": 470, "total_steps": 666, "loss": 0.4214, "lr": 6.836862813637232e-06, "epoch": 2.1139809096013478, "percentage": 70.57, "elapsed_time": "21:29:05", "remaining_time": "8:57:34"}
|
| 471 |
+
{"current_steps": 471, "total_steps": 666, "loss": 0.3956, "lr": 6.773454050799198e-06, "epoch": 2.1184727681078046, "percentage": 70.72, "elapsed_time": "21:31:45", "remaining_time": "8:54:48"}
|
| 472 |
+
{"current_steps": 472, "total_steps": 666, "loss": 0.4067, "lr": 6.710247979144353e-06, "epoch": 2.1229646266142614, "percentage": 70.87, "elapsed_time": "21:34:36", "remaining_time": "8:52:06"}
|
| 473 |
+
{"current_steps": 473, "total_steps": 666, "loss": 0.4087, "lr": 6.6472463372896255e-06, "epoch": 2.1274564851207187, "percentage": 71.02, "elapsed_time": "21:37:32", "remaining_time": "8:49:26"}
|
| 474 |
+
{"current_steps": 474, "total_steps": 666, "loss": 0.4155, "lr": 6.584450858228674e-06, "epoch": 2.1319483436271756, "percentage": 71.17, "elapsed_time": "21:40:13", "remaining_time": "8:46:40"}
|
| 475 |
+
{"current_steps": 475, "total_steps": 666, "loss": 0.3982, "lr": 6.5218632692842e-06, "epoch": 2.136440202133633, "percentage": 71.32, "elapsed_time": "21:42:53", "remaining_time": "8:43:54"}
|
| 476 |
+
{"current_steps": 476, "total_steps": 666, "loss": 0.4012, "lr": 6.459485292060468e-06, "epoch": 2.1409320606400897, "percentage": 71.47, "elapsed_time": "21:45:40", "remaining_time": "8:41:10"}
|
| 477 |
+
{"current_steps": 477, "total_steps": 666, "loss": 0.4009, "lr": 6.397318642395911e-06, "epoch": 2.145423919146547, "percentage": 71.62, "elapsed_time": "21:48:30", "remaining_time": "8:38:28"}
|
| 478 |
+
{"current_steps": 478, "total_steps": 666, "loss": 0.3972, "lr": 6.335365030315953e-06, "epoch": 2.149915777653004, "percentage": 71.77, "elapsed_time": "21:51:06", "remaining_time": "8:35:40"}
|
| 479 |
+
{"current_steps": 479, "total_steps": 666, "loss": 0.4017, "lr": 6.273626159985971e-06, "epoch": 2.154407636159461, "percentage": 71.92, "elapsed_time": "21:53:49", "remaining_time": "8:32:54"}
|
| 480 |
+
{"current_steps": 480, "total_steps": 666, "loss": 0.4028, "lr": 6.2121037296644114e-06, "epoch": 2.158899494665918, "percentage": 72.07, "elapsed_time": "21:56:26", "remaining_time": "8:30:07"}
|
| 481 |
+
{"current_steps": 481, "total_steps": 666, "loss": 0.4188, "lr": 6.1507994316560836e-06, "epoch": 2.163391353172375, "percentage": 72.22, "elapsed_time": "21:59:21", "remaining_time": "8:27:26"}
|
| 482 |
+
{"current_steps": 482, "total_steps": 666, "loss": 0.37, "lr": 6.089714952265603e-06, "epoch": 2.167883211678832, "percentage": 72.37, "elapsed_time": "22:01:58", "remaining_time": "8:24:39"}
|
| 483 |
+
{"current_steps": 483, "total_steps": 666, "loss": 0.4305, "lr": 6.028851971751007e-06, "epoch": 2.1723750701852893, "percentage": 72.52, "elapsed_time": "22:04:51", "remaining_time": "8:21:57"}
|
| 484 |
+
{"current_steps": 484, "total_steps": 666, "loss": 0.3958, "lr": 5.968212164277541e-06, "epoch": 2.176866928691746, "percentage": 72.67, "elapsed_time": "22:07:29", "remaining_time": "8:19:10"}
|
| 485 |
+
{"current_steps": 485, "total_steps": 666, "loss": 0.4198, "lr": 5.9077971978716e-06, "epoch": 2.1813587871982034, "percentage": 72.82, "elapsed_time": "22:10:08", "remaining_time": "8:16:24"}
|
| 486 |
+
{"current_steps": 486, "total_steps": 666, "loss": 0.4195, "lr": 5.8476087343748505e-06, "epoch": 2.1858506457046603, "percentage": 72.97, "elapsed_time": "22:12:52", "remaining_time": "8:13:39"}
|
| 487 |
+
{"current_steps": 487, "total_steps": 666, "loss": 0.3914, "lr": 5.787648429398515e-06, "epoch": 2.1903425042111175, "percentage": 73.12, "elapsed_time": "22:15:21", "remaining_time": "8:10:49"}
|
| 488 |
+
{"current_steps": 488, "total_steps": 666, "loss": 0.414, "lr": 5.727917932277831e-06, "epoch": 2.1948343627175744, "percentage": 73.27, "elapsed_time": "22:18:00", "remaining_time": "8:08:02"}
|
| 489 |
+
{"current_steps": 489, "total_steps": 666, "loss": 0.3993, "lr": 5.668418886026689e-06, "epoch": 2.199326221224031, "percentage": 73.42, "elapsed_time": "22:20:45", "remaining_time": "8:05:18"}
|
| 490 |
+
{"current_steps": 490, "total_steps": 666, "loss": 0.3934, "lr": 5.609152927292432e-06, "epoch": 2.2038180797304885, "percentage": 73.57, "elapsed_time": "22:23:22", "remaining_time": "8:02:31"}
|
| 491 |
+
{"current_steps": 491, "total_steps": 666, "loss": 0.3982, "lr": 5.55012168631083e-06, "epoch": 2.2083099382369458, "percentage": 73.72, "elapsed_time": "22:26:15", "remaining_time": "7:59:49"}
|
| 492 |
+
{"current_steps": 492, "total_steps": 666, "loss": 0.3956, "lr": 5.491326786861248e-06, "epoch": 2.2128017967434026, "percentage": 73.87, "elapsed_time": "22:28:45", "remaining_time": "7:57:00"}
|
| 493 |
+
{"current_steps": 493, "total_steps": 666, "loss": 0.4166, "lr": 5.432769846221986e-06, "epoch": 2.2172936552498594, "percentage": 74.02, "elapsed_time": "22:31:27", "remaining_time": "7:54:14"}
|
| 494 |
+
{"current_steps": 494, "total_steps": 666, "loss": 0.3881, "lr": 5.374452475125769e-06, "epoch": 2.2217855137563167, "percentage": 74.17, "elapsed_time": "22:34:11", "remaining_time": "7:51:29"}
|
| 495 |
+
{"current_steps": 495, "total_steps": 666, "loss": 0.3912, "lr": 5.316376277715458e-06, "epoch": 2.2262773722627736, "percentage": 74.32, "elapsed_time": "22:36:48", "remaining_time": "7:48:43"}
|
| 496 |
+
{"current_steps": 496, "total_steps": 666, "loss": 0.3956, "lr": 5.258542851499929e-06, "epoch": 2.230769230769231, "percentage": 74.47, "elapsed_time": "22:39:27", "remaining_time": "7:45:56"}
|
| 497 |
+
{"current_steps": 497, "total_steps": 666, "loss": 0.4026, "lr": 5.200953787310104e-06, "epoch": 2.2352610892756877, "percentage": 74.62, "elapsed_time": "22:42:12", "remaining_time": "7:43:12"}
|
| 498 |
+
{"current_steps": 498, "total_steps": 666, "loss": 0.3952, "lr": 5.143610669255224e-06, "epoch": 2.239752947782145, "percentage": 74.77, "elapsed_time": "22:44:53", "remaining_time": "7:40:26"}
|
| 499 |
+
{"current_steps": 499, "total_steps": 666, "loss": 0.3885, "lr": 5.08651507467926e-06, "epoch": 2.244244806288602, "percentage": 74.92, "elapsed_time": "22:47:34", "remaining_time": "7:37:41"}
|
| 500 |
+
{"current_steps": 500, "total_steps": 666, "loss": 0.4158, "lr": 5.02966857411752e-06, "epoch": 2.248736664795059, "percentage": 75.08, "elapsed_time": "22:50:17", "remaining_time": "7:34:56"}
|
| 501 |
+
{"current_steps": 501, "total_steps": 666, "loss": 0.3998, "lr": 4.9730727312534544e-06, "epoch": 2.253228523301516, "percentage": 75.23, "elapsed_time": "22:53:08", "remaining_time": "7:32:13"}
|
| 502 |
+
{"current_steps": 502, "total_steps": 666, "loss": 0.418, "lr": 4.916729102875645e-06, "epoch": 2.257720381807973, "percentage": 75.38, "elapsed_time": "22:55:55", "remaining_time": "7:29:30"}
|
| 503 |
+
{"current_steps": 503, "total_steps": 666, "loss": 0.3897, "lr": 4.860639238834977e-06, "epoch": 2.26221224031443, "percentage": 75.53, "elapsed_time": "22:58:46", "remaining_time": "7:26:48"}
|
| 504 |
+
{"current_steps": 504, "total_steps": 666, "loss": 0.4283, "lr": 4.8048046820020125e-06, "epoch": 2.2667040988208873, "percentage": 75.68, "elapsed_time": "23:01:39", "remaining_time": "7:24:06"}
|
| 505 |
+
{"current_steps": 505, "total_steps": 666, "loss": 0.3976, "lr": 4.7492269682245465e-06, "epoch": 2.271195957327344, "percentage": 75.83, "elapsed_time": "23:04:20", "remaining_time": "7:21:20"}
|
| 506 |
+
{"current_steps": 506, "total_steps": 666, "loss": 0.3925, "lr": 4.693907626285361e-06, "epoch": 2.2756878158338014, "percentage": 75.98, "elapsed_time": "23:06:56", "remaining_time": "7:18:33"}
|
| 507 |
+
{"current_steps": 507, "total_steps": 666, "loss": 0.4004, "lr": 4.638848177860173e-06, "epoch": 2.2801796743402583, "percentage": 76.13, "elapsed_time": "23:09:43", "remaining_time": "7:15:49"}
|
| 508 |
+
{"current_steps": 508, "total_steps": 666, "loss": 0.4313, "lr": 4.584050137475774e-06, "epoch": 2.2846715328467155, "percentage": 76.28, "elapsed_time": "23:12:31", "remaining_time": "7:13:06"}
|
| 509 |
+
{"current_steps": 509, "total_steps": 666, "loss": 0.3981, "lr": 4.529515012468387e-06, "epoch": 2.2891633913531724, "percentage": 76.43, "elapsed_time": "23:15:24", "remaining_time": "7:10:24"}
|
| 510 |
+
{"current_steps": 510, "total_steps": 666, "loss": 0.409, "lr": 4.475244302942176e-06, "epoch": 2.293655249859629, "percentage": 76.58, "elapsed_time": "23:18:10", "remaining_time": "7:07:40"}
|
| 511 |
+
{"current_steps": 511, "total_steps": 666, "loss": 0.4111, "lr": 4.421239501728004e-06, "epoch": 2.2981471083660865, "percentage": 76.73, "elapsed_time": "23:20:50", "remaining_time": "7:04:54"}
|
| 512 |
+
{"current_steps": 512, "total_steps": 666, "loss": 0.4148, "lr": 4.367502094342358e-06, "epoch": 2.3026389668725433, "percentage": 76.88, "elapsed_time": "23:23:28", "remaining_time": "7:02:08"}
|
| 513 |
+
{"current_steps": 513, "total_steps": 666, "loss": 0.4175, "lr": 4.3140335589464955e-06, "epoch": 2.3071308253790006, "percentage": 77.03, "elapsed_time": "23:26:17", "remaining_time": "6:59:25"}
|
| 514 |
+
{"current_steps": 514, "total_steps": 666, "loss": 0.3954, "lr": 4.260835366305778e-06, "epoch": 2.3116226838854574, "percentage": 77.18, "elapsed_time": "23:29:01", "remaining_time": "6:56:40"}
|
| 515 |
+
{"current_steps": 515, "total_steps": 666, "loss": 0.4029, "lr": 4.2079089797492155e-06, "epoch": 2.3161145423919147, "percentage": 77.33, "elapsed_time": "23:31:41", "remaining_time": "6:53:54"}
|
| 516 |
+
{"current_steps": 516, "total_steps": 666, "loss": 0.3914, "lr": 4.1552558551292194e-06, "epoch": 2.3206064008983716, "percentage": 77.48, "elapsed_time": "23:34:35", "remaining_time": "6:51:13"}
|
| 517 |
+
{"current_steps": 517, "total_steps": 666, "loss": 0.4087, "lr": 4.1028774407815484e-06, "epoch": 2.325098259404829, "percentage": 77.63, "elapsed_time": "23:37:18", "remaining_time": "6:48:28"}
|
| 518 |
+
{"current_steps": 518, "total_steps": 666, "loss": 0.4116, "lr": 4.050775177485476e-06, "epoch": 2.3295901179112857, "percentage": 77.78, "elapsed_time": "23:40:08", "remaining_time": "6:45:45"}
|
| 519 |
+
{"current_steps": 519, "total_steps": 666, "loss": 0.4011, "lr": 3.998950498424157e-06, "epoch": 2.334081976417743, "percentage": 77.93, "elapsed_time": "23:42:42", "remaining_time": "6:42:57"}
|
| 520 |
+
{"current_steps": 520, "total_steps": 666, "loss": 0.3923, "lr": 3.947404829145199e-06, "epoch": 2.3385738349242, "percentage": 78.08, "elapsed_time": "23:45:25", "remaining_time": "6:40:12"}
|
| 521 |
+
{"current_steps": 521, "total_steps": 666, "loss": 0.4405, "lr": 3.896139587521457e-06, "epoch": 2.343065693430657, "percentage": 78.23, "elapsed_time": "23:48:06", "remaining_time": "6:37:27"}
|
| 522 |
+
{"current_steps": 522, "total_steps": 666, "loss": 0.385, "lr": 3.84515618371203e-06, "epoch": 2.347557551937114, "percentage": 78.38, "elapsed_time": "23:50:41", "remaining_time": "6:34:40"}
|
| 523 |
+
{"current_steps": 523, "total_steps": 666, "loss": 0.4128, "lr": 3.794456020123469e-06, "epoch": 2.352049410443571, "percentage": 78.53, "elapsed_time": "23:53:25", "remaining_time": "6:31:55"}
|
| 524 |
+
{"current_steps": 524, "total_steps": 666, "loss": 0.3956, "lr": 3.744040491371204e-06, "epoch": 2.356541268950028, "percentage": 78.68, "elapsed_time": "23:56:01", "remaining_time": "6:29:09"}
|
| 525 |
+
{"current_steps": 525, "total_steps": 666, "loss": 0.4134, "lr": 3.693910984241176e-06, "epoch": 2.3610331274564853, "percentage": 78.83, "elapsed_time": "23:58:52", "remaining_time": "6:26:26"}
|
| 526 |
+
{"current_steps": 526, "total_steps": 666, "loss": 0.3955, "lr": 3.6440688776517076e-06, "epoch": 2.365524985962942, "percentage": 78.98, "elapsed_time": "1 day, 0:01:38", "remaining_time": "6:23:42"}
|
| 527 |
+
{"current_steps": 527, "total_steps": 666, "loss": 0.3952, "lr": 3.5945155426155476e-06, "epoch": 2.370016844469399, "percentage": 79.13, "elapsed_time": "1 day, 0:04:16", "remaining_time": "6:20:56"}
|
| 528 |
+
{"current_steps": 528, "total_steps": 666, "loss": 0.4198, "lr": 3.5452523422021744e-06, "epoch": 2.3745087029758563, "percentage": 79.28, "elapsed_time": "1 day, 0:07:00", "remaining_time": "6:18:11"}
|
| 529 |
+
{"current_steps": 529, "total_steps": 666, "loss": 0.4071, "lr": 3.496280631500304e-06, "epoch": 2.3790005614823135, "percentage": 79.43, "elapsed_time": "1 day, 0:09:42", "remaining_time": "6:15:26"}
|
| 530 |
+
{"current_steps": 530, "total_steps": 666, "loss": 0.4254, "lr": 3.447601757580604e-06, "epoch": 2.3834924199887704, "percentage": 79.58, "elapsed_time": "1 day, 0:12:34", "remaining_time": "6:12:44"}
|
| 531 |
+
{"current_steps": 531, "total_steps": 666, "loss": 0.3874, "lr": 3.399217059458649e-06, "epoch": 2.387984278495227, "percentage": 79.73, "elapsed_time": "1 day, 0:15:17", "remaining_time": "6:09:59"}
|
| 532 |
+
{"current_steps": 532, "total_steps": 666, "loss": 0.4191, "lr": 3.3511278680580843e-06, "epoch": 2.3924761370016845, "percentage": 79.88, "elapsed_time": "1 day, 0:18:05", "remaining_time": "6:07:15"}
|
| 533 |
+
{"current_steps": 533, "total_steps": 666, "loss": 0.3967, "lr": 3.303335506174018e-06, "epoch": 2.3969679955081413, "percentage": 80.03, "elapsed_time": "1 day, 0:20:48", "remaining_time": "6:04:31"}
|
| 534 |
+
{"current_steps": 534, "total_steps": 666, "loss": 0.404, "lr": 3.2558412884366303e-06, "epoch": 2.4014598540145986, "percentage": 80.18, "elapsed_time": "1 day, 0:23:36", "remaining_time": "6:01:47"}
|
| 535 |
+
{"current_steps": 535, "total_steps": 666, "loss": 0.419, "lr": 3.2086465212750174e-06, "epoch": 2.4059517125210554, "percentage": 80.33, "elapsed_time": "1 day, 0:26:29", "remaining_time": "5:59:05"}
|
| 536 |
+
{"current_steps": 536, "total_steps": 666, "loss": 0.4005, "lr": 3.1617525028812533e-06, "epoch": 2.4104435710275127, "percentage": 80.48, "elapsed_time": "1 day, 0:29:16", "remaining_time": "5:56:21"}
|
| 537 |
+
{"current_steps": 537, "total_steps": 666, "loss": 0.4078, "lr": 3.115160523174681e-06, "epoch": 2.4149354295339696, "percentage": 80.63, "elapsed_time": "1 day, 0:32:03", "remaining_time": "5:53:37"}
|
| 538 |
+
{"current_steps": 538, "total_steps": 666, "loss": 0.4163, "lr": 3.0688718637664205e-06, "epoch": 2.419427288040427, "percentage": 80.78, "elapsed_time": "1 day, 0:34:43", "remaining_time": "5:50:51"}
|
| 539 |
+
{"current_steps": 539, "total_steps": 666, "loss": 0.3743, "lr": 3.0228877979241345e-06, "epoch": 2.4239191465468837, "percentage": 80.93, "elapsed_time": "1 day, 0:37:18", "remaining_time": "5:48:05"}
|
| 540 |
+
{"current_steps": 540, "total_steps": 666, "loss": 0.4152, "lr": 2.9772095905369913e-06, "epoch": 2.428411005053341, "percentage": 81.08, "elapsed_time": "1 day, 0:40:07", "remaining_time": "5:45:21"}
|
| 541 |
+
{"current_steps": 541, "total_steps": 666, "loss": 0.4059, "lr": 2.9318384980808727e-06, "epoch": 2.432902863559798, "percentage": 81.23, "elapsed_time": "1 day, 0:43:06", "remaining_time": "5:42:40"}
|
| 542 |
+
{"current_steps": 542, "total_steps": 666, "loss": 0.3939, "lr": 2.8867757685838118e-06, "epoch": 2.437394722066255, "percentage": 81.38, "elapsed_time": "1 day, 0:45:50", "remaining_time": "5:39:55"}
|
| 543 |
+
{"current_steps": 543, "total_steps": 666, "loss": 0.3997, "lr": 2.8420226415916757e-06, "epoch": 2.441886580572712, "percentage": 81.53, "elapsed_time": "1 day, 0:48:37", "remaining_time": "5:37:12"}
|
| 544 |
+
{"current_steps": 544, "total_steps": 666, "loss": 0.4023, "lr": 2.7975803481340463e-06, "epoch": 2.446378439079169, "percentage": 81.68, "elapsed_time": "1 day, 0:51:29", "remaining_time": "5:34:29"}
|
| 545 |
+
{"current_steps": 545, "total_steps": 666, "loss": 0.4052, "lr": 2.753450110690375e-06, "epoch": 2.450870297585626, "percentage": 81.83, "elapsed_time": "1 day, 0:54:05", "remaining_time": "5:31:42"}
|
| 546 |
+
{"current_steps": 546, "total_steps": 666, "loss": 0.3799, "lr": 2.709633143156353e-06, "epoch": 2.4553621560920833, "percentage": 81.98, "elapsed_time": "1 day, 0:56:45", "remaining_time": "5:28:57"}
|
| 547 |
+
{"current_steps": 547, "total_steps": 666, "loss": 0.4042, "lr": 2.666130650810515e-06, "epoch": 2.45985401459854, "percentage": 82.13, "elapsed_time": "1 day, 0:59:28", "remaining_time": "5:26:12"}
|
| 548 |
+
{"current_steps": 548, "total_steps": 666, "loss": 0.4253, "lr": 2.6229438302810933e-06, "epoch": 2.464345873104997, "percentage": 82.28, "elapsed_time": "1 day, 1:02:12", "remaining_time": "5:23:28"}
|
| 549 |
+
{"current_steps": 549, "total_steps": 666, "loss": 0.3916, "lr": 2.580073869513094e-06, "epoch": 2.4688377316114543, "percentage": 82.43, "elapsed_time": "1 day, 1:04:59", "remaining_time": "5:20:44"}
|
| 550 |
+
{"current_steps": 550, "total_steps": 666, "loss": 0.4193, "lr": 2.5375219477356294e-06, "epoch": 2.473329590117911, "percentage": 82.58, "elapsed_time": "1 day, 1:07:32", "remaining_time": "5:17:57"}
|
| 551 |
+
{"current_steps": 551, "total_steps": 666, "loss": 0.4168, "lr": 2.4952892354294682e-06, "epoch": 2.4778214486243684, "percentage": 82.73, "elapsed_time": "1 day, 1:10:28", "remaining_time": "5:15:15"}
|
| 552 |
+
{"current_steps": 552, "total_steps": 666, "loss": 0.3986, "lr": 2.4533768942948534e-06, "epoch": 2.482313307130825, "percentage": 82.88, "elapsed_time": "1 day, 1:13:14", "remaining_time": "5:12:31"}
|
| 553 |
+
{"current_steps": 553, "total_steps": 666, "loss": 0.4066, "lr": 2.4117860772195375e-06, "epoch": 2.4868051656372825, "percentage": 83.03, "elapsed_time": "1 day, 1:16:04", "remaining_time": "5:09:47"}
|
| 554 |
+
{"current_steps": 554, "total_steps": 666, "loss": 0.3951, "lr": 2.3705179282470687e-06, "epoch": 2.4912970241437393, "percentage": 83.18, "elapsed_time": "1 day, 1:18:44", "remaining_time": "5:07:02"}
|
| 555 |
+
{"current_steps": 555, "total_steps": 666, "loss": 0.4096, "lr": 2.329573582545332e-06, "epoch": 2.4957888826501966, "percentage": 83.33, "elapsed_time": "1 day, 1:21:24", "remaining_time": "5:04:16"}
|
| 556 |
+
{"current_steps": 556, "total_steps": 666, "loss": 0.3814, "lr": 2.288954166375312e-06, "epoch": 2.5002807411566534, "percentage": 83.48, "elapsed_time": "1 day, 1:23:54", "remaining_time": "5:01:29"}
|
| 557 |
+
{"current_steps": 557, "total_steps": 666, "loss": 0.4286, "lr": 2.2486607970601196e-06, "epoch": 2.5047725996631107, "percentage": 83.63, "elapsed_time": "1 day, 1:26:34", "remaining_time": "4:58:44"}
|
| 558 |
+
{"current_steps": 558, "total_steps": 666, "loss": 0.375, "lr": 2.2086945829542548e-06, "epoch": 2.5092644581695676, "percentage": 83.78, "elapsed_time": "1 day, 1:29:11", "remaining_time": "4:55:58"}
|
| 559 |
+
{"current_steps": 559, "total_steps": 666, "loss": 0.3948, "lr": 2.1690566234131268e-06, "epoch": 2.513756316676025, "percentage": 83.93, "elapsed_time": "1 day, 1:31:52", "remaining_time": "4:53:13"}
|
| 560 |
+
{"current_steps": 560, "total_steps": 666, "loss": 0.4195, "lr": 2.1297480087628017e-06, "epoch": 2.5182481751824817, "percentage": 84.08, "elapsed_time": "1 day, 1:34:37", "remaining_time": "4:50:28"}
|
| 561 |
+
{"current_steps": 561, "total_steps": 666, "loss": 0.394, "lr": 2.090769820270016e-06, "epoch": 2.522740033688939, "percentage": 84.23, "elapsed_time": "1 day, 1:37:14", "remaining_time": "4:47:43"}
|
| 562 |
+
{"current_steps": 562, "total_steps": 666, "loss": 0.4015, "lr": 2.0521231301124356e-06, "epoch": 2.527231892195396, "percentage": 84.38, "elapsed_time": "1 day, 1:40:01", "remaining_time": "4:44:59"}
|
| 563 |
+
{"current_steps": 563, "total_steps": 666, "loss": 0.39, "lr": 2.013809001349163e-06, "epoch": 2.531723750701853, "percentage": 84.53, "elapsed_time": "1 day, 1:42:46", "remaining_time": "4:42:14"}
|
| 564 |
+
{"current_steps": 564, "total_steps": 666, "loss": 0.4132, "lr": 1.9758284878914944e-06, "epoch": 2.53621560920831, "percentage": 84.68, "elapsed_time": "1 day, 1:45:32", "remaining_time": "4:39:30"}
|
| 565 |
+
{"current_steps": 565, "total_steps": 666, "loss": 0.4211, "lr": 1.9381826344739317e-06, "epoch": 2.5407074677147667, "percentage": 84.83, "elapsed_time": "1 day, 1:48:12", "remaining_time": "4:36:45"}
|
| 566 |
+
{"current_steps": 566, "total_steps": 666, "loss": 0.4131, "lr": 1.9008724766254398e-06, "epoch": 2.545199326221224, "percentage": 84.98, "elapsed_time": "1 day, 1:50:56", "remaining_time": "4:34:01"}
|
| 567 |
+
{"current_steps": 567, "total_steps": 666, "loss": 0.3899, "lr": 1.8638990406409697e-06, "epoch": 2.5496911847276813, "percentage": 85.14, "elapsed_time": "1 day, 1:53:36", "remaining_time": "4:31:15"}
|
| 568 |
+
{"current_steps": 568, "total_steps": 666, "loss": 0.3861, "lr": 1.8272633435532205e-06, "epoch": 2.554183043234138, "percentage": 85.29, "elapsed_time": "1 day, 1:56:16", "remaining_time": "4:28:30"}
|
| 569 |
+
{"current_steps": 569, "total_steps": 666, "loss": 0.4472, "lr": 1.7909663931046709e-06, "epoch": 2.558674901740595, "percentage": 85.44, "elapsed_time": "1 day, 1:58:54", "remaining_time": "4:25:45"}
|
| 570 |
+
{"current_steps": 570, "total_steps": 666, "loss": 0.3958, "lr": 1.7550091877198515e-06, "epoch": 2.5631667602470523, "percentage": 85.59, "elapsed_time": "1 day, 2:01:37", "remaining_time": "4:23:00"}
|
| 571 |
+
{"current_steps": 571, "total_steps": 666, "loss": 0.3979, "lr": 1.719392716477887e-06, "epoch": 2.5676586187535095, "percentage": 85.74, "elapsed_time": "1 day, 2:04:22", "remaining_time": "4:20:16"}
|
| 572 |
+
{"current_steps": 572, "total_steps": 666, "loss": 0.4047, "lr": 1.6841179590852887e-06, "epoch": 2.5721504772599664, "percentage": 85.89, "elapsed_time": "1 day, 2:07:03", "remaining_time": "4:17:31"}
|
| 573 |
+
{"current_steps": 573, "total_steps": 666, "loss": 0.3919, "lr": 1.6491858858490027e-06, "epoch": 2.576642335766423, "percentage": 86.04, "elapsed_time": "1 day, 2:09:37", "remaining_time": "4:14:45"}
|
| 574 |
+
{"current_steps": 574, "total_steps": 666, "loss": 0.4361, "lr": 1.614597457649723e-06, "epoch": 2.5811341942728805, "percentage": 86.19, "elapsed_time": "1 day, 2:12:24", "remaining_time": "4:12:01"}
|
| 575 |
+
{"current_steps": 575, "total_steps": 666, "loss": 0.3871, "lr": 1.5803536259154552e-06, "epoch": 2.5856260527793373, "percentage": 86.34, "elapsed_time": "1 day, 2:15:06", "remaining_time": "4:09:16"}
|
| 576 |
+
{"current_steps": 576, "total_steps": 666, "loss": 0.4031, "lr": 1.546455332595352e-06, "epoch": 2.5901179112857946, "percentage": 86.49, "elapsed_time": "1 day, 2:17:55", "remaining_time": "4:06:32"}
|
| 577 |
+
{"current_steps": 577, "total_steps": 666, "loss": 0.41, "lr": 1.5129035101338013e-06, "epoch": 2.5946097697922514, "percentage": 86.64, "elapsed_time": "1 day, 2:20:39", "remaining_time": "4:03:48"}
|
| 578 |
+
{"current_steps": 578, "total_steps": 666, "loss": 0.3911, "lr": 1.479699081444771e-06, "epoch": 2.5991016282987087, "percentage": 86.79, "elapsed_time": "1 day, 2:23:19", "remaining_time": "4:01:03"}
|
| 579 |
+
{"current_steps": 579, "total_steps": 666, "loss": 0.4091, "lr": 1.44684295988643e-06, "epoch": 2.6035934868051656, "percentage": 86.94, "elapsed_time": "1 day, 2:26:10", "remaining_time": "3:58:20"}
|
| 580 |
+
{"current_steps": 580, "total_steps": 666, "loss": 0.4048, "lr": 1.4143360492360238e-06, "epoch": 2.608085345311623, "percentage": 87.09, "elapsed_time": "1 day, 2:28:59", "remaining_time": "3:55:36"}
|
| 581 |
+
{"current_steps": 581, "total_steps": 666, "loss": 0.4065, "lr": 1.3821792436650067e-06, "epoch": 2.6125772038180797, "percentage": 87.24, "elapsed_time": "1 day, 2:31:34", "remaining_time": "3:52:50"}
|
| 582 |
+
{"current_steps": 582, "total_steps": 666, "loss": 0.4163, "lr": 1.350373427714457e-06, "epoch": 2.6170690623245365, "percentage": 87.39, "elapsed_time": "1 day, 2:34:20", "remaining_time": "3:50:06"}
|
| 583 |
+
{"current_steps": 583, "total_steps": 666, "loss": 0.3724, "lr": 1.3189194762707326e-06, "epoch": 2.621560920830994, "percentage": 87.54, "elapsed_time": "1 day, 2:37:11", "remaining_time": "3:47:23"}
|
| 584 |
+
{"current_steps": 584, "total_steps": 666, "loss": 0.4149, "lr": 1.2878182545414191e-06, "epoch": 2.626052779337451, "percentage": 87.69, "elapsed_time": "1 day, 2:40:02", "remaining_time": "3:44:39"}
|
| 585 |
+
{"current_steps": 585, "total_steps": 666, "loss": 0.3933, "lr": 1.2570706180315225e-06, "epoch": 2.630544637843908, "percentage": 87.84, "elapsed_time": "1 day, 2:42:43", "remaining_time": "3:41:55"}
|
| 586 |
+
{"current_steps": 586, "total_steps": 666, "loss": 0.4214, "lr": 1.2266774125199337e-06, "epoch": 2.6350364963503647, "percentage": 87.99, "elapsed_time": "1 day, 2:45:35", "remaining_time": "3:39:11"}
|
| 587 |
+
{"current_steps": 587, "total_steps": 666, "loss": 0.4042, "lr": 1.1966394740361719e-06, "epoch": 2.639528354856822, "percentage": 88.14, "elapsed_time": "1 day, 2:48:11", "remaining_time": "3:36:26"}
|
| 588 |
+
{"current_steps": 588, "total_steps": 666, "loss": 0.4081, "lr": 1.1669576288373846e-06, "epoch": 2.6440202133632793, "percentage": 88.29, "elapsed_time": "1 day, 2:51:00", "remaining_time": "3:33:42"}
|
| 589 |
+
{"current_steps": 589, "total_steps": 666, "loss": 0.3906, "lr": 1.1376326933856181e-06, "epoch": 2.648512071869736, "percentage": 88.44, "elapsed_time": "1 day, 2:53:42", "remaining_time": "3:30:57"}
|
| 590 |
+
{"current_steps": 590, "total_steps": 666, "loss": 0.4137, "lr": 1.1086654743253583e-06, "epoch": 2.653003930376193, "percentage": 88.59, "elapsed_time": "1 day, 2:56:30", "remaining_time": "3:28:13"}
|
| 591 |
+
{"current_steps": 591, "total_steps": 666, "loss": 0.4087, "lr": 1.0800567684613445e-06, "epoch": 2.6574957888826503, "percentage": 88.74, "elapsed_time": "1 day, 2:59:20", "remaining_time": "3:25:29"}
|
| 592 |
+
{"current_steps": 592, "total_steps": 666, "loss": 0.4019, "lr": 1.0518073627366485e-06, "epoch": 2.661987647389107, "percentage": 88.89, "elapsed_time": "1 day, 3:02:03", "remaining_time": "3:22:45"}
|
| 593 |
+
{"current_steps": 593, "total_steps": 666, "loss": 0.3952, "lr": 1.0239180342110379e-06, "epoch": 2.6664795058955644, "percentage": 89.04, "elapsed_time": "1 day, 3:04:48", "remaining_time": "3:20:01"}
|
| 594 |
+
{"current_steps": 594, "total_steps": 666, "loss": 0.4065, "lr": 9.963895500395894e-07, "epoch": 2.670971364402021, "percentage": 89.19, "elapsed_time": "1 day, 3:07:35", "remaining_time": "3:17:17"}
|
| 595 |
+
{"current_steps": 595, "total_steps": 666, "loss": 0.4102, "lr": 9.692226674515869e-07, "epoch": 2.6754632229084785, "percentage": 89.34, "elapsed_time": "1 day, 3:10:23", "remaining_time": "3:14:33"}
|
| 596 |
+
{"current_steps": 596, "total_steps": 666, "loss": 0.402, "lr": 9.424181337297035e-07, "epoch": 2.6799550814149353, "percentage": 89.49, "elapsed_time": "1 day, 3:13:10", "remaining_time": "3:11:49"}
|
| 597 |
+
{"current_steps": 597, "total_steps": 666, "loss": 0.4067, "lr": 9.159766861894357e-07, "epoch": 2.6844469399213926, "percentage": 89.64, "elapsed_time": "1 day, 3:16:00", "remaining_time": "3:09:05"}
|
| 598 |
+
{"current_steps": 598, "total_steps": 666, "loss": 0.395, "lr": 8.89899052158824e-07, "epoch": 2.6889387984278494, "percentage": 89.79, "elapsed_time": "1 day, 3:18:43", "remaining_time": "3:06:20"}
|
| 599 |
+
{"current_steps": 599, "total_steps": 666, "loss": 0.4073, "lr": 8.641859489584498e-07, "epoch": 2.6934306569343067, "percentage": 89.94, "elapsed_time": "1 day, 3:21:30", "remaining_time": "3:03:36"}
|
| 600 |
+
{"current_steps": 600, "total_steps": 666, "loss": 0.387, "lr": 8.388380838817022e-07, "epoch": 2.6979225154407636, "percentage": 90.09, "elapsed_time": "1 day, 3:24:12", "remaining_time": "3:00:51"}
|
| 601 |
+
{"current_steps": 601, "total_steps": 666, "loss": 0.411, "lr": 8.138561541753177e-07, "epoch": 2.702414373947221, "percentage": 90.24, "elapsed_time": "1 day, 3:26:54", "remaining_time": "2:58:07"}
|
| 602 |
+
{"current_steps": 602, "total_steps": 666, "loss": 0.3968, "lr": 7.892408470202099e-07, "epoch": 2.7069062324536777, "percentage": 90.39, "elapsed_time": "1 day, 3:29:42", "remaining_time": "2:55:23"}
|
| 603 |
+
{"current_steps": 603, "total_steps": 666, "loss": 0.4057, "lr": 7.649928395125592e-07, "epoch": 2.7113980909601345, "percentage": 90.54, "elapsed_time": "1 day, 3:32:36", "remaining_time": "2:52:39"}
|
| 604 |
+
{"current_steps": 604, "total_steps": 666, "loss": 0.4037, "lr": 7.411127986451912e-07, "epoch": 2.715889949466592, "percentage": 90.69, "elapsed_time": "1 day, 3:35:23", "remaining_time": "2:49:55"}
|
| 605 |
+
{"current_steps": 605, "total_steps": 666, "loss": 0.4194, "lr": 7.176013812892307e-07, "epoch": 2.720381807973049, "percentage": 90.84, "elapsed_time": "1 day, 3:38:08", "remaining_time": "2:47:11"}
|
| 606 |
+
{"current_steps": 606, "total_steps": 666, "loss": 0.3818, "lr": 6.944592341760311e-07, "epoch": 2.724873666479506, "percentage": 90.99, "elapsed_time": "1 day, 3:40:50", "remaining_time": "2:44:26"}
|
| 607 |
+
{"current_steps": 607, "total_steps": 666, "loss": 0.3984, "lr": 6.716869938793857e-07, "epoch": 2.7293655249859627, "percentage": 91.14, "elapsed_time": "1 day, 3:43:29", "remaining_time": "2:41:41"}
|
| 608 |
+
{"current_steps": 608, "total_steps": 666, "loss": 0.398, "lr": 6.492852867980155e-07, "epoch": 2.73385738349242, "percentage": 91.29, "elapsed_time": "1 day, 3:46:09", "remaining_time": "2:38:56"}
|
| 609 |
+
{"current_steps": 609, "total_steps": 666, "loss": 0.4086, "lr": 6.272547291383403e-07, "epoch": 2.7383492419988773, "percentage": 91.44, "elapsed_time": "1 day, 3:48:40", "remaining_time": "2:36:10"}
|
| 610 |
+
{"current_steps": 610, "total_steps": 666, "loss": 0.4031, "lr": 6.055959268975332e-07, "epoch": 2.742841100505334, "percentage": 91.59, "elapsed_time": "1 day, 3:51:13", "remaining_time": "2:33:25"}
|
| 611 |
+
{"current_steps": 611, "total_steps": 666, "loss": 0.3861, "lr": 5.843094758468389e-07, "epoch": 2.747332959011791, "percentage": 91.74, "elapsed_time": "1 day, 3:54:03", "remaining_time": "2:30:41"}
|
| 612 |
+
{"current_steps": 612, "total_steps": 666, "loss": 0.4037, "lr": 5.633959615152007e-07, "epoch": 2.7518248175182483, "percentage": 91.89, "elapsed_time": "1 day, 3:56:46", "remaining_time": "2:27:57"}
|
| 613 |
+
{"current_steps": 613, "total_steps": 666, "loss": 0.3994, "lr": 5.428559591731436e-07, "epoch": 2.756316676024705, "percentage": 92.04, "elapsed_time": "1 day, 3:59:28", "remaining_time": "2:25:12"}
|
| 614 |
+
{"current_steps": 614, "total_steps": 666, "loss": 0.3973, "lr": 5.226900338169552e-07, "epoch": 2.7608085345311624, "percentage": 92.19, "elapsed_time": "1 day, 4:02:09", "remaining_time": "2:22:27"}
|
| 615 |
+
{"current_steps": 615, "total_steps": 666, "loss": 0.4056, "lr": 5.028987401531437e-07, "epoch": 2.765300393037619, "percentage": 92.34, "elapsed_time": "1 day, 4:04:44", "remaining_time": "2:19:42"}
|
| 616 |
+
{"current_steps": 616, "total_steps": 666, "loss": 0.3863, "lr": 4.834826225831736e-07, "epoch": 2.7697922515440765, "percentage": 92.49, "elapsed_time": "1 day, 4:07:29", "remaining_time": "2:16:58"}
|
| 617 |
+
{"current_steps": 617, "total_steps": 666, "loss": 0.4194, "lr": 4.644422151885038e-07, "epoch": 2.7742841100505333, "percentage": 92.64, "elapsed_time": "1 day, 4:10:17", "remaining_time": "2:14:14"}
|
| 618 |
+
{"current_steps": 618, "total_steps": 666, "loss": 0.4066, "lr": 4.457780417158842e-07, "epoch": 2.7787759685569906, "percentage": 92.79, "elapsed_time": "1 day, 4:13:07", "remaining_time": "2:11:30"}
|
| 619 |
+
{"current_steps": 619, "total_steps": 666, "loss": 0.4004, "lr": 4.274906155629513e-07, "epoch": 2.7832678270634474, "percentage": 92.94, "elapsed_time": "1 day, 4:15:48", "remaining_time": "2:08:45"}
|
| 620 |
+
{"current_steps": 620, "total_steps": 666, "loss": 0.3835, "lr": 4.095804397641149e-07, "epoch": 2.7877596855699043, "percentage": 93.09, "elapsed_time": "1 day, 4:18:17", "remaining_time": "2:06:00"}
|
| 621 |
+
{"current_steps": 621, "total_steps": 666, "loss": 0.4147, "lr": 3.9204800697670965e-07, "epoch": 2.7922515440763616, "percentage": 93.24, "elapsed_time": "1 day, 4:20:53", "remaining_time": "2:03:15"}
|
| 622 |
+
{"current_steps": 622, "total_steps": 666, "loss": 0.4056, "lr": 3.7489379946744694e-07, "epoch": 2.796743402582819, "percentage": 93.39, "elapsed_time": "1 day, 4:23:43", "remaining_time": "2:00:31"}
|
| 623 |
+
{"current_steps": 623, "total_steps": 666, "loss": 0.4149, "lr": 3.5811828909915534e-07, "epoch": 2.8012352610892757, "percentage": 93.54, "elapsed_time": "1 day, 4:26:22", "remaining_time": "1:57:46"}
|
| 624 |
+
{"current_steps": 624, "total_steps": 666, "loss": 0.3966, "lr": 3.417219373177928e-07, "epoch": 2.8057271195957325, "percentage": 93.69, "elapsed_time": "1 day, 4:29:03", "remaining_time": "1:55:01"}
|
| 625 |
+
{"current_steps": 625, "total_steps": 666, "loss": 0.3997, "lr": 3.257051951397572e-07, "epoch": 2.81021897810219, "percentage": 93.84, "elapsed_time": "1 day, 4:31:58", "remaining_time": "1:52:18"}
|
| 626 |
+
{"current_steps": 626, "total_steps": 666, "loss": 0.4033, "lr": 3.1006850313948107e-07, "epoch": 2.814710836608647, "percentage": 93.99, "elapsed_time": "1 day, 4:34:47", "remaining_time": "1:49:34"}
|
| 627 |
+
{"current_steps": 627, "total_steps": 666, "loss": 0.3886, "lr": 2.9481229143731197e-07, "epoch": 2.819202695115104, "percentage": 94.14, "elapsed_time": "1 day, 4:37:36", "remaining_time": "1:46:50"}
|
| 628 |
+
{"current_steps": 628, "total_steps": 666, "loss": 0.4158, "lr": 2.7993697968767725e-07, "epoch": 2.8236945536215607, "percentage": 94.29, "elapsed_time": "1 day, 4:40:28", "remaining_time": "1:44:06"}
|
| 629 |
+
{"current_steps": 629, "total_steps": 666, "loss": 0.4068, "lr": 2.6544297706754683e-07, "epoch": 2.828186412128018, "percentage": 94.44, "elapsed_time": "1 day, 4:43:06", "remaining_time": "1:41:21"}
|
| 630 |
+
{"current_steps": 630, "total_steps": 666, "loss": 0.398, "lr": 2.5133068226517584e-07, "epoch": 2.832678270634475, "percentage": 94.59, "elapsed_time": "1 day, 4:45:55", "remaining_time": "1:38:37"}
|
| 631 |
+
{"current_steps": 631, "total_steps": 666, "loss": 0.4131, "lr": 2.3760048346913432e-07, "epoch": 2.837170129140932, "percentage": 94.74, "elapsed_time": "1 day, 4:48:42", "remaining_time": "1:35:53"}
|
| 632 |
+
{"current_steps": 632, "total_steps": 666, "loss": 0.3974, "lr": 2.2425275835763363e-07, "epoch": 2.841661987647389, "percentage": 94.89, "elapsed_time": "1 day, 4:51:35", "remaining_time": "1:33:09"}
|
| 633 |
+
{"current_steps": 633, "total_steps": 666, "loss": 0.4061, "lr": 2.1128787408813722e-07, "epoch": 2.8461538461538463, "percentage": 95.05, "elapsed_time": "1 day, 4:54:21", "remaining_time": "1:30:25"}
|
| 634 |
+
{"current_steps": 634, "total_steps": 666, "loss": 0.4119, "lr": 1.9870618728725558e-07, "epoch": 2.850645704660303, "percentage": 95.2, "elapsed_time": "1 day, 4:57:05", "remaining_time": "1:27:40"}
|
| 635 |
+
{"current_steps": 635, "total_steps": 666, "loss": 0.4165, "lr": 1.8650804404094718e-07, "epoch": 2.8551375631667604, "percentage": 95.35, "elapsed_time": "1 day, 4:59:55", "remaining_time": "1:24:56"}
|
| 636 |
+
{"current_steps": 636, "total_steps": 666, "loss": 0.3936, "lr": 1.7469377988498657e-07, "epoch": 2.859629421673217, "percentage": 95.5, "elapsed_time": "1 day, 5:02:42", "remaining_time": "1:22:12"}
|
| 637 |
+
{"current_steps": 637, "total_steps": 666, "loss": 0.3946, "lr": 1.632637197957446e-07, "epoch": 2.8641212801796745, "percentage": 95.65, "elapsed_time": "1 day, 5:05:25", "remaining_time": "1:19:27"}
|
| 638 |
+
{"current_steps": 638, "total_steps": 666, "loss": 0.4082, "lr": 1.522181781812407e-07, "epoch": 2.8686131386861313, "percentage": 95.8, "elapsed_time": "1 day, 5:08:07", "remaining_time": "1:16:43"}
|
| 639 |
+
{"current_steps": 639, "total_steps": 666, "loss": 0.4165, "lr": 1.415574588725056e-07, "epoch": 2.8731049971925886, "percentage": 95.95, "elapsed_time": "1 day, 5:10:59", "remaining_time": "1:13:59"}
|
| 640 |
+
{"current_steps": 640, "total_steps": 666, "loss": 0.3951, "lr": 1.3128185511520974e-07, "epoch": 2.8775968556990454, "percentage": 96.1, "elapsed_time": "1 day, 5:13:49", "remaining_time": "1:11:14"}
|
| 641 |
+
{"current_steps": 641, "total_steps": 666, "loss": 0.3838, "lr": 1.2139164956160858e-07, "epoch": 2.8820887142055023, "percentage": 96.25, "elapsed_time": "1 day, 5:16:42", "remaining_time": "1:08:30"}
|
| 642 |
+
{"current_steps": 642, "total_steps": 666, "loss": 0.4242, "lr": 1.1188711426276294e-07, "epoch": 2.8865805727119596, "percentage": 96.4, "elapsed_time": "1 day, 5:19:35", "remaining_time": "1:05:46"}
|
| 643 |
+
{"current_steps": 643, "total_steps": 666, "loss": 0.3999, "lr": 1.0276851066105732e-07, "epoch": 2.891072431218417, "percentage": 96.55, "elapsed_time": "1 day, 5:22:18", "remaining_time": "1:03:02"}
|
| 644 |
+
{"current_steps": 644, "total_steps": 666, "loss": 0.3986, "lr": 9.403608958300276e-08, "epoch": 2.8955642897248737, "percentage": 96.7, "elapsed_time": "1 day, 5:24:55", "remaining_time": "1:00:17"}
|
| 645 |
+
{"current_steps": 645, "total_steps": 666, "loss": 0.4052, "lr": 8.569009123234562e-08, "epoch": 2.9000561482313305, "percentage": 96.85, "elapsed_time": "1 day, 5:27:36", "remaining_time": "0:57:32"}
|
| 646 |
+
{"current_steps": 646, "total_steps": 666, "loss": 0.4053, "lr": 7.773074518345438e-08, "epoch": 2.904548006737788, "percentage": 97.0, "elapsed_time": "1 day, 5:30:21", "remaining_time": "0:54:48"}
|
| 647 |
+
{"current_steps": 647, "total_steps": 666, "loss": 0.393, "lr": 7.015827037500785e-08, "epoch": 2.909039865244245, "percentage": 97.15, "elapsed_time": "1 day, 5:32:59", "remaining_time": "0:52:03"}
|
| 648 |
+
{"current_steps": 648, "total_steps": 666, "loss": 0.4043, "lr": 6.297287510397075e-08, "epoch": 2.913531723750702, "percentage": 97.3, "elapsed_time": "1 day, 5:35:49", "remaining_time": "0:49:19"}
|
| 649 |
+
{"current_steps": 649, "total_steps": 666, "loss": 0.4062, "lr": 5.6174757019866e-08, "epoch": 2.9180235822571587, "percentage": 97.45, "elapsed_time": "1 day, 5:38:26", "remaining_time": "0:46:35"}
|
| 650 |
+
{"current_steps": 650, "total_steps": 666, "loss": 0.4024, "lr": 4.976410311933432e-08, "epoch": 2.922515440763616, "percentage": 97.6, "elapsed_time": "1 day, 5:41:11", "remaining_time": "0:43:50"}
|
| 651 |
+
{"current_steps": 651, "total_steps": 666, "loss": 0.4023, "lr": 4.3741089740998524e-08, "epoch": 2.927007299270073, "percentage": 97.75, "elapsed_time": "1 day, 5:44:03", "remaining_time": "0:41:06"}
|
| 652 |
+
{"current_steps": 652, "total_steps": 666, "loss": 0.3967, "lr": 3.810588256060089e-08, "epoch": 2.93149915777653, "percentage": 97.9, "elapsed_time": "1 day, 5:46:45", "remaining_time": "0:38:21"}
|
| 653 |
+
{"current_steps": 653, "total_steps": 666, "loss": 0.4006, "lr": 3.2858636586456185e-08, "epoch": 2.935991016282987, "percentage": 98.05, "elapsed_time": "1 day, 5:49:35", "remaining_time": "0:35:37"}
|
| 654 |
+
{"current_steps": 654, "total_steps": 666, "loss": 0.39, "lr": 2.7999496155184166e-08, "epoch": 2.9404828747894443, "percentage": 98.2, "elapsed_time": "1 day, 5:52:22", "remaining_time": "0:32:53"}
|
| 655 |
+
{"current_steps": 655, "total_steps": 666, "loss": 0.3861, "lr": 2.3528594927737242e-08, "epoch": 2.944974733295901, "percentage": 98.35, "elapsed_time": "1 day, 5:55:11", "remaining_time": "0:30:08"}
|
| 656 |
+
{"current_steps": 656, "total_steps": 666, "loss": 0.4219, "lr": 1.9446055885728008e-08, "epoch": 2.9494665918023584, "percentage": 98.5, "elapsed_time": "1 day, 5:57:52", "remaining_time": "0:27:24"}
|
| 657 |
+
{"current_steps": 657, "total_steps": 666, "loss": 0.3958, "lr": 1.5751991328044162e-08, "epoch": 2.953958450308815, "percentage": 98.65, "elapsed_time": "1 day, 6:00:39", "remaining_time": "0:24:39"}
|
| 658 |
+
{"current_steps": 658, "total_steps": 666, "loss": 0.4025, "lr": 1.2446502867756959e-08, "epoch": 2.958450308815272, "percentage": 98.8, "elapsed_time": "1 day, 6:03:26", "remaining_time": "0:21:55"}
|
| 659 |
+
{"current_steps": 659, "total_steps": 666, "loss": 0.4144, "lr": 9.529681429332745e-09, "epoch": 2.9629421673217293, "percentage": 98.95, "elapsed_time": "1 day, 6:06:04", "remaining_time": "0:19:11"}
|
| 660 |
+
{"current_steps": 660, "total_steps": 666, "loss": 0.3971, "lr": 7.0016072461239484e-09, "epoch": 2.9674340258281866, "percentage": 99.1, "elapsed_time": "1 day, 6:08:43", "remaining_time": "0:16:26"}
|
| 661 |
+
{"current_steps": 661, "total_steps": 666, "loss": 0.4035, "lr": 4.862349858167804e-09, "epoch": 2.9719258843346434, "percentage": 99.25, "elapsed_time": "1 day, 6:11:34", "remaining_time": "0:13:42"}
|
| 662 |
+
{"current_steps": 662, "total_steps": 666, "loss": 0.4031, "lr": 3.111968110273985e-09, "epoch": 2.9764177428411003, "percentage": 99.4, "elapsed_time": "1 day, 6:14:33", "remaining_time": "0:10:57"}
|
| 663 |
+
{"current_steps": 663, "total_steps": 666, "loss": 0.4044, "lr": 1.7505101503979872e-09, "epoch": 2.9809096013475576, "percentage": 99.55, "elapsed_time": "1 day, 6:17:21", "remaining_time": "0:08:13"}
|
| 664 |
+
{"current_steps": 664, "total_steps": 666, "loss": 0.3951, "lr": 7.780134283285303e-10, "epoch": 2.985401459854015, "percentage": 99.7, "elapsed_time": "1 day, 6:20:03", "remaining_time": "0:05:28"}
|
| 665 |
+
{"current_steps": 665, "total_steps": 666, "loss": 0.3995, "lr": 1.945046946481569e-10, "epoch": 2.9898933183604717, "percentage": 99.85, "elapsed_time": "1 day, 6:22:48", "remaining_time": "0:02:44"}
|
| 666 |
+
{"current_steps": 666, "total_steps": 666, "loss": 0.4058, "lr": 0.0, "epoch": 2.9943851768669285, "percentage": 100.0, "elapsed_time": "1 day, 6:25:39", "remaining_time": "0:00:00"}
|
| 667 |
+
{"current_steps": 666, "total_steps": 666, "epoch": 2.9943851768669285, "percentage": 100.0, "elapsed_time": "1 day, 6:27:11", "remaining_time": "0:00:00"}
|