Training in progress, epoch 2
Browse files
model-00001-of-00004.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 4877660776
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:ff55cf75993fedcbb082851fd57e1de34e2db70b50a5f40440ecdee32963097e
|
| 3 |
size 4877660776
|
model-00002-of-00004.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 4932751008
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:eb73fdfd88f7be3e17d27796ab542fd51314a0f5b1fbcec5b512a8658934c568
|
| 3 |
size 4932751008
|
model-00003-of-00004.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 4330865200
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:879342511f1193ad25de7b1b792cd191f42b9f64161c8f491016992562ccd454
|
| 3 |
size 4330865200
|
model-00004-of-00004.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 1089994880
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:557c07aa37a376288098ee59c8a7f8669c5582fefaf0f32f86f5f29d77e9ba4e
|
| 3 |
size 1089994880
|
trainer_log.jsonl
CHANGED
|
@@ -443,3 +443,225 @@
|
|
| 443 |
{"current_steps": 443, "total_steps": 666, "loss": 0.4103, "lr": 2.4378265094203597e-05, "epoch": 1.9912970241437393, "percentage": 66.52, "elapsed_time": "20:13:31", "remaining_time": "10:10:52"}
|
| 444 |
{"current_steps": 444, "total_steps": 666, "loss": 0.3956, "lr": 2.418535218019723e-05, "epoch": 1.9957888826501966, "percentage": 66.67, "elapsed_time": "20:16:19", "remaining_time": "10:08:09"}
|
| 445 |
{"current_steps": 445, "total_steps": 666, "loss": 0.6375, "lr": 2.3992874281589192e-05, "epoch": 2.0016844469399215, "percentage": 66.82, "elapsed_time": "20:19:46", "remaining_time": "10:05:46"}
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 443 |
{"current_steps": 443, "total_steps": 666, "loss": 0.4103, "lr": 2.4378265094203597e-05, "epoch": 1.9912970241437393, "percentage": 66.52, "elapsed_time": "20:13:31", "remaining_time": "10:10:52"}
|
| 444 |
{"current_steps": 444, "total_steps": 666, "loss": 0.3956, "lr": 2.418535218019723e-05, "epoch": 1.9957888826501966, "percentage": 66.67, "elapsed_time": "20:16:19", "remaining_time": "10:08:09"}
|
| 445 |
{"current_steps": 445, "total_steps": 666, "loss": 0.6375, "lr": 2.3992874281589192e-05, "epoch": 2.0016844469399215, "percentage": 66.82, "elapsed_time": "20:19:46", "remaining_time": "10:05:46"}
|
| 446 |
+
{"current_steps": 446, "total_steps": 666, "loss": 0.356, "lr": 2.380083669289194e-05, "epoch": 2.0061763054463784, "percentage": 66.97, "elapsed_time": "20:22:30", "remaining_time": "10:03:02"}
|
| 447 |
+
{"current_steps": 447, "total_steps": 666, "loss": 0.3511, "lr": 2.360924469650626e-05, "epoch": 2.0106681639528357, "percentage": 67.12, "elapsed_time": "20:25:10", "remaining_time": "10:00:15"}
|
| 448 |
+
{"current_steps": 448, "total_steps": 666, "loss": 0.3416, "lr": 2.3418103562575984e-05, "epoch": 2.0151600224592925, "percentage": 67.27, "elapsed_time": "20:27:55", "remaining_time": "9:57:30"}
|
| 449 |
+
{"current_steps": 449, "total_steps": 666, "loss": 0.3472, "lr": 2.3227418548843008e-05, "epoch": 2.0196518809657498, "percentage": 67.42, "elapsed_time": "20:30:44", "remaining_time": "9:54:48"}
|
| 450 |
+
{"current_steps": 450, "total_steps": 666, "loss": 0.3604, "lr": 2.3037194900502685e-05, "epoch": 2.0241437394722066, "percentage": 67.57, "elapsed_time": "20:33:40", "remaining_time": "9:52:09"}
|
| 451 |
+
{"current_steps": 451, "total_steps": 666, "loss": 0.3618, "lr": 2.2847437850059534e-05, "epoch": 2.028635597978664, "percentage": 67.72, "elapsed_time": "20:36:25", "remaining_time": "9:49:25"}
|
| 452 |
+
{"current_steps": 452, "total_steps": 666, "loss": 0.3474, "lr": 2.2658152617183308e-05, "epoch": 2.0331274564851207, "percentage": 67.87, "elapsed_time": "20:39:09", "remaining_time": "9:46:40"}
|
| 453 |
+
{"current_steps": 453, "total_steps": 666, "loss": 0.3434, "lr": 2.2469344408565423e-05, "epoch": 2.0376193149915776, "percentage": 68.02, "elapsed_time": "20:42:01", "remaining_time": "9:43:59"}
|
| 454 |
+
{"current_steps": 454, "total_steps": 666, "loss": 0.3555, "lr": 2.2281018417775716e-05, "epoch": 2.042111173498035, "percentage": 68.17, "elapsed_time": "20:44:51", "remaining_time": "9:41:17"}
|
| 455 |
+
{"current_steps": 455, "total_steps": 666, "loss": 0.3588, "lr": 2.2093179825119622e-05, "epoch": 2.0466030320044917, "percentage": 68.32, "elapsed_time": "20:47:33", "remaining_time": "9:38:32"}
|
| 456 |
+
{"current_steps": 456, "total_steps": 666, "loss": 0.3401, "lr": 2.1905833797495638e-05, "epoch": 2.051094890510949, "percentage": 68.47, "elapsed_time": "20:50:23", "remaining_time": "9:35:50"}
|
| 457 |
+
{"current_steps": 457, "total_steps": 666, "loss": 0.3491, "lr": 2.1718985488253236e-05, "epoch": 2.055586749017406, "percentage": 68.62, "elapsed_time": "20:53:10", "remaining_time": "9:33:06"}
|
| 458 |
+
{"current_steps": 458, "total_steps": 666, "loss": 0.3607, "lr": 2.1532640037051082e-05, "epoch": 2.060078607523863, "percentage": 68.77, "elapsed_time": "20:55:48", "remaining_time": "9:30:19"}
|
| 459 |
+
{"current_steps": 459, "total_steps": 666, "loss": 0.3644, "lr": 2.134680256971565e-05, "epoch": 2.06457046603032, "percentage": 68.92, "elapsed_time": "20:58:31", "remaining_time": "9:27:34"}
|
| 460 |
+
{"current_steps": 460, "total_steps": 666, "loss": 0.3342, "lr": 2.1161478198100265e-05, "epoch": 2.069062324536777, "percentage": 69.07, "elapsed_time": "21:01:17", "remaining_time": "9:24:50"}
|
| 461 |
+
{"current_steps": 461, "total_steps": 666, "loss": 0.3395, "lr": 2.097667201994445e-05, "epoch": 2.073554183043234, "percentage": 69.22, "elapsed_time": "21:04:08", "remaining_time": "9:22:08"}
|
| 462 |
+
{"current_steps": 462, "total_steps": 666, "loss": 0.3497, "lr": 2.0792389118733735e-05, "epoch": 2.0780460415496913, "percentage": 69.37, "elapsed_time": "21:07:01", "remaining_time": "9:19:27"}
|
| 463 |
+
{"current_steps": 463, "total_steps": 666, "loss": 0.3485, "lr": 2.060863456355979e-05, "epoch": 2.082537900056148, "percentage": 69.52, "elapsed_time": "21:09:49", "remaining_time": "9:16:44"}
|
| 464 |
+
{"current_steps": 464, "total_steps": 666, "loss": 0.3465, "lr": 2.0425413408981017e-05, "epoch": 2.0870297585626054, "percentage": 69.67, "elapsed_time": "21:12:31", "remaining_time": "9:13:59"}
|
| 465 |
+
{"current_steps": 465, "total_steps": 666, "loss": 0.3411, "lr": 2.0242730694883513e-05, "epoch": 2.0915216170690623, "percentage": 69.82, "elapsed_time": "21:15:13", "remaining_time": "9:11:13"}
|
| 466 |
+
{"current_steps": 466, "total_steps": 666, "loss": 0.3378, "lr": 2.0060591446342413e-05, "epoch": 2.0960134755755195, "percentage": 69.97, "elapsed_time": "21:18:06", "remaining_time": "9:08:32"}
|
| 467 |
+
{"current_steps": 467, "total_steps": 666, "loss": 0.351, "lr": 1.9879000673483696e-05, "epoch": 2.1005053340819764, "percentage": 70.12, "elapsed_time": "21:20:35", "remaining_time": "9:05:41"}
|
| 468 |
+
{"current_steps": 468, "total_steps": 666, "loss": 0.348, "lr": 1.9697963371346334e-05, "epoch": 2.1049971925884337, "percentage": 70.27, "elapsed_time": "21:23:18", "remaining_time": "9:02:56"}
|
| 469 |
+
{"current_steps": 469, "total_steps": 666, "loss": 0.3392, "lr": 1.9517484519744933e-05, "epoch": 2.1094890510948905, "percentage": 70.42, "elapsed_time": "21:26:04", "remaining_time": "9:00:12"}
|
| 470 |
+
{"current_steps": 470, "total_steps": 666, "loss": 0.3638, "lr": 1.933756908313273e-05, "epoch": 2.1139809096013478, "percentage": 70.57, "elapsed_time": "21:28:52", "remaining_time": "8:57:29"}
|
| 471 |
+
{"current_steps": 471, "total_steps": 666, "loss": 0.3406, "lr": 1.9158222010465034e-05, "epoch": 2.1184727681078046, "percentage": 70.72, "elapsed_time": "21:31:32", "remaining_time": "8:54:42"}
|
| 472 |
+
{"current_steps": 472, "total_steps": 666, "loss": 0.35, "lr": 1.8979448235063103e-05, "epoch": 2.1229646266142614, "percentage": 70.87, "elapsed_time": "21:34:23", "remaining_time": "8:52:00"}
|
| 473 |
+
{"current_steps": 473, "total_steps": 666, "loss": 0.3529, "lr": 1.8801252674478432e-05, "epoch": 2.1274564851207187, "percentage": 71.02, "elapsed_time": "21:37:18", "remaining_time": "8:49:20"}
|
| 474 |
+
{"current_steps": 474, "total_steps": 666, "loss": 0.3597, "lr": 1.8623640230357507e-05, "epoch": 2.1319483436271756, "percentage": 71.17, "elapsed_time": "21:40:00", "remaining_time": "8:46:34"}
|
| 475 |
+
{"current_steps": 475, "total_steps": 666, "loss": 0.3443, "lr": 1.8446615788306928e-05, "epoch": 2.136440202133633, "percentage": 71.32, "elapsed_time": "21:42:40", "remaining_time": "8:43:48"}
|
| 476 |
+
{"current_steps": 476, "total_steps": 666, "loss": 0.3453, "lr": 1.827018421775911e-05, "epoch": 2.1409320606400897, "percentage": 71.47, "elapsed_time": "21:45:26", "remaining_time": "8:41:04"}
|
| 477 |
+
{"current_steps": 477, "total_steps": 666, "loss": 0.3459, "lr": 1.809435037183823e-05, "epoch": 2.145423919146547, "percentage": 71.62, "elapsed_time": "21:48:16", "remaining_time": "8:38:22"}
|
| 478 |
+
{"current_steps": 478, "total_steps": 666, "loss": 0.3415, "lr": 1.7919119087226797e-05, "epoch": 2.149915777653004, "percentage": 71.77, "elapsed_time": "21:50:52", "remaining_time": "8:35:34"}
|
| 479 |
+
{"current_steps": 479, "total_steps": 666, "loss": 0.3468, "lr": 1.7744495184032598e-05, "epoch": 2.154407636159461, "percentage": 71.92, "elapsed_time": "21:53:35", "remaining_time": "8:32:49"}
|
| 480 |
+
{"current_steps": 480, "total_steps": 666, "loss": 0.3475, "lr": 1.7570483465656103e-05, "epoch": 2.158899494665918, "percentage": 72.07, "elapsed_time": "21:56:11", "remaining_time": "8:30:01"}
|
| 481 |
+
{"current_steps": 481, "total_steps": 666, "loss": 0.3624, "lr": 1.7397088718658345e-05, "epoch": 2.163391353172375, "percentage": 72.22, "elapsed_time": "21:59:06", "remaining_time": "8:27:21"}
|
| 482 |
+
{"current_steps": 482, "total_steps": 666, "loss": 0.3178, "lr": 1.7224315712629254e-05, "epoch": 2.167883211678832, "percentage": 72.37, "elapsed_time": "22:01:44", "remaining_time": "8:24:34"}
|
| 483 |
+
{"current_steps": 483, "total_steps": 666, "loss": 0.373, "lr": 1.7052169200056447e-05, "epoch": 2.1723750701852893, "percentage": 72.52, "elapsed_time": "22:04:37", "remaining_time": "8:21:52"}
|
| 484 |
+
{"current_steps": 484, "total_steps": 666, "loss": 0.3404, "lr": 1.6880653916194526e-05, "epoch": 2.176866928691746, "percentage": 72.67, "elapsed_time": "22:07:15", "remaining_time": "8:19:05"}
|
| 485 |
+
{"current_steps": 485, "total_steps": 666, "loss": 0.3626, "lr": 1.6709774578934794e-05, "epoch": 2.1813587871982034, "percentage": 72.82, "elapsed_time": "22:09:54", "remaining_time": "8:16:18"}
|
| 486 |
+
{"current_steps": 486, "total_steps": 666, "loss": 0.3617, "lr": 1.6539535888675508e-05, "epoch": 2.1858506457046603, "percentage": 72.97, "elapsed_time": "22:12:37", "remaining_time": "8:13:33"}
|
| 487 |
+
{"current_steps": 487, "total_steps": 666, "loss": 0.3362, "lr": 1.6369942528192567e-05, "epoch": 2.1903425042111175, "percentage": 73.12, "elapsed_time": "22:15:06", "remaining_time": "8:10:43"}
|
| 488 |
+
{"current_steps": 488, "total_steps": 666, "loss": 0.3564, "lr": 1.62009991625107e-05, "epoch": 2.1948343627175744, "percentage": 73.27, "elapsed_time": "22:17:45", "remaining_time": "8:07:57"}
|
| 489 |
+
{"current_steps": 489, "total_steps": 666, "loss": 0.3447, "lr": 1.6032710438775163e-05, "epoch": 2.199326221224031, "percentage": 73.42, "elapsed_time": "22:20:30", "remaining_time": "8:05:12"}
|
| 490 |
+
{"current_steps": 490, "total_steps": 666, "loss": 0.3388, "lr": 1.58650809861239e-05, "epoch": 2.2038180797304885, "percentage": 73.57, "elapsed_time": "22:23:08", "remaining_time": "8:02:26"}
|
| 491 |
+
{"current_steps": 491, "total_steps": 666, "loss": 0.342, "lr": 1.5698115415560184e-05, "epoch": 2.2083099382369458, "percentage": 73.72, "elapsed_time": "22:26:01", "remaining_time": "7:59:44"}
|
| 492 |
+
{"current_steps": 492, "total_steps": 666, "loss": 0.34, "lr": 1.553181831982582e-05, "epoch": 2.2128017967434026, "percentage": 73.87, "elapsed_time": "22:28:31", "remaining_time": "7:56:54"}
|
| 493 |
+
{"current_steps": 493, "total_steps": 666, "loss": 0.3593, "lr": 1.5366194273274823e-05, "epoch": 2.2172936552498594, "percentage": 74.02, "elapsed_time": "22:31:13", "remaining_time": "7:54:09"}
|
| 494 |
+
{"current_steps": 494, "total_steps": 666, "loss": 0.3345, "lr": 1.5201247831747522e-05, "epoch": 2.2217855137563167, "percentage": 74.17, "elapsed_time": "22:33:56", "remaining_time": "7:51:24"}
|
| 495 |
+
{"current_steps": 495, "total_steps": 666, "loss": 0.3361, "lr": 1.5036983532445302e-05, "epoch": 2.2262773722627736, "percentage": 74.32, "elapsed_time": "22:36:33", "remaining_time": "7:48:37"}
|
| 496 |
+
{"current_steps": 496, "total_steps": 666, "loss": 0.3416, "lr": 1.4873405893805792e-05, "epoch": 2.230769230769231, "percentage": 74.47, "elapsed_time": "22:39:13", "remaining_time": "7:45:51"}
|
| 497 |
+
{"current_steps": 497, "total_steps": 666, "loss": 0.3479, "lr": 1.4710519415378523e-05, "epoch": 2.2352610892756877, "percentage": 74.62, "elapsed_time": "22:41:58", "remaining_time": "7:43:07"}
|
| 498 |
+
{"current_steps": 498, "total_steps": 666, "loss": 0.3403, "lr": 1.4548328577701245e-05, "epoch": 2.239752947782145, "percentage": 74.77, "elapsed_time": "22:44:39", "remaining_time": "7:40:21"}
|
| 499 |
+
{"current_steps": 499, "total_steps": 666, "loss": 0.3338, "lr": 1.4386837842176618e-05, "epoch": 2.244244806288602, "percentage": 74.92, "elapsed_time": "22:47:19", "remaining_time": "7:37:35"}
|
| 500 |
+
{"current_steps": 500, "total_steps": 666, "loss": 0.3583, "lr": 1.4226051650949506e-05, "epoch": 2.248736664795059, "percentage": 75.08, "elapsed_time": "22:50:02", "remaining_time": "7:34:51"}
|
| 501 |
+
{"current_steps": 501, "total_steps": 666, "loss": 0.3452, "lr": 1.4065974426784794e-05, "epoch": 2.253228523301516, "percentage": 75.23, "elapsed_time": "22:52:53", "remaining_time": "7:32:09"}
|
| 502 |
+
{"current_steps": 502, "total_steps": 666, "loss": 0.3622, "lr": 1.3906610572945724e-05, "epoch": 2.257720381807973, "percentage": 75.38, "elapsed_time": "22:55:40", "remaining_time": "7:29:25"}
|
| 503 |
+
{"current_steps": 503, "total_steps": 666, "loss": 0.3366, "lr": 1.374796447307278e-05, "epoch": 2.26221224031443, "percentage": 75.53, "elapsed_time": "22:58:32", "remaining_time": "7:26:43"}
|
| 504 |
+
{"current_steps": 504, "total_steps": 666, "loss": 0.3698, "lr": 1.359004049106309e-05, "epoch": 2.2667040988208873, "percentage": 75.68, "elapsed_time": "23:01:24", "remaining_time": "7:24:01"}
|
| 505 |
+
{"current_steps": 505, "total_steps": 666, "loss": 0.3428, "lr": 1.3432842970950418e-05, "epoch": 2.271195957327344, "percentage": 75.83, "elapsed_time": "23:04:05", "remaining_time": "7:21:15"}
|
| 506 |
+
{"current_steps": 506, "total_steps": 666, "loss": 0.3378, "lr": 1.3276376236785638e-05, "epoch": 2.2756878158338014, "percentage": 75.98, "elapsed_time": "23:06:41", "remaining_time": "7:18:28"}
|
| 507 |
+
{"current_steps": 507, "total_steps": 666, "loss": 0.3446, "lr": 1.3120644592517815e-05, "epoch": 2.2801796743402583, "percentage": 76.13, "elapsed_time": "23:09:28", "remaining_time": "7:15:45"}
|
| 508 |
+
{"current_steps": 508, "total_steps": 666, "loss": 0.3727, "lr": 1.2965652321875797e-05, "epoch": 2.2846715328467155, "percentage": 76.28, "elapsed_time": "23:12:16", "remaining_time": "7:13:01"}
|
| 509 |
+
{"current_steps": 509, "total_steps": 666, "loss": 0.3422, "lr": 1.2811403688250428e-05, "epoch": 2.2891633913531724, "percentage": 76.43, "elapsed_time": "23:15:09", "remaining_time": "7:10:20"}
|
| 510 |
+
{"current_steps": 510, "total_steps": 666, "loss": 0.3536, "lr": 1.2657902934577209e-05, "epoch": 2.293655249859629, "percentage": 76.58, "elapsed_time": "23:17:55", "remaining_time": "7:07:36"}
|
| 511 |
+
{"current_steps": 511, "total_steps": 666, "loss": 0.3551, "lr": 1.2505154283219624e-05, "epoch": 2.2981471083660865, "percentage": 76.73, "elapsed_time": "23:20:34", "remaining_time": "7:04:50"}
|
| 512 |
+
{"current_steps": 512, "total_steps": 666, "loss": 0.3578, "lr": 1.235316193585299e-05, "epoch": 2.3026389668725433, "percentage": 76.88, "elapsed_time": "23:23:13", "remaining_time": "7:02:03"}
|
| 513 |
+
{"current_steps": 513, "total_steps": 666, "loss": 0.3611, "lr": 1.2201930073348884e-05, "epoch": 2.3071308253790006, "percentage": 77.03, "elapsed_time": "23:26:01", "remaining_time": "6:59:20"}
|
| 514 |
+
{"current_steps": 514, "total_steps": 666, "loss": 0.3413, "lr": 1.2051462855660133e-05, "epoch": 2.3116226838854574, "percentage": 77.18, "elapsed_time": "23:28:46", "remaining_time": "6:56:36"}
|
| 515 |
+
{"current_steps": 515, "total_steps": 666, "loss": 0.3473, "lr": 1.1901764421706386e-05, "epoch": 2.3161145423919147, "percentage": 77.33, "elapsed_time": "23:31:26", "remaining_time": "6:53:50"}
|
| 516 |
+
{"current_steps": 516, "total_steps": 666, "loss": 0.3379, "lr": 1.175283888926027e-05, "epoch": 2.3206064008983716, "percentage": 77.48, "elapsed_time": "23:34:20", "remaining_time": "6:51:08"}
|
| 517 |
+
{"current_steps": 517, "total_steps": 666, "loss": 0.3522, "lr": 1.1604690354834114e-05, "epoch": 2.325098259404829, "percentage": 77.63, "elapsed_time": "23:37:03", "remaining_time": "6:48:23"}
|
| 518 |
+
{"current_steps": 518, "total_steps": 666, "loss": 0.3547, "lr": 1.1457322893567277e-05, "epoch": 2.3295901179112857, "percentage": 77.78, "elapsed_time": "23:39:53", "remaining_time": "6:45:40"}
|
| 519 |
+
{"current_steps": 519, "total_steps": 666, "loss": 0.3438, "lr": 1.1310740559114044e-05, "epoch": 2.334081976417743, "percentage": 77.93, "elapsed_time": "23:42:26", "remaining_time": "6:42:53"}
|
| 520 |
+
{"current_steps": 520, "total_steps": 666, "loss": 0.3365, "lr": 1.1164947383532118e-05, "epoch": 2.3385738349242, "percentage": 78.08, "elapsed_time": "23:45:09", "remaining_time": "6:40:08"}
|
| 521 |
+
{"current_steps": 521, "total_steps": 666, "loss": 0.3795, "lr": 1.1019947377171714e-05, "epoch": 2.343065693430657, "percentage": 78.23, "elapsed_time": "23:47:50", "remaining_time": "6:37:23"}
|
| 522 |
+
{"current_steps": 522, "total_steps": 666, "loss": 0.3313, "lr": 1.0875744528565258e-05, "epoch": 2.347557551937114, "percentage": 78.38, "elapsed_time": "23:50:24", "remaining_time": "6:34:35"}
|
| 523 |
+
{"current_steps": 523, "total_steps": 666, "loss": 0.3547, "lr": 1.0732342804317649e-05, "epoch": 2.352049410443571, "percentage": 78.53, "elapsed_time": "23:53:08", "remaining_time": "6:31:51"}
|
| 524 |
+
{"current_steps": 524, "total_steps": 666, "loss": 0.341, "lr": 1.0589746148997175e-05, "epoch": 2.356541268950028, "percentage": 78.68, "elapsed_time": "23:55:44", "remaining_time": "6:29:04"}
|
| 525 |
+
{"current_steps": 525, "total_steps": 666, "loss": 0.3562, "lr": 1.044795848502698e-05, "epoch": 2.3610331274564853, "percentage": 78.83, "elapsed_time": "23:58:35", "remaining_time": "6:26:21"}
|
| 526 |
+
{"current_steps": 526, "total_steps": 666, "loss": 0.3407, "lr": 1.0306983712577226e-05, "epoch": 2.365524985962942, "percentage": 78.98, "elapsed_time": "1 day, 0:01:20", "remaining_time": "6:23:37"}
|
| 527 |
+
{"current_steps": 527, "total_steps": 666, "loss": 0.3398, "lr": 1.0166825709457725e-05, "epoch": 2.370016844469399, "percentage": 79.13, "elapsed_time": "1 day, 0:03:58", "remaining_time": "6:20:51"}
|
| 528 |
+
{"current_steps": 528, "total_steps": 666, "loss": 0.3629, "lr": 1.0027488331011335e-05, "epoch": 2.3745087029758563, "percentage": 79.28, "elapsed_time": "1 day, 0:06:42", "remaining_time": "6:18:07"}
|
| 529 |
+
{"current_steps": 529, "total_steps": 666, "loss": 0.3489, "lr": 9.888975410007905e-06, "epoch": 2.3790005614823135, "percentage": 79.43, "elapsed_time": "1 day, 0:09:24", "remaining_time": "6:15:22"}
|
| 530 |
+
{"current_steps": 530, "total_steps": 666, "loss": 0.368, "lr": 9.751290756538822e-06, "epoch": 2.3834924199887704, "percentage": 79.58, "elapsed_time": "1 day, 0:12:16", "remaining_time": "6:12:39"}
|
| 531 |
+
{"current_steps": 531, "total_steps": 666, "loss": 0.3333, "lr": 9.614438157912223e-06, "epoch": 2.387984278495227, "percentage": 79.73, "elapsed_time": "1 day, 0:14:59", "remaining_time": "6:09:54"}
|
| 532 |
+
{"current_steps": 532, "total_steps": 666, "loss": 0.3618, "lr": 9.47842137854881e-06, "epoch": 2.3924761370016845, "percentage": 79.88, "elapsed_time": "1 day, 0:17:45", "remaining_time": "6:07:10"}
|
| 533 |
+
{"current_steps": 533, "total_steps": 666, "loss": 0.3405, "lr": 9.343244159878315e-06, "epoch": 2.3969679955081413, "percentage": 80.03, "elapsed_time": "1 day, 0:20:29", "remaining_time": "6:04:26"}
|
| 534 |
+
{"current_steps": 534, "total_steps": 666, "loss": 0.3468, "lr": 9.208910220236564e-06, "epoch": 2.4014598540145986, "percentage": 80.18, "elapsed_time": "1 day, 0:23:16", "remaining_time": "6:01:42"}
|
| 535 |
+
{"current_steps": 535, "total_steps": 666, "loss": 0.3612, "lr": 9.07542325476321e-06, "epoch": 2.4059517125210554, "percentage": 80.33, "elapsed_time": "1 day, 0:26:09", "remaining_time": "5:59:00"}
|
| 536 |
+
{"current_steps": 536, "total_steps": 666, "loss": 0.3449, "lr": 8.94278693530009e-06, "epoch": 2.4104435710275127, "percentage": 80.48, "elapsed_time": "1 day, 0:28:56", "remaining_time": "5:56:16"}
|
| 537 |
+
{"current_steps": 537, "total_steps": 666, "loss": 0.3521, "lr": 8.811004910290223e-06, "epoch": 2.4149354295339696, "percentage": 80.63, "elapsed_time": "1 day, 0:31:42", "remaining_time": "5:53:32"}
|
| 538 |
+
{"current_steps": 538, "total_steps": 666, "loss": 0.359, "lr": 8.68008080467743e-06, "epoch": 2.419427288040427, "percentage": 80.78, "elapsed_time": "1 day, 0:34:22", "remaining_time": "5:50:46"}
|
| 539 |
+
{"current_steps": 539, "total_steps": 666, "loss": 0.321, "lr": 8.550018219806654e-06, "epoch": 2.4239191465468837, "percentage": 80.93, "elapsed_time": "1 day, 0:36:57", "remaining_time": "5:48:00"}
|
| 540 |
+
{"current_steps": 540, "total_steps": 666, "loss": 0.3585, "lr": 8.420820733324895e-06, "epoch": 2.428411005053341, "percentage": 81.08, "elapsed_time": "1 day, 0:39:46", "remaining_time": "5:45:16"}
|
| 541 |
+
{"current_steps": 541, "total_steps": 666, "loss": 0.3512, "lr": 8.29249189908277e-06, "epoch": 2.432902863559798, "percentage": 81.23, "elapsed_time": "1 day, 0:42:46", "remaining_time": "5:42:35"}
|
| 542 |
+
{"current_steps": 542, "total_steps": 666, "loss": 0.3377, "lr": 8.16503524703678e-06, "epoch": 2.437394722066255, "percentage": 81.38, "elapsed_time": "1 day, 0:45:29", "remaining_time": "5:39:51"}
|
| 543 |
+
{"current_steps": 543, "total_steps": 666, "loss": 0.345, "lr": 8.038454283152228e-06, "epoch": 2.441886580572712, "percentage": 81.53, "elapsed_time": "1 day, 0:48:17", "remaining_time": "5:37:07"}
|
| 544 |
+
{"current_steps": 544, "total_steps": 666, "loss": 0.346, "lr": 7.912752489306732e-06, "epoch": 2.446378439079169, "percentage": 81.68, "elapsed_time": "1 day, 0:51:09", "remaining_time": "5:34:24"}
|
| 545 |
+
{"current_steps": 545, "total_steps": 666, "loss": 0.3499, "lr": 7.787933323194483e-06, "epoch": 2.450870297585626, "percentage": 81.83, "elapsed_time": "1 day, 0:53:44", "remaining_time": "5:31:38"}
|
| 546 |
+
{"current_steps": 546, "total_steps": 666, "loss": 0.3262, "lr": 7.664000218231132e-06, "epoch": 2.4553621560920833, "percentage": 81.98, "elapsed_time": "1 day, 0:56:24", "remaining_time": "5:28:52"}
|
| 547 |
+
{"current_steps": 547, "total_steps": 666, "loss": 0.3483, "lr": 7.540956583459329e-06, "epoch": 2.45985401459854, "percentage": 82.13, "elapsed_time": "1 day, 0:59:07", "remaining_time": "5:26:07"}
|
| 548 |
+
{"current_steps": 548, "total_steps": 666, "loss": 0.3671, "lr": 7.418805803454976e-06, "epoch": 2.464345873104997, "percentage": 82.28, "elapsed_time": "1 day, 1:01:50", "remaining_time": "5:23:23"}
|
| 549 |
+
{"current_steps": 549, "total_steps": 666, "loss": 0.3359, "lr": 7.297551238234098e-06, "epoch": 2.4688377316114543, "percentage": 82.43, "elapsed_time": "1 day, 1:04:37", "remaining_time": "5:20:39"}
|
| 550 |
+
{"current_steps": 550, "total_steps": 666, "loss": 0.3612, "lr": 7.1771962231604476e-06, "epoch": 2.473329590117911, "percentage": 82.58, "elapsed_time": "1 day, 1:07:10", "remaining_time": "5:17:52"}
|
| 551 |
+
{"current_steps": 551, "total_steps": 666, "loss": 0.3565, "lr": 7.057744068853729e-06, "epoch": 2.4778214486243684, "percentage": 82.73, "elapsed_time": "1 day, 1:10:06", "remaining_time": "5:15:10"}
|
| 552 |
+
{"current_steps": 552, "total_steps": 666, "loss": 0.3422, "lr": 6.939198061098564e-06, "epoch": 2.482313307130825, "percentage": 82.88, "elapsed_time": "1 day, 1:12:53", "remaining_time": "5:12:26"}
|
| 553 |
+
{"current_steps": 553, "total_steps": 666, "loss": 0.3484, "lr": 6.821561460754087e-06, "epoch": 2.4868051656372825, "percentage": 83.03, "elapsed_time": "1 day, 1:15:42", "remaining_time": "5:09:43"}
|
| 554 |
+
{"current_steps": 554, "total_steps": 666, "loss": 0.3396, "lr": 6.704837503664246e-06, "epoch": 2.4912970241437393, "percentage": 83.18, "elapsed_time": "1 day, 1:18:23", "remaining_time": "5:06:58"}
|
| 555 |
+
{"current_steps": 555, "total_steps": 666, "loss": 0.3499, "lr": 6.589029400568816e-06, "epoch": 2.4957888826501966, "percentage": 83.33, "elapsed_time": "1 day, 1:21:03", "remaining_time": "5:04:12"}
|
| 556 |
+
{"current_steps": 556, "total_steps": 666, "loss": 0.3283, "lr": 6.47414033701506e-06, "epoch": 2.5002807411566534, "percentage": 83.48, "elapsed_time": "1 day, 1:23:33", "remaining_time": "5:01:25"}
|
| 557 |
+
{"current_steps": 557, "total_steps": 666, "loss": 0.3686, "lr": 6.360173473270111e-06, "epoch": 2.5047725996631107, "percentage": 83.63, "elapsed_time": "1 day, 1:26:13", "remaining_time": "4:58:40"}
|
| 558 |
+
{"current_steps": 558, "total_steps": 666, "loss": 0.3229, "lr": 6.247131944234035e-06, "epoch": 2.5092644581695676, "percentage": 83.78, "elapsed_time": "1 day, 1:28:50", "remaining_time": "4:55:54"}
|
| 559 |
+
{"current_steps": 559, "total_steps": 666, "loss": 0.3404, "lr": 6.135018859353632e-06, "epoch": 2.513756316676025, "percentage": 83.93, "elapsed_time": "1 day, 1:31:31", "remaining_time": "4:53:09"}
|
| 560 |
+
{"current_steps": 560, "total_steps": 666, "loss": 0.3621, "lr": 6.023837302536857e-06, "epoch": 2.5182481751824817, "percentage": 84.08, "elapsed_time": "1 day, 1:34:17", "remaining_time": "4:50:25"}
|
| 561 |
+
{"current_steps": 561, "total_steps": 666, "loss": 0.3395, "lr": 5.913590332068011e-06, "epoch": 2.522740033688939, "percentage": 84.23, "elapsed_time": "1 day, 1:36:53", "remaining_time": "4:47:39"}
|
| 562 |
+
{"current_steps": 562, "total_steps": 666, "loss": 0.3459, "lr": 5.804280980523622e-06, "epoch": 2.527231892195396, "percentage": 84.38, "elapsed_time": "1 day, 1:39:41", "remaining_time": "4:44:55"}
|
| 563 |
+
{"current_steps": 563, "total_steps": 666, "loss": 0.3344, "lr": 5.695912254689022e-06, "epoch": 2.531723750701853, "percentage": 84.53, "elapsed_time": "1 day, 1:42:25", "remaining_time": "4:42:10"}
|
| 564 |
+
{"current_steps": 564, "total_steps": 666, "loss": 0.3542, "lr": 5.58848713547564e-06, "epoch": 2.53621560920831, "percentage": 84.68, "elapsed_time": "1 day, 1:45:11", "remaining_time": "4:39:26"}
|
| 565 |
+
{"current_steps": 565, "total_steps": 666, "loss": 0.3624, "lr": 5.4820085778390084e-06, "epoch": 2.5407074677147667, "percentage": 84.83, "elapsed_time": "1 day, 1:47:51", "remaining_time": "4:36:41"}
|
| 566 |
+
{"current_steps": 566, "total_steps": 666, "loss": 0.355, "lr": 5.376479510697472e-06, "epoch": 2.545199326221224, "percentage": 84.98, "elapsed_time": "1 day, 1:50:35", "remaining_time": "4:33:57"}
|
| 567 |
+
{"current_steps": 567, "total_steps": 666, "loss": 0.3348, "lr": 5.271902836851635e-06, "epoch": 2.5496911847276813, "percentage": 85.14, "elapsed_time": "1 day, 1:53:14", "remaining_time": "4:31:12"}
|
| 568 |
+
{"current_steps": 568, "total_steps": 666, "loss": 0.332, "lr": 5.168281432904496e-06, "epoch": 2.554183043234138, "percentage": 85.29, "elapsed_time": "1 day, 1:55:54", "remaining_time": "4:28:26"}
|
| 569 |
+
{"current_steps": 569, "total_steps": 666, "loss": 0.385, "lr": 5.065618149182343e-06, "epoch": 2.558674901740595, "percentage": 85.44, "elapsed_time": "1 day, 1:58:33", "remaining_time": "4:25:41"}
|
| 570 |
+
{"current_steps": 570, "total_steps": 666, "loss": 0.3401, "lr": 4.963915809656325e-06, "epoch": 2.5631667602470523, "percentage": 85.59, "elapsed_time": "1 day, 2:01:16", "remaining_time": "4:22:57"}
|
| 571 |
+
{"current_steps": 571, "total_steps": 666, "loss": 0.3426, "lr": 4.863177211864791e-06, "epoch": 2.5676586187535095, "percentage": 85.74, "elapsed_time": "1 day, 2:04:01", "remaining_time": "4:20:12"}
|
| 572 |
+
{"current_steps": 572, "total_steps": 666, "loss": 0.3479, "lr": 4.763405126836333e-06, "epoch": 2.5721504772599664, "percentage": 85.89, "elapsed_time": "1 day, 2:06:42", "remaining_time": "4:17:27"}
|
| 573 |
+
{"current_steps": 573, "total_steps": 666, "loss": 0.3383, "lr": 4.664602299013559e-06, "epoch": 2.576642335766423, "percentage": 86.04, "elapsed_time": "1 day, 2:09:16", "remaining_time": "4:14:41"}
|
| 574 |
+
{"current_steps": 574, "total_steps": 666, "loss": 0.3758, "lr": 4.566771446177605e-06, "epoch": 2.5811341942728805, "percentage": 86.19, "elapsed_time": "1 day, 2:12:03", "remaining_time": "4:11:58"}
|
| 575 |
+
{"current_steps": 575, "total_steps": 666, "loss": 0.3326, "lr": 4.469915259373369e-06, "epoch": 2.5856260527793373, "percentage": 86.34, "elapsed_time": "1 day, 2:14:45", "remaining_time": "4:09:13"}
|
| 576 |
+
{"current_steps": 576, "total_steps": 666, "loss": 0.3462, "lr": 4.3740364028355045e-06, "epoch": 2.5901179112857946, "percentage": 86.49, "elapsed_time": "1 day, 2:17:34", "remaining_time": "4:06:29"}
|
| 577 |
+
{"current_steps": 577, "total_steps": 666, "loss": 0.3525, "lr": 4.279137513915124e-06, "epoch": 2.5946097697922514, "percentage": 86.64, "elapsed_time": "1 day, 2:20:18", "remaining_time": "4:03:45"}
|
| 578 |
+
{"current_steps": 578, "total_steps": 666, "loss": 0.3355, "lr": 4.185221203007244e-06, "epoch": 2.5991016282987087, "percentage": 86.79, "elapsed_time": "1 day, 2:22:58", "remaining_time": "4:01:00"}
|
| 579 |
+
{"current_steps": 579, "total_steps": 666, "loss": 0.3515, "lr": 4.092290053478998e-06, "epoch": 2.6035934868051656, "percentage": 86.94, "elapsed_time": "1 day, 2:25:48", "remaining_time": "3:58:16"}
|
| 580 |
+
{"current_steps": 580, "total_steps": 666, "loss": 0.3492, "lr": 4.0003466215985745e-06, "epoch": 2.608085345311623, "percentage": 87.09, "elapsed_time": "1 day, 2:28:38", "remaining_time": "3:55:33"}
|
| 581 |
+
{"current_steps": 581, "total_steps": 666, "loss": 0.3495, "lr": 3.909393436464881e-06, "epoch": 2.6125772038180797, "percentage": 87.24, "elapsed_time": "1 day, 2:31:13", "remaining_time": "3:52:47"}
|
| 582 |
+
{"current_steps": 582, "total_steps": 666, "loss": 0.3587, "lr": 3.819432999938006e-06, "epoch": 2.6170690623245365, "percentage": 87.39, "elapsed_time": "1 day, 2:34:00", "remaining_time": "3:50:03"}
|
| 583 |
+
{"current_steps": 583, "total_steps": 666, "loss": 0.3195, "lr": 3.7304677865703665e-06, "epoch": 2.621560920830994, "percentage": 87.54, "elapsed_time": "1 day, 2:36:50", "remaining_time": "3:47:20"}
|
| 584 |
+
{"current_steps": 584, "total_steps": 666, "loss": 0.3563, "lr": 3.6425002435386714e-06, "epoch": 2.626052779337451, "percentage": 87.69, "elapsed_time": "1 day, 2:39:42", "remaining_time": "3:44:37"}
|
| 585 |
+
{"current_steps": 585, "total_steps": 666, "loss": 0.3375, "lr": 3.5555327905765925e-06, "epoch": 2.630544637843908, "percentage": 87.84, "elapsed_time": "1 day, 2:42:24", "remaining_time": "3:41:52"}
|
| 586 |
+
{"current_steps": 586, "total_steps": 666, "loss": 0.3616, "lr": 3.469567819908193e-06, "epoch": 2.6350364963503647, "percentage": 87.99, "elapsed_time": "1 day, 2:45:16", "remaining_time": "3:39:08"}
|
| 587 |
+
{"current_steps": 587, "total_steps": 666, "loss": 0.3473, "lr": 3.384607696182145e-06, "epoch": 2.639528354856822, "percentage": 88.14, "elapsed_time": "1 day, 2:47:51", "remaining_time": "3:36:23"}
|
| 588 |
+
{"current_steps": 588, "total_steps": 666, "loss": 0.3512, "lr": 3.3006547564066806e-06, "epoch": 2.6440202133632793, "percentage": 88.29, "elapsed_time": "1 day, 2:50:40", "remaining_time": "3:33:39"}
|
| 589 |
+
{"current_steps": 589, "total_steps": 666, "loss": 0.335, "lr": 3.2177113098852985e-06, "epoch": 2.648512071869736, "percentage": 88.44, "elapsed_time": "1 day, 2:53:23", "remaining_time": "3:30:55"}
|
| 590 |
+
{"current_steps": 590, "total_steps": 666, "loss": 0.3548, "lr": 3.1357796381532445e-06, "epoch": 2.653003930376193, "percentage": 88.59, "elapsed_time": "1 day, 2:56:11", "remaining_time": "3:28:11"}
|
| 591 |
+
{"current_steps": 591, "total_steps": 666, "loss": 0.3516, "lr": 3.054861994914755e-06, "epoch": 2.6574957888826503, "percentage": 88.74, "elapsed_time": "1 day, 2:59:00", "remaining_time": "3:25:27"}
|
| 592 |
+
{"current_steps": 592, "total_steps": 666, "loss": 0.3456, "lr": 2.9749606059810586e-06, "epoch": 2.661987647389107, "percentage": 88.89, "elapsed_time": "1 day, 3:01:44", "remaining_time": "3:22:43"}
|
| 593 |
+
{"current_steps": 593, "total_steps": 666, "loss": 0.3398, "lr": 2.8960776692091764e-06, "epoch": 2.6664795058955644, "percentage": 89.04, "elapsed_time": "1 day, 3:04:28", "remaining_time": "3:19:58"}
|
| 594 |
+
{"current_steps": 594, "total_steps": 666, "loss": 0.3497, "lr": 2.8182153544414316e-06, "epoch": 2.670971364402021, "percentage": 89.19, "elapsed_time": "1 day, 3:07:15", "remaining_time": "3:17:14"}
|
| 595 |
+
{"current_steps": 595, "total_steps": 666, "loss": 0.3525, "lr": 2.7413758034457648e-06, "epoch": 2.6754632229084785, "percentage": 89.34, "elapsed_time": "1 day, 3:10:03", "remaining_time": "3:14:30"}
|
| 596 |
+
{"current_steps": 596, "total_steps": 666, "loss": 0.3454, "lr": 2.665561129856853e-06, "epoch": 2.6799550814149353, "percentage": 89.49, "elapsed_time": "1 day, 3:12:51", "remaining_time": "3:11:46"}
|
| 597 |
+
{"current_steps": 597, "total_steps": 666, "loss": 0.3479, "lr": 2.590773419117936e-06, "epoch": 2.6844469399213926, "percentage": 89.64, "elapsed_time": "1 day, 3:15:40", "remaining_time": "3:09:02"}
|
| 598 |
+
{"current_steps": 598, "total_steps": 666, "loss": 0.3389, "lr": 2.517014728423464e-06, "epoch": 2.6889387984278494, "percentage": 89.79, "elapsed_time": "1 day, 3:18:24", "remaining_time": "3:06:18"}
|
| 599 |
+
{"current_steps": 599, "total_steps": 666, "loss": 0.3511, "lr": 2.4442870866625157e-06, "epoch": 2.6934306569343067, "percentage": 89.94, "elapsed_time": "1 day, 3:21:10", "remaining_time": "3:03:34"}
|
| 600 |
+
{"current_steps": 600, "total_steps": 666, "loss": 0.3318, "lr": 2.3725924943629863e-06, "epoch": 2.6979225154407636, "percentage": 90.09, "elapsed_time": "1 day, 3:23:53", "remaining_time": "3:00:49"}
|
| 601 |
+
{"current_steps": 601, "total_steps": 666, "loss": 0.353, "lr": 2.301932923636545e-06, "epoch": 2.702414373947221, "percentage": 90.24, "elapsed_time": "1 day, 3:26:34", "remaining_time": "2:58:04"}
|
| 602 |
+
{"current_steps": 602, "total_steps": 666, "loss": 0.3413, "lr": 2.232310318124413e-06, "epoch": 2.7069062324536777, "percentage": 90.39, "elapsed_time": "1 day, 3:29:21", "remaining_time": "2:55:20"}
|
| 603 |
+
{"current_steps": 603, "total_steps": 666, "loss": 0.3496, "lr": 2.1637265929438777e-06, "epoch": 2.7113980909601345, "percentage": 90.54, "elapsed_time": "1 day, 3:32:15", "remaining_time": "2:52:37"}
|
| 604 |
+
{"current_steps": 604, "total_steps": 666, "loss": 0.348, "lr": 2.0961836346356225e-06, "epoch": 2.715889949466592, "percentage": 90.69, "elapsed_time": "1 day, 3:35:02", "remaining_time": "2:49:53"}
|
| 605 |
+
{"current_steps": 605, "total_steps": 666, "loss": 0.3606, "lr": 2.0296833011118356e-06, "epoch": 2.720381807973049, "percentage": 90.84, "elapsed_time": "1 day, 3:37:47", "remaining_time": "2:47:08"}
|
| 606 |
+
{"current_steps": 606, "total_steps": 666, "loss": 0.3276, "lr": 1.9642274216051005e-06, "epoch": 2.724873666479506, "percentage": 90.99, "elapsed_time": "1 day, 3:40:29", "remaining_time": "2:44:24"}
|
| 607 |
+
{"current_steps": 607, "total_steps": 666, "loss": 0.341, "lr": 1.8998177966180797e-06, "epoch": 2.7293655249859627, "percentage": 91.14, "elapsed_time": "1 day, 3:43:08", "remaining_time": "2:41:39"}
|
| 608 |
+
{"current_steps": 608, "total_steps": 666, "loss": 0.3427, "lr": 1.836456197873986e-06, "epoch": 2.73385738349242, "percentage": 91.29, "elapsed_time": "1 day, 3:45:48", "remaining_time": "2:38:54"}
|
| 609 |
+
{"current_steps": 609, "total_steps": 666, "loss": 0.3508, "lr": 1.7741443682678472e-06, "epoch": 2.7383492419988773, "percentage": 91.44, "elapsed_time": "1 day, 3:48:19", "remaining_time": "2:36:08"}
|
| 610 |
+
{"current_steps": 610, "total_steps": 666, "loss": 0.3467, "lr": 1.7128840218185816e-06, "epoch": 2.742841100505334, "percentage": 91.59, "elapsed_time": "1 day, 3:50:52", "remaining_time": "2:33:23"}
|
| 611 |
+
{"current_steps": 611, "total_steps": 666, "loss": 0.3314, "lr": 1.6526768436218122e-06, "epoch": 2.747332959011791, "percentage": 91.74, "elapsed_time": "1 day, 3:53:41", "remaining_time": "2:30:39"}
|
| 612 |
+
{"current_steps": 612, "total_steps": 666, "loss": 0.3477, "lr": 1.5935244898035574e-06, "epoch": 2.7518248175182483, "percentage": 91.89, "elapsed_time": "1 day, 3:56:25", "remaining_time": "2:27:55"}
|
| 613 |
+
{"current_steps": 613, "total_steps": 666, "loss": 0.3441, "lr": 1.5354285874746455e-06, "epoch": 2.756316676024705, "percentage": 92.04, "elapsed_time": "1 day, 3:59:06", "remaining_time": "2:25:10"}
|
| 614 |
+
{"current_steps": 614, "total_steps": 666, "loss": 0.339, "lr": 1.4783907346859728e-06, "epoch": 2.7608085345311624, "percentage": 92.19, "elapsed_time": "1 day, 4:01:47", "remaining_time": "2:22:25"}
|
| 615 |
+
{"current_steps": 615, "total_steps": 666, "loss": 0.3468, "lr": 1.4224125003845423e-06, "epoch": 2.765300393037619, "percentage": 92.34, "elapsed_time": "1 day, 4:04:21", "remaining_time": "2:19:40"}
|
| 616 |
+
{"current_steps": 616, "total_steps": 666, "loss": 0.3313, "lr": 1.367495424370291e-06, "epoch": 2.7697922515440765, "percentage": 92.49, "elapsed_time": "1 day, 4:07:07", "remaining_time": "2:16:56"}
|
| 617 |
+
{"current_steps": 617, "total_steps": 666, "loss": 0.3602, "lr": 1.3136410172537705e-06, "epoch": 2.7742841100505333, "percentage": 92.64, "elapsed_time": "1 day, 4:09:54", "remaining_time": "2:14:12"}
|
| 618 |
+
{"current_steps": 618, "total_steps": 666, "loss": 0.35, "lr": 1.2608507604145603e-06, "epoch": 2.7787759685569906, "percentage": 92.79, "elapsed_time": "1 day, 4:12:43", "remaining_time": "2:11:28"}
|
| 619 |
+
{"current_steps": 619, "total_steps": 666, "loss": 0.3431, "lr": 1.2091261059605253e-06, "epoch": 2.7832678270634474, "percentage": 92.94, "elapsed_time": "1 day, 4:15:24", "remaining_time": "2:08:43"}
|
| 620 |
+
{"current_steps": 620, "total_steps": 666, "loss": 0.3297, "lr": 1.1584684766878973e-06, "epoch": 2.7877596855699043, "percentage": 93.09, "elapsed_time": "1 day, 4:17:53", "remaining_time": "2:05:58"}
|
| 621 |
+
{"current_steps": 621, "total_steps": 666, "loss": 0.3568, "lr": 1.1088792660421067e-06, "epoch": 2.7922515440763616, "percentage": 93.24, "elapsed_time": "1 day, 4:20:29", "remaining_time": "2:03:13"}
|
| 622 |
+
{"current_steps": 622, "total_steps": 666, "loss": 0.3491, "lr": 1.060359838079461e-06, "epoch": 2.796743402582819, "percentage": 93.39, "elapsed_time": "1 day, 4:23:19", "remaining_time": "2:00:29"}
|
| 623 |
+
{"current_steps": 623, "total_steps": 666, "loss": 0.3559, "lr": 1.0129115274296431e-06, "epoch": 2.8012352610892757, "percentage": 93.54, "elapsed_time": "1 day, 4:25:58", "remaining_time": "1:57:44"}
|
| 624 |
+
{"current_steps": 624, "total_steps": 666, "loss": 0.3424, "lr": 9.665356392589742e-07, "epoch": 2.8057271195957325, "percentage": 93.69, "elapsed_time": "1 day, 4:28:39", "remaining_time": "1:55:00"}
|
| 625 |
+
{"current_steps": 625, "total_steps": 666, "loss": 0.3436, "lr": 9.212334492345243e-07, "epoch": 2.81021897810219, "percentage": 93.84, "elapsed_time": "1 day, 4:31:34", "remaining_time": "1:52:16"}
|
| 626 |
+
{"current_steps": 626, "total_steps": 666, "loss": 0.3454, "lr": 8.770062034890237e-07, "epoch": 2.814710836608647, "percentage": 93.99, "elapsed_time": "1 day, 4:34:22", "remaining_time": "1:49:32"}
|
| 627 |
+
{"current_steps": 627, "total_steps": 666, "loss": 0.3326, "lr": 8.33855118586584e-07, "epoch": 2.819202695115104, "percentage": 94.14, "elapsed_time": "1 day, 4:37:11", "remaining_time": "1:46:48"}
|
| 628 |
+
{"current_steps": 628, "total_steps": 666, "loss": 0.3562, "lr": 7.917813814892228e-07, "epoch": 2.8236945536215607, "percentage": 94.29, "elapsed_time": "1 day, 4:40:03", "remaining_time": "1:44:04"}
|
| 629 |
+
{"current_steps": 629, "total_steps": 666, "loss": 0.3491, "lr": 7.507861495242319e-07, "epoch": 2.828186412128018, "percentage": 94.44, "elapsed_time": "1 day, 4:42:41", "remaining_time": "1:41:20"}
|
| 630 |
+
{"current_steps": 630, "total_steps": 666, "loss": 0.3427, "lr": 7.108705503523361e-07, "epoch": 2.832678270634475, "percentage": 94.59, "elapsed_time": "1 day, 4:45:30", "remaining_time": "1:38:36"}
|
| 631 |
+
{"current_steps": 631, "total_steps": 666, "loss": 0.3548, "lr": 6.720356819366647e-07, "epoch": 2.837170129140932, "percentage": 94.74, "elapsed_time": "1 day, 4:48:17", "remaining_time": "1:35:51"}
|
| 632 |
+
{"current_steps": 632, "total_steps": 666, "loss": 0.3407, "lr": 6.342826125125623e-07, "epoch": 2.841661987647389, "percentage": 94.89, "elapsed_time": "1 day, 4:51:09", "remaining_time": "1:33:07"}
|
| 633 |
+
{"current_steps": 633, "total_steps": 666, "loss": 0.35, "lr": 5.976123805582035e-07, "epoch": 2.8461538461538463, "percentage": 95.05, "elapsed_time": "1 day, 4:53:55", "remaining_time": "1:30:23"}
|
| 634 |
+
{"current_steps": 634, "total_steps": 666, "loss": 0.3536, "lr": 5.620259947660112e-07, "epoch": 2.850645704660303, "percentage": 95.2, "elapsed_time": "1 day, 4:56:39", "remaining_time": "1:27:39"}
|
| 635 |
+
{"current_steps": 635, "total_steps": 666, "loss": 0.3569, "lr": 5.275244340149411e-07, "epoch": 2.8551375631667604, "percentage": 95.35, "elapsed_time": "1 day, 4:59:28", "remaining_time": "1:24:55"}
|
| 636 |
+
{"current_steps": 636, "total_steps": 666, "loss": 0.3379, "lr": 4.941086473435209e-07, "epoch": 2.859629421673217, "percentage": 95.5, "elapsed_time": "1 day, 5:02:15", "remaining_time": "1:22:10"}
|
| 637 |
+
{"current_steps": 637, "total_steps": 666, "loss": 0.3387, "lr": 4.617795539237735e-07, "epoch": 2.8641212801796745, "percentage": 95.65, "elapsed_time": "1 day, 5:04:58", "remaining_time": "1:19:26"}
|
| 638 |
+
{"current_steps": 638, "total_steps": 666, "loss": 0.3516, "lr": 4.305380430359085e-07, "epoch": 2.8686131386861313, "percentage": 95.8, "elapsed_time": "1 day, 5:07:39", "remaining_time": "1:16:42"}
|
| 639 |
+
{"current_steps": 639, "total_steps": 666, "loss": 0.3579, "lr": 4.0038497404389254e-07, "epoch": 2.8731049971925886, "percentage": 95.95, "elapsed_time": "1 day, 5:10:31", "remaining_time": "1:13:57"}
|
| 640 |
+
{"current_steps": 640, "total_steps": 666, "loss": 0.3392, "lr": 3.7132117637177054e-07, "epoch": 2.8775968556990454, "percentage": 96.1, "elapsed_time": "1 day, 5:13:21", "remaining_time": "1:11:13"}
|
| 641 |
+
{"current_steps": 641, "total_steps": 666, "loss": 0.3295, "lr": 3.433474494808842e-07, "epoch": 2.8820887142055023, "percentage": 96.25, "elapsed_time": "1 day, 5:16:13", "remaining_time": "1:08:29"}
|
| 642 |
+
{"current_steps": 642, "total_steps": 666, "loss": 0.3641, "lr": 3.1646456284786685e-07, "epoch": 2.8865805727119596, "percentage": 96.4, "elapsed_time": "1 day, 5:19:06", "remaining_time": "1:05:45"}
|
| 643 |
+
{"current_steps": 643, "total_steps": 666, "loss": 0.3429, "lr": 2.9067325594348326e-07, "epoch": 2.891072431218417, "percentage": 96.55, "elapsed_time": "1 day, 5:21:49", "remaining_time": "1:03:01"}
|
| 644 |
+
{"current_steps": 644, "total_steps": 666, "loss": 0.343, "lr": 2.659742382122721e-07, "epoch": 2.8955642897248737, "percentage": 96.7, "elapsed_time": "1 day, 5:24:26", "remaining_time": "1:00:16"}
|
| 645 |
+
{"current_steps": 645, "total_steps": 666, "loss": 0.3491, "lr": 2.4236818905305493e-07, "epoch": 2.9000561482313305, "percentage": 96.85, "elapsed_time": "1 day, 5:27:06", "remaining_time": "0:57:32"}
|
| 646 |
+
{"current_steps": 646, "total_steps": 666, "loss": 0.3471, "lr": 2.1985575780023138e-07, "epoch": 2.904548006737788, "percentage": 97.0, "elapsed_time": "1 day, 5:29:51", "remaining_time": "0:54:47"}
|
| 647 |
+
{"current_steps": 647, "total_steps": 666, "loss": 0.3378, "lr": 1.984375637059266e-07, "epoch": 2.909039865244245, "percentage": 97.15, "elapsed_time": "1 day, 5:32:29", "remaining_time": "0:52:03"}
|
| 648 |
+
{"current_steps": 648, "total_steps": 666, "loss": 0.348, "lr": 1.7811419592295153e-07, "epoch": 2.913531723750702, "percentage": 97.3, "elapsed_time": "1 day, 5:35:20", "remaining_time": "0:49:18"}
|
| 649 |
+
{"current_steps": 649, "total_steps": 666, "loss": 0.3494, "lr": 1.5888621348860266e-07, "epoch": 2.9180235822571587, "percentage": 97.45, "elapsed_time": "1 day, 5:37:57", "remaining_time": "0:46:34"}
|
| 650 |
+
{"current_steps": 650, "total_steps": 666, "loss": 0.3451, "lr": 1.4075414530927422e-07, "epoch": 2.922515440763616, "percentage": 97.6, "elapsed_time": "1 day, 5:40:43", "remaining_time": "0:43:49"}
|
| 651 |
+
{"current_steps": 651, "total_steps": 666, "loss": 0.3451, "lr": 1.2371849014593208e-07, "epoch": 2.927007299270073, "percentage": 97.75, "elapsed_time": "1 day, 5:43:35", "remaining_time": "0:41:05"}
|
| 652 |
+
{"current_steps": 652, "total_steps": 666, "loss": 0.3389, "lr": 1.0777971660036024e-07, "epoch": 2.93149915777653, "percentage": 97.9, "elapsed_time": "1 day, 5:46:16", "remaining_time": "0:38:21"}
|
| 653 |
+
{"current_steps": 653, "total_steps": 666, "loss": 0.3439, "lr": 9.293826310230014e-08, "epoch": 2.935991016282987, "percentage": 98.05, "elapsed_time": "1 day, 5:49:06", "remaining_time": "0:35:37"}
|
| 654 |
+
{"current_steps": 654, "total_steps": 666, "loss": 0.3337, "lr": 7.919453789738019e-08, "epoch": 2.9404828747894443, "percentage": 98.2, "elapsed_time": "1 day, 5:51:52", "remaining_time": "0:32:52"}
|
| 655 |
+
{"current_steps": 655, "total_steps": 666, "loss": 0.3312, "lr": 6.654891903588035e-08, "epoch": 2.944974733295901, "percentage": 98.35, "elapsed_time": "1 day, 5:54:41", "remaining_time": "0:30:08"}
|
| 656 |
+
{"current_steps": 656, "total_steps": 666, "loss": 0.3615, "lr": 5.500175436234489e-08, "epoch": 2.9494665918023584, "percentage": 98.5, "elapsed_time": "1 day, 5:57:22", "remaining_time": "0:27:23"}
|
| 657 |
+
{"current_steps": 657, "total_steps": 666, "loss": 0.3399, "lr": 4.455336150600786e-08, "epoch": 2.953958450308815, "percentage": 98.65, "elapsed_time": "1 day, 6:00:09", "remaining_time": "0:24:39"}
|
| 658 |
+
{"current_steps": 658, "total_steps": 666, "loss": 0.345, "lr": 3.520402787204891e-08, "epoch": 2.958450308815272, "percentage": 98.8, "elapsed_time": "1 day, 6:02:55", "remaining_time": "0:21:55"}
|
| 659 |
+
{"current_steps": 659, "total_steps": 666, "loss": 0.3552, "lr": 2.6954010633706284e-08, "epoch": 2.9629421673217293, "percentage": 98.95, "elapsed_time": "1 day, 6:05:32", "remaining_time": "0:19:10"}
|
| 660 |
+
{"current_steps": 660, "total_steps": 666, "loss": 0.3411, "lr": 1.9803536725180317e-08, "epoch": 2.9674340258281866, "percentage": 99.1, "elapsed_time": "1 day, 6:08:12", "remaining_time": "0:16:26"}
|
| 661 |
+
{"current_steps": 661, "total_steps": 666, "loss": 0.3486, "lr": 1.3752802835407254e-08, "epoch": 2.9719258843346434, "percentage": 99.25, "elapsed_time": "1 day, 6:11:02", "remaining_time": "0:13:41"}
|
| 662 |
+
{"current_steps": 662, "total_steps": 666, "loss": 0.3483, "lr": 8.801975402650264e-09, "epoch": 2.9764177428411003, "percentage": 99.4, "elapsed_time": "1 day, 6:14:01", "remaining_time": "0:10:57"}
|
| 663 |
+
{"current_steps": 663, "total_steps": 666, "loss": 0.3475, "lr": 4.951190609898682e-09, "epoch": 2.9809096013475576, "percentage": 99.55, "elapsed_time": "1 day, 6:16:49", "remaining_time": "0:08:13"}
|
| 664 |
+
{"current_steps": 664, "total_steps": 666, "loss": 0.338, "lr": 2.2005543811554066e-09, "epoch": 2.985401459854015, "percentage": 99.7, "elapsed_time": "1 day, 6:19:31", "remaining_time": "0:05:28"}
|
| 665 |
+
{"current_steps": 665, "total_steps": 666, "loss": 0.3412, "lr": 5.501423784970428e-10, "epoch": 2.9898933183604717, "percentage": 99.85, "elapsed_time": "1 day, 6:22:16", "remaining_time": "0:02:44"}
|
| 666 |
+
{"current_steps": 666, "total_steps": 666, "loss": 0.3482, "lr": 0.0, "epoch": 2.9943851768669285, "percentage": 100.0, "elapsed_time": "1 day, 6:25:07", "remaining_time": "0:00:00"}
|
| 667 |
+
{"current_steps": 666, "total_steps": 666, "epoch": 2.9943851768669285, "percentage": 100.0, "elapsed_time": "1 day, 6:26:39", "remaining_time": "0:00:00"}
|