Training in progress, epoch 2
Browse files
model-00001-of-00004.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 4877660776
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:e795508ebec89f295035341ade3ba77125295b62ca970443295b63f098a16a82
|
| 3 |
size 4877660776
|
model-00002-of-00004.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 4932751008
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:20ab3649a53fddb436c86aebed066f0406dff082a21051c2c6631a589ba9bd32
|
| 3 |
size 4932751008
|
model-00003-of-00004.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 4330865200
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:e3a5f44af34400ce1270043ef5ad64a3686a0d60f6fc8aa8d313ed8ee7342f46
|
| 3 |
size 4330865200
|
model-00004-of-00004.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 1089994880
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:37650b56615a5cb6fb4122d63727649255a9b8aea66eeae83c2932f92bfd7e77
|
| 3 |
size 1089994880
|
trainer_log.jsonl
CHANGED
|
@@ -494,3 +494,249 @@
|
|
| 494 |
{"current_steps": 494, "total_steps": 1230, "loss": 0.3212, "lr": 2.9901530542287044e-05, "epoch": 2.0060790273556233, "percentage": 40.16, "elapsed_time": "5:39:51", "remaining_time": "8:26:20"}
|
| 495 |
{"current_steps": 495, "total_steps": 1230, "loss": 0.3317, "lr": 2.9852175996655676e-05, "epoch": 2.010131712259372, "percentage": 40.24, "elapsed_time": "5:40:30", "remaining_time": "8:25:36"}
|
| 496 |
{"current_steps": 496, "total_steps": 1230, "loss": 0.3276, "lr": 2.980274210295326e-05, "epoch": 2.0141843971631204, "percentage": 40.33, "elapsed_time": "5:41:11", "remaining_time": "8:24:54"}
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 494 |
{"current_steps": 494, "total_steps": 1230, "loss": 0.3212, "lr": 2.9901530542287044e-05, "epoch": 2.0060790273556233, "percentage": 40.16, "elapsed_time": "5:39:51", "remaining_time": "8:26:20"}
|
| 495 |
{"current_steps": 495, "total_steps": 1230, "loss": 0.3317, "lr": 2.9852175996655676e-05, "epoch": 2.010131712259372, "percentage": 40.24, "elapsed_time": "5:40:30", "remaining_time": "8:25:36"}
|
| 496 |
{"current_steps": 496, "total_steps": 1230, "loss": 0.3276, "lr": 2.980274210295326e-05, "epoch": 2.0141843971631204, "percentage": 40.33, "elapsed_time": "5:41:11", "remaining_time": "8:24:54"}
|
| 497 |
+
{"current_steps": 497, "total_steps": 1230, "loss": 0.3202, "lr": 2.9753229259313578e-05, "epoch": 2.0182370820668694, "percentage": 40.41, "elapsed_time": "5:41:51", "remaining_time": "8:24:10"}
|
| 498 |
+
{"current_steps": 498, "total_steps": 1230, "loss": 0.3083, "lr": 2.9703637864506274e-05, "epoch": 2.022289766970618, "percentage": 40.49, "elapsed_time": "5:42:32", "remaining_time": "8:23:29"}
|
| 499 |
+
{"current_steps": 499, "total_steps": 1230, "loss": 0.3147, "lr": 2.965396831793362e-05, "epoch": 2.026342451874367, "percentage": 40.57, "elapsed_time": "5:43:14", "remaining_time": "8:22:49"}
|
| 500 |
+
{"current_steps": 500, "total_steps": 1230, "loss": 0.3203, "lr": 2.9604221019627316e-05, "epoch": 2.0303951367781155, "percentage": 40.65, "elapsed_time": "5:43:56", "remaining_time": "8:22:08"}
|
| 501 |
+
{"current_steps": 501, "total_steps": 1230, "loss": 0.3232, "lr": 2.955439637024526e-05, "epoch": 2.0344478216818644, "percentage": 40.73, "elapsed_time": "5:44:38", "remaining_time": "8:21:29"}
|
| 502 |
+
{"current_steps": 502, "total_steps": 1230, "loss": 0.3248, "lr": 2.9504494771068334e-05, "epoch": 2.038500506585613, "percentage": 40.81, "elapsed_time": "5:45:23", "remaining_time": "8:20:52"}
|
| 503 |
+
{"current_steps": 503, "total_steps": 1230, "loss": 0.3022, "lr": 2.9454516623997156e-05, "epoch": 2.0425531914893615, "percentage": 40.89, "elapsed_time": "5:46:03", "remaining_time": "8:20:10"}
|
| 504 |
+
{"current_steps": 504, "total_steps": 1230, "loss": 0.3181, "lr": 2.9404462331548847e-05, "epoch": 2.0466058763931105, "percentage": 40.98, "elapsed_time": "5:46:42", "remaining_time": "8:19:25"}
|
| 505 |
+
{"current_steps": 505, "total_steps": 1230, "loss": 0.3149, "lr": 2.93543322968538e-05, "epoch": 2.050658561296859, "percentage": 41.06, "elapsed_time": "5:47:23", "remaining_time": "8:18:44"}
|
| 506 |
+
{"current_steps": 506, "total_steps": 1230, "loss": 0.2998, "lr": 2.9304126923652428e-05, "epoch": 2.054711246200608, "percentage": 41.14, "elapsed_time": "5:48:05", "remaining_time": "8:18:03"}
|
| 507 |
+
{"current_steps": 507, "total_steps": 1230, "loss": 0.32, "lr": 2.9253846616291896e-05, "epoch": 2.0587639311043566, "percentage": 41.22, "elapsed_time": "5:48:42", "remaining_time": "8:17:16"}
|
| 508 |
+
{"current_steps": 508, "total_steps": 1230, "loss": 0.3319, "lr": 2.9203491779722896e-05, "epoch": 2.062816616008105, "percentage": 41.3, "elapsed_time": "5:49:27", "remaining_time": "8:16:39"}
|
| 509 |
+
{"current_steps": 509, "total_steps": 1230, "loss": 0.3138, "lr": 2.9153062819496357e-05, "epoch": 2.066869300911854, "percentage": 41.38, "elapsed_time": "5:50:08", "remaining_time": "8:15:59"}
|
| 510 |
+
{"current_steps": 510, "total_steps": 1230, "loss": 0.3231, "lr": 2.9102560141760178e-05, "epoch": 2.0709219858156027, "percentage": 41.46, "elapsed_time": "5:50:48", "remaining_time": "8:15:15"}
|
| 511 |
+
{"current_steps": 511, "total_steps": 1230, "loss": 0.3158, "lr": 2.9051984153256004e-05, "epoch": 2.0749746707193517, "percentage": 41.54, "elapsed_time": "5:51:33", "remaining_time": "8:14:39"}
|
| 512 |
+
{"current_steps": 512, "total_steps": 1230, "loss": 0.3163, "lr": 2.900133526131588e-05, "epoch": 2.0790273556231003, "percentage": 41.63, "elapsed_time": "5:52:14", "remaining_time": "8:13:57"}
|
| 513 |
+
{"current_steps": 513, "total_steps": 1230, "loss": 0.3174, "lr": 2.8950613873859025e-05, "epoch": 2.0830800405268493, "percentage": 41.71, "elapsed_time": "5:52:54", "remaining_time": "8:13:14"}
|
| 514 |
+
{"current_steps": 514, "total_steps": 1230, "loss": 0.3027, "lr": 2.8899820399388515e-05, "epoch": 2.087132725430598, "percentage": 41.79, "elapsed_time": "5:53:32", "remaining_time": "8:12:28"}
|
| 515 |
+
{"current_steps": 515, "total_steps": 1230, "loss": 0.3183, "lr": 2.8848955246988012e-05, "epoch": 2.0911854103343464, "percentage": 41.87, "elapsed_time": "5:54:15", "remaining_time": "8:11:49"}
|
| 516 |
+
{"current_steps": 516, "total_steps": 1230, "loss": 0.3282, "lr": 2.879801882631847e-05, "epoch": 2.0952380952380953, "percentage": 41.95, "elapsed_time": "5:55:01", "remaining_time": "8:11:14"}
|
| 517 |
+
{"current_steps": 517, "total_steps": 1230, "loss": 0.2908, "lr": 2.8747011547614808e-05, "epoch": 2.099290780141844, "percentage": 42.03, "elapsed_time": "5:55:42", "remaining_time": "8:10:33"}
|
| 518 |
+
{"current_steps": 518, "total_steps": 1230, "loss": 0.3024, "lr": 2.8695933821682635e-05, "epoch": 2.103343465045593, "percentage": 42.11, "elapsed_time": "5:56:22", "remaining_time": "8:09:50"}
|
| 519 |
+
{"current_steps": 519, "total_steps": 1230, "loss": 0.3203, "lr": 2.864478605989494e-05, "epoch": 2.1073961499493414, "percentage": 42.2, "elapsed_time": "5:57:01", "remaining_time": "8:09:05"}
|
| 520 |
+
{"current_steps": 520, "total_steps": 1230, "loss": 0.3267, "lr": 2.8593568674188765e-05, "epoch": 2.11144883485309, "percentage": 42.28, "elapsed_time": "5:57:42", "remaining_time": "8:08:24"}
|
| 521 |
+
{"current_steps": 521, "total_steps": 1230, "loss": 0.3148, "lr": 2.8542282077061892e-05, "epoch": 2.115501519756839, "percentage": 42.36, "elapsed_time": "5:58:22", "remaining_time": "8:07:41"}
|
| 522 |
+
{"current_steps": 522, "total_steps": 1230, "loss": 0.3084, "lr": 2.8490926681569523e-05, "epoch": 2.1195542046605875, "percentage": 42.44, "elapsed_time": "5:58:59", "remaining_time": "8:06:53"}
|
| 523 |
+
{"current_steps": 523, "total_steps": 1230, "loss": 0.3009, "lr": 2.8439502901320956e-05, "epoch": 2.1236068895643365, "percentage": 42.52, "elapsed_time": "5:59:38", "remaining_time": "8:06:10"}
|
| 524 |
+
{"current_steps": 524, "total_steps": 1230, "loss": 0.3235, "lr": 2.8388011150476237e-05, "epoch": 2.127659574468085, "percentage": 42.6, "elapsed_time": "6:00:19", "remaining_time": "8:05:28"}
|
| 525 |
+
{"current_steps": 525, "total_steps": 1230, "loss": 0.3117, "lr": 2.8336451843742866e-05, "epoch": 2.1317122593718336, "percentage": 42.68, "elapsed_time": "6:01:03", "remaining_time": "8:04:51"}
|
| 526 |
+
{"current_steps": 526, "total_steps": 1230, "loss": 0.3158, "lr": 2.8284825396372387e-05, "epoch": 2.1357649442755826, "percentage": 42.76, "elapsed_time": "6:01:44", "remaining_time": "8:04:09"}
|
| 527 |
+
{"current_steps": 527, "total_steps": 1230, "loss": 0.3137, "lr": 2.8233132224157132e-05, "epoch": 2.139817629179331, "percentage": 42.85, "elapsed_time": "6:02:23", "remaining_time": "8:03:24"}
|
| 528 |
+
{"current_steps": 528, "total_steps": 1230, "loss": 0.3246, "lr": 2.8181372743426805e-05, "epoch": 2.14387031408308, "percentage": 42.93, "elapsed_time": "6:03:04", "remaining_time": "8:02:43"}
|
| 529 |
+
{"current_steps": 529, "total_steps": 1230, "loss": 0.3172, "lr": 2.8129547371045128e-05, "epoch": 2.1479229989868287, "percentage": 43.01, "elapsed_time": "6:03:41", "remaining_time": "8:01:56"}
|
| 530 |
+
{"current_steps": 530, "total_steps": 1230, "loss": 0.3095, "lr": 2.8077656524406534e-05, "epoch": 2.1519756838905777, "percentage": 43.09, "elapsed_time": "6:04:18", "remaining_time": "8:01:09"}
|
| 531 |
+
{"current_steps": 531, "total_steps": 1230, "loss": 0.3218, "lr": 2.802570062143278e-05, "epoch": 2.1560283687943262, "percentage": 43.17, "elapsed_time": "6:04:56", "remaining_time": "8:00:24"}
|
| 532 |
+
{"current_steps": 532, "total_steps": 1230, "loss": 0.3037, "lr": 2.7973680080569555e-05, "epoch": 2.160081053698075, "percentage": 43.25, "elapsed_time": "6:05:36", "remaining_time": "7:59:41"}
|
| 533 |
+
{"current_steps": 533, "total_steps": 1230, "loss": 0.3298, "lr": 2.792159532078314e-05, "epoch": 2.164133738601824, "percentage": 43.33, "elapsed_time": "6:06:19", "remaining_time": "7:59:02"}
|
| 534 |
+
{"current_steps": 534, "total_steps": 1230, "loss": 0.2986, "lr": 2.7869446761557033e-05, "epoch": 2.1681864235055723, "percentage": 43.41, "elapsed_time": "6:06:57", "remaining_time": "7:58:17"}
|
| 535 |
+
{"current_steps": 535, "total_steps": 1230, "loss": 0.3106, "lr": 2.781723482288857e-05, "epoch": 2.1722391084093213, "percentage": 43.5, "elapsed_time": "6:07:39", "remaining_time": "7:57:37"}
|
| 536 |
+
{"current_steps": 536, "total_steps": 1230, "loss": 0.3109, "lr": 2.7764959925285517e-05, "epoch": 2.17629179331307, "percentage": 43.58, "elapsed_time": "6:08:24", "remaining_time": "7:57:00"}
|
| 537 |
+
{"current_steps": 537, "total_steps": 1230, "loss": 0.3214, "lr": 2.771262248976272e-05, "epoch": 2.180344478216819, "percentage": 43.66, "elapsed_time": "6:09:04", "remaining_time": "7:56:17"}
|
| 538 |
+
{"current_steps": 538, "total_steps": 1230, "loss": 0.3361, "lr": 2.7660222937838677e-05, "epoch": 2.1843971631205674, "percentage": 43.74, "elapsed_time": "6:09:46", "remaining_time": "7:55:37"}
|
| 539 |
+
{"current_steps": 539, "total_steps": 1230, "loss": 0.314, "lr": 2.7607761691532186e-05, "epoch": 2.188449848024316, "percentage": 43.82, "elapsed_time": "6:10:26", "remaining_time": "7:54:54"}
|
| 540 |
+
{"current_steps": 540, "total_steps": 1230, "loss": 0.3078, "lr": 2.7555239173358916e-05, "epoch": 2.192502532928065, "percentage": 43.9, "elapsed_time": "6:11:07", "remaining_time": "7:54:12"}
|
| 541 |
+
{"current_steps": 541, "total_steps": 1230, "loss": 0.3173, "lr": 2.7502655806328e-05, "epoch": 2.1965552178318135, "percentage": 43.98, "elapsed_time": "6:11:42", "remaining_time": "7:53:23"}
|
| 542 |
+
{"current_steps": 542, "total_steps": 1230, "loss": 0.319, "lr": 2.7450012013938648e-05, "epoch": 2.2006079027355625, "percentage": 44.07, "elapsed_time": "6:12:23", "remaining_time": "7:52:42"}
|
| 543 |
+
{"current_steps": 543, "total_steps": 1230, "loss": 0.3158, "lr": 2.739730822017673e-05, "epoch": 2.204660587639311, "percentage": 44.15, "elapsed_time": "6:13:04", "remaining_time": "7:52:00"}
|
| 544 |
+
{"current_steps": 544, "total_steps": 1230, "loss": 0.3238, "lr": 2.7344544849511355e-05, "epoch": 2.2087132725430596, "percentage": 44.23, "elapsed_time": "6:13:46", "remaining_time": "7:51:20"}
|
| 545 |
+
{"current_steps": 545, "total_steps": 1230, "loss": 0.3062, "lr": 2.7291722326891456e-05, "epoch": 2.2127659574468086, "percentage": 44.31, "elapsed_time": "6:14:26", "remaining_time": "7:50:37"}
|
| 546 |
+
{"current_steps": 546, "total_steps": 1230, "loss": 0.3032, "lr": 2.723884107774236e-05, "epoch": 2.216818642350557, "percentage": 44.39, "elapsed_time": "6:15:09", "remaining_time": "7:49:58"}
|
| 547 |
+
{"current_steps": 547, "total_steps": 1230, "loss": 0.3097, "lr": 2.718590152796239e-05, "epoch": 2.220871327254306, "percentage": 44.47, "elapsed_time": "6:15:47", "remaining_time": "7:49:13"}
|
| 548 |
+
{"current_steps": 548, "total_steps": 1230, "loss": 0.3182, "lr": 2.71329041039194e-05, "epoch": 2.2249240121580547, "percentage": 44.55, "elapsed_time": "6:16:27", "remaining_time": "7:48:30"}
|
| 549 |
+
{"current_steps": 549, "total_steps": 1230, "loss": 0.3137, "lr": 2.7079849232447357e-05, "epoch": 2.2289766970618032, "percentage": 44.63, "elapsed_time": "6:17:02", "remaining_time": "7:47:42"}
|
| 550 |
+
{"current_steps": 550, "total_steps": 1230, "loss": 0.3083, "lr": 2.7026737340842895e-05, "epoch": 2.2330293819655522, "percentage": 44.72, "elapsed_time": "6:17:43", "remaining_time": "7:46:59"}
|
| 551 |
+
{"current_steps": 551, "total_steps": 1230, "loss": 0.3085, "lr": 2.697356885686189e-05, "epoch": 2.237082066869301, "percentage": 44.8, "elapsed_time": "6:18:25", "remaining_time": "7:46:19"}
|
| 552 |
+
{"current_steps": 552, "total_steps": 1230, "loss": 0.323, "lr": 2.6920344208716014e-05, "epoch": 2.2411347517730498, "percentage": 44.88, "elapsed_time": "6:19:03", "remaining_time": "7:45:35"}
|
| 553 |
+
{"current_steps": 553, "total_steps": 1230, "loss": 0.3196, "lr": 2.6867063825069252e-05, "epoch": 2.2451874366767983, "percentage": 44.96, "elapsed_time": "6:19:40", "remaining_time": "7:44:48"}
|
| 554 |
+
{"current_steps": 554, "total_steps": 1230, "loss": 0.3136, "lr": 2.6813728135034494e-05, "epoch": 2.2492401215805473, "percentage": 45.04, "elapsed_time": "6:20:20", "remaining_time": "7:44:05"}
|
| 555 |
+
{"current_steps": 555, "total_steps": 1230, "loss": 0.3049, "lr": 2.6760337568170056e-05, "epoch": 2.253292806484296, "percentage": 45.12, "elapsed_time": "6:21:00", "remaining_time": "7:43:23"}
|
| 556 |
+
{"current_steps": 556, "total_steps": 1230, "loss": 0.3266, "lr": 2.6706892554476226e-05, "epoch": 2.2573454913880444, "percentage": 45.2, "elapsed_time": "6:21:43", "remaining_time": "7:42:44"}
|
| 557 |
+
{"current_steps": 557, "total_steps": 1230, "loss": 0.3137, "lr": 2.6653393524391795e-05, "epoch": 2.2613981762917934, "percentage": 45.28, "elapsed_time": "6:22:27", "remaining_time": "7:42:06"}
|
| 558 |
+
{"current_steps": 558, "total_steps": 1230, "loss": 0.3162, "lr": 2.6599840908790592e-05, "epoch": 2.265450861195542, "percentage": 45.37, "elapsed_time": "6:23:13", "remaining_time": "7:41:31"}
|
| 559 |
+
{"current_steps": 559, "total_steps": 1230, "loss": 0.3275, "lr": 2.6546235138978028e-05, "epoch": 2.269503546099291, "percentage": 45.45, "elapsed_time": "6:23:53", "remaining_time": "7:40:47"}
|
| 560 |
+
{"current_steps": 560, "total_steps": 1230, "loss": 0.3257, "lr": 2.6492576646687597e-05, "epoch": 2.2735562310030395, "percentage": 45.53, "elapsed_time": "6:24:35", "remaining_time": "7:40:07"}
|
| 561 |
+
{"current_steps": 561, "total_steps": 1230, "loss": 0.3344, "lr": 2.6438865864077425e-05, "epoch": 2.2776089159067885, "percentage": 45.61, "elapsed_time": "6:25:17", "remaining_time": "7:39:28"}
|
| 562 |
+
{"current_steps": 562, "total_steps": 1230, "loss": 0.3136, "lr": 2.6385103223726766e-05, "epoch": 2.281661600810537, "percentage": 45.69, "elapsed_time": "6:25:57", "remaining_time": "7:38:45"}
|
| 563 |
+
{"current_steps": 563, "total_steps": 1230, "loss": 0.3371, "lr": 2.6331289158632537e-05, "epoch": 2.2857142857142856, "percentage": 45.77, "elapsed_time": "6:26:38", "remaining_time": "7:38:04"}
|
| 564 |
+
{"current_steps": 564, "total_steps": 1230, "loss": 0.3192, "lr": 2.6277424102205817e-05, "epoch": 2.2897669706180346, "percentage": 45.85, "elapsed_time": "6:27:23", "remaining_time": "7:37:27"}
|
| 565 |
+
{"current_steps": 565, "total_steps": 1230, "loss": 0.3027, "lr": 2.6223508488268374e-05, "epoch": 2.293819655521783, "percentage": 45.93, "elapsed_time": "6:28:02", "remaining_time": "7:36:42"}
|
| 566 |
+
{"current_steps": 566, "total_steps": 1230, "loss": 0.3159, "lr": 2.6169542751049148e-05, "epoch": 2.297872340425532, "percentage": 46.02, "elapsed_time": "6:28:43", "remaining_time": "7:36:01"}
|
| 567 |
+
{"current_steps": 567, "total_steps": 1230, "loss": 0.3118, "lr": 2.6115527325180754e-05, "epoch": 2.3019250253292807, "percentage": 46.1, "elapsed_time": "6:29:22", "remaining_time": "7:35:18"}
|
| 568 |
+
{"current_steps": 568, "total_steps": 1230, "loss": 0.3235, "lr": 2.606146264569603e-05, "epoch": 2.305977710233029, "percentage": 46.18, "elapsed_time": "6:30:00", "remaining_time": "7:34:33"}
|
| 569 |
+
{"current_steps": 569, "total_steps": 1230, "loss": 0.3102, "lr": 2.6007349148024447e-05, "epoch": 2.310030395136778, "percentage": 46.26, "elapsed_time": "6:30:43", "remaining_time": "7:33:53"}
|
| 570 |
+
{"current_steps": 570, "total_steps": 1230, "loss": 0.3117, "lr": 2.5953187267988694e-05, "epoch": 2.3140830800405268, "percentage": 46.34, "elapsed_time": "6:31:26", "remaining_time": "7:33:14"}
|
| 571 |
+
{"current_steps": 571, "total_steps": 1230, "loss": 0.321, "lr": 2.5898977441801097e-05, "epoch": 2.3181357649442758, "percentage": 46.42, "elapsed_time": "6:32:07", "remaining_time": "7:32:33"}
|
| 572 |
+
{"current_steps": 572, "total_steps": 1230, "loss": 0.3225, "lr": 2.584472010606015e-05, "epoch": 2.3221884498480243, "percentage": 46.5, "elapsed_time": "6:32:48", "remaining_time": "7:31:52"}
|
| 573 |
+
{"current_steps": 573, "total_steps": 1230, "loss": 0.3198, "lr": 2.5790415697746976e-05, "epoch": 2.326241134751773, "percentage": 46.59, "elapsed_time": "6:33:25", "remaining_time": "7:31:05"}
|
| 574 |
+
{"current_steps": 574, "total_steps": 1230, "loss": 0.2939, "lr": 2.5736064654221808e-05, "epoch": 2.330293819655522, "percentage": 46.67, "elapsed_time": "6:34:07", "remaining_time": "7:30:25"}
|
| 575 |
+
{"current_steps": 575, "total_steps": 1230, "loss": 0.3002, "lr": 2.568166741322048e-05, "epoch": 2.3343465045592704, "percentage": 46.75, "elapsed_time": "6:34:46", "remaining_time": "7:29:41"}
|
| 576 |
+
{"current_steps": 576, "total_steps": 1230, "loss": 0.3285, "lr": 2.56272244128509e-05, "epoch": 2.3383991894630194, "percentage": 46.83, "elapsed_time": "6:35:26", "remaining_time": "7:28:59"}
|
| 577 |
+
{"current_steps": 577, "total_steps": 1230, "loss": 0.3162, "lr": 2.55727360915895e-05, "epoch": 2.342451874366768, "percentage": 46.91, "elapsed_time": "6:36:09", "remaining_time": "7:28:20"}
|
| 578 |
+
{"current_steps": 578, "total_steps": 1230, "loss": 0.3176, "lr": 2.5518202888277734e-05, "epoch": 2.3465045592705165, "percentage": 46.99, "elapsed_time": "6:36:51", "remaining_time": "7:27:39"}
|
| 579 |
+
{"current_steps": 579, "total_steps": 1230, "loss": 0.3301, "lr": 2.5463625242118523e-05, "epoch": 2.3505572441742655, "percentage": 47.07, "elapsed_time": "6:37:31", "remaining_time": "7:26:57"}
|
| 580 |
+
{"current_steps": 580, "total_steps": 1230, "loss": 0.3072, "lr": 2.5409003592672723e-05, "epoch": 2.354609929078014, "percentage": 47.15, "elapsed_time": "6:38:13", "remaining_time": "7:26:17"}
|
| 581 |
+
{"current_steps": 581, "total_steps": 1230, "loss": 0.3116, "lr": 2.535433837985559e-05, "epoch": 2.358662613981763, "percentage": 47.24, "elapsed_time": "6:38:54", "remaining_time": "7:25:35"}
|
| 582 |
+
{"current_steps": 582, "total_steps": 1230, "loss": 0.307, "lr": 2.529963004393324e-05, "epoch": 2.3627152988855116, "percentage": 47.32, "elapsed_time": "6:39:34", "remaining_time": "7:24:53"}
|
| 583 |
+
{"current_steps": 583, "total_steps": 1230, "loss": 0.3279, "lr": 2.524487902551908e-05, "epoch": 2.3667679837892606, "percentage": 47.4, "elapsed_time": "6:40:17", "remaining_time": "7:24:14"}
|
| 584 |
+
{"current_steps": 584, "total_steps": 1230, "loss": 0.3135, "lr": 2.519008576557029e-05, "epoch": 2.370820668693009, "percentage": 47.48, "elapsed_time": "6:40:57", "remaining_time": "7:23:31"}
|
| 585 |
+
{"current_steps": 585, "total_steps": 1230, "loss": 0.3221, "lr": 2.5135250705384254e-05, "epoch": 2.3748733535967577, "percentage": 47.56, "elapsed_time": "6:41:42", "remaining_time": "7:22:54"}
|
| 586 |
+
{"current_steps": 586, "total_steps": 1230, "loss": 0.326, "lr": 2.5080374286595007e-05, "epoch": 2.3789260385005067, "percentage": 47.64, "elapsed_time": "6:42:25", "remaining_time": "7:22:15"}
|
| 587 |
+
{"current_steps": 587, "total_steps": 1230, "loss": 0.3264, "lr": 2.5025456951169677e-05, "epoch": 2.382978723404255, "percentage": 47.72, "elapsed_time": "6:43:03", "remaining_time": "7:21:30"}
|
| 588 |
+
{"current_steps": 588, "total_steps": 1230, "loss": 0.3277, "lr": 2.4970499141404942e-05, "epoch": 2.387031408308004, "percentage": 47.8, "elapsed_time": "6:43:42", "remaining_time": "7:20:47"}
|
| 589 |
+
{"current_steps": 589, "total_steps": 1230, "loss": 0.315, "lr": 2.491550129992345e-05, "epoch": 2.3910840932117527, "percentage": 47.89, "elapsed_time": "6:44:23", "remaining_time": "7:20:06"}
|
| 590 |
+
{"current_steps": 590, "total_steps": 1230, "loss": 0.3232, "lr": 2.486046386967024e-05, "epoch": 2.3951367781155017, "percentage": 47.97, "elapsed_time": "6:45:05", "remaining_time": "7:19:25"}
|
| 591 |
+
{"current_steps": 591, "total_steps": 1230, "loss": 0.319, "lr": 2.4805387293909214e-05, "epoch": 2.3991894630192503, "percentage": 48.05, "elapsed_time": "6:45:51", "remaining_time": "7:18:48"}
|
| 592 |
+
{"current_steps": 592, "total_steps": 1230, "loss": 0.3124, "lr": 2.4750272016219552e-05, "epoch": 2.403242147922999, "percentage": 48.13, "elapsed_time": "6:46:31", "remaining_time": "7:18:06"}
|
| 593 |
+
{"current_steps": 593, "total_steps": 1230, "loss": 0.3158, "lr": 2.4695118480492114e-05, "epoch": 2.407294832826748, "percentage": 48.21, "elapsed_time": "6:47:10", "remaining_time": "7:17:22"}
|
| 594 |
+
{"current_steps": 594, "total_steps": 1230, "loss": 0.3219, "lr": 2.4639927130925898e-05, "epoch": 2.4113475177304964, "percentage": 48.29, "elapsed_time": "6:47:49", "remaining_time": "7:16:39"}
|
| 595 |
+
{"current_steps": 595, "total_steps": 1230, "loss": 0.3277, "lr": 2.458469841202444e-05, "epoch": 2.4154002026342454, "percentage": 48.37, "elapsed_time": "6:48:33", "remaining_time": "7:16:01"}
|
| 596 |
+
{"current_steps": 596, "total_steps": 1230, "loss": 0.305, "lr": 2.452943276859226e-05, "epoch": 2.419452887537994, "percentage": 48.46, "elapsed_time": "6:49:17", "remaining_time": "7:15:22"}
|
| 597 |
+
{"current_steps": 597, "total_steps": 1230, "loss": 0.3192, "lr": 2.447413064573125e-05, "epoch": 2.4235055724417425, "percentage": 48.54, "elapsed_time": "6:49:57", "remaining_time": "7:14:40"}
|
| 598 |
+
{"current_steps": 598, "total_steps": 1230, "loss": 0.3209, "lr": 2.4418792488837095e-05, "epoch": 2.4275582573454915, "percentage": 48.62, "elapsed_time": "6:50:38", "remaining_time": "7:13:59"}
|
| 599 |
+
{"current_steps": 599, "total_steps": 1230, "loss": 0.3233, "lr": 2.4363418743595713e-05, "epoch": 2.43161094224924, "percentage": 48.7, "elapsed_time": "6:51:19", "remaining_time": "7:13:18"}
|
| 600 |
+
{"current_steps": 600, "total_steps": 1230, "loss": 0.3071, "lr": 2.430800985597963e-05, "epoch": 2.435663627152989, "percentage": 48.78, "elapsed_time": "6:52:03", "remaining_time": "7:12:39"}
|
| 601 |
+
{"current_steps": 601, "total_steps": 1230, "loss": 0.3182, "lr": 2.4252566272244415e-05, "epoch": 2.4397163120567376, "percentage": 48.86, "elapsed_time": "6:52:45", "remaining_time": "7:11:59"}
|
| 602 |
+
{"current_steps": 602, "total_steps": 1230, "loss": 0.3243, "lr": 2.4197088438925063e-05, "epoch": 2.443768996960486, "percentage": 48.94, "elapsed_time": "6:53:22", "remaining_time": "7:11:13"}
|
| 603 |
+
{"current_steps": 603, "total_steps": 1230, "loss": 0.3035, "lr": 2.4141576802832417e-05, "epoch": 2.447821681864235, "percentage": 49.02, "elapsed_time": "6:54:04", "remaining_time": "7:10:32"}
|
| 604 |
+
{"current_steps": 604, "total_steps": 1230, "loss": 0.3158, "lr": 2.408603181104957e-05, "epoch": 2.4518743667679836, "percentage": 49.11, "elapsed_time": "6:54:45", "remaining_time": "7:09:51"}
|
| 605 |
+
{"current_steps": 605, "total_steps": 1230, "loss": 0.3079, "lr": 2.4030453910928245e-05, "epoch": 2.4559270516717326, "percentage": 49.19, "elapsed_time": "6:55:20", "remaining_time": "7:09:04"}
|
| 606 |
+
{"current_steps": 606, "total_steps": 1230, "loss": 0.321, "lr": 2.397484355008521e-05, "epoch": 2.459979736575481, "percentage": 49.27, "elapsed_time": "6:56:00", "remaining_time": "7:08:21"}
|
| 607 |
+
{"current_steps": 607, "total_steps": 1230, "loss": 0.3251, "lr": 2.3919201176398662e-05, "epoch": 2.46403242147923, "percentage": 49.35, "elapsed_time": "6:56:41", "remaining_time": "7:07:41"}
|
| 608 |
+
{"current_steps": 608, "total_steps": 1230, "loss": 0.3242, "lr": 2.3863527238004633e-05, "epoch": 2.4680851063829787, "percentage": 49.43, "elapsed_time": "6:57:23", "remaining_time": "7:06:59"}
|
| 609 |
+
{"current_steps": 609, "total_steps": 1230, "loss": 0.3062, "lr": 2.380782218329337e-05, "epoch": 2.4721377912867273, "percentage": 49.51, "elapsed_time": "6:58:00", "remaining_time": "7:06:14"}
|
| 610 |
+
{"current_steps": 610, "total_steps": 1230, "loss": 0.3141, "lr": 2.3752086460905725e-05, "epoch": 2.4761904761904763, "percentage": 49.59, "elapsed_time": "6:58:38", "remaining_time": "7:05:29"}
|
| 611 |
+
{"current_steps": 611, "total_steps": 1230, "loss": 0.3385, "lr": 2.3696320519729544e-05, "epoch": 2.480243161094225, "percentage": 49.67, "elapsed_time": "6:59:19", "remaining_time": "7:04:48"}
|
| 612 |
+
{"current_steps": 612, "total_steps": 1230, "loss": 0.3178, "lr": 2.3640524808896045e-05, "epoch": 2.484295845997974, "percentage": 49.76, "elapsed_time": "7:00:02", "remaining_time": "7:04:09"}
|
| 613 |
+
{"current_steps": 613, "total_steps": 1230, "loss": 0.3154, "lr": 2.3584699777776222e-05, "epoch": 2.4883485309017224, "percentage": 49.84, "elapsed_time": "7:00:45", "remaining_time": "7:03:30"}
|
| 614 |
+
{"current_steps": 614, "total_steps": 1230, "loss": 0.3323, "lr": 2.3528845875977195e-05, "epoch": 2.4924012158054714, "percentage": 49.92, "elapsed_time": "7:01:24", "remaining_time": "7:02:47"}
|
| 615 |
+
{"current_steps": 615, "total_steps": 1230, "loss": 0.3132, "lr": 2.3472963553338614e-05, "epoch": 2.49645390070922, "percentage": 50.0, "elapsed_time": "7:02:06", "remaining_time": "7:02:06"}
|
| 616 |
+
{"current_steps": 616, "total_steps": 1230, "loss": 0.3273, "lr": 2.341705325992901e-05, "epoch": 2.5005065856129685, "percentage": 50.08, "elapsed_time": "7:02:47", "remaining_time": "7:01:25"}
|
| 617 |
+
{"current_steps": 617, "total_steps": 1230, "loss": 0.3104, "lr": 2.336111544604222e-05, "epoch": 2.5045592705167175, "percentage": 50.16, "elapsed_time": "7:03:28", "remaining_time": "7:00:44"}
|
| 618 |
+
{"current_steps": 618, "total_steps": 1230, "loss": 0.3191, "lr": 2.33051505621937e-05, "epoch": 2.508611955420466, "percentage": 50.24, "elapsed_time": "7:04:08", "remaining_time": "7:00:01"}
|
| 619 |
+
{"current_steps": 619, "total_steps": 1230, "loss": 0.3101, "lr": 2.324915905911693e-05, "epoch": 2.512664640324215, "percentage": 50.33, "elapsed_time": "7:04:50", "remaining_time": "6:59:21"}
|
| 620 |
+
{"current_steps": 620, "total_steps": 1230, "loss": 0.3185, "lr": 2.319314138775977e-05, "epoch": 2.5167173252279635, "percentage": 50.41, "elapsed_time": "7:05:29", "remaining_time": "6:58:37"}
|
| 621 |
+
{"current_steps": 621, "total_steps": 1230, "loss": 0.3284, "lr": 2.3137097999280856e-05, "epoch": 2.520770010131712, "percentage": 50.49, "elapsed_time": "7:06:08", "remaining_time": "6:57:54"}
|
| 622 |
+
{"current_steps": 622, "total_steps": 1230, "loss": 0.3176, "lr": 2.308102934504593e-05, "epoch": 2.524822695035461, "percentage": 50.57, "elapsed_time": "7:06:49", "remaining_time": "6:57:13"}
|
| 623 |
+
{"current_steps": 623, "total_steps": 1230, "loss": 0.2925, "lr": 2.3024935876624222e-05, "epoch": 2.5288753799392096, "percentage": 50.65, "elapsed_time": "7:07:25", "remaining_time": "6:56:27"}
|
| 624 |
+
{"current_steps": 624, "total_steps": 1230, "loss": 0.3101, "lr": 2.2968818045784813e-05, "epoch": 2.5329280648429586, "percentage": 50.73, "elapsed_time": "7:08:06", "remaining_time": "6:55:45"}
|
| 625 |
+
{"current_steps": 625, "total_steps": 1230, "loss": 0.3188, "lr": 2.2912676304493006e-05, "epoch": 2.536980749746707, "percentage": 50.81, "elapsed_time": "7:08:44", "remaining_time": "6:55:01"}
|
| 626 |
+
{"current_steps": 626, "total_steps": 1230, "loss": 0.3236, "lr": 2.2856511104906668e-05, "epoch": 2.5410334346504557, "percentage": 50.89, "elapsed_time": "7:09:26", "remaining_time": "6:54:20"}
|
| 627 |
+
{"current_steps": 627, "total_steps": 1230, "loss": 0.335, "lr": 2.2800322899372586e-05, "epoch": 2.5450861195542047, "percentage": 50.98, "elapsed_time": "7:10:03", "remaining_time": "6:53:35"}
|
| 628 |
+
{"current_steps": 628, "total_steps": 1230, "loss": 0.3195, "lr": 2.2744112140422844e-05, "epoch": 2.5491388044579533, "percentage": 51.06, "elapsed_time": "7:10:44", "remaining_time": "6:52:54"}
|
| 629 |
+
{"current_steps": 629, "total_steps": 1230, "loss": 0.3228, "lr": 2.2687879280771177e-05, "epoch": 2.5531914893617023, "percentage": 51.14, "elapsed_time": "7:11:26", "remaining_time": "6:52:13"}
|
| 630 |
+
{"current_steps": 630, "total_steps": 1230, "loss": 0.3166, "lr": 2.26316247733093e-05, "epoch": 2.557244174265451, "percentage": 51.22, "elapsed_time": "7:12:06", "remaining_time": "6:51:31"}
|
| 631 |
+
{"current_steps": 631, "total_steps": 1230, "loss": 0.3208, "lr": 2.257534907110328e-05, "epoch": 2.5612968591691994, "percentage": 51.3, "elapsed_time": "7:12:49", "remaining_time": "6:50:52"}
|
| 632 |
+
{"current_steps": 632, "total_steps": 1230, "loss": 0.3213, "lr": 2.2519052627389882e-05, "epoch": 2.5653495440729484, "percentage": 51.38, "elapsed_time": "7:13:27", "remaining_time": "6:50:08"}
|
| 633 |
+
{"current_steps": 633, "total_steps": 1230, "loss": 0.3233, "lr": 2.246273589557294e-05, "epoch": 2.569402228976697, "percentage": 51.46, "elapsed_time": "7:14:08", "remaining_time": "6:49:26"}
|
| 634 |
+
{"current_steps": 634, "total_steps": 1230, "loss": 0.3179, "lr": 2.240639932921966e-05, "epoch": 2.573454913880446, "percentage": 51.54, "elapsed_time": "7:14:48", "remaining_time": "6:48:44"}
|
| 635 |
+
{"current_steps": 635, "total_steps": 1230, "loss": 0.3306, "lr": 2.2350043382056995e-05, "epoch": 2.5775075987841944, "percentage": 51.63, "elapsed_time": "7:15:30", "remaining_time": "6:48:04"}
|
| 636 |
+
{"current_steps": 636, "total_steps": 1230, "loss": 0.3099, "lr": 2.2293668507968015e-05, "epoch": 2.581560283687943, "percentage": 51.71, "elapsed_time": "7:16:11", "remaining_time": "6:47:22"}
|
| 637 |
+
{"current_steps": 637, "total_steps": 1230, "loss": 0.3208, "lr": 2.2237275160988186e-05, "epoch": 2.585612968591692, "percentage": 51.79, "elapsed_time": "7:16:49", "remaining_time": "6:46:38"}
|
| 638 |
+
{"current_steps": 638, "total_steps": 1230, "loss": 0.3209, "lr": 2.2180863795301787e-05, "epoch": 2.589665653495441, "percentage": 51.87, "elapsed_time": "7:17:29", "remaining_time": "6:45:56"}
|
| 639 |
+
{"current_steps": 639, "total_steps": 1230, "loss": 0.3248, "lr": 2.212443486523819e-05, "epoch": 2.5937183383991895, "percentage": 51.95, "elapsed_time": "7:18:12", "remaining_time": "6:45:17"}
|
| 640 |
+
{"current_steps": 640, "total_steps": 1230, "loss": 0.3258, "lr": 2.2067988825268243e-05, "epoch": 2.597771023302938, "percentage": 52.03, "elapsed_time": "7:18:54", "remaining_time": "6:44:37"}
|
| 641 |
+
{"current_steps": 641, "total_steps": 1230, "loss": 0.3181, "lr": 2.2011526130000596e-05, "epoch": 2.601823708206687, "percentage": 52.11, "elapsed_time": "7:19:34", "remaining_time": "6:43:54"}
|
| 642 |
+
{"current_steps": 642, "total_steps": 1230, "loss": 0.3129, "lr": 2.1955047234178038e-05, "epoch": 2.6058763931104356, "percentage": 52.2, "elapsed_time": "7:20:13", "remaining_time": "6:43:11"}
|
| 643 |
+
{"current_steps": 643, "total_steps": 1230, "loss": 0.3139, "lr": 2.1898552592673825e-05, "epoch": 2.6099290780141846, "percentage": 52.28, "elapsed_time": "7:20:53", "remaining_time": "6:42:29"}
|
| 644 |
+
{"current_steps": 644, "total_steps": 1230, "loss": 0.3214, "lr": 2.184204266048803e-05, "epoch": 2.613981762917933, "percentage": 52.36, "elapsed_time": "7:21:37", "remaining_time": "6:41:51"}
|
| 645 |
+
{"current_steps": 645, "total_steps": 1230, "loss": 0.314, "lr": 2.1785517892743887e-05, "epoch": 2.6180344478216817, "percentage": 52.44, "elapsed_time": "7:22:18", "remaining_time": "6:41:09"}
|
| 646 |
+
{"current_steps": 646, "total_steps": 1230, "loss": 0.3182, "lr": 2.17289787446841e-05, "epoch": 2.6220871327254307, "percentage": 52.52, "elapsed_time": "7:23:00", "remaining_time": "6:40:29"}
|
| 647 |
+
{"current_steps": 647, "total_steps": 1230, "loss": 0.3054, "lr": 2.1672425671667198e-05, "epoch": 2.6261398176291793, "percentage": 52.6, "elapsed_time": "7:23:39", "remaining_time": "6:39:46"}
|
| 648 |
+
{"current_steps": 648, "total_steps": 1230, "loss": 0.3244, "lr": 2.161585912916385e-05, "epoch": 2.6301925025329282, "percentage": 52.68, "elapsed_time": "7:24:19", "remaining_time": "6:39:04"}
|
| 649 |
+
{"current_steps": 649, "total_steps": 1230, "loss": 0.308, "lr": 2.1559279572753214e-05, "epoch": 2.634245187436677, "percentage": 52.76, "elapsed_time": "7:24:59", "remaining_time": "6:38:21"}
|
| 650 |
+
{"current_steps": 650, "total_steps": 1230, "loss": 0.3176, "lr": 2.1502687458119268e-05, "epoch": 2.6382978723404253, "percentage": 52.85, "elapsed_time": "7:25:43", "remaining_time": "6:37:43"}
|
| 651 |
+
{"current_steps": 651, "total_steps": 1230, "loss": 0.3135, "lr": 2.1446083241047116e-05, "epoch": 2.6423505572441743, "percentage": 52.93, "elapsed_time": "7:26:19", "remaining_time": "6:36:57"}
|
| 652 |
+
{"current_steps": 652, "total_steps": 1230, "loss": 0.3174, "lr": 2.1389467377419333e-05, "epoch": 2.646403242147923, "percentage": 53.01, "elapsed_time": "7:26:58", "remaining_time": "6:36:14"}
|
| 653 |
+
{"current_steps": 653, "total_steps": 1230, "loss": 0.3085, "lr": 2.133284032321232e-05, "epoch": 2.650455927051672, "percentage": 53.09, "elapsed_time": "7:27:33", "remaining_time": "6:35:28"}
|
| 654 |
+
{"current_steps": 654, "total_steps": 1230, "loss": 0.3163, "lr": 2.1276202534492566e-05, "epoch": 2.6545086119554204, "percentage": 53.17, "elapsed_time": "7:28:10", "remaining_time": "6:34:42"}
|
| 655 |
+
{"current_steps": 655, "total_steps": 1230, "loss": 0.3255, "lr": 2.121955446741306e-05, "epoch": 2.658561296859169, "percentage": 53.25, "elapsed_time": "7:28:52", "remaining_time": "6:34:03"}
|
| 656 |
+
{"current_steps": 656, "total_steps": 1230, "loss": 0.3227, "lr": 2.1162896578209517e-05, "epoch": 2.662613981762918, "percentage": 53.33, "elapsed_time": "7:29:33", "remaining_time": "6:33:22"}
|
| 657 |
+
{"current_steps": 657, "total_steps": 1230, "loss": 0.336, "lr": 2.1106229323196813e-05, "epoch": 2.6666666666666665, "percentage": 53.41, "elapsed_time": "7:30:13", "remaining_time": "6:32:39"}
|
| 658 |
+
{"current_steps": 658, "total_steps": 1230, "loss": 0.3254, "lr": 2.1049553158765214e-05, "epoch": 2.6707193515704155, "percentage": 53.5, "elapsed_time": "7:30:56", "remaining_time": "6:32:00"}
|
| 659 |
+
{"current_steps": 659, "total_steps": 1230, "loss": 0.3056, "lr": 2.0992868541376764e-05, "epoch": 2.674772036474164, "percentage": 53.58, "elapsed_time": "7:31:33", "remaining_time": "6:31:15"}
|
| 660 |
+
{"current_steps": 660, "total_steps": 1230, "loss": 0.3053, "lr": 2.093617592756158e-05, "epoch": 2.6788247213779126, "percentage": 53.66, "elapsed_time": "7:32:09", "remaining_time": "6:30:29"}
|
| 661 |
+
{"current_steps": 661, "total_steps": 1230, "loss": 0.3074, "lr": 2.0879475773914167e-05, "epoch": 2.6828774062816616, "percentage": 53.74, "elapsed_time": "7:32:50", "remaining_time": "6:29:48"}
|
| 662 |
+
{"current_steps": 662, "total_steps": 1230, "loss": 0.3084, "lr": 2.082276853708978e-05, "epoch": 2.6869300911854106, "percentage": 53.82, "elapsed_time": "7:33:32", "remaining_time": "6:29:08"}
|
| 663 |
+
{"current_steps": 663, "total_steps": 1230, "loss": 0.3232, "lr": 2.076605467380071e-05, "epoch": 2.690982776089159, "percentage": 53.9, "elapsed_time": "7:34:16", "remaining_time": "6:28:30"}
|
| 664 |
+
{"current_steps": 664, "total_steps": 1230, "loss": 0.3176, "lr": 2.0709334640812613e-05, "epoch": 2.6950354609929077, "percentage": 53.98, "elapsed_time": "7:35:00", "remaining_time": "6:27:51"}
|
| 665 |
+
{"current_steps": 665, "total_steps": 1230, "loss": 0.2986, "lr": 2.0652608894940824e-05, "epoch": 2.6990881458966567, "percentage": 54.07, "elapsed_time": "7:35:40", "remaining_time": "6:27:09"}
|
| 666 |
+
{"current_steps": 666, "total_steps": 1230, "loss": 0.3174, "lr": 2.0595877893046722e-05, "epoch": 2.7031408308004052, "percentage": 54.15, "elapsed_time": "7:36:24", "remaining_time": "6:26:30"}
|
| 667 |
+
{"current_steps": 667, "total_steps": 1230, "loss": 0.3109, "lr": 2.0539142092033985e-05, "epoch": 2.7071935157041542, "percentage": 54.23, "elapsed_time": "7:37:07", "remaining_time": "6:25:51"}
|
| 668 |
+
{"current_steps": 668, "total_steps": 1230, "loss": 0.321, "lr": 2.048240194884496e-05, "epoch": 2.711246200607903, "percentage": 54.31, "elapsed_time": "7:37:48", "remaining_time": "6:25:09"}
|
| 669 |
+
{"current_steps": 669, "total_steps": 1230, "loss": 0.3125, "lr": 2.042565792045695e-05, "epoch": 2.7152988855116513, "percentage": 54.39, "elapsed_time": "7:38:31", "remaining_time": "6:24:30"}
|
| 670 |
+
{"current_steps": 670, "total_steps": 1230, "loss": 0.3027, "lr": 2.036891046387857e-05, "epoch": 2.7193515704154003, "percentage": 54.47, "elapsed_time": "7:39:11", "remaining_time": "6:23:47"}
|
| 671 |
+
{"current_steps": 671, "total_steps": 1230, "loss": 0.3382, "lr": 2.0312160036146036e-05, "epoch": 2.723404255319149, "percentage": 54.55, "elapsed_time": "7:39:52", "remaining_time": "6:23:07"}
|
| 672 |
+
{"current_steps": 672, "total_steps": 1230, "loss": 0.3013, "lr": 2.025540709431948e-05, "epoch": 2.727456940222898, "percentage": 54.63, "elapsed_time": "7:40:33", "remaining_time": "6:22:25"}
|
| 673 |
+
{"current_steps": 673, "total_steps": 1230, "loss": 0.3269, "lr": 2.0198652095479298e-05, "epoch": 2.7315096251266464, "percentage": 54.72, "elapsed_time": "7:41:12", "remaining_time": "6:21:43"}
|
| 674 |
+
{"current_steps": 674, "total_steps": 1230, "loss": 0.3046, "lr": 2.014189549672245e-05, "epoch": 2.735562310030395, "percentage": 54.8, "elapsed_time": "7:41:51", "remaining_time": "6:20:59"}
|
| 675 |
+
{"current_steps": 675, "total_steps": 1230, "loss": 0.319, "lr": 2.0085137755158776e-05, "epoch": 2.739614994934144, "percentage": 54.88, "elapsed_time": "7:42:28", "remaining_time": "6:20:15"}
|
| 676 |
+
{"current_steps": 676, "total_steps": 1230, "loss": 0.303, "lr": 2.0028379327907327e-05, "epoch": 2.7436676798378925, "percentage": 54.96, "elapsed_time": "7:43:07", "remaining_time": "6:19:32"}
|
| 677 |
+
{"current_steps": 677, "total_steps": 1230, "loss": 0.3261, "lr": 1.9971620672092676e-05, "epoch": 2.7477203647416415, "percentage": 55.04, "elapsed_time": "7:43:45", "remaining_time": "6:18:49"}
|
| 678 |
+
{"current_steps": 678, "total_steps": 1230, "loss": 0.317, "lr": 1.991486224484123e-05, "epoch": 2.75177304964539, "percentage": 55.12, "elapsed_time": "7:44:24", "remaining_time": "6:18:06"}
|
| 679 |
+
{"current_steps": 679, "total_steps": 1230, "loss": 0.3245, "lr": 1.985810450327756e-05, "epoch": 2.7558257345491386, "percentage": 55.2, "elapsed_time": "7:45:07", "remaining_time": "6:17:26"}
|
| 680 |
+
{"current_steps": 680, "total_steps": 1230, "loss": 0.32, "lr": 1.9801347904520706e-05, "epoch": 2.7598784194528876, "percentage": 55.28, "elapsed_time": "7:45:50", "remaining_time": "6:16:46"}
|
| 681 |
+
{"current_steps": 681, "total_steps": 1230, "loss": 0.323, "lr": 1.974459290568053e-05, "epoch": 2.763931104356636, "percentage": 55.37, "elapsed_time": "7:46:26", "remaining_time": "6:16:01"}
|
| 682 |
+
{"current_steps": 682, "total_steps": 1230, "loss": 0.3151, "lr": 1.968783996385397e-05, "epoch": 2.767983789260385, "percentage": 55.45, "elapsed_time": "7:47:06", "remaining_time": "6:15:19"}
|
| 683 |
+
{"current_steps": 683, "total_steps": 1230, "loss": 0.3287, "lr": 1.963108953612143e-05, "epoch": 2.7720364741641337, "percentage": 55.53, "elapsed_time": "7:47:45", "remaining_time": "6:14:36"}
|
| 684 |
+
{"current_steps": 684, "total_steps": 1230, "loss": 0.3106, "lr": 1.9574342079543056e-05, "epoch": 2.7760891590678822, "percentage": 55.61, "elapsed_time": "7:48:21", "remaining_time": "6:13:51"}
|
| 685 |
+
{"current_steps": 685, "total_steps": 1230, "loss": 0.3217, "lr": 1.9517598051155046e-05, "epoch": 2.780141843971631, "percentage": 55.69, "elapsed_time": "7:48:59", "remaining_time": "6:13:08"}
|
| 686 |
+
{"current_steps": 686, "total_steps": 1230, "loss": 0.3107, "lr": 1.9460857907966025e-05, "epoch": 2.78419452887538, "percentage": 55.77, "elapsed_time": "7:49:40", "remaining_time": "6:12:27"}
|
| 687 |
+
{"current_steps": 687, "total_steps": 1230, "loss": 0.3279, "lr": 1.9404122106953285e-05, "epoch": 2.7882472137791288, "percentage": 55.85, "elapsed_time": "7:50:23", "remaining_time": "6:11:47"}
|
| 688 |
+
{"current_steps": 688, "total_steps": 1230, "loss": 0.3185, "lr": 1.9347391105059176e-05, "epoch": 2.7922998986828773, "percentage": 55.93, "elapsed_time": "7:51:06", "remaining_time": "6:11:07"}
|
| 689 |
+
{"current_steps": 689, "total_steps": 1230, "loss": 0.3391, "lr": 1.92906653591874e-05, "epoch": 2.7963525835866263, "percentage": 56.02, "elapsed_time": "7:51:46", "remaining_time": "6:10:25"}
|
| 690 |
+
{"current_steps": 690, "total_steps": 1230, "loss": 0.3023, "lr": 1.9233945326199295e-05, "epoch": 2.800405268490375, "percentage": 56.1, "elapsed_time": "7:52:24", "remaining_time": "6:09:42"}
|
| 691 |
+
{"current_steps": 691, "total_steps": 1230, "loss": 0.3187, "lr": 1.917723146291022e-05, "epoch": 2.804457953394124, "percentage": 56.18, "elapsed_time": "7:53:02", "remaining_time": "6:08:59"}
|
| 692 |
+
{"current_steps": 692, "total_steps": 1230, "loss": 0.3203, "lr": 1.912052422608584e-05, "epoch": 2.8085106382978724, "percentage": 56.26, "elapsed_time": "7:53:46", "remaining_time": "6:08:20"}
|
| 693 |
+
{"current_steps": 693, "total_steps": 1230, "loss": 0.3111, "lr": 1.9063824072438428e-05, "epoch": 2.812563323201621, "percentage": 56.34, "elapsed_time": "7:54:26", "remaining_time": "6:07:38"}
|
| 694 |
+
{"current_steps": 694, "total_steps": 1230, "loss": 0.3183, "lr": 1.9007131458623246e-05, "epoch": 2.81661600810537, "percentage": 56.42, "elapsed_time": "7:55:07", "remaining_time": "6:06:57"}
|
| 695 |
+
{"current_steps": 695, "total_steps": 1230, "loss": 0.3177, "lr": 1.895044684123479e-05, "epoch": 2.8206686930091185, "percentage": 56.5, "elapsed_time": "7:55:48", "remaining_time": "6:06:15"}
|
| 696 |
+
{"current_steps": 696, "total_steps": 1230, "loss": 0.3199, "lr": 1.8893770676803194e-05, "epoch": 2.8247213779128675, "percentage": 56.59, "elapsed_time": "7:56:28", "remaining_time": "6:05:33"}
|
| 697 |
+
{"current_steps": 697, "total_steps": 1230, "loss": 0.3189, "lr": 1.8837103421790486e-05, "epoch": 2.828774062816616, "percentage": 56.67, "elapsed_time": "7:57:08", "remaining_time": "6:04:52"}
|
| 698 |
+
{"current_steps": 698, "total_steps": 1230, "loss": 0.3044, "lr": 1.8780445532586952e-05, "epoch": 2.8328267477203646, "percentage": 56.75, "elapsed_time": "7:57:47", "remaining_time": "6:04:09"}
|
| 699 |
+
{"current_steps": 699, "total_steps": 1230, "loss": 0.3285, "lr": 1.872379746550743e-05, "epoch": 2.8368794326241136, "percentage": 56.83, "elapsed_time": "7:58:25", "remaining_time": "6:03:26"}
|
| 700 |
+
{"current_steps": 700, "total_steps": 1230, "loss": 0.3179, "lr": 1.866715967678769e-05, "epoch": 2.840932117527862, "percentage": 56.91, "elapsed_time": "7:59:04", "remaining_time": "6:02:43"}
|
| 701 |
+
{"current_steps": 701, "total_steps": 1230, "loss": 0.331, "lr": 1.861053262258067e-05, "epoch": 2.844984802431611, "percentage": 56.99, "elapsed_time": "7:59:45", "remaining_time": "6:02:02"}
|
| 702 |
+
{"current_steps": 702, "total_steps": 1230, "loss": 0.3402, "lr": 1.8553916758952897e-05, "epoch": 2.8490374873353597, "percentage": 57.07, "elapsed_time": "8:00:26", "remaining_time": "6:01:21"}
|
| 703 |
+
{"current_steps": 703, "total_steps": 1230, "loss": 0.3157, "lr": 1.8497312541880735e-05, "epoch": 2.853090172239108, "percentage": 57.15, "elapsed_time": "8:01:09", "remaining_time": "6:00:41"}
|
| 704 |
+
{"current_steps": 704, "total_steps": 1230, "loss": 0.309, "lr": 1.8440720427246786e-05, "epoch": 2.857142857142857, "percentage": 57.24, "elapsed_time": "8:01:45", "remaining_time": "5:59:57"}
|
| 705 |
+
{"current_steps": 705, "total_steps": 1230, "loss": 0.3171, "lr": 1.8384140870836157e-05, "epoch": 2.8611955420466058, "percentage": 57.32, "elapsed_time": "8:02:27", "remaining_time": "5:59:16"}
|
| 706 |
+
{"current_steps": 706, "total_steps": 1230, "loss": 0.3229, "lr": 1.8327574328332806e-05, "epoch": 2.8652482269503547, "percentage": 57.4, "elapsed_time": "8:03:11", "remaining_time": "5:58:37"}
|
| 707 |
+
{"current_steps": 707, "total_steps": 1230, "loss": 0.3251, "lr": 1.8271021255315906e-05, "epoch": 2.8693009118541033, "percentage": 57.48, "elapsed_time": "8:03:47", "remaining_time": "5:57:52"}
|
| 708 |
+
{"current_steps": 708, "total_steps": 1230, "loss": 0.3163, "lr": 1.8214482107256117e-05, "epoch": 2.873353596757852, "percentage": 57.56, "elapsed_time": "8:04:26", "remaining_time": "5:57:10"}
|
| 709 |
+
{"current_steps": 709, "total_steps": 1230, "loss": 0.3103, "lr": 1.8157957339511968e-05, "epoch": 2.877406281661601, "percentage": 57.64, "elapsed_time": "8:05:08", "remaining_time": "5:56:30"}
|
| 710 |
+
{"current_steps": 710, "total_steps": 1230, "loss": 0.3171, "lr": 1.8101447407326182e-05, "epoch": 2.8814589665653494, "percentage": 57.72, "elapsed_time": "8:05:50", "remaining_time": "5:55:49"}
|
| 711 |
+
{"current_steps": 711, "total_steps": 1230, "loss": 0.3017, "lr": 1.8044952765821966e-05, "epoch": 2.8855116514690984, "percentage": 57.8, "elapsed_time": "8:06:26", "remaining_time": "5:55:04"}
|
| 712 |
+
{"current_steps": 712, "total_steps": 1230, "loss": 0.311, "lr": 1.7988473869999407e-05, "epoch": 2.889564336372847, "percentage": 57.89, "elapsed_time": "8:07:08", "remaining_time": "5:54:24"}
|
| 713 |
+
{"current_steps": 713, "total_steps": 1230, "loss": 0.3087, "lr": 1.7932011174731764e-05, "epoch": 2.8936170212765955, "percentage": 57.97, "elapsed_time": "8:07:46", "remaining_time": "5:53:41"}
|
| 714 |
+
{"current_steps": 714, "total_steps": 1230, "loss": 0.3228, "lr": 1.7875565134761817e-05, "epoch": 2.8976697061803445, "percentage": 58.05, "elapsed_time": "8:08:27", "remaining_time": "5:53:00"}
|
| 715 |
+
{"current_steps": 715, "total_steps": 1230, "loss": 0.3148, "lr": 1.7819136204698226e-05, "epoch": 2.9017223910840935, "percentage": 58.13, "elapsed_time": "8:09:08", "remaining_time": "5:52:19"}
|
| 716 |
+
{"current_steps": 716, "total_steps": 1230, "loss": 0.3202, "lr": 1.776272483901182e-05, "epoch": 2.905775075987842, "percentage": 58.21, "elapsed_time": "8:09:46", "remaining_time": "5:51:35"}
|
| 717 |
+
{"current_steps": 717, "total_steps": 1230, "loss": 0.2989, "lr": 1.7706331492031995e-05, "epoch": 2.9098277608915906, "percentage": 58.29, "elapsed_time": "8:10:29", "remaining_time": "5:50:56"}
|
| 718 |
+
{"current_steps": 718, "total_steps": 1230, "loss": 0.3235, "lr": 1.764995661794301e-05, "epoch": 2.9138804457953396, "percentage": 58.37, "elapsed_time": "8:11:10", "remaining_time": "5:50:15"}
|
| 719 |
+
{"current_steps": 719, "total_steps": 1230, "loss": 0.3087, "lr": 1.759360067078035e-05, "epoch": 2.917933130699088, "percentage": 58.46, "elapsed_time": "8:11:49", "remaining_time": "5:49:32"}
|
| 720 |
+
{"current_steps": 720, "total_steps": 1230, "loss": 0.3192, "lr": 1.7537264104427064e-05, "epoch": 2.921985815602837, "percentage": 58.54, "elapsed_time": "8:12:31", "remaining_time": "5:48:52"}
|
| 721 |
+
{"current_steps": 721, "total_steps": 1230, "loss": 0.3179, "lr": 1.748094737261012e-05, "epoch": 2.9260385005065856, "percentage": 58.62, "elapsed_time": "8:13:12", "remaining_time": "5:48:11"}
|
| 722 |
+
{"current_steps": 722, "total_steps": 1230, "loss": 0.3161, "lr": 1.7424650928896726e-05, "epoch": 2.930091185410334, "percentage": 58.7, "elapsed_time": "8:13:51", "remaining_time": "5:47:28"}
|
| 723 |
+
{"current_steps": 723, "total_steps": 1230, "loss": 0.3035, "lr": 1.7368375226690712e-05, "epoch": 2.934143870314083, "percentage": 58.78, "elapsed_time": "8:14:35", "remaining_time": "5:46:49"}
|
| 724 |
+
{"current_steps": 724, "total_steps": 1230, "loss": 0.3196, "lr": 1.731212071922883e-05, "epoch": 2.9381965552178317, "percentage": 58.86, "elapsed_time": "8:15:14", "remaining_time": "5:46:07"}
|
| 725 |
+
{"current_steps": 725, "total_steps": 1230, "loss": 0.3113, "lr": 1.7255887859577156e-05, "epoch": 2.9422492401215807, "percentage": 58.94, "elapsed_time": "8:15:54", "remaining_time": "5:45:25"}
|
| 726 |
+
{"current_steps": 726, "total_steps": 1230, "loss": 0.3163, "lr": 1.7199677100627427e-05, "epoch": 2.9463019250253293, "percentage": 59.02, "elapsed_time": "8:16:33", "remaining_time": "5:44:43"}
|
| 727 |
+
{"current_steps": 727, "total_steps": 1230, "loss": 0.3115, "lr": 1.7143488895093343e-05, "epoch": 2.950354609929078, "percentage": 59.11, "elapsed_time": "8:17:11", "remaining_time": "5:44:00"}
|
| 728 |
+
{"current_steps": 728, "total_steps": 1230, "loss": 0.3139, "lr": 1.7087323695506994e-05, "epoch": 2.954407294832827, "percentage": 59.19, "elapsed_time": "8:17:51", "remaining_time": "5:43:17"}
|
| 729 |
+
{"current_steps": 729, "total_steps": 1230, "loss": 0.3103, "lr": 1.7031181954215194e-05, "epoch": 2.9584599797365754, "percentage": 59.27, "elapsed_time": "8:18:32", "remaining_time": "5:42:37"}
|
| 730 |
+
{"current_steps": 730, "total_steps": 1230, "loss": 0.3249, "lr": 1.6975064123375788e-05, "epoch": 2.9625126646403244, "percentage": 59.35, "elapsed_time": "8:19:15", "remaining_time": "5:41:57"}
|
| 731 |
+
{"current_steps": 731, "total_steps": 1230, "loss": 0.3224, "lr": 1.6918970654954084e-05, "epoch": 2.966565349544073, "percentage": 59.43, "elapsed_time": "8:19:57", "remaining_time": "5:41:16"}
|
| 732 |
+
{"current_steps": 732, "total_steps": 1230, "loss": 0.3213, "lr": 1.686290200071915e-05, "epoch": 2.9706180344478215, "percentage": 59.51, "elapsed_time": "8:20:37", "remaining_time": "5:40:35"}
|
| 733 |
+
{"current_steps": 733, "total_steps": 1230, "loss": 0.3196, "lr": 1.6806858612240234e-05, "epoch": 2.9746707193515705, "percentage": 59.59, "elapsed_time": "8:21:12", "remaining_time": "5:39:49"}
|
| 734 |
+
{"current_steps": 734, "total_steps": 1230, "loss": 0.3141, "lr": 1.6750840940883078e-05, "epoch": 2.978723404255319, "percentage": 59.67, "elapsed_time": "8:21:52", "remaining_time": "5:39:08"}
|
| 735 |
+
{"current_steps": 735, "total_steps": 1230, "loss": 0.3108, "lr": 1.6694849437806305e-05, "epoch": 2.982776089159068, "percentage": 59.76, "elapsed_time": "8:22:36", "remaining_time": "5:38:29"}
|
| 736 |
+
{"current_steps": 736, "total_steps": 1230, "loss": 0.3176, "lr": 1.663888455395778e-05, "epoch": 2.9868287740628165, "percentage": 59.84, "elapsed_time": "8:23:18", "remaining_time": "5:37:49"}
|
| 737 |
+
{"current_steps": 737, "total_steps": 1230, "loss": 0.3167, "lr": 1.6582946740070995e-05, "epoch": 2.990881458966565, "percentage": 59.92, "elapsed_time": "8:23:59", "remaining_time": "5:37:08"}
|
| 738 |
+
{"current_steps": 738, "total_steps": 1230, "loss": 0.3059, "lr": 1.6527036446661396e-05, "epoch": 2.994934143870314, "percentage": 60.0, "elapsed_time": "8:24:41", "remaining_time": "5:36:27"}
|
| 739 |
+
{"current_steps": 739, "total_steps": 1230, "loss": 0.3014, "lr": 1.6471154124022818e-05, "epoch": 3.0010131712259374, "percentage": 60.08, "elapsed_time": "8:27:49", "remaining_time": "5:37:23"}
|
| 740 |
+
{"current_steps": 740, "total_steps": 1230, "loss": 0.2657, "lr": 1.6415300222223788e-05, "epoch": 3.005065856129686, "percentage": 60.16, "elapsed_time": "8:28:27", "remaining_time": "5:36:41"}
|
| 741 |
+
{"current_steps": 741, "total_steps": 1230, "loss": 0.2475, "lr": 1.6359475191103958e-05, "epoch": 3.0091185410334345, "percentage": 60.24, "elapsed_time": "8:29:06", "remaining_time": "5:35:58"}
|
| 742 |
+
{"current_steps": 742, "total_steps": 1230, "loss": 0.2577, "lr": 1.6303679480270466e-05, "epoch": 3.0131712259371835, "percentage": 60.33, "elapsed_time": "8:29:48", "remaining_time": "5:35:17"}
|