Training in progress, step 4039
Browse files
model-00001-of-00004.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 4902257696
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:201e8137f626cdd3b97fc3ebc29992415eeb5111e78c6717e7f515272038f5bc
|
| 3 |
size 4902257696
|
model-00002-of-00004.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 4915960368
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:8c42f15401207fa818cb6829acb23927a861570a15eeb89d7c47ebe998a645b6
|
| 3 |
size 4915960368
|
model-00003-of-00004.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 4983068496
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:2be48392d59b30ff24e79ec80e0a3d40c38a21ff0172730bcba0ccd20e9f6d28
|
| 3 |
size 4983068496
|
model-00004-of-00004.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 1580230264
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:78f5c0b01c714bf66ac03e55708b6faf7712ce5f8075bba6fb2888c9a096c521
|
| 3 |
size 1580230264
|
trainer_log.jsonl
CHANGED
|
@@ -612,3 +612,197 @@
|
|
| 612 |
{"current_steps": 3060, "total_steps": 4039, "loss": 0.2397, "lr": 6.754972600084109e-06, "epoch": 5.303555941023417, "percentage": 75.76, "elapsed_time": "12:21:58", "remaining_time": "3:57:23"}
|
| 613 |
{"current_steps": 3065, "total_steps": 4039, "loss": 0.2349, "lr": 6.6903388892327105e-06, "epoch": 5.3122289679098005, "percentage": 75.89, "elapsed_time": "12:23:12", "remaining_time": "3:56:10"}
|
| 614 |
{"current_steps": 3070, "total_steps": 4039, "loss": 0.235, "lr": 6.625953718925837e-06, "epoch": 5.320901994796184, "percentage": 76.01, "elapsed_time": "12:24:30", "remaining_time": "3:54:59"}
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 612 |
{"current_steps": 3060, "total_steps": 4039, "loss": 0.2397, "lr": 6.754972600084109e-06, "epoch": 5.303555941023417, "percentage": 75.76, "elapsed_time": "12:21:58", "remaining_time": "3:57:23"}
|
| 613 |
{"current_steps": 3065, "total_steps": 4039, "loss": 0.2349, "lr": 6.6903388892327105e-06, "epoch": 5.3122289679098005, "percentage": 75.89, "elapsed_time": "12:23:12", "remaining_time": "3:56:10"}
|
| 614 |
{"current_steps": 3070, "total_steps": 4039, "loss": 0.235, "lr": 6.625953718925837e-06, "epoch": 5.320901994796184, "percentage": 76.01, "elapsed_time": "12:24:30", "remaining_time": "3:54:59"}
|
| 615 |
+
{"current_steps": 3075, "total_steps": 4039, "loss": 0.2091, "lr": 6.561818291472493e-06, "epoch": 5.329575021682567, "percentage": 76.13, "elapsed_time": "12:25:41", "remaining_time": "3:53:46"}
|
| 616 |
+
{"current_steps": 3080, "total_steps": 4039, "loss": 0.2877, "lr": 6.497933804518048e-06, "epoch": 5.338248048568951, "percentage": 76.26, "elapsed_time": "12:26:59", "remaining_time": "3:52:35"}
|
| 617 |
+
{"current_steps": 3085, "total_steps": 4039, "loss": 0.2655, "lr": 6.434301451021891e-06, "epoch": 5.346921075455334, "percentage": 76.38, "elapsed_time": "12:28:00", "remaining_time": "3:51:18"}
|
| 618 |
+
{"current_steps": 3090, "total_steps": 4039, "loss": 0.2269, "lr": 6.370922419235142e-06, "epoch": 5.355594102341717, "percentage": 76.5, "elapsed_time": "12:29:17", "remaining_time": "3:50:07"}
|
| 619 |
+
{"current_steps": 3095, "total_steps": 4039, "loss": 0.2185, "lr": 6.307797892678482e-06, "epoch": 5.364267129228101, "percentage": 76.63, "elapsed_time": "12:30:19", "remaining_time": "3:48:51"}
|
| 620 |
+
{"current_steps": 3100, "total_steps": 4039, "loss": 0.2591, "lr": 6.244929050120026e-06, "epoch": 5.372940156114484, "percentage": 76.75, "elapsed_time": "12:31:34", "remaining_time": "3:47:39"}
|
| 621 |
+
{"current_steps": 3105, "total_steps": 4039, "loss": 0.2628, "lr": 6.1823170655533315e-06, "epoch": 5.3816131830008676, "percentage": 76.88, "elapsed_time": "12:32:48", "remaining_time": "3:46:26"}
|
| 622 |
+
{"current_steps": 3110, "total_steps": 4039, "loss": 0.2357, "lr": 6.119963108175464e-06, "epoch": 5.39028620988725, "percentage": 77.0, "elapsed_time": "12:33:57", "remaining_time": "3:45:13"}
|
| 623 |
+
{"current_steps": 3115, "total_steps": 4039, "loss": 0.2565, "lr": 6.057868342365163e-06, "epoch": 5.398959236773634, "percentage": 77.12, "elapsed_time": "12:35:05", "remaining_time": "3:43:58"}
|
| 624 |
+
{"current_steps": 3120, "total_steps": 4039, "loss": 0.2492, "lr": 5.996033927661124e-06, "epoch": 5.407632263660018, "percentage": 77.25, "elapsed_time": "12:36:12", "remaining_time": "3:42:44"}
|
| 625 |
+
{"current_steps": 3125, "total_steps": 4039, "loss": 0.2447, "lr": 5.9344610187403e-06, "epoch": 5.416305290546401, "percentage": 77.37, "elapsed_time": "12:37:30", "remaining_time": "3:41:33"}
|
| 626 |
+
{"current_steps": 3130, "total_steps": 4039, "loss": 0.2597, "lr": 5.873150765396389e-06, "epoch": 5.424978317432784, "percentage": 77.49, "elapsed_time": "12:38:44", "remaining_time": "3:40:21"}
|
| 627 |
+
{"current_steps": 3135, "total_steps": 4039, "loss": 0.2557, "lr": 5.812104312518325e-06, "epoch": 5.433651344319167, "percentage": 77.62, "elapsed_time": "12:39:58", "remaining_time": "3:39:08"}
|
| 628 |
+
{"current_steps": 3140, "total_steps": 4039, "loss": 0.2545, "lr": 5.751322800068904e-06, "epoch": 5.442324371205551, "percentage": 77.74, "elapsed_time": "12:41:13", "remaining_time": "3:37:56"}
|
| 629 |
+
{"current_steps": 3145, "total_steps": 4039, "loss": 0.2657, "lr": 5.690807363063529e-06, "epoch": 5.450997398091934, "percentage": 77.87, "elapsed_time": "12:42:22", "remaining_time": "3:36:42"}
|
| 630 |
+
{"current_steps": 3150, "total_steps": 4039, "loss": 0.2424, "lr": 5.6305591315489765e-06, "epoch": 5.4596704249783174, "percentage": 77.99, "elapsed_time": "12:43:31", "remaining_time": "3:35:29"}
|
| 631 |
+
{"current_steps": 3155, "total_steps": 4039, "loss": 0.2339, "lr": 5.5705792305823e-06, "epoch": 5.468343451864701, "percentage": 78.11, "elapsed_time": "12:44:46", "remaining_time": "3:34:16"}
|
| 632 |
+
{"current_steps": 3160, "total_steps": 4039, "loss": 0.2293, "lr": 5.510868780209859e-06, "epoch": 5.477016478751084, "percentage": 78.24, "elapsed_time": "12:45:45", "remaining_time": "3:33:00"}
|
| 633 |
+
{"current_steps": 3165, "total_steps": 4039, "loss": 0.2602, "lr": 5.451428895446351e-06, "epoch": 5.485689505637468, "percentage": 78.36, "elapsed_time": "12:46:47", "remaining_time": "3:31:44"}
|
| 634 |
+
{"current_steps": 3170, "total_steps": 4039, "loss": 0.2686, "lr": 5.392260686254014e-06, "epoch": 5.4943625325238505, "percentage": 78.48, "elapsed_time": "12:48:04", "remaining_time": "3:30:33"}
|
| 635 |
+
{"current_steps": 3175, "total_steps": 4039, "loss": 0.2234, "lr": 5.333365257521916e-06, "epoch": 5.503035559410234, "percentage": 78.61, "elapsed_time": "12:49:24", "remaining_time": "3:29:22"}
|
| 636 |
+
{"current_steps": 3180, "total_steps": 4039, "loss": 0.2847, "lr": 5.274743709045289e-06, "epoch": 5.511708586296617, "percentage": 78.73, "elapsed_time": "12:50:37", "remaining_time": "3:28:09"}
|
| 637 |
+
{"current_steps": 3185, "total_steps": 4039, "loss": 0.2925, "lr": 5.216397135505025e-06, "epoch": 5.520381613183001, "percentage": 78.86, "elapsed_time": "12:51:55", "remaining_time": "3:26:58"}
|
| 638 |
+
{"current_steps": 3190, "total_steps": 4039, "loss": 0.2065, "lr": 5.1583266264472055e-06, "epoch": 5.5290546400693845, "percentage": 78.98, "elapsed_time": "12:53:06", "remaining_time": "3:25:45"}
|
| 639 |
+
{"current_steps": 3195, "total_steps": 4039, "loss": 0.2575, "lr": 5.100533266262764e-06, "epoch": 5.537727666955767, "percentage": 79.1, "elapsed_time": "12:54:24", "remaining_time": "3:24:34"}
|
| 640 |
+
{"current_steps": 3200, "total_steps": 4039, "loss": 0.2242, "lr": 5.043018134167262e-06, "epoch": 5.546400693842151, "percentage": 79.23, "elapsed_time": "12:55:42", "remaining_time": "3:23:22"}
|
| 641 |
+
{"current_steps": 3205, "total_steps": 4039, "loss": 0.2672, "lr": 4.985782304180693e-06, "epoch": 5.555073720728534, "percentage": 79.35, "elapsed_time": "12:56:51", "remaining_time": "3:22:09"}
|
| 642 |
+
{"current_steps": 3210, "total_steps": 4039, "loss": 0.2188, "lr": 4.928826845107453e-06, "epoch": 5.563746747614918, "percentage": 79.48, "elapsed_time": "12:58:05", "remaining_time": "3:20:56"}
|
| 643 |
+
{"current_steps": 3215, "total_steps": 4039, "loss": 0.2513, "lr": 4.8721528205163895e-06, "epoch": 5.572419774501301, "percentage": 79.6, "elapsed_time": "12:59:12", "remaining_time": "3:19:42"}
|
| 644 |
+
{"current_steps": 3220, "total_steps": 4039, "loss": 0.263, "lr": 4.815761288720919e-06, "epoch": 5.581092801387684, "percentage": 79.72, "elapsed_time": "13:00:23", "remaining_time": "3:18:29"}
|
| 645 |
+
{"current_steps": 3225, "total_steps": 4039, "loss": 0.2611, "lr": 4.759653302759264e-06, "epoch": 5.589765828274068, "percentage": 79.85, "elapsed_time": "13:01:37", "remaining_time": "3:17:17"}
|
| 646 |
+
{"current_steps": 3230, "total_steps": 4039, "loss": 0.2083, "lr": 4.703829910374824e-06, "epoch": 5.598438855160451, "percentage": 79.97, "elapsed_time": "13:02:45", "remaining_time": "3:16:03"}
|
| 647 |
+
{"current_steps": 3235, "total_steps": 4039, "loss": 0.2351, "lr": 4.648292153996563e-06, "epoch": 5.607111882046834, "percentage": 80.09, "elapsed_time": "13:03:58", "remaining_time": "3:14:50"}
|
| 648 |
+
{"current_steps": 3240, "total_steps": 4039, "loss": 0.2315, "lr": 4.593041070719573e-06, "epoch": 5.615784908933218, "percentage": 80.22, "elapsed_time": "13:05:07", "remaining_time": "3:13:36"}
|
| 649 |
+
{"current_steps": 3245, "total_steps": 4039, "loss": 0.2252, "lr": 4.538077692285694e-06, "epoch": 5.624457935819601, "percentage": 80.34, "elapsed_time": "13:06:23", "remaining_time": "3:12:25"}
|
| 650 |
+
{"current_steps": 3250, "total_steps": 4039, "loss": 0.2705, "lr": 4.483403045064272e-06, "epoch": 5.633130962705985, "percentage": 80.47, "elapsed_time": "13:07:37", "remaining_time": "3:11:12"}
|
| 651 |
+
{"current_steps": 3255, "total_steps": 4039, "loss": 0.229, "lr": 4.429018150032956e-06, "epoch": 5.6418039895923675, "percentage": 80.59, "elapsed_time": "13:08:46", "remaining_time": "3:09:59"}
|
| 652 |
+
{"current_steps": 3260, "total_steps": 4039, "loss": 0.2352, "lr": 4.374924022758657e-06, "epoch": 5.650477016478751, "percentage": 80.71, "elapsed_time": "13:10:05", "remaining_time": "3:08:47"}
|
| 653 |
+
{"current_steps": 3265, "total_steps": 4039, "loss": 0.245, "lr": 4.321121673378572e-06, "epoch": 5.659150043365134, "percentage": 80.84, "elapsed_time": "13:11:14", "remaining_time": "3:07:34"}
|
| 654 |
+
{"current_steps": 3270, "total_steps": 4039, "loss": 0.2254, "lr": 4.267612106581347e-06, "epoch": 5.667823070251518, "percentage": 80.96, "elapsed_time": "13:12:26", "remaining_time": "3:06:21"}
|
| 655 |
+
{"current_steps": 3275, "total_steps": 4039, "loss": 0.2411, "lr": 4.214396321588272e-06, "epoch": 5.6764960971379015, "percentage": 81.08, "elapsed_time": "13:13:29", "remaining_time": "3:05:06"}
|
| 656 |
+
{"current_steps": 3280, "total_steps": 4039, "loss": 0.2233, "lr": 4.16147531213465e-06, "epoch": 5.685169124024284, "percentage": 81.21, "elapsed_time": "13:14:49", "remaining_time": "3:03:55"}
|
| 657 |
+
{"current_steps": 3285, "total_steps": 4039, "loss": 0.261, "lr": 4.108850066451256e-06, "epoch": 5.693842150910668, "percentage": 81.33, "elapsed_time": "13:16:07", "remaining_time": "3:02:43"}
|
| 658 |
+
{"current_steps": 3290, "total_steps": 4039, "loss": 0.2274, "lr": 4.056521567245828e-06, "epoch": 5.702515177797051, "percentage": 81.46, "elapsed_time": "13:17:19", "remaining_time": "3:01:31"}
|
| 659 |
+
{"current_steps": 3295, "total_steps": 4039, "loss": 0.2454, "lr": 4.004490791684788e-06, "epoch": 5.711188204683435, "percentage": 81.58, "elapsed_time": "13:18:34", "remaining_time": "3:00:18"}
|
| 660 |
+
{"current_steps": 3300, "total_steps": 4039, "loss": 0.2695, "lr": 3.952758711374931e-06, "epoch": 5.719861231569817, "percentage": 81.7, "elapsed_time": "13:19:37", "remaining_time": "2:59:03"}
|
| 661 |
+
{"current_steps": 3305, "total_steps": 4039, "loss": 0.2753, "lr": 3.901326292345314e-06, "epoch": 5.728534258456201, "percentage": 81.83, "elapsed_time": "13:20:51", "remaining_time": "2:57:51"}
|
| 662 |
+
{"current_steps": 3310, "total_steps": 4039, "loss": 0.2419, "lr": 3.8501944950292184e-06, "epoch": 5.737207285342585, "percentage": 81.95, "elapsed_time": "13:22:07", "remaining_time": "2:56:39"}
|
| 663 |
+
{"current_steps": 3315, "total_steps": 4039, "loss": 0.2532, "lr": 3.7993642742462043e-06, "epoch": 5.745880312228968, "percentage": 82.07, "elapsed_time": "13:23:05", "remaining_time": "2:55:23"}
|
| 664 |
+
{"current_steps": 3320, "total_steps": 4039, "loss": 0.2431, "lr": 3.748836579184274e-06, "epoch": 5.754553339115351, "percentage": 82.2, "elapsed_time": "13:24:17", "remaining_time": "2:54:10"}
|
| 665 |
+
{"current_steps": 3325, "total_steps": 4039, "loss": 0.231, "lr": 3.698612353382176e-06, "epoch": 5.763226366001735, "percentage": 82.32, "elapsed_time": "13:25:28", "remaining_time": "2:52:57"}
|
| 666 |
+
{"current_steps": 3330, "total_steps": 4039, "loss": 0.2122, "lr": 3.648692534711751e-06, "epoch": 5.771899392888118, "percentage": 82.45, "elapsed_time": "13:26:33", "remaining_time": "2:51:43"}
|
| 667 |
+
{"current_steps": 3335, "total_steps": 4039, "loss": 0.2549, "lr": 3.599078055360432e-06, "epoch": 5.780572419774502, "percentage": 82.57, "elapsed_time": "13:27:38", "remaining_time": "2:50:29"}
|
| 668 |
+
{"current_steps": 3340, "total_steps": 4039, "loss": 0.257, "lr": 3.5497698418138573e-06, "epoch": 5.7892454466608845, "percentage": 82.69, "elapsed_time": "13:28:48", "remaining_time": "2:49:16"}
|
| 669 |
+
{"current_steps": 3345, "total_steps": 4039, "loss": 0.2122, "lr": 3.500768814838531e-06, "epoch": 5.797918473547268, "percentage": 82.82, "elapsed_time": "13:30:05", "remaining_time": "2:48:04"}
|
| 670 |
+
{"current_steps": 3350, "total_steps": 4039, "loss": 0.2207, "lr": 3.4520758894646654e-06, "epoch": 5.806591500433651, "percentage": 82.94, "elapsed_time": "13:31:20", "remaining_time": "2:46:52"}
|
| 671 |
+
{"current_steps": 3355, "total_steps": 4039, "loss": 0.288, "lr": 3.4036919749690654e-06, "epoch": 5.815264527320035, "percentage": 83.07, "elapsed_time": "13:32:37", "remaining_time": "2:45:40"}
|
| 672 |
+
{"current_steps": 3360, "total_steps": 4039, "loss": 0.2623, "lr": 3.3556179748581586e-06, "epoch": 5.8239375542064185, "percentage": 83.19, "elapsed_time": "13:33:52", "remaining_time": "2:44:28"}
|
| 673 |
+
{"current_steps": 3365, "total_steps": 4039, "loss": 0.2123, "lr": 3.3078547868511455e-06, "epoch": 5.832610581092801, "percentage": 83.31, "elapsed_time": "13:35:05", "remaining_time": "2:43:15"}
|
| 674 |
+
{"current_steps": 3370, "total_steps": 4039, "loss": 0.2414, "lr": 3.2604033028632e-06, "epoch": 5.841283607979185, "percentage": 83.44, "elapsed_time": "13:36:14", "remaining_time": "2:42:02"}
|
| 675 |
+
{"current_steps": 3375, "total_steps": 4039, "loss": 0.2447, "lr": 3.2132644089888253e-06, "epoch": 5.849956634865568, "percentage": 83.56, "elapsed_time": "13:37:33", "remaining_time": "2:40:50"}
|
| 676 |
+
{"current_steps": 3380, "total_steps": 4039, "loss": 0.2163, "lr": 3.166438985485334e-06, "epoch": 5.8586296617519515, "percentage": 83.68, "elapsed_time": "13:38:48", "remaining_time": "2:39:38"}
|
| 677 |
+
{"current_steps": 3385, "total_steps": 4039, "loss": 0.2509, "lr": 3.1199279067563706e-06, "epoch": 5.867302688638334, "percentage": 83.81, "elapsed_time": "13:39:56", "remaining_time": "2:38:25"}
|
| 678 |
+
{"current_steps": 3390, "total_steps": 4039, "loss": 0.2474, "lr": 3.0737320413356063e-06, "epoch": 5.875975715524718, "percentage": 83.93, "elapsed_time": "13:41:10", "remaining_time": "2:37:12"}
|
| 679 |
+
{"current_steps": 3395, "total_steps": 4039, "loss": 0.2393, "lr": 3.0278522518705177e-06, "epoch": 5.884648742411102, "percentage": 84.06, "elapsed_time": "13:42:24", "remaining_time": "2:36:00"}
|
| 680 |
+
{"current_steps": 3400, "total_steps": 4039, "loss": 0.2438, "lr": 2.9822893951062658e-06, "epoch": 5.893321769297485, "percentage": 84.18, "elapsed_time": "13:43:41", "remaining_time": "2:34:48"}
|
| 681 |
+
{"current_steps": 3405, "total_steps": 4039, "loss": 0.2397, "lr": 2.9370443218697264e-06, "epoch": 5.901994796183868, "percentage": 84.3, "elapsed_time": "13:44:58", "remaining_time": "2:33:36"}
|
| 682 |
+
{"current_steps": 3410, "total_steps": 4039, "loss": 0.234, "lr": 2.8921178770535687e-06, "epoch": 5.910667823070251, "percentage": 84.43, "elapsed_time": "13:46:12", "remaining_time": "2:32:23"}
|
| 683 |
+
{"current_steps": 3415, "total_steps": 4039, "loss": 0.2583, "lr": 2.847510899600485e-06, "epoch": 5.919340849956635, "percentage": 84.55, "elapsed_time": "13:47:24", "remaining_time": "2:31:11"}
|
| 684 |
+
{"current_steps": 3420, "total_steps": 4039, "loss": 0.2667, "lr": 2.8032242224875573e-06, "epoch": 5.928013876843018, "percentage": 84.67, "elapsed_time": "13:48:40", "remaining_time": "2:29:59"}
|
| 685 |
+
{"current_steps": 3425, "total_steps": 4039, "loss": 0.259, "lr": 2.7592586727106517e-06, "epoch": 5.936686903729401, "percentage": 84.8, "elapsed_time": "13:49:51", "remaining_time": "2:28:46"}
|
| 686 |
+
{"current_steps": 3430, "total_steps": 4039, "loss": 0.2646, "lr": 2.715615071269009e-06, "epoch": 5.945359930615785, "percentage": 84.92, "elapsed_time": "13:50:57", "remaining_time": "2:27:32"}
|
| 687 |
+
{"current_steps": 3435, "total_steps": 4039, "loss": 0.2488, "lr": 2.6722942331499125e-06, "epoch": 5.954032957502168, "percentage": 85.05, "elapsed_time": "13:52:03", "remaining_time": "2:26:18"}
|
| 688 |
+
{"current_steps": 3440, "total_steps": 4039, "loss": 0.2242, "lr": 2.6292969673134527e-06, "epoch": 5.962705984388552, "percentage": 85.17, "elapsed_time": "13:53:22", "remaining_time": "2:25:06"}
|
| 689 |
+
{"current_steps": 3445, "total_steps": 4039, "loss": 0.2544, "lr": 2.5866240766774265e-06, "epoch": 5.971379011274935, "percentage": 85.29, "elapsed_time": "13:54:30", "remaining_time": "2:23:53"}
|
| 690 |
+
{"current_steps": 3450, "total_steps": 4039, "loss": 0.2173, "lr": 2.5442763581023664e-06, "epoch": 5.980052038161318, "percentage": 85.42, "elapsed_time": "13:55:36", "remaining_time": "2:22:39"}
|
| 691 |
+
{"current_steps": 3455, "total_steps": 4039, "loss": 0.1968, "lr": 2.5022546023766192e-06, "epoch": 5.988725065047702, "percentage": 85.54, "elapsed_time": "13:56:38", "remaining_time": "2:21:25"}
|
| 692 |
+
{"current_steps": 3460, "total_steps": 4039, "loss": 0.2547, "lr": 2.460559594201617e-06, "epoch": 5.997398091934085, "percentage": 85.66, "elapsed_time": "13:57:48", "remaining_time": "2:20:11"}
|
| 693 |
+
{"current_steps": 3465, "total_steps": 4039, "loss": 0.2973, "lr": 2.4191921121772e-06, "epoch": 6.00520381613183, "percentage": 85.79, "elapsed_time": "13:58:45", "remaining_time": "2:18:56"}
|
| 694 |
+
{"current_steps": 3470, "total_steps": 4039, "loss": 0.2283, "lr": 2.3781529287870786e-06, "epoch": 6.013876843018213, "percentage": 85.91, "elapsed_time": "14:00:00", "remaining_time": "2:17:44"}
|
| 695 |
+
{"current_steps": 3475, "total_steps": 4039, "loss": 0.2239, "lr": 2.337442810384436e-06, "epoch": 6.022549869904597, "percentage": 86.04, "elapsed_time": "14:01:17", "remaining_time": "2:16:32"}
|
| 696 |
+
{"current_steps": 3480, "total_steps": 4039, "loss": 0.2414, "lr": 2.2970625171775774e-06, "epoch": 6.03122289679098, "percentage": 86.16, "elapsed_time": "14:02:19", "remaining_time": "2:15:18"}
|
| 697 |
+
{"current_steps": 3485, "total_steps": 4039, "loss": 0.2267, "lr": 2.2570128032157568e-06, "epoch": 6.0398959236773635, "percentage": 86.28, "elapsed_time": "14:03:29", "remaining_time": "2:14:05"}
|
| 698 |
+
{"current_steps": 3490, "total_steps": 4039, "loss": 0.207, "lr": 2.2172944163750975e-06, "epoch": 6.048568950563746, "percentage": 86.41, "elapsed_time": "14:04:41", "remaining_time": "2:12:52"}
|
| 699 |
+
{"current_steps": 3495, "total_steps": 4039, "loss": 0.2408, "lr": 2.177908098344621e-06, "epoch": 6.05724197745013, "percentage": 86.53, "elapsed_time": "14:06:00", "remaining_time": "2:11:40"}
|
| 700 |
+
{"current_steps": 3500, "total_steps": 4039, "loss": 0.2629, "lr": 2.1388545846123866e-06, "epoch": 6.065915004336514, "percentage": 86.66, "elapsed_time": "14:07:15", "remaining_time": "2:10:28"}
|
| 701 |
+
{"current_steps": 3505, "total_steps": 4039, "loss": 0.2005, "lr": 2.1001346044517847e-06, "epoch": 6.074588031222897, "percentage": 86.78, "elapsed_time": "14:08:30", "remaining_time": "2:09:16"}
|
| 702 |
+
{"current_steps": 3510, "total_steps": 4039, "loss": 0.2344, "lr": 2.061748880907888e-06, "epoch": 6.08326105810928, "percentage": 86.9, "elapsed_time": "14:09:43", "remaining_time": "2:08:03"}
|
| 703 |
+
{"current_steps": 3515, "total_steps": 4039, "loss": 0.2176, "lr": 2.023698130783971e-06, "epoch": 6.091934084995663, "percentage": 87.03, "elapsed_time": "14:10:48", "remaining_time": "2:06:50"}
|
| 704 |
+
{"current_steps": 3520, "total_steps": 4039, "loss": 0.2255, "lr": 1.985983064628114e-06, "epoch": 6.100607111882047, "percentage": 87.15, "elapsed_time": "14:11:58", "remaining_time": "2:05:37"}
|
| 705 |
+
{"current_steps": 3525, "total_steps": 4039, "loss": 0.2201, "lr": 1.948604386719939e-06, "epoch": 6.109280138768431, "percentage": 87.27, "elapsed_time": "14:13:06", "remaining_time": "2:04:23"}
|
| 706 |
+
{"current_steps": 3530, "total_steps": 4039, "loss": 0.2266, "lr": 1.9115627950574533e-06, "epoch": 6.117953165654813, "percentage": 87.4, "elapsed_time": "14:14:24", "remaining_time": "2:03:12"}
|
| 707 |
+
{"current_steps": 3535, "total_steps": 4039, "loss": 0.2236, "lr": 1.8748589813440165e-06, "epoch": 6.126626192541197, "percentage": 87.52, "elapsed_time": "14:15:33", "remaining_time": "2:01:58"}
|
| 708 |
+
{"current_steps": 3540, "total_steps": 4039, "loss": 0.2368, "lr": 1.8384936309754375e-06, "epoch": 6.13529921942758, "percentage": 87.65, "elapsed_time": "14:16:42", "remaining_time": "2:00:45"}
|
| 709 |
+
{"current_steps": 3545, "total_steps": 4039, "loss": 0.213, "lr": 1.8024674230271544e-06, "epoch": 6.143972246313964, "percentage": 87.77, "elapsed_time": "14:17:47", "remaining_time": "1:59:32"}
|
| 710 |
+
{"current_steps": 3550, "total_steps": 4039, "loss": 0.2317, "lr": 1.7667810302415666e-06, "epoch": 6.152645273200347, "percentage": 87.89, "elapsed_time": "14:18:59", "remaining_time": "1:58:19"}
|
| 711 |
+
{"current_steps": 3555, "total_steps": 4039, "loss": 0.2296, "lr": 1.7314351190154633e-06, "epoch": 6.16131830008673, "percentage": 88.02, "elapsed_time": "14:20:11", "remaining_time": "1:57:06"}
|
| 712 |
+
{"current_steps": 3560, "total_steps": 4039, "loss": 0.2366, "lr": 1.6964303493875966e-06, "epoch": 6.169991326973114, "percentage": 88.14, "elapsed_time": "14:21:21", "remaining_time": "1:55:53"}
|
| 713 |
+
{"current_steps": 3565, "total_steps": 4039, "loss": 0.2874, "lr": 1.661767375026333e-06, "epoch": 6.178664353859497, "percentage": 88.26, "elapsed_time": "14:22:39", "remaining_time": "1:54:41"}
|
| 714 |
+
{"current_steps": 3570, "total_steps": 4039, "loss": 0.2621, "lr": 1.6274468432174707e-06, "epoch": 6.1873373807458805, "percentage": 88.39, "elapsed_time": "14:23:46", "remaining_time": "1:53:28"}
|
| 715 |
+
{"current_steps": 3575, "total_steps": 4039, "loss": 0.2278, "lr": 1.5934693948521251e-06, "epoch": 6.196010407632263, "percentage": 88.51, "elapsed_time": "14:24:56", "remaining_time": "1:52:15"}
|
| 716 |
+
{"current_steps": 3580, "total_steps": 4039, "loss": 0.2293, "lr": 1.5598356644147883e-06, "epoch": 6.204683434518647, "percentage": 88.64, "elapsed_time": "14:26:16", "remaining_time": "1:51:04"}
|
| 717 |
+
{"current_steps": 3585, "total_steps": 4039, "loss": 0.2505, "lr": 1.5265462799714659e-06, "epoch": 6.213356461405031, "percentage": 88.76, "elapsed_time": "14:27:28", "remaining_time": "1:49:51"}
|
| 718 |
+
{"current_steps": 3590, "total_steps": 4039, "loss": 0.2173, "lr": 1.4936018631579497e-06, "epoch": 6.222029488291414, "percentage": 88.88, "elapsed_time": "14:28:40", "remaining_time": "1:48:38"}
|
| 719 |
+
{"current_steps": 3595, "total_steps": 4039, "loss": 0.2626, "lr": 1.461003029168211e-06, "epoch": 6.230702515177797, "percentage": 89.01, "elapsed_time": "14:29:52", "remaining_time": "1:47:26"}
|
| 720 |
+
{"current_steps": 3600, "total_steps": 4039, "loss": 0.2382, "lr": 1.4287503867429165e-06, "epoch": 6.23937554206418, "percentage": 89.13, "elapsed_time": "14:30:54", "remaining_time": "1:46:12"}
|
| 721 |
+
{"current_steps": 3605, "total_steps": 4039, "loss": 0.2449, "lr": 1.3968445381580554e-06, "epoch": 6.248048568950564, "percentage": 89.25, "elapsed_time": "14:32:12", "remaining_time": "1:45:00"}
|
| 722 |
+
{"current_steps": 3610, "total_steps": 4039, "loss": 0.2875, "lr": 1.3652860792136902e-06, "epoch": 6.256721595836947, "percentage": 89.38, "elapsed_time": "14:33:29", "remaining_time": "1:43:48"}
|
| 723 |
+
{"current_steps": 3615, "total_steps": 4039, "loss": 0.2494, "lr": 1.334075599222846e-06, "epoch": 6.26539462272333, "percentage": 89.5, "elapsed_time": "14:34:31", "remaining_time": "1:42:34"}
|
| 724 |
+
{"current_steps": 3620, "total_steps": 4039, "loss": 0.2366, "lr": 1.3032136810004881e-06, "epoch": 6.274067649609714, "percentage": 89.63, "elapsed_time": "14:35:40", "remaining_time": "1:41:21"}
|
| 725 |
+
{"current_steps": 3625, "total_steps": 4039, "loss": 0.2541, "lr": 1.2727009008526414e-06, "epoch": 6.282740676496097, "percentage": 89.75, "elapsed_time": "14:36:58", "remaining_time": "1:40:09"}
|
| 726 |
+
{"current_steps": 3630, "total_steps": 4039, "loss": 0.2517, "lr": 1.2425378285656464e-06, "epoch": 6.291413703382481, "percentage": 89.87, "elapsed_time": "14:38:01", "remaining_time": "1:38:55"}
|
| 727 |
+
{"current_steps": 3635, "total_steps": 4039, "loss": 0.2292, "lr": 1.2127250273954893e-06, "epoch": 6.3000867302688635, "percentage": 90.0, "elapsed_time": "14:39:12", "remaining_time": "1:37:42"}
|
| 728 |
+
{"current_steps": 3640, "total_steps": 4039, "loss": 0.2702, "lr": 1.1832630540573176e-06, "epoch": 6.308759757155247, "percentage": 90.12, "elapsed_time": "14:40:25", "remaining_time": "1:36:30"}
|
| 729 |
+
{"current_steps": 3645, "total_steps": 4039, "loss": 0.2626, "lr": 1.1541524587150165e-06, "epoch": 6.317432784041631, "percentage": 90.25, "elapsed_time": "14:41:45", "remaining_time": "1:35:18"}
|
| 730 |
+
{"current_steps": 3650, "total_steps": 4039, "loss": 0.2511, "lr": 1.1253937849709428e-06, "epoch": 6.326105810928014, "percentage": 90.37, "elapsed_time": "14:42:52", "remaining_time": "1:34:05"}
|
| 731 |
+
{"current_steps": 3655, "total_steps": 4039, "loss": 0.2574, "lr": 1.0969875698557874e-06, "epoch": 6.334778837814397, "percentage": 90.49, "elapsed_time": "14:44:03", "remaining_time": "1:32:52"}
|
| 732 |
+
{"current_steps": 3660, "total_steps": 4039, "loss": 0.2459, "lr": 1.0689343438185328e-06, "epoch": 6.34345186470078, "percentage": 90.62, "elapsed_time": "14:45:18", "remaining_time": "1:31:40"}
|
| 733 |
+
{"current_steps": 3665, "total_steps": 4039, "loss": 0.2648, "lr": 1.041234630716541e-06, "epoch": 6.352124891587164, "percentage": 90.74, "elapsed_time": "14:46:30", "remaining_time": "1:30:27"}
|
| 734 |
+
{"current_steps": 3670, "total_steps": 4039, "loss": 0.2199, "lr": 1.0138889478058013e-06, "epoch": 6.360797918473548, "percentage": 90.86, "elapsed_time": "14:47:35", "remaining_time": "1:29:14"}
|
| 735 |
+
{"current_steps": 3675, "total_steps": 4039, "loss": 0.2533, "lr": 9.868978057312328e-07, "epoch": 6.3694709453599305, "percentage": 90.99, "elapsed_time": "14:48:51", "remaining_time": "1:28:02"}
|
| 736 |
+
{"current_steps": 3680, "total_steps": 4039, "loss": 0.2321, "lr": 9.602617085171784e-07, "epoch": 6.378143972246314, "percentage": 91.11, "elapsed_time": "14:50:06", "remaining_time": "1:26:50"}
|
| 737 |
+
{"current_steps": 3685, "total_steps": 4039, "loss": 0.2345, "lr": 9.339811535579768e-07, "epoch": 6.386816999132697, "percentage": 91.24, "elapsed_time": "14:51:22", "remaining_time": "1:25:37"}
|
| 738 |
+
{"current_steps": 3690, "total_steps": 4039, "loss": 0.2425, "lr": 9.08056631608678e-07, "epoch": 6.395490026019081, "percentage": 91.36, "elapsed_time": "14:52:35", "remaining_time": "1:24:25"}
|
| 739 |
+
{"current_steps": 3695, "total_steps": 4039, "loss": 0.2711, "lr": 8.824886267758881e-07, "epoch": 6.404163052905464, "percentage": 91.48, "elapsed_time": "14:53:53", "remaining_time": "1:23:13"}
|
| 740 |
+
{"current_steps": 3700, "total_steps": 4039, "loss": 0.271, "lr": 8.572776165087137e-07, "epoch": 6.412836079791847, "percentage": 91.61, "elapsed_time": "14:55:10", "remaining_time": "1:22:01"}
|
| 741 |
+
{"current_steps": 3705, "total_steps": 4039, "loss": 0.2232, "lr": 8.324240715898568e-07, "epoch": 6.421509106678231, "percentage": 91.73, "elapsed_time": "14:56:20", "remaining_time": "1:20:48"}
|
| 742 |
+
{"current_steps": 3710, "total_steps": 4039, "loss": 0.2733, "lr": 8.079284561268208e-07, "epoch": 6.430182133564614, "percentage": 91.85, "elapsed_time": "14:57:32", "remaining_time": "1:19:35"}
|
| 743 |
+
{"current_steps": 3715, "total_steps": 4039, "loss": 0.2536, "lr": 7.837912275432469e-07, "epoch": 6.438855160450998, "percentage": 91.98, "elapsed_time": "14:58:44", "remaining_time": "1:18:22"}
|
| 744 |
+
{"current_steps": 3720, "total_steps": 4039, "loss": 0.2314, "lr": 7.600128365703608e-07, "epoch": 6.44752818733738, "percentage": 92.1, "elapsed_time": "14:59:53", "remaining_time": "1:17:10"}
|
| 745 |
+
{"current_steps": 3725, "total_steps": 4039, "loss": 0.2381, "lr": 7.365937272385726e-07, "epoch": 6.456201214223764, "percentage": 92.23, "elapsed_time": "15:01:07", "remaining_time": "1:15:57"}
|
| 746 |
+
{"current_steps": 3730, "total_steps": 4039, "loss": 0.2329, "lr": 7.13534336869175e-07, "epoch": 6.464874241110148, "percentage": 92.35, "elapsed_time": "15:02:18", "remaining_time": "1:14:44"}
|
| 747 |
+
{"current_steps": 3735, "total_steps": 4039, "loss": 0.2523, "lr": 6.908350960661713e-07, "epoch": 6.473547267996531, "percentage": 92.47, "elapsed_time": "15:03:26", "remaining_time": "1:13:31"}
|
| 748 |
+
{"current_steps": 3740, "total_steps": 4039, "loss": 0.2488, "lr": 6.684964287082562e-07, "epoch": 6.482220294882914, "percentage": 92.6, "elapsed_time": "15:04:36", "remaining_time": "1:12:19"}
|
| 749 |
+
{"current_steps": 3745, "total_steps": 4039, "loss": 0.24, "lr": 6.4651875194087e-07, "epoch": 6.490893321769297, "percentage": 92.72, "elapsed_time": "15:05:46", "remaining_time": "1:11:06"}
|
| 750 |
+
{"current_steps": 3750, "total_steps": 4039, "loss": 0.2528, "lr": 6.249024761684408e-07, "epoch": 6.499566348655681, "percentage": 92.84, "elapsed_time": "15:07:02", "remaining_time": "1:09:54"}
|
| 751 |
+
{"current_steps": 3755, "total_steps": 4039, "loss": 0.2402, "lr": 6.036480050466931e-07, "epoch": 6.508239375542065, "percentage": 92.97, "elapsed_time": "15:08:19", "remaining_time": "1:08:41"}
|
| 752 |
+
{"current_steps": 3760, "total_steps": 4039, "loss": 0.2229, "lr": 5.827557354751223e-07, "epoch": 6.5169124024284475, "percentage": 93.09, "elapsed_time": "15:09:33", "remaining_time": "1:07:29"}
|
| 753 |
+
{"current_steps": 3765, "total_steps": 4039, "loss": 0.2359, "lr": 5.622260575895944e-07, "epoch": 6.525585429314831, "percentage": 93.22, "elapsed_time": "15:10:49", "remaining_time": "1:06:17"}
|
| 754 |
+
{"current_steps": 3770, "total_steps": 4039, "loss": 0.2636, "lr": 5.420593547550334e-07, "epoch": 6.534258456201214, "percentage": 93.34, "elapsed_time": "15:11:57", "remaining_time": "1:05:04"}
|
| 755 |
+
{"current_steps": 3775, "total_steps": 4039, "loss": 0.286, "lr": 5.22256003558288e-07, "epoch": 6.542931483087598, "percentage": 93.46, "elapsed_time": "15:13:08", "remaining_time": "1:03:51"}
|
| 756 |
+
{"current_steps": 3780, "total_steps": 4039, "loss": 0.2247, "lr": 5.028163738010917e-07, "epoch": 6.551604509973981, "percentage": 93.59, "elapsed_time": "15:14:17", "remaining_time": "1:02:38"}
|
| 757 |
+
{"current_steps": 3785, "total_steps": 4039, "loss": 0.2083, "lr": 4.837408284931444e-07, "epoch": 6.560277536860364, "percentage": 93.71, "elapsed_time": "15:15:28", "remaining_time": "1:01:26"}
|
| 758 |
+
{"current_steps": 3790, "total_steps": 4039, "loss": 0.2507, "lr": 4.650297238453516e-07, "epoch": 6.568950563746748, "percentage": 93.84, "elapsed_time": "15:16:44", "remaining_time": "1:00:13"}
|
| 759 |
+
{"current_steps": 3795, "total_steps": 4039, "loss": 0.2675, "lr": 4.4668340926316446e-07, "epoch": 6.577623590633131, "percentage": 93.96, "elapsed_time": "15:17:54", "remaining_time": "0:59:01"}
|
| 760 |
+
{"current_steps": 3800, "total_steps": 4039, "loss": 0.2603, "lr": 4.287022273400565e-07, "epoch": 6.586296617519515, "percentage": 94.08, "elapsed_time": "15:19:11", "remaining_time": "0:57:48"}
|
| 761 |
+
{"current_steps": 3805, "total_steps": 4039, "loss": 0.235, "lr": 4.110865138511244e-07, "epoch": 6.594969644405897, "percentage": 94.21, "elapsed_time": "15:20:30", "remaining_time": "0:56:36"}
|
| 762 |
+
{"current_steps": 3810, "total_steps": 4039, "loss": 0.2438, "lr": 3.938365977468173e-07, "epoch": 6.603642671292281, "percentage": 94.33, "elapsed_time": "15:21:37", "remaining_time": "0:55:23"}
|
| 763 |
+
{"current_steps": 3815, "total_steps": 4039, "loss": 0.2503, "lr": 3.769528011467993e-07, "epoch": 6.612315698178664, "percentage": 94.45, "elapsed_time": "15:22:47", "remaining_time": "0:54:10"}
|
| 764 |
+
{"current_steps": 3820, "total_steps": 4039, "loss": 0.2811, "lr": 3.604354393339238e-07, "epoch": 6.620988725065048, "percentage": 94.58, "elapsed_time": "15:23:59", "remaining_time": "0:52:58"}
|
| 765 |
+
{"current_steps": 3825, "total_steps": 4039, "loss": 0.231, "lr": 3.4428482074836623e-07, "epoch": 6.629661751951431, "percentage": 94.7, "elapsed_time": "15:25:18", "remaining_time": "0:51:46"}
|
| 766 |
+
{"current_steps": 3830, "total_steps": 4039, "loss": 0.2425, "lr": 3.2850124698183827e-07, "epoch": 6.638334778837814, "percentage": 94.83, "elapsed_time": "15:26:33", "remaining_time": "0:50:33"}
|
| 767 |
+
{"current_steps": 3835, "total_steps": 4039, "loss": 0.266, "lr": 3.1308501277197203e-07, "epoch": 6.647007805724198, "percentage": 94.95, "elapsed_time": "15:27:47", "remaining_time": "0:49:21"}
|
| 768 |
+
{"current_steps": 3840, "total_steps": 4039, "loss": 0.2642, "lr": 2.9803640599681995e-07, "epoch": 6.655680832610581, "percentage": 95.07, "elapsed_time": "15:29:05", "remaining_time": "0:48:08"}
|
| 769 |
+
{"current_steps": 3845, "total_steps": 4039, "loss": 0.2689, "lr": 2.833557076694571e-07, "epoch": 6.6643538594969645, "percentage": 95.2, "elapsed_time": "15:30:24", "remaining_time": "0:46:56"}
|
| 770 |
+
{"current_steps": 3850, "total_steps": 4039, "loss": 0.2807, "lr": 2.690431919327674e-07, "epoch": 6.673026886383347, "percentage": 95.32, "elapsed_time": "15:31:37", "remaining_time": "0:45:44"}
|
| 771 |
+
{"current_steps": 3855, "total_steps": 4039, "loss": 0.2457, "lr": 2.5509912605429233e-07, "epoch": 6.681699913269731, "percentage": 95.44, "elapsed_time": "15:32:49", "remaining_time": "0:44:31"}
|
| 772 |
+
{"current_steps": 3860, "total_steps": 4039, "loss": 0.2452, "lr": 2.41523770421257e-07, "epoch": 6.690372940156115, "percentage": 95.57, "elapsed_time": "15:34:03", "remaining_time": "0:43:18"}
|
| 773 |
+
{"current_steps": 3865, "total_steps": 4039, "loss": 0.2434, "lr": 2.2831737853570513e-07, "epoch": 6.6990459670424976, "percentage": 95.69, "elapsed_time": "15:35:22", "remaining_time": "0:42:06"}
|
| 774 |
+
{"current_steps": 3870, "total_steps": 4039, "loss": 0.2298, "lr": 2.1548019700976308e-07, "epoch": 6.707718993928881, "percentage": 95.82, "elapsed_time": "15:36:28", "remaining_time": "0:40:53"}
|
| 775 |
+
{"current_steps": 3875, "total_steps": 4039, "loss": 0.2505, "lr": 2.0301246556103437e-07, "epoch": 6.716392020815265, "percentage": 95.94, "elapsed_time": "15:37:35", "remaining_time": "0:39:40"}
|
| 776 |
+
{"current_steps": 3880, "total_steps": 4039, "loss": 0.2672, "lr": 1.9091441700813008e-07, "epoch": 6.725065047701648, "percentage": 96.06, "elapsed_time": "15:38:49", "remaining_time": "0:38:28"}
|
| 777 |
+
{"current_steps": 3885, "total_steps": 4039, "loss": 0.2611, "lr": 1.7918627726630777e-07, "epoch": 6.7337380745880315, "percentage": 96.19, "elapsed_time": "15:40:06", "remaining_time": "0:37:15"}
|
| 778 |
+
{"current_steps": 3890, "total_steps": 4039, "loss": 0.2367, "lr": 1.6782826534326835e-07, "epoch": 6.742411101474414, "percentage": 96.31, "elapsed_time": "15:41:25", "remaining_time": "0:36:03"}
|
| 779 |
+
{"current_steps": 3895, "total_steps": 4039, "loss": 0.1902, "lr": 1.5684059333505254e-07, "epoch": 6.751084128360798, "percentage": 96.43, "elapsed_time": "15:42:44", "remaining_time": "0:34:51"}
|
| 780 |
+
{"current_steps": 3900, "total_steps": 4039, "loss": 0.2232, "lr": 1.4622346642209295e-07, "epoch": 6.759757155247181, "percentage": 96.56, "elapsed_time": "15:44:02", "remaining_time": "0:33:38"}
|
| 781 |
+
{"current_steps": 3905, "total_steps": 4039, "loss": 0.2387, "lr": 1.359770828653728e-07, "epoch": 6.768430182133565, "percentage": 96.68, "elapsed_time": "15:45:08", "remaining_time": "0:32:25"}
|
| 782 |
+
{"current_steps": 3910, "total_steps": 4039, "loss": 0.2365, "lr": 1.2610163400272657e-07, "epoch": 6.777103209019948, "percentage": 96.81, "elapsed_time": "15:46:16", "remaining_time": "0:31:13"}
|
| 783 |
+
{"current_steps": 3915, "total_steps": 4039, "loss": 0.2348, "lr": 1.1659730424526949e-07, "epoch": 6.785776235906331, "percentage": 96.93, "elapsed_time": "15:47:33", "remaining_time": "0:30:00"}
|
| 784 |
+
{"current_steps": 3920, "total_steps": 4039, "loss": 0.2399, "lr": 1.0746427107395151e-07, "epoch": 6.794449262792715, "percentage": 97.05, "elapsed_time": "15:48:52", "remaining_time": "0:28:48"}
|
| 785 |
+
{"current_steps": 3925, "total_steps": 4039, "loss": 0.2355, "lr": 9.87027050362399e-08, "epoch": 6.803122289679098, "percentage": 97.18, "elapsed_time": "15:50:04", "remaining_time": "0:27:35"}
|
| 786 |
+
{"current_steps": 3930, "total_steps": 4039, "loss": 0.2719, "lr": 9.031276974294622e-08, "epoch": 6.811795316565481, "percentage": 97.3, "elapsed_time": "15:51:24", "remaining_time": "0:26:23"}
|
| 787 |
+
{"current_steps": 3935, "total_steps": 4039, "loss": 0.2081, "lr": 8.229462186515769e-08, "epoch": 6.820468343451864, "percentage": 97.43, "elapsed_time": "15:52:30", "remaining_time": "0:25:10"}
|
| 788 |
+
{"current_steps": 3940, "total_steps": 4039, "loss": 0.2117, "lr": 7.464841113131504e-08, "epoch": 6.829141370338248, "percentage": 97.55, "elapsed_time": "15:53:42", "remaining_time": "0:23:57"}
|
| 789 |
+
{"current_steps": 3945, "total_steps": 4039, "loss": 0.2581, "lr": 6.737428032442372e-08, "epoch": 6.837814397224632, "percentage": 97.67, "elapsed_time": "15:54:58", "remaining_time": "0:22:45"}
|
| 790 |
+
{"current_steps": 3950, "total_steps": 4039, "loss": 0.2386, "lr": 6.047236527937594e-08, "epoch": 6.8464874241110145, "percentage": 97.8, "elapsed_time": "15:56:07", "remaining_time": "0:21:32"}
|
| 791 |
+
{"current_steps": 3955, "total_steps": 4039, "loss": 0.2404, "lr": 5.394279488042831e-08, "epoch": 6.855160450997398, "percentage": 97.92, "elapsed_time": "15:57:22", "remaining_time": "0:20:20"}
|
| 792 |
+
{"current_steps": 3960, "total_steps": 4039, "loss": 0.2151, "lr": 4.7785691058781505e-08, "epoch": 6.863833477883781, "percentage": 98.04, "elapsed_time": "15:58:38", "remaining_time": "0:19:07"}
|
| 793 |
+
{"current_steps": 3965, "total_steps": 4039, "loss": 0.2525, "lr": 4.200116879031102e-08, "epoch": 6.872506504770165, "percentage": 98.17, "elapsed_time": "15:59:57", "remaining_time": "0:17:54"}
|
| 794 |
+
{"current_steps": 3970, "total_steps": 4039, "loss": 0.2346, "lr": 3.658933609341775e-08, "epoch": 6.8811795316565485, "percentage": 98.29, "elapsed_time": "16:01:16", "remaining_time": "0:16:42"}
|
| 795 |
+
{"current_steps": 3975, "total_steps": 4039, "loss": 0.2365, "lr": 3.155029402701182e-08, "epoch": 6.889852558542931, "percentage": 98.42, "elapsed_time": "16:02:27", "remaining_time": "0:15:29"}
|
| 796 |
+
{"current_steps": 3980, "total_steps": 4039, "loss": 0.2933, "lr": 2.6884136688625218e-08, "epoch": 6.898525585429315, "percentage": 98.54, "elapsed_time": "16:03:39", "remaining_time": "0:14:17"}
|
| 797 |
+
{"current_steps": 3985, "total_steps": 4039, "loss": 0.2367, "lr": 2.259095121265542e-08, "epoch": 6.907198612315698, "percentage": 98.66, "elapsed_time": "16:04:51", "remaining_time": "0:13:04"}
|
| 798 |
+
{"current_steps": 3990, "total_steps": 4039, "loss": 0.2095, "lr": 1.8670817768733364e-08, "epoch": 6.915871639202082, "percentage": 98.79, "elapsed_time": "16:06:05", "remaining_time": "0:11:51"}
|
| 799 |
+
{"current_steps": 3995, "total_steps": 4039, "loss": 0.2266, "lr": 1.5123809560233516e-08, "epoch": 6.924544666088465, "percentage": 98.91, "elapsed_time": "16:07:09", "remaining_time": "0:10:39"}
|
| 800 |
+
{"current_steps": 4000, "total_steps": 4039, "loss": 0.2251, "lr": 1.194999282290832e-08, "epoch": 6.933217692974848, "percentage": 99.03, "elapsed_time": "16:08:21", "remaining_time": "0:09:26"}
|
| 801 |
+
{"current_steps": 4005, "total_steps": 4039, "loss": 0.2256, "lr": 9.149426823633622e-09, "epoch": 6.941890719861232, "percentage": 99.16, "elapsed_time": "16:09:30", "remaining_time": "0:08:13"}
|
| 802 |
+
{"current_steps": 4010, "total_steps": 4039, "loss": 0.2563, "lr": 6.722163859329556e-09, "epoch": 6.950563746747615, "percentage": 99.28, "elapsed_time": "16:10:38", "remaining_time": "0:07:01"}
|
| 803 |
+
{"current_steps": 4015, "total_steps": 4039, "loss": 0.2209, "lr": 4.668249255961321e-09, "epoch": 6.959236773633998, "percentage": 99.41, "elapsed_time": "16:11:47", "remaining_time": "0:05:48"}
|
| 804 |
+
{"current_steps": 4020, "total_steps": 4039, "loss": 0.2422, "lr": 2.98772136770209e-09, "epoch": 6.967909800520381, "percentage": 99.53, "elapsed_time": "16:12:57", "remaining_time": "0:04:35"}
|
| 805 |
+
{"current_steps": 4025, "total_steps": 4039, "loss": 0.2171, "lr": 1.6806115762135754e-09, "epoch": 6.976582827406765, "percentage": 99.65, "elapsed_time": "16:14:05", "remaining_time": "0:03:23"}
|
| 806 |
+
{"current_steps": 4030, "total_steps": 4039, "loss": 0.216, "lr": 7.469442900687185e-10, "epoch": 6.985255854293149, "percentage": 99.78, "elapsed_time": "16:15:12", "remaining_time": "0:02:10"}
|
| 807 |
+
{"current_steps": 4035, "total_steps": 4039, "loss": 0.2716, "lr": 1.867369442853928e-10, "epoch": 6.9939288811795315, "percentage": 99.9, "elapsed_time": "16:16:19", "remaining_time": "0:00:58"}
|
| 808 |
+
{"current_steps": 4039, "total_steps": 4039, "epoch": 7.0, "percentage": 100.0, "elapsed_time": "16:17:49", "remaining_time": "0:00:00"}
|