Training in progress, epoch 3
Browse files
model-00001-of-00004.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 4877660776
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:c80e5c1b7a40f41b14ae4d24011d6737084c0815f3b9cc4e3c6a95903a79cdc7
|
| 3 |
size 4877660776
|
model-00002-of-00004.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 4932751008
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:4338278d77f05613800efc95f1ae3aff4ef09d5209612e6ca4b9533d6c48fcec
|
| 3 |
size 4932751008
|
model-00003-of-00004.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 4330865200
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:6fbc61af36c0b525252001002db0da393a42a346fcea8da2de153b5957b4c56c
|
| 3 |
size 4330865200
|
model-00004-of-00004.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 1089994880
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:b5e1bf08062069001c50e4fbf434169b544a97ffe34355bb484596389d78de3b
|
| 3 |
size 1089994880
|
trainer_log.jsonl
CHANGED
|
@@ -740,3 +740,250 @@
|
|
| 740 |
{"current_steps": 740, "total_steps": 1230, "loss": 0.2657, "lr": 1.6415300222223788e-05, "epoch": 3.005065856129686, "percentage": 60.16, "elapsed_time": "8:28:27", "remaining_time": "5:36:41"}
|
| 741 |
{"current_steps": 741, "total_steps": 1230, "loss": 0.2475, "lr": 1.6359475191103958e-05, "epoch": 3.0091185410334345, "percentage": 60.24, "elapsed_time": "8:29:06", "remaining_time": "5:35:58"}
|
| 742 |
{"current_steps": 742, "total_steps": 1230, "loss": 0.2577, "lr": 1.6303679480270466e-05, "epoch": 3.0131712259371835, "percentage": 60.33, "elapsed_time": "8:29:48", "remaining_time": "5:35:17"}
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 740 |
{"current_steps": 740, "total_steps": 1230, "loss": 0.2657, "lr": 1.6415300222223788e-05, "epoch": 3.005065856129686, "percentage": 60.16, "elapsed_time": "8:28:27", "remaining_time": "5:36:41"}
|
| 741 |
{"current_steps": 741, "total_steps": 1230, "loss": 0.2475, "lr": 1.6359475191103958e-05, "epoch": 3.0091185410334345, "percentage": 60.24, "elapsed_time": "8:29:06", "remaining_time": "5:35:58"}
|
| 742 |
{"current_steps": 742, "total_steps": 1230, "loss": 0.2577, "lr": 1.6303679480270466e-05, "epoch": 3.0131712259371835, "percentage": 60.33, "elapsed_time": "8:29:48", "remaining_time": "5:35:17"}
|
| 743 |
+
{"current_steps": 743, "total_steps": 1230, "loss": 0.2319, "lr": 1.624791353909428e-05, "epoch": 3.017223910840932, "percentage": 60.41, "elapsed_time": "8:30:31", "remaining_time": "5:34:37"}
|
| 744 |
+
{"current_steps": 744, "total_steps": 1230, "loss": 0.2589, "lr": 1.619217781670663e-05, "epoch": 3.021276595744681, "percentage": 60.49, "elapsed_time": "8:31:15", "remaining_time": "5:33:57"}
|
| 745 |
+
{"current_steps": 745, "total_steps": 1230, "loss": 0.2611, "lr": 1.6136472761995373e-05, "epoch": 3.0253292806484295, "percentage": 60.57, "elapsed_time": "8:31:55", "remaining_time": "5:33:15"}
|
| 746 |
+
{"current_steps": 746, "total_steps": 1230, "loss": 0.2303, "lr": 1.608079882360134e-05, "epoch": 3.0293819655521785, "percentage": 60.65, "elapsed_time": "8:32:35", "remaining_time": "5:32:34"}
|
| 747 |
+
{"current_steps": 747, "total_steps": 1230, "loss": 0.2465, "lr": 1.60251564499148e-05, "epoch": 3.033434650455927, "percentage": 60.73, "elapsed_time": "8:33:14", "remaining_time": "5:31:51"}
|
| 748 |
+
{"current_steps": 748, "total_steps": 1230, "loss": 0.271, "lr": 1.596954608907176e-05, "epoch": 3.0374873353596756, "percentage": 60.81, "elapsed_time": "8:33:56", "remaining_time": "5:31:10"}
|
| 749 |
+
{"current_steps": 749, "total_steps": 1230, "loss": 0.2431, "lr": 1.591396818895043e-05, "epoch": 3.0415400202634246, "percentage": 60.89, "elapsed_time": "8:34:36", "remaining_time": "5:30:28"}
|
| 750 |
+
{"current_steps": 750, "total_steps": 1230, "loss": 0.251, "lr": 1.585842319716759e-05, "epoch": 3.045592705167173, "percentage": 60.98, "elapsed_time": "8:35:16", "remaining_time": "5:29:46"}
|
| 751 |
+
{"current_steps": 751, "total_steps": 1230, "loss": 0.2493, "lr": 1.5802911561074944e-05, "epoch": 3.049645390070922, "percentage": 61.06, "elapsed_time": "8:35:56", "remaining_time": "5:29:04"}
|
| 752 |
+
{"current_steps": 752, "total_steps": 1230, "loss": 0.2394, "lr": 1.5747433727755595e-05, "epoch": 3.0536980749746707, "percentage": 61.14, "elapsed_time": "8:36:37", "remaining_time": "5:28:22"}
|
| 753 |
+
{"current_steps": 753, "total_steps": 1230, "loss": 0.252, "lr": 1.5691990144020376e-05, "epoch": 3.0577507598784193, "percentage": 61.22, "elapsed_time": "8:37:19", "remaining_time": "5:27:42"}
|
| 754 |
+
{"current_steps": 754, "total_steps": 1230, "loss": 0.2517, "lr": 1.5636581256404297e-05, "epoch": 3.0618034447821683, "percentage": 61.3, "elapsed_time": "8:38:01", "remaining_time": "5:27:02"}
|
| 755 |
+
{"current_steps": 755, "total_steps": 1230, "loss": 0.2362, "lr": 1.558120751116291e-05, "epoch": 3.065856129685917, "percentage": 61.38, "elapsed_time": "8:38:42", "remaining_time": "5:26:20"}
|
| 756 |
+
{"current_steps": 756, "total_steps": 1230, "loss": 0.2494, "lr": 1.552586935426876e-05, "epoch": 3.069908814589666, "percentage": 61.46, "elapsed_time": "8:39:22", "remaining_time": "5:25:38"}
|
| 757 |
+
{"current_steps": 757, "total_steps": 1230, "loss": 0.2553, "lr": 1.547056723140774e-05, "epoch": 3.0739614994934144, "percentage": 61.54, "elapsed_time": "8:40:06", "remaining_time": "5:24:58"}
|
| 758 |
+
{"current_steps": 758, "total_steps": 1230, "loss": 0.2632, "lr": 1.5415301587975565e-05, "epoch": 3.078014184397163, "percentage": 61.63, "elapsed_time": "8:40:47", "remaining_time": "5:24:17"}
|
| 759 |
+
{"current_steps": 759, "total_steps": 1230, "loss": 0.2448, "lr": 1.536007286907411e-05, "epoch": 3.082066869300912, "percentage": 61.71, "elapsed_time": "8:41:27", "remaining_time": "5:23:35"}
|
| 760 |
+
{"current_steps": 760, "total_steps": 1230, "loss": 0.2537, "lr": 1.5304881519507896e-05, "epoch": 3.0861195542046604, "percentage": 61.79, "elapsed_time": "8:42:05", "remaining_time": "5:22:52"}
|
| 761 |
+
{"current_steps": 761, "total_steps": 1230, "loss": 0.2589, "lr": 1.5249727983780453e-05, "epoch": 3.0901722391084094, "percentage": 61.87, "elapsed_time": "8:42:45", "remaining_time": "5:22:10"}
|
| 762 |
+
{"current_steps": 762, "total_steps": 1230, "loss": 0.2544, "lr": 1.5194612706090786e-05, "epoch": 3.094224924012158, "percentage": 61.95, "elapsed_time": "8:43:25", "remaining_time": "5:21:28"}
|
| 763 |
+
{"current_steps": 763, "total_steps": 1230, "loss": 0.2393, "lr": 1.5139536130329771e-05, "epoch": 3.098277608915907, "percentage": 62.03, "elapsed_time": "8:44:06", "remaining_time": "5:20:47"}
|
| 764 |
+
{"current_steps": 764, "total_steps": 1230, "loss": 0.2578, "lr": 1.508449870007656e-05, "epoch": 3.1023302938196555, "percentage": 62.11, "elapsed_time": "8:44:46", "remaining_time": "5:20:05"}
|
| 765 |
+
{"current_steps": 765, "total_steps": 1230, "loss": 0.2622, "lr": 1.5029500858595056e-05, "epoch": 3.106382978723404, "percentage": 62.2, "elapsed_time": "8:45:27", "remaining_time": "5:19:23"}
|
| 766 |
+
{"current_steps": 766, "total_steps": 1230, "loss": 0.2435, "lr": 1.4974543048830328e-05, "epoch": 3.110435663627153, "percentage": 62.28, "elapsed_time": "8:46:04", "remaining_time": "5:18:40"}
|
| 767 |
+
{"current_steps": 767, "total_steps": 1230, "loss": 0.2452, "lr": 1.4919625713405e-05, "epoch": 3.1144883485309016, "percentage": 62.36, "elapsed_time": "8:46:44", "remaining_time": "5:17:58"}
|
| 768 |
+
{"current_steps": 768, "total_steps": 1230, "loss": 0.2487, "lr": 1.4864749294615756e-05, "epoch": 3.1185410334346506, "percentage": 62.44, "elapsed_time": "8:47:22", "remaining_time": "5:17:14"}
|
| 769 |
+
{"current_steps": 769, "total_steps": 1230, "loss": 0.2443, "lr": 1.4809914234429716e-05, "epoch": 3.122593718338399, "percentage": 62.52, "elapsed_time": "8:48:02", "remaining_time": "5:16:32"}
|
| 770 |
+
{"current_steps": 770, "total_steps": 1230, "loss": 0.257, "lr": 1.4755120974480923e-05, "epoch": 3.126646403242148, "percentage": 62.6, "elapsed_time": "8:48:43", "remaining_time": "5:15:51"}
|
| 771 |
+
{"current_steps": 771, "total_steps": 1230, "loss": 0.2371, "lr": 1.4700369956066771e-05, "epoch": 3.1306990881458967, "percentage": 62.68, "elapsed_time": "8:49:23", "remaining_time": "5:15:09"}
|
| 772 |
+
{"current_steps": 772, "total_steps": 1230, "loss": 0.2551, "lr": 1.4645661620144413e-05, "epoch": 3.1347517730496453, "percentage": 62.76, "elapsed_time": "8:50:03", "remaining_time": "5:14:27"}
|
| 773 |
+
{"current_steps": 773, "total_steps": 1230, "loss": 0.2541, "lr": 1.4590996407327284e-05, "epoch": 3.1388044579533942, "percentage": 62.85, "elapsed_time": "8:50:43", "remaining_time": "5:13:45"}
|
| 774 |
+
{"current_steps": 774, "total_steps": 1230, "loss": 0.2598, "lr": 1.4536374757881487e-05, "epoch": 3.142857142857143, "percentage": 62.93, "elapsed_time": "8:51:21", "remaining_time": "5:13:02"}
|
| 775 |
+
{"current_steps": 775, "total_steps": 1230, "loss": 0.2373, "lr": 1.4481797111722271e-05, "epoch": 3.146909827760892, "percentage": 63.01, "elapsed_time": "8:52:00", "remaining_time": "5:12:20"}
|
| 776 |
+
{"current_steps": 776, "total_steps": 1230, "loss": 0.2519, "lr": 1.4427263908410507e-05, "epoch": 3.1509625126646403, "percentage": 63.09, "elapsed_time": "8:52:41", "remaining_time": "5:11:38"}
|
| 777 |
+
{"current_steps": 777, "total_steps": 1230, "loss": 0.2549, "lr": 1.4372775587149108e-05, "epoch": 3.155015197568389, "percentage": 63.17, "elapsed_time": "8:53:21", "remaining_time": "5:10:57"}
|
| 778 |
+
{"current_steps": 778, "total_steps": 1230, "loss": 0.2537, "lr": 1.4318332586779522e-05, "epoch": 3.159067882472138, "percentage": 63.25, "elapsed_time": "8:54:01", "remaining_time": "5:10:15"}
|
| 779 |
+
{"current_steps": 779, "total_steps": 1230, "loss": 0.2477, "lr": 1.4263935345778202e-05, "epoch": 3.1631205673758864, "percentage": 63.33, "elapsed_time": "8:54:39", "remaining_time": "5:09:32"}
|
| 780 |
+
{"current_steps": 780, "total_steps": 1230, "loss": 0.257, "lr": 1.420958430225303e-05, "epoch": 3.1671732522796354, "percentage": 63.41, "elapsed_time": "8:55:19", "remaining_time": "5:08:50"}
|
| 781 |
+
{"current_steps": 781, "total_steps": 1230, "loss": 0.2473, "lr": 1.415527989393985e-05, "epoch": 3.171225937183384, "percentage": 63.5, "elapsed_time": "8:56:02", "remaining_time": "5:08:10"}
|
| 782 |
+
{"current_steps": 782, "total_steps": 1230, "loss": 0.2514, "lr": 1.410102255819891e-05, "epoch": 3.1752786220871325, "percentage": 63.58, "elapsed_time": "8:56:43", "remaining_time": "5:07:29"}
|
| 783 |
+
{"current_steps": 783, "total_steps": 1230, "loss": 0.2509, "lr": 1.404681273201131e-05, "epoch": 3.1793313069908815, "percentage": 63.66, "elapsed_time": "8:57:25", "remaining_time": "5:06:48"}
|
| 784 |
+
{"current_steps": 784, "total_steps": 1230, "loss": 0.2564, "lr": 1.399265085197556e-05, "epoch": 3.18338399189463, "percentage": 63.74, "elapsed_time": "8:58:09", "remaining_time": "5:06:08"}
|
| 785 |
+
{"current_steps": 785, "total_steps": 1230, "loss": 0.2571, "lr": 1.393853735430398e-05, "epoch": 3.187436676798379, "percentage": 63.82, "elapsed_time": "8:58:49", "remaining_time": "5:05:27"}
|
| 786 |
+
{"current_steps": 786, "total_steps": 1230, "loss": 0.2586, "lr": 1.3884472674819246e-05, "epoch": 3.1914893617021276, "percentage": 63.9, "elapsed_time": "8:59:27", "remaining_time": "5:04:44"}
|
| 787 |
+
{"current_steps": 787, "total_steps": 1230, "loss": 0.2622, "lr": 1.3830457248950864e-05, "epoch": 3.1955420466058766, "percentage": 63.98, "elapsed_time": "9:00:08", "remaining_time": "5:04:02"}
|
| 788 |
+
{"current_steps": 788, "total_steps": 1230, "loss": 0.2519, "lr": 1.377649151173163e-05, "epoch": 3.199594731509625, "percentage": 64.07, "elapsed_time": "9:00:51", "remaining_time": "5:03:22"}
|
| 789 |
+
{"current_steps": 789, "total_steps": 1230, "loss": 0.2628, "lr": 1.3722575897794181e-05, "epoch": 3.2036474164133737, "percentage": 64.15, "elapsed_time": "9:01:33", "remaining_time": "5:02:41"}
|
| 790 |
+
{"current_steps": 790, "total_steps": 1230, "loss": 0.2556, "lr": 1.3668710841367472e-05, "epoch": 3.2077001013171227, "percentage": 64.23, "elapsed_time": "9:02:11", "remaining_time": "5:01:58"}
|
| 791 |
+
{"current_steps": 791, "total_steps": 1230, "loss": 0.2447, "lr": 1.361489677627324e-05, "epoch": 3.2117527862208712, "percentage": 64.31, "elapsed_time": "9:02:50", "remaining_time": "5:01:16"}
|
| 792 |
+
{"current_steps": 792, "total_steps": 1230, "loss": 0.2688, "lr": 1.3561134135922585e-05, "epoch": 3.2158054711246202, "percentage": 64.39, "elapsed_time": "9:03:31", "remaining_time": "5:00:35"}
|
| 793 |
+
{"current_steps": 793, "total_steps": 1230, "loss": 0.2547, "lr": 1.350742335331241e-05, "epoch": 3.219858156028369, "percentage": 64.47, "elapsed_time": "9:04:14", "remaining_time": "4:59:55"}
|
| 794 |
+
{"current_steps": 794, "total_steps": 1230, "loss": 0.242, "lr": 1.345376486102198e-05, "epoch": 3.2239108409321173, "percentage": 64.55, "elapsed_time": "9:04:57", "remaining_time": "4:59:14"}
|
| 795 |
+
{"current_steps": 795, "total_steps": 1230, "loss": 0.244, "lr": 1.3400159091209414e-05, "epoch": 3.2279635258358663, "percentage": 64.63, "elapsed_time": "9:05:40", "remaining_time": "4:58:34"}
|
| 796 |
+
{"current_steps": 796, "total_steps": 1230, "loss": 0.2686, "lr": 1.3346606475608216e-05, "epoch": 3.232016210739615, "percentage": 64.72, "elapsed_time": "9:06:20", "remaining_time": "4:57:53"}
|
| 797 |
+
{"current_steps": 797, "total_steps": 1230, "loss": 0.2516, "lr": 1.3293107445523781e-05, "epoch": 3.236068895643364, "percentage": 64.8, "elapsed_time": "9:07:03", "remaining_time": "4:57:12"}
|
| 798 |
+
{"current_steps": 798, "total_steps": 1230, "loss": 0.2672, "lr": 1.3239662431829949e-05, "epoch": 3.2401215805471124, "percentage": 64.88, "elapsed_time": "9:07:46", "remaining_time": "4:56:32"}
|
| 799 |
+
{"current_steps": 799, "total_steps": 1230, "loss": 0.2505, "lr": 1.3186271864965509e-05, "epoch": 3.2441742654508614, "percentage": 64.96, "elapsed_time": "9:08:27", "remaining_time": "4:55:51"}
|
| 800 |
+
{"current_steps": 800, "total_steps": 1230, "loss": 0.2537, "lr": 1.3132936174930756e-05, "epoch": 3.24822695035461, "percentage": 65.04, "elapsed_time": "9:09:05", "remaining_time": "4:55:08"}
|
| 801 |
+
{"current_steps": 801, "total_steps": 1230, "loss": 0.2623, "lr": 1.3079655791283995e-05, "epoch": 3.2522796352583585, "percentage": 65.12, "elapsed_time": "9:09:44", "remaining_time": "4:54:25"}
|
| 802 |
+
{"current_steps": 802, "total_steps": 1230, "loss": 0.2356, "lr": 1.3026431143138108e-05, "epoch": 3.2563323201621075, "percentage": 65.2, "elapsed_time": "9:10:24", "remaining_time": "4:53:43"}
|
| 803 |
+
{"current_steps": 803, "total_steps": 1230, "loss": 0.2528, "lr": 1.2973262659157114e-05, "epoch": 3.260385005065856, "percentage": 65.28, "elapsed_time": "9:11:05", "remaining_time": "4:53:02"}
|
| 804 |
+
{"current_steps": 804, "total_steps": 1230, "loss": 0.2444, "lr": 1.2920150767552651e-05, "epoch": 3.264437689969605, "percentage": 65.37, "elapsed_time": "9:11:46", "remaining_time": "4:52:21"}
|
| 805 |
+
{"current_steps": 805, "total_steps": 1230, "loss": 0.2505, "lr": 1.2867095896080607e-05, "epoch": 3.2684903748733536, "percentage": 65.45, "elapsed_time": "9:12:26", "remaining_time": "4:51:39"}
|
| 806 |
+
{"current_steps": 806, "total_steps": 1230, "loss": 0.2671, "lr": 1.2814098472037612e-05, "epoch": 3.272543059777102, "percentage": 65.53, "elapsed_time": "9:13:10", "remaining_time": "4:51:00"}
|
| 807 |
+
{"current_steps": 807, "total_steps": 1230, "loss": 0.2626, "lr": 1.276115892225764e-05, "epoch": 3.276595744680851, "percentage": 65.61, "elapsed_time": "9:13:51", "remaining_time": "4:50:18"}
|
| 808 |
+
{"current_steps": 808, "total_steps": 1230, "loss": 0.252, "lr": 1.2708277673108555e-05, "epoch": 3.2806484295845997, "percentage": 65.69, "elapsed_time": "9:14:33", "remaining_time": "4:49:38"}
|
| 809 |
+
{"current_steps": 809, "total_steps": 1230, "loss": 0.2547, "lr": 1.2655455150488649e-05, "epoch": 3.2847011144883487, "percentage": 65.77, "elapsed_time": "9:15:16", "remaining_time": "4:48:57"}
|
| 810 |
+
{"current_steps": 810, "total_steps": 1230, "loss": 0.2603, "lr": 1.2602691779823272e-05, "epoch": 3.288753799392097, "percentage": 65.85, "elapsed_time": "9:15:56", "remaining_time": "4:48:16"}
|
| 811 |
+
{"current_steps": 811, "total_steps": 1230, "loss": 0.2387, "lr": 1.2549987986061355e-05, "epoch": 3.2928064842958458, "percentage": 65.93, "elapsed_time": "9:16:37", "remaining_time": "4:47:34"}
|
| 812 |
+
{"current_steps": 812, "total_steps": 1230, "loss": 0.268, "lr": 1.2497344193672005e-05, "epoch": 3.2968591691995948, "percentage": 66.02, "elapsed_time": "9:17:21", "remaining_time": "4:46:54"}
|
| 813 |
+
{"current_steps": 813, "total_steps": 1230, "loss": 0.2429, "lr": 1.2444760826641092e-05, "epoch": 3.3009118541033433, "percentage": 66.1, "elapsed_time": "9:17:59", "remaining_time": "4:46:12"}
|
| 814 |
+
{"current_steps": 814, "total_steps": 1230, "loss": 0.2375, "lr": 1.2392238308467817e-05, "epoch": 3.3049645390070923, "percentage": 66.18, "elapsed_time": "9:18:41", "remaining_time": "4:45:31"}
|
| 815 |
+
{"current_steps": 815, "total_steps": 1230, "loss": 0.2561, "lr": 1.2339777062161326e-05, "epoch": 3.309017223910841, "percentage": 66.26, "elapsed_time": "9:19:22", "remaining_time": "4:44:50"}
|
| 816 |
+
{"current_steps": 816, "total_steps": 1230, "loss": 0.2594, "lr": 1.2287377510237293e-05, "epoch": 3.31306990881459, "percentage": 66.34, "elapsed_time": "9:20:00", "remaining_time": "4:44:07"}
|
| 817 |
+
{"current_steps": 817, "total_steps": 1230, "loss": 0.2429, "lr": 1.2235040074714488e-05, "epoch": 3.3171225937183384, "percentage": 66.42, "elapsed_time": "9:20:42", "remaining_time": "4:43:26"}
|
| 818 |
+
{"current_steps": 818, "total_steps": 1230, "loss": 0.238, "lr": 1.2182765177111434e-05, "epoch": 3.321175278622087, "percentage": 66.5, "elapsed_time": "9:21:23", "remaining_time": "4:42:45"}
|
| 819 |
+
{"current_steps": 819, "total_steps": 1230, "loss": 0.2612, "lr": 1.213055323844297e-05, "epoch": 3.325227963525836, "percentage": 66.59, "elapsed_time": "9:22:04", "remaining_time": "4:42:03"}
|
| 820 |
+
{"current_steps": 820, "total_steps": 1230, "loss": 0.2373, "lr": 1.2078404679216864e-05, "epoch": 3.3292806484295845, "percentage": 66.67, "elapsed_time": "9:22:45", "remaining_time": "4:41:22"}
|
| 821 |
+
{"current_steps": 821, "total_steps": 1230, "loss": 0.2556, "lr": 1.2026319919430458e-05, "epoch": 3.3333333333333335, "percentage": 66.75, "elapsed_time": "9:23:28", "remaining_time": "4:40:42"}
|
| 822 |
+
{"current_steps": 822, "total_steps": 1230, "loss": 0.2481, "lr": 1.1974299378567227e-05, "epoch": 3.337386018237082, "percentage": 66.83, "elapsed_time": "9:24:08", "remaining_time": "4:40:00"}
|
| 823 |
+
{"current_steps": 823, "total_steps": 1230, "loss": 0.2523, "lr": 1.1922343475593462e-05, "epoch": 3.341438703140831, "percentage": 66.91, "elapsed_time": "9:24:52", "remaining_time": "4:39:20"}
|
| 824 |
+
{"current_steps": 824, "total_steps": 1230, "loss": 0.2531, "lr": 1.187045262895488e-05, "epoch": 3.3454913880445796, "percentage": 66.99, "elapsed_time": "9:25:29", "remaining_time": "4:38:37"}
|
| 825 |
+
{"current_steps": 825, "total_steps": 1230, "loss": 0.2443, "lr": 1.1818627256573203e-05, "epoch": 3.349544072948328, "percentage": 67.07, "elapsed_time": "9:26:09", "remaining_time": "4:37:56"}
|
| 826 |
+
{"current_steps": 826, "total_steps": 1230, "loss": 0.2371, "lr": 1.1766867775842864e-05, "epoch": 3.353596757852077, "percentage": 67.15, "elapsed_time": "9:26:43", "remaining_time": "4:37:11"}
|
| 827 |
+
{"current_steps": 827, "total_steps": 1230, "loss": 0.2519, "lr": 1.1715174603627615e-05, "epoch": 3.3576494427558257, "percentage": 67.24, "elapsed_time": "9:27:26", "remaining_time": "4:36:30"}
|
| 828 |
+
{"current_steps": 828, "total_steps": 1230, "loss": 0.2386, "lr": 1.1663548156257147e-05, "epoch": 3.3617021276595747, "percentage": 67.32, "elapsed_time": "9:28:06", "remaining_time": "4:35:49"}
|
| 829 |
+
{"current_steps": 829, "total_steps": 1230, "loss": 0.2471, "lr": 1.161198884952377e-05, "epoch": 3.365754812563323, "percentage": 67.4, "elapsed_time": "9:28:43", "remaining_time": "4:35:06"}
|
| 830 |
+
{"current_steps": 830, "total_steps": 1230, "loss": 0.2453, "lr": 1.1560497098679056e-05, "epoch": 3.3698074974670718, "percentage": 67.48, "elapsed_time": "9:29:23", "remaining_time": "4:34:24"}
|
| 831 |
+
{"current_steps": 831, "total_steps": 1230, "loss": 0.242, "lr": 1.1509073318430479e-05, "epoch": 3.3738601823708207, "percentage": 67.56, "elapsed_time": "9:30:03", "remaining_time": "4:33:42"}
|
| 832 |
+
{"current_steps": 832, "total_steps": 1230, "loss": 0.2597, "lr": 1.1457717922938116e-05, "epoch": 3.3779128672745693, "percentage": 67.64, "elapsed_time": "9:30:38", "remaining_time": "4:32:58"}
|
| 833 |
+
{"current_steps": 833, "total_steps": 1230, "loss": 0.2543, "lr": 1.1406431325811233e-05, "epoch": 3.3819655521783183, "percentage": 67.72, "elapsed_time": "9:31:20", "remaining_time": "4:32:17"}
|
| 834 |
+
{"current_steps": 834, "total_steps": 1230, "loss": 0.2485, "lr": 1.135521394010506e-05, "epoch": 3.386018237082067, "percentage": 67.8, "elapsed_time": "9:32:02", "remaining_time": "4:31:37"}
|
| 835 |
+
{"current_steps": 835, "total_steps": 1230, "loss": 0.2419, "lr": 1.1304066178317367e-05, "epoch": 3.3900709219858154, "percentage": 67.89, "elapsed_time": "9:32:43", "remaining_time": "4:30:55"}
|
| 836 |
+
{"current_steps": 836, "total_steps": 1230, "loss": 0.2514, "lr": 1.1252988452385199e-05, "epoch": 3.3941236068895644, "percentage": 67.97, "elapsed_time": "9:33:23", "remaining_time": "4:30:14"}
|
| 837 |
+
{"current_steps": 837, "total_steps": 1230, "loss": 0.2434, "lr": 1.1201981173681536e-05, "epoch": 3.398176291793313, "percentage": 68.05, "elapsed_time": "9:34:02", "remaining_time": "4:29:31"}
|
| 838 |
+
{"current_steps": 838, "total_steps": 1230, "loss": 0.2567, "lr": 1.1151044753011991e-05, "epoch": 3.402228976697062, "percentage": 68.13, "elapsed_time": "9:34:42", "remaining_time": "4:28:50"}
|
| 839 |
+
{"current_steps": 839, "total_steps": 1230, "loss": 0.2462, "lr": 1.1100179600611491e-05, "epoch": 3.4062816616008105, "percentage": 68.21, "elapsed_time": "9:35:23", "remaining_time": "4:28:08"}
|
| 840 |
+
{"current_steps": 840, "total_steps": 1230, "loss": 0.2652, "lr": 1.1049386126140985e-05, "epoch": 3.410334346504559, "percentage": 68.29, "elapsed_time": "9:36:00", "remaining_time": "4:27:26"}
|
| 841 |
+
{"current_steps": 841, "total_steps": 1230, "loss": 0.2549, "lr": 1.0998664738684128e-05, "epoch": 3.414387031408308, "percentage": 68.37, "elapsed_time": "9:36:40", "remaining_time": "4:26:44"}
|
| 842 |
+
{"current_steps": 842, "total_steps": 1230, "loss": 0.2611, "lr": 1.0948015846744e-05, "epoch": 3.4184397163120566, "percentage": 68.46, "elapsed_time": "9:37:19", "remaining_time": "4:26:02"}
|
| 843 |
+
{"current_steps": 843, "total_steps": 1230, "loss": 0.2526, "lr": 1.0897439858239832e-05, "epoch": 3.4224924012158056, "percentage": 68.54, "elapsed_time": "9:37:54", "remaining_time": "4:25:18"}
|
| 844 |
+
{"current_steps": 844, "total_steps": 1230, "loss": 0.2433, "lr": 1.0846937180503652e-05, "epoch": 3.426545086119554, "percentage": 68.62, "elapsed_time": "9:38:34", "remaining_time": "4:24:36"}
|
| 845 |
+
{"current_steps": 845, "total_steps": 1230, "loss": 0.2416, "lr": 1.0796508220277117e-05, "epoch": 3.430597771023303, "percentage": 68.7, "elapsed_time": "9:39:18", "remaining_time": "4:23:56"}
|
| 846 |
+
{"current_steps": 846, "total_steps": 1230, "loss": 0.2638, "lr": 1.0746153383708107e-05, "epoch": 3.4346504559270516, "percentage": 68.78, "elapsed_time": "9:39:56", "remaining_time": "4:23:14"}
|
| 847 |
+
{"current_steps": 847, "total_steps": 1230, "loss": 0.272, "lr": 1.0695873076347579e-05, "epoch": 3.4387031408308006, "percentage": 68.86, "elapsed_time": "9:40:36", "remaining_time": "4:22:32"}
|
| 848 |
+
{"current_steps": 848, "total_steps": 1230, "loss": 0.2636, "lr": 1.0645667703146205e-05, "epoch": 3.442755825734549, "percentage": 68.94, "elapsed_time": "9:41:20", "remaining_time": "4:21:52"}
|
| 849 |
+
{"current_steps": 849, "total_steps": 1230, "loss": 0.2343, "lr": 1.0595537668451161e-05, "epoch": 3.4468085106382977, "percentage": 69.02, "elapsed_time": "9:42:00", "remaining_time": "4:21:11"}
|
| 850 |
+
{"current_steps": 850, "total_steps": 1230, "loss": 0.2526, "lr": 1.0545483376002854e-05, "epoch": 3.4508611955420467, "percentage": 69.11, "elapsed_time": "9:42:44", "remaining_time": "4:20:31"}
|
| 851 |
+
{"current_steps": 851, "total_steps": 1230, "loss": 0.2505, "lr": 1.0495505228931676e-05, "epoch": 3.4549138804457953, "percentage": 69.19, "elapsed_time": "9:43:24", "remaining_time": "4:19:49"}
|
| 852 |
+
{"current_steps": 852, "total_steps": 1230, "loss": 0.2548, "lr": 1.044560362975474e-05, "epoch": 3.4589665653495443, "percentage": 69.27, "elapsed_time": "9:44:05", "remaining_time": "4:19:08"}
|
| 853 |
+
{"current_steps": 853, "total_steps": 1230, "loss": 0.2652, "lr": 1.0395778980372695e-05, "epoch": 3.463019250253293, "percentage": 69.35, "elapsed_time": "9:44:44", "remaining_time": "4:18:26"}
|
| 854 |
+
{"current_steps": 854, "total_steps": 1230, "loss": 0.2375, "lr": 1.0346031682066381e-05, "epoch": 3.4670719351570414, "percentage": 69.43, "elapsed_time": "9:45:26", "remaining_time": "4:17:45"}
|
| 855 |
+
{"current_steps": 855, "total_steps": 1230, "loss": 0.2371, "lr": 1.0296362135493724e-05, "epoch": 3.4711246200607904, "percentage": 69.51, "elapsed_time": "9:46:05", "remaining_time": "4:17:03"}
|
| 856 |
+
{"current_steps": 856, "total_steps": 1230, "loss": 0.2632, "lr": 1.0246770740686422e-05, "epoch": 3.475177304964539, "percentage": 69.59, "elapsed_time": "9:46:48", "remaining_time": "4:16:22"}
|
| 857 |
+
{"current_steps": 857, "total_steps": 1230, "loss": 0.2536, "lr": 1.0197257897046743e-05, "epoch": 3.479229989868288, "percentage": 69.67, "elapsed_time": "9:47:27", "remaining_time": "4:15:41"}
|
| 858 |
+
{"current_steps": 858, "total_steps": 1230, "loss": 0.2516, "lr": 1.014782400334433e-05, "epoch": 3.4832826747720365, "percentage": 69.76, "elapsed_time": "9:48:10", "remaining_time": "4:15:00"}
|
| 859 |
+
{"current_steps": 859, "total_steps": 1230, "loss": 0.2391, "lr": 1.009846945771296e-05, "epoch": 3.487335359675785, "percentage": 69.84, "elapsed_time": "9:48:53", "remaining_time": "4:14:20"}
|
| 860 |
+
{"current_steps": 860, "total_steps": 1230, "loss": 0.2529, "lr": 1.0049194657647363e-05, "epoch": 3.491388044579534, "percentage": 69.92, "elapsed_time": "9:49:33", "remaining_time": "4:13:38"}
|
| 861 |
+
{"current_steps": 861, "total_steps": 1230, "loss": 0.2543, "lr": 1.0000000000000006e-05, "epoch": 3.4954407294832825, "percentage": 70.0, "elapsed_time": "9:50:14", "remaining_time": "4:12:57"}
|
| 862 |
+
{"current_steps": 862, "total_steps": 1230, "loss": 0.2546, "lr": 9.950885880977891e-06, "epoch": 3.4994934143870315, "percentage": 70.08, "elapsed_time": "9:50:53", "remaining_time": "4:12:15"}
|
| 863 |
+
{"current_steps": 863, "total_steps": 1230, "loss": 0.248, "lr": 9.901852696139382e-06, "epoch": 3.50354609929078, "percentage": 70.16, "elapsed_time": "9:51:30", "remaining_time": "4:11:32"}
|
| 864 |
+
{"current_steps": 864, "total_steps": 1230, "loss": 0.2629, "lr": 9.852900840391027e-06, "epoch": 3.5075987841945286, "percentage": 70.24, "elapsed_time": "9:52:13", "remaining_time": "4:10:52"}
|
| 865 |
+
{"current_steps": 865, "total_steps": 1230, "loss": 0.2485, "lr": 9.804030707984313e-06, "epoch": 3.5116514690982776, "percentage": 70.33, "elapsed_time": "9:52:50", "remaining_time": "4:10:09"}
|
| 866 |
+
{"current_steps": 866, "total_steps": 1230, "loss": 0.2271, "lr": 9.755242692512599e-06, "epoch": 3.515704154002026, "percentage": 70.41, "elapsed_time": "9:53:28", "remaining_time": "4:09:27"}
|
| 867 |
+
{"current_steps": 867, "total_steps": 1230, "loss": 0.238, "lr": 9.70653718690782e-06, "epoch": 3.519756838905775, "percentage": 70.49, "elapsed_time": "9:54:09", "remaining_time": "4:08:45"}
|
| 868 |
+
{"current_steps": 868, "total_steps": 1230, "loss": 0.2632, "lr": 9.657914583437454e-06, "epoch": 3.5238095238095237, "percentage": 70.57, "elapsed_time": "9:54:48", "remaining_time": "4:08:03"}
|
| 869 |
+
{"current_steps": 869, "total_steps": 1230, "loss": 0.2608, "lr": 9.609375273701246e-06, "epoch": 3.5278622087132723, "percentage": 70.65, "elapsed_time": "9:55:28", "remaining_time": "4:07:22"}
|
| 870 |
+
{"current_steps": 870, "total_steps": 1230, "loss": 0.2482, "lr": 9.560919648628133e-06, "epoch": 3.5319148936170213, "percentage": 70.73, "elapsed_time": "9:56:11", "remaining_time": "4:06:41"}
|
| 871 |
+
{"current_steps": 871, "total_steps": 1230, "loss": 0.2288, "lr": 9.512548098473047e-06, "epoch": 3.5359675785207703, "percentage": 70.81, "elapsed_time": "9:56:53", "remaining_time": "4:06:01"}
|
| 872 |
+
{"current_steps": 872, "total_steps": 1230, "loss": 0.2453, "lr": 9.464261012813825e-06, "epoch": 3.540020263424519, "percentage": 70.89, "elapsed_time": "9:57:34", "remaining_time": "4:05:20"}
|
| 873 |
+
{"current_steps": 873, "total_steps": 1230, "loss": 0.2692, "lr": 9.416058780547987e-06, "epoch": 3.5440729483282674, "percentage": 70.98, "elapsed_time": "9:58:20", "remaining_time": "4:04:40"}
|
| 874 |
+
{"current_steps": 874, "total_steps": 1230, "loss": 0.2641, "lr": 9.367941789889714e-06, "epoch": 3.5481256332320164, "percentage": 71.06, "elapsed_time": "9:59:01", "remaining_time": "4:03:59"}
|
| 875 |
+
{"current_steps": 875, "total_steps": 1230, "loss": 0.244, "lr": 9.319910428366607e-06, "epoch": 3.552178318135765, "percentage": 71.14, "elapsed_time": "9:59:43", "remaining_time": "4:03:18"}
|
| 876 |
+
{"current_steps": 876, "total_steps": 1230, "loss": 0.232, "lr": 9.271965082816667e-06, "epoch": 3.556231003039514, "percentage": 71.22, "elapsed_time": "10:00:21", "remaining_time": "4:02:36"}
|
| 877 |
+
{"current_steps": 877, "total_steps": 1230, "loss": 0.2418, "lr": 9.224106139385111e-06, "epoch": 3.5602836879432624, "percentage": 71.3, "elapsed_time": "10:01:04", "remaining_time": "4:01:56"}
|
| 878 |
+
{"current_steps": 878, "total_steps": 1230, "loss": 0.2477, "lr": 9.176333983521291e-06, "epoch": 3.564336372847011, "percentage": 71.38, "elapsed_time": "10:01:46", "remaining_time": "4:01:15"}
|
| 879 |
+
{"current_steps": 879, "total_steps": 1230, "loss": 0.2463, "lr": 9.12864899997558e-06, "epoch": 3.56838905775076, "percentage": 71.46, "elapsed_time": "10:02:31", "remaining_time": "4:00:35"}
|
| 880 |
+
{"current_steps": 880, "total_steps": 1230, "loss": 0.247, "lr": 9.08105157279628e-06, "epoch": 3.5724417426545085, "percentage": 71.54, "elapsed_time": "10:03:13", "remaining_time": "3:59:55"}
|
| 881 |
+
{"current_steps": 881, "total_steps": 1230, "loss": 0.2578, "lr": 9.03354208532653e-06, "epoch": 3.5764944275582575, "percentage": 71.63, "elapsed_time": "10:03:55", "remaining_time": "3:59:14"}
|
| 882 |
+
{"current_steps": 882, "total_steps": 1230, "loss": 0.2374, "lr": 8.986120920201205e-06, "epoch": 3.580547112462006, "percentage": 71.71, "elapsed_time": "10:04:33", "remaining_time": "3:58:32"}
|
| 883 |
+
{"current_steps": 883, "total_steps": 1230, "loss": 0.2574, "lr": 8.938788459343852e-06, "epoch": 3.5845997973657546, "percentage": 71.79, "elapsed_time": "10:05:15", "remaining_time": "3:57:51"}
|
| 884 |
+
{"current_steps": 884, "total_steps": 1230, "loss": 0.2423, "lr": 8.8915450839636e-06, "epoch": 3.5886524822695036, "percentage": 71.87, "elapsed_time": "10:05:55", "remaining_time": "3:57:09"}
|
| 885 |
+
{"current_steps": 885, "total_steps": 1230, "loss": 0.2604, "lr": 8.844391174552116e-06, "epoch": 3.592705167173252, "percentage": 71.95, "elapsed_time": "10:06:35", "remaining_time": "3:56:27"}
|
| 886 |
+
{"current_steps": 886, "total_steps": 1230, "loss": 0.242, "lr": 8.797327110880479e-06, "epoch": 3.596757852077001, "percentage": 72.03, "elapsed_time": "10:07:14", "remaining_time": "3:55:46"}
|
| 887 |
+
{"current_steps": 887, "total_steps": 1230, "loss": 0.2648, "lr": 8.750353271996206e-06, "epoch": 3.6008105369807497, "percentage": 72.11, "elapsed_time": "10:07:53", "remaining_time": "3:55:04"}
|
| 888 |
+
{"current_steps": 888, "total_steps": 1230, "loss": 0.2499, "lr": 8.703470036220132e-06, "epoch": 3.6048632218844983, "percentage": 72.2, "elapsed_time": "10:08:31", "remaining_time": "3:54:21"}
|
| 889 |
+
{"current_steps": 889, "total_steps": 1230, "loss": 0.2478, "lr": 8.656677781143394e-06, "epoch": 3.6089159067882473, "percentage": 72.28, "elapsed_time": "10:09:13", "remaining_time": "3:53:40"}
|
| 890 |
+
{"current_steps": 890, "total_steps": 1230, "loss": 0.2555, "lr": 8.609976883624377e-06, "epoch": 3.612968591691996, "percentage": 72.36, "elapsed_time": "10:09:54", "remaining_time": "3:52:59"}
|
| 891 |
+
{"current_steps": 891, "total_steps": 1230, "loss": 0.2617, "lr": 8.563367719785698e-06, "epoch": 3.617021276595745, "percentage": 72.44, "elapsed_time": "10:10:36", "remaining_time": "3:52:18"}
|
| 892 |
+
{"current_steps": 892, "total_steps": 1230, "loss": 0.2337, "lr": 8.516850665011138e-06, "epoch": 3.6210739614994933, "percentage": 72.52, "elapsed_time": "10:11:12", "remaining_time": "3:51:36"}
|
| 893 |
+
{"current_steps": 893, "total_steps": 1230, "loss": 0.262, "lr": 8.47042609394269e-06, "epoch": 3.625126646403242, "percentage": 72.6, "elapsed_time": "10:11:52", "remaining_time": "3:50:54"}
|
| 894 |
+
{"current_steps": 894, "total_steps": 1230, "loss": 0.2435, "lr": 8.424094380477432e-06, "epoch": 3.629179331306991, "percentage": 72.68, "elapsed_time": "10:12:31", "remaining_time": "3:50:12"}
|
| 895 |
+
{"current_steps": 895, "total_steps": 1230, "loss": 0.2556, "lr": 8.37785589776465e-06, "epoch": 3.63323201621074, "percentage": 72.76, "elapsed_time": "10:13:11", "remaining_time": "3:49:31"}
|
| 896 |
+
{"current_steps": 896, "total_steps": 1230, "loss": 0.2649, "lr": 8.331711018202694e-06, "epoch": 3.6372847011144884, "percentage": 72.85, "elapsed_time": "10:13:52", "remaining_time": "3:48:50"}
|
| 897 |
+
{"current_steps": 897, "total_steps": 1230, "loss": 0.2655, "lr": 8.285660113436104e-06, "epoch": 3.641337386018237, "percentage": 72.93, "elapsed_time": "10:14:37", "remaining_time": "3:48:10"}
|
| 898 |
+
{"current_steps": 898, "total_steps": 1230, "loss": 0.2438, "lr": 8.239703554352527e-06, "epoch": 3.645390070921986, "percentage": 73.01, "elapsed_time": "10:15:19", "remaining_time": "3:47:29"}
|
| 899 |
+
{"current_steps": 899, "total_steps": 1230, "loss": 0.2368, "lr": 8.193841711079775e-06, "epoch": 3.6494427558257345, "percentage": 73.09, "elapsed_time": "10:16:00", "remaining_time": "3:46:48"}
|
| 900 |
+
{"current_steps": 900, "total_steps": 1230, "loss": 0.2474, "lr": 8.148074952982828e-06, "epoch": 3.6534954407294835, "percentage": 73.17, "elapsed_time": "10:16:44", "remaining_time": "3:46:08"}
|
| 901 |
+
{"current_steps": 901, "total_steps": 1230, "loss": 0.27, "lr": 8.102403648660859e-06, "epoch": 3.657548125633232, "percentage": 73.25, "elapsed_time": "10:17:23", "remaining_time": "3:45:26"}
|
| 902 |
+
{"current_steps": 902, "total_steps": 1230, "loss": 0.2475, "lr": 8.056828165944282e-06, "epoch": 3.6616008105369806, "percentage": 73.33, "elapsed_time": "10:18:06", "remaining_time": "3:44:46"}
|
| 903 |
+
{"current_steps": 903, "total_steps": 1230, "loss": 0.2623, "lr": 8.011348871891762e-06, "epoch": 3.6656534954407296, "percentage": 73.41, "elapsed_time": "10:18:48", "remaining_time": "3:44:05"}
|
| 904 |
+
{"current_steps": 904, "total_steps": 1230, "loss": 0.2642, "lr": 7.965966132787287e-06, "epoch": 3.669706180344478, "percentage": 73.5, "elapsed_time": "10:19:28", "remaining_time": "3:43:23"}
|
| 905 |
+
{"current_steps": 905, "total_steps": 1230, "loss": 0.2359, "lr": 7.920680314137189e-06, "epoch": 3.673758865248227, "percentage": 73.58, "elapsed_time": "10:20:11", "remaining_time": "3:42:43"}
|
| 906 |
+
{"current_steps": 906, "total_steps": 1230, "loss": 0.2507, "lr": 7.875491780667246e-06, "epoch": 3.6778115501519757, "percentage": 73.66, "elapsed_time": "10:20:50", "remaining_time": "3:42:01"}
|
| 907 |
+
{"current_steps": 907, "total_steps": 1230, "loss": 0.2388, "lr": 7.830400896319667e-06, "epoch": 3.6818642350557242, "percentage": 73.74, "elapsed_time": "10:21:29", "remaining_time": "3:41:19"}
|
| 908 |
+
{"current_steps": 908, "total_steps": 1230, "loss": 0.2628, "lr": 7.785408024250259e-06, "epoch": 3.6859169199594732, "percentage": 73.82, "elapsed_time": "10:22:09", "remaining_time": "3:40:38"}
|
| 909 |
+
{"current_steps": 909, "total_steps": 1230, "loss": 0.247, "lr": 7.74051352682542e-06, "epoch": 3.689969604863222, "percentage": 73.9, "elapsed_time": "10:22:50", "remaining_time": "3:39:56"}
|
| 910 |
+
{"current_steps": 910, "total_steps": 1230, "loss": 0.2725, "lr": 7.695717765619257e-06, "epoch": 3.694022289766971, "percentage": 73.98, "elapsed_time": "10:23:33", "remaining_time": "3:39:16"}
|
| 911 |
+
{"current_steps": 911, "total_steps": 1230, "loss": 0.2636, "lr": 7.651021101410673e-06, "epoch": 3.6980749746707193, "percentage": 74.07, "elapsed_time": "10:24:16", "remaining_time": "3:38:35"}
|
| 912 |
+
{"current_steps": 912, "total_steps": 1230, "loss": 0.2654, "lr": 7.606423894180464e-06, "epoch": 3.702127659574468, "percentage": 74.15, "elapsed_time": "10:25:00", "remaining_time": "3:37:55"}
|
| 913 |
+
{"current_steps": 913, "total_steps": 1230, "loss": 0.2435, "lr": 7.56192650310839e-06, "epoch": 3.706180344478217, "percentage": 74.23, "elapsed_time": "10:25:43", "remaining_time": "3:37:15"}
|
| 914 |
+
{"current_steps": 914, "total_steps": 1230, "loss": 0.2593, "lr": 7.517529286570349e-06, "epoch": 3.7102330293819654, "percentage": 74.31, "elapsed_time": "10:26:26", "remaining_time": "3:36:34"}
|
| 915 |
+
{"current_steps": 915, "total_steps": 1230, "loss": 0.2437, "lr": 7.473232602135387e-06, "epoch": 3.7142857142857144, "percentage": 74.39, "elapsed_time": "10:27:04", "remaining_time": "3:35:52"}
|
| 916 |
+
{"current_steps": 916, "total_steps": 1230, "loss": 0.2569, "lr": 7.429036806562935e-06, "epoch": 3.718338399189463, "percentage": 74.47, "elapsed_time": "10:27:45", "remaining_time": "3:35:11"}
|
| 917 |
+
{"current_steps": 917, "total_steps": 1230, "loss": 0.2329, "lr": 7.3849422557998455e-06, "epoch": 3.7223910840932115, "percentage": 74.55, "elapsed_time": "10:28:23", "remaining_time": "3:34:29"}
|
| 918 |
+
{"current_steps": 918, "total_steps": 1230, "loss": 0.2474, "lr": 7.340949304977567e-06, "epoch": 3.7264437689969605, "percentage": 74.63, "elapsed_time": "10:29:00", "remaining_time": "3:33:46"}
|
| 919 |
+
{"current_steps": 919, "total_steps": 1230, "loss": 0.2375, "lr": 7.297058308409282e-06, "epoch": 3.7304964539007095, "percentage": 74.72, "elapsed_time": "10:29:41", "remaining_time": "3:33:05"}
|
| 920 |
+
{"current_steps": 920, "total_steps": 1230, "loss": 0.2451, "lr": 7.25326961958704e-06, "epoch": 3.734549138804458, "percentage": 74.8, "elapsed_time": "10:30:21", "remaining_time": "3:32:24"}
|
| 921 |
+
{"current_steps": 921, "total_steps": 1230, "loss": 0.2505, "lr": 7.209583591178921e-06, "epoch": 3.7386018237082066, "percentage": 74.88, "elapsed_time": "10:31:02", "remaining_time": "3:31:43"}
|
| 922 |
+
{"current_steps": 922, "total_steps": 1230, "loss": 0.2346, "lr": 7.1660005750261925e-06, "epoch": 3.742654508611955, "percentage": 74.96, "elapsed_time": "10:31:43", "remaining_time": "3:31:02"}
|
| 923 |
+
{"current_steps": 923, "total_steps": 1230, "loss": 0.2691, "lr": 7.1225209221404765e-06, "epoch": 3.746707193515704, "percentage": 75.04, "elapsed_time": "10:32:24", "remaining_time": "3:30:20"}
|
| 924 |
+
{"current_steps": 924, "total_steps": 1230, "loss": 0.2514, "lr": 7.079144982700909e-06, "epoch": 3.750759878419453, "percentage": 75.12, "elapsed_time": "10:33:07", "remaining_time": "3:29:40"}
|
| 925 |
+
{"current_steps": 925, "total_steps": 1230, "loss": 0.2666, "lr": 7.0358731060513695e-06, "epoch": 3.7548125633232017, "percentage": 75.2, "elapsed_time": "10:33:49", "remaining_time": "3:28:59"}
|
| 926 |
+
{"current_steps": 926, "total_steps": 1230, "loss": 0.2454, "lr": 6.99270564069757e-06, "epoch": 3.7588652482269502, "percentage": 75.28, "elapsed_time": "10:34:31", "remaining_time": "3:28:18"}
|
| 927 |
+
{"current_steps": 927, "total_steps": 1230, "loss": 0.2486, "lr": 6.949642934304375e-06, "epoch": 3.762917933130699, "percentage": 75.37, "elapsed_time": "10:35:12", "remaining_time": "3:27:37"}
|
| 928 |
+
{"current_steps": 928, "total_steps": 1230, "loss": 0.2329, "lr": 6.906685333692871e-06, "epoch": 3.7669706180344478, "percentage": 75.45, "elapsed_time": "10:35:49", "remaining_time": "3:26:55"}
|
| 929 |
+
{"current_steps": 929, "total_steps": 1230, "loss": 0.2424, "lr": 6.86383318483769e-06, "epoch": 3.7710233029381968, "percentage": 75.53, "elapsed_time": "10:36:32", "remaining_time": "3:26:14"}
|
| 930 |
+
{"current_steps": 930, "total_steps": 1230, "loss": 0.2554, "lr": 6.821086832864139e-06, "epoch": 3.7750759878419453, "percentage": 75.61, "elapsed_time": "10:37:15", "remaining_time": "3:25:33"}
|
| 931 |
+
{"current_steps": 931, "total_steps": 1230, "loss": 0.2603, "lr": 6.77844662204546e-06, "epoch": 3.779128672745694, "percentage": 75.69, "elapsed_time": "10:37:57", "remaining_time": "3:24:53"}
|
| 932 |
+
{"current_steps": 932, "total_steps": 1230, "loss": 0.248, "lr": 6.7359128958000455e-06, "epoch": 3.783181357649443, "percentage": 75.77, "elapsed_time": "10:38:41", "remaining_time": "3:24:12"}
|
| 933 |
+
{"current_steps": 933, "total_steps": 1230, "loss": 0.249, "lr": 6.693485996688695e-06, "epoch": 3.7872340425531914, "percentage": 75.85, "elapsed_time": "10:39:20", "remaining_time": "3:23:31"}
|
| 934 |
+
{"current_steps": 934, "total_steps": 1230, "loss": 0.2536, "lr": 6.651166266411801e-06, "epoch": 3.7912867274569404, "percentage": 75.93, "elapsed_time": "10:40:00", "remaining_time": "3:22:49"}
|
| 935 |
+
{"current_steps": 935, "total_steps": 1230, "loss": 0.2554, "lr": 6.6089540458066725e-06, "epoch": 3.795339412360689, "percentage": 76.02, "elapsed_time": "10:40:44", "remaining_time": "3:22:09"}
|
| 936 |
+
{"current_steps": 936, "total_steps": 1230, "loss": 0.236, "lr": 6.566849674844711e-06, "epoch": 3.7993920972644375, "percentage": 76.1, "elapsed_time": "10:41:24", "remaining_time": "3:21:28"}
|
| 937 |
+
{"current_steps": 937, "total_steps": 1230, "loss": 0.2542, "lr": 6.524853492628747e-06, "epoch": 3.8034447821681865, "percentage": 76.18, "elapsed_time": "10:42:05", "remaining_time": "3:20:47"}
|
| 938 |
+
{"current_steps": 938, "total_steps": 1230, "loss": 0.2607, "lr": 6.4829658373902536e-06, "epoch": 3.807497467071935, "percentage": 76.26, "elapsed_time": "10:42:45", "remaining_time": "3:20:05"}
|
| 939 |
+
{"current_steps": 939, "total_steps": 1230, "loss": 0.25, "lr": 6.441187046486648e-06, "epoch": 3.811550151975684, "percentage": 76.34, "elapsed_time": "10:43:27", "remaining_time": "3:19:24"}
|
| 940 |
+
{"current_steps": 940, "total_steps": 1230, "loss": 0.2565, "lr": 6.399517456398567e-06, "epoch": 3.8156028368794326, "percentage": 76.42, "elapsed_time": "10:44:11", "remaining_time": "3:18:44"}
|
| 941 |
+
{"current_steps": 941, "total_steps": 1230, "loss": 0.2492, "lr": 6.357957402727164e-06, "epoch": 3.819655521783181, "percentage": 76.5, "elapsed_time": "10:44:54", "remaining_time": "3:18:03"}
|
| 942 |
+
{"current_steps": 942, "total_steps": 1230, "loss": 0.2476, "lr": 6.316507220191395e-06, "epoch": 3.82370820668693, "percentage": 76.59, "elapsed_time": "10:45:37", "remaining_time": "3:17:23"}
|
| 943 |
+
{"current_steps": 943, "total_steps": 1230, "loss": 0.2339, "lr": 6.275167242625331e-06, "epoch": 3.8277608915906787, "percentage": 76.67, "elapsed_time": "10:46:16", "remaining_time": "3:16:41"}
|
| 944 |
+
{"current_steps": 944, "total_steps": 1230, "loss": 0.2592, "lr": 6.233937802975471e-06, "epoch": 3.8318135764944277, "percentage": 76.75, "elapsed_time": "10:46:54", "remaining_time": "3:15:59"}
|
| 945 |
+
{"current_steps": 945, "total_steps": 1230, "loss": 0.2419, "lr": 6.192819233298046e-06, "epoch": 3.835866261398176, "percentage": 76.83, "elapsed_time": "10:47:33", "remaining_time": "3:15:17"}
|
| 946 |
+
{"current_steps": 946, "total_steps": 1230, "loss": 0.2607, "lr": 6.151811864756383e-06, "epoch": 3.8399189463019248, "percentage": 76.91, "elapsed_time": "10:48:11", "remaining_time": "3:14:35"}
|
| 947 |
+
{"current_steps": 947, "total_steps": 1230, "loss": 0.2683, "lr": 6.1109160276181655e-06, "epoch": 3.8439716312056738, "percentage": 76.99, "elapsed_time": "10:48:51", "remaining_time": "3:13:54"}
|
| 948 |
+
{"current_steps": 948, "total_steps": 1230, "loss": 0.2698, "lr": 6.070132051252868e-06, "epoch": 3.8480243161094227, "percentage": 77.07, "elapsed_time": "10:49:35", "remaining_time": "3:13:14"}
|
| 949 |
+
{"current_steps": 949, "total_steps": 1230, "loss": 0.2492, "lr": 6.0294602641290034e-06, "epoch": 3.8520770010131713, "percentage": 77.15, "elapsed_time": "10:50:17", "remaining_time": "3:12:33"}
|
| 950 |
+
{"current_steps": 950, "total_steps": 1230, "loss": 0.232, "lr": 5.988900993811575e-06, "epoch": 3.85612968591692, "percentage": 77.24, "elapsed_time": "10:50:52", "remaining_time": "3:11:50"}
|
| 951 |
+
{"current_steps": 951, "total_steps": 1230, "loss": 0.2368, "lr": 5.948454566959363e-06, "epoch": 3.860182370820669, "percentage": 77.32, "elapsed_time": "10:51:39", "remaining_time": "3:11:10"}
|
| 952 |
+
{"current_steps": 952, "total_steps": 1230, "loss": 0.2474, "lr": 5.908121309322328e-06, "epoch": 3.8642350557244174, "percentage": 77.4, "elapsed_time": "10:52:19", "remaining_time": "3:10:29"}
|
| 953 |
+
{"current_steps": 953, "total_steps": 1230, "loss": 0.2433, "lr": 5.867901545738976e-06, "epoch": 3.8682877406281664, "percentage": 77.48, "elapsed_time": "10:53:01", "remaining_time": "3:09:48"}
|
| 954 |
+
{"current_steps": 954, "total_steps": 1230, "loss": 0.2566, "lr": 5.827795600133774e-06, "epoch": 3.872340425531915, "percentage": 77.56, "elapsed_time": "10:53:41", "remaining_time": "3:09:07"}
|
| 955 |
+
{"current_steps": 955, "total_steps": 1230, "loss": 0.2521, "lr": 5.787803795514466e-06, "epoch": 3.8763931104356635, "percentage": 77.64, "elapsed_time": "10:54:23", "remaining_time": "3:08:26"}
|
| 956 |
+
{"current_steps": 956, "total_steps": 1230, "loss": 0.2443, "lr": 5.747926453969576e-06, "epoch": 3.8804457953394125, "percentage": 77.72, "elapsed_time": "10:55:08", "remaining_time": "3:07:46"}
|
| 957 |
+
{"current_steps": 957, "total_steps": 1230, "loss": 0.2303, "lr": 5.708163896665708e-06, "epoch": 3.884498480243161, "percentage": 77.8, "elapsed_time": "10:55:49", "remaining_time": "3:07:05"}
|
| 958 |
+
{"current_steps": 958, "total_steps": 1230, "loss": 0.2455, "lr": 5.668516443845047e-06, "epoch": 3.88855116514691, "percentage": 77.89, "elapsed_time": "10:56:29", "remaining_time": "3:06:23"}
|
| 959 |
+
{"current_steps": 959, "total_steps": 1230, "loss": 0.26, "lr": 5.6289844148227225e-06, "epoch": 3.8926038500506586, "percentage": 77.97, "elapsed_time": "10:57:12", "remaining_time": "3:05:43"}
|
| 960 |
+
{"current_steps": 960, "total_steps": 1230, "loss": 0.2605, "lr": 5.5895681279842615e-06, "epoch": 3.896656534954407, "percentage": 78.05, "elapsed_time": "10:57:49", "remaining_time": "3:05:00"}
|
| 961 |
+
{"current_steps": 961, "total_steps": 1230, "loss": 0.2572, "lr": 5.550267900783019e-06, "epoch": 3.900709219858156, "percentage": 78.13, "elapsed_time": "10:58:30", "remaining_time": "3:04:19"}
|
| 962 |
+
{"current_steps": 962, "total_steps": 1230, "loss": 0.267, "lr": 5.511084049737623e-06, "epoch": 3.9047619047619047, "percentage": 78.21, "elapsed_time": "10:59:12", "remaining_time": "3:03:38"}
|
| 963 |
+
{"current_steps": 963, "total_steps": 1230, "loss": 0.2477, "lr": 5.4720168904294215e-06, "epoch": 3.9088145896656536, "percentage": 78.29, "elapsed_time": "10:59:51", "remaining_time": "3:02:56"}
|
| 964 |
+
{"current_steps": 964, "total_steps": 1230, "loss": 0.2581, "lr": 5.433066737499948e-06, "epoch": 3.912867274569402, "percentage": 78.37, "elapsed_time": "11:00:33", "remaining_time": "3:02:16"}
|
| 965 |
+
{"current_steps": 965, "total_steps": 1230, "loss": 0.2412, "lr": 5.394233904648376e-06, "epoch": 3.9169199594731507, "percentage": 78.46, "elapsed_time": "11:01:14", "remaining_time": "3:01:35"}
|
| 966 |
+
{"current_steps": 966, "total_steps": 1230, "loss": 0.2383, "lr": 5.355518704628997e-06, "epoch": 3.9209726443768997, "percentage": 78.54, "elapsed_time": "11:01:54", "remaining_time": "3:00:53"}
|
| 967 |
+
{"current_steps": 967, "total_steps": 1230, "loss": 0.2557, "lr": 5.316921449248731e-06, "epoch": 3.9250253292806483, "percentage": 78.62, "elapsed_time": "11:02:34", "remaining_time": "3:00:12"}
|
| 968 |
+
{"current_steps": 968, "total_steps": 1230, "loss": 0.2532, "lr": 5.278442449364538e-06, "epoch": 3.9290780141843973, "percentage": 78.7, "elapsed_time": "11:03:19", "remaining_time": "2:59:32"}
|
| 969 |
+
{"current_steps": 969, "total_steps": 1230, "loss": 0.2233, "lr": 5.240082014881016e-06, "epoch": 3.933130699088146, "percentage": 78.78, "elapsed_time": "11:03:58", "remaining_time": "2:58:50"}
|
| 970 |
+
{"current_steps": 970, "total_steps": 1230, "loss": 0.2615, "lr": 5.201840454747822e-06, "epoch": 3.9371833839918944, "percentage": 78.86, "elapsed_time": "11:04:37", "remaining_time": "2:58:08"}
|
| 971 |
+
{"current_steps": 971, "total_steps": 1230, "loss": 0.2551, "lr": 5.163718076957223e-06, "epoch": 3.9412360688956434, "percentage": 78.94, "elapsed_time": "11:05:21", "remaining_time": "2:57:28"}
|
| 972 |
+
{"current_steps": 972, "total_steps": 1230, "loss": 0.2357, "lr": 5.125715188541609e-06, "epoch": 3.9452887537993924, "percentage": 79.02, "elapsed_time": "11:06:01", "remaining_time": "2:56:47"}
|
| 973 |
+
{"current_steps": 973, "total_steps": 1230, "loss": 0.2398, "lr": 5.087832095571021e-06, "epoch": 3.949341438703141, "percentage": 79.11, "elapsed_time": "11:06:43", "remaining_time": "2:56:06"}
|
| 974 |
+
{"current_steps": 974, "total_steps": 1230, "loss": 0.2656, "lr": 5.0500691031506766e-06, "epoch": 3.9533941236068895, "percentage": 79.19, "elapsed_time": "11:07:23", "remaining_time": "2:55:24"}
|
| 975 |
+
{"current_steps": 975, "total_steps": 1230, "loss": 0.2395, "lr": 5.01242651541854e-06, "epoch": 3.9574468085106385, "percentage": 79.27, "elapsed_time": "11:08:03", "remaining_time": "2:54:43"}
|
| 976 |
+
{"current_steps": 976, "total_steps": 1230, "loss": 0.2416, "lr": 4.974904635542815e-06, "epoch": 3.961499493414387, "percentage": 79.35, "elapsed_time": "11:08:46", "remaining_time": "2:54:02"}
|
| 977 |
+
{"current_steps": 977, "total_steps": 1230, "loss": 0.2541, "lr": 4.937503765719582e-06, "epoch": 3.965552178318136, "percentage": 79.43, "elapsed_time": "11:09:27", "remaining_time": "2:53:21"}
|
| 978 |
+
{"current_steps": 978, "total_steps": 1230, "loss": 0.2507, "lr": 4.900224207170299e-06, "epoch": 3.9696048632218845, "percentage": 79.51, "elapsed_time": "11:10:05", "remaining_time": "2:52:39"}
|
| 979 |
+
{"current_steps": 979, "total_steps": 1230, "loss": 0.253, "lr": 4.8630662601394065e-06, "epoch": 3.973657548125633, "percentage": 79.59, "elapsed_time": "11:10:41", "remaining_time": "2:51:57"}
|
| 980 |
+
{"current_steps": 980, "total_steps": 1230, "loss": 0.2495, "lr": 4.8260302238918995e-06, "epoch": 3.977710233029382, "percentage": 79.67, "elapsed_time": "11:11:22", "remaining_time": "2:51:16"}
|
| 981 |
+
{"current_steps": 981, "total_steps": 1230, "loss": 0.2377, "lr": 4.789116396710924e-06, "epoch": 3.9817629179331306, "percentage": 79.76, "elapsed_time": "11:11:55", "remaining_time": "2:50:32"}
|
| 982 |
+
{"current_steps": 982, "total_steps": 1230, "loss": 0.2426, "lr": 4.752325075895368e-06, "epoch": 3.9858156028368796, "percentage": 79.84, "elapsed_time": "11:12:33", "remaining_time": "2:49:51"}
|
| 983 |
+
{"current_steps": 983, "total_steps": 1230, "loss": 0.2429, "lr": 4.715656557757473e-06, "epoch": 3.989868287740628, "percentage": 79.92, "elapsed_time": "11:13:11", "remaining_time": "2:49:09"}
|
| 984 |
+
{"current_steps": 984, "total_steps": 1230, "loss": 0.2643, "lr": 4.679111137620442e-06, "epoch": 3.9939209726443767, "percentage": 80.0, "elapsed_time": "11:13:54", "remaining_time": "2:48:28"}
|
| 985 |
+
{"current_steps": 985, "total_steps": 1230, "loss": 0.2403, "lr": 4.6426891098160585e-06, "epoch": 3.9979736575481257, "percentage": 80.08, "elapsed_time": "11:14:35", "remaining_time": "2:47:47"}
|
| 986 |
+
{"current_steps": 986, "total_steps": 1230, "loss": 0.1919, "lr": 4.6063907676823474e-06, "epoch": 4.0040526849037485, "percentage": 80.16, "elapsed_time": "11:17:47", "remaining_time": "2:47:43"}
|
| 987 |
+
{"current_steps": 987, "total_steps": 1230, "loss": 0.2246, "lr": 4.570216403561141e-06, "epoch": 4.008105369807497, "percentage": 80.24, "elapsed_time": "11:18:28", "remaining_time": "2:47:02"}
|
| 988 |
+
{"current_steps": 988, "total_steps": 1230, "loss": 0.1995, "lr": 4.534166308795815e-06, "epoch": 4.0121580547112465, "percentage": 80.33, "elapsed_time": "11:19:04", "remaining_time": "2:46:20"}
|
| 989 |
+
{"current_steps": 989, "total_steps": 1230, "loss": 0.2114, "lr": 4.498240773728859e-06, "epoch": 4.016210739614995, "percentage": 80.41, "elapsed_time": "11:19:41", "remaining_time": "2:45:37"}
|