Training in progress, epoch 2
Browse files
model-00001-of-00004.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 4877660776
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:0795c5afa2dc6c3362e6341856d43b8c90a69270a38243970f76a92ea5a712f7
|
| 3 |
size 4877660776
|
model-00002-of-00004.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 4932751008
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:03a516a91748d8bd60fe7dcca35f295ec4a6ac9a99b781060e71d95a37c5a3df
|
| 3 |
size 4932751008
|
model-00003-of-00004.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 4330865200
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:19c4ca84678356e38390493fd5911e786e74c3f0a11a5584309ae1e287ff5c56
|
| 3 |
size 4330865200
|
model-00004-of-00004.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 1089994880
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:410b39956939f91108153ed5f812c1c9195c5830a784ed2e7eed86b682e742bb
|
| 3 |
size 1089994880
|
trainer_log.jsonl
CHANGED
|
@@ -104,3 +104,108 @@
|
|
| 104 |
{"current_steps": 104, "total_steps": 525, "loss": 1.1173, "lr": 7.771749434408989e-05, "epoch": 0.9904761904761905, "percentage": 19.81, "elapsed_time": "2:53:19", "remaining_time": "11:41:36"}
|
| 105 |
{"current_steps": 105, "total_steps": 525, "loss": 1.1137, "lr": 7.762801066684133e-05, "epoch": 1.0, "percentage": 20.0, "elapsed_time": "2:54:58", "remaining_time": "11:39:53"}
|
| 106 |
{"current_steps": 106, "total_steps": 525, "loss": 1.0737, "lr": 7.753686002873087e-05, "epoch": 1.0095238095238095, "percentage": 20.19, "elapsed_time": "2:58:50", "remaining_time": "11:46:56"}
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 104 |
{"current_steps": 104, "total_steps": 525, "loss": 1.1173, "lr": 7.771749434408989e-05, "epoch": 0.9904761904761905, "percentage": 19.81, "elapsed_time": "2:53:19", "remaining_time": "11:41:36"}
|
| 105 |
{"current_steps": 105, "total_steps": 525, "loss": 1.1137, "lr": 7.762801066684133e-05, "epoch": 1.0, "percentage": 20.0, "elapsed_time": "2:54:58", "remaining_time": "11:39:53"}
|
| 106 |
{"current_steps": 106, "total_steps": 525, "loss": 1.0737, "lr": 7.753686002873087e-05, "epoch": 1.0095238095238095, "percentage": 20.19, "elapsed_time": "2:58:50", "remaining_time": "11:46:56"}
|
| 107 |
+
{"current_steps": 107, "total_steps": 525, "loss": 1.0849, "lr": 7.744404646782866e-05, "epoch": 1.019047619047619, "percentage": 20.38, "elapsed_time": "3:00:29", "remaining_time": "11:45:07"}
|
| 108 |
+
{"current_steps": 108, "total_steps": 525, "loss": 1.0861, "lr": 7.734957409587404e-05, "epoch": 1.0285714285714285, "percentage": 20.57, "elapsed_time": "3:02:09", "remaining_time": "11:43:19"}
|
| 109 |
+
{"current_steps": 109, "total_steps": 525, "loss": 1.0785, "lr": 7.725344709809355e-05, "epoch": 1.0380952380952382, "percentage": 20.76, "elapsed_time": "3:03:48", "remaining_time": "11:41:30"}
|
| 110 |
+
{"current_steps": 110, "total_steps": 525, "loss": 1.0963, "lr": 7.715566973301529e-05, "epoch": 1.0476190476190477, "percentage": 20.95, "elapsed_time": "3:05:27", "remaining_time": "11:39:42"}
|
| 111 |
+
{"current_steps": 111, "total_steps": 525, "loss": 1.0728, "lr": 7.70562463322805e-05, "epoch": 1.0571428571428572, "percentage": 21.14, "elapsed_time": "3:07:07", "remaining_time": "11:37:54"}
|
| 112 |
+
{"current_steps": 112, "total_steps": 525, "loss": 1.0806, "lr": 7.695518130045147e-05, "epoch": 1.0666666666666667, "percentage": 21.33, "elapsed_time": "3:08:46", "remaining_time": "11:36:07"}
|
| 113 |
+
{"current_steps": 113, "total_steps": 525, "loss": 1.0981, "lr": 7.685247911481652e-05, "epoch": 1.0761904761904761, "percentage": 21.52, "elapsed_time": "3:10:26", "remaining_time": "11:34:19"}
|
| 114 |
+
{"current_steps": 114, "total_steps": 525, "loss": 1.0734, "lr": 7.674814432519163e-05, "epoch": 1.0857142857142856, "percentage": 21.71, "elapsed_time": "3:12:05", "remaining_time": "11:32:32"}
|
| 115 |
+
{"current_steps": 115, "total_steps": 525, "loss": 1.0658, "lr": 7.664218155371884e-05, "epoch": 1.0952380952380953, "percentage": 21.9, "elapsed_time": "3:13:44", "remaining_time": "11:30:45"}
|
| 116 |
+
{"current_steps": 116, "total_steps": 525, "loss": 1.086, "lr": 7.653459549466157e-05, "epoch": 1.1047619047619048, "percentage": 22.1, "elapsed_time": "3:15:24", "remaining_time": "11:28:58"}
|
| 117 |
+
{"current_steps": 117, "total_steps": 525, "loss": 1.1062, "lr": 7.642539091419654e-05, "epoch": 1.1142857142857143, "percentage": 22.29, "elapsed_time": "3:17:03", "remaining_time": "11:27:10"}
|
| 118 |
+
{"current_steps": 118, "total_steps": 525, "loss": 1.075, "lr": 7.631457265020274e-05, "epoch": 1.1238095238095238, "percentage": 22.48, "elapsed_time": "3:18:42", "remaining_time": "11:25:23"}
|
| 119 |
+
{"current_steps": 119, "total_steps": 525, "loss": 1.0683, "lr": 7.620214561204704e-05, "epoch": 1.1333333333333333, "percentage": 22.67, "elapsed_time": "3:20:22", "remaining_time": "11:23:37"}
|
| 120 |
+
{"current_steps": 120, "total_steps": 525, "loss": 1.0846, "lr": 7.608811478036671e-05, "epoch": 1.1428571428571428, "percentage": 22.86, "elapsed_time": "3:22:02", "remaining_time": "11:21:52"}
|
| 121 |
+
{"current_steps": 121, "total_steps": 525, "loss": 1.0905, "lr": 7.597248520684878e-05, "epoch": 1.1523809523809523, "percentage": 23.05, "elapsed_time": "3:23:42", "remaining_time": "11:20:08"}
|
| 122 |
+
{"current_steps": 122, "total_steps": 525, "loss": 1.0791, "lr": 7.585526201400623e-05, "epoch": 1.161904761904762, "percentage": 23.24, "elapsed_time": "3:25:22", "remaining_time": "11:18:26"}
|
| 123 |
+
{"current_steps": 123, "total_steps": 525, "loss": 1.0869, "lr": 7.57364503949511e-05, "epoch": 1.1714285714285715, "percentage": 23.43, "elapsed_time": "3:27:02", "remaining_time": "11:16:41"}
|
| 124 |
+
{"current_steps": 124, "total_steps": 525, "loss": 1.0688, "lr": 7.56160556131644e-05, "epoch": 1.180952380952381, "percentage": 23.62, "elapsed_time": "3:28:42", "remaining_time": "11:14:55"}
|
| 125 |
+
{"current_steps": 125, "total_steps": 525, "loss": 1.0798, "lr": 7.549408300226287e-05, "epoch": 1.1904761904761905, "percentage": 23.81, "elapsed_time": "3:30:21", "remaining_time": "11:13:08"}
|
| 126 |
+
{"current_steps": 126, "total_steps": 525, "loss": 1.0755, "lr": 7.537053796576282e-05, "epoch": 1.2, "percentage": 24.0, "elapsed_time": "3:32:00", "remaining_time": "11:11:22"}
|
| 127 |
+
{"current_steps": 127, "total_steps": 525, "loss": 1.0722, "lr": 7.524542597684066e-05, "epoch": 1.2095238095238094, "percentage": 24.19, "elapsed_time": "3:33:40", "remaining_time": "11:09:36"}
|
| 128 |
+
{"current_steps": 128, "total_steps": 525, "loss": 1.0718, "lr": 7.51187525780905e-05, "epoch": 1.2190476190476192, "percentage": 24.38, "elapsed_time": "3:35:19", "remaining_time": "11:07:50"}
|
| 129 |
+
{"current_steps": 129, "total_steps": 525, "loss": 1.0778, "lr": 7.499052338127845e-05, "epoch": 1.2285714285714286, "percentage": 24.57, "elapsed_time": "3:36:58", "remaining_time": "11:06:04"}
|
| 130 |
+
{"current_steps": 130, "total_steps": 525, "loss": 1.068, "lr": 7.486074406709429e-05, "epoch": 1.2380952380952381, "percentage": 24.76, "elapsed_time": "3:38:38", "remaining_time": "11:04:18"}
|
| 131 |
+
{"current_steps": 131, "total_steps": 525, "loss": 1.0832, "lr": 7.47294203848995e-05, "epoch": 1.2476190476190476, "percentage": 24.95, "elapsed_time": "3:40:17", "remaining_time": "11:02:32"}
|
| 132 |
+
{"current_steps": 132, "total_steps": 525, "loss": 1.0702, "lr": 7.459655815247278e-05, "epoch": 1.2571428571428571, "percentage": 25.14, "elapsed_time": "3:41:56", "remaining_time": "11:00:47"}
|
| 133 |
+
{"current_steps": 133, "total_steps": 525, "loss": 1.0751, "lr": 7.446216325575225e-05, "epoch": 1.2666666666666666, "percentage": 25.33, "elapsed_time": "3:43:36", "remaining_time": "10:59:02"}
|
| 134 |
+
{"current_steps": 134, "total_steps": 525, "loss": 1.0597, "lr": 7.432624164857465e-05, "epoch": 1.276190476190476, "percentage": 25.52, "elapsed_time": "3:45:15", "remaining_time": "10:57:16"}
|
| 135 |
+
{"current_steps": 135, "total_steps": 525, "loss": 1.0694, "lr": 7.418879935241162e-05, "epoch": 1.2857142857142856, "percentage": 25.71, "elapsed_time": "3:46:54", "remaining_time": "10:55:31"}
|
| 136 |
+
{"current_steps": 136, "total_steps": 525, "loss": 1.0706, "lr": 7.404984245610296e-05, "epoch": 1.2952380952380953, "percentage": 25.9, "elapsed_time": "3:48:33", "remaining_time": "10:53:45"}
|
| 137 |
+
{"current_steps": 137, "total_steps": 525, "loss": 1.0619, "lr": 7.390937711558683e-05, "epoch": 1.3047619047619048, "percentage": 26.1, "elapsed_time": "3:50:13", "remaining_time": "10:52:00"}
|
| 138 |
+
{"current_steps": 138, "total_steps": 525, "loss": 1.0535, "lr": 7.376740955362715e-05, "epoch": 1.3142857142857143, "percentage": 26.29, "elapsed_time": "3:51:52", "remaining_time": "10:50:15"}
|
| 139 |
+
{"current_steps": 139, "total_steps": 525, "loss": 1.0775, "lr": 7.362394605953773e-05, "epoch": 1.3238095238095238, "percentage": 26.48, "elapsed_time": "3:53:31", "remaining_time": "10:48:30"}
|
| 140 |
+
{"current_steps": 140, "total_steps": 525, "loss": 1.0726, "lr": 7.347899298890386e-05, "epoch": 1.3333333333333333, "percentage": 26.67, "elapsed_time": "3:55:11", "remaining_time": "10:46:45"}
|
| 141 |
+
{"current_steps": 141, "total_steps": 525, "loss": 1.0602, "lr": 7.33325567633006e-05, "epoch": 1.342857142857143, "percentage": 26.86, "elapsed_time": "3:56:50", "remaining_time": "10:45:00"}
|
| 142 |
+
{"current_steps": 142, "total_steps": 525, "loss": 1.0774, "lr": 7.31846438700084e-05, "epoch": 1.3523809523809525, "percentage": 27.05, "elapsed_time": "3:58:29", "remaining_time": "10:43:15"}
|
| 143 |
+
{"current_steps": 143, "total_steps": 525, "loss": 1.0846, "lr": 7.303526086172558e-05, "epoch": 1.361904761904762, "percentage": 27.24, "elapsed_time": "4:00:08", "remaining_time": "10:41:30"}
|
| 144 |
+
{"current_steps": 144, "total_steps": 525, "loss": 1.0627, "lr": 7.288441435627821e-05, "epoch": 1.3714285714285714, "percentage": 27.43, "elapsed_time": "4:01:48", "remaining_time": "10:39:46"}
|
| 145 |
+
{"current_steps": 145, "total_steps": 525, "loss": 1.0841, "lr": 7.273211103632676e-05, "epoch": 1.380952380952381, "percentage": 27.62, "elapsed_time": "4:03:27", "remaining_time": "10:38:01"}
|
| 146 |
+
{"current_steps": 146, "total_steps": 525, "loss": 1.0559, "lr": 7.25783576490702e-05, "epoch": 1.3904761904761904, "percentage": 27.81, "elapsed_time": "4:05:06", "remaining_time": "10:36:16"}
|
| 147 |
+
{"current_steps": 147, "total_steps": 525, "loss": 1.063, "lr": 7.242316100594696e-05, "epoch": 1.4, "percentage": 28.0, "elapsed_time": "4:06:45", "remaining_time": "10:34:32"}
|
| 148 |
+
{"current_steps": 148, "total_steps": 525, "loss": 1.0601, "lr": 7.226652798233327e-05, "epoch": 1.4095238095238094, "percentage": 28.19, "elapsed_time": "4:08:25", "remaining_time": "10:32:48"}
|
| 149 |
+
{"current_steps": 149, "total_steps": 525, "loss": 1.0655, "lr": 7.210846551723855e-05, "epoch": 1.4190476190476191, "percentage": 28.38, "elapsed_time": "4:10:04", "remaining_time": "10:31:03"}
|
| 150 |
+
{"current_steps": 150, "total_steps": 525, "loss": 1.0687, "lr": 7.194898061299798e-05, "epoch": 1.4285714285714286, "percentage": 28.57, "elapsed_time": "4:11:43", "remaining_time": "10:29:19"}
|
| 151 |
+
{"current_steps": 151, "total_steps": 525, "loss": 1.0594, "lr": 7.17880803349623e-05, "epoch": 1.438095238095238, "percentage": 28.76, "elapsed_time": "4:13:23", "remaining_time": "10:27:35"}
|
| 152 |
+
{"current_steps": 152, "total_steps": 525, "loss": 1.0747, "lr": 7.162577181118485e-05, "epoch": 1.4476190476190476, "percentage": 28.95, "elapsed_time": "4:15:02", "remaining_time": "10:25:50"}
|
| 153 |
+
{"current_steps": 153, "total_steps": 525, "loss": 1.0722, "lr": 7.146206223210571e-05, "epoch": 1.457142857142857, "percentage": 29.14, "elapsed_time": "4:16:41", "remaining_time": "10:24:07"}
|
| 154 |
+
{"current_steps": 154, "total_steps": 525, "loss": 1.0605, "lr": 7.129695885023321e-05, "epoch": 1.4666666666666668, "percentage": 29.33, "elapsed_time": "4:18:20", "remaining_time": "10:22:23"}
|
| 155 |
+
{"current_steps": 155, "total_steps": 525, "loss": 1.0678, "lr": 7.113046897982265e-05, "epoch": 1.4761904761904763, "percentage": 29.52, "elapsed_time": "4:20:00", "remaining_time": "10:20:39"}
|
| 156 |
+
{"current_steps": 156, "total_steps": 525, "loss": 1.0805, "lr": 7.09625999965522e-05, "epoch": 1.4857142857142858, "percentage": 29.71, "elapsed_time": "4:21:39", "remaining_time": "10:18:55"}
|
| 157 |
+
{"current_steps": 157, "total_steps": 525, "loss": 1.0627, "lr": 7.079335933719625e-05, "epoch": 1.4952380952380953, "percentage": 29.9, "elapsed_time": "4:23:18", "remaining_time": "10:17:11"}
|
| 158 |
+
{"current_steps": 158, "total_steps": 525, "loss": 1.0685, "lr": 7.062275449929587e-05, "epoch": 1.5047619047619047, "percentage": 30.1, "elapsed_time": "4:24:58", "remaining_time": "10:15:28"}
|
| 159 |
+
{"current_steps": 159, "total_steps": 525, "loss": 1.057, "lr": 7.045079304082667e-05, "epoch": 1.5142857142857142, "percentage": 30.29, "elapsed_time": "4:26:37", "remaining_time": "10:13:44"}
|
| 160 |
+
{"current_steps": 160, "total_steps": 525, "loss": 1.0497, "lr": 7.027748257986403e-05, "epoch": 1.5238095238095237, "percentage": 30.48, "elapsed_time": "4:28:17", "remaining_time": "10:12:01"}
|
| 161 |
+
{"current_steps": 161, "total_steps": 525, "loss": 1.0714, "lr": 7.010283079424553e-05, "epoch": 1.5333333333333332, "percentage": 30.67, "elapsed_time": "4:29:56", "remaining_time": "10:10:18"}
|
| 162 |
+
{"current_steps": 162, "total_steps": 525, "loss": 1.0651, "lr": 6.992684542123094e-05, "epoch": 1.5428571428571427, "percentage": 30.86, "elapsed_time": "4:31:35", "remaining_time": "10:08:34"}
|
| 163 |
+
{"current_steps": 163, "total_steps": 525, "loss": 1.0625, "lr": 6.974953425715926e-05, "epoch": 1.5523809523809524, "percentage": 31.05, "elapsed_time": "4:33:15", "remaining_time": "10:06:51"}
|
| 164 |
+
{"current_steps": 164, "total_steps": 525, "loss": 1.06, "lr": 6.957090515710353e-05, "epoch": 1.561904761904762, "percentage": 31.24, "elapsed_time": "4:34:54", "remaining_time": "10:05:08"}
|
| 165 |
+
{"current_steps": 165, "total_steps": 525, "loss": 1.0607, "lr": 6.939096603452269e-05, "epoch": 1.5714285714285714, "percentage": 31.43, "elapsed_time": "4:36:33", "remaining_time": "10:03:24"}
|
| 166 |
+
{"current_steps": 166, "total_steps": 525, "loss": 1.069, "lr": 6.920972486091113e-05, "epoch": 1.580952380952381, "percentage": 31.62, "elapsed_time": "4:38:13", "remaining_time": "10:01:41"}
|
| 167 |
+
{"current_steps": 167, "total_steps": 525, "loss": 1.0555, "lr": 6.902718966544545e-05, "epoch": 1.5904761904761906, "percentage": 31.81, "elapsed_time": "4:39:52", "remaining_time": "9:59:58"}
|
| 168 |
+
{"current_steps": 168, "total_steps": 525, "loss": 1.073, "lr": 6.884336853462879e-05, "epoch": 1.6, "percentage": 32.0, "elapsed_time": "4:41:31", "remaining_time": "9:58:14"}
|
| 169 |
+
{"current_steps": 169, "total_steps": 525, "loss": 1.0662, "lr": 6.865826961193261e-05, "epoch": 1.6095238095238096, "percentage": 32.19, "elapsed_time": "4:43:11", "remaining_time": "9:56:31"}
|
| 170 |
+
{"current_steps": 170, "total_steps": 525, "loss": 1.0524, "lr": 6.84719010974359e-05, "epoch": 1.619047619047619, "percentage": 32.38, "elapsed_time": "4:44:50", "remaining_time": "9:54:48"}
|
| 171 |
+
{"current_steps": 171, "total_steps": 525, "loss": 1.0692, "lr": 6.828427124746191e-05, "epoch": 1.6285714285714286, "percentage": 32.57, "elapsed_time": "4:46:29", "remaining_time": "9:53:05"}
|
| 172 |
+
{"current_steps": 172, "total_steps": 525, "loss": 1.0607, "lr": 6.80953883742124e-05, "epoch": 1.638095238095238, "percentage": 32.76, "elapsed_time": "4:48:09", "remaining_time": "9:51:22"}
|
| 173 |
+
{"current_steps": 173, "total_steps": 525, "loss": 1.0578, "lr": 6.790526084539939e-05, "epoch": 1.6476190476190475, "percentage": 32.95, "elapsed_time": "4:49:48", "remaining_time": "9:49:39"}
|
| 174 |
+
{"current_steps": 174, "total_steps": 525, "loss": 1.0666, "lr": 6.771389708387448e-05, "epoch": 1.657142857142857, "percentage": 33.14, "elapsed_time": "4:51:27", "remaining_time": "9:47:56"}
|
| 175 |
+
{"current_steps": 175, "total_steps": 525, "loss": 1.0694, "lr": 6.752130556725567e-05, "epoch": 1.6666666666666665, "percentage": 33.33, "elapsed_time": "4:53:06", "remaining_time": "9:46:13"}
|
| 176 |
+
{"current_steps": 176, "total_steps": 525, "loss": 1.0632, "lr": 6.73274948275518e-05, "epoch": 1.6761904761904762, "percentage": 33.52, "elapsed_time": "4:54:46", "remaining_time": "9:44:30"}
|
| 177 |
+
{"current_steps": 177, "total_steps": 525, "loss": 1.0543, "lr": 6.713247345078465e-05, "epoch": 1.6857142857142857, "percentage": 33.71, "elapsed_time": "4:56:25", "remaining_time": "9:42:47"}
|
| 178 |
+
{"current_steps": 178, "total_steps": 525, "loss": 1.0575, "lr": 6.693625007660845e-05, "epoch": 1.6952380952380952, "percentage": 33.9, "elapsed_time": "4:58:04", "remaining_time": "9:41:04"}
|
| 179 |
+
{"current_steps": 179, "total_steps": 525, "loss": 1.055, "lr": 6.673883339792723e-05, "epoch": 1.704761904761905, "percentage": 34.1, "elapsed_time": "4:59:43", "remaining_time": "9:39:22"}
|
| 180 |
+
{"current_steps": 180, "total_steps": 525, "loss": 1.071, "lr": 6.654023216050963e-05, "epoch": 1.7142857142857144, "percentage": 34.29, "elapsed_time": "5:01:23", "remaining_time": "9:37:39"}
|
| 181 |
+
{"current_steps": 181, "total_steps": 525, "loss": 1.051, "lr": 6.634045516260156e-05, "epoch": 1.723809523809524, "percentage": 34.48, "elapsed_time": "5:03:02", "remaining_time": "9:35:56"}
|
| 182 |
+
{"current_steps": 182, "total_steps": 525, "loss": 1.0768, "lr": 6.613951125453632e-05, "epoch": 1.7333333333333334, "percentage": 34.67, "elapsed_time": "5:04:41", "remaining_time": "9:34:14"}
|
| 183 |
+
{"current_steps": 183, "total_steps": 525, "loss": 1.0566, "lr": 6.593740933834262e-05, "epoch": 1.7428571428571429, "percentage": 34.86, "elapsed_time": "5:06:21", "remaining_time": "9:32:31"}
|
| 184 |
+
{"current_steps": 184, "total_steps": 525, "loss": 1.073, "lr": 6.573415836735011e-05, "epoch": 1.7523809523809524, "percentage": 35.05, "elapsed_time": "5:08:00", "remaining_time": "9:30:49"}
|
| 185 |
+
{"current_steps": 185, "total_steps": 525, "loss": 1.0602, "lr": 6.552976734579281e-05, "epoch": 1.7619047619047619, "percentage": 35.24, "elapsed_time": "5:09:40", "remaining_time": "9:29:07"}
|
| 186 |
+
{"current_steps": 186, "total_steps": 525, "loss": 1.0592, "lr": 6.53242453284102e-05, "epoch": 1.7714285714285714, "percentage": 35.43, "elapsed_time": "5:11:19", "remaining_time": "9:27:24"}
|
| 187 |
+
{"current_steps": 187, "total_steps": 525, "loss": 1.0607, "lr": 6.511760142004608e-05, "epoch": 1.7809523809523808, "percentage": 35.62, "elapsed_time": "5:12:58", "remaining_time": "9:25:42"}
|
| 188 |
+
{"current_steps": 188, "total_steps": 525, "loss": 1.0685, "lr": 6.49098447752452e-05, "epoch": 1.7904761904761903, "percentage": 35.81, "elapsed_time": "5:14:38", "remaining_time": "9:24:00"}
|
| 189 |
+
{"current_steps": 189, "total_steps": 525, "loss": 1.0566, "lr": 6.470098459784768e-05, "epoch": 1.8, "percentage": 36.0, "elapsed_time": "5:16:17", "remaining_time": "9:22:17"}
|
| 190 |
+
{"current_steps": 190, "total_steps": 525, "loss": 1.0588, "lr": 6.449103014058139e-05, "epoch": 1.8095238095238095, "percentage": 36.19, "elapsed_time": "5:17:57", "remaining_time": "9:20:35"}
|
| 191 |
+
{"current_steps": 191, "total_steps": 525, "loss": 1.0758, "lr": 6.427999070465191e-05, "epoch": 1.819047619047619, "percentage": 36.38, "elapsed_time": "5:19:36", "remaining_time": "9:18:53"}
|
| 192 |
+
{"current_steps": 192, "total_steps": 525, "loss": 1.0561, "lr": 6.406787563933053e-05, "epoch": 1.8285714285714287, "percentage": 36.57, "elapsed_time": "5:21:15", "remaining_time": "9:17:10"}
|
| 193 |
+
{"current_steps": 193, "total_steps": 525, "loss": 1.0806, "lr": 6.385469434154006e-05, "epoch": 1.8380952380952382, "percentage": 36.76, "elapsed_time": "5:22:54", "remaining_time": "9:15:28"}
|
| 194 |
+
{"current_steps": 194, "total_steps": 525, "loss": 1.0601, "lr": 6.364045625543856e-05, "epoch": 1.8476190476190477, "percentage": 36.95, "elapsed_time": "5:24:34", "remaining_time": "9:13:46"}
|
| 195 |
+
{"current_steps": 195, "total_steps": 525, "loss": 1.0586, "lr": 6.342517087200094e-05, "epoch": 1.8571428571428572, "percentage": 37.14, "elapsed_time": "5:26:13", "remaining_time": "9:12:04"}
|
| 196 |
+
{"current_steps": 196, "total_steps": 525, "loss": 1.0571, "lr": 6.320884772859845e-05, "epoch": 1.8666666666666667, "percentage": 37.33, "elapsed_time": "5:27:52", "remaining_time": "9:10:22"}
|
| 197 |
+
{"current_steps": 197, "total_steps": 525, "loss": 1.0571, "lr": 6.29914964085763e-05, "epoch": 1.8761904761904762, "percentage": 37.52, "elapsed_time": "5:29:32", "remaining_time": "9:08:39"}
|
| 198 |
+
{"current_steps": 198, "total_steps": 525, "loss": 1.0606, "lr": 6.277312654082886e-05, "epoch": 1.8857142857142857, "percentage": 37.71, "elapsed_time": "5:31:11", "remaining_time": "9:06:57"}
|
| 199 |
+
{"current_steps": 199, "total_steps": 525, "loss": 1.0493, "lr": 6.255374779937344e-05, "epoch": 1.8952380952380952, "percentage": 37.9, "elapsed_time": "5:32:50", "remaining_time": "9:05:15"}
|
| 200 |
+
{"current_steps": 200, "total_steps": 525, "loss": 1.0619, "lr": 6.23333699029214e-05, "epoch": 1.9047619047619047, "percentage": 38.1, "elapsed_time": "5:34:29", "remaining_time": "9:03:33"}
|
| 201 |
+
{"current_steps": 201, "total_steps": 525, "loss": 1.0541, "lr": 6.211200261444774e-05, "epoch": 1.9142857142857141, "percentage": 38.29, "elapsed_time": "5:36:09", "remaining_time": "9:01:51"}
|
| 202 |
+
{"current_steps": 202, "total_steps": 525, "loss": 1.0559, "lr": 6.188965574075863e-05, "epoch": 1.9238095238095239, "percentage": 38.48, "elapsed_time": "5:37:48", "remaining_time": "9:00:09"}
|
| 203 |
+
{"current_steps": 203, "total_steps": 525, "loss": 1.0545, "lr": 6.166633913205684e-05, "epoch": 1.9333333333333333, "percentage": 38.67, "elapsed_time": "5:39:27", "remaining_time": "8:58:27"}
|
| 204 |
+
{"current_steps": 204, "total_steps": 525, "loss": 1.0586, "lr": 6.144206268150549e-05, "epoch": 1.9428571428571428, "percentage": 38.86, "elapsed_time": "5:41:07", "remaining_time": "8:56:45"}
|
| 205 |
+
{"current_steps": 205, "total_steps": 525, "loss": 1.0457, "lr": 6.12168363247897e-05, "epoch": 1.9523809523809523, "percentage": 39.05, "elapsed_time": "5:42:46", "remaining_time": "8:55:03"}
|
| 206 |
+
{"current_steps": 206, "total_steps": 525, "loss": 1.054, "lr": 6.0990670039676416e-05, "epoch": 1.961904761904762, "percentage": 39.24, "elapsed_time": "5:44:25", "remaining_time": "8:53:21"}
|
| 207 |
+
{"current_steps": 207, "total_steps": 525, "loss": 1.0674, "lr": 6.0763573845572434e-05, "epoch": 1.9714285714285715, "percentage": 39.43, "elapsed_time": "5:46:05", "remaining_time": "8:51:39"}
|
| 208 |
+
{"current_steps": 208, "total_steps": 525, "loss": 1.0469, "lr": 6.053555780308049e-05, "epoch": 1.980952380952381, "percentage": 39.62, "elapsed_time": "5:47:44", "remaining_time": "8:49:58"}
|
| 209 |
+
{"current_steps": 209, "total_steps": 525, "loss": 1.0457, "lr": 6.03066320135536e-05, "epoch": 1.9904761904761905, "percentage": 39.81, "elapsed_time": "5:49:23", "remaining_time": "8:48:16"}
|
| 210 |
+
{"current_steps": 210, "total_steps": 525, "loss": 1.0549, "lr": 6.0076806618647545e-05, "epoch": 2.0, "percentage": 40.0, "elapsed_time": "5:51:03", "remaining_time": "8:46:34"}
|
| 211 |
+
{"current_steps": 211, "total_steps": 525, "loss": 1.0304, "lr": 5.984609179987155e-05, "epoch": 2.0095238095238095, "percentage": 40.19, "elapsed_time": "5:54:35", "remaining_time": "8:47:41"}
|