Training in progress, epoch 2
Browse files
model-00001-of-00004.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 4877660776
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:c618735a76dbbc6670ab48192d0b34b6e065ff65172affd30650dff705c4baee
|
| 3 |
size 4877660776
|
model-00002-of-00004.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 4932751008
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:1bfd159e260b12d17dfc6865a5bd857ada326ec6dd8e10e713cef0a67bdb6e97
|
| 3 |
size 4932751008
|
model-00003-of-00004.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 4330865200
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:90291f4e3ff8e85b3d676ebb3def6998d1c6786920d22e76ea55cced03de7ab7
|
| 3 |
size 4330865200
|
model-00004-of-00004.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 1089994880
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:f8fc11be423581b922239eabe3008dc283a562e328393c91ff7ee6b082e64a92
|
| 3 |
size 1089994880
|
trainer_log.jsonl
CHANGED
|
@@ -207,3 +207,107 @@
|
|
| 207 |
{"current_steps": 207, "total_steps": 312, "loss": 0.5542, "lr": 3.0865828381745515e-06, "epoch": 1.9872, "percentage": 66.35, "elapsed_time": "6:25:33", "remaining_time": "3:15:34"}
|
| 208 |
{"current_steps": 208, "total_steps": 312, "loss": 0.5955, "lr": 3.0348748417303826e-06, "epoch": 1.9968, "percentage": 66.67, "elapsed_time": "6:27:15", "remaining_time": "3:13:37"}
|
| 209 |
{"current_steps": 209, "total_steps": 312, "loss": 1.0655, "lr": 2.9834142279959754e-06, "epoch": 2.0064, "percentage": 66.99, "elapsed_time": "6:30:11", "remaining_time": "3:12:17"}
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 207 |
{"current_steps": 207, "total_steps": 312, "loss": 0.5542, "lr": 3.0865828381745515e-06, "epoch": 1.9872, "percentage": 66.35, "elapsed_time": "6:25:33", "remaining_time": "3:15:34"}
|
| 208 |
{"current_steps": 208, "total_steps": 312, "loss": 0.5955, "lr": 3.0348748417303826e-06, "epoch": 1.9968, "percentage": 66.67, "elapsed_time": "6:27:15", "remaining_time": "3:13:37"}
|
| 209 |
{"current_steps": 209, "total_steps": 312, "loss": 1.0655, "lr": 2.9834142279959754e-06, "epoch": 2.0064, "percentage": 66.99, "elapsed_time": "6:30:11", "remaining_time": "3:12:17"}
|
| 210 |
+
{"current_steps": 210, "total_steps": 312, "loss": 0.5323, "lr": 2.932207475167398e-06, "epoch": 2.016, "percentage": 67.31, "elapsed_time": "6:32:01", "remaining_time": "3:10:24"}
|
| 211 |
+
{"current_steps": 211, "total_steps": 312, "loss": 0.5364, "lr": 2.8812610294830568e-06, "epoch": 2.0256, "percentage": 67.63, "elapsed_time": "6:33:44", "remaining_time": "3:08:28"}
|
| 212 |
+
{"current_steps": 212, "total_steps": 312, "loss": 0.5504, "lr": 2.83058130441221e-06, "epoch": 2.0352, "percentage": 67.95, "elapsed_time": "6:35:33", "remaining_time": "3:06:35"}
|
| 213 |
+
{"current_steps": 213, "total_steps": 312, "loss": 0.4886, "lr": 2.7801746798475905e-06, "epoch": 2.0448, "percentage": 68.27, "elapsed_time": "6:37:25", "remaining_time": "3:04:43"}
|
| 214 |
+
{"current_steps": 214, "total_steps": 312, "loss": 0.563, "lr": 2.7300475013022666e-06, "epoch": 2.0544, "percentage": 68.59, "elapsed_time": "6:39:24", "remaining_time": "3:02:54"}
|
| 215 |
+
{"current_steps": 215, "total_steps": 312, "loss": 0.518, "lr": 2.6802060791108304e-06, "epoch": 2.064, "percentage": 68.91, "elapsed_time": "6:41:19", "remaining_time": "3:01:03"}
|
| 216 |
+
{"current_steps": 216, "total_steps": 312, "loss": 0.465, "lr": 2.6306566876350072e-06, "epoch": 2.0736, "percentage": 69.23, "elapsed_time": "6:43:11", "remaining_time": "2:59:11"}
|
| 217 |
+
{"current_steps": 217, "total_steps": 312, "loss": 0.5807, "lr": 2.5814055644738013e-06, "epoch": 2.0832, "percentage": 69.55, "elapsed_time": "6:45:16", "remaining_time": "2:57:25"}
|
| 218 |
+
{"current_steps": 218, "total_steps": 312, "loss": 0.5353, "lr": 2.532458909678266e-06, "epoch": 2.0928, "percentage": 69.87, "elapsed_time": "6:47:03", "remaining_time": "2:55:31"}
|
| 219 |
+
{"current_steps": 219, "total_steps": 312, "loss": 0.5228, "lr": 2.483822884971e-06, "epoch": 2.1024, "percentage": 70.19, "elapsed_time": "6:49:06", "remaining_time": "2:53:43"}
|
| 220 |
+
{"current_steps": 220, "total_steps": 312, "loss": 0.5144, "lr": 2.43550361297047e-06, "epoch": 2.112, "percentage": 70.51, "elapsed_time": "6:51:09", "remaining_time": "2:51:56"}
|
| 221 |
+
{"current_steps": 221, "total_steps": 312, "loss": 0.5289, "lr": 2.387507176420256e-06, "epoch": 2.1216, "percentage": 70.83, "elapsed_time": "6:53:10", "remaining_time": "2:50:07"}
|
| 222 |
+
{"current_steps": 222, "total_steps": 312, "loss": 0.5164, "lr": 2.339839617423318e-06, "epoch": 2.1312, "percentage": 71.15, "elapsed_time": "6:54:50", "remaining_time": "2:48:10"}
|
| 223 |
+
{"current_steps": 223, "total_steps": 312, "loss": 0.5183, "lr": 2.2925069366813718e-06, "epoch": 2.1408, "percentage": 71.47, "elapsed_time": "6:56:58", "remaining_time": "2:46:25"}
|
| 224 |
+
{"current_steps": 224, "total_steps": 312, "loss": 0.5208, "lr": 2.245515092739488e-06, "epoch": 2.1504, "percentage": 71.79, "elapsed_time": "6:58:56", "remaining_time": "2:44:34"}
|
| 225 |
+
{"current_steps": 225, "total_steps": 312, "loss": 0.5363, "lr": 2.1988700012359865e-06, "epoch": 2.16, "percentage": 72.12, "elapsed_time": "7:00:52", "remaining_time": "2:42:44"}
|
| 226 |
+
{"current_steps": 226, "total_steps": 312, "loss": 0.5223, "lr": 2.1525775341577404e-06, "epoch": 2.1696, "percentage": 72.44, "elapsed_time": "7:02:41", "remaining_time": "2:40:50"}
|
| 227 |
+
{"current_steps": 227, "total_steps": 312, "loss": 0.5162, "lr": 2.1066435191009717e-06, "epoch": 2.1792, "percentage": 72.76, "elapsed_time": "7:04:36", "remaining_time": "2:38:59"}
|
| 228 |
+
{"current_steps": 228, "total_steps": 312, "loss": 0.5156, "lr": 2.061073738537635e-06, "epoch": 2.1888, "percentage": 73.08, "elapsed_time": "7:06:13", "remaining_time": "2:37:01"}
|
| 229 |
+
{"current_steps": 229, "total_steps": 312, "loss": 0.5397, "lr": 2.0158739290874822e-06, "epoch": 2.1984, "percentage": 73.4, "elapsed_time": "7:08:25", "remaining_time": "2:35:16"}
|
| 230 |
+
{"current_steps": 230, "total_steps": 312, "loss": 0.5342, "lr": 1.971049780795901e-06, "epoch": 2.208, "percentage": 73.72, "elapsed_time": "7:10:27", "remaining_time": "2:33:27"}
|
| 231 |
+
{"current_steps": 231, "total_steps": 312, "loss": 0.5118, "lr": 1.9266069364176144e-06, "epoch": 2.2176, "percentage": 74.04, "elapsed_time": "7:12:07", "remaining_time": "2:31:31"}
|
| 232 |
+
{"current_steps": 232, "total_steps": 312, "loss": 0.5245, "lr": 1.8825509907063328e-06, "epoch": 2.2272, "percentage": 74.36, "elapsed_time": "7:13:50", "remaining_time": "2:29:36"}
|
| 233 |
+
{"current_steps": 233, "total_steps": 312, "loss": 0.569, "lr": 1.838887489710452e-06, "epoch": 2.2368, "percentage": 74.68, "elapsed_time": "7:15:37", "remaining_time": "2:27:42"}
|
| 234 |
+
{"current_steps": 234, "total_steps": 312, "loss": 0.494, "lr": 1.7956219300748796e-06, "epoch": 2.2464, "percentage": 75.0, "elapsed_time": "7:17:23", "remaining_time": "2:25:47"}
|
| 235 |
+
{"current_steps": 235, "total_steps": 312, "loss": 0.5668, "lr": 1.7527597583490825e-06, "epoch": 2.2560000000000002, "percentage": 75.32, "elapsed_time": "7:19:26", "remaining_time": "2:23:59"}
|
| 236 |
+
{"current_steps": 236, "total_steps": 312, "loss": 0.5039, "lr": 1.7103063703014372e-06, "epoch": 2.2656, "percentage": 75.64, "elapsed_time": "7:21:18", "remaining_time": "2:22:06"}
|
| 237 |
+
{"current_steps": 237, "total_steps": 312, "loss": 0.5206, "lr": 1.6682671102399806e-06, "epoch": 2.2752, "percentage": 75.96, "elapsed_time": "7:23:16", "remaining_time": "2:20:16"}
|
| 238 |
+
{"current_steps": 238, "total_steps": 312, "loss": 0.5307, "lr": 1.6266472703396286e-06, "epoch": 2.2848, "percentage": 76.28, "elapsed_time": "7:25:05", "remaining_time": "2:18:23"}
|
| 239 |
+
{"current_steps": 239, "total_steps": 312, "loss": 0.4928, "lr": 1.5854520899759656e-06, "epoch": 2.2944, "percentage": 76.6, "elapsed_time": "7:27:11", "remaining_time": "2:16:35"}
|
| 240 |
+
{"current_steps": 240, "total_steps": 312, "loss": 0.565, "lr": 1.544686755065677e-06, "epoch": 2.304, "percentage": 76.92, "elapsed_time": "7:29:11", "remaining_time": "2:14:45"}
|
| 241 |
+
{"current_steps": 241, "total_steps": 312, "loss": 0.5175, "lr": 1.5043563974137132e-06, "epoch": 2.3136, "percentage": 77.24, "elapsed_time": "7:31:02", "remaining_time": "2:12:52"}
|
| 242 |
+
{"current_steps": 242, "total_steps": 312, "loss": 0.5576, "lr": 1.4644660940672628e-06, "epoch": 2.3232, "percentage": 77.56, "elapsed_time": "7:33:02", "remaining_time": "2:11:02"}
|
| 243 |
+
{"current_steps": 243, "total_steps": 312, "loss": 0.4878, "lr": 1.4250208666766235e-06, "epoch": 2.3327999999999998, "percentage": 77.88, "elapsed_time": "7:34:47", "remaining_time": "2:09:08"}
|
| 244 |
+
{"current_steps": 244, "total_steps": 312, "loss": 0.474, "lr": 1.3860256808630429e-06, "epoch": 2.3424, "percentage": 78.21, "elapsed_time": "7:36:43", "remaining_time": "2:07:17"}
|
| 245 |
+
{"current_steps": 245, "total_steps": 312, "loss": 0.5516, "lr": 1.3474854455936126e-06, "epoch": 2.352, "percentage": 78.53, "elapsed_time": "7:38:28", "remaining_time": "2:05:22"}
|
| 246 |
+
{"current_steps": 246, "total_steps": 312, "loss": 0.5117, "lr": 1.3094050125632973e-06, "epoch": 2.3616, "percentage": 78.85, "elapsed_time": "7:40:10", "remaining_time": "2:03:27"}
|
| 247 |
+
{"current_steps": 247, "total_steps": 312, "loss": 0.5253, "lr": 1.2717891755841722e-06, "epoch": 2.3712, "percentage": 79.17, "elapsed_time": "7:42:14", "remaining_time": "2:01:38"}
|
| 248 |
+
{"current_steps": 248, "total_steps": 312, "loss": 0.4987, "lr": 1.234642669981946e-06, "epoch": 2.3808, "percentage": 79.49, "elapsed_time": "7:43:47", "remaining_time": "1:59:41"}
|
| 249 |
+
{"current_steps": 249, "total_steps": 312, "loss": 0.5615, "lr": 1.1979701719998454e-06, "epoch": 2.3904, "percentage": 79.81, "elapsed_time": "7:45:49", "remaining_time": "1:57:51"}
|
| 250 |
+
{"current_steps": 250, "total_steps": 312, "loss": 0.5138, "lr": 1.1617762982099446e-06, "epoch": 2.4, "percentage": 80.13, "elapsed_time": "7:47:47", "remaining_time": "1:56:00"}
|
| 251 |
+
{"current_steps": 251, "total_steps": 312, "loss": 0.529, "lr": 1.1260656049319957e-06, "epoch": 2.4096, "percentage": 80.45, "elapsed_time": "7:49:44", "remaining_time": "1:54:09"}
|
| 252 |
+
{"current_steps": 252, "total_steps": 312, "loss": 0.5435, "lr": 1.0908425876598512e-06, "epoch": 2.4192, "percentage": 80.77, "elapsed_time": "7:51:32", "remaining_time": "1:52:16"}
|
| 253 |
+
{"current_steps": 253, "total_steps": 312, "loss": 0.53, "lr": 1.0561116804955451e-06, "epoch": 2.4288, "percentage": 81.09, "elapsed_time": "7:53:10", "remaining_time": "1:50:20"}
|
| 254 |
+
{"current_steps": 254, "total_steps": 312, "loss": 0.5087, "lr": 1.0218772555910955e-06, "epoch": 2.4384, "percentage": 81.41, "elapsed_time": "7:54:56", "remaining_time": "1:48:27"}
|
| 255 |
+
{"current_steps": 255, "total_steps": 312, "loss": 0.5394, "lr": 9.881436225981107e-07, "epoch": 2.448, "percentage": 81.73, "elapsed_time": "7:56:51", "remaining_time": "1:46:35"}
|
| 256 |
+
{"current_steps": 256, "total_steps": 312, "loss": 0.4832, "lr": 9.549150281252633e-07, "epoch": 2.4576000000000002, "percentage": 82.05, "elapsed_time": "7:58:42", "remaining_time": "1:44:43"}
|
| 257 |
+
{"current_steps": 257, "total_steps": 312, "loss": 0.5408, "lr": 9.221956552036992e-07, "epoch": 2.4672, "percentage": 82.37, "elapsed_time": "8:00:25", "remaining_time": "1:42:48"}
|
| 258 |
+
{"current_steps": 258, "total_steps": 312, "loss": 0.5107, "lr": 8.899896227604509e-07, "epoch": 2.4768, "percentage": 82.69, "elapsed_time": "8:02:11", "remaining_time": "1:40:55"}
|
| 259 |
+
{"current_steps": 259, "total_steps": 312, "loss": 0.5341, "lr": 8.58300985099918e-07, "epoch": 2.4864, "percentage": 83.01, "elapsed_time": "8:04:20", "remaining_time": "1:39:06"}
|
| 260 |
+
{"current_steps": 260, "total_steps": 312, "loss": 0.5153, "lr": 8.271337313934869e-07, "epoch": 2.496, "percentage": 83.33, "elapsed_time": "8:06:16", "remaining_time": "1:37:15"}
|
| 261 |
+
{"current_steps": 261, "total_steps": 312, "loss": 0.5345, "lr": 7.964917851773496e-07, "epoch": 2.5056000000000003, "percentage": 83.65, "elapsed_time": "8:07:59", "remaining_time": "1:35:21"}
|
| 262 |
+
{"current_steps": 262, "total_steps": 312, "loss": 0.5145, "lr": 7.663790038585794e-07, "epoch": 2.5152, "percentage": 83.97, "elapsed_time": "8:09:50", "remaining_time": "1:33:28"}
|
| 263 |
+
{"current_steps": 263, "total_steps": 312, "loss": 0.5243, "lr": 7.367991782295392e-07, "epoch": 2.5248, "percentage": 84.29, "elapsed_time": "8:11:35", "remaining_time": "1:31:35"}
|
| 264 |
+
{"current_steps": 264, "total_steps": 312, "loss": 0.5349, "lr": 7.077560319906696e-07, "epoch": 2.5343999999999998, "percentage": 84.62, "elapsed_time": "8:13:22", "remaining_time": "1:29:42"}
|
| 265 |
+
{"current_steps": 265, "total_steps": 312, "loss": 0.5619, "lr": 6.792532212817271e-07, "epoch": 2.544, "percentage": 84.94, "elapsed_time": "8:15:11", "remaining_time": "1:27:49"}
|
| 266 |
+
{"current_steps": 266, "total_steps": 312, "loss": 0.4899, "lr": 6.512943342215234e-07, "epoch": 2.5536, "percentage": 85.26, "elapsed_time": "8:16:57", "remaining_time": "1:25:56"}
|
| 267 |
+
{"current_steps": 267, "total_steps": 312, "loss": 0.5072, "lr": 6.238828904562316e-07, "epoch": 2.5632, "percentage": 85.58, "elapsed_time": "8:18:44", "remaining_time": "1:24:03"}
|
| 268 |
+
{"current_steps": 268, "total_steps": 312, "loss": 0.5194, "lr": 5.9702234071631e-07, "epoch": 2.5728, "percentage": 85.9, "elapsed_time": "8:20:19", "remaining_time": "1:22:08"}
|
| 269 |
+
{"current_steps": 269, "total_steps": 312, "loss": 0.5599, "lr": 5.707160663821009e-07, "epoch": 2.5824, "percentage": 86.22, "elapsed_time": "8:22:07", "remaining_time": "1:20:15"}
|
| 270 |
+
{"current_steps": 270, "total_steps": 312, "loss": 0.5238, "lr": 5.449673790581611e-07, "epoch": 2.592, "percentage": 86.54, "elapsed_time": "8:24:02", "remaining_time": "1:18:24"}
|
| 271 |
+
{"current_steps": 271, "total_steps": 312, "loss": 0.5116, "lr": 5.197795201563744e-07, "epoch": 2.6016, "percentage": 86.86, "elapsed_time": "8:25:45", "remaining_time": "1:16:30"}
|
| 272 |
+
{"current_steps": 272, "total_steps": 312, "loss": 0.5346, "lr": 4.951556604879049e-07, "epoch": 2.6112, "percentage": 87.18, "elapsed_time": "8:27:38", "remaining_time": "1:14:39"}
|
| 273 |
+
{"current_steps": 273, "total_steps": 312, "loss": 0.539, "lr": 4.710988998640298e-07, "epoch": 2.6208, "percentage": 87.5, "elapsed_time": "8:29:38", "remaining_time": "1:12:48"}
|
| 274 |
+
{"current_steps": 274, "total_steps": 312, "loss": 0.5431, "lr": 4.4761226670592074e-07, "epoch": 2.6304, "percentage": 87.82, "elapsed_time": "8:31:41", "remaining_time": "1:10:57"}
|
| 275 |
+
{"current_steps": 275, "total_steps": 312, "loss": 0.5157, "lr": 4.2469871766340096e-07, "epoch": 2.64, "percentage": 88.14, "elapsed_time": "8:33:28", "remaining_time": "1:09:05"}
|
| 276 |
+
{"current_steps": 276, "total_steps": 312, "loss": 0.5274, "lr": 4.0236113724274716e-07, "epoch": 2.6496, "percentage": 88.46, "elapsed_time": "8:35:10", "remaining_time": "1:07:11"}
|
| 277 |
+
{"current_steps": 277, "total_steps": 312, "loss": 0.5359, "lr": 3.8060233744356634e-07, "epoch": 2.6592000000000002, "percentage": 88.78, "elapsed_time": "8:37:07", "remaining_time": "1:05:20"}
|
| 278 |
+
{"current_steps": 278, "total_steps": 312, "loss": 0.4746, "lr": 3.5942505740480583e-07, "epoch": 2.6688, "percentage": 89.1, "elapsed_time": "8:38:43", "remaining_time": "1:03:26"}
|
| 279 |
+
{"current_steps": 279, "total_steps": 312, "loss": 0.5251, "lr": 3.3883196305992906e-07, "epoch": 2.6784, "percentage": 89.42, "elapsed_time": "8:40:34", "remaining_time": "1:01:34"}
|
| 280 |
+
{"current_steps": 280, "total_steps": 312, "loss": 0.5405, "lr": 3.18825646801314e-07, "epoch": 2.6879999999999997, "percentage": 89.74, "elapsed_time": "8:42:32", "remaining_time": "0:59:43"}
|
| 281 |
+
{"current_steps": 281, "total_steps": 312, "loss": 0.5057, "lr": 2.9940862715390483e-07, "epoch": 2.6976, "percentage": 90.06, "elapsed_time": "8:44:31", "remaining_time": "0:57:51"}
|
| 282 |
+
{"current_steps": 282, "total_steps": 312, "loss": 0.5334, "lr": 2.8058334845816214e-07, "epoch": 2.7072000000000003, "percentage": 90.38, "elapsed_time": "8:46:07", "remaining_time": "0:55:58"}
|
| 283 |
+
{"current_steps": 283, "total_steps": 312, "loss": 0.5456, "lr": 2.6235218056235633e-07, "epoch": 2.7168, "percentage": 90.71, "elapsed_time": "8:47:46", "remaining_time": "0:54:05"}
|
| 284 |
+
{"current_steps": 284, "total_steps": 312, "loss": 0.5134, "lr": 2.447174185242324e-07, "epoch": 2.7264, "percentage": 91.03, "elapsed_time": "8:49:35", "remaining_time": "0:52:12"}
|
| 285 |
+
{"current_steps": 285, "total_steps": 312, "loss": 0.4706, "lr": 2.276812823220964e-07, "epoch": 2.7359999999999998, "percentage": 91.35, "elapsed_time": "8:51:20", "remaining_time": "0:50:20"}
|
| 286 |
+
{"current_steps": 286, "total_steps": 312, "loss": 0.5894, "lr": 2.1124591657534776e-07, "epoch": 2.7456, "percentage": 91.67, "elapsed_time": "8:53:15", "remaining_time": "0:48:28"}
|
| 287 |
+
{"current_steps": 287, "total_steps": 312, "loss": 0.5377, "lr": 1.9541339027450256e-07, "epoch": 2.7552, "percentage": 91.99, "elapsed_time": "8:55:08", "remaining_time": "0:46:36"}
|
| 288 |
+
{"current_steps": 288, "total_steps": 312, "loss": 0.5063, "lr": 1.801856965207338e-07, "epoch": 2.7648, "percentage": 92.31, "elapsed_time": "8:56:57", "remaining_time": "0:44:44"}
|
| 289 |
+
{"current_steps": 289, "total_steps": 312, "loss": 0.5533, "lr": 1.6556475227496816e-07, "epoch": 2.7744, "percentage": 92.63, "elapsed_time": "8:58:48", "remaining_time": "0:42:52"}
|
| 290 |
+
{"current_steps": 290, "total_steps": 312, "loss": 0.4984, "lr": 1.5155239811656562e-07, "epoch": 2.784, "percentage": 92.95, "elapsed_time": "9:00:40", "remaining_time": "0:41:01"}
|
| 291 |
+
{"current_steps": 291, "total_steps": 312, "loss": 0.5247, "lr": 1.3815039801161723e-07, "epoch": 2.7936, "percentage": 93.27, "elapsed_time": "9:02:32", "remaining_time": "0:39:09"}
|
| 292 |
+
{"current_steps": 292, "total_steps": 312, "loss": 0.567, "lr": 1.253604390908819e-07, "epoch": 2.8032, "percentage": 93.59, "elapsed_time": "9:04:29", "remaining_time": "0:37:17"}
|
| 293 |
+
{"current_steps": 293, "total_steps": 312, "loss": 0.5089, "lr": 1.1318413143740436e-07, "epoch": 2.8128, "percentage": 93.91, "elapsed_time": "9:06:26", "remaining_time": "0:35:26"}
|
| 294 |
+
{"current_steps": 294, "total_steps": 312, "loss": 0.5772, "lr": 1.0162300788382263e-07, "epoch": 2.8224, "percentage": 94.23, "elapsed_time": "9:08:26", "remaining_time": "0:33:34"}
|
| 295 |
+
{"current_steps": 295, "total_steps": 312, "loss": 0.5099, "lr": 9.0678523819408e-08, "epoch": 2.832, "percentage": 94.55, "elapsed_time": "9:10:23", "remaining_time": "0:31:43"}
|
| 296 |
+
{"current_steps": 296, "total_steps": 312, "loss": 0.5103, "lr": 8.035205700685167e-08, "epoch": 2.8416, "percentage": 94.87, "elapsed_time": "9:12:08", "remaining_time": "0:29:50"}
|
| 297 |
+
{"current_steps": 297, "total_steps": 312, "loss": 0.506, "lr": 7.064490740882057e-08, "epoch": 2.8512, "percentage": 95.19, "elapsed_time": "9:13:56", "remaining_time": "0:27:58"}
|
| 298 |
+
{"current_steps": 298, "total_steps": 312, "loss": 0.5043, "lr": 6.15582970243117e-08, "epoch": 2.8608000000000002, "percentage": 95.51, "elapsed_time": "9:15:34", "remaining_time": "0:26:06"}
|
| 299 |
+
{"current_steps": 299, "total_steps": 312, "loss": 0.5602, "lr": 5.3093369734816824e-08, "epoch": 2.8704, "percentage": 95.83, "elapsed_time": "9:17:18", "remaining_time": "0:24:13"}
|
| 300 |
+
{"current_steps": 300, "total_steps": 312, "loss": 0.5101, "lr": 4.52511911603265e-08, "epoch": 2.88, "percentage": 96.15, "elapsed_time": "9:19:14", "remaining_time": "0:22:22"}
|
| 301 |
+
{"current_steps": 301, "total_steps": 312, "loss": 0.5045, "lr": 3.8032748525179684e-08, "epoch": 2.8895999999999997, "percentage": 96.47, "elapsed_time": "9:20:50", "remaining_time": "0:20:29"}
|
| 302 |
+
{"current_steps": 302, "total_steps": 312, "loss": 0.5484, "lr": 3.143895053378698e-08, "epoch": 2.8992, "percentage": 96.79, "elapsed_time": "9:22:39", "remaining_time": "0:18:37"}
|
| 303 |
+
{"current_steps": 303, "total_steps": 312, "loss": 0.5411, "lr": 2.547062725623828e-08, "epoch": 2.9088000000000003, "percentage": 97.12, "elapsed_time": "9:24:41", "remaining_time": "0:16:46"}
|
| 304 |
+
{"current_steps": 304, "total_steps": 312, "loss": 0.5469, "lr": 2.012853002380466e-08, "epoch": 2.9184, "percentage": 97.44, "elapsed_time": "9:26:30", "remaining_time": "0:14:54"}
|
| 305 |
+
{"current_steps": 305, "total_steps": 312, "loss": 0.506, "lr": 1.541333133436018e-08, "epoch": 2.928, "percentage": 97.76, "elapsed_time": "9:28:12", "remaining_time": "0:13:02"}
|
| 306 |
+
{"current_steps": 306, "total_steps": 312, "loss": 0.5208, "lr": 1.132562476771959e-08, "epoch": 2.9375999999999998, "percentage": 98.08, "elapsed_time": "9:30:00", "remaining_time": "0:11:10"}
|
| 307 |
+
{"current_steps": 307, "total_steps": 312, "loss": 0.5208, "lr": 7.865924910916977e-09, "epoch": 2.9472, "percentage": 98.4, "elapsed_time": "9:31:51", "remaining_time": "0:09:18"}
|
| 308 |
+
{"current_steps": 308, "total_steps": 312, "loss": 0.5355, "lr": 5.034667293427053e-09, "epoch": 2.9568, "percentage": 98.72, "elapsed_time": "9:33:35", "remaining_time": "0:07:26"}
|
| 309 |
+
{"current_steps": 309, "total_steps": 312, "loss": 0.5167, "lr": 2.8322083323334417e-09, "epoch": 2.9664, "percentage": 99.04, "elapsed_time": "9:35:27", "remaining_time": "0:05:35"}
|
| 310 |
+
{"current_steps": 310, "total_steps": 312, "loss": 0.5175, "lr": 1.2588252874673469e-09, "epoch": 2.976, "percentage": 99.36, "elapsed_time": "9:37:19", "remaining_time": "0:03:43"}
|
| 311 |
+
{"current_steps": 311, "total_steps": 312, "loss": 0.5088, "lr": 3.147162264971471e-10, "epoch": 2.9856, "percentage": 99.68, "elapsed_time": "9:39:15", "remaining_time": "0:01:51"}
|
| 312 |
+
{"current_steps": 312, "total_steps": 312, "loss": 0.5469, "lr": 0.0, "epoch": 2.9952, "percentage": 100.0, "elapsed_time": "9:41:09", "remaining_time": "0:00:00"}
|
| 313 |
+
{"current_steps": 312, "total_steps": 312, "epoch": 2.9952, "percentage": 100.0, "elapsed_time": "9:43:14", "remaining_time": "0:00:00"}
|