Training in progress, epoch 2
Browse files
model-00001-of-00004.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 4877660776
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:bad07eb2ebee4c1a4357081b11e97d6070ccb120054ccbdb9457a4b1f43623c9
|
| 3 |
size 4877660776
|
model-00002-of-00004.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 4932751008
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:2a980e6d8fd700d58d36f03ec901bec58551b5123ba5a22b3acbe918413aac6e
|
| 3 |
size 4932751008
|
model-00003-of-00004.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 4330865200
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:dda8f552337d891f3cf8797f16ccf3ccc7a8ffdf7e35a64c8b4563811173aeec
|
| 3 |
size 4330865200
|
model-00004-of-00004.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 1089994880
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:f478646a66adb045b4f7dd1826d2e10ccfa3b585f62c2dd5fd5860e5f18e7513
|
| 3 |
size 1089994880
|
trainer_log.jsonl
CHANGED
|
@@ -250,3 +250,253 @@
|
|
| 250 |
{"current_steps": 250, "total_steps": 750, "loss": 0.87, "lr": 8.43120818934367e-06, "epoch": 1.0, "percentage": 33.33, "elapsed_time": "3:53:09", "remaining_time": "7:46:19"}
|
| 251 |
{"current_steps": 251, "total_steps": 750, "loss": 0.7984, "lr": 8.414244334398418e-06, "epoch": 1.004, "percentage": 33.47, "elapsed_time": "3:55:01", "remaining_time": "7:47:15"}
|
| 252 |
{"current_steps": 252, "total_steps": 750, "loss": 0.8299, "lr": 8.397206521307584e-06, "epoch": 1.008, "percentage": 33.6, "elapsed_time": "3:55:59", "remaining_time": "7:46:21"}
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 250 |
{"current_steps": 250, "total_steps": 750, "loss": 0.87, "lr": 8.43120818934367e-06, "epoch": 1.0, "percentage": 33.33, "elapsed_time": "3:53:09", "remaining_time": "7:46:19"}
|
| 251 |
{"current_steps": 251, "total_steps": 750, "loss": 0.7984, "lr": 8.414244334398418e-06, "epoch": 1.004, "percentage": 33.47, "elapsed_time": "3:55:01", "remaining_time": "7:47:15"}
|
| 252 |
{"current_steps": 252, "total_steps": 750, "loss": 0.8299, "lr": 8.397206521307584e-06, "epoch": 1.008, "percentage": 33.6, "elapsed_time": "3:55:59", "remaining_time": "7:46:21"}
|
| 253 |
+
{"current_steps": 253, "total_steps": 750, "loss": 0.8501, "lr": 8.380095119138209e-06, "epoch": 1.012, "percentage": 33.73, "elapsed_time": "3:56:55", "remaining_time": "7:45:25"}
|
| 254 |
+
{"current_steps": 254, "total_steps": 750, "loss": 0.8452, "lr": 8.362910498551402e-06, "epoch": 1.016, "percentage": 33.87, "elapsed_time": "3:57:49", "remaining_time": "7:44:24"}
|
| 255 |
+
{"current_steps": 255, "total_steps": 750, "loss": 0.8553, "lr": 8.345653031794292e-06, "epoch": 1.02, "percentage": 34.0, "elapsed_time": "3:58:43", "remaining_time": "7:43:24"}
|
| 256 |
+
{"current_steps": 256, "total_steps": 750, "loss": 0.7941, "lr": 8.328323092691985e-06, "epoch": 1.024, "percentage": 34.13, "elapsed_time": "3:59:35", "remaining_time": "7:42:20"}
|
| 257 |
+
{"current_steps": 257, "total_steps": 750, "loss": 0.8211, "lr": 8.310921056639451e-06, "epoch": 1.028, "percentage": 34.27, "elapsed_time": "4:00:31", "remaining_time": "7:41:24"}
|
| 258 |
+
{"current_steps": 258, "total_steps": 750, "loss": 0.8224, "lr": 8.293447300593402e-06, "epoch": 1.032, "percentage": 34.4, "elapsed_time": "4:01:26", "remaining_time": "7:40:25"}
|
| 259 |
+
{"current_steps": 259, "total_steps": 750, "loss": 0.8435, "lr": 8.275902203064125e-06, "epoch": 1.036, "percentage": 34.53, "elapsed_time": "4:02:24", "remaining_time": "7:39:33"}
|
| 260 |
+
{"current_steps": 260, "total_steps": 750, "loss": 0.8238, "lr": 8.258286144107277e-06, "epoch": 1.04, "percentage": 34.67, "elapsed_time": "4:03:20", "remaining_time": "7:38:37"}
|
| 261 |
+
{"current_steps": 261, "total_steps": 750, "loss": 0.8142, "lr": 8.240599505315656e-06, "epoch": 1.044, "percentage": 34.8, "elapsed_time": "4:04:11", "remaining_time": "7:37:29"}
|
| 262 |
+
{"current_steps": 262, "total_steps": 750, "loss": 0.8364, "lr": 8.222842669810936e-06, "epoch": 1.048, "percentage": 34.93, "elapsed_time": "4:05:09", "remaining_time": "7:36:38"}
|
| 263 |
+
{"current_steps": 263, "total_steps": 750, "loss": 0.8271, "lr": 8.205016022235368e-06, "epoch": 1.052, "percentage": 35.07, "elapsed_time": "4:06:00", "remaining_time": "7:35:32"}
|
| 264 |
+
{"current_steps": 264, "total_steps": 750, "loss": 0.8077, "lr": 8.18711994874345e-06, "epoch": 1.056, "percentage": 35.2, "elapsed_time": "4:06:57", "remaining_time": "7:34:37"}
|
| 265 |
+
{"current_steps": 265, "total_steps": 750, "loss": 0.7997, "lr": 8.16915483699355e-06, "epoch": 1.06, "percentage": 35.33, "elapsed_time": "4:07:47", "remaining_time": "7:33:30"}
|
| 266 |
+
{"current_steps": 266, "total_steps": 750, "loss": 0.8704, "lr": 8.151121076139534e-06, "epoch": 1.064, "percentage": 35.47, "elapsed_time": "4:08:47", "remaining_time": "7:32:40"}
|
| 267 |
+
{"current_steps": 267, "total_steps": 750, "loss": 0.8778, "lr": 8.133019056822303e-06, "epoch": 1.068, "percentage": 35.6, "elapsed_time": "4:09:57", "remaining_time": "7:32:09"}
|
| 268 |
+
{"current_steps": 268, "total_steps": 750, "loss": 0.8283, "lr": 8.11484917116136e-06, "epoch": 1.072, "percentage": 35.73, "elapsed_time": "4:11:06", "remaining_time": "7:31:37"}
|
| 269 |
+
{"current_steps": 269, "total_steps": 750, "loss": 0.8078, "lr": 8.096611812746302e-06, "epoch": 1.076, "percentage": 35.87, "elapsed_time": "4:12:08", "remaining_time": "7:30:51"}
|
| 270 |
+
{"current_steps": 270, "total_steps": 750, "loss": 0.8318, "lr": 8.078307376628292e-06, "epoch": 1.08, "percentage": 36.0, "elapsed_time": "4:12:59", "remaining_time": "7:29:46"}
|
| 271 |
+
{"current_steps": 271, "total_steps": 750, "loss": 0.7898, "lr": 8.059936259311514e-06, "epoch": 1.084, "percentage": 36.13, "elapsed_time": "4:13:50", "remaining_time": "7:28:40"}
|
| 272 |
+
{"current_steps": 272, "total_steps": 750, "loss": 0.8512, "lr": 8.041498858744572e-06, "epoch": 1.088, "percentage": 36.27, "elapsed_time": "4:14:52", "remaining_time": "7:27:54"}
|
| 273 |
+
{"current_steps": 273, "total_steps": 750, "loss": 0.8189, "lr": 8.022995574311876e-06, "epoch": 1.092, "percentage": 36.4, "elapsed_time": "4:15:51", "remaining_time": "7:27:02"}
|
| 274 |
+
{"current_steps": 274, "total_steps": 750, "loss": 0.7754, "lr": 8.004426806824985e-06, "epoch": 1.096, "percentage": 36.53, "elapsed_time": "4:16:35", "remaining_time": "7:25:44"}
|
| 275 |
+
{"current_steps": 275, "total_steps": 750, "loss": 0.7863, "lr": 7.985792958513932e-06, "epoch": 1.1, "percentage": 36.67, "elapsed_time": "4:17:15", "remaining_time": "7:24:21"}
|
| 276 |
+
{"current_steps": 276, "total_steps": 750, "loss": 0.8159, "lr": 7.967094433018508e-06, "epoch": 1.104, "percentage": 36.8, "elapsed_time": "4:18:14", "remaining_time": "7:23:30"}
|
| 277 |
+
{"current_steps": 277, "total_steps": 750, "loss": 0.8046, "lr": 7.948331635379517e-06, "epoch": 1.108, "percentage": 36.93, "elapsed_time": "4:19:13", "remaining_time": "7:22:38"}
|
| 278 |
+
{"current_steps": 278, "total_steps": 750, "loss": 0.8191, "lr": 7.929504972030003e-06, "epoch": 1.112, "percentage": 37.07, "elapsed_time": "4:19:54", "remaining_time": "7:21:17"}
|
| 279 |
+
{"current_steps": 279, "total_steps": 750, "loss": 0.8353, "lr": 7.910614850786448e-06, "epoch": 1.116, "percentage": 37.2, "elapsed_time": "4:20:52", "remaining_time": "7:20:24"}
|
| 280 |
+
{"current_steps": 280, "total_steps": 750, "loss": 0.8404, "lr": 7.891661680839932e-06, "epoch": 1.12, "percentage": 37.33, "elapsed_time": "4:21:52", "remaining_time": "7:19:34"}
|
| 281 |
+
{"current_steps": 281, "total_steps": 750, "loss": 0.8151, "lr": 7.872645872747281e-06, "epoch": 1.124, "percentage": 37.47, "elapsed_time": "4:22:46", "remaining_time": "7:18:34"}
|
| 282 |
+
{"current_steps": 282, "total_steps": 750, "loss": 0.8314, "lr": 7.85356783842216e-06, "epoch": 1.1280000000000001, "percentage": 37.6, "elapsed_time": "4:23:34", "remaining_time": "7:17:25"}
|
| 283 |
+
{"current_steps": 283, "total_steps": 750, "loss": 0.7978, "lr": 7.834427991126155e-06, "epoch": 1.1320000000000001, "percentage": 37.73, "elapsed_time": "4:24:25", "remaining_time": "7:16:20"}
|
| 284 |
+
{"current_steps": 284, "total_steps": 750, "loss": 0.8245, "lr": 7.815226745459831e-06, "epoch": 1.1360000000000001, "percentage": 37.87, "elapsed_time": "4:25:28", "remaining_time": "7:15:35"}
|
| 285 |
+
{"current_steps": 285, "total_steps": 750, "loss": 0.8185, "lr": 7.795964517353734e-06, "epoch": 1.1400000000000001, "percentage": 38.0, "elapsed_time": "4:26:22", "remaining_time": "7:14:37"}
|
| 286 |
+
{"current_steps": 286, "total_steps": 750, "loss": 0.8114, "lr": 7.776641724059398e-06, "epoch": 1.144, "percentage": 38.13, "elapsed_time": "4:27:21", "remaining_time": "7:13:44"}
|
| 287 |
+
{"current_steps": 287, "total_steps": 750, "loss": 0.8145, "lr": 7.757258784140286e-06, "epoch": 1.148, "percentage": 38.27, "elapsed_time": "4:28:06", "remaining_time": "7:12:30"}
|
| 288 |
+
{"current_steps": 288, "total_steps": 750, "loss": 0.8004, "lr": 7.737816117462752e-06, "epoch": 1.152, "percentage": 38.4, "elapsed_time": "4:29:07", "remaining_time": "7:11:43"}
|
| 289 |
+
{"current_steps": 289, "total_steps": 750, "loss": 0.8432, "lr": 7.718314145186918e-06, "epoch": 1.156, "percentage": 38.53, "elapsed_time": "4:30:02", "remaining_time": "7:10:46"}
|
| 290 |
+
{"current_steps": 290, "total_steps": 750, "loss": 0.8205, "lr": 7.698753289757565e-06, "epoch": 1.16, "percentage": 38.67, "elapsed_time": "4:31:06", "remaining_time": "7:10:01"}
|
| 291 |
+
{"current_steps": 291, "total_steps": 750, "loss": 0.82, "lr": 7.679133974894984e-06, "epoch": 1.164, "percentage": 38.8, "elapsed_time": "4:31:58", "remaining_time": "7:08:59"}
|
| 292 |
+
{"current_steps": 292, "total_steps": 750, "loss": 0.8316, "lr": 7.65945662558579e-06, "epoch": 1.168, "percentage": 38.93, "elapsed_time": "4:32:48", "remaining_time": "7:07:54"}
|
| 293 |
+
{"current_steps": 293, "total_steps": 750, "loss": 0.8174, "lr": 7.639721668073718e-06, "epoch": 1.172, "percentage": 39.07, "elapsed_time": "4:33:46", "remaining_time": "7:07:00"}
|
| 294 |
+
{"current_steps": 294, "total_steps": 750, "loss": 0.813, "lr": 7.619929529850397e-06, "epoch": 1.176, "percentage": 39.2, "elapsed_time": "4:34:33", "remaining_time": "7:05:50"}
|
| 295 |
+
{"current_steps": 295, "total_steps": 750, "loss": 0.8239, "lr": 7.600080639646077e-06, "epoch": 1.18, "percentage": 39.33, "elapsed_time": "4:35:27", "remaining_time": "7:04:51"}
|
| 296 |
+
{"current_steps": 296, "total_steps": 750, "loss": 0.8434, "lr": 7.580175427420358e-06, "epoch": 1.184, "percentage": 39.47, "elapsed_time": "4:36:27", "remaining_time": "7:04:01"}
|
| 297 |
+
{"current_steps": 297, "total_steps": 750, "loss": 0.8076, "lr": 7.560214324352858e-06, "epoch": 1.188, "percentage": 39.6, "elapsed_time": "4:37:30", "remaining_time": "7:03:15"}
|
| 298 |
+
{"current_steps": 298, "total_steps": 750, "loss": 0.8301, "lr": 7.54019776283389e-06, "epoch": 1.192, "percentage": 39.73, "elapsed_time": "4:38:21", "remaining_time": "7:02:11"}
|
| 299 |
+
{"current_steps": 299, "total_steps": 750, "loss": 0.8249, "lr": 7.520126176455084e-06, "epoch": 1.196, "percentage": 39.87, "elapsed_time": "4:39:15", "remaining_time": "7:01:13"}
|
| 300 |
+
{"current_steps": 300, "total_steps": 750, "loss": 0.7956, "lr": 7.500000000000001e-06, "epoch": 1.2, "percentage": 40.0, "elapsed_time": "4:40:06", "remaining_time": "7:00:10"}
|
| 301 |
+
{"current_steps": 301, "total_steps": 750, "loss": 0.8577, "lr": 7.479819669434712e-06, "epoch": 1.204, "percentage": 40.13, "elapsed_time": "4:40:51", "remaining_time": "6:58:57"}
|
| 302 |
+
{"current_steps": 302, "total_steps": 750, "loss": 0.8661, "lr": 7.459585621898353e-06, "epoch": 1.208, "percentage": 40.27, "elapsed_time": "4:41:53", "remaining_time": "6:58:10"}
|
| 303 |
+
{"current_steps": 303, "total_steps": 750, "loss": 0.8543, "lr": 7.4392982956936644e-06, "epoch": 1.212, "percentage": 40.4, "elapsed_time": "4:42:46", "remaining_time": "6:57:09"}
|
| 304 |
+
{"current_steps": 304, "total_steps": 750, "loss": 0.8148, "lr": 7.418958130277483e-06, "epoch": 1.216, "percentage": 40.53, "elapsed_time": "4:43:42", "remaining_time": "6:56:14"}
|
| 305 |
+
{"current_steps": 305, "total_steps": 750, "loss": 0.8162, "lr": 7.398565566251232e-06, "epoch": 1.22, "percentage": 40.67, "elapsed_time": "4:44:38", "remaining_time": "6:55:18"}
|
| 306 |
+
{"current_steps": 306, "total_steps": 750, "loss": 0.8242, "lr": 7.378121045351378e-06, "epoch": 1.224, "percentage": 40.8, "elapsed_time": "4:45:34", "remaining_time": "6:54:22"}
|
| 307 |
+
{"current_steps": 307, "total_steps": 750, "loss": 0.8429, "lr": 7.357625010439853e-06, "epoch": 1.228, "percentage": 40.93, "elapsed_time": "4:46:42", "remaining_time": "6:53:43"}
|
| 308 |
+
{"current_steps": 308, "total_steps": 750, "loss": 0.8413, "lr": 7.337077905494472e-06, "epoch": 1.232, "percentage": 41.07, "elapsed_time": "4:47:44", "remaining_time": "6:52:55"}
|
| 309 |
+
{"current_steps": 309, "total_steps": 750, "loss": 0.8431, "lr": 7.31648017559931e-06, "epoch": 1.236, "percentage": 41.2, "elapsed_time": "4:48:39", "remaining_time": "6:51:58"}
|
| 310 |
+
{"current_steps": 310, "total_steps": 750, "loss": 0.8634, "lr": 7.295832266935059e-06, "epoch": 1.24, "percentage": 41.33, "elapsed_time": "4:49:41", "remaining_time": "6:51:10"}
|
| 311 |
+
{"current_steps": 311, "total_steps": 750, "loss": 0.8387, "lr": 7.275134626769369e-06, "epoch": 1.244, "percentage": 41.47, "elapsed_time": "4:50:32", "remaining_time": "6:50:07"}
|
| 312 |
+
{"current_steps": 312, "total_steps": 750, "loss": 0.8087, "lr": 7.254387703447154e-06, "epoch": 1.248, "percentage": 41.6, "elapsed_time": "4:51:36", "remaining_time": "6:49:22"}
|
| 313 |
+
{"current_steps": 313, "total_steps": 750, "loss": 0.8138, "lr": 7.233591946380884e-06, "epoch": 1.252, "percentage": 41.73, "elapsed_time": "4:52:19", "remaining_time": "6:48:07"}
|
| 314 |
+
{"current_steps": 314, "total_steps": 750, "loss": 0.8258, "lr": 7.212747806040845e-06, "epoch": 1.256, "percentage": 41.87, "elapsed_time": "4:53:13", "remaining_time": "6:47:09"}
|
| 315 |
+
{"current_steps": 315, "total_steps": 750, "loss": 0.8444, "lr": 7.191855733945388e-06, "epoch": 1.26, "percentage": 42.0, "elapsed_time": "4:54:21", "remaining_time": "6:46:29"}
|
| 316 |
+
{"current_steps": 316, "total_steps": 750, "loss": 0.8155, "lr": 7.170916182651141e-06, "epoch": 1.264, "percentage": 42.13, "elapsed_time": "4:55:16", "remaining_time": "6:45:32"}
|
| 317 |
+
{"current_steps": 317, "total_steps": 750, "loss": 0.7777, "lr": 7.149929605743214e-06, "epoch": 1.268, "percentage": 42.27, "elapsed_time": "4:56:08", "remaining_time": "6:44:29"}
|
| 318 |
+
{"current_steps": 318, "total_steps": 750, "loss": 0.7944, "lr": 7.128896457825364e-06, "epoch": 1.272, "percentage": 42.4, "elapsed_time": "4:56:47", "remaining_time": "6:43:11"}
|
| 319 |
+
{"current_steps": 319, "total_steps": 750, "loss": 0.8503, "lr": 7.107817194510157e-06, "epoch": 1.276, "percentage": 42.53, "elapsed_time": "4:57:45", "remaining_time": "6:42:17"}
|
| 320 |
+
{"current_steps": 320, "total_steps": 750, "loss": 0.8266, "lr": 7.08669227240909e-06, "epoch": 1.28, "percentage": 42.67, "elapsed_time": "4:58:39", "remaining_time": "6:41:19"}
|
| 321 |
+
{"current_steps": 321, "total_steps": 750, "loss": 0.8107, "lr": 7.06552214912271e-06, "epoch": 1.284, "percentage": 42.8, "elapsed_time": "4:59:32", "remaining_time": "6:40:19"}
|
| 322 |
+
{"current_steps": 322, "total_steps": 750, "loss": 0.7889, "lr": 7.04430728323069e-06, "epoch": 1.288, "percentage": 42.93, "elapsed_time": "5:00:23", "remaining_time": "6:39:17"}
|
| 323 |
+
{"current_steps": 323, "total_steps": 750, "loss": 0.814, "lr": 7.023048134281907e-06, "epoch": 1.292, "percentage": 43.07, "elapsed_time": "5:01:21", "remaining_time": "6:38:23"}
|
| 324 |
+
{"current_steps": 324, "total_steps": 750, "loss": 0.8144, "lr": 7.0017451627844765e-06, "epoch": 1.296, "percentage": 43.2, "elapsed_time": "5:02:08", "remaining_time": "6:37:15"}
|
| 325 |
+
{"current_steps": 325, "total_steps": 750, "loss": 0.816, "lr": 6.980398830195785e-06, "epoch": 1.3, "percentage": 43.33, "elapsed_time": "5:03:09", "remaining_time": "6:36:26"}
|
| 326 |
+
{"current_steps": 326, "total_steps": 750, "loss": 0.8439, "lr": 6.959009598912493e-06, "epoch": 1.304, "percentage": 43.47, "elapsed_time": "5:04:04", "remaining_time": "6:35:28"}
|
| 327 |
+
{"current_steps": 327, "total_steps": 750, "loss": 0.8244, "lr": 6.9375779322605154e-06, "epoch": 1.308, "percentage": 43.6, "elapsed_time": "5:04:58", "remaining_time": "6:34:30"}
|
| 328 |
+
{"current_steps": 328, "total_steps": 750, "loss": 0.851, "lr": 6.916104294484988e-06, "epoch": 1.312, "percentage": 43.73, "elapsed_time": "5:05:59", "remaining_time": "6:33:41"}
|
| 329 |
+
{"current_steps": 329, "total_steps": 750, "loss": 0.7992, "lr": 6.8945891507402075e-06, "epoch": 1.316, "percentage": 43.87, "elapsed_time": "5:06:48", "remaining_time": "6:32:36"}
|
| 330 |
+
{"current_steps": 330, "total_steps": 750, "loss": 0.8443, "lr": 6.873032967079562e-06, "epoch": 1.32, "percentage": 44.0, "elapsed_time": "5:07:44", "remaining_time": "6:31:40"}
|
| 331 |
+
{"current_steps": 331, "total_steps": 750, "loss": 0.8277, "lr": 6.851436210445427e-06, "epoch": 1.324, "percentage": 44.13, "elapsed_time": "5:08:41", "remaining_time": "6:30:45"}
|
| 332 |
+
{"current_steps": 332, "total_steps": 750, "loss": 0.8135, "lr": 6.829799348659061e-06, "epoch": 1.328, "percentage": 44.27, "elapsed_time": "5:09:38", "remaining_time": "6:29:51"}
|
| 333 |
+
{"current_steps": 333, "total_steps": 750, "loss": 0.8288, "lr": 6.808122850410461e-06, "epoch": 1.332, "percentage": 44.4, "elapsed_time": "5:10:32", "remaining_time": "6:28:52"}
|
| 334 |
+
{"current_steps": 334, "total_steps": 750, "loss": 0.8283, "lr": 6.7864071852482205e-06, "epoch": 1.336, "percentage": 44.53, "elapsed_time": "5:11:34", "remaining_time": "6:28:03"}
|
| 335 |
+
{"current_steps": 335, "total_steps": 750, "loss": 0.8464, "lr": 6.7646528235693445e-06, "epoch": 1.34, "percentage": 44.67, "elapsed_time": "5:12:37", "remaining_time": "6:27:16"}
|
| 336 |
+
{"current_steps": 336, "total_steps": 750, "loss": 0.8347, "lr": 6.7428602366090764e-06, "epoch": 1.3439999999999999, "percentage": 44.8, "elapsed_time": "5:13:36", "remaining_time": "6:26:24"}
|
| 337 |
+
{"current_steps": 337, "total_steps": 750, "loss": 0.8384, "lr": 6.721029896430678e-06, "epoch": 1.3479999999999999, "percentage": 44.93, "elapsed_time": "5:14:35", "remaining_time": "6:25:32"}
|
| 338 |
+
{"current_steps": 338, "total_steps": 750, "loss": 0.8151, "lr": 6.699162275915208e-06, "epoch": 1.3519999999999999, "percentage": 45.07, "elapsed_time": "5:15:33", "remaining_time": "6:24:38"}
|
| 339 |
+
{"current_steps": 339, "total_steps": 750, "loss": 0.832, "lr": 6.677257848751276e-06, "epoch": 1.3559999999999999, "percentage": 45.2, "elapsed_time": "5:16:36", "remaining_time": "6:23:51"}
|
| 340 |
+
{"current_steps": 340, "total_steps": 750, "loss": 0.7989, "lr": 6.655317089424791e-06, "epoch": 1.3599999999999999, "percentage": 45.33, "elapsed_time": "5:17:29", "remaining_time": "6:22:51"}
|
| 341 |
+
{"current_steps": 341, "total_steps": 750, "loss": 0.8106, "lr": 6.633340473208673e-06, "epoch": 1.3639999999999999, "percentage": 45.47, "elapsed_time": "5:18:27", "remaining_time": "6:21:57"}
|
| 342 |
+
{"current_steps": 342, "total_steps": 750, "loss": 0.8197, "lr": 6.611328476152557e-06, "epoch": 1.3679999999999999, "percentage": 45.6, "elapsed_time": "5:19:25", "remaining_time": "6:21:03"}
|
| 343 |
+
{"current_steps": 343, "total_steps": 750, "loss": 0.836, "lr": 6.58928157507249e-06, "epoch": 1.3719999999999999, "percentage": 45.73, "elapsed_time": "5:20:17", "remaining_time": "6:20:02"}
|
| 344 |
+
{"current_steps": 344, "total_steps": 750, "loss": 0.8207, "lr": 6.567200247540599e-06, "epoch": 1.376, "percentage": 45.87, "elapsed_time": "5:21:17", "remaining_time": "6:19:12"}
|
| 345 |
+
{"current_steps": 345, "total_steps": 750, "loss": 0.8452, "lr": 6.545084971874738e-06, "epoch": 1.38, "percentage": 46.0, "elapsed_time": "5:22:20", "remaining_time": "6:18:23"}
|
| 346 |
+
{"current_steps": 346, "total_steps": 750, "loss": 0.7999, "lr": 6.522936227128139e-06, "epoch": 1.384, "percentage": 46.13, "elapsed_time": "5:23:20", "remaining_time": "6:17:32"}
|
| 347 |
+
{"current_steps": 347, "total_steps": 750, "loss": 0.8387, "lr": 6.500754493079029e-06, "epoch": 1.388, "percentage": 46.27, "elapsed_time": "5:24:23", "remaining_time": "6:16:44"}
|
| 348 |
+
{"current_steps": 348, "total_steps": 750, "loss": 0.8127, "lr": 6.4785402502202345e-06, "epoch": 1.392, "percentage": 46.4, "elapsed_time": "5:25:17", "remaining_time": "6:15:46"}
|
| 349 |
+
{"current_steps": 349, "total_steps": 750, "loss": 0.8312, "lr": 6.456293979748778e-06, "epoch": 1.396, "percentage": 46.53, "elapsed_time": "5:26:08", "remaining_time": "6:14:44"}
|
| 350 |
+
{"current_steps": 350, "total_steps": 750, "loss": 0.818, "lr": 6.434016163555452e-06, "epoch": 1.4, "percentage": 46.67, "elapsed_time": "5:27:03", "remaining_time": "6:13:46"}
|
| 351 |
+
{"current_steps": 351, "total_steps": 750, "loss": 0.8109, "lr": 6.411707284214384e-06, "epoch": 1.404, "percentage": 46.8, "elapsed_time": "5:27:59", "remaining_time": "6:12:50"}
|
| 352 |
+
{"current_steps": 352, "total_steps": 750, "loss": 0.8329, "lr": 6.389367824972575e-06, "epoch": 1.408, "percentage": 46.93, "elapsed_time": "5:28:57", "remaining_time": "6:11:56"}
|
| 353 |
+
{"current_steps": 353, "total_steps": 750, "loss": 0.8209, "lr": 6.366998269739442e-06, "epoch": 1.412, "percentage": 47.07, "elapsed_time": "5:29:53", "remaining_time": "6:11:00"}
|
| 354 |
+
{"current_steps": 354, "total_steps": 750, "loss": 0.8423, "lr": 6.344599103076329e-06, "epoch": 1.416, "percentage": 47.2, "elapsed_time": "5:30:49", "remaining_time": "6:10:04"}
|
| 355 |
+
{"current_steps": 355, "total_steps": 750, "loss": 0.8315, "lr": 6.322170810186013e-06, "epoch": 1.42, "percentage": 47.33, "elapsed_time": "5:31:54", "remaining_time": "6:09:18"}
|
| 356 |
+
{"current_steps": 356, "total_steps": 750, "loss": 0.8397, "lr": 6.299713876902188e-06, "epoch": 1.424, "percentage": 47.47, "elapsed_time": "5:32:46", "remaining_time": "6:08:17"}
|
| 357 |
+
{"current_steps": 357, "total_steps": 750, "loss": 0.8165, "lr": 6.277228789678953e-06, "epoch": 1.428, "percentage": 47.6, "elapsed_time": "5:33:46", "remaining_time": "6:07:25"}
|
| 358 |
+
{"current_steps": 358, "total_steps": 750, "loss": 0.8237, "lr": 6.254716035580264e-06, "epoch": 1.432, "percentage": 47.73, "elapsed_time": "5:34:41", "remaining_time": "6:06:28"}
|
| 359 |
+
{"current_steps": 359, "total_steps": 750, "loss": 0.8345, "lr": 6.23217610226939e-06, "epoch": 1.436, "percentage": 47.87, "elapsed_time": "5:35:28", "remaining_time": "6:05:22"}
|
| 360 |
+
{"current_steps": 360, "total_steps": 750, "loss": 0.7928, "lr": 6.209609477998339e-06, "epoch": 1.44, "percentage": 48.0, "elapsed_time": "5:36:19", "remaining_time": "6:04:21"}
|
| 361 |
+
{"current_steps": 361, "total_steps": 750, "loss": 0.8073, "lr": 6.187016651597299e-06, "epoch": 1.444, "percentage": 48.13, "elapsed_time": "5:37:09", "remaining_time": "6:03:18"}
|
| 362 |
+
{"current_steps": 362, "total_steps": 750, "loss": 0.8672, "lr": 6.16439811246403e-06, "epoch": 1.448, "percentage": 48.27, "elapsed_time": "5:38:11", "remaining_time": "6:02:28"}
|
| 363 |
+
{"current_steps": 363, "total_steps": 750, "loss": 0.8226, "lr": 6.141754350553279e-06, "epoch": 1.452, "percentage": 48.4, "elapsed_time": "5:39:02", "remaining_time": "6:01:27"}
|
| 364 |
+
{"current_steps": 364, "total_steps": 750, "loss": 0.7964, "lr": 6.119085856366158e-06, "epoch": 1.456, "percentage": 48.53, "elapsed_time": "5:39:52", "remaining_time": "6:00:24"}
|
| 365 |
+
{"current_steps": 365, "total_steps": 750, "loss": 0.7774, "lr": 6.0963931209395165e-06, "epoch": 1.46, "percentage": 48.67, "elapsed_time": "5:40:50", "remaining_time": "5:59:30"}
|
| 366 |
+
{"current_steps": 366, "total_steps": 750, "loss": 0.8087, "lr": 6.073676635835317e-06, "epoch": 1.464, "percentage": 48.8, "elapsed_time": "5:41:41", "remaining_time": "5:58:29"}
|
| 367 |
+
{"current_steps": 367, "total_steps": 750, "loss": 0.8159, "lr": 6.05093689312997e-06, "epoch": 1.468, "percentage": 48.93, "elapsed_time": "5:42:37", "remaining_time": "5:57:33"}
|
| 368 |
+
{"current_steps": 368, "total_steps": 750, "loss": 0.8259, "lr": 6.028174385403693e-06, "epoch": 1.472, "percentage": 49.07, "elapsed_time": "5:43:34", "remaining_time": "5:56:39"}
|
| 369 |
+
{"current_steps": 369, "total_steps": 750, "loss": 0.8156, "lr": 6.005389605729824e-06, "epoch": 1.476, "percentage": 49.2, "elapsed_time": "5:44:25", "remaining_time": "5:55:37"}
|
| 370 |
+
{"current_steps": 370, "total_steps": 750, "loss": 0.8131, "lr": 5.982583047664151e-06, "epoch": 1.48, "percentage": 49.33, "elapsed_time": "5:45:11", "remaining_time": "5:54:31"}
|
| 371 |
+
{"current_steps": 371, "total_steps": 750, "loss": 0.8305, "lr": 5.9597552052342174e-06, "epoch": 1.484, "percentage": 49.47, "elapsed_time": "5:46:04", "remaining_time": "5:53:32"}
|
| 372 |
+
{"current_steps": 372, "total_steps": 750, "loss": 0.8154, "lr": 5.936906572928625e-06, "epoch": 1.488, "percentage": 49.6, "elapsed_time": "5:47:01", "remaining_time": "5:52:37"}
|
| 373 |
+
{"current_steps": 373, "total_steps": 750, "loss": 0.8203, "lr": 5.914037645686308e-06, "epoch": 1.492, "percentage": 49.73, "elapsed_time": "5:47:57", "remaining_time": "5:51:41"}
|
| 374 |
+
{"current_steps": 374, "total_steps": 750, "loss": 0.8417, "lr": 5.891148918885834e-06, "epoch": 1.496, "percentage": 49.87, "elapsed_time": "5:48:53", "remaining_time": "5:50:45"}
|
| 375 |
+
{"current_steps": 375, "total_steps": 750, "loss": 0.8497, "lr": 5.8682408883346535e-06, "epoch": 1.5, "percentage": 50.0, "elapsed_time": "5:49:55", "remaining_time": "5:49:55"}
|
| 376 |
+
{"current_steps": 376, "total_steps": 750, "loss": 0.7931, "lr": 5.84531405025837e-06, "epoch": 1.504, "percentage": 50.13, "elapsed_time": "5:50:44", "remaining_time": "5:48:52"}
|
| 377 |
+
{"current_steps": 377, "total_steps": 750, "loss": 0.7777, "lr": 5.8223689012899945e-06, "epoch": 1.508, "percentage": 50.27, "elapsed_time": "5:51:42", "remaining_time": "5:47:58"}
|
| 378 |
+
{"current_steps": 378, "total_steps": 750, "loss": 0.8256, "lr": 5.799405938459175e-06, "epoch": 1.512, "percentage": 50.4, "elapsed_time": "5:52:36", "remaining_time": "5:47:00"}
|
| 379 |
+
{"current_steps": 379, "total_steps": 750, "loss": 0.8315, "lr": 5.776425659181438e-06, "epoch": 1.516, "percentage": 50.53, "elapsed_time": "5:53:31", "remaining_time": "5:46:03"}
|
| 380 |
+
{"current_steps": 380, "total_steps": 750, "loss": 0.8276, "lr": 5.753428561247416e-06, "epoch": 1.52, "percentage": 50.67, "elapsed_time": "5:54:29", "remaining_time": "5:45:09"}
|
| 381 |
+
{"current_steps": 381, "total_steps": 750, "loss": 0.8376, "lr": 5.730415142812059e-06, "epoch": 1.524, "percentage": 50.8, "elapsed_time": "5:55:23", "remaining_time": "5:44:12"}
|
| 382 |
+
{"current_steps": 382, "total_steps": 750, "loss": 0.8344, "lr": 5.707385902383845e-06, "epoch": 1.528, "percentage": 50.93, "elapsed_time": "5:56:19", "remaining_time": "5:43:15"}
|
| 383 |
+
{"current_steps": 383, "total_steps": 750, "loss": 0.8016, "lr": 5.684341338813986e-06, "epoch": 1.532, "percentage": 51.07, "elapsed_time": "5:57:15", "remaining_time": "5:42:19"}
|
| 384 |
+
{"current_steps": 384, "total_steps": 750, "loss": 0.8216, "lr": 5.661281951285613e-06, "epoch": 1.536, "percentage": 51.2, "elapsed_time": "5:58:05", "remaining_time": "5:41:18"}
|
| 385 |
+
{"current_steps": 385, "total_steps": 750, "loss": 0.8302, "lr": 5.638208239302975e-06, "epoch": 1.54, "percentage": 51.33, "elapsed_time": "5:59:02", "remaining_time": "5:40:23"}
|
| 386 |
+
{"current_steps": 386, "total_steps": 750, "loss": 0.8124, "lr": 5.615120702680604e-06, "epoch": 1.544, "percentage": 51.47, "elapsed_time": "5:59:52", "remaining_time": "5:39:21"}
|
| 387 |
+
{"current_steps": 387, "total_steps": 750, "loss": 0.7866, "lr": 5.592019841532507e-06, "epoch": 1.548, "percentage": 51.6, "elapsed_time": "6:00:38", "remaining_time": "5:38:16"}
|
| 388 |
+
{"current_steps": 388, "total_steps": 750, "loss": 0.8453, "lr": 5.568906156261309e-06, "epoch": 1.552, "percentage": 51.73, "elapsed_time": "6:01:30", "remaining_time": "5:37:16"}
|
| 389 |
+
{"current_steps": 389, "total_steps": 750, "loss": 0.8188, "lr": 5.54578014754744e-06, "epoch": 1.556, "percentage": 51.87, "elapsed_time": "6:02:17", "remaining_time": "5:36:13"}
|
| 390 |
+
{"current_steps": 390, "total_steps": 750, "loss": 0.8008, "lr": 5.522642316338268e-06, "epoch": 1.56, "percentage": 52.0, "elapsed_time": "6:03:09", "remaining_time": "5:35:13"}
|
| 391 |
+
{"current_steps": 391, "total_steps": 750, "loss": 0.876, "lr": 5.499493163837258e-06, "epoch": 1.564, "percentage": 52.13, "elapsed_time": "6:04:09", "remaining_time": "5:34:20"}
|
| 392 |
+
{"current_steps": 392, "total_steps": 750, "loss": 0.7961, "lr": 5.476333191493108e-06, "epoch": 1.568, "percentage": 52.27, "elapsed_time": "6:04:54", "remaining_time": "5:33:15"}
|
| 393 |
+
{"current_steps": 393, "total_steps": 750, "loss": 0.8384, "lr": 5.453162900988902e-06, "epoch": 1.572, "percentage": 52.4, "elapsed_time": "6:05:55", "remaining_time": "5:32:23"}
|
| 394 |
+
{"current_steps": 394, "total_steps": 750, "loss": 0.8287, "lr": 5.429982794231221e-06, "epoch": 1.576, "percentage": 52.53, "elapsed_time": "6:06:59", "remaining_time": "5:31:35"}
|
| 395 |
+
{"current_steps": 395, "total_steps": 750, "loss": 0.825, "lr": 5.406793373339292e-06, "epoch": 1.58, "percentage": 52.67, "elapsed_time": "6:07:57", "remaining_time": "5:30:41"}
|
| 396 |
+
{"current_steps": 396, "total_steps": 750, "loss": 0.8195, "lr": 5.383595140634093e-06, "epoch": 1.584, "percentage": 52.8, "elapsed_time": "6:08:53", "remaining_time": "5:29:45"}
|
| 397 |
+
{"current_steps": 397, "total_steps": 750, "loss": 0.7859, "lr": 5.360388598627487e-06, "epoch": 1.588, "percentage": 52.93, "elapsed_time": "6:09:54", "remaining_time": "5:28:54"}
|
| 398 |
+
{"current_steps": 398, "total_steps": 750, "loss": 0.7739, "lr": 5.337174250011326e-06, "epoch": 1.592, "percentage": 53.07, "elapsed_time": "6:10:42", "remaining_time": "5:27:51"}
|
| 399 |
+
{"current_steps": 399, "total_steps": 750, "loss": 0.8241, "lr": 5.3139525976465675e-06, "epoch": 1.596, "percentage": 53.2, "elapsed_time": "6:11:46", "remaining_time": "5:27:03"}
|
| 400 |
+
{"current_steps": 400, "total_steps": 750, "loss": 0.8186, "lr": 5.290724144552379e-06, "epoch": 1.6, "percentage": 53.33, "elapsed_time": "6:12:39", "remaining_time": "5:26:04"}
|
| 401 |
+
{"current_steps": 401, "total_steps": 750, "loss": 0.7989, "lr": 5.267489393895247e-06, "epoch": 1.604, "percentage": 53.47, "elapsed_time": "6:13:32", "remaining_time": "5:25:06"}
|
| 402 |
+
{"current_steps": 402, "total_steps": 750, "loss": 0.8459, "lr": 5.244248848978067e-06, "epoch": 1.608, "percentage": 53.6, "elapsed_time": "6:14:35", "remaining_time": "5:24:16"}
|
| 403 |
+
{"current_steps": 403, "total_steps": 750, "loss": 0.8308, "lr": 5.221003013229253e-06, "epoch": 1.612, "percentage": 53.73, "elapsed_time": "6:15:28", "remaining_time": "5:23:17"}
|
| 404 |
+
{"current_steps": 404, "total_steps": 750, "loss": 0.8204, "lr": 5.197752390191827e-06, "epoch": 1.616, "percentage": 53.87, "elapsed_time": "6:16:26", "remaining_time": "5:22:24"}
|
| 405 |
+
{"current_steps": 405, "total_steps": 750, "loss": 0.8598, "lr": 5.174497483512506e-06, "epoch": 1.62, "percentage": 54.0, "elapsed_time": "6:17:24", "remaining_time": "5:21:30"}
|
| 406 |
+
{"current_steps": 406, "total_steps": 750, "loss": 0.8271, "lr": 5.151238796930804e-06, "epoch": 1.624, "percentage": 54.13, "elapsed_time": "6:18:16", "remaining_time": "5:20:30"}
|
| 407 |
+
{"current_steps": 407, "total_steps": 750, "loss": 0.8019, "lr": 5.127976834268112e-06, "epoch": 1.6280000000000001, "percentage": 54.27, "elapsed_time": "6:19:08", "remaining_time": "5:19:31"}
|
| 408 |
+
{"current_steps": 408, "total_steps": 750, "loss": 0.8342, "lr": 5.1047120994167855e-06, "epoch": 1.6320000000000001, "percentage": 54.4, "elapsed_time": "6:20:01", "remaining_time": "5:18:32"}
|
| 409 |
+
{"current_steps": 409, "total_steps": 750, "loss": 0.8294, "lr": 5.081445096329229e-06, "epoch": 1.6360000000000001, "percentage": 54.53, "elapsed_time": "6:20:49", "remaining_time": "5:17:30"}
|
| 410 |
+
{"current_steps": 410, "total_steps": 750, "loss": 0.797, "lr": 5.0581763290069865e-06, "epoch": 1.6400000000000001, "percentage": 54.67, "elapsed_time": "6:21:40", "remaining_time": "5:16:31"}
|
| 411 |
+
{"current_steps": 411, "total_steps": 750, "loss": 0.7843, "lr": 5.034906301489808e-06, "epoch": 1.6440000000000001, "percentage": 54.8, "elapsed_time": "6:22:37", "remaining_time": "5:15:35"}
|
| 412 |
+
{"current_steps": 412, "total_steps": 750, "loss": 0.7805, "lr": 5.011635517844753e-06, "epoch": 1.6480000000000001, "percentage": 54.93, "elapsed_time": "6:23:19", "remaining_time": "5:14:28"}
|
| 413 |
+
{"current_steps": 413, "total_steps": 750, "loss": 0.8101, "lr": 4.988364482155249e-06, "epoch": 1.6520000000000001, "percentage": 55.07, "elapsed_time": "6:24:13", "remaining_time": "5:13:31"}
|
| 414 |
+
{"current_steps": 414, "total_steps": 750, "loss": 0.7977, "lr": 4.965093698510192e-06, "epoch": 1.6560000000000001, "percentage": 55.2, "elapsed_time": "6:25:11", "remaining_time": "5:12:37"}
|
| 415 |
+
{"current_steps": 415, "total_steps": 750, "loss": 0.8385, "lr": 4.941823670993016e-06, "epoch": 1.6600000000000001, "percentage": 55.33, "elapsed_time": "6:26:08", "remaining_time": "5:11:42"}
|
| 416 |
+
{"current_steps": 416, "total_steps": 750, "loss": 0.8213, "lr": 4.9185549036707715e-06, "epoch": 1.6640000000000001, "percentage": 55.47, "elapsed_time": "6:27:13", "remaining_time": "5:10:53"}
|
| 417 |
+
{"current_steps": 417, "total_steps": 750, "loss": 0.8416, "lr": 4.895287900583216e-06, "epoch": 1.6680000000000001, "percentage": 55.6, "elapsed_time": "6:28:07", "remaining_time": "5:09:56"}
|
| 418 |
+
{"current_steps": 418, "total_steps": 750, "loss": 0.809, "lr": 4.87202316573189e-06, "epoch": 1.6720000000000002, "percentage": 55.73, "elapsed_time": "6:29:00", "remaining_time": "5:08:58"}
|
| 419 |
+
{"current_steps": 419, "total_steps": 750, "loss": 0.8451, "lr": 4.8487612030691975e-06, "epoch": 1.6760000000000002, "percentage": 55.87, "elapsed_time": "6:30:01", "remaining_time": "5:08:06"}
|
| 420 |
+
{"current_steps": 420, "total_steps": 750, "loss": 0.8033, "lr": 4.825502516487497e-06, "epoch": 1.6800000000000002, "percentage": 56.0, "elapsed_time": "6:30:50", "remaining_time": "5:07:05"}
|
| 421 |
+
{"current_steps": 421, "total_steps": 750, "loss": 0.7785, "lr": 4.802247609808175e-06, "epoch": 1.6840000000000002, "percentage": 56.13, "elapsed_time": "6:31:46", "remaining_time": "5:06:09"}
|
| 422 |
+
{"current_steps": 422, "total_steps": 750, "loss": 0.8273, "lr": 4.778996986770747e-06, "epoch": 1.688, "percentage": 56.27, "elapsed_time": "6:32:43", "remaining_time": "5:05:14"}
|
| 423 |
+
{"current_steps": 423, "total_steps": 750, "loss": 0.8136, "lr": 4.755751151021934e-06, "epoch": 1.692, "percentage": 56.4, "elapsed_time": "6:33:39", "remaining_time": "5:04:19"}
|
| 424 |
+
{"current_steps": 424, "total_steps": 750, "loss": 0.7944, "lr": 4.732510606104754e-06, "epoch": 1.696, "percentage": 56.53, "elapsed_time": "6:34:30", "remaining_time": "5:03:19"}
|
| 425 |
+
{"current_steps": 425, "total_steps": 750, "loss": 0.7787, "lr": 4.7092758554476215e-06, "epoch": 1.7, "percentage": 56.67, "elapsed_time": "6:35:17", "remaining_time": "5:02:16"}
|
| 426 |
+
{"current_steps": 426, "total_steps": 750, "loss": 0.8449, "lr": 4.686047402353433e-06, "epoch": 1.704, "percentage": 56.8, "elapsed_time": "6:36:11", "remaining_time": "5:01:19"}
|
| 427 |
+
{"current_steps": 427, "total_steps": 750, "loss": 0.8656, "lr": 4.662825749988675e-06, "epoch": 1.708, "percentage": 56.93, "elapsed_time": "6:37:09", "remaining_time": "5:00:25"}
|
| 428 |
+
{"current_steps": 428, "total_steps": 750, "loss": 0.8263, "lr": 4.639611401372514e-06, "epoch": 1.712, "percentage": 57.07, "elapsed_time": "6:38:00", "remaining_time": "4:59:26"}
|
| 429 |
+
{"current_steps": 429, "total_steps": 750, "loss": 0.7882, "lr": 4.6164048593659076e-06, "epoch": 1.716, "percentage": 57.2, "elapsed_time": "6:38:57", "remaining_time": "4:58:31"}
|
| 430 |
+
{"current_steps": 430, "total_steps": 750, "loss": 0.8271, "lr": 4.59320662666071e-06, "epoch": 1.72, "percentage": 57.33, "elapsed_time": "6:40:07", "remaining_time": "4:57:46"}
|
| 431 |
+
{"current_steps": 431, "total_steps": 750, "loss": 0.8182, "lr": 4.570017205768779e-06, "epoch": 1.724, "percentage": 57.47, "elapsed_time": "6:41:01", "remaining_time": "4:56:48"}
|
| 432 |
+
{"current_steps": 432, "total_steps": 750, "loss": 0.7873, "lr": 4.546837099011101e-06, "epoch": 1.728, "percentage": 57.6, "elapsed_time": "6:41:54", "remaining_time": "4:55:50"}
|
| 433 |
+
{"current_steps": 433, "total_steps": 750, "loss": 0.8012, "lr": 4.523666808506893e-06, "epoch": 1.732, "percentage": 57.73, "elapsed_time": "6:42:51", "remaining_time": "4:54:55"}
|
| 434 |
+
{"current_steps": 434, "total_steps": 750, "loss": 0.8149, "lr": 4.500506836162746e-06, "epoch": 1.736, "percentage": 57.87, "elapsed_time": "6:43:46", "remaining_time": "4:53:59"}
|
| 435 |
+
{"current_steps": 435, "total_steps": 750, "loss": 0.8252, "lr": 4.477357683661734e-06, "epoch": 1.74, "percentage": 58.0, "elapsed_time": "6:44:47", "remaining_time": "4:53:07"}
|
| 436 |
+
{"current_steps": 436, "total_steps": 750, "loss": 0.7868, "lr": 4.45421985245256e-06, "epoch": 1.744, "percentage": 58.13, "elapsed_time": "6:45:40", "remaining_time": "4:52:09"}
|
| 437 |
+
{"current_steps": 437, "total_steps": 750, "loss": 0.8138, "lr": 4.431093843738693e-06, "epoch": 1.748, "percentage": 58.27, "elapsed_time": "6:46:42", "remaining_time": "4:51:18"}
|
| 438 |
+
{"current_steps": 438, "total_steps": 750, "loss": 0.8376, "lr": 4.4079801584674955e-06, "epoch": 1.752, "percentage": 58.4, "elapsed_time": "6:47:39", "remaining_time": "4:50:23"}
|
| 439 |
+
{"current_steps": 439, "total_steps": 750, "loss": 0.8347, "lr": 4.384879297319398e-06, "epoch": 1.756, "percentage": 58.53, "elapsed_time": "6:48:30", "remaining_time": "4:49:23"}
|
| 440 |
+
{"current_steps": 440, "total_steps": 750, "loss": 0.8501, "lr": 4.361791760697027e-06, "epoch": 1.76, "percentage": 58.67, "elapsed_time": "6:49:26", "remaining_time": "4:48:28"}
|
| 441 |
+
{"current_steps": 441, "total_steps": 750, "loss": 0.8194, "lr": 4.3387180487143875e-06, "epoch": 1.764, "percentage": 58.8, "elapsed_time": "6:50:23", "remaining_time": "4:47:33"}
|
| 442 |
+
{"current_steps": 442, "total_steps": 750, "loss": 0.8352, "lr": 4.315658661186016e-06, "epoch": 1.768, "percentage": 58.93, "elapsed_time": "6:51:12", "remaining_time": "4:46:32"}
|
| 443 |
+
{"current_steps": 443, "total_steps": 750, "loss": 0.8033, "lr": 4.2926140976161555e-06, "epoch": 1.772, "percentage": 59.07, "elapsed_time": "6:52:03", "remaining_time": "4:45:33"}
|
| 444 |
+
{"current_steps": 444, "total_steps": 750, "loss": 0.7962, "lr": 4.269584857187942e-06, "epoch": 1.776, "percentage": 59.2, "elapsed_time": "6:53:08", "remaining_time": "4:44:44"}
|
| 445 |
+
{"current_steps": 445, "total_steps": 750, "loss": 0.8152, "lr": 4.246571438752585e-06, "epoch": 1.78, "percentage": 59.33, "elapsed_time": "6:53:59", "remaining_time": "4:43:44"}
|
| 446 |
+
{"current_steps": 446, "total_steps": 750, "loss": 0.8351, "lr": 4.2235743408185635e-06, "epoch": 1.784, "percentage": 59.47, "elapsed_time": "6:54:55", "remaining_time": "4:42:48"}
|
| 447 |
+
{"current_steps": 447, "total_steps": 750, "loss": 0.8292, "lr": 4.200594061540827e-06, "epoch": 1.788, "percentage": 59.6, "elapsed_time": "6:55:53", "remaining_time": "4:41:55"}
|
| 448 |
+
{"current_steps": 448, "total_steps": 750, "loss": 0.8349, "lr": 4.1776310987100054e-06, "epoch": 1.792, "percentage": 59.73, "elapsed_time": "6:56:49", "remaining_time": "4:40:59"}
|
| 449 |
+
{"current_steps": 449, "total_steps": 750, "loss": 0.841, "lr": 4.154685949741631e-06, "epoch": 1.796, "percentage": 59.87, "elapsed_time": "6:57:37", "remaining_time": "4:39:58"}
|
| 450 |
+
{"current_steps": 450, "total_steps": 750, "loss": 0.8478, "lr": 4.131759111665349e-06, "epoch": 1.8, "percentage": 60.0, "elapsed_time": "6:58:41", "remaining_time": "4:39:07"}
|
| 451 |
+
{"current_steps": 451, "total_steps": 750, "loss": 0.842, "lr": 4.108851081114169e-06, "epoch": 1.804, "percentage": 60.13, "elapsed_time": "6:59:32", "remaining_time": "4:38:08"}
|
| 452 |
+
{"current_steps": 452, "total_steps": 750, "loss": 0.8085, "lr": 4.0859623543136935e-06, "epoch": 1.808, "percentage": 60.27, "elapsed_time": "7:00:31", "remaining_time": "4:37:15"}
|
| 453 |
+
{"current_steps": 453, "total_steps": 750, "loss": 0.8226, "lr": 4.063093427071376e-06, "epoch": 1.812, "percentage": 60.4, "elapsed_time": "7:01:28", "remaining_time": "4:36:19"}
|
| 454 |
+
{"current_steps": 454, "total_steps": 750, "loss": 0.7907, "lr": 4.040244794765783e-06, "epoch": 1.8159999999999998, "percentage": 60.53, "elapsed_time": "7:02:18", "remaining_time": "4:35:19"}
|
| 455 |
+
{"current_steps": 455, "total_steps": 750, "loss": 0.8148, "lr": 4.017416952335849e-06, "epoch": 1.8199999999999998, "percentage": 60.67, "elapsed_time": "7:03:17", "remaining_time": "4:34:26"}
|
| 456 |
+
{"current_steps": 456, "total_steps": 750, "loss": 0.8446, "lr": 3.994610394270178e-06, "epoch": 1.8239999999999998, "percentage": 60.8, "elapsed_time": "7:04:18", "remaining_time": "4:33:33"}
|
| 457 |
+
{"current_steps": 457, "total_steps": 750, "loss": 0.8151, "lr": 3.971825614596308e-06, "epoch": 1.8279999999999998, "percentage": 60.93, "elapsed_time": "7:05:17", "remaining_time": "4:32:40"}
|
| 458 |
+
{"current_steps": 458, "total_steps": 750, "loss": 0.8365, "lr": 3.949063106870031e-06, "epoch": 1.8319999999999999, "percentage": 61.07, "elapsed_time": "7:06:20", "remaining_time": "4:31:48"}
|
| 459 |
+
{"current_steps": 459, "total_steps": 750, "loss": 0.8226, "lr": 3.926323364164684e-06, "epoch": 1.8359999999999999, "percentage": 61.2, "elapsed_time": "7:07:28", "remaining_time": "4:31:00"}
|
| 460 |
+
{"current_steps": 460, "total_steps": 750, "loss": 0.7785, "lr": 3.903606879060483e-06, "epoch": 1.8399999999999999, "percentage": 61.33, "elapsed_time": "7:08:23", "remaining_time": "4:30:04"}
|
| 461 |
+
{"current_steps": 461, "total_steps": 750, "loss": 0.7751, "lr": 3.880914143633844e-06, "epoch": 1.8439999999999999, "percentage": 61.47, "elapsed_time": "7:09:08", "remaining_time": "4:29:01"}
|
| 462 |
+
{"current_steps": 462, "total_steps": 750, "loss": 0.8252, "lr": 3.8582456494467214e-06, "epoch": 1.8479999999999999, "percentage": 61.6, "elapsed_time": "7:10:15", "remaining_time": "4:28:12"}
|
| 463 |
+
{"current_steps": 463, "total_steps": 750, "loss": 0.782, "lr": 3.835601887535971e-06, "epoch": 1.8519999999999999, "percentage": 61.73, "elapsed_time": "7:11:11", "remaining_time": "4:27:17"}
|
| 464 |
+
{"current_steps": 464, "total_steps": 750, "loss": 0.7884, "lr": 3.812983348402703e-06, "epoch": 1.8559999999999999, "percentage": 61.87, "elapsed_time": "7:12:04", "remaining_time": "4:26:19"}
|
| 465 |
+
{"current_steps": 465, "total_steps": 750, "loss": 0.8269, "lr": 3.790390522001662e-06, "epoch": 1.8599999999999999, "percentage": 62.0, "elapsed_time": "7:13:01", "remaining_time": "4:25:24"}
|
| 466 |
+
{"current_steps": 466, "total_steps": 750, "loss": 0.8175, "lr": 3.767823897730612e-06, "epoch": 1.8639999999999999, "percentage": 62.13, "elapsed_time": "7:13:57", "remaining_time": "4:24:28"}
|
| 467 |
+
{"current_steps": 467, "total_steps": 750, "loss": 0.8265, "lr": 3.745283964419736e-06, "epoch": 1.8679999999999999, "percentage": 62.27, "elapsed_time": "7:14:53", "remaining_time": "4:23:32"}
|
| 468 |
+
{"current_steps": 468, "total_steps": 750, "loss": 0.8422, "lr": 3.7227712103210485e-06, "epoch": 1.8719999999999999, "percentage": 62.4, "elapsed_time": "7:15:45", "remaining_time": "4:22:34"}
|
| 469 |
+
{"current_steps": 469, "total_steps": 750, "loss": 0.8218, "lr": 3.700286123097814e-06, "epoch": 1.876, "percentage": 62.53, "elapsed_time": "7:16:38", "remaining_time": "4:21:37"}
|
| 470 |
+
{"current_steps": 470, "total_steps": 750, "loss": 0.7906, "lr": 3.6778291898139907e-06, "epoch": 1.88, "percentage": 62.67, "elapsed_time": "7:17:23", "remaining_time": "4:20:34"}
|
| 471 |
+
{"current_steps": 471, "total_steps": 750, "loss": 0.7864, "lr": 3.655400896923672e-06, "epoch": 1.884, "percentage": 62.8, "elapsed_time": "7:18:12", "remaining_time": "4:19:34"}
|
| 472 |
+
{"current_steps": 472, "total_steps": 750, "loss": 0.8228, "lr": 3.633001730260558e-06, "epoch": 1.888, "percentage": 62.93, "elapsed_time": "7:19:13", "remaining_time": "4:18:42"}
|
| 473 |
+
{"current_steps": 473, "total_steps": 750, "loss": 0.816, "lr": 3.6106321750274275e-06, "epoch": 1.892, "percentage": 63.07, "elapsed_time": "7:20:08", "remaining_time": "4:17:45"}
|
| 474 |
+
{"current_steps": 474, "total_steps": 750, "loss": 0.8663, "lr": 3.5882927157856175e-06, "epoch": 1.896, "percentage": 63.2, "elapsed_time": "7:21:15", "remaining_time": "4:16:56"}
|
| 475 |
+
{"current_steps": 475, "total_steps": 750, "loss": 0.8209, "lr": 3.5659838364445505e-06, "epoch": 1.9, "percentage": 63.33, "elapsed_time": "7:22:14", "remaining_time": "4:16:02"}
|
| 476 |
+
{"current_steps": 476, "total_steps": 750, "loss": 0.8279, "lr": 3.543706020251223e-06, "epoch": 1.904, "percentage": 63.47, "elapsed_time": "7:23:07", "remaining_time": "4:15:04"}
|
| 477 |
+
{"current_steps": 477, "total_steps": 750, "loss": 0.8156, "lr": 3.521459749779769e-06, "epoch": 1.908, "percentage": 63.6, "elapsed_time": "7:24:08", "remaining_time": "4:14:11"}
|
| 478 |
+
{"current_steps": 478, "total_steps": 750, "loss": 0.8152, "lr": 3.4992455069209717e-06, "epoch": 1.912, "percentage": 63.73, "elapsed_time": "7:25:00", "remaining_time": "4:13:13"}
|
| 479 |
+
{"current_steps": 479, "total_steps": 750, "loss": 0.832, "lr": 3.4770637728718608e-06, "epoch": 1.916, "percentage": 63.87, "elapsed_time": "7:25:56", "remaining_time": "4:12:17"}
|
| 480 |
+
{"current_steps": 480, "total_steps": 750, "loss": 0.8177, "lr": 3.4549150281252635e-06, "epoch": 1.92, "percentage": 64.0, "elapsed_time": "7:26:59", "remaining_time": "4:11:26"}
|
| 481 |
+
{"current_steps": 481, "total_steps": 750, "loss": 0.8401, "lr": 3.4327997524594026e-06, "epoch": 1.924, "percentage": 64.13, "elapsed_time": "7:27:58", "remaining_time": "4:10:31"}
|
| 482 |
+
{"current_steps": 482, "total_steps": 750, "loss": 0.8577, "lr": 3.4107184249275114e-06, "epoch": 1.928, "percentage": 64.27, "elapsed_time": "7:29:02", "remaining_time": "4:09:40"}
|
| 483 |
+
{"current_steps": 483, "total_steps": 750, "loss": 0.8171, "lr": 3.3886715238474454e-06, "epoch": 1.932, "percentage": 64.4, "elapsed_time": "7:30:02", "remaining_time": "4:08:46"}
|
| 484 |
+
{"current_steps": 484, "total_steps": 750, "loss": 0.8573, "lr": 3.3666595267913293e-06, "epoch": 1.936, "percentage": 64.53, "elapsed_time": "7:31:07", "remaining_time": "4:07:55"}
|
| 485 |
+
{"current_steps": 485, "total_steps": 750, "loss": 0.8174, "lr": 3.3446829105752103e-06, "epoch": 1.94, "percentage": 64.67, "elapsed_time": "7:32:12", "remaining_time": "4:07:04"}
|
| 486 |
+
{"current_steps": 486, "total_steps": 750, "loss": 0.8119, "lr": 3.322742151248726e-06, "epoch": 1.944, "percentage": 64.8, "elapsed_time": "7:33:02", "remaining_time": "4:06:05"}
|
| 487 |
+
{"current_steps": 487, "total_steps": 750, "loss": 0.8051, "lr": 3.3008377240847955e-06, "epoch": 1.948, "percentage": 64.93, "elapsed_time": "7:34:03", "remaining_time": "4:05:12"}
|
| 488 |
+
{"current_steps": 488, "total_steps": 750, "loss": 0.8547, "lr": 3.2789701035693242e-06, "epoch": 1.952, "percentage": 65.07, "elapsed_time": "7:34:56", "remaining_time": "4:04:15"}
|
| 489 |
+
{"current_steps": 489, "total_steps": 750, "loss": 0.8522, "lr": 3.2571397633909252e-06, "epoch": 1.956, "percentage": 65.2, "elapsed_time": "7:35:59", "remaining_time": "4:03:22"}
|
| 490 |
+
{"current_steps": 490, "total_steps": 750, "loss": 0.8417, "lr": 3.2353471764306567e-06, "epoch": 1.96, "percentage": 65.33, "elapsed_time": "7:37:05", "remaining_time": "4:02:32"}
|
| 491 |
+
{"current_steps": 491, "total_steps": 750, "loss": 0.7664, "lr": 3.2135928147517803e-06, "epoch": 1.964, "percentage": 65.47, "elapsed_time": "7:37:52", "remaining_time": "4:01:31"}
|
| 492 |
+
{"current_steps": 492, "total_steps": 750, "loss": 0.8248, "lr": 3.1918771495895395e-06, "epoch": 1.968, "percentage": 65.6, "elapsed_time": "7:38:50", "remaining_time": "4:00:36"}
|
| 493 |
+
{"current_steps": 493, "total_steps": 750, "loss": 0.8189, "lr": 3.1702006513409393e-06, "epoch": 1.972, "percentage": 65.73, "elapsed_time": "7:39:43", "remaining_time": "3:59:39"}
|
| 494 |
+
{"current_steps": 494, "total_steps": 750, "loss": 0.8193, "lr": 3.148563789554575e-06, "epoch": 1.976, "percentage": 65.87, "elapsed_time": "7:40:39", "remaining_time": "3:58:43"}
|
| 495 |
+
{"current_steps": 495, "total_steps": 750, "loss": 0.8297, "lr": 3.12696703292044e-06, "epoch": 1.98, "percentage": 66.0, "elapsed_time": "7:41:30", "remaining_time": "3:57:44"}
|
| 496 |
+
{"current_steps": 496, "total_steps": 750, "loss": 0.7984, "lr": 3.105410849259796e-06, "epoch": 1.984, "percentage": 66.13, "elapsed_time": "7:42:27", "remaining_time": "3:56:49"}
|
| 497 |
+
{"current_steps": 497, "total_steps": 750, "loss": 0.8072, "lr": 3.0838957055150136e-06, "epoch": 1.988, "percentage": 66.27, "elapsed_time": "7:43:16", "remaining_time": "3:55:50"}
|
| 498 |
+
{"current_steps": 498, "total_steps": 750, "loss": 0.7919, "lr": 3.0624220677394854e-06, "epoch": 1.992, "percentage": 66.4, "elapsed_time": "7:44:12", "remaining_time": "3:54:54"}
|
| 499 |
+
{"current_steps": 499, "total_steps": 750, "loss": 0.8406, "lr": 3.040990401087508e-06, "epoch": 1.996, "percentage": 66.53, "elapsed_time": "7:45:14", "remaining_time": "3:54:01"}
|
| 500 |
+
{"current_steps": 500, "total_steps": 750, "loss": 0.7982, "lr": 3.019601169804216e-06, "epoch": 2.0, "percentage": 66.67, "elapsed_time": "7:46:11", "remaining_time": "3:53:05"}
|
| 501 |
+
{"current_steps": 501, "total_steps": 750, "loss": 0.7587, "lr": 2.9982548372155264e-06, "epoch": 2.004, "percentage": 66.8, "elapsed_time": "7:48:10", "remaining_time": "3:52:40"}
|
| 502 |
+
{"current_steps": 502, "total_steps": 750, "loss": 0.7893, "lr": 2.9769518657180953e-06, "epoch": 2.008, "percentage": 66.93, "elapsed_time": "7:49:01", "remaining_time": "3:51:42"}
|