Training in progress, epoch 2
Browse files
model-00001-of-00004.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 4877660776
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:74c76337a5307045a87fa4b8362f0d44299a09c1e800e54edededb91bd53b0bd
|
| 3 |
size 4877660776
|
model-00002-of-00004.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 4932751008
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:58b88e9708c907da1e0c14458cc4281dc4a3292fc9823616a4e46f410a1be534
|
| 3 |
size 4932751008
|
model-00003-of-00004.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 4330865200
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:1cae79e345cf7a1a53d45865aeeffc95fb86fd7ddc47baec0ee23c50e7d046a4
|
| 3 |
size 4330865200
|
model-00004-of-00004.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 1089994880
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:acbf4ca0afcddf25301799d323c3a7e3b9e0fa372d1db58aacfefcf9f1452f57
|
| 3 |
size 1089994880
|
trainer_log.jsonl
CHANGED
|
@@ -294,3 +294,149 @@
|
|
| 294 |
{"current_steps": 294, "total_steps": 441, "loss": 0.6613, "lr": 2.425399127352235e-05, "epoch": 1.9940652818991098, "percentage": 66.67, "elapsed_time": "8:47:51", "remaining_time": "4:23:55"}
|
| 295 |
{"current_steps": 295, "total_steps": 441, "loss": 1.0436, "lr": 2.3962778583735463e-05, "epoch": 2.0008478168715556, "percentage": 66.89, "elapsed_time": "8:50:50", "remaining_time": "4:22:43"}
|
| 296 |
{"current_steps": 296, "total_steps": 441, "loss": 0.6518, "lr": 2.3672575231011888e-05, "epoch": 2.0076303518440017, "percentage": 67.12, "elapsed_time": "8:52:36", "remaining_time": "4:20:54"}
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 294 |
{"current_steps": 294, "total_steps": 441, "loss": 0.6613, "lr": 2.425399127352235e-05, "epoch": 1.9940652818991098, "percentage": 66.67, "elapsed_time": "8:47:51", "remaining_time": "4:23:55"}
|
| 295 |
{"current_steps": 295, "total_steps": 441, "loss": 1.0436, "lr": 2.3962778583735463e-05, "epoch": 2.0008478168715556, "percentage": 66.89, "elapsed_time": "8:50:50", "remaining_time": "4:22:43"}
|
| 296 |
{"current_steps": 296, "total_steps": 441, "loss": 0.6518, "lr": 2.3672575231011888e-05, "epoch": 2.0076303518440017, "percentage": 67.12, "elapsed_time": "8:52:36", "remaining_time": "4:20:54"}
|
| 297 |
+
{"current_steps": 297, "total_steps": 441, "loss": 0.6541, "lr": 2.338339947992455e-05, "epoch": 2.0144128868164475, "percentage": 67.35, "elapsed_time": "8:54:23", "remaining_time": "4:19:05"}
|
| 298 |
+
{"current_steps": 298, "total_steps": 441, "loss": 0.642, "lr": 2.3095269530372032e-05, "epoch": 2.0211954217888937, "percentage": 67.57, "elapsed_time": "8:56:09", "remaining_time": "4:17:17"}
|
| 299 |
+
{"current_steps": 299, "total_steps": 441, "loss": 0.6585, "lr": 2.2808203516433136e-05, "epoch": 2.0279779567613394, "percentage": 67.8, "elapsed_time": "8:57:56", "remaining_time": "4:15:28"}
|
| 300 |
+
{"current_steps": 300, "total_steps": 441, "loss": 0.6367, "lr": 2.2522219505225627e-05, "epoch": 2.0347604917337856, "percentage": 68.03, "elapsed_time": "8:59:44", "remaining_time": "4:13:40"}
|
| 301 |
+
{"current_steps": 301, "total_steps": 441, "loss": 0.6435, "lr": 2.2237335495769035e-05, "epoch": 2.0415430267062313, "percentage": 68.25, "elapsed_time": "9:01:31", "remaining_time": "4:11:52"}
|
| 302 |
+
{"current_steps": 302, "total_steps": 441, "loss": 0.6512, "lr": 2.1953569417851983e-05, "epoch": 2.0483255616786775, "percentage": 68.48, "elapsed_time": "9:03:18", "remaining_time": "4:10:03"}
|
| 303 |
+
{"current_steps": 303, "total_steps": 441, "loss": 0.6421, "lr": 2.1670939130903585e-05, "epoch": 2.0551080966511233, "percentage": 68.71, "elapsed_time": "9:05:05", "remaining_time": "4:08:15"}
|
| 304 |
+
{"current_steps": 304, "total_steps": 441, "loss": 0.6449, "lr": 2.1389462422869576e-05, "epoch": 2.0618906316235694, "percentage": 68.93, "elapsed_time": "9:06:51", "remaining_time": "4:06:26"}
|
| 305 |
+
{"current_steps": 305, "total_steps": 441, "loss": 0.645, "lr": 2.11091570090927e-05, "epoch": 2.068673166596015, "percentage": 69.16, "elapsed_time": "9:08:38", "remaining_time": "4:04:38"}
|
| 306 |
+
{"current_steps": 306, "total_steps": 441, "loss": 0.6486, "lr": 2.0830040531197744e-05, "epoch": 2.0754557015684614, "percentage": 69.39, "elapsed_time": "9:10:24", "remaining_time": "4:02:49"}
|
| 307 |
+
{"current_steps": 307, "total_steps": 441, "loss": 0.6294, "lr": 2.055213055598126e-05, "epoch": 2.082238236540907, "percentage": 69.61, "elapsed_time": "9:12:11", "remaining_time": "4:01:01"}
|
| 308 |
+
{"current_steps": 308, "total_steps": 441, "loss": 0.6533, "lr": 2.027544457430599e-05, "epoch": 2.0890207715133533, "percentage": 69.84, "elapsed_time": "9:13:58", "remaining_time": "3:59:12"}
|
| 309 |
+
{"current_steps": 309, "total_steps": 441, "loss": 0.6439, "lr": 2.0000000000000012e-05, "epoch": 2.095803306485799, "percentage": 70.07, "elapsed_time": "9:15:44", "remaining_time": "3:57:24"}
|
| 310 |
+
{"current_steps": 310, "total_steps": 441, "loss": 0.6326, "lr": 1.9725814168760688e-05, "epoch": 2.1025858414582452, "percentage": 70.29, "elapsed_time": "9:17:31", "remaining_time": "3:55:35"}
|
| 311 |
+
{"current_steps": 311, "total_steps": 441, "loss": 0.6294, "lr": 1.9452904337063757e-05, "epoch": 2.109368376430691, "percentage": 70.52, "elapsed_time": "9:19:17", "remaining_time": "3:53:47"}
|
| 312 |
+
{"current_steps": 312, "total_steps": 441, "loss": 0.6391, "lr": 1.9181287681077116e-05, "epoch": 2.1161509114031367, "percentage": 70.75, "elapsed_time": "9:21:04", "remaining_time": "3:51:58"}
|
| 313 |
+
{"current_steps": 313, "total_steps": 441, "loss": 0.6363, "lr": 1.8910981295579903e-05, "epoch": 2.122933446375583, "percentage": 70.98, "elapsed_time": "9:22:50", "remaining_time": "3:50:10"}
|
| 314 |
+
{"current_steps": 314, "total_steps": 441, "loss": 0.6499, "lr": 1.864200219288656e-05, "epoch": 2.1297159813480286, "percentage": 71.2, "elapsed_time": "9:24:36", "remaining_time": "3:48:21"}
|
| 315 |
+
{"current_steps": 315, "total_steps": 441, "loss": 0.6484, "lr": 1.8374367301776112e-05, "epoch": 2.136498516320475, "percentage": 71.43, "elapsed_time": "9:26:24", "remaining_time": "3:46:33"}
|
| 316 |
+
{"current_steps": 316, "total_steps": 441, "loss": 0.6517, "lr": 1.8108093466426713e-05, "epoch": 2.1432810512929206, "percentage": 71.66, "elapsed_time": "9:28:11", "remaining_time": "3:44:45"}
|
| 317 |
+
{"current_steps": 317, "total_steps": 441, "loss": 0.6424, "lr": 1.7843197445355593e-05, "epoch": 2.1500635862653668, "percentage": 71.88, "elapsed_time": "9:29:58", "remaining_time": "3:42:57"}
|
| 318 |
+
{"current_steps": 318, "total_steps": 441, "loss": 0.6327, "lr": 1.7579695910364235e-05, "epoch": 2.1568461212378125, "percentage": 72.11, "elapsed_time": "9:31:45", "remaining_time": "3:41:09"}
|
| 319 |
+
{"current_steps": 319, "total_steps": 441, "loss": 0.6332, "lr": 1.7317605445489178e-05, "epoch": 2.1636286562102587, "percentage": 72.34, "elapsed_time": "9:33:32", "remaining_time": "3:39:20"}
|
| 320 |
+
{"current_steps": 320, "total_steps": 441, "loss": 0.6664, "lr": 1.7056942545958167e-05, "epoch": 2.1704111911827044, "percentage": 72.56, "elapsed_time": "9:35:18", "remaining_time": "3:37:32"}
|
| 321 |
+
{"current_steps": 321, "total_steps": 441, "loss": 0.6411, "lr": 1.679772361715208e-05, "epoch": 2.1771937261551506, "percentage": 72.79, "elapsed_time": "9:37:06", "remaining_time": "3:35:44"}
|
| 322 |
+
{"current_steps": 322, "total_steps": 441, "loss": 0.6454, "lr": 1.6539964973572388e-05, "epoch": 2.1839762611275964, "percentage": 73.02, "elapsed_time": "9:38:54", "remaining_time": "3:33:56"}
|
| 323 |
+
{"current_steps": 323, "total_steps": 441, "loss": 0.646, "lr": 1.6283682837814388e-05, "epoch": 2.1907587961000425, "percentage": 73.24, "elapsed_time": "9:40:41", "remaining_time": "3:32:08"}
|
| 324 |
+
{"current_steps": 324, "total_steps": 441, "loss": 0.6326, "lr": 1.6028893339546122e-05, "epoch": 2.1975413310724883, "percentage": 73.47, "elapsed_time": "9:42:30", "remaining_time": "3:30:20"}
|
| 325 |
+
{"current_steps": 325, "total_steps": 441, "loss": 0.6461, "lr": 1.5775612514493343e-05, "epoch": 2.2043238660449345, "percentage": 73.7, "elapsed_time": "9:44:19", "remaining_time": "3:28:33"}
|
| 326 |
+
{"current_steps": 326, "total_steps": 441, "loss": 0.6372, "lr": 1.552385630343014e-05, "epoch": 2.21110640101738, "percentage": 73.92, "elapsed_time": "9:46:08", "remaining_time": "3:26:46"}
|
| 327 |
+
{"current_steps": 327, "total_steps": 441, "loss": 0.6286, "lr": 1.527364055117579e-05, "epoch": 2.2178889359898264, "percentage": 74.15, "elapsed_time": "9:47:58", "remaining_time": "3:24:58"}
|
| 328 |
+
{"current_steps": 328, "total_steps": 441, "loss": 0.6439, "lr": 1.502498100559747e-05, "epoch": 2.224671470962272, "percentage": 74.38, "elapsed_time": "9:49:45", "remaining_time": "3:23:10"}
|
| 329 |
+
{"current_steps": 329, "total_steps": 441, "loss": 0.6369, "lr": 1.4777893316619114e-05, "epoch": 2.231454005934718, "percentage": 74.6, "elapsed_time": "9:51:35", "remaining_time": "3:21:23"}
|
| 330 |
+
{"current_steps": 330, "total_steps": 441, "loss": 0.6385, "lr": 1.4532393035236477e-05, "epoch": 2.238236540907164, "percentage": 74.83, "elapsed_time": "9:53:25", "remaining_time": "3:19:36"}
|
| 331 |
+
{"current_steps": 331, "total_steps": 441, "loss": 0.6339, "lr": 1.4288495612538427e-05, "epoch": 2.24501907587961, "percentage": 75.06, "elapsed_time": "9:55:12", "remaining_time": "3:17:48"}
|
| 332 |
+
{"current_steps": 332, "total_steps": 441, "loss": 0.6397, "lr": 1.404621639873447e-05, "epoch": 2.251801610852056, "percentage": 75.28, "elapsed_time": "9:56:59", "remaining_time": "3:15:59"}
|
| 333 |
+
{"current_steps": 333, "total_steps": 441, "loss": 0.645, "lr": 1.3805570642188602e-05, "epoch": 2.2585841458245017, "percentage": 75.51, "elapsed_time": "9:58:45", "remaining_time": "3:14:11"}
|
| 334 |
+
{"current_steps": 334, "total_steps": 441, "loss": 0.6449, "lr": 1.3566573488459729e-05, "epoch": 2.265366680796948, "percentage": 75.74, "elapsed_time": "10:00:34", "remaining_time": "3:12:23"}
|
| 335 |
+
{"current_steps": 335, "total_steps": 441, "loss": 0.64, "lr": 1.3329239979348341e-05, "epoch": 2.2721492157693937, "percentage": 75.96, "elapsed_time": "10:02:21", "remaining_time": "3:10:35"}
|
| 336 |
+
{"current_steps": 336, "total_steps": 441, "loss": 0.6514, "lr": 1.30935850519499e-05, "epoch": 2.27893175074184, "percentage": 76.19, "elapsed_time": "10:04:07", "remaining_time": "3:08:47"}
|
| 337 |
+
{"current_steps": 337, "total_steps": 441, "loss": 0.6551, "lr": 1.2859623537714719e-05, "epoch": 2.2857142857142856, "percentage": 76.42, "elapsed_time": "10:05:54", "remaining_time": "3:06:59"}
|
| 338 |
+
{"current_steps": 338, "total_steps": 441, "loss": 0.6299, "lr": 1.262737016151447e-05, "epoch": 2.2924968206867318, "percentage": 76.64, "elapsed_time": "10:07:40", "remaining_time": "3:05:10"}
|
| 339 |
+
{"current_steps": 339, "total_steps": 441, "loss": 0.6316, "lr": 1.2396839540715528e-05, "epoch": 2.2992793556591775, "percentage": 76.87, "elapsed_time": "10:09:27", "remaining_time": "3:03:22"}
|
| 340 |
+
{"current_steps": 340, "total_steps": 441, "loss": 0.6284, "lr": 1.2168046184258896e-05, "epoch": 2.3060618906316237, "percentage": 77.1, "elapsed_time": "10:11:14", "remaining_time": "3:01:34"}
|
| 341 |
+
{"current_steps": 341, "total_steps": 441, "loss": 0.6436, "lr": 1.1941004491747145e-05, "epoch": 2.3128444256040694, "percentage": 77.32, "elapsed_time": "10:13:01", "remaining_time": "2:59:46"}
|
| 342 |
+
{"current_steps": 342, "total_steps": 441, "loss": 0.644, "lr": 1.1715728752538103e-05, "epoch": 2.3196269605765156, "percentage": 77.55, "elapsed_time": "10:14:48", "remaining_time": "2:57:58"}
|
| 343 |
+
{"current_steps": 343, "total_steps": 441, "loss": 0.654, "lr": 1.1492233144845497e-05, "epoch": 2.3264094955489614, "percentage": 77.78, "elapsed_time": "10:16:35", "remaining_time": "2:56:10"}
|
| 344 |
+
{"current_steps": 344, "total_steps": 441, "loss": 0.6383, "lr": 1.1270531734846642e-05, "epoch": 2.3331920305214076, "percentage": 78.0, "elapsed_time": "10:18:22", "remaining_time": "2:54:22"}
|
| 345 |
+
{"current_steps": 345, "total_steps": 441, "loss": 0.6486, "lr": 1.1050638475797193e-05, "epoch": 2.3399745654938533, "percentage": 78.23, "elapsed_time": "10:20:09", "remaining_time": "2:52:33"}
|
| 346 |
+
{"current_steps": 346, "total_steps": 441, "loss": 0.6404, "lr": 1.083256720715292e-05, "epoch": 2.3467571004662995, "percentage": 78.46, "elapsed_time": "10:21:55", "remaining_time": "2:50:45"}
|
| 347 |
+
{"current_steps": 347, "total_steps": 441, "loss": 0.6532, "lr": 1.0616331653698673e-05, "epoch": 2.3535396354387452, "percentage": 78.68, "elapsed_time": "10:23:43", "remaining_time": "2:48:57"}
|
| 348 |
+
{"current_steps": 348, "total_steps": 441, "loss": 0.6345, "lr": 1.0401945424684653e-05, "epoch": 2.360322170411191, "percentage": 78.91, "elapsed_time": "10:25:30", "remaining_time": "2:47:09"}
|
| 349 |
+
{"current_steps": 349, "total_steps": 441, "loss": 0.6482, "lr": 1.0189422012969814e-05, "epoch": 2.367104705383637, "percentage": 79.14, "elapsed_time": "10:27:18", "remaining_time": "2:45:21"}
|
| 350 |
+
{"current_steps": 350, "total_steps": 441, "loss": 0.6243, "lr": 9.978774794172717e-06, "epoch": 2.373887240356083, "percentage": 79.37, "elapsed_time": "10:29:05", "remaining_time": "2:43:33"}
|
| 351 |
+
{"current_steps": 351, "total_steps": 441, "loss": 0.6464, "lr": 9.770017025829675e-06, "epoch": 2.380669775328529, "percentage": 79.59, "elapsed_time": "10:30:52", "remaining_time": "2:41:45"}
|
| 352 |
+
{"current_steps": 352, "total_steps": 441, "loss": 0.6399, "lr": 9.563161846560342e-06, "epoch": 2.387452310300975, "percentage": 79.82, "elapsed_time": "10:32:38", "remaining_time": "2:39:57"}
|
| 353 |
+
{"current_steps": 353, "total_steps": 441, "loss": 0.6369, "lr": 9.358222275240884e-06, "epoch": 2.394234845273421, "percentage": 80.05, "elapsed_time": "10:34:25", "remaining_time": "2:38:09"}
|
| 354 |
+
{"current_steps": 354, "total_steps": 441, "loss": 0.6389, "lr": 9.155211210184495e-06, "epoch": 2.4010173802458668, "percentage": 80.27, "elapsed_time": "10:36:12", "remaining_time": "2:36:21"}
|
| 355 |
+
{"current_steps": 355, "total_steps": 441, "loss": 0.6377, "lr": 8.954141428329723e-06, "epoch": 2.407799915218313, "percentage": 80.5, "elapsed_time": "10:37:58", "remaining_time": "2:34:33"}
|
| 356 |
+
{"current_steps": 356, "total_steps": 441, "loss": 0.6376, "lr": 8.755025584436266e-06, "epoch": 2.4145824501907587, "percentage": 80.73, "elapsed_time": "10:39:45", "remaining_time": "2:32:45"}
|
| 357 |
+
{"current_steps": 357, "total_steps": 441, "loss": 0.6506, "lr": 8.55787621028851e-06, "epoch": 2.421364985163205, "percentage": 80.95, "elapsed_time": "10:41:31", "remaining_time": "2:30:56"}
|
| 358 |
+
{"current_steps": 358, "total_steps": 441, "loss": 0.6313, "lr": 8.362705713906836e-06, "epoch": 2.4281475201356506, "percentage": 81.18, "elapsed_time": "10:43:19", "remaining_time": "2:29:08"}
|
| 359 |
+
{"current_steps": 359, "total_steps": 441, "loss": 0.6429, "lr": 8.169526378766713e-06, "epoch": 2.434930055108097, "percentage": 81.41, "elapsed_time": "10:45:06", "remaining_time": "2:27:20"}
|
| 360 |
+
{"current_steps": 360, "total_steps": 441, "loss": 0.6407, "lr": 7.978350363025588e-06, "epoch": 2.4417125900805425, "percentage": 81.63, "elapsed_time": "10:46:53", "remaining_time": "2:25:33"}
|
| 361 |
+
{"current_steps": 361, "total_steps": 441, "loss": 0.6348, "lr": 7.789189698757656e-06, "epoch": 2.4484951250529887, "percentage": 81.86, "elapsed_time": "10:48:41", "remaining_time": "2:23:45"}
|
| 362 |
+
{"current_steps": 362, "total_steps": 441, "loss": 0.6459, "lr": 7.602056291196671e-06, "epoch": 2.4552776600254345, "percentage": 82.09, "elapsed_time": "10:50:29", "remaining_time": "2:21:57"}
|
| 363 |
+
{"current_steps": 363, "total_steps": 441, "loss": 0.6509, "lr": 7.416961917986572e-06, "epoch": 2.4620601949978806, "percentage": 82.31, "elapsed_time": "10:52:18", "remaining_time": "2:20:09"}
|
| 364 |
+
{"current_steps": 364, "total_steps": 441, "loss": 0.6348, "lr": 7.233918228440324e-06, "epoch": 2.4688427299703264, "percentage": 82.54, "elapsed_time": "10:54:07", "remaining_time": "2:18:22"}
|
| 365 |
+
{"current_steps": 365, "total_steps": 441, "loss": 0.646, "lr": 7.052936742806693e-06, "epoch": 2.4756252649427726, "percentage": 82.77, "elapsed_time": "10:55:56", "remaining_time": "2:16:34"}
|
| 366 |
+
{"current_steps": 366, "total_steps": 441, "loss": 0.64, "lr": 6.874028851545174e-06, "epoch": 2.4824077999152183, "percentage": 82.99, "elapsed_time": "10:57:45", "remaining_time": "2:14:47"}
|
| 367 |
+
{"current_steps": 367, "total_steps": 441, "loss": 0.6324, "lr": 6.697205814609149e-06, "epoch": 2.489190334887664, "percentage": 83.22, "elapsed_time": "10:59:34", "remaining_time": "2:12:59"}
|
| 368 |
+
{"current_steps": 368, "total_steps": 441, "loss": 0.6398, "lr": 6.522478760737212e-06, "epoch": 2.4959728698601102, "percentage": 83.45, "elapsed_time": "11:01:21", "remaining_time": "2:11:11"}
|
| 369 |
+
{"current_steps": 369, "total_steps": 441, "loss": 0.6441, "lr": 6.349858686752748e-06, "epoch": 2.5027554048325564, "percentage": 83.67, "elapsed_time": "11:03:08", "remaining_time": "2:09:23"}
|
| 370 |
+
{"current_steps": 370, "total_steps": 441, "loss": 0.6307, "lr": 6.17935645687183e-06, "epoch": 2.509537939805002, "percentage": 83.9, "elapsed_time": "11:04:54", "remaining_time": "2:07:35"}
|
| 371 |
+
{"current_steps": 371, "total_steps": 441, "loss": 0.6382, "lr": 6.010982802019429e-06, "epoch": 2.516320474777448, "percentage": 84.13, "elapsed_time": "11:06:41", "remaining_time": "2:05:47"}
|
| 372 |
+
{"current_steps": 372, "total_steps": 441, "loss": 0.6427, "lr": 5.8447483191540784e-06, "epoch": 2.523103009749894, "percentage": 84.35, "elapsed_time": "11:08:28", "remaining_time": "2:03:59"}
|
| 373 |
+
{"current_steps": 373, "total_steps": 441, "loss": 0.6479, "lr": 5.680663470600918e-06, "epoch": 2.52988554472234, "percentage": 84.58, "elapsed_time": "11:10:15", "remaining_time": "2:02:11"}
|
| 374 |
+
{"current_steps": 374, "total_steps": 441, "loss": 0.6508, "lr": 5.518738583393228e-06, "epoch": 2.536668079694786, "percentage": 84.81, "elapsed_time": "11:12:01", "remaining_time": "2:00:23"}
|
| 375 |
+
{"current_steps": 375, "total_steps": 441, "loss": 0.6372, "lr": 5.358983848622452e-06, "epoch": 2.5434506146672318, "percentage": 85.03, "elapsed_time": "11:13:49", "remaining_time": "1:58:35"}
|
| 376 |
+
{"current_steps": 376, "total_steps": 441, "loss": 0.6397, "lr": 5.201409320796842e-06, "epoch": 2.550233149639678, "percentage": 85.26, "elapsed_time": "11:15:35", "remaining_time": "1:56:47"}
|
| 377 |
+
{"current_steps": 377, "total_steps": 441, "loss": 0.6386, "lr": 5.046024917208603e-06, "epoch": 2.5570156846121237, "percentage": 85.49, "elapsed_time": "11:17:21", "remaining_time": "1:54:59"}
|
| 378 |
+
{"current_steps": 378, "total_steps": 441, "loss": 0.6489, "lr": 4.892840417309775e-06, "epoch": 2.56379821958457, "percentage": 85.71, "elapsed_time": "11:19:08", "remaining_time": "1:53:11"}
|
| 379 |
+
{"current_steps": 379, "total_steps": 441, "loss": 0.6527, "lr": 4.7418654620967216e-06, "epoch": 2.5705807545570156, "percentage": 85.94, "elapsed_time": "11:20:55", "remaining_time": "1:51:23"}
|
| 380 |
+
{"current_steps": 380, "total_steps": 441, "loss": 0.6428, "lr": 4.593109553503343e-06, "epoch": 2.577363289529462, "percentage": 86.17, "elapsed_time": "11:22:41", "remaining_time": "1:49:35"}
|
| 381 |
+
{"current_steps": 381, "total_steps": 441, "loss": 0.6408, "lr": 4.446582053803066e-06, "epoch": 2.5841458245019076, "percentage": 86.39, "elapsed_time": "11:24:28", "remaining_time": "1:47:47"}
|
| 382 |
+
{"current_steps": 382, "total_steps": 441, "loss": 0.6496, "lr": 4.302292185019603e-06, "epoch": 2.5909283594743533, "percentage": 86.62, "elapsed_time": "11:26:15", "remaining_time": "1:45:59"}
|
| 383 |
+
{"current_steps": 383, "total_steps": 441, "loss": 0.6407, "lr": 4.16024902834657e-06, "epoch": 2.5977108944467995, "percentage": 86.85, "elapsed_time": "11:28:02", "remaining_time": "1:44:11"}
|
| 384 |
+
{"current_steps": 384, "total_steps": 441, "loss": 0.6497, "lr": 4.020461523575873e-06, "epoch": 2.6044934294192457, "percentage": 87.07, "elapsed_time": "11:29:49", "remaining_time": "1:42:23"}
|
| 385 |
+
{"current_steps": 385, "total_steps": 441, "loss": 0.6473, "lr": 3.882938468535158e-06, "epoch": 2.6112759643916914, "percentage": 87.3, "elapsed_time": "11:31:35", "remaining_time": "1:40:35"}
|
| 386 |
+
{"current_steps": 386, "total_steps": 441, "loss": 0.6467, "lr": 3.747688518534003e-06, "epoch": 2.618058499364137, "percentage": 87.53, "elapsed_time": "11:33:21", "remaining_time": "1:38:47"}
|
| 387 |
+
{"current_steps": 387, "total_steps": 441, "loss": 0.6271, "lr": 3.6147201858192627e-06, "epoch": 2.6248410343365833, "percentage": 87.76, "elapsed_time": "11:35:08", "remaining_time": "1:36:59"}
|
| 388 |
+
{"current_steps": 388, "total_steps": 441, "loss": 0.6417, "lr": 3.4840418390392895e-06, "epoch": 2.6316235693090295, "percentage": 87.98, "elapsed_time": "11:36:55", "remaining_time": "1:35:11"}
|
| 389 |
+
{"current_steps": 389, "total_steps": 441, "loss": 0.6474, "lr": 3.3556617027172168e-06, "epoch": 2.6384061042814753, "percentage": 88.21, "elapsed_time": "11:38:41", "remaining_time": "1:33:23"}
|
| 390 |
+
{"current_steps": 390, "total_steps": 441, "loss": 0.6475, "lr": 3.2295878567333784e-06, "epoch": 2.645188639253921, "percentage": 88.44, "elapsed_time": "11:40:28", "remaining_time": "1:31:36"}
|
| 391 |
+
{"current_steps": 391, "total_steps": 441, "loss": 0.6478, "lr": 3.1058282358167503e-06, "epoch": 2.651971174226367, "percentage": 88.66, "elapsed_time": "11:42:15", "remaining_time": "1:29:48"}
|
| 392 |
+
{"current_steps": 392, "total_steps": 441, "loss": 0.6469, "lr": 2.984390629045555e-06, "epoch": 2.658753709198813, "percentage": 88.89, "elapsed_time": "11:44:02", "remaining_time": "1:28:00"}
|
| 393 |
+
{"current_steps": 393, "total_steps": 441, "loss": 0.625, "lr": 2.8652826793570975e-06, "epoch": 2.665536244171259, "percentage": 89.12, "elapsed_time": "11:45:49", "remaining_time": "1:26:12"}
|
| 394 |
+
{"current_steps": 394, "total_steps": 441, "loss": 0.6419, "lr": 2.7485118830666535e-06, "epoch": 2.672318779143705, "percentage": 89.34, "elapsed_time": "11:47:35", "remaining_time": "1:24:24"}
|
| 395 |
+
{"current_steps": 395, "total_steps": 441, "loss": 0.6396, "lr": 2.634085589395734e-06, "epoch": 2.679101314116151, "percentage": 89.57, "elapsed_time": "11:49:23", "remaining_time": "1:22:36"}
|
| 396 |
+
{"current_steps": 396, "total_steps": 441, "loss": 0.6453, "lr": 2.5220110000095366e-06, "epoch": 2.685883849088597, "percentage": 89.8, "elapsed_time": "11:51:11", "remaining_time": "1:20:49"}
|
| 397 |
+
{"current_steps": 397, "total_steps": 441, "loss": 0.6473, "lr": 2.4122951685636674e-06, "epoch": 2.692666384061043, "percentage": 90.02, "elapsed_time": "11:53:00", "remaining_time": "1:19:01"}
|
| 398 |
+
{"current_steps": 398, "total_steps": 441, "loss": 0.627, "lr": 2.3049450002602394e-06, "epoch": 2.6994489190334887, "percentage": 90.25, "elapsed_time": "11:54:47", "remaining_time": "1:17:13"}
|
| 399 |
+
{"current_steps": 399, "total_steps": 441, "loss": 0.6411, "lr": 2.199967251413262e-06, "epoch": 2.706231454005935, "percentage": 90.48, "elapsed_time": "11:56:34", "remaining_time": "1:15:25"}
|
| 400 |
+
{"current_steps": 400, "total_steps": 441, "loss": 0.6307, "lr": 2.0973685290234024e-06, "epoch": 2.7130139889783806, "percentage": 90.7, "elapsed_time": "11:58:23", "remaining_time": "1:13:38"}
|
| 401 |
+
{"current_steps": 401, "total_steps": 441, "loss": 0.6452, "lr": 1.997155290362187e-06, "epoch": 2.7197965239508264, "percentage": 90.93, "elapsed_time": "12:00:12", "remaining_time": "1:11:50"}
|
| 402 |
+
{"current_steps": 402, "total_steps": 441, "loss": 0.6472, "lr": 1.8993338425655805e-06, "epoch": 2.7265790589232726, "percentage": 91.16, "elapsed_time": "12:02:03", "remaining_time": "1:10:03"}
|
| 403 |
+
{"current_steps": 403, "total_steps": 441, "loss": 0.6341, "lr": 1.8039103422370452e-06, "epoch": 2.7333615938957188, "percentage": 91.38, "elapsed_time": "12:03:52", "remaining_time": "1:08:15"}
|
| 404 |
+
{"current_steps": 404, "total_steps": 441, "loss": 0.6292, "lr": 1.7108907950600516e-06, "epoch": 2.7401441288681645, "percentage": 91.61, "elapsed_time": "12:05:40", "remaining_time": "1:06:27"}
|
| 405 |
+
{"current_steps": 405, "total_steps": 441, "loss": 0.6437, "lr": 1.6202810554201099e-06, "epoch": 2.7469266638406102, "percentage": 91.84, "elapsed_time": "12:07:27", "remaining_time": "1:04:39"}
|
| 406 |
+
{"current_steps": 406, "total_steps": 441, "loss": 0.6456, "lr": 1.532086826036281e-06, "epoch": 2.7537091988130564, "percentage": 92.06, "elapsed_time": "12:09:13", "remaining_time": "1:02:51"}
|
| 407 |
+
{"current_steps": 407, "total_steps": 441, "loss": 0.6502, "lr": 1.4463136576023185e-06, "epoch": 2.760491733785502, "percentage": 92.29, "elapsed_time": "12:11:00", "remaining_time": "1:01:04"}
|
| 408 |
+
{"current_steps": 408, "total_steps": 441, "loss": 0.6469, "lr": 1.3629669484372722e-06, "epoch": 2.7672742687579484, "percentage": 92.52, "elapsed_time": "12:12:47", "remaining_time": "0:59:16"}
|
| 409 |
+
{"current_steps": 409, "total_steps": 441, "loss": 0.6431, "lr": 1.2820519441457502e-06, "epoch": 2.774056803730394, "percentage": 92.74, "elapsed_time": "12:14:34", "remaining_time": "0:57:28"}
|
| 410 |
+
{"current_steps": 410, "total_steps": 441, "loss": 0.6456, "lr": 1.2035737372877931e-06, "epoch": 2.7808393387028403, "percentage": 92.97, "elapsed_time": "12:16:21", "remaining_time": "0:55:40"}
|
| 411 |
+
{"current_steps": 411, "total_steps": 441, "loss": 0.6459, "lr": 1.127537267058334e-06, "epoch": 2.787621873675286, "percentage": 93.2, "elapsed_time": "12:18:08", "remaining_time": "0:53:52"}
|
| 412 |
+
{"current_steps": 412, "total_steps": 441, "loss": 0.6429, "lr": 1.0539473189763583e-06, "epoch": 2.794404408647732, "percentage": 93.42, "elapsed_time": "12:19:54", "remaining_time": "0:52:04"}
|
| 413 |
+
{"current_steps": 413, "total_steps": 441, "loss": 0.6341, "lr": 9.828085245837183e-07, "epoch": 2.801186943620178, "percentage": 93.65, "elapsed_time": "12:21:41", "remaining_time": "0:50:17"}
|
| 414 |
+
{"current_steps": 414, "total_steps": 441, "loss": 0.6494, "lr": 9.141253611536238e-07, "epoch": 2.807969478592624, "percentage": 93.88, "elapsed_time": "12:23:28", "remaining_time": "0:48:29"}
|
| 415 |
+
{"current_steps": 415, "total_steps": 441, "loss": 0.6424, "lr": 8.479021514088548e-07, "epoch": 2.81475201356507, "percentage": 94.1, "elapsed_time": "12:25:16", "remaining_time": "0:46:41"}
|
| 416 |
+
{"current_steps": 416, "total_steps": 441, "loss": 0.6426, "lr": 7.841430632497204e-07, "epoch": 2.821534548537516, "percentage": 94.33, "elapsed_time": "12:27:02", "remaining_time": "0:44:53"}
|
| 417 |
+
{"current_steps": 417, "total_steps": 441, "loss": 0.6438, "lr": 7.228521094917318e-07, "epoch": 2.828317083509962, "percentage": 94.56, "elapsed_time": "12:28:49", "remaining_time": "0:43:05"}
|
| 418 |
+
{"current_steps": 418, "total_steps": 441, "loss": 0.6405, "lr": 6.640331476130435e-07, "epoch": 2.835099618482408, "percentage": 94.78, "elapsed_time": "12:30:35", "remaining_time": "0:41:18"}
|
| 419 |
+
{"current_steps": 419, "total_steps": 441, "loss": 0.6489, "lr": 6.076898795116792e-07, "epoch": 2.8418821534548537, "percentage": 95.01, "elapsed_time": "12:32:22", "remaining_time": "0:39:30"}
|
| 420 |
+
{"current_steps": 420, "total_steps": 441, "loss": 0.6209, "lr": 5.538258512725403e-07, "epoch": 2.8486646884272995, "percentage": 95.24, "elapsed_time": "12:34:11", "remaining_time": "0:37:42"}
|
| 421 |
+
{"current_steps": 421, "total_steps": 441, "loss": 0.6447, "lr": 5.024444529442285e-07, "epoch": 2.8554472233997457, "percentage": 95.46, "elapsed_time": "12:35:57", "remaining_time": "0:35:54"}
|
| 422 |
+
{"current_steps": 422, "total_steps": 441, "loss": 0.6327, "lr": 4.5354891832569245e-07, "epoch": 2.862229758372192, "percentage": 95.69, "elapsed_time": "12:37:44", "remaining_time": "0:34:06"}
|
| 423 |
+
{"current_steps": 423, "total_steps": 441, "loss": 0.6357, "lr": 4.0714232476269265e-07, "epoch": 2.8690122933446376, "percentage": 95.92, "elapsed_time": "12:39:31", "remaining_time": "0:32:19"}
|
| 424 |
+
{"current_steps": 424, "total_steps": 441, "loss": 0.6384, "lr": 3.632275929541207e-07, "epoch": 2.8757948283170833, "percentage": 96.15, "elapsed_time": "12:41:17", "remaining_time": "0:30:31"}
|
| 425 |
+
{"current_steps": 425, "total_steps": 441, "loss": 0.6343, "lr": 3.218074867681864e-07, "epoch": 2.8825773632895295, "percentage": 96.37, "elapsed_time": "12:43:05", "remaining_time": "0:28:43"}
|
| 426 |
+
{"current_steps": 426, "total_steps": 441, "loss": 0.6418, "lr": 2.8288461306846817e-07, "epoch": 2.8893598982619753, "percentage": 96.6, "elapsed_time": "12:44:51", "remaining_time": "0:26:55"}
|
| 427 |
+
{"current_steps": 427, "total_steps": 441, "loss": 0.6399, "lr": 2.464614215498351e-07, "epoch": 2.8961424332344214, "percentage": 96.83, "elapsed_time": "12:46:38", "remaining_time": "0:25:08"}
|
| 428 |
+
{"current_steps": 428, "total_steps": 441, "loss": 0.645, "lr": 2.1254020458427281e-07, "epoch": 2.902924968206867, "percentage": 97.05, "elapsed_time": "12:48:24", "remaining_time": "0:23:20"}
|
| 429 |
+
{"current_steps": 429, "total_steps": 441, "loss": 0.6366, "lr": 1.8112309707661647e-07, "epoch": 2.9097075031793134, "percentage": 97.28, "elapsed_time": "12:50:11", "remaining_time": "0:21:32"}
|
| 430 |
+
{"current_steps": 430, "total_steps": 441, "loss": 0.6468, "lr": 1.522120763301782e-07, "epoch": 2.916490038151759, "percentage": 97.51, "elapsed_time": "12:51:57", "remaining_time": "0:19:44"}
|
| 431 |
+
{"current_steps": 431, "total_steps": 441, "loss": 0.6457, "lr": 1.2580896192230906e-07, "epoch": 2.9232725731242053, "percentage": 97.73, "elapsed_time": "12:53:45", "remaining_time": "0:17:57"}
|
| 432 |
+
{"current_steps": 432, "total_steps": 441, "loss": 0.648, "lr": 1.019154155898594e-07, "epoch": 2.930055108096651, "percentage": 97.96, "elapsed_time": "12:55:31", "remaining_time": "0:16:09"}
|
| 433 |
+
{"current_steps": 433, "total_steps": 441, "loss": 0.6406, "lr": 8.053294112462696e-08, "epoch": 2.9368376430690972, "percentage": 98.19, "elapsed_time": "12:57:18", "remaining_time": "0:14:21"}
|
| 434 |
+
{"current_steps": 434, "total_steps": 441, "loss": 0.6349, "lr": 6.166288427867706e-08, "epoch": 2.943620178041543, "percentage": 98.41, "elapsed_time": "12:59:06", "remaining_time": "0:12:33"}
|
| 435 |
+
{"current_steps": 435, "total_steps": 441, "loss": 0.6532, "lr": 4.530643267968149e-08, "epoch": 2.9504027130139887, "percentage": 98.64, "elapsed_time": "13:00:53", "remaining_time": "0:10:46"}
|
| 436 |
+
{"current_steps": 436, "total_steps": 441, "loss": 0.6323, "lr": 3.1464615756133796e-08, "epoch": 2.957185247986435, "percentage": 98.87, "elapsed_time": "13:02:40", "remaining_time": "0:08:58"}
|
| 437 |
+
{"current_steps": 437, "total_steps": 441, "loss": 0.6495, "lr": 2.01383046725967e-08, "epoch": 2.963967782958881, "percentage": 99.09, "elapsed_time": "13:04:29", "remaining_time": "0:07:10"}
|
| 438 |
+
{"current_steps": 438, "total_steps": 441, "loss": 0.6516, "lr": 1.1328212274839267e-08, "epoch": 2.970750317931327, "percentage": 99.32, "elapsed_time": "13:06:17", "remaining_time": "0:05:23"}
|
| 439 |
+
{"current_steps": 439, "total_steps": 441, "loss": 0.6377, "lr": 5.034893044997269e-09, "epoch": 2.9775328529037726, "percentage": 99.55, "elapsed_time": "13:08:06", "remaining_time": "0:03:35"}
|
| 440 |
+
{"current_steps": 440, "total_steps": 441, "loss": 0.6443, "lr": 1.2587430666766153e-09, "epoch": 2.9843153878762188, "percentage": 99.77, "elapsed_time": "13:09:56", "remaining_time": "0:01:47"}
|
| 441 |
+
{"current_steps": 441, "total_steps": 441, "loss": 0.6409, "lr": 0.0, "epoch": 2.991097922848665, "percentage": 100.0, "elapsed_time": "13:11:44", "remaining_time": "0:00:00"}
|
| 442 |
+
{"current_steps": 441, "total_steps": 441, "epoch": 2.991097922848665, "percentage": 100.0, "elapsed_time": "13:13:49", "remaining_time": "0:00:00"}
|