Training in progress, epoch 4
Browse files
model-00001-of-00004.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 4877660776
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:6d49ad30bcd6ad70aedc18fc8e27452edc708711851da4798b32cc418096753d
|
| 3 |
size 4877660776
|
model-00002-of-00004.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 4932751008
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:cbef6f6bca0cc4b1f1b466aff2750ed5a791bf45b69f45c1abb2a0145ee319bf
|
| 3 |
size 4932751008
|
model-00003-of-00004.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 4330865200
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:7658a695fae6c7a1d9b86ff973691a21f23093721a9cec921cf205e7ef20210d
|
| 3 |
size 4330865200
|
model-00004-of-00004.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 1089994880
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:25a2acb4040aaa99033ca6d314f3872941e3ed125e2a024f0ae133bb93983380
|
| 3 |
size 1089994880
|
trainer_log.jsonl
CHANGED
|
@@ -499,3 +499,128 @@
|
|
| 499 |
{"current_steps": 499, "total_steps": 625, "loss": 0.4066, "lr": 9.518509952841586e-06, "epoch": 3.9860209685471792, "percentage": 79.84, "elapsed_time": "21:19:49", "remaining_time": "5:23:09"}
|
| 500 |
{"current_steps": 500, "total_steps": 625, "loss": 0.4039, "lr": 9.374197950119726e-06, "epoch": 3.9940089865202197, "percentage": 80.0, "elapsed_time": "21:22:21", "remaining_time": "5:20:35"}
|
| 501 |
{"current_steps": 501, "total_steps": 625, "loss": 0.7111, "lr": 9.230842950740002e-06, "epoch": 4.00199700449326, "percentage": 80.16, "elapsed_time": "21:26:30", "remaining_time": "5:18:25"}
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 499 |
{"current_steps": 499, "total_steps": 625, "loss": 0.4066, "lr": 9.518509952841586e-06, "epoch": 3.9860209685471792, "percentage": 79.84, "elapsed_time": "21:19:49", "remaining_time": "5:23:09"}
|
| 500 |
{"current_steps": 500, "total_steps": 625, "loss": 0.4039, "lr": 9.374197950119726e-06, "epoch": 3.9940089865202197, "percentage": 80.0, "elapsed_time": "21:22:21", "remaining_time": "5:20:35"}
|
| 501 |
{"current_steps": 501, "total_steps": 625, "loss": 0.7111, "lr": 9.230842950740002e-06, "epoch": 4.00199700449326, "percentage": 80.16, "elapsed_time": "21:26:30", "remaining_time": "5:18:25"}
|
| 502 |
+
{"current_steps": 502, "total_steps": 625, "loss": 0.3809, "lr": 9.088449434298204e-06, "epoch": 4.0099850224663, "percentage": 80.32, "elapsed_time": "21:29:03", "remaining_time": "5:15:50"}
|
| 503 |
+
{"current_steps": 503, "total_steps": 625, "loss": 0.3726, "lr": 8.947021850345398e-06, "epoch": 4.017973040439341, "percentage": 80.48, "elapsed_time": "21:31:36", "remaining_time": "5:13:16"}
|
| 504 |
+
{"current_steps": 504, "total_steps": 625, "loss": 0.3808, "lr": 8.806564618248999e-06, "epoch": 4.025961058412381, "percentage": 80.64, "elapsed_time": "21:34:09", "remaining_time": "5:10:42"}
|
| 505 |
+
{"current_steps": 505, "total_steps": 625, "loss": 0.3832, "lr": 8.667082127054533e-06, "epoch": 4.033949076385422, "percentage": 80.8, "elapsed_time": "21:36:42", "remaining_time": "5:08:07"}
|
| 506 |
+
{"current_steps": 506, "total_steps": 625, "loss": 0.3779, "lr": 8.52857873534862e-06, "epoch": 4.041937094358462, "percentage": 80.96, "elapsed_time": "21:39:15", "remaining_time": "5:05:33"}
|
| 507 |
+
{"current_steps": 507, "total_steps": 625, "loss": 0.3831, "lr": 8.391058771122673e-06, "epoch": 4.049925112331502, "percentage": 81.12, "elapsed_time": "21:41:49", "remaining_time": "5:02:59"}
|
| 508 |
+
{"current_steps": 508, "total_steps": 625, "loss": 0.3874, "lr": 8.254526531637727e-06, "epoch": 4.057913130304543, "percentage": 81.28, "elapsed_time": "21:44:21", "remaining_time": "5:00:24"}
|
| 509 |
+
{"current_steps": 509, "total_steps": 625, "loss": 0.3873, "lr": 8.118986283290096e-06, "epoch": 4.065901148277583, "percentage": 81.44, "elapsed_time": "21:46:54", "remaining_time": "4:57:50"}
|
| 510 |
+
{"current_steps": 510, "total_steps": 625, "loss": 0.3779, "lr": 7.984442261478108e-06, "epoch": 4.073889166250624, "percentage": 81.6, "elapsed_time": "21:49:28", "remaining_time": "4:55:16"}
|
| 511 |
+
{"current_steps": 511, "total_steps": 625, "loss": 0.3796, "lr": 7.850898670469745e-06, "epoch": 4.081877184223664, "percentage": 81.76, "elapsed_time": "21:52:01", "remaining_time": "4:52:42"}
|
| 512 |
+
{"current_steps": 512, "total_steps": 625, "loss": 0.3801, "lr": 7.718359683271224e-06, "epoch": 4.089865202196705, "percentage": 81.92, "elapsed_time": "21:54:34", "remaining_time": "4:50:07"}
|
| 513 |
+
{"current_steps": 513, "total_steps": 625, "loss": 0.3692, "lr": 7.586829441496668e-06, "epoch": 4.097853220169745, "percentage": 82.08, "elapsed_time": "21:57:07", "remaining_time": "4:47:33"}
|
| 514 |
+
{"current_steps": 514, "total_steps": 625, "loss": 0.3792, "lr": 7.456312055238606e-06, "epoch": 4.105841238142786, "percentage": 82.24, "elapsed_time": "21:59:40", "remaining_time": "4:44:59"}
|
| 515 |
+
{"current_steps": 515, "total_steps": 625, "loss": 0.3825, "lr": 7.326811602939634e-06, "epoch": 4.113829256115826, "percentage": 82.4, "elapsed_time": "22:02:13", "remaining_time": "4:42:24"}
|
| 516 |
+
{"current_steps": 516, "total_steps": 625, "loss": 0.3827, "lr": 7.198332131264876e-06, "epoch": 4.121817274088866, "percentage": 82.56, "elapsed_time": "22:04:45", "remaining_time": "4:39:50"}
|
| 517 |
+
{"current_steps": 517, "total_steps": 625, "loss": 0.3858, "lr": 7.070877654975614e-06, "epoch": 4.129805292061907, "percentage": 82.72, "elapsed_time": "22:07:17", "remaining_time": "4:37:16"}
|
| 518 |
+
{"current_steps": 518, "total_steps": 625, "loss": 0.3763, "lr": 6.944452156803763e-06, "epoch": 4.137793310034947, "percentage": 82.88, "elapsed_time": "22:09:50", "remaining_time": "4:34:41"}
|
| 519 |
+
{"current_steps": 519, "total_steps": 625, "loss": 0.3798, "lr": 6.819059587327479e-06, "epoch": 4.145781328007988, "percentage": 83.04, "elapsed_time": "22:12:25", "remaining_time": "4:32:07"}
|
| 520 |
+
{"current_steps": 520, "total_steps": 625, "loss": 0.3812, "lr": 6.694703864847673e-06, "epoch": 4.153769345981028, "percentage": 83.2, "elapsed_time": "22:14:59", "remaining_time": "4:29:33"}
|
| 521 |
+
{"current_steps": 521, "total_steps": 625, "loss": 0.3804, "lr": 6.571388875265592e-06, "epoch": 4.161757363954069, "percentage": 83.36, "elapsed_time": "22:17:35", "remaining_time": "4:27:00"}
|
| 522 |
+
{"current_steps": 522, "total_steps": 625, "loss": 0.3815, "lr": 6.449118471961342e-06, "epoch": 4.169745381927109, "percentage": 83.52, "elapsed_time": "22:20:09", "remaining_time": "4:24:26"}
|
| 523 |
+
{"current_steps": 523, "total_steps": 625, "loss": 0.3796, "lr": 6.327896475673561e-06, "epoch": 4.177733399900149, "percentage": 83.68, "elapsed_time": "22:22:42", "remaining_time": "4:21:52"}
|
| 524 |
+
{"current_steps": 524, "total_steps": 625, "loss": 0.3802, "lr": 6.207726674379961e-06, "epoch": 4.18572141787319, "percentage": 83.84, "elapsed_time": "22:25:15", "remaining_time": "4:19:17"}
|
| 525 |
+
{"current_steps": 525, "total_steps": 625, "loss": 0.3752, "lr": 6.088612823178968e-06, "epoch": 4.19370943584623, "percentage": 84.0, "elapsed_time": "22:27:47", "remaining_time": "4:16:43"}
|
| 526 |
+
{"current_steps": 526, "total_steps": 625, "loss": 0.3772, "lr": 5.970558644172424e-06, "epoch": 4.201697453819271, "percentage": 84.16, "elapsed_time": "22:30:20", "remaining_time": "4:14:09"}
|
| 527 |
+
{"current_steps": 527, "total_steps": 625, "loss": 0.3738, "lr": 5.853567826349213e-06, "epoch": 4.209685471792311, "percentage": 84.32, "elapsed_time": "22:32:53", "remaining_time": "4:11:34"}
|
| 528 |
+
{"current_steps": 528, "total_steps": 625, "loss": 0.3752, "lr": 5.737644025470057e-06, "epoch": 4.217673489765352, "percentage": 84.48, "elapsed_time": "22:35:25", "remaining_time": "4:09:00"}
|
| 529 |
+
{"current_steps": 529, "total_steps": 625, "loss": 0.3822, "lr": 5.6227908639532045e-06, "epoch": 4.225661507738392, "percentage": 84.64, "elapsed_time": "22:37:58", "remaining_time": "4:06:26"}
|
| 530 |
+
{"current_steps": 530, "total_steps": 625, "loss": 0.381, "lr": 5.509011930761308e-06, "epoch": 4.233649525711433, "percentage": 84.8, "elapsed_time": "22:40:31", "remaining_time": "4:03:52"}
|
| 531 |
+
{"current_steps": 531, "total_steps": 625, "loss": 0.3816, "lr": 5.396310781289243e-06, "epoch": 4.241637543684473, "percentage": 84.96, "elapsed_time": "22:43:04", "remaining_time": "4:01:17"}
|
| 532 |
+
{"current_steps": 532, "total_steps": 625, "loss": 0.3696, "lr": 5.284690937252977e-06, "epoch": 4.249625561657513, "percentage": 85.12, "elapsed_time": "22:45:37", "remaining_time": "3:58:43"}
|
| 533 |
+
{"current_steps": 533, "total_steps": 625, "loss": 0.3859, "lr": 5.1741558865795906e-06, "epoch": 4.257613579630554, "percentage": 85.28, "elapsed_time": "22:48:10", "remaining_time": "3:56:09"}
|
| 534 |
+
{"current_steps": 534, "total_steps": 625, "loss": 0.3822, "lr": 5.064709083298214e-06, "epoch": 4.265601597603594, "percentage": 85.44, "elapsed_time": "22:50:43", "remaining_time": "3:53:35"}
|
| 535 |
+
{"current_steps": 535, "total_steps": 625, "loss": 0.3782, "lr": 4.95635394743216e-06, "epoch": 4.273589615576635, "percentage": 85.6, "elapsed_time": "22:53:16", "remaining_time": "3:51:01"}
|
| 536 |
+
{"current_steps": 536, "total_steps": 625, "loss": 0.3822, "lr": 4.849093864891994e-06, "epoch": 4.281577633549675, "percentage": 85.76, "elapsed_time": "22:55:48", "remaining_time": "3:48:26"}
|
| 537 |
+
{"current_steps": 537, "total_steps": 625, "loss": 0.3783, "lr": 4.7429321873697865e-06, "epoch": 4.289565651522716, "percentage": 85.92, "elapsed_time": "22:58:21", "remaining_time": "3:45:52"}
|
| 538 |
+
{"current_steps": 538, "total_steps": 625, "loss": 0.3805, "lr": 4.637872232234326e-06, "epoch": 4.297553669495756, "percentage": 86.08, "elapsed_time": "23:00:55", "remaining_time": "3:43:18"}
|
| 539 |
+
{"current_steps": 539, "total_steps": 625, "loss": 0.3795, "lr": 4.5339172824274955e-06, "epoch": 4.305541687468796, "percentage": 86.24, "elapsed_time": "23:03:27", "remaining_time": "3:40:44"}
|
| 540 |
+
{"current_steps": 540, "total_steps": 625, "loss": 0.3794, "lr": 4.4310705863616835e-06, "epoch": 4.313529705441837, "percentage": 86.4, "elapsed_time": "23:06:00", "remaining_time": "3:38:10"}
|
| 541 |
+
{"current_steps": 541, "total_steps": 625, "loss": 0.3759, "lr": 4.329335357818236e-06, "epoch": 4.321517723414877, "percentage": 86.56, "elapsed_time": "23:08:34", "remaining_time": "3:35:36"}
|
| 542 |
+
{"current_steps": 542, "total_steps": 625, "loss": 0.3877, "lr": 4.228714775847084e-06, "epoch": 4.329505741387918, "percentage": 86.72, "elapsed_time": "23:11:06", "remaining_time": "3:33:01"}
|
| 543 |
+
{"current_steps": 543, "total_steps": 625, "loss": 0.3803, "lr": 4.129211984667385e-06, "epoch": 4.337493759360958, "percentage": 86.88, "elapsed_time": "23:13:39", "remaining_time": "3:30:27"}
|
| 544 |
+
{"current_steps": 544, "total_steps": 625, "loss": 0.3764, "lr": 4.030830093569247e-06, "epoch": 4.345481777333999, "percentage": 87.04, "elapsed_time": "23:16:11", "remaining_time": "3:27:53"}
|
| 545 |
+
{"current_steps": 545, "total_steps": 625, "loss": 0.3818, "lr": 3.933572176816602e-06, "epoch": 4.353469795307039, "percentage": 87.2, "elapsed_time": "23:18:44", "remaining_time": "3:25:19"}
|
| 546 |
+
{"current_steps": 546, "total_steps": 625, "loss": 0.3749, "lr": 3.837441273551137e-06, "epoch": 4.361457813280079, "percentage": 87.36, "elapsed_time": "23:21:17", "remaining_time": "3:22:45"}
|
| 547 |
+
{"current_steps": 547, "total_steps": 625, "loss": 0.3741, "lr": 3.7424403876972924e-06, "epoch": 4.36944583125312, "percentage": 87.52, "elapsed_time": "23:23:50", "remaining_time": "3:20:10"}
|
| 548 |
+
{"current_steps": 548, "total_steps": 625, "loss": 0.3889, "lr": 3.6485724878684382e-06, "epoch": 4.37743384922616, "percentage": 87.68, "elapsed_time": "23:26:22", "remaining_time": "3:17:36"}
|
| 549 |
+
{"current_steps": 549, "total_steps": 625, "loss": 0.3788, "lr": 3.555840507274093e-06, "epoch": 4.385421867199201, "percentage": 87.84, "elapsed_time": "23:28:56", "remaining_time": "3:15:02"}
|
| 550 |
+
{"current_steps": 550, "total_steps": 625, "loss": 0.3833, "lr": 3.464247343628242e-06, "epoch": 4.393409885172241, "percentage": 88.0, "elapsed_time": "23:31:29", "remaining_time": "3:12:28"}
|
| 551 |
+
{"current_steps": 551, "total_steps": 625, "loss": 0.3756, "lr": 3.373795859058837e-06, "epoch": 4.401397903145282, "percentage": 88.16, "elapsed_time": "23:34:01", "remaining_time": "3:09:54"}
|
| 552 |
+
{"current_steps": 552, "total_steps": 625, "loss": 0.3809, "lr": 3.284488880018315e-06, "epoch": 4.409385921118322, "percentage": 88.32, "elapsed_time": "23:36:34", "remaining_time": "3:07:20"}
|
| 553 |
+
{"current_steps": 553, "total_steps": 625, "loss": 0.379, "lr": 3.196329197195307e-06, "epoch": 4.417373939091363, "percentage": 88.48, "elapsed_time": "23:39:07", "remaining_time": "3:04:46"}
|
| 554 |
+
{"current_steps": 554, "total_steps": 625, "loss": 0.3844, "lr": 3.1093195654274024e-06, "epoch": 4.425361957064403, "percentage": 88.64, "elapsed_time": "23:41:40", "remaining_time": "3:02:12"}
|
| 555 |
+
{"current_steps": 555, "total_steps": 625, "loss": 0.3754, "lr": 3.0234627036151186e-06, "epoch": 4.433349975037443, "percentage": 88.8, "elapsed_time": "23:44:13", "remaining_time": "2:59:37"}
|
| 556 |
+
{"current_steps": 556, "total_steps": 625, "loss": 0.3767, "lr": 2.9387612946368647e-06, "epoch": 4.441337993010484, "percentage": 88.96, "elapsed_time": "23:46:45", "remaining_time": "2:57:03"}
|
| 557 |
+
{"current_steps": 557, "total_steps": 625, "loss": 0.3818, "lr": 2.855217985265184e-06, "epoch": 4.449326010983524, "percentage": 89.12, "elapsed_time": "23:49:18", "remaining_time": "2:54:29"}
|
| 558 |
+
{"current_steps": 558, "total_steps": 625, "loss": 0.3789, "lr": 2.7728353860839763e-06, "epoch": 4.457314028956565, "percentage": 89.28, "elapsed_time": "23:51:51", "remaining_time": "2:51:55"}
|
| 559 |
+
{"current_steps": 559, "total_steps": 625, "loss": 0.3721, "lr": 2.6916160714069817e-06, "epoch": 4.465302046929605, "percentage": 89.44, "elapsed_time": "23:54:23", "remaining_time": "2:49:21"}
|
| 560 |
+
{"current_steps": 560, "total_steps": 625, "loss": 0.3777, "lr": 2.6115625791973155e-06, "epoch": 4.473290064902646, "percentage": 89.6, "elapsed_time": "23:56:56", "remaining_time": "2:46:47"}
|
| 561 |
+
{"current_steps": 561, "total_steps": 625, "loss": 0.3805, "lr": 2.5326774109881223e-06, "epoch": 4.481278082875686, "percentage": 89.76, "elapsed_time": "23:59:29", "remaining_time": "2:44:13"}
|
| 562 |
+
{"current_steps": 562, "total_steps": 625, "loss": 0.3746, "lr": 2.454963031804485e-06, "epoch": 4.489266100848727, "percentage": 89.92, "elapsed_time": "1 day, 0:02:02", "remaining_time": "2:41:39"}
|
| 563 |
+
{"current_steps": 563, "total_steps": 625, "loss": 0.3761, "lr": 2.378421870086314e-06, "epoch": 4.497254118821767, "percentage": 90.08, "elapsed_time": "1 day, 0:04:35", "remaining_time": "2:39:05"}
|
| 564 |
+
{"current_steps": 564, "total_steps": 625, "loss": 0.3738, "lr": 2.3030563176125444e-06, "epoch": 4.5052421367948075, "percentage": 90.24, "elapsed_time": "1 day, 0:07:08", "remaining_time": "2:36:31"}
|
| 565 |
+
{"current_steps": 565, "total_steps": 625, "loss": 0.3765, "lr": 2.228868729426319e-06, "epoch": 4.513230154767848, "percentage": 90.4, "elapsed_time": "1 day, 0:09:41", "remaining_time": "2:33:56"}
|
| 566 |
+
{"current_steps": 566, "total_steps": 625, "loss": 0.3778, "lr": 2.1558614237614516e-06, "epoch": 4.521218172740888, "percentage": 90.56, "elapsed_time": "1 day, 0:12:14", "remaining_time": "2:31:22"}
|
| 567 |
+
{"current_steps": 567, "total_steps": 625, "loss": 0.3857, "lr": 2.0840366819699788e-06, "epoch": 4.529206190713929, "percentage": 90.72, "elapsed_time": "1 day, 0:14:46", "remaining_time": "2:28:48"}
|
| 568 |
+
{"current_steps": 568, "total_steps": 625, "loss": 0.3761, "lr": 2.013396748450842e-06, "epoch": 4.537194208686969, "percentage": 90.88, "elapsed_time": "1 day, 0:17:20", "remaining_time": "2:26:14"}
|
| 569 |
+
{"current_steps": 569, "total_steps": 625, "loss": 0.3756, "lr": 1.9439438305797776e-06, "epoch": 4.54518222666001, "percentage": 91.04, "elapsed_time": "1 day, 0:19:54", "remaining_time": "2:23:40"}
|
| 570 |
+
{"current_steps": 570, "total_steps": 625, "loss": 0.3782, "lr": 1.8756800986403466e-06, "epoch": 4.55317024463305, "percentage": 91.2, "elapsed_time": "1 day, 0:22:29", "remaining_time": "2:21:07"}
|
| 571 |
+
{"current_steps": 571, "total_steps": 625, "loss": 0.3776, "lr": 1.808607685756103e-06, "epoch": 4.5611582626060905, "percentage": 91.36, "elapsed_time": "1 day, 0:25:02", "remaining_time": "2:18:32"}
|
| 572 |
+
{"current_steps": 572, "total_steps": 625, "loss": 0.3713, "lr": 1.7427286878239247e-06, "epoch": 4.569146280579131, "percentage": 91.52, "elapsed_time": "1 day, 0:27:38", "remaining_time": "2:15:59"}
|
| 573 |
+
{"current_steps": 573, "total_steps": 625, "loss": 0.3781, "lr": 1.6780451634485606e-06, "epoch": 4.5771342985521715, "percentage": 91.68, "elapsed_time": "1 day, 0:30:12", "remaining_time": "2:13:25"}
|
| 574 |
+
{"current_steps": 574, "total_steps": 625, "loss": 0.3822, "lr": 1.614559133878264e-06, "epoch": 4.585122316525212, "percentage": 91.84, "elapsed_time": "1 day, 0:32:47", "remaining_time": "2:10:51"}
|
| 575 |
+
{"current_steps": 575, "total_steps": 625, "loss": 0.3789, "lr": 1.5522725829416474e-06, "epoch": 4.5931103344982525, "percentage": 92.0, "elapsed_time": "1 day, 0:35:20", "remaining_time": "2:08:17"}
|
| 576 |
+
{"current_steps": 576, "total_steps": 625, "loss": 0.3777, "lr": 1.4911874569856965e-06, "epoch": 4.601098352471293, "percentage": 92.16, "elapsed_time": "1 day, 0:37:55", "remaining_time": "2:05:43"}
|
| 577 |
+
{"current_steps": 577, "total_steps": 625, "loss": 0.3818, "lr": 1.4313056648149393e-06, "epoch": 4.6090863704443334, "percentage": 92.32, "elapsed_time": "1 day, 0:40:29", "remaining_time": "2:03:09"}
|
| 578 |
+
{"current_steps": 578, "total_steps": 625, "loss": 0.3752, "lr": 1.3726290776318175e-06, "epoch": 4.6170743884173735, "percentage": 92.48, "elapsed_time": "1 day, 0:43:03", "remaining_time": "2:00:35"}
|
| 579 |
+
{"current_steps": 579, "total_steps": 625, "loss": 0.3846, "lr": 1.3151595289781738e-06, "epoch": 4.625062406390414, "percentage": 92.64, "elapsed_time": "1 day, 0:45:35", "remaining_time": "1:58:01"}
|
| 580 |
+
{"current_steps": 580, "total_steps": 625, "loss": 0.3884, "lr": 1.2588988146780135e-06, "epoch": 4.6330504243634545, "percentage": 92.8, "elapsed_time": "1 day, 0:48:09", "remaining_time": "1:55:27"}
|
| 581 |
+
{"current_steps": 581, "total_steps": 625, "loss": 0.3841, "lr": 1.2038486927813354e-06, "epoch": 4.641038442336495, "percentage": 92.96, "elapsed_time": "1 day, 0:50:42", "remaining_time": "1:52:53"}
|
| 582 |
+
{"current_steps": 582, "total_steps": 625, "loss": 0.3812, "lr": 1.1500108835092472e-06, "epoch": 4.6490264603095355, "percentage": 93.12, "elapsed_time": "1 day, 0:53:14", "remaining_time": "1:50:19"}
|
| 583 |
+
{"current_steps": 583, "total_steps": 625, "loss": 0.3792, "lr": 1.0973870692001554e-06, "epoch": 4.657014478282576, "percentage": 93.28, "elapsed_time": "1 day, 0:55:48", "remaining_time": "1:47:45"}
|
| 584 |
+
{"current_steps": 584, "total_steps": 625, "loss": 0.3843, "lr": 1.0459788942572423e-06, "epoch": 4.6650024962556165, "percentage": 93.44, "elapsed_time": "1 day, 0:58:21", "remaining_time": "1:45:11"}
|
| 585 |
+
{"current_steps": 585, "total_steps": 625, "loss": 0.3857, "lr": 9.957879650970549e-07, "epoch": 4.6729905142286565, "percentage": 93.6, "elapsed_time": "1 day, 1:00:54", "remaining_time": "1:42:37"}
|
| 586 |
+
{"current_steps": 586, "total_steps": 625, "loss": 0.3874, "lr": 9.468158500993207e-07, "epoch": 4.6809785322016975, "percentage": 93.76, "elapsed_time": "1 day, 1:03:26", "remaining_time": "1:40:03"}
|
| 587 |
+
{"current_steps": 587, "total_steps": 625, "loss": 0.3808, "lr": 8.990640795579186e-07, "epoch": 4.6889665501747375, "percentage": 93.92, "elapsed_time": "1 day, 1:05:59", "remaining_time": "1:37:29"}
|
| 588 |
+
{"current_steps": 588, "total_steps": 625, "loss": 0.3727, "lr": 8.525341456330883e-07, "epoch": 4.6969545681477785, "percentage": 94.08, "elapsed_time": "1 day, 1:08:32", "remaining_time": "1:34:55"}
|
| 589 |
+
{"current_steps": 589, "total_steps": 625, "loss": 0.3761, "lr": 8.072275023047926e-07, "epoch": 4.7049425861208185, "percentage": 94.24, "elapsed_time": "1 day, 1:11:05", "remaining_time": "1:32:21"}
|
| 590 |
+
{"current_steps": 590, "total_steps": 625, "loss": 0.3832, "lr": 7.631455653272613e-07, "epoch": 4.712930604093859, "percentage": 94.4, "elapsed_time": "1 day, 1:13:38", "remaining_time": "1:29:47"}
|
| 591 |
+
{"current_steps": 591, "total_steps": 625, "loss": 0.3749, "lr": 7.202897121847852e-07, "epoch": 4.7209186220668995, "percentage": 94.56, "elapsed_time": "1 day, 1:16:10", "remaining_time": "1:27:13"}
|
| 592 |
+
{"current_steps": 592, "total_steps": 625, "loss": 0.3742, "lr": 6.786612820486449e-07, "epoch": 4.72890664003994, "percentage": 94.72, "elapsed_time": "1 day, 1:18:43", "remaining_time": "1:24:39"}
|
| 593 |
+
{"current_steps": 593, "total_steps": 625, "loss": 0.383, "lr": 6.382615757352817e-07, "epoch": 4.7368946580129805, "percentage": 94.88, "elapsed_time": "1 day, 1:21:16", "remaining_time": "1:22:05"}
|
| 594 |
+
{"current_steps": 594, "total_steps": 625, "loss": 0.3802, "lr": 5.990918556656411e-07, "epoch": 4.744882675986021, "percentage": 95.04, "elapsed_time": "1 day, 1:23:51", "remaining_time": "1:19:31"}
|
| 595 |
+
{"current_steps": 595, "total_steps": 625, "loss": 0.3826, "lr": 5.611533458257245e-07, "epoch": 4.7528706939590615, "percentage": 95.2, "elapsed_time": "1 day, 1:26:25", "remaining_time": "1:16:57"}
|
| 596 |
+
{"current_steps": 596, "total_steps": 625, "loss": 0.375, "lr": 5.2444723172834e-07, "epoch": 4.7608587119321015, "percentage": 95.36, "elapsed_time": "1 day, 1:28:57", "remaining_time": "1:14:23"}
|
| 597 |
+
{"current_steps": 597, "total_steps": 625, "loss": 0.3841, "lr": 4.889746603760693e-07, "epoch": 4.7688467299051425, "percentage": 95.52, "elapsed_time": "1 day, 1:31:30", "remaining_time": "1:11:49"}
|
| 598 |
+
{"current_steps": 598, "total_steps": 625, "loss": 0.3753, "lr": 4.5473674022541213e-07, "epoch": 4.7768347478781825, "percentage": 95.68, "elapsed_time": "1 day, 1:34:03", "remaining_time": "1:09:15"}
|
| 599 |
+
{"current_steps": 599, "total_steps": 625, "loss": 0.3838, "lr": 4.2173454115214783e-07, "epoch": 4.7848227658512235, "percentage": 95.84, "elapsed_time": "1 day, 1:36:35", "remaining_time": "1:06:41"}
|
| 600 |
+
{"current_steps": 600, "total_steps": 625, "loss": 0.3765, "lr": 3.899690944179257e-07, "epoch": 4.7928107838242635, "percentage": 96.0, "elapsed_time": "1 day, 1:39:08", "remaining_time": "1:04:07"}
|
| 601 |
+
{"current_steps": 601, "total_steps": 625, "loss": 0.3834, "lr": 3.5944139263800694e-07, "epoch": 4.8007988017973044, "percentage": 96.16, "elapsed_time": "1 day, 1:41:41", "remaining_time": "1:01:33"}
|
| 602 |
+
{"current_steps": 602, "total_steps": 625, "loss": 0.3694, "lr": 3.3015238975026675e-07, "epoch": 4.8087868197703445, "percentage": 96.32, "elapsed_time": "1 day, 1:44:14", "remaining_time": "0:58:59"}
|
| 603 |
+
{"current_steps": 603, "total_steps": 625, "loss": 0.3783, "lr": 3.021030009853876e-07, "epoch": 4.8167748377433846, "percentage": 96.48, "elapsed_time": "1 day, 1:46:47", "remaining_time": "0:56:26"}
|
| 604 |
+
{"current_steps": 604, "total_steps": 625, "loss": 0.3773, "lr": 2.752941028382594e-07, "epoch": 4.8247628557164255, "percentage": 96.64, "elapsed_time": "1 day, 1:49:19", "remaining_time": "0:53:52"}
|
| 605 |
+
{"current_steps": 605, "total_steps": 625, "loss": 0.3777, "lr": 2.4972653304057073e-07, "epoch": 4.8327508736894655, "percentage": 96.8, "elapsed_time": "1 day, 1:51:54", "remaining_time": "0:51:18"}
|
| 606 |
+
{"current_steps": 606, "total_steps": 625, "loss": 0.3808, "lr": 2.25401090534656e-07, "epoch": 4.8407388916625065, "percentage": 96.96, "elapsed_time": "1 day, 1:54:26", "remaining_time": "0:48:44"}
|
| 607 |
+
{"current_steps": 607, "total_steps": 625, "loss": 0.3744, "lr": 2.0231853544852465e-07, "epoch": 4.8487269096355465, "percentage": 97.12, "elapsed_time": "1 day, 1:56:59", "remaining_time": "0:46:10"}
|
| 608 |
+
{"current_steps": 608, "total_steps": 625, "loss": 0.3825, "lr": 1.8047958907209339e-07, "epoch": 4.8567149276085875, "percentage": 97.28, "elapsed_time": "1 day, 1:59:32", "remaining_time": "0:43:36"}
|
| 609 |
+
{"current_steps": 609, "total_steps": 625, "loss": 0.3749, "lr": 1.5988493383466198e-07, "epoch": 4.8647029455816275, "percentage": 97.44, "elapsed_time": "1 day, 2:02:05", "remaining_time": "0:41:02"}
|
| 610 |
+
{"current_steps": 610, "total_steps": 625, "loss": 0.3748, "lr": 1.40535213283588e-07, "epoch": 4.872690963554668, "percentage": 97.6, "elapsed_time": "1 day, 2:04:38", "remaining_time": "0:38:28"}
|
| 611 |
+
{"current_steps": 611, "total_steps": 625, "loss": 0.3819, "lr": 1.2243103206417418e-07, "epoch": 4.8806789815277085, "percentage": 97.76, "elapsed_time": "1 day, 2:07:11", "remaining_time": "0:35:54"}
|
| 612 |
+
{"current_steps": 612, "total_steps": 625, "loss": 0.3827, "lr": 1.05572955900759e-07, "epoch": 4.888666999500749, "percentage": 97.92, "elapsed_time": "1 day, 2:09:43", "remaining_time": "0:33:20"}
|
| 613 |
+
{"current_steps": 613, "total_steps": 625, "loss": 0.3674, "lr": 8.996151157907306e-08, "epoch": 4.8966550174737895, "percentage": 98.08, "elapsed_time": "1 day, 2:12:16", "remaining_time": "0:30:46"}
|
| 614 |
+
{"current_steps": 614, "total_steps": 625, "loss": 0.3755, "lr": 7.559718692974116e-08, "epoch": 4.90464303544683, "percentage": 98.24, "elapsed_time": "1 day, 2:14:48", "remaining_time": "0:28:12"}
|
| 615 |
+
{"current_steps": 615, "total_steps": 625, "loss": 0.3848, "lr": 6.248043081307664e-08, "epoch": 4.9126310534198705, "percentage": 98.4, "elapsed_time": "1 day, 2:17:22", "remaining_time": "0:25:38"}
|
| 616 |
+
{"current_steps": 616, "total_steps": 625, "loss": 0.3754, "lr": 5.0611653105003824e-08, "epoch": 4.9206190713929105, "percentage": 98.56, "elapsed_time": "1 day, 2:19:55", "remaining_time": "0:23:05"}
|
| 617 |
+
{"current_steps": 617, "total_steps": 625, "loss": 0.384, "lr": 3.99912246843126e-08, "epoch": 4.928607089365951, "percentage": 98.72, "elapsed_time": "1 day, 2:22:29", "remaining_time": "0:20:31"}
|
| 618 |
+
{"current_steps": 618, "total_steps": 625, "loss": 0.3797, "lr": 3.061947742101001e-08, "epoch": 4.9365951073389915, "percentage": 98.88, "elapsed_time": "1 day, 2:25:01", "remaining_time": "0:17:57"}
|
| 619 |
+
{"current_steps": 619, "total_steps": 625, "loss": 0.378, "lr": 2.2496704165995142e-08, "epoch": 4.944583125312032, "percentage": 99.04, "elapsed_time": "1 day, 2:27:34", "remaining_time": "0:15:23"}
|
| 620 |
+
{"current_steps": 620, "total_steps": 625, "loss": 0.3804, "lr": 1.5623158741884247e-08, "epoch": 4.9525711432850725, "percentage": 99.2, "elapsed_time": "1 day, 2:30:07", "remaining_time": "0:12:49"}
|
| 621 |
+
{"current_steps": 621, "total_steps": 625, "loss": 0.3661, "lr": 9.999055935074887e-09, "epoch": 4.960559161258113, "percentage": 99.36, "elapsed_time": "1 day, 2:32:40", "remaining_time": "0:10:15"}
|
| 622 |
+
{"current_steps": 622, "total_steps": 625, "loss": 0.3829, "lr": 5.624571489053488e-09, "epoch": 4.9685471792311535, "percentage": 99.52, "elapsed_time": "1 day, 2:35:13", "remaining_time": "0:07:41"}
|
| 623 |
+
{"current_steps": 623, "total_steps": 625, "loss": 0.3842, "lr": 2.499842098901972e-09, "epoch": 4.976535197204194, "percentage": 99.68, "elapsed_time": "1 day, 2:37:47", "remaining_time": "0:05:07"}
|
| 624 |
+
{"current_steps": 624, "total_steps": 625, "loss": 0.3817, "lr": 6.249654069989674e-10, "epoch": 4.9845232151772345, "percentage": 99.84, "elapsed_time": "1 day, 2:40:21", "remaining_time": "0:02:33"}
|
| 625 |
+
{"current_steps": 625, "total_steps": 625, "loss": 0.377, "lr": 0.0, "epoch": 4.992511233150275, "percentage": 100.0, "elapsed_time": "1 day, 2:42:53", "remaining_time": "0:00:00"}
|
| 626 |
+
{"current_steps": 625, "total_steps": 625, "epoch": 4.992511233150275, "percentage": 100.0, "elapsed_time": "1 day, 2:44:25", "remaining_time": "0:00:00"}
|