Training in progress, epoch 2
Browse files- model-00001-of-00004.safetensors +1 -1
- model-00002-of-00004.safetensors +1 -1
- model-00003-of-00004.safetensors +1 -1
- model-00004-of-00004.safetensors +1 -1
- trainer_log.jsonl +363 -0
- training_args.bin +2 -2
model-00001-of-00004.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 4877660776
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:9b573c6095682b47921bd586677914845b4dd1a7483c35cd4797d6127d8e6f45
|
| 3 |
size 4877660776
|
model-00002-of-00004.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 4932751008
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:7bc7c0d1790bd7eb805a873d71f930a05e85e2ecc406f0fae2b0e3983a8f2efa
|
| 3 |
size 4932751008
|
model-00003-of-00004.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 4330865200
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:09c8c1f64976e52b5e01c46ba354b008e5e79b267df98b99c13b66dd2d11df4d
|
| 3 |
size 4330865200
|
model-00004-of-00004.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 1089994880
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:2500b749c7c9a9f92fd5bd26e4aad1adc9509aa1afeb79fdd299e5cb38cbf716
|
| 3 |
size 1089994880
|
trainer_log.jsonl
CHANGED
|
@@ -495,3 +495,366 @@
|
|
| 495 |
{"current_steps": 495, "total_steps": 1230, "loss": 0.3976, "lr": 2.9852175996655676e-05, "epoch": 2.010136847440446, "percentage": 40.24, "elapsed_time": "4:26:59", "remaining_time": "6:36:26"}
|
| 496 |
{"current_steps": 496, "total_steps": 1230, "loss": 0.3936, "lr": 2.980274210295326e-05, "epoch": 2.0141915864166244, "percentage": 40.33, "elapsed_time": "4:27:30", "remaining_time": "6:35:52"}
|
| 497 |
{"current_steps": 497, "total_steps": 1230, "loss": 0.3915, "lr": 2.9753229259313578e-05, "epoch": 2.018246325392803, "percentage": 40.41, "elapsed_time": "4:28:01", "remaining_time": "6:35:18"}
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 495 |
{"current_steps": 495, "total_steps": 1230, "loss": 0.3976, "lr": 2.9852175996655676e-05, "epoch": 2.010136847440446, "percentage": 40.24, "elapsed_time": "4:26:59", "remaining_time": "6:36:26"}
|
| 496 |
{"current_steps": 496, "total_steps": 1230, "loss": 0.3936, "lr": 2.980274210295326e-05, "epoch": 2.0141915864166244, "percentage": 40.33, "elapsed_time": "4:27:30", "remaining_time": "6:35:52"}
|
| 497 |
{"current_steps": 497, "total_steps": 1230, "loss": 0.3915, "lr": 2.9753229259313578e-05, "epoch": 2.018246325392803, "percentage": 40.41, "elapsed_time": "4:28:01", "remaining_time": "6:35:18"}
|
| 498 |
+
{"current_steps": 498, "total_steps": 1230, "loss": 0.3682, "lr": 2.9703637864506274e-05, "epoch": 2.0223010643689814, "percentage": 40.49, "elapsed_time": "4:28:33", "remaining_time": "6:34:45"}
|
| 499 |
+
{"current_steps": 499, "total_steps": 1230, "loss": 0.3862, "lr": 2.965396831793362e-05, "epoch": 2.02635580334516, "percentage": 40.57, "elapsed_time": "4:29:02", "remaining_time": "6:34:08"}
|
| 500 |
+
{"current_steps": 500, "total_steps": 1230, "loss": 0.3861, "lr": 2.9604221019627316e-05, "epoch": 2.030410542321338, "percentage": 40.65, "elapsed_time": "4:29:34", "remaining_time": "6:33:34"}
|
| 501 |
+
{"current_steps": 501, "total_steps": 1230, "loss": 0.3747, "lr": 2.955439637024526e-05, "epoch": 2.0344652812975164, "percentage": 40.73, "elapsed_time": "4:30:05", "remaining_time": "6:32:59"}
|
| 502 |
+
{"current_steps": 502, "total_steps": 1230, "loss": 0.3705, "lr": 2.9504494771068334e-05, "epoch": 2.038520020273695, "percentage": 40.81, "elapsed_time": "4:30:44", "remaining_time": "6:32:38"}
|
| 503 |
+
{"current_steps": 503, "total_steps": 1230, "loss": 0.3784, "lr": 2.9454516623997156e-05, "epoch": 2.0425747592498733, "percentage": 40.89, "elapsed_time": "4:31:16", "remaining_time": "6:32:04"}
|
| 504 |
+
{"current_steps": 504, "total_steps": 1230, "loss": 0.3628, "lr": 2.9404462331548847e-05, "epoch": 2.046629498226052, "percentage": 40.98, "elapsed_time": "4:31:46", "remaining_time": "6:31:28"}
|
| 505 |
+
{"current_steps": 505, "total_steps": 1230, "loss": 0.3666, "lr": 2.93543322968538e-05, "epoch": 2.0506842372022303, "percentage": 41.06, "elapsed_time": "4:32:18", "remaining_time": "6:30:56"}
|
| 506 |
+
{"current_steps": 506, "total_steps": 1230, "loss": 0.377, "lr": 2.9304126923652428e-05, "epoch": 2.0547389761784087, "percentage": 41.14, "elapsed_time": "4:32:48", "remaining_time": "6:30:20"}
|
| 507 |
+
{"current_steps": 507, "total_steps": 1230, "loss": 0.3981, "lr": 2.9253846616291896e-05, "epoch": 2.0587937151545868, "percentage": 41.22, "elapsed_time": "4:33:20", "remaining_time": "6:29:47"}
|
| 508 |
+
{"current_steps": 508, "total_steps": 1230, "loss": 0.381, "lr": 2.9203491779722896e-05, "epoch": 2.0628484541307652, "percentage": 41.3, "elapsed_time": "4:33:54", "remaining_time": "6:29:18"}
|
| 509 |
+
{"current_steps": 509, "total_steps": 1230, "loss": 0.3725, "lr": 2.9153062819496357e-05, "epoch": 2.0669031931069437, "percentage": 41.38, "elapsed_time": "4:34:26", "remaining_time": "6:28:45"}
|
| 510 |
+
{"current_steps": 510, "total_steps": 1230, "loss": 0.3683, "lr": 2.9102560141760178e-05, "epoch": 2.070957932083122, "percentage": 41.46, "elapsed_time": "4:35:00", "remaining_time": "6:28:14"}
|
| 511 |
+
{"current_steps": 511, "total_steps": 1230, "loss": 0.3942, "lr": 2.9051984153256004e-05, "epoch": 2.0750126710593007, "percentage": 41.54, "elapsed_time": "4:35:35", "remaining_time": "6:27:46"}
|
| 512 |
+
{"current_steps": 512, "total_steps": 1230, "loss": 0.3484, "lr": 2.900133526131588e-05, "epoch": 2.079067410035479, "percentage": 41.63, "elapsed_time": "4:36:03", "remaining_time": "6:27:08"}
|
| 513 |
+
{"current_steps": 513, "total_steps": 1230, "loss": 0.3675, "lr": 2.8950613873859025e-05, "epoch": 2.0831221490116576, "percentage": 41.71, "elapsed_time": "4:36:37", "remaining_time": "6:26:36"}
|
| 514 |
+
{"current_steps": 514, "total_steps": 1230, "loss": 0.4005, "lr": 2.8899820399388515e-05, "epoch": 2.0871768879878356, "percentage": 41.79, "elapsed_time": "4:37:06", "remaining_time": "6:26:01"}
|
| 515 |
+
{"current_steps": 515, "total_steps": 1230, "loss": 0.3911, "lr": 2.8848955246988012e-05, "epoch": 2.091231626964014, "percentage": 41.87, "elapsed_time": "4:37:42", "remaining_time": "6:25:33"}
|
| 516 |
+
{"current_steps": 516, "total_steps": 1230, "loss": 0.3752, "lr": 2.879801882631847e-05, "epoch": 2.0952863659401926, "percentage": 41.95, "elapsed_time": "4:38:11", "remaining_time": "6:24:56"}
|
| 517 |
+
{"current_steps": 517, "total_steps": 1230, "loss": 0.369, "lr": 2.8747011547614808e-05, "epoch": 2.099341104916371, "percentage": 42.03, "elapsed_time": "4:38:42", "remaining_time": "6:24:22"}
|
| 518 |
+
{"current_steps": 518, "total_steps": 1230, "loss": 0.3768, "lr": 2.8695933821682635e-05, "epoch": 2.1033958438925495, "percentage": 42.11, "elapsed_time": "4:39:11", "remaining_time": "6:23:44"}
|
| 519 |
+
{"current_steps": 519, "total_steps": 1230, "loss": 0.3587, "lr": 2.864478605989494e-05, "epoch": 2.107450582868728, "percentage": 42.2, "elapsed_time": "4:39:43", "remaining_time": "6:23:12"}
|
| 520 |
+
{"current_steps": 520, "total_steps": 1230, "loss": 0.3845, "lr": 2.8593568674188765e-05, "epoch": 2.111505321844906, "percentage": 42.28, "elapsed_time": "4:40:16", "remaining_time": "6:22:40"}
|
| 521 |
+
{"current_steps": 521, "total_steps": 1230, "loss": 0.3584, "lr": 2.8542282077061892e-05, "epoch": 2.1155600608210845, "percentage": 42.36, "elapsed_time": "4:40:41", "remaining_time": "6:21:58"}
|
| 522 |
+
{"current_steps": 522, "total_steps": 1230, "loss": 0.3785, "lr": 2.8490926681569523e-05, "epoch": 2.119614799797263, "percentage": 42.44, "elapsed_time": "4:41:15", "remaining_time": "6:21:28"}
|
| 523 |
+
{"current_steps": 523, "total_steps": 1230, "loss": 0.3632, "lr": 2.8439502901320956e-05, "epoch": 2.1236695387734414, "percentage": 42.52, "elapsed_time": "4:41:56", "remaining_time": "6:21:07"}
|
| 524 |
+
{"current_steps": 524, "total_steps": 1230, "loss": 0.3812, "lr": 2.8388011150476237e-05, "epoch": 2.12772427774962, "percentage": 42.6, "elapsed_time": "4:42:26", "remaining_time": "6:20:31"}
|
| 525 |
+
{"current_steps": 525, "total_steps": 1230, "loss": 0.3779, "lr": 2.8336451843742866e-05, "epoch": 2.1317790167257984, "percentage": 42.68, "elapsed_time": "4:42:58", "remaining_time": "6:19:59"}
|
| 526 |
+
{"current_steps": 526, "total_steps": 1230, "loss": 0.3831, "lr": 2.8284825396372387e-05, "epoch": 2.135833755701977, "percentage": 42.76, "elapsed_time": "4:43:31", "remaining_time": "6:19:27"}
|
| 527 |
+
{"current_steps": 527, "total_steps": 1230, "loss": 0.4052, "lr": 2.8233132224157132e-05, "epoch": 2.139888494678155, "percentage": 42.85, "elapsed_time": "4:44:02", "remaining_time": "6:18:54"}
|
| 528 |
+
{"current_steps": 528, "total_steps": 1230, "loss": 0.3783, "lr": 2.8181372743426805e-05, "epoch": 2.1439432336543334, "percentage": 42.93, "elapsed_time": "4:44:31", "remaining_time": "6:18:17"}
|
| 529 |
+
{"current_steps": 529, "total_steps": 1230, "loss": 0.3677, "lr": 2.8129547371045128e-05, "epoch": 2.147997972630512, "percentage": 43.01, "elapsed_time": "4:45:02", "remaining_time": "6:17:43"}
|
| 530 |
+
{"current_steps": 530, "total_steps": 1230, "loss": 0.4003, "lr": 2.8077656524406534e-05, "epoch": 2.1520527116066903, "percentage": 43.09, "elapsed_time": "4:45:40", "remaining_time": "6:17:18"}
|
| 531 |
+
{"current_steps": 531, "total_steps": 1230, "loss": 0.3913, "lr": 2.802570062143278e-05, "epoch": 2.156107450582869, "percentage": 43.17, "elapsed_time": "4:46:10", "remaining_time": "6:16:42"}
|
| 532 |
+
{"current_steps": 532, "total_steps": 1230, "loss": 0.3891, "lr": 2.7973680080569555e-05, "epoch": 2.1601621895590473, "percentage": 43.25, "elapsed_time": "4:46:40", "remaining_time": "6:16:08"}
|
| 533 |
+
{"current_steps": 533, "total_steps": 1230, "loss": 0.3715, "lr": 2.792159532078314e-05, "epoch": 2.1642169285352257, "percentage": 43.33, "elapsed_time": "4:47:13", "remaining_time": "6:15:36"}
|
| 534 |
+
{"current_steps": 534, "total_steps": 1230, "loss": 0.3683, "lr": 2.7869446761557033e-05, "epoch": 2.1682716675114038, "percentage": 43.41, "elapsed_time": "4:47:43", "remaining_time": "6:15:00"}
|
| 535 |
+
{"current_steps": 535, "total_steps": 1230, "loss": 0.3735, "lr": 2.781723482288857e-05, "epoch": 2.1723264064875822, "percentage": 43.5, "elapsed_time": "4:48:18", "remaining_time": "6:14:31"}
|
| 536 |
+
{"current_steps": 536, "total_steps": 1230, "loss": 0.4044, "lr": 2.7764959925285517e-05, "epoch": 2.1763811454637607, "percentage": 43.58, "elapsed_time": "4:48:49", "remaining_time": "6:13:57"}
|
| 537 |
+
{"current_steps": 537, "total_steps": 1230, "loss": 0.3889, "lr": 2.771262248976272e-05, "epoch": 2.180435884439939, "percentage": 43.66, "elapsed_time": "4:49:20", "remaining_time": "6:13:23"}
|
| 538 |
+
{"current_steps": 538, "total_steps": 1230, "loss": 0.3786, "lr": 2.7660222937838677e-05, "epoch": 2.1844906234161177, "percentage": 43.74, "elapsed_time": "4:49:48", "remaining_time": "6:12:46"}
|
| 539 |
+
{"current_steps": 539, "total_steps": 1230, "loss": 0.366, "lr": 2.7607761691532186e-05, "epoch": 2.188545362392296, "percentage": 43.82, "elapsed_time": "4:50:20", "remaining_time": "6:12:13"}
|
| 540 |
+
{"current_steps": 540, "total_steps": 1230, "loss": 0.3834, "lr": 2.7555239173358916e-05, "epoch": 2.1926001013684746, "percentage": 43.9, "elapsed_time": "4:50:51", "remaining_time": "6:11:38"}
|
| 541 |
+
{"current_steps": 541, "total_steps": 1230, "loss": 0.3628, "lr": 2.7502655806328e-05, "epoch": 2.1966548403446526, "percentage": 43.98, "elapsed_time": "4:51:23", "remaining_time": "6:11:06"}
|
| 542 |
+
{"current_steps": 542, "total_steps": 1230, "loss": 0.378, "lr": 2.7450012013938648e-05, "epoch": 2.200709579320831, "percentage": 44.07, "elapsed_time": "4:52:00", "remaining_time": "6:10:39"}
|
| 543 |
+
{"current_steps": 543, "total_steps": 1230, "loss": 0.385, "lr": 2.739730822017673e-05, "epoch": 2.2047643182970096, "percentage": 44.15, "elapsed_time": "4:52:34", "remaining_time": "6:10:10"}
|
| 544 |
+
{"current_steps": 544, "total_steps": 1230, "loss": 0.3818, "lr": 2.7344544849511355e-05, "epoch": 2.208819057273188, "percentage": 44.23, "elapsed_time": "4:53:09", "remaining_time": "6:09:41"}
|
| 545 |
+
{"current_steps": 545, "total_steps": 1230, "loss": 0.3681, "lr": 2.7291722326891456e-05, "epoch": 2.2128737962493665, "percentage": 44.31, "elapsed_time": "4:53:42", "remaining_time": "6:09:09"}
|
| 546 |
+
{"current_steps": 546, "total_steps": 1230, "loss": 0.3649, "lr": 2.723884107774236e-05, "epoch": 2.216928535225545, "percentage": 44.39, "elapsed_time": "4:54:17", "remaining_time": "6:08:40"}
|
| 547 |
+
{"current_steps": 547, "total_steps": 1230, "loss": 0.3798, "lr": 2.718590152796239e-05, "epoch": 2.220983274201723, "percentage": 44.47, "elapsed_time": "4:54:47", "remaining_time": "6:08:05"}
|
| 548 |
+
{"current_steps": 548, "total_steps": 1230, "loss": 0.3808, "lr": 2.71329041039194e-05, "epoch": 2.2250380131779015, "percentage": 44.55, "elapsed_time": "4:55:17", "remaining_time": "6:07:30"}
|
| 549 |
+
{"current_steps": 549, "total_steps": 1230, "loss": 0.3673, "lr": 2.7079849232447357e-05, "epoch": 2.22909275215408, "percentage": 44.63, "elapsed_time": "4:55:44", "remaining_time": "6:06:50"}
|
| 550 |
+
{"current_steps": 550, "total_steps": 1230, "loss": 0.3826, "lr": 2.7026737340842895e-05, "epoch": 2.2331474911302585, "percentage": 44.72, "elapsed_time": "4:56:17", "remaining_time": "6:06:19"}
|
| 551 |
+
{"current_steps": 551, "total_steps": 1230, "loss": 0.3935, "lr": 2.697356885686189e-05, "epoch": 2.237202230106437, "percentage": 44.8, "elapsed_time": "4:56:51", "remaining_time": "6:05:49"}
|
| 552 |
+
{"current_steps": 552, "total_steps": 1230, "loss": 0.3876, "lr": 2.6920344208716014e-05, "epoch": 2.2412569690826154, "percentage": 44.88, "elapsed_time": "4:57:19", "remaining_time": "6:05:11"}
|
| 553 |
+
{"current_steps": 553, "total_steps": 1230, "loss": 0.3913, "lr": 2.6867063825069252e-05, "epoch": 2.245311708058794, "percentage": 44.96, "elapsed_time": "4:57:50", "remaining_time": "6:04:37"}
|
| 554 |
+
{"current_steps": 554, "total_steps": 1230, "loss": 0.4115, "lr": 2.6813728135034494e-05, "epoch": 2.249366447034972, "percentage": 45.04, "elapsed_time": "4:58:22", "remaining_time": "6:04:05"}
|
| 555 |
+
{"current_steps": 555, "total_steps": 1230, "loss": 0.3749, "lr": 2.6760337568170056e-05, "epoch": 2.2534211860111504, "percentage": 45.12, "elapsed_time": "4:58:53", "remaining_time": "6:03:30"}
|
| 556 |
+
{"current_steps": 556, "total_steps": 1230, "loss": 0.4028, "lr": 2.6706892554476226e-05, "epoch": 2.257475924987329, "percentage": 45.2, "elapsed_time": "4:59:23", "remaining_time": "6:02:55"}
|
| 557 |
+
{"current_steps": 557, "total_steps": 1230, "loss": 0.3801, "lr": 2.6653393524391795e-05, "epoch": 2.2615306639635073, "percentage": 45.28, "elapsed_time": "4:59:54", "remaining_time": "6:02:21"}
|
| 558 |
+
{"current_steps": 558, "total_steps": 1230, "loss": 0.3773, "lr": 2.6599840908790592e-05, "epoch": 2.265585402939686, "percentage": 45.37, "elapsed_time": "5:00:25", "remaining_time": "6:01:48"}
|
| 559 |
+
{"current_steps": 559, "total_steps": 1230, "loss": 0.3895, "lr": 2.6546235138978028e-05, "epoch": 2.2696401419158643, "percentage": 45.45, "elapsed_time": "5:00:57", "remaining_time": "6:01:15"}
|
| 560 |
+
{"current_steps": 560, "total_steps": 1230, "loss": 0.3963, "lr": 2.6492576646687597e-05, "epoch": 2.2736948808920427, "percentage": 45.53, "elapsed_time": "5:01:29", "remaining_time": "6:00:43"}
|
| 561 |
+
{"current_steps": 561, "total_steps": 1230, "loss": 0.3903, "lr": 2.6438865864077425e-05, "epoch": 2.2777496198682208, "percentage": 45.61, "elapsed_time": "5:02:01", "remaining_time": "6:00:10"}
|
| 562 |
+
{"current_steps": 562, "total_steps": 1230, "loss": 0.3713, "lr": 2.6385103223726766e-05, "epoch": 2.2818043588443992, "percentage": 45.69, "elapsed_time": "5:02:32", "remaining_time": "5:59:36"}
|
| 563 |
+
{"current_steps": 563, "total_steps": 1230, "loss": 0.3798, "lr": 2.6331289158632537e-05, "epoch": 2.2858590978205777, "percentage": 45.77, "elapsed_time": "5:03:02", "remaining_time": "5:59:01"}
|
| 564 |
+
{"current_steps": 564, "total_steps": 1230, "loss": 0.3952, "lr": 2.6277424102205817e-05, "epoch": 2.289913836796756, "percentage": 45.85, "elapsed_time": "5:03:32", "remaining_time": "5:58:25"}
|
| 565 |
+
{"current_steps": 565, "total_steps": 1230, "loss": 0.4011, "lr": 2.6223508488268374e-05, "epoch": 2.2939685757729347, "percentage": 45.93, "elapsed_time": "5:04:01", "remaining_time": "5:57:50"}
|
| 566 |
+
{"current_steps": 566, "total_steps": 1230, "loss": 0.3659, "lr": 2.6169542751049148e-05, "epoch": 2.298023314749113, "percentage": 46.02, "elapsed_time": "5:04:32", "remaining_time": "5:57:16"}
|
| 567 |
+
{"current_steps": 567, "total_steps": 1230, "loss": 0.3799, "lr": 2.6115527325180754e-05, "epoch": 2.3020780537252916, "percentage": 46.1, "elapsed_time": "5:05:11", "remaining_time": "5:56:52"}
|
| 568 |
+
{"current_steps": 568, "total_steps": 1230, "loss": 0.3851, "lr": 2.606146264569603e-05, "epoch": 2.3061327927014696, "percentage": 46.18, "elapsed_time": "5:05:43", "remaining_time": "5:56:18"}
|
| 569 |
+
{"current_steps": 569, "total_steps": 1230, "loss": 0.3707, "lr": 2.6007349148024447e-05, "epoch": 2.310187531677648, "percentage": 46.26, "elapsed_time": "5:06:16", "remaining_time": "5:55:48"}
|
| 570 |
+
{"current_steps": 570, "total_steps": 1230, "loss": 0.3707, "lr": 2.5953187267988694e-05, "epoch": 2.3142422706538266, "percentage": 46.34, "elapsed_time": "5:06:50", "remaining_time": "5:55:17"}
|
| 571 |
+
{"current_steps": 571, "total_steps": 1230, "loss": 0.3923, "lr": 2.5898977441801097e-05, "epoch": 2.318297009630005, "percentage": 46.42, "elapsed_time": "5:07:20", "remaining_time": "5:54:42"}
|
| 572 |
+
{"current_steps": 572, "total_steps": 1230, "loss": 0.3681, "lr": 2.584472010606015e-05, "epoch": 2.3223517486061835, "percentage": 46.5, "elapsed_time": "5:07:46", "remaining_time": "5:54:02"}
|
| 573 |
+
{"current_steps": 573, "total_steps": 1230, "loss": 0.4125, "lr": 2.5790415697746976e-05, "epoch": 2.326406487582362, "percentage": 46.59, "elapsed_time": "5:08:21", "remaining_time": "5:53:33"}
|
| 574 |
+
{"current_steps": 574, "total_steps": 1230, "loss": 0.3805, "lr": 2.5736064654221808e-05, "epoch": 2.3304612265585405, "percentage": 46.67, "elapsed_time": "5:08:51", "remaining_time": "5:52:59"}
|
| 575 |
+
{"current_steps": 575, "total_steps": 1230, "loss": 0.3857, "lr": 2.568166741322048e-05, "epoch": 2.3345159655347185, "percentage": 46.75, "elapsed_time": "5:09:21", "remaining_time": "5:52:23"}
|
| 576 |
+
{"current_steps": 576, "total_steps": 1230, "loss": 0.3654, "lr": 2.56272244128509e-05, "epoch": 2.338570704510897, "percentage": 46.83, "elapsed_time": "5:09:52", "remaining_time": "5:51:50"}
|
| 577 |
+
{"current_steps": 577, "total_steps": 1230, "loss": 0.3641, "lr": 2.55727360915895e-05, "epoch": 2.3426254434870755, "percentage": 46.91, "elapsed_time": "5:10:24", "remaining_time": "5:51:17"}
|
| 578 |
+
{"current_steps": 578, "total_steps": 1230, "loss": 0.3951, "lr": 2.5518202888277734e-05, "epoch": 2.346680182463254, "percentage": 46.99, "elapsed_time": "5:10:53", "remaining_time": "5:50:42"}
|
| 579 |
+
{"current_steps": 579, "total_steps": 1230, "loss": 0.368, "lr": 2.5463625242118523e-05, "epoch": 2.3507349214394324, "percentage": 47.07, "elapsed_time": "5:11:29", "remaining_time": "5:50:13"}
|
| 580 |
+
{"current_steps": 580, "total_steps": 1230, "loss": 0.3842, "lr": 2.5409003592672723e-05, "epoch": 2.354789660415611, "percentage": 47.15, "elapsed_time": "5:11:58", "remaining_time": "5:49:38"}
|
| 581 |
+
{"current_steps": 581, "total_steps": 1230, "loss": 0.3799, "lr": 2.535433837985559e-05, "epoch": 2.3588443993917894, "percentage": 47.24, "elapsed_time": "5:12:30", "remaining_time": "5:49:05"}
|
| 582 |
+
{"current_steps": 582, "total_steps": 1230, "loss": 0.3767, "lr": 2.529963004393324e-05, "epoch": 2.3628991383679674, "percentage": 47.32, "elapsed_time": "5:13:02", "remaining_time": "5:48:33"}
|
| 583 |
+
{"current_steps": 583, "total_steps": 1230, "loss": 0.3995, "lr": 2.524487902551908e-05, "epoch": 2.366953877344146, "percentage": 47.4, "elapsed_time": "5:13:35", "remaining_time": "5:48:00"}
|
| 584 |
+
{"current_steps": 584, "total_steps": 1230, "loss": 0.3919, "lr": 2.519008576557029e-05, "epoch": 2.3710086163203243, "percentage": 47.48, "elapsed_time": "5:14:11", "remaining_time": "5:47:33"}
|
| 585 |
+
{"current_steps": 585, "total_steps": 1230, "loss": 0.3703, "lr": 2.5135250705384254e-05, "epoch": 2.375063355296503, "percentage": 47.56, "elapsed_time": "5:14:49", "remaining_time": "5:47:06"}
|
| 586 |
+
{"current_steps": 586, "total_steps": 1230, "loss": 0.3507, "lr": 2.5080374286595007e-05, "epoch": 2.3791180942726813, "percentage": 47.64, "elapsed_time": "5:15:17", "remaining_time": "5:46:30"}
|
| 587 |
+
{"current_steps": 587, "total_steps": 1230, "loss": 0.3817, "lr": 2.5025456951169677e-05, "epoch": 2.3831728332488598, "percentage": 47.72, "elapsed_time": "5:15:50", "remaining_time": "5:45:57"}
|
| 588 |
+
{"current_steps": 588, "total_steps": 1230, "loss": 0.388, "lr": 2.4970499141404942e-05, "epoch": 2.3872275722250382, "percentage": 47.8, "elapsed_time": "5:16:19", "remaining_time": "5:45:22"}
|
| 589 |
+
{"current_steps": 589, "total_steps": 1230, "loss": 0.3691, "lr": 2.491550129992345e-05, "epoch": 2.3912823112012163, "percentage": 47.89, "elapsed_time": "5:16:53", "remaining_time": "5:44:52"}
|
| 590 |
+
{"current_steps": 590, "total_steps": 1230, "loss": 0.3937, "lr": 2.486046386967024e-05, "epoch": 2.3953370501773947, "percentage": 47.97, "elapsed_time": "5:17:23", "remaining_time": "5:44:17"}
|
| 591 |
+
{"current_steps": 591, "total_steps": 1230, "loss": 0.3959, "lr": 2.4805387293909214e-05, "epoch": 2.399391789153573, "percentage": 48.05, "elapsed_time": "5:18:02", "remaining_time": "5:43:52"}
|
| 592 |
+
{"current_steps": 592, "total_steps": 1230, "loss": 0.3694, "lr": 2.4750272016219552e-05, "epoch": 2.4034465281297517, "percentage": 48.13, "elapsed_time": "5:18:34", "remaining_time": "5:43:19"}
|
| 593 |
+
{"current_steps": 593, "total_steps": 1230, "loss": 0.3961, "lr": 2.4695118480492114e-05, "epoch": 2.40750126710593, "percentage": 48.21, "elapsed_time": "5:19:09", "remaining_time": "5:42:50"}
|
| 594 |
+
{"current_steps": 594, "total_steps": 1230, "loss": 0.378, "lr": 2.4639927130925898e-05, "epoch": 2.4115560060821086, "percentage": 48.29, "elapsed_time": "5:19:42", "remaining_time": "5:42:18"}
|
| 595 |
+
{"current_steps": 595, "total_steps": 1230, "loss": 0.3768, "lr": 2.458469841202444e-05, "epoch": 2.415610745058287, "percentage": 48.37, "elapsed_time": "5:20:19", "remaining_time": "5:41:51"}
|
| 596 |
+
{"current_steps": 596, "total_steps": 1230, "loss": 0.3624, "lr": 2.452943276859226e-05, "epoch": 2.419665484034465, "percentage": 48.46, "elapsed_time": "5:20:50", "remaining_time": "5:41:18"}
|
| 597 |
+
{"current_steps": 597, "total_steps": 1230, "loss": 0.3722, "lr": 2.447413064573125e-05, "epoch": 2.4237202230106436, "percentage": 48.54, "elapsed_time": "5:21:22", "remaining_time": "5:40:45"}
|
| 598 |
+
{"current_steps": 598, "total_steps": 1230, "loss": 0.3822, "lr": 2.4418792488837095e-05, "epoch": 2.427774961986822, "percentage": 48.62, "elapsed_time": "5:21:58", "remaining_time": "5:40:17"}
|
| 599 |
+
{"current_steps": 599, "total_steps": 1230, "loss": 0.3669, "lr": 2.4363418743595713e-05, "epoch": 2.4318297009630006, "percentage": 48.7, "elapsed_time": "5:22:31", "remaining_time": "5:39:44"}
|
| 600 |
+
{"current_steps": 600, "total_steps": 1230, "loss": 0.3739, "lr": 2.430800985597963e-05, "epoch": 2.435884439939179, "percentage": 48.78, "elapsed_time": "5:23:02", "remaining_time": "5:39:11"}
|
| 601 |
+
{"current_steps": 601, "total_steps": 1230, "loss": 0.3726, "lr": 2.4252566272244415e-05, "epoch": 2.4399391789153575, "percentage": 48.86, "elapsed_time": "5:23:32", "remaining_time": "5:38:36"}
|
| 602 |
+
{"current_steps": 602, "total_steps": 1230, "loss": 0.3878, "lr": 2.4197088438925063e-05, "epoch": 2.443993917891536, "percentage": 48.94, "elapsed_time": "5:24:06", "remaining_time": "5:38:05"}
|
| 603 |
+
{"current_steps": 603, "total_steps": 1230, "loss": 0.3748, "lr": 2.4141576802832417e-05, "epoch": 2.448048656867714, "percentage": 49.02, "elapsed_time": "5:24:38", "remaining_time": "5:37:34"}
|
| 604 |
+
{"current_steps": 604, "total_steps": 1230, "loss": 0.3626, "lr": 2.408603181104957e-05, "epoch": 2.4521033958438925, "percentage": 49.11, "elapsed_time": "5:25:12", "remaining_time": "5:37:03"}
|
| 605 |
+
{"current_steps": 605, "total_steps": 1230, "loss": 0.3899, "lr": 2.4030453910928245e-05, "epoch": 2.456158134820071, "percentage": 49.19, "elapsed_time": "5:25:47", "remaining_time": "5:36:33"}
|
| 606 |
+
{"current_steps": 606, "total_steps": 1230, "loss": 0.3872, "lr": 2.397484355008521e-05, "epoch": 2.4602128737962494, "percentage": 49.27, "elapsed_time": "5:26:20", "remaining_time": "5:36:02"}
|
| 607 |
+
{"current_steps": 607, "total_steps": 1230, "loss": 0.401, "lr": 2.3919201176398662e-05, "epoch": 2.464267612772428, "percentage": 49.35, "elapsed_time": "5:26:53", "remaining_time": "5:35:30"}
|
| 608 |
+
{"current_steps": 493, "total_steps": 1230, "loss": 0.4399, "lr": 2.995080534235264e-05, "epoch": 2.0040506329113925, "percentage": 40.08, "elapsed_time": "0:00:37", "remaining_time": "0:00:56"}
|
| 609 |
+
{"current_steps": 494, "total_steps": 1230, "loss": 0.389, "lr": 2.9901530542287044e-05, "epoch": 2.008101265822785, "percentage": 40.16, "elapsed_time": "0:01:04", "remaining_time": "0:01:36"}
|
| 610 |
+
{"current_steps": 495, "total_steps": 1230, "loss": 0.3673, "lr": 2.9852175996655676e-05, "epoch": 2.012151898734177, "percentage": 40.24, "elapsed_time": "0:01:36", "remaining_time": "0:02:23"}
|
| 611 |
+
{"current_steps": 496, "total_steps": 1230, "loss": 0.3749, "lr": 2.980274210295326e-05, "epoch": 2.0162025316455696, "percentage": 40.33, "elapsed_time": "0:02:04", "remaining_time": "0:03:04"}
|
| 612 |
+
{"current_steps": 497, "total_steps": 1230, "loss": 0.3551, "lr": 2.9753229259313578e-05, "epoch": 2.020253164556962, "percentage": 40.41, "elapsed_time": "0:02:37", "remaining_time": "0:03:52"}
|
| 613 |
+
{"current_steps": 498, "total_steps": 1230, "loss": 0.3934, "lr": 2.9703637864506274e-05, "epoch": 2.0243037974683546, "percentage": 40.49, "elapsed_time": "0:03:05", "remaining_time": "0:04:33"}
|
| 614 |
+
{"current_steps": 499, "total_steps": 1230, "loss": 0.3804, "lr": 2.965396831793362e-05, "epoch": 2.0283544303797467, "percentage": 40.57, "elapsed_time": "0:03:38", "remaining_time": "0:05:20"}
|
| 615 |
+
{"current_steps": 500, "total_steps": 1230, "loss": 0.3831, "lr": 2.9604221019627316e-05, "epoch": 2.0324050632911392, "percentage": 40.65, "elapsed_time": "0:04:05", "remaining_time": "0:05:58"}
|
| 616 |
+
{"current_steps": 501, "total_steps": 1230, "loss": 0.3872, "lr": 2.955439637024526e-05, "epoch": 2.0364556962025318, "percentage": 40.73, "elapsed_time": "0:04:32", "remaining_time": "0:06:36"}
|
| 617 |
+
{"current_steps": 502, "total_steps": 1230, "loss": 0.3935, "lr": 2.9504494771068334e-05, "epoch": 2.0405063291139243, "percentage": 40.81, "elapsed_time": "0:05:04", "remaining_time": "0:07:21"}
|
| 618 |
+
{"current_steps": 503, "total_steps": 1230, "loss": 0.3941, "lr": 2.9454516623997156e-05, "epoch": 2.0445569620253163, "percentage": 40.89, "elapsed_time": "0:05:36", "remaining_time": "0:08:06"}
|
| 619 |
+
{"current_steps": 504, "total_steps": 1230, "loss": 0.3729, "lr": 2.9404462331548847e-05, "epoch": 2.048607594936709, "percentage": 40.98, "elapsed_time": "0:06:07", "remaining_time": "0:08:49"}
|
| 620 |
+
{"current_steps": 505, "total_steps": 1230, "loss": 0.3661, "lr": 2.93543322968538e-05, "epoch": 2.0526582278481014, "percentage": 41.06, "elapsed_time": "0:06:40", "remaining_time": "0:09:34"}
|
| 621 |
+
{"current_steps": 506, "total_steps": 1230, "loss": 0.3799, "lr": 2.9304126923652428e-05, "epoch": 2.056708860759494, "percentage": 41.14, "elapsed_time": "0:07:08", "remaining_time": "0:10:12"}
|
| 622 |
+
{"current_steps": 507, "total_steps": 1230, "loss": 0.397, "lr": 2.9253846616291896e-05, "epoch": 2.060759493670886, "percentage": 41.22, "elapsed_time": "0:07:43", "remaining_time": "0:11:00"}
|
| 623 |
+
{"current_steps": 508, "total_steps": 1230, "loss": 0.3691, "lr": 2.9203491779722896e-05, "epoch": 2.0648101265822785, "percentage": 41.3, "elapsed_time": "0:08:15", "remaining_time": "0:11:44"}
|
| 624 |
+
{"current_steps": 509, "total_steps": 1230, "loss": 0.3838, "lr": 2.9153062819496357e-05, "epoch": 2.068860759493671, "percentage": 41.38, "elapsed_time": "0:08:48", "remaining_time": "0:12:28"}
|
| 625 |
+
{"current_steps": 510, "total_steps": 1230, "loss": 0.3921, "lr": 2.9102560141760178e-05, "epoch": 2.0729113924050635, "percentage": 41.46, "elapsed_time": "0:09:21", "remaining_time": "0:13:12"}
|
| 626 |
+
{"current_steps": 511, "total_steps": 1230, "loss": 0.3722, "lr": 2.9051984153256004e-05, "epoch": 2.0769620253164556, "percentage": 41.54, "elapsed_time": "0:09:53", "remaining_time": "0:13:54"}
|
| 627 |
+
{"current_steps": 512, "total_steps": 1230, "loss": 0.3709, "lr": 2.900133526131588e-05, "epoch": 2.081012658227848, "percentage": 41.63, "elapsed_time": "0:10:19", "remaining_time": "0:14:28"}
|
| 628 |
+
{"current_steps": 513, "total_steps": 1230, "loss": 0.367, "lr": 2.8950613873859025e-05, "epoch": 2.0850632911392406, "percentage": 41.71, "elapsed_time": "0:10:54", "remaining_time": "0:15:14"}
|
| 629 |
+
{"current_steps": 514, "total_steps": 1230, "loss": 0.3781, "lr": 2.8899820399388515e-05, "epoch": 2.089113924050633, "percentage": 41.79, "elapsed_time": "0:11:29", "remaining_time": "0:16:00"}
|
| 630 |
+
{"current_steps": 515, "total_steps": 1230, "loss": 0.3928, "lr": 2.8848955246988012e-05, "epoch": 2.093164556962025, "percentage": 41.87, "elapsed_time": "0:11:58", "remaining_time": "0:16:36"}
|
| 631 |
+
{"current_steps": 516, "total_steps": 1230, "loss": 0.3808, "lr": 2.879801882631847e-05, "epoch": 2.0972151898734177, "percentage": 41.95, "elapsed_time": "0:12:29", "remaining_time": "0:17:16"}
|
| 632 |
+
{"current_steps": 517, "total_steps": 1230, "loss": 0.3744, "lr": 2.8747011547614808e-05, "epoch": 2.1012658227848102, "percentage": 42.03, "elapsed_time": "0:13:01", "remaining_time": "0:17:57"}
|
| 633 |
+
{"current_steps": 518, "total_steps": 1230, "loss": 0.3628, "lr": 2.8695933821682635e-05, "epoch": 2.1053164556962027, "percentage": 42.11, "elapsed_time": "0:13:34", "remaining_time": "0:18:39"}
|
| 634 |
+
{"current_steps": 519, "total_steps": 1230, "loss": 0.3815, "lr": 2.864478605989494e-05, "epoch": 2.109367088607595, "percentage": 42.2, "elapsed_time": "0:14:04", "remaining_time": "0:19:17"}
|
| 635 |
+
{"current_steps": 520, "total_steps": 1230, "loss": 0.3877, "lr": 2.8593568674188765e-05, "epoch": 2.1134177215189873, "percentage": 42.28, "elapsed_time": "0:14:40", "remaining_time": "0:20:01"}
|
| 636 |
+
{"current_steps": 521, "total_steps": 1230, "loss": 0.3986, "lr": 2.8542282077061892e-05, "epoch": 2.11746835443038, "percentage": 42.36, "elapsed_time": "0:15:09", "remaining_time": "0:20:37"}
|
| 637 |
+
{"current_steps": 522, "total_steps": 1230, "loss": 0.3846, "lr": 2.8490926681569523e-05, "epoch": 2.1215189873417724, "percentage": 42.44, "elapsed_time": "0:15:50", "remaining_time": "0:21:29"}
|
| 638 |
+
{"current_steps": 523, "total_steps": 1230, "loss": 0.3721, "lr": 2.8439502901320956e-05, "epoch": 2.1255696202531644, "percentage": 42.52, "elapsed_time": "0:16:30", "remaining_time": "0:22:18"}
|
| 639 |
+
{"current_steps": 524, "total_steps": 1230, "loss": 0.3741, "lr": 2.8388011150476237e-05, "epoch": 2.129620253164557, "percentage": 42.6, "elapsed_time": "0:17:01", "remaining_time": "0:22:56"}
|
| 640 |
+
{"current_steps": 525, "total_steps": 1230, "loss": 0.3708, "lr": 2.8336451843742866e-05, "epoch": 2.1336708860759495, "percentage": 42.68, "elapsed_time": "0:17:36", "remaining_time": "0:23:38"}
|
| 641 |
+
{"current_steps": 526, "total_steps": 1230, "loss": 0.3899, "lr": 2.8284825396372387e-05, "epoch": 2.137721518987342, "percentage": 42.76, "elapsed_time": "0:18:08", "remaining_time": "0:24:17"}
|
| 642 |
+
{"current_steps": 527, "total_steps": 1230, "loss": 0.396, "lr": 2.8233132224157132e-05, "epoch": 2.141772151898734, "percentage": 42.85, "elapsed_time": "0:18:41", "remaining_time": "0:24:55"}
|
| 643 |
+
{"current_steps": 528, "total_steps": 1230, "loss": 0.382, "lr": 2.8181372743426805e-05, "epoch": 2.1458227848101266, "percentage": 42.93, "elapsed_time": "0:19:19", "remaining_time": "0:25:41"}
|
| 644 |
+
{"current_steps": 529, "total_steps": 1230, "loss": 0.3901, "lr": 2.8129547371045128e-05, "epoch": 2.149873417721519, "percentage": 43.01, "elapsed_time": "0:19:48", "remaining_time": "0:26:15"}
|
| 645 |
+
{"current_steps": 530, "total_steps": 1230, "loss": 0.371, "lr": 2.8077656524406534e-05, "epoch": 2.1539240506329116, "percentage": 43.09, "elapsed_time": "0:20:19", "remaining_time": "0:26:50"}
|
| 646 |
+
{"current_steps": 531, "total_steps": 1230, "loss": 0.3961, "lr": 2.802570062143278e-05, "epoch": 2.1579746835443037, "percentage": 43.17, "elapsed_time": "0:20:54", "remaining_time": "0:27:30"}
|
| 647 |
+
{"current_steps": 532, "total_steps": 1230, "loss": 0.3775, "lr": 2.7973680080569555e-05, "epoch": 2.162025316455696, "percentage": 43.25, "elapsed_time": "0:21:21", "remaining_time": "0:28:01"}
|
| 648 |
+
{"current_steps": 533, "total_steps": 1230, "loss": 0.367, "lr": 2.792159532078314e-05, "epoch": 2.1660759493670887, "percentage": 43.33, "elapsed_time": "0:21:52", "remaining_time": "0:28:36"}
|
| 649 |
+
{"current_steps": 534, "total_steps": 1230, "loss": 0.3725, "lr": 2.7869446761557033e-05, "epoch": 2.170126582278481, "percentage": 43.41, "elapsed_time": "0:22:24", "remaining_time": "0:29:12"}
|
| 650 |
+
{"current_steps": 535, "total_steps": 1230, "loss": 0.3762, "lr": 2.781723482288857e-05, "epoch": 2.1741772151898733, "percentage": 43.5, "elapsed_time": "0:22:56", "remaining_time": "0:29:48"}
|
| 651 |
+
{"current_steps": 536, "total_steps": 1230, "loss": 0.38, "lr": 2.7764959925285517e-05, "epoch": 2.178227848101266, "percentage": 43.58, "elapsed_time": "0:23:30", "remaining_time": "0:30:25"}
|
| 652 |
+
{"current_steps": 537, "total_steps": 1230, "loss": 0.3392, "lr": 2.771262248976272e-05, "epoch": 2.1822784810126583, "percentage": 43.66, "elapsed_time": "0:24:04", "remaining_time": "0:31:04"}
|
| 653 |
+
{"current_steps": 538, "total_steps": 1230, "loss": 0.3753, "lr": 2.7660222937838677e-05, "epoch": 2.186329113924051, "percentage": 43.74, "elapsed_time": "0:24:37", "remaining_time": "0:31:40"}
|
| 654 |
+
{"current_steps": 539, "total_steps": 1230, "loss": 0.3771, "lr": 2.7607761691532186e-05, "epoch": 2.190379746835443, "percentage": 43.82, "elapsed_time": "0:25:08", "remaining_time": "0:32:14"}
|
| 655 |
+
{"current_steps": 540, "total_steps": 1230, "loss": 0.3522, "lr": 2.7555239173358916e-05, "epoch": 2.1944303797468354, "percentage": 43.9, "elapsed_time": "0:25:40", "remaining_time": "0:32:48"}
|
| 656 |
+
{"current_steps": 541, "total_steps": 1230, "loss": 0.3914, "lr": 2.7502655806328e-05, "epoch": 2.198481012658228, "percentage": 43.98, "elapsed_time": "0:26:12", "remaining_time": "0:33:22"}
|
| 657 |
+
{"current_steps": 542, "total_steps": 1230, "loss": 0.3767, "lr": 2.7450012013938648e-05, "epoch": 2.2025316455696204, "percentage": 44.07, "elapsed_time": "0:26:41", "remaining_time": "0:33:52"}
|
| 658 |
+
{"current_steps": 543, "total_steps": 1230, "loss": 0.386, "lr": 2.739730822017673e-05, "epoch": 2.2065822784810125, "percentage": 44.15, "elapsed_time": "0:27:12", "remaining_time": "0:34:25"}
|
| 659 |
+
{"current_steps": 544, "total_steps": 1230, "loss": 0.3899, "lr": 2.7344544849511355e-05, "epoch": 2.210632911392405, "percentage": 44.23, "elapsed_time": "0:27:39", "remaining_time": "0:34:52"}
|
| 660 |
+
{"current_steps": 545, "total_steps": 1230, "loss": 0.3814, "lr": 2.7291722326891456e-05, "epoch": 2.2146835443037975, "percentage": 44.31, "elapsed_time": "0:28:08", "remaining_time": "0:35:21"}
|
| 661 |
+
{"current_steps": 546, "total_steps": 1230, "loss": 0.3812, "lr": 2.723884107774236e-05, "epoch": 2.21873417721519, "percentage": 44.39, "elapsed_time": "0:28:41", "remaining_time": "0:35:56"}
|
| 662 |
+
{"current_steps": 547, "total_steps": 1230, "loss": 0.3707, "lr": 2.718590152796239e-05, "epoch": 2.222784810126582, "percentage": 44.47, "elapsed_time": "0:29:13", "remaining_time": "0:36:29"}
|
| 663 |
+
{"current_steps": 548, "total_steps": 1230, "loss": 0.3719, "lr": 2.71329041039194e-05, "epoch": 2.2268354430379746, "percentage": 44.55, "elapsed_time": "0:29:46", "remaining_time": "0:37:02"}
|
| 664 |
+
{"current_steps": 549, "total_steps": 1230, "loss": 0.3827, "lr": 2.7079849232447357e-05, "epoch": 2.230886075949367, "percentage": 44.63, "elapsed_time": "0:30:20", "remaining_time": "0:37:38"}
|
| 665 |
+
{"current_steps": 550, "total_steps": 1230, "loss": 0.3756, "lr": 2.7026737340842895e-05, "epoch": 2.2349367088607597, "percentage": 44.72, "elapsed_time": "0:30:55", "remaining_time": "0:38:14"}
|
| 666 |
+
{"current_steps": 551, "total_steps": 1230, "loss": 0.3697, "lr": 2.697356885686189e-05, "epoch": 2.2389873417721518, "percentage": 44.8, "elapsed_time": "0:31:25", "remaining_time": "0:38:43"}
|
| 667 |
+
{"current_steps": 552, "total_steps": 1230, "loss": 0.3605, "lr": 2.6920344208716014e-05, "epoch": 2.2430379746835443, "percentage": 44.88, "elapsed_time": "0:31:53", "remaining_time": "0:39:10"}
|
| 668 |
+
{"current_steps": 553, "total_steps": 1230, "loss": 0.3925, "lr": 2.6867063825069252e-05, "epoch": 2.247088607594937, "percentage": 44.96, "elapsed_time": "0:32:22", "remaining_time": "0:39:37"}
|
| 669 |
+
{"current_steps": 554, "total_steps": 1230, "loss": 0.3749, "lr": 2.6813728135034494e-05, "epoch": 2.2511392405063293, "percentage": 45.04, "elapsed_time": "0:32:59", "remaining_time": "0:40:15"}
|
| 670 |
+
{"current_steps": 555, "total_steps": 1230, "loss": 0.3908, "lr": 2.6760337568170056e-05, "epoch": 2.2551898734177214, "percentage": 45.12, "elapsed_time": "0:33:32", "remaining_time": "0:40:47"}
|
| 671 |
+
{"current_steps": 556, "total_steps": 1230, "loss": 0.3737, "lr": 2.6706892554476226e-05, "epoch": 2.259240506329114, "percentage": 45.2, "elapsed_time": "0:34:08", "remaining_time": "0:41:23"}
|
| 672 |
+
{"current_steps": 557, "total_steps": 1230, "loss": 0.3731, "lr": 2.6653393524391795e-05, "epoch": 2.2632911392405064, "percentage": 45.28, "elapsed_time": "0:34:43", "remaining_time": "0:41:57"}
|
| 673 |
+
{"current_steps": 558, "total_steps": 1230, "loss": 0.3851, "lr": 2.6599840908790592e-05, "epoch": 2.267341772151899, "percentage": 45.37, "elapsed_time": "0:35:15", "remaining_time": "0:42:28"}
|
| 674 |
+
{"current_steps": 559, "total_steps": 1230, "loss": 0.3942, "lr": 2.6546235138978028e-05, "epoch": 2.271392405063291, "percentage": 45.45, "elapsed_time": "0:35:47", "remaining_time": "0:42:58"}
|
| 675 |
+
{"current_steps": 560, "total_steps": 1230, "loss": 0.378, "lr": 2.6492576646687597e-05, "epoch": 2.2754430379746835, "percentage": 45.53, "elapsed_time": "0:36:17", "remaining_time": "0:43:25"}
|
| 676 |
+
{"current_steps": 561, "total_steps": 1230, "loss": 0.3743, "lr": 2.6438865864077425e-05, "epoch": 2.279493670886076, "percentage": 45.61, "elapsed_time": "0:36:49", "remaining_time": "0:43:55"}
|
| 677 |
+
{"current_steps": 562, "total_steps": 1230, "loss": 0.3831, "lr": 2.6385103223726766e-05, "epoch": 2.2835443037974685, "percentage": 45.69, "elapsed_time": "0:37:23", "remaining_time": "0:44:26"}
|
| 678 |
+
{"current_steps": 563, "total_steps": 1230, "loss": 0.3779, "lr": 2.6331289158632537e-05, "epoch": 2.2875949367088606, "percentage": 45.77, "elapsed_time": "0:37:56", "remaining_time": "0:44:56"}
|
| 679 |
+
{"current_steps": 564, "total_steps": 1230, "loss": 0.3801, "lr": 2.6277424102205817e-05, "epoch": 2.291645569620253, "percentage": 45.85, "elapsed_time": "0:38:26", "remaining_time": "0:45:23"}
|
| 680 |
+
{"current_steps": 565, "total_steps": 1230, "loss": 0.3884, "lr": 2.6223508488268374e-05, "epoch": 2.2956962025316456, "percentage": 45.93, "elapsed_time": "0:39:01", "remaining_time": "0:45:56"}
|
| 681 |
+
{"current_steps": 566, "total_steps": 1230, "loss": 0.3922, "lr": 2.6169542751049148e-05, "epoch": 2.299746835443038, "percentage": 46.02, "elapsed_time": "0:39:33", "remaining_time": "0:46:24"}
|
| 682 |
+
{"current_steps": 567, "total_steps": 1230, "loss": 0.3822, "lr": 2.6115527325180754e-05, "epoch": 2.3037974683544302, "percentage": 46.1, "elapsed_time": "0:40:09", "remaining_time": "0:46:57"}
|
| 683 |
+
{"current_steps": 568, "total_steps": 1230, "loss": 0.387, "lr": 2.606146264569603e-05, "epoch": 2.3078481012658227, "percentage": 46.18, "elapsed_time": "0:40:44", "remaining_time": "0:47:29"}
|
| 684 |
+
{"current_steps": 569, "total_steps": 1230, "loss": 0.3434, "lr": 2.6007349148024447e-05, "epoch": 2.3118987341772153, "percentage": 46.26, "elapsed_time": "0:41:17", "remaining_time": "0:47:57"}
|
| 685 |
+
{"current_steps": 570, "total_steps": 1230, "loss": 0.3991, "lr": 2.5953187267988694e-05, "epoch": 2.3159493670886078, "percentage": 46.34, "elapsed_time": "0:41:49", "remaining_time": "0:48:25"}
|
| 686 |
+
{"current_steps": 571, "total_steps": 1230, "loss": 0.3749, "lr": 2.5898977441801097e-05, "epoch": 2.32, "percentage": 46.42, "elapsed_time": "0:42:17", "remaining_time": "0:48:48"}
|
| 687 |
+
{"current_steps": 572, "total_steps": 1230, "loss": 0.3862, "lr": 2.584472010606015e-05, "epoch": 2.3240506329113924, "percentage": 46.5, "elapsed_time": "0:42:52", "remaining_time": "0:49:19"}
|
| 688 |
+
{"current_steps": 573, "total_steps": 1230, "loss": 0.3867, "lr": 2.5790415697746976e-05, "epoch": 2.328101265822785, "percentage": 46.59, "elapsed_time": "0:43:21", "remaining_time": "0:49:42"}
|
| 689 |
+
{"current_steps": 574, "total_steps": 1230, "loss": 0.3544, "lr": 2.5736064654221808e-05, "epoch": 2.3321518987341774, "percentage": 46.67, "elapsed_time": "0:43:51", "remaining_time": "0:50:07"}
|
| 690 |
+
{"current_steps": 575, "total_steps": 1230, "loss": 0.3727, "lr": 2.568166741322048e-05, "epoch": 2.3362025316455695, "percentage": 46.75, "elapsed_time": "0:44:24", "remaining_time": "0:50:35"}
|
| 691 |
+
{"current_steps": 576, "total_steps": 1230, "loss": 0.3919, "lr": 2.56272244128509e-05, "epoch": 2.340253164556962, "percentage": 46.83, "elapsed_time": "0:44:48", "remaining_time": "0:50:53"}
|
| 692 |
+
{"current_steps": 577, "total_steps": 1230, "loss": 0.3657, "lr": 2.55727360915895e-05, "epoch": 2.3443037974683545, "percentage": 46.91, "elapsed_time": "0:45:23", "remaining_time": "0:51:22"}
|
| 693 |
+
{"current_steps": 578, "total_steps": 1230, "loss": 0.4041, "lr": 2.5518202888277734e-05, "epoch": 2.348354430379747, "percentage": 46.99, "elapsed_time": "0:46:00", "remaining_time": "0:51:53"}
|
| 694 |
+
{"current_steps": 579, "total_steps": 1230, "loss": 0.3763, "lr": 2.5463625242118523e-05, "epoch": 2.352405063291139, "percentage": 47.07, "elapsed_time": "0:46:32", "remaining_time": "0:52:19"}
|
| 695 |
+
{"current_steps": 580, "total_steps": 1230, "loss": 0.3901, "lr": 2.5409003592672723e-05, "epoch": 2.3564556962025316, "percentage": 47.15, "elapsed_time": "0:46:55", "remaining_time": "0:52:35"}
|
| 696 |
+
{"current_steps": 581, "total_steps": 1230, "loss": 0.3729, "lr": 2.535433837985559e-05, "epoch": 2.360506329113924, "percentage": 47.24, "elapsed_time": "0:47:27", "remaining_time": "0:53:01"}
|
| 697 |
+
{"current_steps": 582, "total_steps": 1230, "loss": 0.381, "lr": 2.529963004393324e-05, "epoch": 2.3645569620253166, "percentage": 47.32, "elapsed_time": "0:48:04", "remaining_time": "0:53:31"}
|
| 698 |
+
{"current_steps": 583, "total_steps": 1230, "loss": 0.3585, "lr": 2.524487902551908e-05, "epoch": 2.3686075949367087, "percentage": 47.4, "elapsed_time": "0:48:37", "remaining_time": "0:53:58"}
|
| 699 |
+
{"current_steps": 584, "total_steps": 1230, "loss": 0.3968, "lr": 2.519008576557029e-05, "epoch": 2.372658227848101, "percentage": 47.48, "elapsed_time": "0:49:10", "remaining_time": "0:54:24"}
|
| 700 |
+
{"current_steps": 585, "total_steps": 1230, "loss": 0.3897, "lr": 2.5135250705384254e-05, "epoch": 2.3767088607594937, "percentage": 47.56, "elapsed_time": "0:49:38", "remaining_time": "0:54:44"}
|
| 701 |
+
{"current_steps": 586, "total_steps": 1230, "loss": 0.363, "lr": 2.5080374286595007e-05, "epoch": 2.3807594936708862, "percentage": 47.64, "elapsed_time": "0:50:10", "remaining_time": "0:55:08"}
|
| 702 |
+
{"current_steps": 587, "total_steps": 1230, "loss": 0.378, "lr": 2.5025456951169677e-05, "epoch": 2.3848101265822783, "percentage": 47.72, "elapsed_time": "0:50:43", "remaining_time": "0:55:33"}
|
| 703 |
+
{"current_steps": 588, "total_steps": 1230, "loss": 0.3893, "lr": 2.4970499141404942e-05, "epoch": 2.388860759493671, "percentage": 47.8, "elapsed_time": "0:51:14", "remaining_time": "0:55:56"}
|
| 704 |
+
{"current_steps": 589, "total_steps": 1230, "loss": 0.3788, "lr": 2.491550129992345e-05, "epoch": 2.3929113924050633, "percentage": 47.89, "elapsed_time": "0:51:45", "remaining_time": "0:56:19"}
|
| 705 |
+
{"current_steps": 590, "total_steps": 1230, "loss": 0.3667, "lr": 2.486046386967024e-05, "epoch": 2.396962025316456, "percentage": 47.97, "elapsed_time": "0:52:17", "remaining_time": "0:56:42"}
|
| 706 |
+
{"current_steps": 591, "total_steps": 1230, "loss": 0.388, "lr": 2.4805387293909214e-05, "epoch": 2.401012658227848, "percentage": 48.05, "elapsed_time": "0:52:43", "remaining_time": "0:57:00"}
|
| 707 |
+
{"current_steps": 592, "total_steps": 1230, "loss": 0.3817, "lr": 2.4750272016219552e-05, "epoch": 2.4050632911392404, "percentage": 48.13, "elapsed_time": "0:53:14", "remaining_time": "0:57:23"}
|
| 708 |
+
{"current_steps": 593, "total_steps": 1230, "loss": 0.3804, "lr": 2.4695118480492114e-05, "epoch": 2.409113924050633, "percentage": 48.21, "elapsed_time": "0:53:48", "remaining_time": "0:57:48"}
|
| 709 |
+
{"current_steps": 594, "total_steps": 1230, "loss": 0.369, "lr": 2.4639927130925898e-05, "epoch": 2.4131645569620255, "percentage": 48.29, "elapsed_time": "0:54:22", "remaining_time": "0:58:13"}
|
| 710 |
+
{"current_steps": 595, "total_steps": 1230, "loss": 0.3875, "lr": 2.458469841202444e-05, "epoch": 2.4172151898734175, "percentage": 48.37, "elapsed_time": "0:54:53", "remaining_time": "0:58:34"}
|
| 711 |
+
{"current_steps": 596, "total_steps": 1230, "loss": 0.3803, "lr": 2.452943276859226e-05, "epoch": 2.42126582278481, "percentage": 48.46, "elapsed_time": "0:55:27", "remaining_time": "0:58:59"}
|
| 712 |
+
{"current_steps": 597, "total_steps": 1230, "loss": 0.3857, "lr": 2.447413064573125e-05, "epoch": 2.4253164556962026, "percentage": 48.54, "elapsed_time": "0:55:58", "remaining_time": "0:59:21"}
|
| 713 |
+
{"current_steps": 598, "total_steps": 1230, "loss": 0.3875, "lr": 2.4418792488837095e-05, "epoch": 2.429367088607595, "percentage": 48.62, "elapsed_time": "0:56:31", "remaining_time": "0:59:44"}
|
| 714 |
+
{"current_steps": 599, "total_steps": 1230, "loss": 0.4015, "lr": 2.4363418743595713e-05, "epoch": 2.433417721518987, "percentage": 48.7, "elapsed_time": "0:57:03", "remaining_time": "1:00:06"}
|
| 715 |
+
{"current_steps": 600, "total_steps": 1230, "loss": 0.3821, "lr": 2.430800985597963e-05, "epoch": 2.4374683544303797, "percentage": 48.78, "elapsed_time": "0:57:34", "remaining_time": "1:00:27"}
|
| 716 |
+
{"current_steps": 601, "total_steps": 1230, "loss": 0.3929, "lr": 2.4252566272244415e-05, "epoch": 2.441518987341772, "percentage": 48.86, "elapsed_time": "0:58:04", "remaining_time": "1:00:46"}
|
| 717 |
+
{"current_steps": 602, "total_steps": 1230, "loss": 0.3648, "lr": 2.4197088438925063e-05, "epoch": 2.4455696202531647, "percentage": 48.94, "elapsed_time": "0:58:32", "remaining_time": "1:01:03"}
|
| 718 |
+
{"current_steps": 603, "total_steps": 1230, "loss": 0.3842, "lr": 2.4141576802832417e-05, "epoch": 2.449620253164557, "percentage": 49.02, "elapsed_time": "0:59:06", "remaining_time": "1:01:27"}
|
| 719 |
+
{"current_steps": 604, "total_steps": 1230, "loss": 0.3902, "lr": 2.408603181104957e-05, "epoch": 2.4536708860759493, "percentage": 49.11, "elapsed_time": "0:59:43", "remaining_time": "1:01:53"}
|
| 720 |
+
{"current_steps": 605, "total_steps": 1230, "loss": 0.3863, "lr": 2.4030453910928245e-05, "epoch": 2.457721518987342, "percentage": 49.19, "elapsed_time": "1:00:16", "remaining_time": "1:02:16"}
|
| 721 |
+
{"current_steps": 606, "total_steps": 1230, "loss": 0.3924, "lr": 2.397484355008521e-05, "epoch": 2.4617721518987343, "percentage": 49.27, "elapsed_time": "1:00:52", "remaining_time": "1:02:40"}
|
| 722 |
+
{"current_steps": 607, "total_steps": 1230, "loss": 0.3721, "lr": 2.3919201176398662e-05, "epoch": 2.4658227848101264, "percentage": 49.35, "elapsed_time": "1:01:26", "remaining_time": "1:03:03"}
|
| 723 |
+
{"current_steps": 608, "total_steps": 1230, "loss": 0.3812, "lr": 2.3863527238004633e-05, "epoch": 2.469873417721519, "percentage": 49.43, "elapsed_time": "1:01:55", "remaining_time": "1:03:20"}
|
| 724 |
+
{"current_steps": 609, "total_steps": 1230, "loss": 0.3747, "lr": 2.380782218329337e-05, "epoch": 2.4739240506329114, "percentage": 49.51, "elapsed_time": "1:02:31", "remaining_time": "1:03:44"}
|
| 725 |
+
{"current_steps": 610, "total_steps": 1230, "loss": 0.373, "lr": 2.3752086460905725e-05, "epoch": 2.477974683544304, "percentage": 49.59, "elapsed_time": "1:03:01", "remaining_time": "1:04:03"}
|
| 726 |
+
{"current_steps": 611, "total_steps": 1230, "loss": 0.3631, "lr": 2.3696320519729544e-05, "epoch": 2.482025316455696, "percentage": 49.67, "elapsed_time": "1:03:37", "remaining_time": "1:04:27"}
|
| 727 |
+
{"current_steps": 612, "total_steps": 1230, "loss": 0.3786, "lr": 2.3640524808896045e-05, "epoch": 2.4860759493670885, "percentage": 49.76, "elapsed_time": "1:04:14", "remaining_time": "1:04:52"}
|
| 728 |
+
{"current_steps": 613, "total_steps": 1230, "loss": 0.3743, "lr": 2.3584699777776222e-05, "epoch": 2.490126582278481, "percentage": 49.84, "elapsed_time": "1:04:51", "remaining_time": "1:05:16"}
|
| 729 |
+
{"current_steps": 614, "total_steps": 1230, "loss": 0.3874, "lr": 2.3528845875977195e-05, "epoch": 2.4941772151898736, "percentage": 49.92, "elapsed_time": "1:05:23", "remaining_time": "1:05:35"}
|
| 730 |
+
{"current_steps": 615, "total_steps": 1230, "loss": 0.4031, "lr": 2.3472963553338614e-05, "epoch": 2.4982278481012656, "percentage": 50.0, "elapsed_time": "1:05:57", "remaining_time": "1:05:57"}
|
| 731 |
+
{"current_steps": 616, "total_steps": 1230, "loss": 0.4057, "lr": 2.341705325992901e-05, "epoch": 2.502278481012658, "percentage": 50.08, "elapsed_time": "1:06:31", "remaining_time": "1:06:18"}
|
| 732 |
+
{"current_steps": 617, "total_steps": 1230, "loss": 0.3886, "lr": 2.336111544604222e-05, "epoch": 2.5063291139240507, "percentage": 50.16, "elapsed_time": "1:07:00", "remaining_time": "1:06:34"}
|
| 733 |
+
{"current_steps": 618, "total_steps": 1230, "loss": 0.3717, "lr": 2.33051505621937e-05, "epoch": 2.510379746835443, "percentage": 50.24, "elapsed_time": "1:07:31", "remaining_time": "1:06:52"}
|
| 734 |
+
{"current_steps": 619, "total_steps": 1230, "loss": 0.3756, "lr": 2.324915905911693e-05, "epoch": 2.5144303797468357, "percentage": 50.33, "elapsed_time": "1:08:01", "remaining_time": "1:07:09"}
|
| 735 |
+
{"current_steps": 620, "total_steps": 1230, "loss": 0.3763, "lr": 2.319314138775977e-05, "epoch": 2.5184810126582278, "percentage": 50.41, "elapsed_time": "1:08:33", "remaining_time": "1:07:26"}
|
| 736 |
+
{"current_steps": 621, "total_steps": 1230, "loss": 0.3674, "lr": 2.3137097999280856e-05, "epoch": 2.5225316455696203, "percentage": 50.49, "elapsed_time": "1:09:07", "remaining_time": "1:07:47"}
|
| 737 |
+
{"current_steps": 622, "total_steps": 1230, "loss": 0.3713, "lr": 2.308102934504593e-05, "epoch": 2.526582278481013, "percentage": 50.57, "elapsed_time": "1:09:45", "remaining_time": "1:08:11"}
|
| 738 |
+
{"current_steps": 623, "total_steps": 1230, "loss": 0.3701, "lr": 2.3024935876624222e-05, "epoch": 2.530632911392405, "percentage": 50.65, "elapsed_time": "1:10:22", "remaining_time": "1:08:34"}
|
| 739 |
+
{"current_steps": 624, "total_steps": 1230, "loss": 0.3834, "lr": 2.2968818045784813e-05, "epoch": 2.5346835443037974, "percentage": 50.73, "elapsed_time": "1:10:51", "remaining_time": "1:08:48"}
|
| 740 |
+
{"current_steps": 625, "total_steps": 1230, "loss": 0.3779, "lr": 2.2912676304493006e-05, "epoch": 2.53873417721519, "percentage": 50.81, "elapsed_time": "1:11:22", "remaining_time": "1:09:05"}
|
| 741 |
+
{"current_steps": 626, "total_steps": 1230, "loss": 0.3636, "lr": 2.2856511104906668e-05, "epoch": 2.5427848101265824, "percentage": 50.89, "elapsed_time": "1:11:55", "remaining_time": "1:09:24"}
|
| 742 |
+
{"current_steps": 627, "total_steps": 1230, "loss": 0.3742, "lr": 2.2800322899372586e-05, "epoch": 2.546835443037975, "percentage": 50.98, "elapsed_time": "1:12:28", "remaining_time": "1:09:42"}
|
| 743 |
+
{"current_steps": 628, "total_steps": 1230, "loss": 0.3962, "lr": 2.2744112140422844e-05, "epoch": 2.550886075949367, "percentage": 51.06, "elapsed_time": "1:13:03", "remaining_time": "1:10:02"}
|
| 744 |
+
{"current_steps": 629, "total_steps": 1230, "loss": 0.3824, "lr": 2.2687879280771177e-05, "epoch": 2.5549367088607595, "percentage": 51.14, "elapsed_time": "1:13:35", "remaining_time": "1:10:18"}
|
| 745 |
+
{"current_steps": 630, "total_steps": 1230, "loss": 0.3659, "lr": 2.26316247733093e-05, "epoch": 2.558987341772152, "percentage": 51.22, "elapsed_time": "1:14:02", "remaining_time": "1:10:31"}
|
| 746 |
+
{"current_steps": 631, "total_steps": 1230, "loss": 0.3717, "lr": 2.257534907110328e-05, "epoch": 2.563037974683544, "percentage": 51.3, "elapsed_time": "1:14:31", "remaining_time": "1:10:45"}
|
| 747 |
+
{"current_steps": 632, "total_steps": 1230, "loss": 0.3786, "lr": 2.2519052627389882e-05, "epoch": 2.5670886075949366, "percentage": 51.38, "elapsed_time": "1:14:56", "remaining_time": "1:10:54"}
|
| 748 |
+
{"current_steps": 633, "total_steps": 1230, "loss": 0.3602, "lr": 2.246273589557294e-05, "epoch": 2.571139240506329, "percentage": 51.46, "elapsed_time": "1:15:30", "remaining_time": "1:11:12"}
|
| 749 |
+
{"current_steps": 634, "total_steps": 1230, "loss": 0.385, "lr": 2.240639932921966e-05, "epoch": 2.5751898734177217, "percentage": 51.54, "elapsed_time": "1:15:59", "remaining_time": "1:11:26"}
|
| 750 |
+
{"current_steps": 635, "total_steps": 1230, "loss": 0.3792, "lr": 2.2350043382056995e-05, "epoch": 2.579240506329114, "percentage": 51.63, "elapsed_time": "1:16:35", "remaining_time": "1:11:45"}
|
| 751 |
+
{"current_steps": 636, "total_steps": 1230, "loss": 0.3784, "lr": 2.2293668507968015e-05, "epoch": 2.5832911392405062, "percentage": 51.71, "elapsed_time": "1:17:02", "remaining_time": "1:11:57"}
|
| 752 |
+
{"current_steps": 637, "total_steps": 1230, "loss": 0.365, "lr": 2.2237275160988186e-05, "epoch": 2.5873417721518988, "percentage": 51.79, "elapsed_time": "1:17:32", "remaining_time": "1:12:11"}
|
| 753 |
+
{"current_steps": 638, "total_steps": 1230, "loss": 0.405, "lr": 2.2180863795301787e-05, "epoch": 2.5913924050632913, "percentage": 51.87, "elapsed_time": "1:18:04", "remaining_time": "1:12:27"}
|
| 754 |
+
{"current_steps": 639, "total_steps": 1230, "loss": 0.3821, "lr": 2.212443486523819e-05, "epoch": 2.5954430379746833, "percentage": 51.95, "elapsed_time": "1:18:39", "remaining_time": "1:12:45"}
|
| 755 |
+
{"current_steps": 640, "total_steps": 1230, "loss": 0.3599, "lr": 2.2067988825268243e-05, "epoch": 2.599493670886076, "percentage": 52.03, "elapsed_time": "1:19:13", "remaining_time": "1:13:02"}
|
| 756 |
+
{"current_steps": 641, "total_steps": 1230, "loss": 0.3969, "lr": 2.2011526130000596e-05, "epoch": 2.6035443037974684, "percentage": 52.11, "elapsed_time": "1:19:48", "remaining_time": "1:13:19"}
|
| 757 |
+
{"current_steps": 642, "total_steps": 1230, "loss": 0.3807, "lr": 2.1955047234178038e-05, "epoch": 2.607594936708861, "percentage": 52.2, "elapsed_time": "1:20:18", "remaining_time": "1:13:33"}
|
| 758 |
+
{"current_steps": 643, "total_steps": 1230, "loss": 0.3706, "lr": 2.1898552592673825e-05, "epoch": 2.6116455696202534, "percentage": 52.28, "elapsed_time": "1:20:47", "remaining_time": "1:13:45"}
|
| 759 |
+
{"current_steps": 644, "total_steps": 1230, "loss": 0.3676, "lr": 2.184204266048803e-05, "epoch": 2.6156962025316455, "percentage": 52.36, "elapsed_time": "1:21:18", "remaining_time": "1:13:59"}
|
| 760 |
+
{"current_steps": 645, "total_steps": 1230, "loss": 0.3949, "lr": 2.1785517892743887e-05, "epoch": 2.619746835443038, "percentage": 52.44, "elapsed_time": "1:21:53", "remaining_time": "1:14:16"}
|
| 761 |
+
{"current_steps": 646, "total_steps": 1230, "loss": 0.3804, "lr": 2.17289787446841e-05, "epoch": 2.6237974683544305, "percentage": 52.52, "elapsed_time": "1:22:23", "remaining_time": "1:14:28"}
|
| 762 |
+
{"current_steps": 647, "total_steps": 1230, "loss": 0.3958, "lr": 2.1672425671667198e-05, "epoch": 2.6278481012658226, "percentage": 52.6, "elapsed_time": "1:22:55", "remaining_time": "1:14:43"}
|
| 763 |
+
{"current_steps": 648, "total_steps": 1230, "loss": 0.3798, "lr": 2.161585912916385e-05, "epoch": 2.631898734177215, "percentage": 52.68, "elapsed_time": "1:23:24", "remaining_time": "1:14:54"}
|
| 764 |
+
{"current_steps": 649, "total_steps": 1230, "loss": 0.3945, "lr": 2.1559279572753214e-05, "epoch": 2.6359493670886076, "percentage": 52.76, "elapsed_time": "1:23:58", "remaining_time": "1:15:10"}
|
| 765 |
+
{"current_steps": 650, "total_steps": 1230, "loss": 0.3522, "lr": 2.1502687458119268e-05, "epoch": 2.64, "percentage": 52.85, "elapsed_time": "1:24:27", "remaining_time": "1:15:21"}
|
| 766 |
+
{"current_steps": 651, "total_steps": 1230, "loss": 0.372, "lr": 2.1446083241047116e-05, "epoch": 2.6440506329113926, "percentage": 52.93, "elapsed_time": "1:24:58", "remaining_time": "1:15:34"}
|
| 767 |
+
{"current_steps": 652, "total_steps": 1230, "loss": 0.3746, "lr": 2.1389467377419333e-05, "epoch": 2.6481012658227847, "percentage": 53.01, "elapsed_time": "1:25:30", "remaining_time": "1:15:47"}
|
| 768 |
+
{"current_steps": 653, "total_steps": 1230, "loss": 0.3887, "lr": 2.133284032321232e-05, "epoch": 2.6521518987341772, "percentage": 53.09, "elapsed_time": "1:26:07", "remaining_time": "1:16:05"}
|
| 769 |
+
{"current_steps": 654, "total_steps": 1230, "loss": 0.3653, "lr": 2.1276202534492566e-05, "epoch": 2.6562025316455697, "percentage": 53.17, "elapsed_time": "1:26:35", "remaining_time": "1:16:15"}
|
| 770 |
+
{"current_steps": 655, "total_steps": 1230, "loss": 0.3881, "lr": 2.121955446741306e-05, "epoch": 2.660253164556962, "percentage": 53.25, "elapsed_time": "1:27:09", "remaining_time": "1:16:30"}
|
| 771 |
+
{"current_steps": 656, "total_steps": 1230, "loss": 0.3815, "lr": 2.1162896578209517e-05, "epoch": 2.6643037974683543, "percentage": 53.33, "elapsed_time": "1:27:36", "remaining_time": "1:16:39"}
|
| 772 |
+
{"current_steps": 657, "total_steps": 1230, "loss": 0.4014, "lr": 2.1106229323196813e-05, "epoch": 2.668354430379747, "percentage": 53.41, "elapsed_time": "1:28:06", "remaining_time": "1:16:50"}
|
| 773 |
+
{"current_steps": 658, "total_steps": 1230, "loss": 0.3885, "lr": 2.1049553158765214e-05, "epoch": 2.6724050632911394, "percentage": 53.5, "elapsed_time": "1:28:42", "remaining_time": "1:17:06"}
|
| 774 |
+
{"current_steps": 659, "total_steps": 1230, "loss": 0.3659, "lr": 2.0992868541376764e-05, "epoch": 2.676455696202532, "percentage": 53.58, "elapsed_time": "1:29:13", "remaining_time": "1:17:18"}
|
| 775 |
+
{"current_steps": 660, "total_steps": 1230, "loss": 0.4145, "lr": 2.093617592756158e-05, "epoch": 2.680506329113924, "percentage": 53.66, "elapsed_time": "1:29:43", "remaining_time": "1:17:29"}
|
| 776 |
+
{"current_steps": 661, "total_steps": 1230, "loss": 0.3763, "lr": 2.0879475773914167e-05, "epoch": 2.6845569620253165, "percentage": 53.74, "elapsed_time": "1:30:15", "remaining_time": "1:17:42"}
|
| 777 |
+
{"current_steps": 662, "total_steps": 1230, "loss": 0.3749, "lr": 2.082276853708978e-05, "epoch": 2.688607594936709, "percentage": 53.82, "elapsed_time": "1:30:39", "remaining_time": "1:17:47"}
|
| 778 |
+
{"current_steps": 663, "total_steps": 1230, "loss": 0.3754, "lr": 2.076605467380071e-05, "epoch": 2.692658227848101, "percentage": 53.9, "elapsed_time": "1:31:10", "remaining_time": "1:17:58"}
|
| 779 |
+
{"current_steps": 664, "total_steps": 1230, "loss": 0.3868, "lr": 2.0709334640812613e-05, "epoch": 2.6967088607594936, "percentage": 53.98, "elapsed_time": "1:31:45", "remaining_time": "1:18:13"}
|
| 780 |
+
{"current_steps": 665, "total_steps": 1230, "loss": 0.3862, "lr": 2.0652608894940824e-05, "epoch": 2.700759493670886, "percentage": 54.07, "elapsed_time": "1:32:18", "remaining_time": "1:18:25"}
|
| 781 |
+
{"current_steps": 666, "total_steps": 1230, "loss": 0.3726, "lr": 2.0595877893046722e-05, "epoch": 2.7048101265822786, "percentage": 54.15, "elapsed_time": "1:32:48", "remaining_time": "1:18:35"}
|
| 782 |
+
{"current_steps": 667, "total_steps": 1230, "loss": 0.3906, "lr": 2.0539142092033985e-05, "epoch": 2.708860759493671, "percentage": 54.23, "elapsed_time": "1:33:21", "remaining_time": "1:18:48"}
|
| 783 |
+
{"current_steps": 668, "total_steps": 1230, "loss": 0.3925, "lr": 2.048240194884496e-05, "epoch": 2.712911392405063, "percentage": 54.31, "elapsed_time": "1:33:53", "remaining_time": "1:18:59"}
|
| 784 |
+
{"current_steps": 669, "total_steps": 1230, "loss": 0.3809, "lr": 2.042565792045695e-05, "epoch": 2.7169620253164557, "percentage": 54.39, "elapsed_time": "1:34:27", "remaining_time": "1:19:12"}
|
| 785 |
+
{"current_steps": 670, "total_steps": 1230, "loss": 0.3856, "lr": 2.036891046387857e-05, "epoch": 2.721012658227848, "percentage": 54.47, "elapsed_time": "1:34:58", "remaining_time": "1:19:22"}
|
| 786 |
+
{"current_steps": 671, "total_steps": 1230, "loss": 0.3823, "lr": 2.0312160036146036e-05, "epoch": 2.7250632911392403, "percentage": 54.55, "elapsed_time": "1:35:34", "remaining_time": "1:19:37"}
|
| 787 |
+
{"current_steps": 672, "total_steps": 1230, "loss": 0.3906, "lr": 2.025540709431948e-05, "epoch": 2.729113924050633, "percentage": 54.63, "elapsed_time": "1:36:07", "remaining_time": "1:19:49"}
|
| 788 |
+
{"current_steps": 673, "total_steps": 1230, "loss": 0.3807, "lr": 2.0198652095479298e-05, "epoch": 2.7331645569620253, "percentage": 54.72, "elapsed_time": "1:36:41", "remaining_time": "1:20:01"}
|
| 789 |
+
{"current_steps": 674, "total_steps": 1230, "loss": 0.3746, "lr": 2.014189549672245e-05, "epoch": 2.737215189873418, "percentage": 54.8, "elapsed_time": "1:37:13", "remaining_time": "1:20:11"}
|
| 790 |
+
{"current_steps": 675, "total_steps": 1230, "loss": 0.3928, "lr": 2.0085137755158776e-05, "epoch": 2.7412658227848103, "percentage": 54.88, "elapsed_time": "1:37:49", "remaining_time": "1:20:26"}
|
| 791 |
+
{"current_steps": 676, "total_steps": 1230, "loss": 0.3902, "lr": 2.0028379327907327e-05, "epoch": 2.7453164556962024, "percentage": 54.96, "elapsed_time": "1:38:22", "remaining_time": "1:20:37"}
|
| 792 |
+
{"current_steps": 677, "total_steps": 1230, "loss": 0.3615, "lr": 1.9971620672092676e-05, "epoch": 2.749367088607595, "percentage": 55.04, "elapsed_time": "1:38:56", "remaining_time": "1:20:49"}
|
| 793 |
+
{"current_steps": 678, "total_steps": 1230, "loss": 0.4028, "lr": 1.991486224484123e-05, "epoch": 2.7534177215189874, "percentage": 55.12, "elapsed_time": "1:39:33", "remaining_time": "1:21:03"}
|
| 794 |
+
{"current_steps": 679, "total_steps": 1230, "loss": 0.3878, "lr": 1.985810450327756e-05, "epoch": 2.7574683544303795, "percentage": 55.2, "elapsed_time": "1:40:04", "remaining_time": "1:21:12"}
|
| 795 |
+
{"current_steps": 680, "total_steps": 1230, "loss": 0.3624, "lr": 1.9801347904520706e-05, "epoch": 2.761518987341772, "percentage": 55.28, "elapsed_time": "1:40:32", "remaining_time": "1:21:18"}
|
| 796 |
+
{"current_steps": 681, "total_steps": 1230, "loss": 0.3825, "lr": 1.974459290568053e-05, "epoch": 2.7655696202531646, "percentage": 55.37, "elapsed_time": "1:41:07", "remaining_time": "1:21:31"}
|
| 797 |
+
{"current_steps": 682, "total_steps": 1230, "loss": 0.362, "lr": 1.968783996385397e-05, "epoch": 2.769620253164557, "percentage": 55.45, "elapsed_time": "1:41:44", "remaining_time": "1:21:45"}
|
| 798 |
+
{"current_steps": 683, "total_steps": 1230, "loss": 0.378, "lr": 1.963108953612143e-05, "epoch": 2.7736708860759496, "percentage": 55.53, "elapsed_time": "1:42:15", "remaining_time": "1:21:53"}
|
| 799 |
+
{"current_steps": 684, "total_steps": 1230, "loss": 0.3718, "lr": 1.9574342079543056e-05, "epoch": 2.7777215189873417, "percentage": 55.61, "elapsed_time": "1:42:48", "remaining_time": "1:22:03"}
|
| 800 |
+
{"current_steps": 685, "total_steps": 1230, "loss": 0.3955, "lr": 1.9517598051155046e-05, "epoch": 2.781772151898734, "percentage": 55.69, "elapsed_time": "1:43:20", "remaining_time": "1:22:13"}
|
| 801 |
+
{"current_steps": 686, "total_steps": 1230, "loss": 0.3637, "lr": 1.9460857907966025e-05, "epoch": 2.7858227848101267, "percentage": 55.77, "elapsed_time": "1:43:55", "remaining_time": "1:22:24"}
|
| 802 |
+
{"current_steps": 687, "total_steps": 1230, "loss": 0.3636, "lr": 1.9404122106953285e-05, "epoch": 2.7898734177215188, "percentage": 55.85, "elapsed_time": "1:44:24", "remaining_time": "1:22:31"}
|
| 803 |
+
{"current_steps": 688, "total_steps": 1230, "loss": 0.3945, "lr": 1.9347391105059176e-05, "epoch": 2.7939240506329113, "percentage": 55.93, "elapsed_time": "1:44:58", "remaining_time": "1:22:41"}
|
| 804 |
+
{"current_steps": 689, "total_steps": 1230, "loss": 0.3827, "lr": 1.92906653591874e-05, "epoch": 2.797974683544304, "percentage": 56.02, "elapsed_time": "1:45:29", "remaining_time": "1:22:50"}
|
| 805 |
+
{"current_steps": 690, "total_steps": 1230, "loss": 0.3752, "lr": 1.9233945326199295e-05, "epoch": 2.8020253164556963, "percentage": 56.1, "elapsed_time": "1:46:00", "remaining_time": "1:22:57"}
|
| 806 |
+
{"current_steps": 691, "total_steps": 1230, "loss": 0.387, "lr": 1.917723146291022e-05, "epoch": 2.806075949367089, "percentage": 56.18, "elapsed_time": "1:46:36", "remaining_time": "1:23:09"}
|
| 807 |
+
{"current_steps": 692, "total_steps": 1230, "loss": 0.3785, "lr": 1.912052422608584e-05, "epoch": 2.810126582278481, "percentage": 56.26, "elapsed_time": "1:47:10", "remaining_time": "1:23:19"}
|
| 808 |
+
{"current_steps": 693, "total_steps": 1230, "loss": 0.4073, "lr": 1.9063824072438428e-05, "epoch": 2.8141772151898734, "percentage": 56.34, "elapsed_time": "1:47:44", "remaining_time": "1:23:29"}
|
| 809 |
+
{"current_steps": 694, "total_steps": 1230, "loss": 0.3517, "lr": 1.9007131458623246e-05, "epoch": 2.818227848101266, "percentage": 56.42, "elapsed_time": "1:48:10", "remaining_time": "1:23:32"}
|
| 810 |
+
{"current_steps": 695, "total_steps": 1230, "loss": 0.3842, "lr": 1.895044684123479e-05, "epoch": 2.822278481012658, "percentage": 56.5, "elapsed_time": "1:48:37", "remaining_time": "1:23:37"}
|
| 811 |
+
{"current_steps": 696, "total_steps": 1230, "loss": 0.3746, "lr": 1.8893770676803194e-05, "epoch": 2.8263291139240505, "percentage": 56.59, "elapsed_time": "1:49:08", "remaining_time": "1:23:44"}
|
| 812 |
+
{"current_steps": 697, "total_steps": 1230, "loss": 0.3587, "lr": 1.8837103421790486e-05, "epoch": 2.830379746835443, "percentage": 56.67, "elapsed_time": "1:49:41", "remaining_time": "1:23:53"}
|
| 813 |
+
{"current_steps": 698, "total_steps": 1230, "loss": 0.3673, "lr": 1.8780445532586952e-05, "epoch": 2.8344303797468355, "percentage": 56.75, "elapsed_time": "1:50:05", "remaining_time": "1:23:54"}
|
| 814 |
+
{"current_steps": 699, "total_steps": 1230, "loss": 0.3794, "lr": 1.872379746550743e-05, "epoch": 2.838481012658228, "percentage": 56.83, "elapsed_time": "1:50:37", "remaining_time": "1:24:02"}
|
| 815 |
+
{"current_steps": 700, "total_steps": 1230, "loss": 0.3983, "lr": 1.866715967678769e-05, "epoch": 2.84253164556962, "percentage": 56.91, "elapsed_time": "1:51:05", "remaining_time": "1:24:06"}
|
| 816 |
+
{"current_steps": 701, "total_steps": 1230, "loss": 0.3653, "lr": 1.861053262258067e-05, "epoch": 2.8465822784810126, "percentage": 56.99, "elapsed_time": "1:51:39", "remaining_time": "1:24:15"}
|
| 817 |
+
{"current_steps": 702, "total_steps": 1230, "loss": 0.3559, "lr": 1.8553916758952897e-05, "epoch": 2.850632911392405, "percentage": 57.07, "elapsed_time": "1:52:14", "remaining_time": "1:24:25"}
|
| 818 |
+
{"current_steps": 703, "total_steps": 1230, "loss": 0.39, "lr": 1.8497312541880735e-05, "epoch": 2.8546835443037972, "percentage": 57.15, "elapsed_time": "1:52:40", "remaining_time": "1:24:27"}
|
| 819 |
+
{"current_steps": 704, "total_steps": 1230, "loss": 0.3465, "lr": 1.8440720427246786e-05, "epoch": 2.8587341772151897, "percentage": 57.24, "elapsed_time": "1:53:10", "remaining_time": "1:24:33"}
|
| 820 |
+
{"current_steps": 705, "total_steps": 1230, "loss": 0.3752, "lr": 1.8384140870836157e-05, "epoch": 2.8627848101265823, "percentage": 57.32, "elapsed_time": "1:53:40", "remaining_time": "1:24:39"}
|
| 821 |
+
{"current_steps": 706, "total_steps": 1230, "loss": 0.3662, "lr": 1.8327574328332806e-05, "epoch": 2.8668354430379748, "percentage": 57.4, "elapsed_time": "1:54:09", "remaining_time": "1:24:43"}
|
| 822 |
+
{"current_steps": 707, "total_steps": 1230, "loss": 0.3769, "lr": 1.8271021255315906e-05, "epoch": 2.8708860759493673, "percentage": 57.48, "elapsed_time": "1:54:40", "remaining_time": "1:24:49"}
|
| 823 |
+
{"current_steps": 708, "total_steps": 1230, "loss": 0.3791, "lr": 1.8214482107256117e-05, "epoch": 2.8749367088607594, "percentage": 57.56, "elapsed_time": "1:55:11", "remaining_time": "1:24:56"}
|
| 824 |
+
{"current_steps": 709, "total_steps": 1230, "loss": 0.3874, "lr": 1.8157957339511968e-05, "epoch": 2.878987341772152, "percentage": 57.64, "elapsed_time": "1:55:41", "remaining_time": "1:25:00"}
|
| 825 |
+
{"current_steps": 710, "total_steps": 1230, "loss": 0.3747, "lr": 1.8101447407326182e-05, "epoch": 2.8830379746835444, "percentage": 57.72, "elapsed_time": "1:56:11", "remaining_time": "1:25:05"}
|
| 826 |
+
{"current_steps": 711, "total_steps": 1230, "loss": 0.3751, "lr": 1.8044952765821966e-05, "epoch": 2.8870886075949365, "percentage": 57.8, "elapsed_time": "1:56:42", "remaining_time": "1:25:11"}
|
| 827 |
+
{"current_steps": 712, "total_steps": 1230, "loss": 0.3993, "lr": 1.7988473869999407e-05, "epoch": 2.891139240506329, "percentage": 57.89, "elapsed_time": "1:57:18", "remaining_time": "1:25:20"}
|
| 828 |
+
{"current_steps": 713, "total_steps": 1230, "loss": 0.3855, "lr": 1.7932011174731764e-05, "epoch": 2.8951898734177215, "percentage": 57.97, "elapsed_time": "1:57:53", "remaining_time": "1:25:29"}
|
| 829 |
+
{"current_steps": 714, "total_steps": 1230, "loss": 0.3599, "lr": 1.7875565134761817e-05, "epoch": 2.899240506329114, "percentage": 58.05, "elapsed_time": "1:58:22", "remaining_time": "1:25:33"}
|
| 830 |
+
{"current_steps": 715, "total_steps": 1230, "loss": 0.368, "lr": 1.7819136204698226e-05, "epoch": 2.9032911392405065, "percentage": 58.13, "elapsed_time": "1:58:53", "remaining_time": "1:25:38"}
|
| 831 |
+
{"current_steps": 716, "total_steps": 1230, "loss": 0.3582, "lr": 1.776272483901182e-05, "epoch": 2.9073417721518986, "percentage": 58.21, "elapsed_time": "1:59:27", "remaining_time": "1:25:45"}
|
| 832 |
+
{"current_steps": 717, "total_steps": 1230, "loss": 0.343, "lr": 1.7706331492031995e-05, "epoch": 2.911392405063291, "percentage": 58.29, "elapsed_time": "1:59:56", "remaining_time": "1:25:48"}
|
| 833 |
+
{"current_steps": 718, "total_steps": 1230, "loss": 0.4067, "lr": 1.764995661794301e-05, "epoch": 2.9154430379746836, "percentage": 58.37, "elapsed_time": "2:00:31", "remaining_time": "1:25:56"}
|
| 834 |
+
{"current_steps": 719, "total_steps": 1230, "loss": 0.393, "lr": 1.759360067078035e-05, "epoch": 2.9194936708860757, "percentage": 58.46, "elapsed_time": "2:01:07", "remaining_time": "1:26:04"}
|
| 835 |
+
{"current_steps": 720, "total_steps": 1230, "loss": 0.3943, "lr": 1.7537264104427064e-05, "epoch": 2.923544303797468, "percentage": 58.54, "elapsed_time": "2:01:46", "remaining_time": "1:26:15"}
|
| 836 |
+
{"current_steps": 721, "total_steps": 1230, "loss": 0.3808, "lr": 1.748094737261012e-05, "epoch": 2.9275949367088607, "percentage": 58.62, "elapsed_time": "2:02:20", "remaining_time": "1:26:21"}
|
| 837 |
+
{"current_steps": 722, "total_steps": 1230, "loss": 0.3883, "lr": 1.7424650928896726e-05, "epoch": 2.9316455696202532, "percentage": 58.7, "elapsed_time": "2:02:56", "remaining_time": "1:26:29"}
|
| 838 |
+
{"current_steps": 723, "total_steps": 1230, "loss": 0.3841, "lr": 1.7368375226690712e-05, "epoch": 2.9356962025316458, "percentage": 58.78, "elapsed_time": "2:03:32", "remaining_time": "1:26:37"}
|
| 839 |
+
{"current_steps": 724, "total_steps": 1230, "loss": 0.3652, "lr": 1.731212071922883e-05, "epoch": 2.939746835443038, "percentage": 58.86, "elapsed_time": "2:03:58", "remaining_time": "1:26:38"}
|
| 840 |
+
{"current_steps": 725, "total_steps": 1230, "loss": 0.3591, "lr": 1.7255887859577156e-05, "epoch": 2.9437974683544303, "percentage": 58.94, "elapsed_time": "2:04:29", "remaining_time": "1:26:42"}
|
| 841 |
+
{"current_steps": 726, "total_steps": 1230, "loss": 0.3516, "lr": 1.7199677100627427e-05, "epoch": 2.947848101265823, "percentage": 59.02, "elapsed_time": "2:05:00", "remaining_time": "1:26:47"}
|
| 842 |
+
{"current_steps": 727, "total_steps": 1230, "loss": 0.3657, "lr": 1.7143488895093343e-05, "epoch": 2.951898734177215, "percentage": 59.11, "elapsed_time": "2:05:32", "remaining_time": "1:26:51"}
|
| 843 |
+
{"current_steps": 728, "total_steps": 1230, "loss": 0.4001, "lr": 1.7087323695506994e-05, "epoch": 2.9559493670886074, "percentage": 59.19, "elapsed_time": "2:05:59", "remaining_time": "1:26:52"}
|
| 844 |
+
{"current_steps": 729, "total_steps": 1230, "loss": 0.3876, "lr": 1.7031181954215194e-05, "epoch": 2.96, "percentage": 59.27, "elapsed_time": "2:06:31", "remaining_time": "1:26:57"}
|
| 845 |
+
{"current_steps": 730, "total_steps": 1230, "loss": 0.3724, "lr": 1.6975064123375788e-05, "epoch": 2.9640506329113925, "percentage": 59.35, "elapsed_time": "2:07:03", "remaining_time": "1:27:01"}
|
| 846 |
+
{"current_steps": 731, "total_steps": 1230, "loss": 0.3781, "lr": 1.6918970654954084e-05, "epoch": 2.968101265822785, "percentage": 59.43, "elapsed_time": "2:07:39", "remaining_time": "1:27:08"}
|
| 847 |
+
{"current_steps": 732, "total_steps": 1230, "loss": 0.3777, "lr": 1.686290200071915e-05, "epoch": 2.972151898734177, "percentage": 59.51, "elapsed_time": "2:08:14", "remaining_time": "1:27:14"}
|
| 848 |
+
{"current_steps": 733, "total_steps": 1230, "loss": 0.3842, "lr": 1.6806858612240234e-05, "epoch": 2.9762025316455696, "percentage": 59.59, "elapsed_time": "2:08:45", "remaining_time": "1:27:18"}
|
| 849 |
+
{"current_steps": 734, "total_steps": 1230, "loss": 0.3711, "lr": 1.6750840940883078e-05, "epoch": 2.980253164556962, "percentage": 59.67, "elapsed_time": "2:09:24", "remaining_time": "1:27:26"}
|
| 850 |
+
{"current_steps": 735, "total_steps": 1230, "loss": 0.3679, "lr": 1.6694849437806305e-05, "epoch": 2.984303797468354, "percentage": 59.76, "elapsed_time": "2:10:02", "remaining_time": "1:27:34"}
|
| 851 |
+
{"current_steps": 736, "total_steps": 1230, "loss": 0.3704, "lr": 1.663888455395778e-05, "epoch": 2.9883544303797467, "percentage": 59.84, "elapsed_time": "2:10:37", "remaining_time": "1:27:40"}
|
| 852 |
+
{"current_steps": 737, "total_steps": 1230, "loss": 0.3671, "lr": 1.6582946740070995e-05, "epoch": 2.992405063291139, "percentage": 59.92, "elapsed_time": "2:11:08", "remaining_time": "1:27:43"}
|
| 853 |
+
{"current_steps": 738, "total_steps": 1230, "loss": 0.3718, "lr": 1.6527036446661396e-05, "epoch": 2.9964556962025317, "percentage": 60.0, "elapsed_time": "2:11:38", "remaining_time": "1:27:45"}
|
| 854 |
+
{"current_steps": 739, "total_steps": 1230, "loss": 0.3772, "lr": 1.6471154124022818e-05, "epoch": 3.0005063291139242, "percentage": 60.08, "elapsed_time": "2:14:34", "remaining_time": "1:29:24"}
|
| 855 |
+
{"current_steps": 740, "total_steps": 1230, "loss": 0.2749, "lr": 1.6415300222223788e-05, "epoch": 3.0045569620253163, "percentage": 60.16, "elapsed_time": "2:15:08", "remaining_time": "1:29:28"}
|
| 856 |
+
{"current_steps": 741, "total_steps": 1230, "loss": 0.275, "lr": 1.6359475191103958e-05, "epoch": 3.008607594936709, "percentage": 60.24, "elapsed_time": "2:15:37", "remaining_time": "1:29:29"}
|
| 857 |
+
{"current_steps": 742, "total_steps": 1230, "loss": 0.2584, "lr": 1.6303679480270466e-05, "epoch": 3.0126582278481013, "percentage": 60.33, "elapsed_time": "2:16:06", "remaining_time": "1:29:31"}
|
| 858 |
+
{"current_steps": 743, "total_steps": 1230, "loss": 0.2682, "lr": 1.624791353909428e-05, "epoch": 3.016708860759494, "percentage": 60.41, "elapsed_time": "2:16:42", "remaining_time": "1:29:36"}
|
| 859 |
+
{"current_steps": 744, "total_steps": 1230, "loss": 0.2685, "lr": 1.619217781670663e-05, "epoch": 3.020759493670886, "percentage": 60.49, "elapsed_time": "2:17:13", "remaining_time": "1:29:38"}
|
| 860 |
+
{"current_steps": 745, "total_steps": 1230, "loss": 0.2529, "lr": 1.6136472761995373e-05, "epoch": 3.0248101265822784, "percentage": 60.57, "elapsed_time": "2:17:42", "remaining_time": "1:29:38"}
|
training_args.bin
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
-
size
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:a961807021211f5b4e41fd67326ded975493ba88dc18767826c2d605f7cbdbbd
|
| 3 |
+
size 7352
|