Training in progress, epoch 2
Browse files- model-00001-of-00004.safetensors +1 -1
- model-00002-of-00004.safetensors +1 -1
- model-00003-of-00004.safetensors +1 -1
- model-00004-of-00004.safetensors +1 -1
- trainer_log.jsonl +313 -0
- training_args.bin +1 -1
model-00001-of-00004.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 4877660776
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:8c5ea0452a712a9573209f711abe0c32f612258f0c1aada898967953834241f1
|
| 3 |
size 4877660776
|
model-00002-of-00004.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 4932751008
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:3821ff2311e5726f08585ec497859aa4bcd6cc145d4fa36005ada8da2534e1c2
|
| 3 |
size 4932751008
|
model-00003-of-00004.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 4330865200
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:ace206dcd8b8fa3b55a0f48f96a33a3dae36964b339cfeb2733015ee8e1678d7
|
| 3 |
size 4330865200
|
model-00004-of-00004.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 1089994880
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:dbda001c85a29bd1c17927101ca90553ddbd51d26ff7e00b809a3367a1fbd2ca
|
| 3 |
size 1089994880
|
trainer_log.jsonl
CHANGED
|
@@ -1083,3 +1083,316 @@
|
|
| 1083 |
{"current_steps": 588, "total_steps": 1230, "loss": 0.2393, "lr": 2.4970499141404942e-05, "epoch": 2.3848101265822783, "percentage": 47.8, "elapsed_time": "13:58:01", "remaining_time": "15:14:58"}
|
| 1084 |
{"current_steps": 496, "total_steps": 1230, "loss": 0.2479, "lr": 2.980274210295326e-05, "epoch": 2.012151898734177, "percentage": 40.33, "elapsed_time": "11:47:43", "remaining_time": "17:27:19"}
|
| 1085 |
{"current_steps": 589, "total_steps": 1230, "loss": 0.2506, "lr": 2.491550129992345e-05, "epoch": 2.388860759493671, "percentage": 47.89, "elapsed_time": "13:59:28", "remaining_time": "15:13:35"}
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1083 |
{"current_steps": 588, "total_steps": 1230, "loss": 0.2393, "lr": 2.4970499141404942e-05, "epoch": 2.3848101265822783, "percentage": 47.8, "elapsed_time": "13:58:01", "remaining_time": "15:14:58"}
|
| 1084 |
{"current_steps": 496, "total_steps": 1230, "loss": 0.2479, "lr": 2.980274210295326e-05, "epoch": 2.012151898734177, "percentage": 40.33, "elapsed_time": "11:47:43", "remaining_time": "17:27:19"}
|
| 1085 |
{"current_steps": 589, "total_steps": 1230, "loss": 0.2506, "lr": 2.491550129992345e-05, "epoch": 2.388860759493671, "percentage": 47.89, "elapsed_time": "13:59:28", "remaining_time": "15:13:35"}
|
| 1086 |
+
{"current_steps": 497, "total_steps": 1230, "loss": 0.2384, "lr": 2.9753229259313578e-05, "epoch": 2.0162025316455696, "percentage": 40.41, "elapsed_time": "11:49:12", "remaining_time": "17:25:58"}
|
| 1087 |
+
{"current_steps": 590, "total_steps": 1230, "loss": 0.2602, "lr": 2.486046386967024e-05, "epoch": 2.3929113924050633, "percentage": 47.97, "elapsed_time": "14:01:00", "remaining_time": "15:12:16"}
|
| 1088 |
+
{"current_steps": 498, "total_steps": 1230, "loss": 0.2398, "lr": 2.9703637864506274e-05, "epoch": 2.020253164556962, "percentage": 40.49, "elapsed_time": "11:50:26", "remaining_time": "17:24:15"}
|
| 1089 |
+
{"current_steps": 591, "total_steps": 1230, "loss": 0.252, "lr": 2.4805387293909214e-05, "epoch": 2.396962025316456, "percentage": 48.05, "elapsed_time": "14:02:28", "remaining_time": "15:10:53"}
|
| 1090 |
+
{"current_steps": 499, "total_steps": 1230, "loss": 0.2598, "lr": 2.965396831793362e-05, "epoch": 2.0243037974683546, "percentage": 40.57, "elapsed_time": "11:52:08", "remaining_time": "17:23:14"}
|
| 1091 |
+
{"current_steps": 592, "total_steps": 1230, "loss": 0.2757, "lr": 2.4750272016219552e-05, "epoch": 2.401012658227848, "percentage": 48.13, "elapsed_time": "14:04:01", "remaining_time": "15:09:36"}
|
| 1092 |
+
{"current_steps": 500, "total_steps": 1230, "loss": 0.2344, "lr": 2.9604221019627316e-05, "epoch": 2.0283544303797467, "percentage": 40.65, "elapsed_time": "11:53:34", "remaining_time": "17:21:49"}
|
| 1093 |
+
{"current_steps": 593, "total_steps": 1230, "loss": 0.2343, "lr": 2.4695118480492114e-05, "epoch": 2.4050632911392404, "percentage": 48.21, "elapsed_time": "14:05:13", "remaining_time": "15:07:56"}
|
| 1094 |
+
{"current_steps": 501, "total_steps": 1230, "loss": 0.2568, "lr": 2.955439637024526e-05, "epoch": 2.0324050632911392, "percentage": 40.73, "elapsed_time": "11:54:56", "remaining_time": "17:20:18"}
|
| 1095 |
+
{"current_steps": 594, "total_steps": 1230, "loss": 0.2608, "lr": 2.4639927130925898e-05, "epoch": 2.409113924050633, "percentage": 48.29, "elapsed_time": "14:06:46", "remaining_time": "15:06:39"}
|
| 1096 |
+
{"current_steps": 502, "total_steps": 1230, "loss": 0.2622, "lr": 2.9504494771068334e-05, "epoch": 2.0364556962025318, "percentage": 40.81, "elapsed_time": "11:56:16", "remaining_time": "17:18:44"}
|
| 1097 |
+
{"current_steps": 595, "total_steps": 1230, "loss": 0.2424, "lr": 2.458469841202444e-05, "epoch": 2.4131645569620255, "percentage": 48.37, "elapsed_time": "14:08:00", "remaining_time": "15:05:00"}
|
| 1098 |
+
{"current_steps": 503, "total_steps": 1230, "loss": 0.2345, "lr": 2.9454516623997156e-05, "epoch": 2.0405063291139243, "percentage": 40.89, "elapsed_time": "11:57:35", "remaining_time": "17:17:09"}
|
| 1099 |
+
{"current_steps": 596, "total_steps": 1230, "loss": 0.2488, "lr": 2.452943276859226e-05, "epoch": 2.4172151898734175, "percentage": 48.46, "elapsed_time": "14:09:22", "remaining_time": "15:03:32"}
|
| 1100 |
+
{"current_steps": 504, "total_steps": 1230, "loss": 0.2347, "lr": 2.9404462331548847e-05, "epoch": 2.0445569620253163, "percentage": 40.98, "elapsed_time": "11:58:49", "remaining_time": "17:15:27"}
|
| 1101 |
+
{"current_steps": 597, "total_steps": 1230, "loss": 0.2456, "lr": 2.447413064573125e-05, "epoch": 2.42126582278481, "percentage": 48.54, "elapsed_time": "14:10:38", "remaining_time": "15:01:56"}
|
| 1102 |
+
{"current_steps": 505, "total_steps": 1230, "loss": 0.2599, "lr": 2.93543322968538e-05, "epoch": 2.048607594936709, "percentage": 41.06, "elapsed_time": "12:00:26", "remaining_time": "17:14:18"}
|
| 1103 |
+
{"current_steps": 598, "total_steps": 1230, "loss": 0.2332, "lr": 2.4418792488837095e-05, "epoch": 2.4253164556962026, "percentage": 48.62, "elapsed_time": "14:11:39", "remaining_time": "15:00:05"}
|
| 1104 |
+
{"current_steps": 599, "total_steps": 1230, "loss": 0.2348, "lr": 2.4363418743595713e-05, "epoch": 2.429367088607595, "percentage": 48.7, "elapsed_time": "14:12:54", "remaining_time": "14:58:28"}
|
| 1105 |
+
{"current_steps": 506, "total_steps": 1230, "loss": 0.2412, "lr": 2.9304126923652428e-05, "epoch": 2.0526582278481014, "percentage": 41.14, "elapsed_time": "12:02:11", "remaining_time": "17:13:20"}
|
| 1106 |
+
{"current_steps": 600, "total_steps": 1230, "loss": 0.2435, "lr": 2.430800985597963e-05, "epoch": 2.433417721518987, "percentage": 48.78, "elapsed_time": "14:14:20", "remaining_time": "14:57:03"}
|
| 1107 |
+
{"current_steps": 507, "total_steps": 1230, "loss": 0.2787, "lr": 2.9253846616291896e-05, "epoch": 2.056708860759494, "percentage": 41.22, "elapsed_time": "12:03:39", "remaining_time": "17:11:57"}
|
| 1108 |
+
{"current_steps": 601, "total_steps": 1230, "loss": 0.274, "lr": 2.4252566272244415e-05, "epoch": 2.4374683544303797, "percentage": 48.86, "elapsed_time": "14:15:58", "remaining_time": "14:55:51"}
|
| 1109 |
+
{"current_steps": 508, "total_steps": 1230, "loss": 0.2412, "lr": 2.9203491779722896e-05, "epoch": 2.060759493670886, "percentage": 41.3, "elapsed_time": "12:04:52", "remaining_time": "17:10:13"}
|
| 1110 |
+
{"current_steps": 509, "total_steps": 1230, "loss": 0.2539, "lr": 2.9153062819496357e-05, "epoch": 2.0648101265822785, "percentage": 41.38, "elapsed_time": "12:06:01", "remaining_time": "17:08:25"}
|
| 1111 |
+
{"current_steps": 602, "total_steps": 1230, "loss": 0.2681, "lr": 2.4197088438925063e-05, "epoch": 2.441518987341772, "percentage": 48.94, "elapsed_time": "14:17:27", "remaining_time": "14:54:29"}
|
| 1112 |
+
{"current_steps": 510, "total_steps": 1230, "loss": 0.2396, "lr": 2.9102560141760178e-05, "epoch": 2.068860759493671, "percentage": 41.46, "elapsed_time": "12:07:17", "remaining_time": "17:06:45"}
|
| 1113 |
+
{"current_steps": 603, "total_steps": 1230, "loss": 0.2682, "lr": 2.4141576802832417e-05, "epoch": 2.4455696202531647, "percentage": 49.02, "elapsed_time": "14:19:01", "remaining_time": "14:53:12"}
|
| 1114 |
+
{"current_steps": 511, "total_steps": 1230, "loss": 0.257, "lr": 2.9051984153256004e-05, "epoch": 2.0729113924050635, "percentage": 41.54, "elapsed_time": "12:08:46", "remaining_time": "17:05:25"}
|
| 1115 |
+
{"current_steps": 604, "total_steps": 1230, "loss": 0.2531, "lr": 2.408603181104957e-05, "epoch": 2.449620253164557, "percentage": 49.11, "elapsed_time": "14:20:34", "remaining_time": "14:51:54"}
|
| 1116 |
+
{"current_steps": 512, "total_steps": 1230, "loss": 0.2628, "lr": 2.900133526131588e-05, "epoch": 2.0769620253164556, "percentage": 41.63, "elapsed_time": "12:10:08", "remaining_time": "17:03:54"}
|
| 1117 |
+
{"current_steps": 605, "total_steps": 1230, "loss": 0.259, "lr": 2.4030453910928245e-05, "epoch": 2.4536708860759493, "percentage": 49.19, "elapsed_time": "14:21:48", "remaining_time": "14:50:17"}
|
| 1118 |
+
{"current_steps": 513, "total_steps": 1230, "loss": 0.2552, "lr": 2.8950613873859025e-05, "epoch": 2.081012658227848, "percentage": 41.71, "elapsed_time": "12:11:48", "remaining_time": "17:02:48"}
|
| 1119 |
+
{"current_steps": 606, "total_steps": 1230, "loss": 0.2289, "lr": 2.397484355008521e-05, "epoch": 2.457721518987342, "percentage": 49.27, "elapsed_time": "14:23:02", "remaining_time": "14:48:40"}
|
| 1120 |
+
{"current_steps": 607, "total_steps": 1230, "loss": 0.2524, "lr": 2.3919201176398662e-05, "epoch": 2.4617721518987343, "percentage": 49.35, "elapsed_time": "14:24:14", "remaining_time": "14:47:00"}
|
| 1121 |
+
{"current_steps": 514, "total_steps": 1230, "loss": 0.2449, "lr": 2.8899820399388515e-05, "epoch": 2.0850632911392406, "percentage": 41.79, "elapsed_time": "12:13:21", "remaining_time": "17:01:33"}
|
| 1122 |
+
{"current_steps": 608, "total_steps": 1230, "loss": 0.2809, "lr": 2.3863527238004633e-05, "epoch": 2.4658227848101264, "percentage": 49.43, "elapsed_time": "14:25:58", "remaining_time": "14:45:55"}
|
| 1123 |
+
{"current_steps": 515, "total_steps": 1230, "loss": 0.2483, "lr": 2.8848955246988012e-05, "epoch": 2.089113924050633, "percentage": 41.87, "elapsed_time": "12:14:58", "remaining_time": "17:00:24"}
|
| 1124 |
+
{"current_steps": 609, "total_steps": 1230, "loss": 0.24, "lr": 2.380782218329337e-05, "epoch": 2.469873417721519, "percentage": 49.51, "elapsed_time": "14:27:23", "remaining_time": "14:44:28"}
|
| 1125 |
+
{"current_steps": 516, "total_steps": 1230, "loss": 0.2347, "lr": 2.879801882631847e-05, "epoch": 2.093164556962025, "percentage": 41.95, "elapsed_time": "12:16:20", "remaining_time": "16:58:53"}
|
| 1126 |
+
{"current_steps": 517, "total_steps": 1230, "loss": 0.2308, "lr": 2.8747011547614808e-05, "epoch": 2.0972151898734177, "percentage": 42.03, "elapsed_time": "12:17:32", "remaining_time": "16:57:09"}
|
| 1127 |
+
{"current_steps": 610, "total_steps": 1230, "loss": 0.2611, "lr": 2.3752086460905725e-05, "epoch": 2.4739240506329114, "percentage": 49.59, "elapsed_time": "14:29:01", "remaining_time": "14:43:16"}
|
| 1128 |
+
{"current_steps": 518, "total_steps": 1230, "loss": 0.2556, "lr": 2.8695933821682635e-05, "epoch": 2.1012658227848102, "percentage": 42.11, "elapsed_time": "12:19:07", "remaining_time": "16:55:56"}
|
| 1129 |
+
{"current_steps": 611, "total_steps": 1230, "loss": 0.2617, "lr": 2.3696320519729544e-05, "epoch": 2.477974683544304, "percentage": 49.67, "elapsed_time": "14:30:22", "remaining_time": "14:41:46"}
|
| 1130 |
+
{"current_steps": 519, "total_steps": 1230, "loss": 0.2395, "lr": 2.864478605989494e-05, "epoch": 2.1053164556962027, "percentage": 42.2, "elapsed_time": "12:20:08", "remaining_time": "16:53:56"}
|
| 1131 |
+
{"current_steps": 612, "total_steps": 1230, "loss": 0.2468, "lr": 2.3640524808896045e-05, "epoch": 2.482025316455696, "percentage": 49.76, "elapsed_time": "14:31:41", "remaining_time": "14:40:14"}
|
| 1132 |
+
{"current_steps": 520, "total_steps": 1230, "loss": 0.2537, "lr": 2.8593568674188765e-05, "epoch": 2.109367088607595, "percentage": 42.28, "elapsed_time": "12:21:27", "remaining_time": "16:52:23"}
|
| 1133 |
+
{"current_steps": 613, "total_steps": 1230, "loss": 0.2401, "lr": 2.3584699777776222e-05, "epoch": 2.4860759493670885, "percentage": 49.84, "elapsed_time": "14:32:52", "remaining_time": "14:38:34"}
|
| 1134 |
+
{"current_steps": 521, "total_steps": 1230, "loss": 0.2298, "lr": 2.8542282077061892e-05, "epoch": 2.1134177215189873, "percentage": 42.36, "elapsed_time": "12:22:44", "remaining_time": "16:50:45"}
|
| 1135 |
+
{"current_steps": 614, "total_steps": 1230, "loss": 0.247, "lr": 2.3528845875977195e-05, "epoch": 2.490126582278481, "percentage": 49.92, "elapsed_time": "14:34:13", "remaining_time": "14:37:04"}
|
| 1136 |
+
{"current_steps": 522, "total_steps": 1230, "loss": 0.2342, "lr": 2.8490926681569523e-05, "epoch": 2.11746835443038, "percentage": 42.44, "elapsed_time": "12:24:02", "remaining_time": "16:49:08"}
|
| 1137 |
+
{"current_steps": 615, "total_steps": 1230, "loss": 0.2568, "lr": 2.3472963553338614e-05, "epoch": 2.4941772151898736, "percentage": 50.0, "elapsed_time": "14:35:33", "remaining_time": "14:35:33"}
|
| 1138 |
+
{"current_steps": 523, "total_steps": 1230, "loss": 0.2356, "lr": 2.8439502901320956e-05, "epoch": 2.1215189873417724, "percentage": 42.52, "elapsed_time": "12:25:22", "remaining_time": "16:47:36"}
|
| 1139 |
+
{"current_steps": 616, "total_steps": 1230, "loss": 0.2484, "lr": 2.341705325992901e-05, "epoch": 2.4982278481012656, "percentage": 50.08, "elapsed_time": "14:36:50", "remaining_time": "14:33:59"}
|
| 1140 |
+
{"current_steps": 617, "total_steps": 1230, "loss": 0.2364, "lr": 2.336111544604222e-05, "epoch": 2.502278481012658, "percentage": 50.16, "elapsed_time": "14:38:03", "remaining_time": "14:32:21"}
|
| 1141 |
+
{"current_steps": 524, "total_steps": 1230, "loss": 0.2504, "lr": 2.8388011150476237e-05, "epoch": 2.1255696202531644, "percentage": 42.6, "elapsed_time": "12:26:57", "remaining_time": "16:46:23"}
|
| 1142 |
+
{"current_steps": 618, "total_steps": 1230, "loss": 0.235, "lr": 2.33051505621937e-05, "epoch": 2.5063291139240507, "percentage": 50.24, "elapsed_time": "14:39:12", "remaining_time": "14:30:40"}
|
| 1143 |
+
{"current_steps": 525, "total_steps": 1230, "loss": 0.2473, "lr": 2.8336451843742866e-05, "epoch": 2.129620253164557, "percentage": 42.68, "elapsed_time": "12:28:19", "remaining_time": "16:44:53"}
|
| 1144 |
+
{"current_steps": 619, "total_steps": 1230, "loss": 0.2351, "lr": 2.324915905911693e-05, "epoch": 2.510379746835443, "percentage": 50.33, "elapsed_time": "14:40:35", "remaining_time": "14:29:12"}
|
| 1145 |
+
{"current_steps": 526, "total_steps": 1230, "loss": 0.2611, "lr": 2.8284825396372387e-05, "epoch": 2.1336708860759495, "percentage": 42.76, "elapsed_time": "12:30:11", "remaining_time": "16:44:03"}
|
| 1146 |
+
{"current_steps": 620, "total_steps": 1230, "loss": 0.2782, "lr": 2.319314138775977e-05, "epoch": 2.5144303797468357, "percentage": 50.41, "elapsed_time": "14:42:22", "remaining_time": "14:28:08"}
|
| 1147 |
+
{"current_steps": 527, "total_steps": 1230, "loss": 0.2611, "lr": 2.8233132224157132e-05, "epoch": 2.137721518987342, "percentage": 42.85, "elapsed_time": "12:31:33", "remaining_time": "16:42:32"}
|
| 1148 |
+
{"current_steps": 621, "total_steps": 1230, "loss": 0.254, "lr": 2.3137097999280856e-05, "epoch": 2.5184810126582278, "percentage": 50.49, "elapsed_time": "14:43:48", "remaining_time": "14:26:44"}
|
| 1149 |
+
{"current_steps": 528, "total_steps": 1230, "loss": 0.2461, "lr": 2.8181372743426805e-05, "epoch": 2.141772151898734, "percentage": 42.93, "elapsed_time": "12:32:45", "remaining_time": "16:40:49"}
|
| 1150 |
+
{"current_steps": 529, "total_steps": 1230, "loss": 0.2551, "lr": 2.8129547371045128e-05, "epoch": 2.1458227848101266, "percentage": 43.01, "elapsed_time": "12:34:02", "remaining_time": "16:39:12"}
|
| 1151 |
+
{"current_steps": 622, "total_steps": 1230, "loss": 0.2358, "lr": 2.308102934504593e-05, "epoch": 2.5225316455696203, "percentage": 50.57, "elapsed_time": "14:45:17", "remaining_time": "14:25:22"}
|
| 1152 |
+
{"current_steps": 530, "total_steps": 1230, "loss": 0.2567, "lr": 2.8077656524406534e-05, "epoch": 2.149873417721519, "percentage": 43.09, "elapsed_time": "12:35:24", "remaining_time": "16:37:42"}
|
| 1153 |
+
{"current_steps": 623, "total_steps": 1230, "loss": 0.2593, "lr": 2.3024935876624222e-05, "epoch": 2.526582278481013, "percentage": 50.65, "elapsed_time": "14:46:49", "remaining_time": "14:24:02"}
|
| 1154 |
+
{"current_steps": 531, "total_steps": 1230, "loss": 0.2506, "lr": 2.802570062143278e-05, "epoch": 2.1539240506329116, "percentage": 43.17, "elapsed_time": "12:36:54", "remaining_time": "16:36:23"}
|
| 1155 |
+
{"current_steps": 624, "total_steps": 1230, "loss": 0.2268, "lr": 2.2968818045784813e-05, "epoch": 2.530632911392405, "percentage": 50.73, "elapsed_time": "14:48:10", "remaining_time": "14:22:32"}
|
| 1156 |
+
{"current_steps": 532, "total_steps": 1230, "loss": 0.2275, "lr": 2.7973680080569555e-05, "epoch": 2.1579746835443037, "percentage": 43.25, "elapsed_time": "12:38:06", "remaining_time": "16:34:39"}
|
| 1157 |
+
{"current_steps": 625, "total_steps": 1230, "loss": 0.2587, "lr": 2.2912676304493006e-05, "epoch": 2.5346835443037974, "percentage": 50.81, "elapsed_time": "14:49:38", "remaining_time": "14:21:10"}
|
| 1158 |
+
{"current_steps": 533, "total_steps": 1230, "loss": 0.2364, "lr": 2.792159532078314e-05, "epoch": 2.162025316455696, "percentage": 43.33, "elapsed_time": "12:39:18", "remaining_time": "16:32:56"}
|
| 1159 |
+
{"current_steps": 626, "total_steps": 1230, "loss": 0.2628, "lr": 2.2856511104906668e-05, "epoch": 2.53873417721519, "percentage": 50.89, "elapsed_time": "14:51:03", "remaining_time": "14:19:44"}
|
| 1160 |
+
{"current_steps": 534, "total_steps": 1230, "loss": 0.2369, "lr": 2.7869446761557033e-05, "epoch": 2.1660759493670887, "percentage": 43.41, "elapsed_time": "12:40:20", "remaining_time": "16:31:00"}
|
| 1161 |
+
{"current_steps": 627, "total_steps": 1230, "loss": 0.2585, "lr": 2.2800322899372586e-05, "epoch": 2.5427848101265824, "percentage": 50.98, "elapsed_time": "14:52:18", "remaining_time": "14:18:09"}
|
| 1162 |
+
{"current_steps": 535, "total_steps": 1230, "loss": 0.2469, "lr": 2.781723482288857e-05, "epoch": 2.170126582278481, "percentage": 43.5, "elapsed_time": "12:41:35", "remaining_time": "16:29:21"}
|
| 1163 |
+
{"current_steps": 628, "total_steps": 1230, "loss": 0.2409, "lr": 2.2744112140422844e-05, "epoch": 2.546835443037975, "percentage": 51.06, "elapsed_time": "14:53:25", "remaining_time": "14:16:26"}
|
| 1164 |
+
{"current_steps": 536, "total_steps": 1230, "loss": 0.2665, "lr": 2.7764959925285517e-05, "epoch": 2.1741772151898733, "percentage": 43.58, "elapsed_time": "12:42:47", "remaining_time": "16:27:39"}
|
| 1165 |
+
{"current_steps": 629, "total_steps": 1230, "loss": 0.2487, "lr": 2.2687879280771177e-05, "epoch": 2.550886075949367, "percentage": 51.14, "elapsed_time": "14:54:49", "remaining_time": "14:14:59"}
|
| 1166 |
+
{"current_steps": 537, "total_steps": 1230, "loss": 0.2563, "lr": 2.771262248976272e-05, "epoch": 2.178227848101266, "percentage": 43.66, "elapsed_time": "12:44:04", "remaining_time": "16:26:02"}
|
| 1167 |
+
{"current_steps": 630, "total_steps": 1230, "loss": 0.2355, "lr": 2.26316247733093e-05, "epoch": 2.5549367088607595, "percentage": 51.22, "elapsed_time": "14:56:00", "remaining_time": "14:13:20"}
|
| 1168 |
+
{"current_steps": 538, "total_steps": 1230, "loss": 0.2596, "lr": 2.7660222937838677e-05, "epoch": 2.1822784810126583, "percentage": 43.74, "elapsed_time": "12:45:29", "remaining_time": "16:24:36"}
|
| 1169 |
+
{"current_steps": 631, "total_steps": 1230, "loss": 0.2459, "lr": 2.257534907110328e-05, "epoch": 2.558987341772152, "percentage": 51.3, "elapsed_time": "14:57:33", "remaining_time": "14:12:02"}
|
| 1170 |
+
{"current_steps": 539, "total_steps": 1230, "loss": 0.2411, "lr": 2.7607761691532186e-05, "epoch": 2.186329113924051, "percentage": 43.82, "elapsed_time": "12:46:41", "remaining_time": "16:22:54"}
|
| 1171 |
+
{"current_steps": 632, "total_steps": 1230, "loss": 0.2487, "lr": 2.2519052627389882e-05, "epoch": 2.563037974683544, "percentage": 51.38, "elapsed_time": "14:59:09", "remaining_time": "14:10:47"}
|
| 1172 |
+
{"current_steps": 540, "total_steps": 1230, "loss": 0.238, "lr": 2.7555239173358916e-05, "epoch": 2.190379746835443, "percentage": 43.9, "elapsed_time": "12:48:02", "remaining_time": "16:21:22"}
|
| 1173 |
+
{"current_steps": 633, "total_steps": 1230, "loss": 0.2266, "lr": 2.246273589557294e-05, "epoch": 2.5670886075949366, "percentage": 51.46, "elapsed_time": "15:00:24", "remaining_time": "14:09:12"}
|
| 1174 |
+
{"current_steps": 541, "total_steps": 1230, "loss": 0.2583, "lr": 2.7502655806328e-05, "epoch": 2.1944303797468354, "percentage": 43.98, "elapsed_time": "12:49:29", "remaining_time": "16:19:59"}
|
| 1175 |
+
{"current_steps": 634, "total_steps": 1230, "loss": 0.2614, "lr": 2.240639932921966e-05, "epoch": 2.571139240506329, "percentage": 51.54, "elapsed_time": "15:01:45", "remaining_time": "14:07:42"}
|
| 1176 |
+
{"current_steps": 542, "total_steps": 1230, "loss": 0.2496, "lr": 2.7450012013938648e-05, "epoch": 2.198481012658228, "percentage": 44.07, "elapsed_time": "12:50:46", "remaining_time": "16:18:24"}
|
| 1177 |
+
{"current_steps": 543, "total_steps": 1230, "loss": 0.239, "lr": 2.739730822017673e-05, "epoch": 2.2025316455696204, "percentage": 44.15, "elapsed_time": "12:51:58", "remaining_time": "16:16:41"}
|
| 1178 |
+
{"current_steps": 635, "total_steps": 1230, "loss": 0.2597, "lr": 2.2350043382056995e-05, "epoch": 2.5751898734177217, "percentage": 51.63, "elapsed_time": "15:03:10", "remaining_time": "14:06:16"}
|
| 1179 |
+
{"current_steps": 544, "total_steps": 1230, "loss": 0.237, "lr": 2.7344544849511355e-05, "epoch": 2.2065822784810125, "percentage": 44.23, "elapsed_time": "12:53:26", "remaining_time": "16:15:19"}
|
| 1180 |
+
{"current_steps": 636, "total_steps": 1230, "loss": 0.258, "lr": 2.2293668507968015e-05, "epoch": 2.579240506329114, "percentage": 51.71, "elapsed_time": "15:04:37", "remaining_time": "14:04:52"}
|
| 1181 |
+
{"current_steps": 637, "total_steps": 1230, "loss": 0.239, "lr": 2.2237275160988186e-05, "epoch": 2.5832911392405062, "percentage": 51.79, "elapsed_time": "15:05:45", "remaining_time": "14:03:11"}
|
| 1182 |
+
{"current_steps": 545, "total_steps": 1230, "loss": 0.2605, "lr": 2.7291722326891456e-05, "epoch": 2.210632911392405, "percentage": 44.31, "elapsed_time": "12:54:40", "remaining_time": "16:13:40"}
|
| 1183 |
+
{"current_steps": 546, "total_steps": 1230, "loss": 0.2481, "lr": 2.723884107774236e-05, "epoch": 2.2146835443037975, "percentage": 44.39, "elapsed_time": "12:55:54", "remaining_time": "16:12:01"}
|
| 1184 |
+
{"current_steps": 638, "total_steps": 1230, "loss": 0.2682, "lr": 2.2180863795301787e-05, "epoch": 2.5873417721518988, "percentage": 51.87, "elapsed_time": "15:07:22", "remaining_time": "14:01:56"}
|
| 1185 |
+
{"current_steps": 547, "total_steps": 1230, "loss": 0.2721, "lr": 2.718590152796239e-05, "epoch": 2.21873417721519, "percentage": 44.47, "elapsed_time": "12:57:24", "remaining_time": "16:10:41"}
|
| 1186 |
+
{"current_steps": 639, "total_steps": 1230, "loss": 0.2299, "lr": 2.212443486523819e-05, "epoch": 2.5913924050632913, "percentage": 51.95, "elapsed_time": "15:08:42", "remaining_time": "14:00:26"}
|
| 1187 |
+
{"current_steps": 548, "total_steps": 1230, "loss": 0.2209, "lr": 2.71329041039194e-05, "epoch": 2.222784810126582, "percentage": 44.55, "elapsed_time": "12:58:23", "remaining_time": "16:08:43"}
|
| 1188 |
+
{"current_steps": 640, "total_steps": 1230, "loss": 0.2457, "lr": 2.2067988825268243e-05, "epoch": 2.5954430379746833, "percentage": 52.03, "elapsed_time": "15:09:50", "remaining_time": "13:58:45"}
|
| 1189 |
+
{"current_steps": 549, "total_steps": 1230, "loss": 0.2344, "lr": 2.7079849232447357e-05, "epoch": 2.2268354430379746, "percentage": 44.63, "elapsed_time": "12:59:48", "remaining_time": "16:07:18"}
|
| 1190 |
+
{"current_steps": 641, "total_steps": 1230, "loss": 0.2336, "lr": 2.2011526130000596e-05, "epoch": 2.599493670886076, "percentage": 52.11, "elapsed_time": "15:11:09", "remaining_time": "13:57:14"}
|
| 1191 |
+
{"current_steps": 550, "total_steps": 1230, "loss": 0.251, "lr": 2.7026737340842895e-05, "epoch": 2.230886075949367, "percentage": 44.72, "elapsed_time": "13:01:05", "remaining_time": "16:05:42"}
|
| 1192 |
+
{"current_steps": 642, "total_steps": 1230, "loss": 0.25, "lr": 2.1955047234178038e-05, "epoch": 2.6035443037974684, "percentage": 52.2, "elapsed_time": "15:12:27", "remaining_time": "13:55:42"}
|
| 1193 |
+
{"current_steps": 551, "total_steps": 1230, "loss": 0.2499, "lr": 2.697356885686189e-05, "epoch": 2.2349367088607597, "percentage": 44.8, "elapsed_time": "13:02:25", "remaining_time": "16:04:10"}
|
| 1194 |
+
{"current_steps": 643, "total_steps": 1230, "loss": 0.2578, "lr": 2.1898552592673825e-05, "epoch": 2.607594936708861, "percentage": 52.28, "elapsed_time": "15:14:06", "remaining_time": "13:54:29"}
|
| 1195 |
+
{"current_steps": 552, "total_steps": 1230, "loss": 0.229, "lr": 2.6920344208716014e-05, "epoch": 2.2389873417721518, "percentage": 44.88, "elapsed_time": "13:03:35", "remaining_time": "16:02:27"}
|
| 1196 |
+
{"current_steps": 644, "total_steps": 1230, "loss": 0.24, "lr": 2.184204266048803e-05, "epoch": 2.6116455696202534, "percentage": 52.36, "elapsed_time": "15:15:29", "remaining_time": "13:53:02"}
|
| 1197 |
+
{"current_steps": 553, "total_steps": 1230, "loss": 0.2497, "lr": 2.6867063825069252e-05, "epoch": 2.2430379746835443, "percentage": 44.96, "elapsed_time": "13:04:46", "remaining_time": "16:00:44"}
|
| 1198 |
+
{"current_steps": 645, "total_steps": 1230, "loss": 0.2713, "lr": 2.1785517892743887e-05, "epoch": 2.6156962025316455, "percentage": 52.44, "elapsed_time": "15:16:53", "remaining_time": "13:51:35"}
|
| 1199 |
+
{"current_steps": 554, "total_steps": 1230, "loss": 0.2647, "lr": 2.6813728135034494e-05, "epoch": 2.247088607594937, "percentage": 45.04, "elapsed_time": "13:06:13", "remaining_time": "15:59:21"}
|
| 1200 |
+
{"current_steps": 646, "total_steps": 1230, "loss": 0.2637, "lr": 2.17289787446841e-05, "epoch": 2.619746835443038, "percentage": 52.52, "elapsed_time": "15:18:09", "remaining_time": "13:50:02"}
|
| 1201 |
+
{"current_steps": 555, "total_steps": 1230, "loss": 0.2324, "lr": 2.6760337568170056e-05, "epoch": 2.2511392405063293, "percentage": 45.12, "elapsed_time": "13:07:27", "remaining_time": "15:57:43"}
|
| 1202 |
+
{"current_steps": 647, "total_steps": 1230, "loss": 0.2522, "lr": 2.1672425671667198e-05, "epoch": 2.6237974683544305, "percentage": 52.6, "elapsed_time": "15:19:40", "remaining_time": "13:48:42"}
|
| 1203 |
+
{"current_steps": 556, "total_steps": 1230, "loss": 0.2349, "lr": 2.6706892554476226e-05, "epoch": 2.2551898734177214, "percentage": 45.2, "elapsed_time": "13:08:38", "remaining_time": "15:56:01"}
|
| 1204 |
+
{"current_steps": 648, "total_steps": 1230, "loss": 0.2155, "lr": 2.161585912916385e-05, "epoch": 2.6278481012658226, "percentage": 52.68, "elapsed_time": "15:20:44", "remaining_time": "13:46:57"}
|
| 1205 |
+
{"current_steps": 557, "total_steps": 1230, "loss": 0.2365, "lr": 2.6653393524391795e-05, "epoch": 2.259240506329114, "percentage": 45.28, "elapsed_time": "13:10:05", "remaining_time": "15:54:38"}
|
| 1206 |
+
{"current_steps": 649, "total_steps": 1230, "loss": 0.2205, "lr": 2.1559279572753214e-05, "epoch": 2.631898734177215, "percentage": 52.76, "elapsed_time": "15:22:01", "remaining_time": "13:45:24"}
|
| 1207 |
+
{"current_steps": 558, "total_steps": 1230, "loss": 0.2465, "lr": 2.6599840908790592e-05, "epoch": 2.2632911392405064, "percentage": 45.37, "elapsed_time": "13:11:27", "remaining_time": "15:53:09"}
|
| 1208 |
+
{"current_steps": 650, "total_steps": 1230, "loss": 0.2759, "lr": 2.1502687458119268e-05, "epoch": 2.6359493670886076, "percentage": 52.85, "elapsed_time": "15:23:37", "remaining_time": "13:44:09"}
|
| 1209 |
+
{"current_steps": 559, "total_steps": 1230, "loss": 0.2576, "lr": 2.6546235138978028e-05, "epoch": 2.267341772151899, "percentage": 45.45, "elapsed_time": "13:12:57", "remaining_time": "15:51:49"}
|
| 1210 |
+
{"current_steps": 651, "total_steps": 1230, "loss": 0.2499, "lr": 2.1446083241047116e-05, "epoch": 2.64, "percentage": 52.93, "elapsed_time": "15:24:56", "remaining_time": "13:42:38"}
|
| 1211 |
+
{"current_steps": 560, "total_steps": 1230, "loss": 0.2533, "lr": 2.6492576646687597e-05, "epoch": 2.271392405063291, "percentage": 45.53, "elapsed_time": "13:14:28", "remaining_time": "15:50:32"}
|
| 1212 |
+
{"current_steps": 652, "total_steps": 1230, "loss": 0.2557, "lr": 2.1389467377419333e-05, "epoch": 2.6440506329113926, "percentage": 53.01, "elapsed_time": "15:26:26", "remaining_time": "13:41:17"}
|
| 1213 |
+
{"current_steps": 561, "total_steps": 1230, "loss": 0.2463, "lr": 2.6438865864077425e-05, "epoch": 2.2754430379746835, "percentage": 45.61, "elapsed_time": "13:15:47", "remaining_time": "15:48:58"}
|
| 1214 |
+
{"current_steps": 653, "total_steps": 1230, "loss": 0.2468, "lr": 2.133284032321232e-05, "epoch": 2.6481012658227847, "percentage": 53.09, "elapsed_time": "15:27:45", "remaining_time": "13:39:46"}
|
| 1215 |
+
{"current_steps": 562, "total_steps": 1230, "loss": 0.2377, "lr": 2.6385103223726766e-05, "epoch": 2.279493670886076, "percentage": 45.69, "elapsed_time": "13:16:51", "remaining_time": "15:47:09"}
|
| 1216 |
+
{"current_steps": 654, "total_steps": 1230, "loss": 0.2494, "lr": 2.1276202534492566e-05, "epoch": 2.6521518987341772, "percentage": 53.17, "elapsed_time": "15:29:09", "remaining_time": "13:38:20"}
|
| 1217 |
+
{"current_steps": 563, "total_steps": 1230, "loss": 0.2345, "lr": 2.6331289158632537e-05, "epoch": 2.2835443037974685, "percentage": 45.77, "elapsed_time": "13:18:19", "remaining_time": "15:45:47"}
|
| 1218 |
+
{"current_steps": 655, "total_steps": 1230, "loss": 0.2602, "lr": 2.121955446741306e-05, "epoch": 2.6562025316455697, "percentage": 53.25, "elapsed_time": "15:30:37", "remaining_time": "13:36:57"}
|
| 1219 |
+
{"current_steps": 564, "total_steps": 1230, "loss": 0.2612, "lr": 2.6277424102205817e-05, "epoch": 2.2875949367088606, "percentage": 45.85, "elapsed_time": "13:19:45", "remaining_time": "15:44:23"}
|
| 1220 |
+
{"current_steps": 656, "total_steps": 1230, "loss": 0.2113, "lr": 2.1162896578209517e-05, "epoch": 2.660253164556962, "percentage": 53.33, "elapsed_time": "15:31:51", "remaining_time": "13:35:22"}
|
| 1221 |
+
{"current_steps": 565, "total_steps": 1230, "loss": 0.2518, "lr": 2.6223508488268374e-05, "epoch": 2.291645569620253, "percentage": 45.93, "elapsed_time": "13:21:11", "remaining_time": "15:42:59"}
|
| 1222 |
+
{"current_steps": 657, "total_steps": 1230, "loss": 0.2569, "lr": 2.1106229323196813e-05, "epoch": 2.6643037974683543, "percentage": 53.41, "elapsed_time": "15:33:28", "remaining_time": "13:34:07"}
|
| 1223 |
+
{"current_steps": 566, "total_steps": 1230, "loss": 0.2513, "lr": 2.6169542751049148e-05, "epoch": 2.2956962025316456, "percentage": 46.02, "elapsed_time": "13:22:43", "remaining_time": "15:41:42"}
|
| 1224 |
+
{"current_steps": 658, "total_steps": 1230, "loss": 0.2692, "lr": 2.1049553158765214e-05, "epoch": 2.668354430379747, "percentage": 53.5, "elapsed_time": "15:34:58", "remaining_time": "13:32:46"}
|
| 1225 |
+
{"current_steps": 567, "total_steps": 1230, "loss": 0.2716, "lr": 2.6115527325180754e-05, "epoch": 2.299746835443038, "percentage": 46.1, "elapsed_time": "13:24:14", "remaining_time": "15:40:25"}
|
| 1226 |
+
{"current_steps": 659, "total_steps": 1230, "loss": 0.2427, "lr": 2.0992868541376764e-05, "epoch": 2.6724050632911394, "percentage": 53.58, "elapsed_time": "15:36:16", "remaining_time": "13:31:15"}
|
| 1227 |
+
{"current_steps": 568, "total_steps": 1230, "loss": 0.2445, "lr": 2.606146264569603e-05, "epoch": 2.3037974683544302, "percentage": 46.18, "elapsed_time": "13:25:48", "remaining_time": "15:39:09"}
|
| 1228 |
+
{"current_steps": 660, "total_steps": 1230, "loss": 0.24, "lr": 2.093617592756158e-05, "epoch": 2.676455696202532, "percentage": 53.66, "elapsed_time": "15:37:38", "remaining_time": "13:29:46"}
|
| 1229 |
+
{"current_steps": 569, "total_steps": 1230, "loss": 0.2465, "lr": 2.6007349148024447e-05, "epoch": 2.3078481012658227, "percentage": 46.26, "elapsed_time": "13:27:08", "remaining_time": "15:37:38"}
|
| 1230 |
+
{"current_steps": 661, "total_steps": 1230, "loss": 0.2541, "lr": 2.0879475773914167e-05, "epoch": 2.680506329113924, "percentage": 53.74, "elapsed_time": "15:38:58", "remaining_time": "13:28:16"}
|
| 1231 |
+
{"current_steps": 570, "total_steps": 1230, "loss": 0.2434, "lr": 2.5953187267988694e-05, "epoch": 2.3118987341772153, "percentage": 46.34, "elapsed_time": "13:28:29", "remaining_time": "15:36:09"}
|
| 1232 |
+
{"current_steps": 662, "total_steps": 1230, "loss": 0.2383, "lr": 2.082276853708978e-05, "epoch": 2.6845569620253165, "percentage": 53.82, "elapsed_time": "15:40:20", "remaining_time": "13:26:49"}
|
| 1233 |
+
{"current_steps": 571, "total_steps": 1230, "loss": 0.2547, "lr": 2.5898977441801097e-05, "epoch": 2.3159493670886078, "percentage": 46.42, "elapsed_time": "13:29:48", "remaining_time": "15:34:36"}
|
| 1234 |
+
{"current_steps": 663, "total_steps": 1230, "loss": 0.252, "lr": 2.076605467380071e-05, "epoch": 2.688607594936709, "percentage": 53.9, "elapsed_time": "15:41:54", "remaining_time": "13:25:31"}
|
| 1235 |
+
{"current_steps": 572, "total_steps": 1230, "loss": 0.2815, "lr": 2.584472010606015e-05, "epoch": 2.32, "percentage": 46.5, "elapsed_time": "13:31:38", "remaining_time": "15:33:40"}
|
| 1236 |
+
{"current_steps": 664, "total_steps": 1230, "loss": 0.2428, "lr": 2.0709334640812613e-05, "epoch": 2.692658227848101, "percentage": 53.98, "elapsed_time": "15:43:08", "remaining_time": "13:23:56"}
|
| 1237 |
+
{"current_steps": 573, "total_steps": 1230, "loss": 0.2385, "lr": 2.5790415697746976e-05, "epoch": 2.3240506329113924, "percentage": 46.59, "elapsed_time": "13:32:49", "remaining_time": "15:31:58"}
|
| 1238 |
+
{"current_steps": 665, "total_steps": 1230, "loss": 0.2638, "lr": 2.0652608894940824e-05, "epoch": 2.6967088607594936, "percentage": 54.07, "elapsed_time": "15:44:41", "remaining_time": "13:22:38"}
|
| 1239 |
+
{"current_steps": 574, "total_steps": 1230, "loss": 0.242, "lr": 2.5736064654221808e-05, "epoch": 2.328101265822785, "percentage": 46.67, "elapsed_time": "13:34:01", "remaining_time": "15:30:18"}
|
| 1240 |
+
{"current_steps": 666, "total_steps": 1230, "loss": 0.239, "lr": 2.0595877893046722e-05, "epoch": 2.700759493670886, "percentage": 54.15, "elapsed_time": "15:46:09", "remaining_time": "13:21:15"}
|
| 1241 |
+
{"current_steps": 575, "total_steps": 1230, "loss": 0.236, "lr": 2.568166741322048e-05, "epoch": 2.3321518987341774, "percentage": 46.75, "elapsed_time": "13:35:15", "remaining_time": "15:28:40"}
|
| 1242 |
+
{"current_steps": 667, "total_steps": 1230, "loss": 0.2559, "lr": 2.0539142092033985e-05, "epoch": 2.7048101265822786, "percentage": 54.23, "elapsed_time": "15:47:32", "remaining_time": "13:19:47"}
|
| 1243 |
+
{"current_steps": 576, "total_steps": 1230, "loss": 0.2654, "lr": 2.56272244128509e-05, "epoch": 2.3362025316455695, "percentage": 46.83, "elapsed_time": "13:36:44", "remaining_time": "15:27:20"}
|
| 1244 |
+
{"current_steps": 668, "total_steps": 1230, "loss": 0.2575, "lr": 2.048240194884496e-05, "epoch": 2.708860759493671, "percentage": 54.31, "elapsed_time": "15:48:49", "remaining_time": "13:18:15"}
|
| 1245 |
+
{"current_steps": 577, "total_steps": 1230, "loss": 0.2458, "lr": 2.55727360915895e-05, "epoch": 2.340253164556962, "percentage": 46.91, "elapsed_time": "13:38:04", "remaining_time": "15:25:49"}
|
| 1246 |
+
{"current_steps": 669, "total_steps": 1230, "loss": 0.2547, "lr": 2.042565792045695e-05, "epoch": 2.712911392405063, "percentage": 54.39, "elapsed_time": "15:50:25", "remaining_time": "13:16:59"}
|
| 1247 |
+
{"current_steps": 578, "total_steps": 1230, "loss": 0.2596, "lr": 2.5518202888277734e-05, "epoch": 2.3443037974683545, "percentage": 46.99, "elapsed_time": "13:39:22", "remaining_time": "15:24:17"}
|
| 1248 |
+
{"current_steps": 670, "total_steps": 1230, "loss": 0.2727, "lr": 2.036891046387857e-05, "epoch": 2.7169620253164557, "percentage": 54.47, "elapsed_time": "15:51:54", "remaining_time": "13:15:37"}
|
| 1249 |
+
{"current_steps": 579, "total_steps": 1230, "loss": 0.2492, "lr": 2.5463625242118523e-05, "epoch": 2.348354430379747, "percentage": 47.07, "elapsed_time": "13:40:58", "remaining_time": "15:23:03"}
|
| 1250 |
+
{"current_steps": 671, "total_steps": 1230, "loss": 0.2466, "lr": 2.0312160036146036e-05, "epoch": 2.721012658227848, "percentage": 54.55, "elapsed_time": "15:53:16", "remaining_time": "13:14:09"}
|
| 1251 |
+
{"current_steps": 580, "total_steps": 1230, "loss": 0.2588, "lr": 2.5409003592672723e-05, "epoch": 2.352405063291139, "percentage": 47.15, "elapsed_time": "13:42:25", "remaining_time": "15:21:40"}
|
| 1252 |
+
{"current_steps": 672, "total_steps": 1230, "loss": 0.2457, "lr": 2.025540709431948e-05, "epoch": 2.7250632911392403, "percentage": 54.63, "elapsed_time": "15:54:32", "remaining_time": "13:12:36"}
|
| 1253 |
+
{"current_steps": 581, "total_steps": 1230, "loss": 0.2525, "lr": 2.535433837985559e-05, "epoch": 2.3564556962025316, "percentage": 47.24, "elapsed_time": "13:43:33", "remaining_time": "15:19:56"}
|
| 1254 |
+
{"current_steps": 673, "total_steps": 1230, "loss": 0.2651, "lr": 2.0198652095479298e-05, "epoch": 2.729113924050633, "percentage": 54.72, "elapsed_time": "15:55:55", "remaining_time": "13:11:09"}
|
| 1255 |
+
{"current_steps": 582, "total_steps": 1230, "loss": 0.2619, "lr": 2.529963004393324e-05, "epoch": 2.360506329113924, "percentage": 47.32, "elapsed_time": "13:45:00", "remaining_time": "15:18:33"}
|
| 1256 |
+
{"current_steps": 674, "total_steps": 1230, "loss": 0.2399, "lr": 2.014189549672245e-05, "epoch": 2.7331645569620253, "percentage": 54.8, "elapsed_time": "15:57:22", "remaining_time": "13:09:45"}
|
| 1257 |
+
{"current_steps": 583, "total_steps": 1230, "loss": 0.2418, "lr": 2.524487902551908e-05, "epoch": 2.3645569620253166, "percentage": 47.4, "elapsed_time": "13:46:18", "remaining_time": "15:17:00"}
|
| 1258 |
+
{"current_steps": 675, "total_steps": 1230, "loss": 0.2495, "lr": 2.0085137755158776e-05, "epoch": 2.737215189873418, "percentage": 54.88, "elapsed_time": "15:58:29", "remaining_time": "13:08:05"}
|
| 1259 |
+
{"current_steps": 584, "total_steps": 1230, "loss": 0.2422, "lr": 2.519008576557029e-05, "epoch": 2.3686075949367087, "percentage": 47.48, "elapsed_time": "13:47:38", "remaining_time": "15:15:29"}
|
| 1260 |
+
{"current_steps": 676, "total_steps": 1230, "loss": 0.242, "lr": 2.0028379327907327e-05, "epoch": 2.7412658227848103, "percentage": 54.96, "elapsed_time": "15:59:41", "remaining_time": "13:06:29"}
|
| 1261 |
+
{"current_steps": 585, "total_steps": 1230, "loss": 0.2868, "lr": 2.5135250705384254e-05, "epoch": 2.372658227848101, "percentage": 47.56, "elapsed_time": "13:49:21", "remaining_time": "15:14:25"}
|
| 1262 |
+
{"current_steps": 677, "total_steps": 1230, "loss": 0.2566, "lr": 1.9971620672092676e-05, "epoch": 2.7453164556962024, "percentage": 55.04, "elapsed_time": "16:01:04", "remaining_time": "13:05:02"}
|
| 1263 |
+
{"current_steps": 586, "total_steps": 1230, "loss": 0.2481, "lr": 2.5080374286595007e-05, "epoch": 2.3767088607594937, "percentage": 47.64, "elapsed_time": "13:50:55", "remaining_time": "15:13:09"}
|
| 1264 |
+
{"current_steps": 678, "total_steps": 1230, "loss": 0.2329, "lr": 1.991486224484123e-05, "epoch": 2.749367088607595, "percentage": 55.12, "elapsed_time": "16:02:17", "remaining_time": "13:03:27"}
|
| 1265 |
+
{"current_steps": 587, "total_steps": 1230, "loss": 0.2563, "lr": 2.5025456951169677e-05, "epoch": 2.3807594936708862, "percentage": 47.72, "elapsed_time": "13:52:18", "remaining_time": "15:11:42"}
|
| 1266 |
+
{"current_steps": 679, "total_steps": 1230, "loss": 0.2582, "lr": 1.985810450327756e-05, "epoch": 2.7534177215189874, "percentage": 55.2, "elapsed_time": "16:03:38", "remaining_time": "13:01:58"}
|
| 1267 |
+
{"current_steps": 588, "total_steps": 1230, "loss": 0.2378, "lr": 2.4970499141404942e-05, "epoch": 2.3848101265822783, "percentage": 47.8, "elapsed_time": "13:53:28", "remaining_time": "15:10:00"}
|
| 1268 |
+
{"current_steps": 680, "total_steps": 1230, "loss": 0.2517, "lr": 1.9801347904520706e-05, "epoch": 2.7574683544303795, "percentage": 55.28, "elapsed_time": "16:05:16", "remaining_time": "13:00:44"}
|
| 1269 |
+
{"current_steps": 589, "total_steps": 1230, "loss": 0.2508, "lr": 2.491550129992345e-05, "epoch": 2.388860759493671, "percentage": 47.89, "elapsed_time": "13:54:55", "remaining_time": "15:08:38"}
|
| 1270 |
+
{"current_steps": 681, "total_steps": 1230, "loss": 0.2658, "lr": 1.974459290568053e-05, "epoch": 2.761518987341772, "percentage": 55.37, "elapsed_time": "16:06:48", "remaining_time": "12:59:24"}
|
| 1271 |
+
{"current_steps": 590, "total_steps": 1230, "loss": 0.2597, "lr": 2.486046386967024e-05, "epoch": 2.3929113924050633, "percentage": 47.97, "elapsed_time": "13:56:27", "remaining_time": "15:07:20"}
|
| 1272 |
+
{"current_steps": 682, "total_steps": 1230, "loss": 0.248, "lr": 1.968783996385397e-05, "epoch": 2.7655696202531646, "percentage": 55.45, "elapsed_time": "16:08:13", "remaining_time": "12:57:58"}
|
| 1273 |
+
{"current_steps": 591, "total_steps": 1230, "loss": 0.2517, "lr": 2.4805387293909214e-05, "epoch": 2.396962025316456, "percentage": 48.05, "elapsed_time": "13:57:54", "remaining_time": "15:05:58"}
|
| 1274 |
+
{"current_steps": 683, "total_steps": 1230, "loss": 0.2453, "lr": 1.963108953612143e-05, "epoch": 2.769620253164557, "percentage": 55.53, "elapsed_time": "16:09:37", "remaining_time": "12:56:33"}
|
| 1275 |
+
{"current_steps": 592, "total_steps": 1230, "loss": 0.2751, "lr": 2.4750272016219552e-05, "epoch": 2.401012658227848, "percentage": 48.13, "elapsed_time": "13:59:27", "remaining_time": "15:04:41"}
|
| 1276 |
+
{"current_steps": 684, "total_steps": 1230, "loss": 0.2358, "lr": 1.9574342079543056e-05, "epoch": 2.7736708860759496, "percentage": 55.61, "elapsed_time": "16:10:59", "remaining_time": "12:55:05"}
|
| 1277 |
+
{"current_steps": 593, "total_steps": 1230, "loss": 0.2345, "lr": 2.4695118480492114e-05, "epoch": 2.4050632911392404, "percentage": 48.21, "elapsed_time": "14:00:39", "remaining_time": "15:03:01"}
|
| 1278 |
+
{"current_steps": 685, "total_steps": 1230, "loss": 0.2324, "lr": 1.9517598051155046e-05, "epoch": 2.7777215189873417, "percentage": 55.69, "elapsed_time": "16:12:05", "remaining_time": "12:53:25"}
|
| 1279 |
+
{"current_steps": 594, "total_steps": 1230, "loss": 0.2605, "lr": 2.4639927130925898e-05, "epoch": 2.409113924050633, "percentage": 48.29, "elapsed_time": "14:02:10", "remaining_time": "15:01:42"}
|
| 1280 |
+
{"current_steps": 686, "total_steps": 1230, "loss": 0.2521, "lr": 1.9460857907966025e-05, "epoch": 2.781772151898734, "percentage": 55.77, "elapsed_time": "16:13:28", "remaining_time": "12:51:58"}
|
| 1281 |
+
{"current_steps": 595, "total_steps": 1230, "loss": 0.2427, "lr": 2.458469841202444e-05, "epoch": 2.4131645569620255, "percentage": 48.37, "elapsed_time": "14:03:23", "remaining_time": "15:00:04"}
|
| 1282 |
+
{"current_steps": 687, "total_steps": 1230, "loss": 0.2569, "lr": 1.9404122106953285e-05, "epoch": 2.7858227848101267, "percentage": 55.85, "elapsed_time": "16:15:07", "remaining_time": "12:50:43"}
|
| 1283 |
+
{"current_steps": 596, "total_steps": 1230, "loss": 0.2487, "lr": 2.452943276859226e-05, "epoch": 2.4172151898734175, "percentage": 48.46, "elapsed_time": "14:04:45", "remaining_time": "14:58:37"}
|
| 1284 |
+
{"current_steps": 688, "total_steps": 1230, "loss": 0.2471, "lr": 1.9347391105059176e-05, "epoch": 2.7898734177215188, "percentage": 55.93, "elapsed_time": "16:16:32", "remaining_time": "12:49:18"}
|
| 1285 |
+
{"current_steps": 597, "total_steps": 1230, "loss": 0.2448, "lr": 2.447413064573125e-05, "epoch": 2.42126582278481, "percentage": 48.54, "elapsed_time": "14:06:01", "remaining_time": "14:57:02"}
|
| 1286 |
+
{"current_steps": 689, "total_steps": 1230, "loss": 0.2784, "lr": 1.92906653591874e-05, "epoch": 2.7939240506329113, "percentage": 56.02, "elapsed_time": "16:18:05", "remaining_time": "12:47:59"}
|
| 1287 |
+
{"current_steps": 598, "total_steps": 1230, "loss": 0.2328, "lr": 2.4418792488837095e-05, "epoch": 2.4253164556962026, "percentage": 48.62, "elapsed_time": "14:07:02", "remaining_time": "14:55:11"}
|
| 1288 |
+
{"current_steps": 599, "total_steps": 1230, "loss": 0.2349, "lr": 2.4363418743595713e-05, "epoch": 2.429367088607595, "percentage": 48.7, "elapsed_time": "14:08:16", "remaining_time": "14:53:36"}
|
| 1289 |
+
{"current_steps": 690, "total_steps": 1230, "loss": 0.251, "lr": 1.9233945326199295e-05, "epoch": 2.797974683544304, "percentage": 56.1, "elapsed_time": "16:19:34", "remaining_time": "12:46:37"}
|
| 1290 |
+
{"current_steps": 600, "total_steps": 1230, "loss": 0.243, "lr": 2.430800985597963e-05, "epoch": 2.433417721518987, "percentage": 48.78, "elapsed_time": "14:09:42", "remaining_time": "14:52:11"}
|
| 1291 |
+
{"current_steps": 691, "total_steps": 1230, "loss": 0.2437, "lr": 1.917723146291022e-05, "epoch": 2.8020253164556963, "percentage": 56.18, "elapsed_time": "16:20:54", "remaining_time": "12:45:08"}
|
| 1292 |
+
{"current_steps": 692, "total_steps": 1230, "loss": 0.2474, "lr": 1.912052422608584e-05, "epoch": 2.806075949367089, "percentage": 56.26, "elapsed_time": "16:22:16", "remaining_time": "12:43:40"}
|
| 1293 |
+
{"current_steps": 601, "total_steps": 1230, "loss": 0.2731, "lr": 2.4252566272244415e-05, "epoch": 2.4374683544303797, "percentage": 48.86, "elapsed_time": "14:11:20", "remaining_time": "14:51:00"}
|
| 1294 |
+
{"current_steps": 693, "total_steps": 1230, "loss": 0.2452, "lr": 1.9063824072438428e-05, "epoch": 2.810126582278481, "percentage": 56.34, "elapsed_time": "16:23:46", "remaining_time": "12:42:19"}
|
| 1295 |
+
{"current_steps": 602, "total_steps": 1230, "loss": 0.2674, "lr": 2.4197088438925063e-05, "epoch": 2.441518987341772, "percentage": 48.94, "elapsed_time": "14:12:49", "remaining_time": "14:49:39"}
|
| 1296 |
+
{"current_steps": 694, "total_steps": 1230, "loss": 0.239, "lr": 1.9007131458623246e-05, "epoch": 2.8141772151898734, "percentage": 56.42, "elapsed_time": "16:25:06", "remaining_time": "12:40:49"}
|
| 1297 |
+
{"current_steps": 603, "total_steps": 1230, "loss": 0.2681, "lr": 2.4141576802832417e-05, "epoch": 2.4455696202531647, "percentage": 49.02, "elapsed_time": "14:14:22", "remaining_time": "14:48:22"}
|
| 1298 |
+
{"current_steps": 695, "total_steps": 1230, "loss": 0.2638, "lr": 1.895044684123479e-05, "epoch": 2.818227848101266, "percentage": 56.5, "elapsed_time": "16:26:35", "remaining_time": "12:39:28"}
|
| 1299 |
+
{"current_steps": 604, "total_steps": 1230, "loss": 0.2529, "lr": 2.408603181104957e-05, "epoch": 2.449620253164557, "percentage": 49.11, "elapsed_time": "14:15:55", "remaining_time": "14:47:05"}
|
| 1300 |
+
{"current_steps": 696, "total_steps": 1230, "loss": 0.2583, "lr": 1.8893770676803194e-05, "epoch": 2.822278481012658, "percentage": 56.59, "elapsed_time": "16:27:52", "remaining_time": "12:37:56"}
|
| 1301 |
+
{"current_steps": 605, "total_steps": 1230, "loss": 0.259, "lr": 2.4030453910928245e-05, "epoch": 2.4536708860759493, "percentage": 49.19, "elapsed_time": "14:17:09", "remaining_time": "14:45:29"}
|
| 1302 |
+
{"current_steps": 697, "total_steps": 1230, "loss": 0.252, "lr": 1.8837103421790486e-05, "epoch": 2.8263291139240505, "percentage": 56.67, "elapsed_time": "16:29:19", "remaining_time": "12:36:32"}
|
| 1303 |
+
{"current_steps": 606, "total_steps": 1230, "loss": 0.2288, "lr": 2.397484355008521e-05, "epoch": 2.457721518987342, "percentage": 49.27, "elapsed_time": "14:18:23", "remaining_time": "14:43:52"}
|
| 1304 |
+
{"current_steps": 607, "total_steps": 1230, "loss": 0.2517, "lr": 2.3919201176398662e-05, "epoch": 2.4617721518987343, "percentage": 49.35, "elapsed_time": "14:19:35", "remaining_time": "14:42:14"}
|
| 1305 |
+
{"current_steps": 698, "total_steps": 1230, "loss": 0.2646, "lr": 1.8780445532586952e-05, "epoch": 2.830379746835443, "percentage": 56.75, "elapsed_time": "16:30:57", "remaining_time": "12:35:17"}
|
| 1306 |
+
{"current_steps": 699, "total_steps": 1230, "loss": 0.2658, "lr": 1.872379746550743e-05, "epoch": 2.8344303797468355, "percentage": 56.83, "elapsed_time": "16:32:21", "remaining_time": "12:33:51"}
|
| 1307 |
+
{"current_steps": 608, "total_steps": 1230, "loss": 0.2812, "lr": 2.3863527238004633e-05, "epoch": 2.4658227848101264, "percentage": 49.43, "elapsed_time": "14:21:19", "remaining_time": "14:41:09"}
|
| 1308 |
+
{"current_steps": 700, "total_steps": 1230, "loss": 0.2289, "lr": 1.866715967678769e-05, "epoch": 2.838481012658228, "percentage": 56.91, "elapsed_time": "16:33:31", "remaining_time": "12:32:14"}
|
| 1309 |
+
{"current_steps": 609, "total_steps": 1230, "loss": 0.24, "lr": 2.380782218329337e-05, "epoch": 2.469873417721519, "percentage": 49.51, "elapsed_time": "14:22:43", "remaining_time": "14:39:43"}
|
| 1310 |
+
{"current_steps": 701, "total_steps": 1230, "loss": 0.2373, "lr": 1.861053262258067e-05, "epoch": 2.84253164556962, "percentage": 56.99, "elapsed_time": "16:34:45", "remaining_time": "12:30:40"}
|
| 1311 |
+
{"current_steps": 610, "total_steps": 1230, "loss": 0.2612, "lr": 2.3752086460905725e-05, "epoch": 2.4739240506329114, "percentage": 49.59, "elapsed_time": "14:24:21", "remaining_time": "14:38:31"}
|
| 1312 |
+
{"current_steps": 702, "total_steps": 1230, "loss": 0.2484, "lr": 1.8553916758952897e-05, "epoch": 2.8465822784810126, "percentage": 57.07, "elapsed_time": "16:36:19", "remaining_time": "12:29:22"}
|
| 1313 |
+
{"current_steps": 611, "total_steps": 1230, "loss": 0.2617, "lr": 2.3696320519729544e-05, "epoch": 2.477974683544304, "percentage": 49.67, "elapsed_time": "14:25:42", "remaining_time": "14:37:03"}
|
| 1314 |
+
{"current_steps": 703, "total_steps": 1230, "loss": 0.2638, "lr": 1.8497312541880735e-05, "epoch": 2.850632911392405, "percentage": 57.15, "elapsed_time": "16:37:43", "remaining_time": "12:27:56"}
|
| 1315 |
+
{"current_steps": 612, "total_steps": 1230, "loss": 0.2461, "lr": 2.3640524808896045e-05, "epoch": 2.482025316455696, "percentage": 49.76, "elapsed_time": "14:27:01", "remaining_time": "14:35:31"}
|
| 1316 |
+
{"current_steps": 704, "total_steps": 1230, "loss": 0.2268, "lr": 1.8440720427246786e-05, "epoch": 2.8546835443037972, "percentage": 57.24, "elapsed_time": "16:38:59", "remaining_time": "12:26:23"}
|
| 1317 |
+
{"current_steps": 613, "total_steps": 1230, "loss": 0.2398, "lr": 2.3584699777776222e-05, "epoch": 2.4860759493670885, "percentage": 49.84, "elapsed_time": "14:28:12", "remaining_time": "14:33:52"}
|
| 1318 |
+
{"current_steps": 705, "total_steps": 1230, "loss": 0.2287, "lr": 1.8384140870836157e-05, "epoch": 2.8587341772151897, "percentage": 57.32, "elapsed_time": "16:40:04", "remaining_time": "12:24:43"}
|
| 1319 |
+
{"current_steps": 614, "total_steps": 1230, "loss": 0.2474, "lr": 2.3528845875977195e-05, "epoch": 2.490126582278481, "percentage": 49.92, "elapsed_time": "14:29:33", "remaining_time": "14:32:23"}
|
| 1320 |
+
{"current_steps": 706, "total_steps": 1230, "loss": 0.2456, "lr": 1.8327574328332806e-05, "epoch": 2.8627848101265823, "percentage": 57.4, "elapsed_time": "16:41:18", "remaining_time": "12:23:10"}
|
| 1321 |
+
{"current_steps": 615, "total_steps": 1230, "loss": 0.256, "lr": 2.3472963553338614e-05, "epoch": 2.4941772151898736, "percentage": 50.0, "elapsed_time": "14:30:52", "remaining_time": "14:30:52"}
|
| 1322 |
+
{"current_steps": 707, "total_steps": 1230, "loss": 0.2514, "lr": 1.8271021255315906e-05, "epoch": 2.8668354430379748, "percentage": 57.48, "elapsed_time": "16:42:39", "remaining_time": "12:21:42"}
|
| 1323 |
+
{"current_steps": 616, "total_steps": 1230, "loss": 0.2488, "lr": 2.341705325992901e-05, "epoch": 2.4982278481012656, "percentage": 50.08, "elapsed_time": "14:32:09", "remaining_time": "14:29:19"}
|
| 1324 |
+
{"current_steps": 708, "total_steps": 1230, "loss": 0.2491, "lr": 1.8214482107256117e-05, "epoch": 2.8708860759493673, "percentage": 57.56, "elapsed_time": "16:44:18", "remaining_time": "12:20:28"}
|
| 1325 |
+
{"current_steps": 617, "total_steps": 1230, "loss": 0.2358, "lr": 2.336111544604222e-05, "epoch": 2.502278481012658, "percentage": 50.16, "elapsed_time": "14:33:21", "remaining_time": "14:27:42"}
|
| 1326 |
+
{"current_steps": 618, "total_steps": 1230, "loss": 0.2347, "lr": 2.33051505621937e-05, "epoch": 2.5063291139240507, "percentage": 50.24, "elapsed_time": "14:34:31", "remaining_time": "14:26:02"}
|
| 1327 |
+
{"current_steps": 709, "total_steps": 1230, "loss": 0.2435, "lr": 1.8157957339511968e-05, "epoch": 2.8749367088607594, "percentage": 57.64, "elapsed_time": "16:45:40", "remaining_time": "12:19:00"}
|
| 1328 |
+
{"current_steps": 619, "total_steps": 1230, "loss": 0.2344, "lr": 2.324915905911693e-05, "epoch": 2.510379746835443, "percentage": 50.33, "elapsed_time": "14:35:54", "remaining_time": "14:24:35"}
|
| 1329 |
+
{"current_steps": 710, "total_steps": 1230, "loss": 0.2663, "lr": 1.8101447407326182e-05, "epoch": 2.878987341772152, "percentage": 57.72, "elapsed_time": "16:47:17", "remaining_time": "12:17:44"}
|
| 1330 |
+
{"current_steps": 711, "total_steps": 1230, "loss": 0.2292, "lr": 1.8044952765821966e-05, "epoch": 2.8830379746835444, "percentage": 57.8, "elapsed_time": "16:48:38", "remaining_time": "12:16:15"}
|
| 1331 |
+
{"current_steps": 620, "total_steps": 1230, "loss": 0.2783, "lr": 2.319314138775977e-05, "epoch": 2.5144303797468357, "percentage": 50.41, "elapsed_time": "14:37:40", "remaining_time": "14:23:30"}
|
| 1332 |
+
{"current_steps": 712, "total_steps": 1230, "loss": 0.2359, "lr": 1.7988473869999407e-05, "epoch": 2.8870886075949365, "percentage": 57.89, "elapsed_time": "16:50:07", "remaining_time": "12:14:53"}
|
| 1333 |
+
{"current_steps": 621, "total_steps": 1230, "loss": 0.2538, "lr": 2.3137097999280856e-05, "epoch": 2.5184810126582278, "percentage": 50.49, "elapsed_time": "14:39:06", "remaining_time": "14:22:07"}
|
| 1334 |
+
{"current_steps": 713, "total_steps": 1230, "loss": 0.2646, "lr": 1.7932011174731764e-05, "epoch": 2.891139240506329, "percentage": 57.97, "elapsed_time": "16:51:44", "remaining_time": "12:13:37"}
|
| 1335 |
+
{"current_steps": 622, "total_steps": 1230, "loss": 0.236, "lr": 2.308102934504593e-05, "epoch": 2.5225316455696203, "percentage": 50.57, "elapsed_time": "14:40:35", "remaining_time": "14:20:46"}
|
| 1336 |
+
{"current_steps": 714, "total_steps": 1230, "loss": 0.252, "lr": 1.7875565134761817e-05, "epoch": 2.8951898734177215, "percentage": 58.05, "elapsed_time": "16:53:12", "remaining_time": "12:12:13"}
|
| 1337 |
+
{"current_steps": 623, "total_steps": 1230, "loss": 0.2596, "lr": 2.3024935876624222e-05, "epoch": 2.526582278481013, "percentage": 50.65, "elapsed_time": "14:42:06", "remaining_time": "14:19:27"}
|
| 1338 |
+
{"current_steps": 624, "total_steps": 1230, "loss": 0.2265, "lr": 2.2968818045784813e-05, "epoch": 2.530632911392405, "percentage": 50.73, "elapsed_time": "14:43:27", "remaining_time": "14:17:58"}
|
| 1339 |
+
{"current_steps": 715, "total_steps": 1230, "loss": 0.255, "lr": 1.7819136204698226e-05, "epoch": 2.899240506329114, "percentage": 58.13, "elapsed_time": "16:54:39", "remaining_time": "12:10:50"}
|
| 1340 |
+
{"current_steps": 625, "total_steps": 1230, "loss": 0.2586, "lr": 2.2912676304493006e-05, "epoch": 2.5346835443037974, "percentage": 50.81, "elapsed_time": "14:44:50", "remaining_time": "14:16:31"}
|
| 1341 |
+
{"current_steps": 716, "total_steps": 1230, "loss": 0.2505, "lr": 1.776272483901182e-05, "epoch": 2.9032911392405065, "percentage": 58.21, "elapsed_time": "16:56:00", "remaining_time": "12:09:22"}
|
| 1342 |
+
{"current_steps": 626, "total_steps": 1230, "loss": 0.2627, "lr": 2.2856511104906668e-05, "epoch": 2.53873417721519, "percentage": 50.89, "elapsed_time": "14:46:15", "remaining_time": "14:15:06"}
|
| 1343 |
+
{"current_steps": 717, "total_steps": 1230, "loss": 0.251, "lr": 1.7706331492031995e-05, "epoch": 2.9073417721518986, "percentage": 58.29, "elapsed_time": "16:57:36", "remaining_time": "12:08:04"}
|
| 1344 |
+
{"current_steps": 627, "total_steps": 1230, "loss": 0.2584, "lr": 2.2800322899372586e-05, "epoch": 2.5427848101265824, "percentage": 50.98, "elapsed_time": "14:47:30", "remaining_time": "14:13:31"}
|
| 1345 |
+
{"current_steps": 718, "total_steps": 1230, "loss": 0.2603, "lr": 1.764995661794301e-05, "epoch": 2.911392405063291, "percentage": 58.37, "elapsed_time": "16:58:54", "remaining_time": "12:06:34"}
|
| 1346 |
+
{"current_steps": 628, "total_steps": 1230, "loss": 0.2409, "lr": 2.2744112140422844e-05, "epoch": 2.546835443037975, "percentage": 51.06, "elapsed_time": "14:48:36", "remaining_time": "14:11:49"}
|
| 1347 |
+
{"current_steps": 719, "total_steps": 1230, "loss": 0.2409, "lr": 1.759360067078035e-05, "epoch": 2.9154430379746836, "percentage": 58.46, "elapsed_time": "17:00:18", "remaining_time": "12:05:08"}
|
| 1348 |
+
{"current_steps": 629, "total_steps": 1230, "loss": 0.2487, "lr": 2.2687879280771177e-05, "epoch": 2.550886075949367, "percentage": 51.14, "elapsed_time": "14:50:01", "remaining_time": "14:10:24"}
|
| 1349 |
+
{"current_steps": 720, "total_steps": 1230, "loss": 0.2763, "lr": 1.7537264104427064e-05, "epoch": 2.9194936708860757, "percentage": 58.54, "elapsed_time": "17:01:56", "remaining_time": "12:03:52"}
|
| 1350 |
+
{"current_steps": 630, "total_steps": 1230, "loss": 0.2356, "lr": 2.26316247733093e-05, "epoch": 2.5549367088607595, "percentage": 51.22, "elapsed_time": "14:51:11", "remaining_time": "14:08:45"}
|
| 1351 |
+
{"current_steps": 721, "total_steps": 1230, "loss": 0.2504, "lr": 1.748094737261012e-05, "epoch": 2.923544303797468, "percentage": 58.62, "elapsed_time": "17:03:22", "remaining_time": "12:02:28"}
|
| 1352 |
+
{"current_steps": 631, "total_steps": 1230, "loss": 0.2458, "lr": 2.257534907110328e-05, "epoch": 2.558987341772152, "percentage": 51.3, "elapsed_time": "14:52:44", "remaining_time": "14:07:28"}
|
| 1353 |
+
{"current_steps": 722, "total_steps": 1230, "loss": 0.247, "lr": 1.7424650928896726e-05, "epoch": 2.9275949367088607, "percentage": 58.7, "elapsed_time": "17:04:26", "remaining_time": "12:00:47"}
|
| 1354 |
+
{"current_steps": 632, "total_steps": 1230, "loss": 0.2489, "lr": 2.2519052627389882e-05, "epoch": 2.563037974683544, "percentage": 51.38, "elapsed_time": "14:54:20", "remaining_time": "14:06:13"}
|
| 1355 |
+
{"current_steps": 723, "total_steps": 1230, "loss": 0.2459, "lr": 1.7368375226690712e-05, "epoch": 2.9316455696202532, "percentage": 58.78, "elapsed_time": "17:05:52", "remaining_time": "11:59:23"}
|
| 1356 |
+
{"current_steps": 633, "total_steps": 1230, "loss": 0.2265, "lr": 2.246273589557294e-05, "epoch": 2.5670886075949366, "percentage": 51.46, "elapsed_time": "14:55:35", "remaining_time": "14:04:39"}
|
| 1357 |
+
{"current_steps": 724, "total_steps": 1230, "loss": 0.2234, "lr": 1.731212071922883e-05, "epoch": 2.9356962025316458, "percentage": 58.86, "elapsed_time": "17:07:05", "remaining_time": "11:57:49"}
|
| 1358 |
+
{"current_steps": 634, "total_steps": 1230, "loss": 0.2612, "lr": 2.240639932921966e-05, "epoch": 2.571139240506329, "percentage": 51.54, "elapsed_time": "14:56:55", "remaining_time": "14:03:09"}
|
| 1359 |
+
{"current_steps": 725, "total_steps": 1230, "loss": 0.2588, "lr": 1.7255887859577156e-05, "epoch": 2.939746835443038, "percentage": 58.94, "elapsed_time": "17:08:33", "remaining_time": "11:56:26"}
|
| 1360 |
+
{"current_steps": 635, "total_steps": 1230, "loss": 0.2598, "lr": 2.2350043382056995e-05, "epoch": 2.5751898734177217, "percentage": 51.63, "elapsed_time": "14:58:20", "remaining_time": "14:01:45"}
|
| 1361 |
+
{"current_steps": 726, "total_steps": 1230, "loss": 0.241, "lr": 1.7199677100627427e-05, "epoch": 2.9437974683544303, "percentage": 59.02, "elapsed_time": "17:09:50", "remaining_time": "11:54:56"}
|
| 1362 |
+
{"current_steps": 636, "total_steps": 1230, "loss": 0.2578, "lr": 2.2293668507968015e-05, "epoch": 2.579240506329114, "percentage": 51.71, "elapsed_time": "14:59:47", "remaining_time": "14:00:21"}
|
| 1363 |
+
{"current_steps": 727, "total_steps": 1230, "loss": 0.2511, "lr": 1.7143488895093343e-05, "epoch": 2.947848101265823, "percentage": 59.11, "elapsed_time": "17:11:17", "remaining_time": "11:53:32"}
|
| 1364 |
+
{"current_steps": 637, "total_steps": 1230, "loss": 0.2391, "lr": 2.2237275160988186e-05, "epoch": 2.5832911392405062, "percentage": 51.79, "elapsed_time": "15:00:54", "remaining_time": "13:58:41"}
|
| 1365 |
+
{"current_steps": 728, "total_steps": 1230, "loss": 0.2441, "lr": 1.7087323695506994e-05, "epoch": 2.951898734177215, "percentage": 59.19, "elapsed_time": "17:12:39", "remaining_time": "11:52:05"}
|
| 1366 |
+
{"current_steps": 638, "total_steps": 1230, "loss": 0.2687, "lr": 2.2180863795301787e-05, "epoch": 2.5873417721518988, "percentage": 51.87, "elapsed_time": "15:02:31", "remaining_time": "13:57:27"}
|
| 1367 |
+
{"current_steps": 729, "total_steps": 1230, "loss": 0.2429, "lr": 1.7031181954215194e-05, "epoch": 2.9559493670886074, "percentage": 59.27, "elapsed_time": "17:13:53", "remaining_time": "11:50:32"}
|
| 1368 |
+
{"current_steps": 639, "total_steps": 1230, "loss": 0.2297, "lr": 2.212443486523819e-05, "epoch": 2.5913924050632913, "percentage": 51.95, "elapsed_time": "15:03:51", "remaining_time": "13:55:57"}
|
| 1369 |
+
{"current_steps": 730, "total_steps": 1230, "loss": 0.2389, "lr": 1.6975064123375788e-05, "epoch": 2.96, "percentage": 59.35, "elapsed_time": "17:15:05", "remaining_time": "11:48:58"}
|
| 1370 |
+
{"current_steps": 640, "total_steps": 1230, "loss": 0.2458, "lr": 2.2067988825268243e-05, "epoch": 2.5954430379746833, "percentage": 52.03, "elapsed_time": "15:04:59", "remaining_time": "13:54:17"}
|
| 1371 |
+
{"current_steps": 731, "total_steps": 1230, "loss": 0.2476, "lr": 1.6918970654954084e-05, "epoch": 2.9640506329113925, "percentage": 59.43, "elapsed_time": "17:16:25", "remaining_time": "11:47:29"}
|
| 1372 |
+
{"current_steps": 641, "total_steps": 1230, "loss": 0.2336, "lr": 2.2011526130000596e-05, "epoch": 2.599493670886076, "percentage": 52.11, "elapsed_time": "15:06:17", "remaining_time": "13:52:46"}
|
| 1373 |
+
{"current_steps": 732, "total_steps": 1230, "loss": 0.2382, "lr": 1.686290200071915e-05, "epoch": 2.968101265822785, "percentage": 59.51, "elapsed_time": "17:17:34", "remaining_time": "11:45:53"}
|
| 1374 |
+
{"current_steps": 642, "total_steps": 1230, "loss": 0.2502, "lr": 2.1955047234178038e-05, "epoch": 2.6035443037974684, "percentage": 52.2, "elapsed_time": "15:07:36", "remaining_time": "13:51:15"}
|
| 1375 |
+
{"current_steps": 733, "total_steps": 1230, "loss": 0.2316, "lr": 1.6806858612240234e-05, "epoch": 2.972151898734177, "percentage": 59.59, "elapsed_time": "17:18:51", "remaining_time": "11:44:22"}
|
| 1376 |
+
{"current_steps": 734, "total_steps": 1230, "loss": 0.2146, "lr": 1.6750840940883078e-05, "epoch": 2.9762025316455696, "percentage": 59.67, "elapsed_time": "17:20:03", "remaining_time": "11:42:48"}
|
| 1377 |
+
{"current_steps": 643, "total_steps": 1230, "loss": 0.2572, "lr": 2.1898552592673825e-05, "epoch": 2.607594936708861, "percentage": 52.28, "elapsed_time": "15:09:14", "remaining_time": "13:50:03"}
|
| 1378 |
+
{"current_steps": 735, "total_steps": 1230, "loss": 0.2349, "lr": 1.6694849437806305e-05, "epoch": 2.980253164556962, "percentage": 59.76, "elapsed_time": "17:21:09", "remaining_time": "11:41:11"}
|
| 1379 |
+
{"current_steps": 644, "total_steps": 1230, "loss": 0.2398, "lr": 2.184204266048803e-05, "epoch": 2.6116455696202534, "percentage": 52.36, "elapsed_time": "15:10:37", "remaining_time": "13:48:36"}
|
| 1380 |
+
{"current_steps": 736, "total_steps": 1230, "loss": 0.2154, "lr": 1.663888455395778e-05, "epoch": 2.984303797468354, "percentage": 59.84, "elapsed_time": "17:22:30", "remaining_time": "11:39:43"}
|
| 1381 |
+
{"current_steps": 645, "total_steps": 1230, "loss": 0.2715, "lr": 2.1785517892743887e-05, "epoch": 2.6156962025316455, "percentage": 52.44, "elapsed_time": "15:12:00", "remaining_time": "13:47:10"}
|
| 1382 |
+
{"current_steps": 737, "total_steps": 1230, "loss": 0.2218, "lr": 1.6582946740070995e-05, "epoch": 2.9883544303797467, "percentage": 59.92, "elapsed_time": "17:23:35", "remaining_time": "11:38:05"}
|
| 1383 |
+
{"current_steps": 646, "total_steps": 1230, "loss": 0.2636, "lr": 2.17289787446841e-05, "epoch": 2.619746835443038, "percentage": 52.52, "elapsed_time": "15:13:17", "remaining_time": "13:45:37"}
|
| 1384 |
+
{"current_steps": 738, "total_steps": 1230, "loss": 0.2658, "lr": 1.6527036446661396e-05, "epoch": 2.992405063291139, "percentage": 60.0, "elapsed_time": "17:24:57", "remaining_time": "11:36:38"}
|
| 1385 |
+
{"current_steps": 647, "total_steps": 1230, "loss": 0.2521, "lr": 2.1672425671667198e-05, "epoch": 2.6237974683544305, "percentage": 52.6, "elapsed_time": "15:14:48", "remaining_time": "13:44:18"}
|
| 1386 |
+
{"current_steps": 739, "total_steps": 1230, "loss": 0.2414, "lr": 1.6471154124022818e-05, "epoch": 2.9964556962025317, "percentage": 60.08, "elapsed_time": "17:26:17", "remaining_time": "11:35:10"}
|
| 1387 |
+
{"current_steps": 648, "total_steps": 1230, "loss": 0.2156, "lr": 2.161585912916385e-05, "epoch": 2.6278481012658226, "percentage": 52.68, "elapsed_time": "15:15:51", "remaining_time": "13:42:34"}
|
| 1388 |
+
{"current_steps": 649, "total_steps": 1230, "loss": 0.2207, "lr": 2.1559279572753214e-05, "epoch": 2.631898734177215, "percentage": 52.76, "elapsed_time": "15:17:08", "remaining_time": "13:41:02"}
|
| 1389 |
+
{"current_steps": 740, "total_steps": 1230, "loss": 0.2256, "lr": 1.6415300222223788e-05, "epoch": 3.002025316455696, "percentage": 60.16, "elapsed_time": "17:28:47", "remaining_time": "11:34:27"}
|
| 1390 |
+
{"current_steps": 650, "total_steps": 1230, "loss": 0.2762, "lr": 2.1502687458119268e-05, "epoch": 2.6359493670886076, "percentage": 52.85, "elapsed_time": "15:18:42", "remaining_time": "13:39:46"}
|
| 1391 |
+
{"current_steps": 741, "total_steps": 1230, "loss": 0.1766, "lr": 1.6359475191103958e-05, "epoch": 3.0060759493670886, "percentage": 60.24, "elapsed_time": "17:30:07", "remaining_time": "11:32:59"}
|
| 1392 |
+
{"current_steps": 651, "total_steps": 1230, "loss": 0.2499, "lr": 2.1446083241047116e-05, "epoch": 2.64, "percentage": 52.93, "elapsed_time": "15:20:02", "remaining_time": "13:38:16"}
|
| 1393 |
+
{"current_steps": 742, "total_steps": 1230, "loss": 0.2079, "lr": 1.6303679480270466e-05, "epoch": 3.010126582278481, "percentage": 60.33, "elapsed_time": "17:31:29", "remaining_time": "11:31:33"}
|
| 1394 |
+
{"current_steps": 652, "total_steps": 1230, "loss": 0.256, "lr": 2.1389467377419333e-05, "epoch": 2.6440506329113926, "percentage": 53.01, "elapsed_time": "15:21:31", "remaining_time": "13:36:56"}
|
| 1395 |
+
{"current_steps": 743, "total_steps": 1230, "loss": 0.1763, "lr": 1.624791353909428e-05, "epoch": 3.0141772151898736, "percentage": 60.41, "elapsed_time": "17:32:46", "remaining_time": "11:30:02"}
|
| 1396 |
+
{"current_steps": 653, "total_steps": 1230, "loss": 0.2469, "lr": 2.133284032321232e-05, "epoch": 2.6481012658227847, "percentage": 53.09, "elapsed_time": "15:22:50", "remaining_time": "13:35:25"}
|
| 1397 |
+
{"current_steps": 744, "total_steps": 1230, "loss": 0.1671, "lr": 1.619217781670663e-05, "epoch": 3.0182278481012657, "percentage": 60.49, "elapsed_time": "17:34:06", "remaining_time": "11:28:34"}
|
| 1398 |
+
{"current_steps": 654, "total_steps": 1230, "loss": 0.249, "lr": 2.1276202534492566e-05, "epoch": 2.6521518987341772, "percentage": 53.17, "elapsed_time": "15:24:14", "remaining_time": "13:34:00"}
|
training_args.bin
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 7288
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:2b109346f835356baa84e067fdb9a82cdcae7d60dd3739e1d9b7b4e6b1eca559
|
| 3 |
size 7288
|