Training in progress, epoch 3
Browse files
model-00001-of-00004.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 4877660776
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:f7f4d90902fb002d5865856495bfd277f4feff26a0acf34825176d0fd085116e
|
| 3 |
size 4877660776
|
model-00002-of-00004.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 4932751008
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:389ee66f7c341a250cbcd3b5382d9a5f39da47caa358773cad842c4003ea1d32
|
| 3 |
size 4932751008
|
model-00003-of-00004.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 4330865200
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:837d3dfca5d9d28486fc70679d6bf6afa882c649759a86e9332d0c2f63a95058
|
| 3 |
size 4330865200
|
model-00004-of-00004.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 1089994880
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:151bc2c60750051fd7687c757e8563f753894a463e070ab440ec312996539aa7
|
| 3 |
size 1089994880
|
trainer_log.jsonl
CHANGED
|
@@ -223,3 +223,115 @@
|
|
| 223 |
{"current_steps": 223, "total_steps": 336, "loss": 0.4574, "lr": 2.4596606858352036e-05, "epoch": 1.9910714285714286, "percentage": 66.37, "elapsed_time": "3:41:17", "remaining_time": "1:52:08"}
|
| 224 |
{"current_steps": 224, "total_steps": 336, "loss": 0.4567, "lr": 2.421343175066095e-05, "epoch": 2.0, "percentage": 66.67, "elapsed_time": "3:42:16", "remaining_time": "1:51:08"}
|
| 225 |
{"current_steps": 225, "total_steps": 336, "loss": 0.4285, "lr": 2.3831964964736737e-05, "epoch": 2.0089285714285716, "percentage": 66.96, "elapsed_time": "3:44:57", "remaining_time": "1:50:58"}
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 223 |
{"current_steps": 223, "total_steps": 336, "loss": 0.4574, "lr": 2.4596606858352036e-05, "epoch": 1.9910714285714286, "percentage": 66.37, "elapsed_time": "3:41:17", "remaining_time": "1:52:08"}
|
| 224 |
{"current_steps": 224, "total_steps": 336, "loss": 0.4567, "lr": 2.421343175066095e-05, "epoch": 2.0, "percentage": 66.67, "elapsed_time": "3:42:16", "remaining_time": "1:51:08"}
|
| 225 |
{"current_steps": 225, "total_steps": 336, "loss": 0.4285, "lr": 2.3831964964736737e-05, "epoch": 2.0089285714285716, "percentage": 66.96, "elapsed_time": "3:44:57", "remaining_time": "1:50:58"}
|
| 226 |
+
{"current_steps": 226, "total_steps": 336, "loss": 0.4245, "lr": 2.3452247780482877e-05, "epoch": 2.017857142857143, "percentage": 67.26, "elapsed_time": "3:45:56", "remaining_time": "1:49:58"}
|
| 227 |
+
{"current_steps": 227, "total_steps": 336, "loss": 0.4143, "lr": 2.3074321288472135e-05, "epoch": 2.0267857142857144, "percentage": 67.56, "elapsed_time": "3:46:55", "remaining_time": "1:48:57"}
|
| 228 |
+
{"current_steps": 228, "total_steps": 336, "loss": 0.4182, "lr": 2.269822638549997e-05, "epoch": 2.0357142857142856, "percentage": 67.86, "elapsed_time": "3:47:54", "remaining_time": "1:47:57"}
|
| 229 |
+
{"current_steps": 229, "total_steps": 336, "loss": 0.4266, "lr": 2.2324003770158917e-05, "epoch": 2.044642857142857, "percentage": 68.15, "elapsed_time": "3:48:53", "remaining_time": "1:46:57"}
|
| 230 |
+
{"current_steps": 230, "total_steps": 336, "loss": 0.4163, "lr": 2.1951693938434517e-05, "epoch": 2.0535714285714284, "percentage": 68.45, "elapsed_time": "3:49:52", "remaining_time": "1:45:56"}
|
| 231 |
+
{"current_steps": 231, "total_steps": 336, "loss": 0.4202, "lr": 2.1581337179323062e-05, "epoch": 2.0625, "percentage": 68.75, "elapsed_time": "3:50:52", "remaining_time": "1:44:56"}
|
| 232 |
+
{"current_steps": 232, "total_steps": 336, "loss": 0.4204, "lr": 2.1212973570471758e-05, "epoch": 2.0714285714285716, "percentage": 69.05, "elapsed_time": "3:51:52", "remaining_time": "1:43:56"}
|
| 233 |
+
{"current_steps": 233, "total_steps": 336, "loss": 0.4255, "lr": 2.0846642973841833e-05, "epoch": 2.080357142857143, "percentage": 69.35, "elapsed_time": "3:52:50", "remaining_time": "1:42:55"}
|
| 234 |
+
{"current_steps": 234, "total_steps": 336, "loss": 0.4173, "lr": 2.0482385031394864e-05, "epoch": 2.0892857142857144, "percentage": 69.64, "elapsed_time": "3:53:50", "remaining_time": "1:41:55"}
|
| 235 |
+
{"current_steps": 235, "total_steps": 336, "loss": 0.4253, "lr": 2.0120239160803026e-05, "epoch": 2.0982142857142856, "percentage": 69.94, "elapsed_time": "3:54:49", "remaining_time": "1:40:55"}
|
| 236 |
+
{"current_steps": 236, "total_steps": 336, "loss": 0.4234, "lr": 1.9760244551183503e-05, "epoch": 2.107142857142857, "percentage": 70.24, "elapsed_time": "3:55:48", "remaining_time": "1:39:55"}
|
| 237 |
+
{"current_steps": 237, "total_steps": 336, "loss": 0.4241, "lr": 1.9402440158857775e-05, "epoch": 2.1160714285714284, "percentage": 70.54, "elapsed_time": "3:56:48", "remaining_time": "1:38:55"}
|
| 238 |
+
{"current_steps": 238, "total_steps": 336, "loss": 0.4174, "lr": 1.9046864703135958e-05, "epoch": 2.125, "percentage": 70.83, "elapsed_time": "3:57:48", "remaining_time": "1:37:55"}
|
| 239 |
+
{"current_steps": 239, "total_steps": 336, "loss": 0.4211, "lr": 1.8693556662126857e-05, "epoch": 2.1339285714285716, "percentage": 71.13, "elapsed_time": "3:58:47", "remaining_time": "1:36:55"}
|
| 240 |
+
{"current_steps": 240, "total_steps": 336, "loss": 0.4158, "lr": 1.8342554268574114e-05, "epoch": 2.142857142857143, "percentage": 71.43, "elapsed_time": "3:59:47", "remaining_time": "1:35:54"}
|
| 241 |
+
{"current_steps": 241, "total_steps": 336, "loss": 0.4164, "lr": 1.7993895505718907e-05, "epoch": 2.1517857142857144, "percentage": 71.73, "elapsed_time": "4:00:46", "remaining_time": "1:34:54"}
|
| 242 |
+
{"current_steps": 242, "total_steps": 336, "loss": 0.4213, "lr": 1.7647618103189632e-05, "epoch": 2.1607142857142856, "percentage": 72.02, "elapsed_time": "4:01:45", "remaining_time": "1:33:54"}
|
| 243 |
+
{"current_steps": 243, "total_steps": 336, "loss": 0.4194, "lr": 1.7303759532919066e-05, "epoch": 2.169642857142857, "percentage": 72.32, "elapsed_time": "4:02:44", "remaining_time": "1:32:54"}
|
| 244 |
+
{"current_steps": 244, "total_steps": 336, "loss": 0.4171, "lr": 1.6962357005089368e-05, "epoch": 2.1785714285714284, "percentage": 72.62, "elapsed_time": "4:03:43", "remaining_time": "1:31:53"}
|
| 245 |
+
{"current_steps": 245, "total_steps": 336, "loss": 0.4218, "lr": 1.6623447464105455e-05, "epoch": 2.1875, "percentage": 72.92, "elapsed_time": "4:04:42", "remaining_time": "1:30:53"}
|
| 246 |
+
{"current_steps": 246, "total_steps": 336, "loss": 0.4184, "lr": 1.628706758459709e-05, "epoch": 2.1964285714285716, "percentage": 73.21, "elapsed_time": "4:05:41", "remaining_time": "1:29:53"}
|
| 247 |
+
{"current_steps": 247, "total_steps": 336, "loss": 0.4233, "lr": 1.5953253767450214e-05, "epoch": 2.205357142857143, "percentage": 73.51, "elapsed_time": "4:06:40", "remaining_time": "1:28:53"}
|
| 248 |
+
{"current_steps": 248, "total_steps": 336, "loss": 0.4189, "lr": 1.5622042135867838e-05, "epoch": 2.2142857142857144, "percentage": 73.81, "elapsed_time": "4:07:39", "remaining_time": "1:27:52"}
|
| 249 |
+
{"current_steps": 249, "total_steps": 336, "loss": 0.4232, "lr": 1.5293468531461063e-05, "epoch": 2.2232142857142856, "percentage": 74.11, "elapsed_time": "4:08:37", "remaining_time": "1:26:52"}
|
| 250 |
+
{"current_steps": 250, "total_steps": 336, "loss": 0.4259, "lr": 1.4967568510370498e-05, "epoch": 2.232142857142857, "percentage": 74.4, "elapsed_time": "4:09:37", "remaining_time": "1:25:52"}
|
| 251 |
+
{"current_steps": 251, "total_steps": 336, "loss": 0.4181, "lr": 1.464437733941861e-05, "epoch": 2.2410714285714284, "percentage": 74.7, "elapsed_time": "4:10:36", "remaining_time": "1:24:51"}
|
| 252 |
+
{"current_steps": 252, "total_steps": 336, "loss": 0.4196, "lr": 1.4323929992293378e-05, "epoch": 2.25, "percentage": 75.0, "elapsed_time": "4:11:34", "remaining_time": "1:23:51"}
|
| 253 |
+
{"current_steps": 253, "total_steps": 336, "loss": 0.4218, "lr": 1.4006261145763657e-05, "epoch": 2.2589285714285716, "percentage": 75.3, "elapsed_time": "4:12:33", "remaining_time": "1:22:51"}
|
| 254 |
+
{"current_steps": 254, "total_steps": 336, "loss": 0.4179, "lr": 1.3691405175926705e-05, "epoch": 2.267857142857143, "percentage": 75.6, "elapsed_time": "4:13:32", "remaining_time": "1:21:51"}
|
| 255 |
+
{"current_steps": 255, "total_steps": 336, "loss": 0.426, "lr": 1.3379396154488142e-05, "epoch": 2.2767857142857144, "percentage": 75.89, "elapsed_time": "4:14:31", "remaining_time": "1:20:50"}
|
| 256 |
+
{"current_steps": 256, "total_steps": 336, "loss": 0.4154, "lr": 1.3070267845075026e-05, "epoch": 2.2857142857142856, "percentage": 76.19, "elapsed_time": "4:15:30", "remaining_time": "1:19:50"}
|
| 257 |
+
{"current_steps": 257, "total_steps": 336, "loss": 0.4154, "lr": 1.2764053699582145e-05, "epoch": 2.294642857142857, "percentage": 76.49, "elapsed_time": "4:16:28", "remaining_time": "1:18:50"}
|
| 258 |
+
{"current_steps": 258, "total_steps": 336, "loss": 0.4249, "lr": 1.2460786854552e-05, "epoch": 2.3035714285714284, "percentage": 76.79, "elapsed_time": "4:17:27", "remaining_time": "1:17:50"}
|
| 259 |
+
{"current_steps": 259, "total_steps": 336, "loss": 0.4215, "lr": 1.2160500127589057e-05, "epoch": 2.3125, "percentage": 77.08, "elapsed_time": "4:18:26", "remaining_time": "1:16:49"}
|
| 260 |
+
{"current_steps": 260, "total_steps": 336, "loss": 0.4221, "lr": 1.1863226013808392e-05, "epoch": 2.3214285714285716, "percentage": 77.38, "elapsed_time": "4:19:24", "remaining_time": "1:15:49"}
|
| 261 |
+
{"current_steps": 261, "total_steps": 336, "loss": 0.4197, "lr": 1.1568996682319304e-05, "epoch": 2.330357142857143, "percentage": 77.68, "elapsed_time": "4:20:23", "remaining_time": "1:14:49"}
|
| 262 |
+
{"current_steps": 262, "total_steps": 336, "loss": 0.4135, "lr": 1.1277843972744127e-05, "epoch": 2.3392857142857144, "percentage": 77.98, "elapsed_time": "4:21:22", "remaining_time": "1:13:49"}
|
| 263 |
+
{"current_steps": 263, "total_steps": 336, "loss": 0.413, "lr": 1.0989799391772835e-05, "epoch": 2.3482142857142856, "percentage": 78.27, "elapsed_time": "4:22:20", "remaining_time": "1:12:49"}
|
| 264 |
+
{"current_steps": 264, "total_steps": 336, "loss": 0.4211, "lr": 1.070489410975351e-05, "epoch": 2.357142857142857, "percentage": 78.57, "elapsed_time": "4:23:19", "remaining_time": "1:11:48"}
|
| 265 |
+
{"current_steps": 265, "total_steps": 336, "loss": 0.4199, "lr": 1.0423158957319331e-05, "epoch": 2.3660714285714284, "percentage": 78.87, "elapsed_time": "4:24:18", "remaining_time": "1:10:48"}
|
| 266 |
+
{"current_steps": 266, "total_steps": 336, "loss": 0.4212, "lr": 1.014462442205225e-05, "epoch": 2.375, "percentage": 79.17, "elapsed_time": "4:25:16", "remaining_time": "1:09:48"}
|
| 267 |
+
{"current_steps": 267, "total_steps": 336, "loss": 0.416, "lr": 9.869320645183861e-06, "epoch": 2.3839285714285716, "percentage": 79.46, "elapsed_time": "4:26:15", "remaining_time": "1:08:48"}
|
| 268 |
+
{"current_steps": 268, "total_steps": 336, "loss": 0.4174, "lr": 9.597277418333673e-06, "epoch": 2.392857142857143, "percentage": 79.76, "elapsed_time": "4:27:14", "remaining_time": "1:07:48"}
|
| 269 |
+
{"current_steps": 269, "total_steps": 336, "loss": 0.423, "lr": 9.328524180285226e-06, "epoch": 2.4017857142857144, "percentage": 80.06, "elapsed_time": "4:28:12", "remaining_time": "1:06:48"}
|
| 270 |
+
{"current_steps": 270, "total_steps": 336, "loss": 0.4247, "lr": 9.063090013800488e-06, "epoch": 2.4107142857142856, "percentage": 80.36, "elapsed_time": "4:29:11", "remaining_time": "1:05:48"}
|
| 271 |
+
{"current_steps": 271, "total_steps": 336, "loss": 0.4201, "lr": 8.80100364247265e-06, "epoch": 2.419642857142857, "percentage": 80.65, "elapsed_time": "4:30:10", "remaining_time": "1:04:48"}
|
| 272 |
+
{"current_steps": 272, "total_steps": 336, "loss": 0.4174, "lr": 8.542293427617853e-06, "epoch": 2.4285714285714284, "percentage": 80.95, "elapsed_time": "4:31:08", "remaining_time": "1:03:47"}
|
| 273 |
+
{"current_steps": 273, "total_steps": 336, "loss": 0.4177, "lr": 8.286987365206114e-06, "epoch": 2.4375, "percentage": 81.25, "elapsed_time": "4:32:07", "remaining_time": "1:02:47"}
|
| 274 |
+
{"current_steps": 274, "total_steps": 336, "loss": 0.4182, "lr": 8.035113082831776e-06, "epoch": 2.4464285714285716, "percentage": 81.55, "elapsed_time": "4:33:06", "remaining_time": "1:01:47"}
|
| 275 |
+
{"current_steps": 275, "total_steps": 336, "loss": 0.4217, "lr": 7.78669783672382e-06, "epoch": 2.455357142857143, "percentage": 81.85, "elapsed_time": "4:34:05", "remaining_time": "1:00:47"}
|
| 276 |
+
{"current_steps": 276, "total_steps": 336, "loss": 0.4224, "lr": 7.5417685087963855e-06, "epoch": 2.4642857142857144, "percentage": 82.14, "elapsed_time": "4:35:03", "remaining_time": "0:59:47"}
|
| 277 |
+
{"current_steps": 277, "total_steps": 336, "loss": 0.422, "lr": 7.300351603739759e-06, "epoch": 2.4732142857142856, "percentage": 82.44, "elapsed_time": "4:36:02", "remaining_time": "0:58:47"}
|
| 278 |
+
{"current_steps": 278, "total_steps": 336, "loss": 0.4182, "lr": 7.062473246152231e-06, "epoch": 2.482142857142857, "percentage": 82.74, "elapsed_time": "4:37:01", "remaining_time": "0:57:47"}
|
| 279 |
+
{"current_steps": 279, "total_steps": 336, "loss": 0.4185, "lr": 6.828159177713036e-06, "epoch": 2.4910714285714284, "percentage": 83.04, "elapsed_time": "4:37:59", "remaining_time": "0:56:47"}
|
| 280 |
+
{"current_steps": 280, "total_steps": 336, "loss": 0.4233, "lr": 6.597434754396763e-06, "epoch": 2.5, "percentage": 83.33, "elapsed_time": "4:38:58", "remaining_time": "0:55:47"}
|
| 281 |
+
{"current_steps": 281, "total_steps": 336, "loss": 0.4205, "lr": 6.370324943729498e-06, "epoch": 2.508928571428571, "percentage": 83.63, "elapsed_time": "4:39:57", "remaining_time": "0:54:47"}
|
| 282 |
+
{"current_steps": 282, "total_steps": 336, "loss": 0.4224, "lr": 6.146854322086984e-06, "epoch": 2.517857142857143, "percentage": 83.93, "elapsed_time": "4:40:55", "remaining_time": "0:53:47"}
|
| 283 |
+
{"current_steps": 283, "total_steps": 336, "loss": 0.4133, "lr": 5.9270470720351305e-06, "epoch": 2.5267857142857144, "percentage": 84.23, "elapsed_time": "4:41:54", "remaining_time": "0:52:47"}
|
| 284 |
+
{"current_steps": 284, "total_steps": 336, "loss": 0.4192, "lr": 5.7109269797131335e-06, "epoch": 2.5357142857142856, "percentage": 84.52, "elapsed_time": "4:42:53", "remaining_time": "0:51:47"}
|
| 285 |
+
{"current_steps": 285, "total_steps": 336, "loss": 0.4196, "lr": 5.498517432259487e-06, "epoch": 2.544642857142857, "percentage": 84.82, "elapsed_time": "4:43:51", "remaining_time": "0:50:47"}
|
| 286 |
+
{"current_steps": 286, "total_steps": 336, "loss": 0.4223, "lr": 5.2898414152811715e-06, "epoch": 2.553571428571429, "percentage": 85.12, "elapsed_time": "4:44:50", "remaining_time": "0:49:47"}
|
| 287 |
+
{"current_steps": 287, "total_steps": 336, "loss": 0.4207, "lr": 5.084921510366321e-06, "epoch": 2.5625, "percentage": 85.42, "elapsed_time": "4:45:49", "remaining_time": "0:48:47"}
|
| 288 |
+
{"current_steps": 288, "total_steps": 336, "loss": 0.4235, "lr": 4.883779892640532e-06, "epoch": 2.571428571428571, "percentage": 85.71, "elapsed_time": "4:46:47", "remaining_time": "0:47:47"}
|
| 289 |
+
{"current_steps": 289, "total_steps": 336, "loss": 0.4169, "lr": 4.686438328367287e-06, "epoch": 2.580357142857143, "percentage": 86.01, "elapsed_time": "4:47:46", "remaining_time": "0:46:48"}
|
| 290 |
+
{"current_steps": 290, "total_steps": 336, "loss": 0.4234, "lr": 4.492918172592489e-06, "epoch": 2.5892857142857144, "percentage": 86.31, "elapsed_time": "4:48:45", "remaining_time": "0:45:48"}
|
| 291 |
+
{"current_steps": 291, "total_steps": 336, "loss": 0.4139, "lr": 4.303240366833596e-06, "epoch": 2.5982142857142856, "percentage": 86.61, "elapsed_time": "4:49:43", "remaining_time": "0:44:48"}
|
| 292 |
+
{"current_steps": 292, "total_steps": 336, "loss": 0.4202, "lr": 4.117425436813438e-06, "epoch": 2.607142857142857, "percentage": 86.9, "elapsed_time": "4:50:42", "remaining_time": "0:43:48"}
|
| 293 |
+
{"current_steps": 293, "total_steps": 336, "loss": 0.4208, "lr": 3.935493490239046e-06, "epoch": 2.616071428571429, "percentage": 87.2, "elapsed_time": "4:51:40", "remaining_time": "0:42:48"}
|
| 294 |
+
{"current_steps": 294, "total_steps": 336, "loss": 0.4186, "lr": 3.7574642146257634e-06, "epoch": 2.625, "percentage": 87.5, "elapsed_time": "4:52:39", "remaining_time": "0:41:48"}
|
| 295 |
+
{"current_steps": 295, "total_steps": 336, "loss": 0.4237, "lr": 3.583356875166737e-06, "epoch": 2.633928571428571, "percentage": 87.8, "elapsed_time": "4:53:38", "remaining_time": "0:40:48"}
|
| 296 |
+
{"current_steps": 296, "total_steps": 336, "loss": 0.4154, "lr": 3.4131903126482045e-06, "epoch": 2.642857142857143, "percentage": 88.1, "elapsed_time": "4:54:37", "remaining_time": "0:39:48"}
|
| 297 |
+
{"current_steps": 297, "total_steps": 336, "loss": 0.4201, "lr": 3.2469829414106503e-06, "epoch": 2.6517857142857144, "percentage": 88.39, "elapsed_time": "4:55:35", "remaining_time": "0:38:48"}
|
| 298 |
+
{"current_steps": 298, "total_steps": 336, "loss": 0.4248, "lr": 3.0847527473561167e-06, "epoch": 2.6607142857142856, "percentage": 88.69, "elapsed_time": "4:56:34", "remaining_time": "0:37:49"}
|
| 299 |
+
{"current_steps": 299, "total_steps": 336, "loss": 0.415, "lr": 2.9265172860018754e-06, "epoch": 2.669642857142857, "percentage": 88.99, "elapsed_time": "4:57:33", "remaining_time": "0:36:49"}
|
| 300 |
+
{"current_steps": 300, "total_steps": 336, "loss": 0.4171, "lr": 2.7722936805807267e-06, "epoch": 2.678571428571429, "percentage": 89.29, "elapsed_time": "4:58:31", "remaining_time": "0:35:49"}
|
| 301 |
+
{"current_steps": 301, "total_steps": 336, "loss": 0.427, "lr": 2.622098620187963e-06, "epoch": 2.6875, "percentage": 89.58, "elapsed_time": "4:59:30", "remaining_time": "0:34:49"}
|
| 302 |
+
{"current_steps": 302, "total_steps": 336, "loss": 0.4198, "lr": 2.475948357975435e-06, "epoch": 2.696428571428571, "percentage": 89.88, "elapsed_time": "5:00:29", "remaining_time": "0:33:49"}
|
| 303 |
+
{"current_steps": 303, "total_steps": 336, "loss": 0.4219, "lr": 2.3338587093927245e-06, "epoch": 2.705357142857143, "percentage": 90.18, "elapsed_time": "5:01:27", "remaining_time": "0:32:49"}
|
| 304 |
+
{"current_steps": 304, "total_steps": 336, "loss": 0.4223, "lr": 2.195845050475698e-06, "epoch": 2.7142857142857144, "percentage": 90.48, "elapsed_time": "5:02:26", "remaining_time": "0:31:50"}
|
| 305 |
+
{"current_steps": 305, "total_steps": 336, "loss": 0.4184, "lr": 2.0619223161825942e-06, "epoch": 2.7232142857142856, "percentage": 90.77, "elapsed_time": "5:03:25", "remaining_time": "0:30:50"}
|
| 306 |
+
{"current_steps": 306, "total_steps": 336, "loss": 0.4179, "lr": 1.932104998777877e-06, "epoch": 2.732142857142857, "percentage": 91.07, "elapsed_time": "5:04:23", "remaining_time": "0:29:50"}
|
| 307 |
+
{"current_steps": 307, "total_steps": 336, "loss": 0.4184, "lr": 1.8064071462639798e-06, "epoch": 2.741071428571429, "percentage": 91.37, "elapsed_time": "5:05:22", "remaining_time": "0:28:50"}
|
| 308 |
+
{"current_steps": 308, "total_steps": 336, "loss": 0.4261, "lr": 1.684842360861092e-06, "epoch": 2.75, "percentage": 91.67, "elapsed_time": "5:06:20", "remaining_time": "0:27:50"}
|
| 309 |
+
{"current_steps": 309, "total_steps": 336, "loss": 0.4171, "lr": 1.5674237975352457e-06, "epoch": 2.758928571428571, "percentage": 91.96, "elapsed_time": "5:07:19", "remaining_time": "0:26:51"}
|
| 310 |
+
{"current_steps": 310, "total_steps": 336, "loss": 0.4192, "lr": 1.4541641625747428e-06, "epoch": 2.767857142857143, "percentage": 92.26, "elapsed_time": "5:08:18", "remaining_time": "0:25:51"}
|
| 311 |
+
{"current_steps": 311, "total_steps": 336, "loss": 0.4129, "lr": 1.3450757122151826e-06, "epoch": 2.7767857142857144, "percentage": 92.56, "elapsed_time": "5:09:16", "remaining_time": "0:24:51"}
|
| 312 |
+
{"current_steps": 312, "total_steps": 336, "loss": 0.4182, "lr": 1.2401702513131597e-06, "epoch": 2.7857142857142856, "percentage": 92.86, "elapsed_time": "5:10:15", "remaining_time": "0:23:51"}
|
| 313 |
+
{"current_steps": 313, "total_steps": 336, "loss": 0.4186, "lr": 1.1394591320688098e-06, "epoch": 2.794642857142857, "percentage": 93.15, "elapsed_time": "5:11:14", "remaining_time": "0:22:52"}
|
| 314 |
+
{"current_steps": 314, "total_steps": 336, "loss": 0.4263, "lr": 1.0429532527973695e-06, "epoch": 2.803571428571429, "percentage": 93.45, "elapsed_time": "5:12:13", "remaining_time": "0:21:52"}
|
| 315 |
+
{"current_steps": 315, "total_steps": 336, "loss": 0.4141, "lr": 9.50663056749801e-07, "epoch": 2.8125, "percentage": 93.75, "elapsed_time": "5:13:11", "remaining_time": "0:20:52"}
|
| 316 |
+
{"current_steps": 316, "total_steps": 336, "loss": 0.4192, "lr": 8.625985309827211e-07, "epoch": 2.821428571428571, "percentage": 94.05, "elapsed_time": "5:14:10", "remaining_time": "0:19:53"}
|
| 317 |
+
{"current_steps": 317, "total_steps": 336, "loss": 0.409, "lr": 7.787692052776363e-07, "epoch": 2.830357142857143, "percentage": 94.35, "elapsed_time": "5:15:08", "remaining_time": "0:18:53"}
|
| 318 |
+
{"current_steps": 318, "total_steps": 336, "loss": 0.4167, "lr": 6.991841511097175e-07, "epoch": 2.8392857142857144, "percentage": 94.64, "elapsed_time": "5:16:07", "remaining_time": "0:17:53"}
|
| 319 |
+
{"current_steps": 319, "total_steps": 336, "loss": 0.4191, "lr": 6.238519806661192e-07, "epoch": 2.8482142857142856, "percentage": 94.94, "elapsed_time": "5:17:06", "remaining_time": "0:16:53"}
|
| 320 |
+
{"current_steps": 320, "total_steps": 336, "loss": 0.4196, "lr": 5.527808459140449e-07, "epoch": 2.857142857142857, "percentage": 95.24, "elapsed_time": "5:18:05", "remaining_time": "0:15:54"}
|
| 321 |
+
{"current_steps": 321, "total_steps": 336, "loss": 0.4188, "lr": 4.859784377185639e-07, "epoch": 2.866071428571429, "percentage": 95.54, "elapsed_time": "5:19:04", "remaining_time": "0:14:54"}
|
| 322 |
+
{"current_steps": 322, "total_steps": 336, "loss": 0.4138, "lr": 4.2345198501038796e-07, "epoch": 2.875, "percentage": 95.83, "elapsed_time": "5:20:02", "remaining_time": "0:13:54"}
|
| 323 |
+
{"current_steps": 323, "total_steps": 336, "loss": 0.4231, "lr": 3.652082540035906e-07, "epoch": 2.883928571428571, "percentage": 96.13, "elapsed_time": "5:21:01", "remaining_time": "0:12:55"}
|
| 324 |
+
{"current_steps": 324, "total_steps": 336, "loss": 0.4214, "lr": 3.112535474633971e-07, "epoch": 2.892857142857143, "percentage": 96.43, "elapsed_time": "5:22:00", "remaining_time": "0:11:55"}
|
| 325 |
+
{"current_steps": 325, "total_steps": 336, "loss": 0.4186, "lr": 2.6159370402415674e-07, "epoch": 2.9017857142857144, "percentage": 96.73, "elapsed_time": "5:22:58", "remaining_time": "0:10:55"}
|
| 326 |
+
{"current_steps": 326, "total_steps": 336, "loss": 0.4248, "lr": 2.1623409755751056e-07, "epoch": 2.9107142857142856, "percentage": 97.02, "elapsed_time": "5:23:57", "remaining_time": "0:09:56"}
|
| 327 |
+
{"current_steps": 327, "total_steps": 336, "loss": 0.4233, "lr": 1.751796365908831e-07, "epoch": 2.919642857142857, "percentage": 97.32, "elapsed_time": "5:24:56", "remaining_time": "0:08:56"}
|
| 328 |
+
{"current_steps": 328, "total_steps": 336, "loss": 0.4177, "lr": 1.3843476377628507e-07, "epoch": 2.928571428571429, "percentage": 97.62, "elapsed_time": "5:25:54", "remaining_time": "0:07:56"}
|
| 329 |
+
{"current_steps": 329, "total_steps": 336, "loss": 0.4185, "lr": 1.0600345540958234e-07, "epoch": 2.9375, "percentage": 97.92, "elapsed_time": "5:26:53", "remaining_time": "0:06:57"}
|
| 330 |
+
{"current_steps": 330, "total_steps": 336, "loss": 0.4227, "lr": 7.788922100020024e-08, "epoch": 2.946428571428571, "percentage": 98.21, "elapsed_time": "5:27:51", "remaining_time": "0:05:57"}
|
| 331 |
+
{"current_steps": 331, "total_steps": 336, "loss": 0.4296, "lr": 5.4095102891338344e-08, "epoch": 2.955357142857143, "percentage": 98.51, "elapsed_time": "5:28:50", "remaining_time": "0:04:58"}
|
| 332 |
+
{"current_steps": 332, "total_steps": 336, "loss": 0.4137, "lr": 3.462367593075833e-08, "epoch": 2.9642857142857144, "percentage": 98.81, "elapsed_time": "5:29:49", "remaining_time": "0:03:58"}
|
| 333 |
+
{"current_steps": 333, "total_steps": 336, "loss": 0.4274, "lr": 1.9477047192140164e-08, "epoch": 2.9732142857142856, "percentage": 99.11, "elapsed_time": "5:30:47", "remaining_time": "0:02:58"}
|
| 334 |
+
{"current_steps": 334, "total_steps": 336, "loss": 0.4179, "lr": 8.656855747082305e-09, "epoch": 2.982142857142857, "percentage": 99.4, "elapsed_time": "5:31:46", "remaining_time": "0:01:59"}
|
| 335 |
+
{"current_steps": 335, "total_steps": 336, "loss": 0.411, "lr": 2.1642724877146693e-09, "epoch": 2.991071428571429, "percentage": 99.7, "elapsed_time": "5:32:45", "remaining_time": "0:00:59"}
|
| 336 |
+
{"current_steps": 336, "total_steps": 336, "loss": 0.4162, "lr": 0.0, "epoch": 3.0, "percentage": 100.0, "elapsed_time": "5:33:44", "remaining_time": "0:00:00"}
|
| 337 |
+
{"current_steps": 336, "total_steps": 336, "epoch": 3.0, "percentage": 100.0, "elapsed_time": "5:35:10", "remaining_time": "0:00:00"}
|