Training in progress, epoch 3
Browse files
model-00001-of-00004.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 4877660776
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:a263fd15137c5e62335534365849906eb0275e81256642b927e25e4b6f66be44
|
| 3 |
size 4877660776
|
model-00002-of-00004.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 4932751008
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:e106487fba65be38ec88d560b05e1117d762e0e5b4c23c9a8ec767a0172b6d1f
|
| 3 |
size 4932751008
|
model-00003-of-00004.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 4330865200
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:07d33cafaea06ad2410be9faea33dc896beca39a7e861a69dc60c3630e9835d3
|
| 3 |
size 4330865200
|
model-00004-of-00004.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 1089994880
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:6c4aa02f3cc88c70046c395d7018dcf71b8cdf2e30a9a6b6f40143dacd5cdf5b
|
| 3 |
size 1089994880
|
trainer_log.jsonl
CHANGED
|
@@ -995,3 +995,486 @@
|
|
| 995 |
{"current_steps": 995, "total_steps": 1479, "loss": 0.4129, "lr": 2.9229249349905686e-06, "epoch": 2.0182555780933065, "percentage": 67.28, "elapsed_time": "3:36:10", "remaining_time": "1:45:09"}
|
| 996 |
{"current_steps": 996, "total_steps": 1479, "loss": 0.4245, "lr": 2.9121955948221257e-06, "epoch": 2.020283975659229, "percentage": 67.34, "elapsed_time": "3:36:23", "remaining_time": "1:44:56"}
|
| 997 |
{"current_steps": 997, "total_steps": 1479, "loss": 0.4055, "lr": 2.9014778860871916e-06, "epoch": 2.022312373225152, "percentage": 67.41, "elapsed_time": "3:36:36", "remaining_time": "1:44:43"}
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 995 |
{"current_steps": 995, "total_steps": 1479, "loss": 0.4129, "lr": 2.9229249349905686e-06, "epoch": 2.0182555780933065, "percentage": 67.28, "elapsed_time": "3:36:10", "remaining_time": "1:45:09"}
|
| 996 |
{"current_steps": 996, "total_steps": 1479, "loss": 0.4245, "lr": 2.9121955948221257e-06, "epoch": 2.020283975659229, "percentage": 67.34, "elapsed_time": "3:36:23", "remaining_time": "1:44:56"}
|
| 997 |
{"current_steps": 997, "total_steps": 1479, "loss": 0.4055, "lr": 2.9014778860871916e-06, "epoch": 2.022312373225152, "percentage": 67.41, "elapsed_time": "3:36:36", "remaining_time": "1:44:43"}
|
| 998 |
+
{"current_steps": 998, "total_steps": 1479, "loss": 0.4177, "lr": 2.8907718684955354e-06, "epoch": 2.024340770791075, "percentage": 67.48, "elapsed_time": "3:36:48", "remaining_time": "1:44:29"}
|
| 999 |
+
{"current_steps": 999, "total_steps": 1479, "loss": 0.4178, "lr": 2.880077601691793e-06, "epoch": 2.026369168356998, "percentage": 67.55, "elapsed_time": "3:37:01", "remaining_time": "1:44:16"}
|
| 1000 |
+
{"current_steps": 1000, "total_steps": 1479, "loss": 0.4245, "lr": 2.869395145255131e-06, "epoch": 2.028397565922921, "percentage": 67.61, "elapsed_time": "3:37:14", "remaining_time": "1:44:03"}
|
| 1001 |
+
{"current_steps": 1001, "total_steps": 1479, "loss": 0.4187, "lr": 2.8587245586989265e-06, "epoch": 2.030425963488844, "percentage": 67.68, "elapsed_time": "3:37:27", "remaining_time": "1:43:50"}
|
| 1002 |
+
{"current_steps": 1002, "total_steps": 1479, "loss": 0.4265, "lr": 2.848065901470418e-06, "epoch": 2.032454361054767, "percentage": 67.75, "elapsed_time": "3:37:39", "remaining_time": "1:43:37"}
|
| 1003 |
+
{"current_steps": 1003, "total_steps": 1479, "loss": 0.4285, "lr": 2.8374192329503934e-06, "epoch": 2.0344827586206895, "percentage": 67.82, "elapsed_time": "3:37:52", "remaining_time": "1:43:24"}
|
| 1004 |
+
{"current_steps": 1004, "total_steps": 1479, "loss": 0.4128, "lr": 2.8267846124528487e-06, "epoch": 2.0365111561866125, "percentage": 67.88, "elapsed_time": "3:38:05", "remaining_time": "1:43:10"}
|
| 1005 |
+
{"current_steps": 1005, "total_steps": 1479, "loss": 0.419, "lr": 2.8161620992246497e-06, "epoch": 2.0385395537525355, "percentage": 67.95, "elapsed_time": "3:38:18", "remaining_time": "1:42:57"}
|
| 1006 |
+
{"current_steps": 1006, "total_steps": 1479, "loss": 0.4142, "lr": 2.805551752445222e-06, "epoch": 2.0405679513184585, "percentage": 68.02, "elapsed_time": "3:38:30", "remaining_time": "1:42:44"}
|
| 1007 |
+
{"current_steps": 1007, "total_steps": 1479, "loss": 0.4149, "lr": 2.7949536312262048e-06, "epoch": 2.0425963488843815, "percentage": 68.09, "elapsed_time": "3:38:43", "remaining_time": "1:42:31"}
|
| 1008 |
+
{"current_steps": 1008, "total_steps": 1479, "loss": 0.4392, "lr": 2.7843677946111303e-06, "epoch": 2.0446247464503045, "percentage": 68.15, "elapsed_time": "3:38:56", "remaining_time": "1:42:18"}
|
| 1009 |
+
{"current_steps": 1009, "total_steps": 1479, "loss": 0.4118, "lr": 2.7737943015750862e-06, "epoch": 2.046653144016227, "percentage": 68.22, "elapsed_time": "3:39:09", "remaining_time": "1:42:05"}
|
| 1010 |
+
{"current_steps": 1010, "total_steps": 1479, "loss": 0.4299, "lr": 2.763233211024397e-06, "epoch": 2.04868154158215, "percentage": 68.29, "elapsed_time": "3:39:22", "remaining_time": "1:41:51"}
|
| 1011 |
+
{"current_steps": 1011, "total_steps": 1479, "loss": 0.4238, "lr": 2.752684581796292e-06, "epoch": 2.050709939148073, "percentage": 68.36, "elapsed_time": "3:39:34", "remaining_time": "1:41:38"}
|
| 1012 |
+
{"current_steps": 1012, "total_steps": 1479, "loss": 0.418, "lr": 2.7421484726585715e-06, "epoch": 2.052738336713996, "percentage": 68.42, "elapsed_time": "3:39:47", "remaining_time": "1:41:25"}
|
| 1013 |
+
{"current_steps": 1013, "total_steps": 1479, "loss": 0.4216, "lr": 2.7316249423092923e-06, "epoch": 2.054766734279919, "percentage": 68.49, "elapsed_time": "3:40:00", "remaining_time": "1:41:12"}
|
| 1014 |
+
{"current_steps": 1014, "total_steps": 1479, "loss": 0.4155, "lr": 2.721114049376424e-06, "epoch": 2.056795131845842, "percentage": 68.56, "elapsed_time": "3:40:12", "remaining_time": "1:40:59"}
|
| 1015 |
+
{"current_steps": 1015, "total_steps": 1479, "loss": 0.4305, "lr": 2.7106158524175396e-06, "epoch": 2.0588235294117645, "percentage": 68.63, "elapsed_time": "3:40:25", "remaining_time": "1:40:46"}
|
| 1016 |
+
{"current_steps": 1016, "total_steps": 1479, "loss": 0.4325, "lr": 2.700130409919477e-06, "epoch": 2.0608519269776875, "percentage": 68.7, "elapsed_time": "3:40:38", "remaining_time": "1:40:32"}
|
| 1017 |
+
{"current_steps": 1017, "total_steps": 1479, "loss": 0.4255, "lr": 2.689657780298019e-06, "epoch": 2.0628803245436105, "percentage": 68.76, "elapsed_time": "3:40:51", "remaining_time": "1:40:19"}
|
| 1018 |
+
{"current_steps": 1018, "total_steps": 1479, "loss": 0.436, "lr": 2.6791980218975665e-06, "epoch": 2.0649087221095335, "percentage": 68.83, "elapsed_time": "3:41:04", "remaining_time": "1:40:06"}
|
| 1019 |
+
{"current_steps": 1019, "total_steps": 1479, "loss": 0.4197, "lr": 2.6687511929908093e-06, "epoch": 2.0669371196754565, "percentage": 68.9, "elapsed_time": "3:41:16", "remaining_time": "1:39:53"}
|
| 1020 |
+
{"current_steps": 1020, "total_steps": 1479, "loss": 0.4249, "lr": 2.6583173517784122e-06, "epoch": 2.0689655172413794, "percentage": 68.97, "elapsed_time": "3:41:29", "remaining_time": "1:39:40"}
|
| 1021 |
+
{"current_steps": 1021, "total_steps": 1479, "loss": 0.42, "lr": 2.6478965563886745e-06, "epoch": 2.0709939148073024, "percentage": 69.03, "elapsed_time": "3:41:42", "remaining_time": "1:39:27"}
|
| 1022 |
+
{"current_steps": 1022, "total_steps": 1479, "loss": 0.4314, "lr": 2.637488864877226e-06, "epoch": 2.073022312373225, "percentage": 69.1, "elapsed_time": "3:41:55", "remaining_time": "1:39:14"}
|
| 1023 |
+
{"current_steps": 1023, "total_steps": 1479, "loss": 0.431, "lr": 2.627094335226682e-06, "epoch": 2.075050709939148, "percentage": 69.17, "elapsed_time": "3:42:07", "remaining_time": "1:39:00"}
|
| 1024 |
+
{"current_steps": 1024, "total_steps": 1479, "loss": 0.4294, "lr": 2.616713025346341e-06, "epoch": 2.077079107505071, "percentage": 69.24, "elapsed_time": "3:42:20", "remaining_time": "1:38:47"}
|
| 1025 |
+
{"current_steps": 1025, "total_steps": 1479, "loss": 0.44, "lr": 2.6063449930718487e-06, "epoch": 2.079107505070994, "percentage": 69.3, "elapsed_time": "3:42:33", "remaining_time": "1:38:34"}
|
| 1026 |
+
{"current_steps": 1026, "total_steps": 1479, "loss": 0.4206, "lr": 2.5959902961648785e-06, "epoch": 2.081135902636917, "percentage": 69.37, "elapsed_time": "3:42:46", "remaining_time": "1:38:21"}
|
| 1027 |
+
{"current_steps": 1027, "total_steps": 1479, "loss": 0.4143, "lr": 2.5856489923128136e-06, "epoch": 2.08316430020284, "percentage": 69.44, "elapsed_time": "3:42:58", "remaining_time": "1:38:08"}
|
| 1028 |
+
{"current_steps": 1028, "total_steps": 1479, "loss": 0.4356, "lr": 2.5753211391284172e-06, "epoch": 2.0851926977687625, "percentage": 69.51, "elapsed_time": "3:43:12", "remaining_time": "1:37:55"}
|
| 1029 |
+
{"current_steps": 1029, "total_steps": 1479, "loss": 0.424, "lr": 2.5650067941495236e-06, "epoch": 2.0872210953346855, "percentage": 69.57, "elapsed_time": "3:43:24", "remaining_time": "1:37:42"}
|
| 1030 |
+
{"current_steps": 1030, "total_steps": 1479, "loss": 0.4266, "lr": 2.5547060148387052e-06, "epoch": 2.0892494929006085, "percentage": 69.64, "elapsed_time": "3:43:37", "remaining_time": "1:37:29"}
|
| 1031 |
+
{"current_steps": 1031, "total_steps": 1479, "loss": 0.4158, "lr": 2.5444188585829634e-06, "epoch": 2.0912778904665315, "percentage": 69.71, "elapsed_time": "3:43:50", "remaining_time": "1:37:15"}
|
| 1032 |
+
{"current_steps": 1032, "total_steps": 1479, "loss": 0.4262, "lr": 2.5341453826934016e-06, "epoch": 2.0933062880324544, "percentage": 69.78, "elapsed_time": "3:44:03", "remaining_time": "1:37:02"}
|
| 1033 |
+
{"current_steps": 1033, "total_steps": 1479, "loss": 0.4227, "lr": 2.523885644404906e-06, "epoch": 2.0953346855983774, "percentage": 69.84, "elapsed_time": "3:44:15", "remaining_time": "1:36:49"}
|
| 1034 |
+
{"current_steps": 1034, "total_steps": 1479, "loss": 0.3973, "lr": 2.5136397008758316e-06, "epoch": 2.0973630831643, "percentage": 69.91, "elapsed_time": "3:44:28", "remaining_time": "1:36:36"}
|
| 1035 |
+
{"current_steps": 1035, "total_steps": 1479, "loss": 0.4097, "lr": 2.5034076091876813e-06, "epoch": 2.099391480730223, "percentage": 69.98, "elapsed_time": "3:44:41", "remaining_time": "1:36:23"}
|
| 1036 |
+
{"current_steps": 1036, "total_steps": 1479, "loss": 0.43, "lr": 2.4931894263447874e-06, "epoch": 2.101419878296146, "percentage": 70.05, "elapsed_time": "3:44:54", "remaining_time": "1:36:10"}
|
| 1037 |
+
{"current_steps": 1037, "total_steps": 1479, "loss": 0.4418, "lr": 2.48298520927399e-06, "epoch": 2.103448275862069, "percentage": 70.11, "elapsed_time": "3:45:06", "remaining_time": "1:35:57"}
|
| 1038 |
+
{"current_steps": 1038, "total_steps": 1479, "loss": 0.4137, "lr": 2.472795014824329e-06, "epoch": 2.105476673427992, "percentage": 70.18, "elapsed_time": "3:45:19", "remaining_time": "1:35:43"}
|
| 1039 |
+
{"current_steps": 1039, "total_steps": 1479, "loss": 0.4301, "lr": 2.4626188997667224e-06, "epoch": 2.107505070993915, "percentage": 70.25, "elapsed_time": "3:45:32", "remaining_time": "1:35:30"}
|
| 1040 |
+
{"current_steps": 1040, "total_steps": 1479, "loss": 0.4203, "lr": 2.452456920793645e-06, "epoch": 2.109533468559838, "percentage": 70.32, "elapsed_time": "3:45:45", "remaining_time": "1:35:17"}
|
| 1041 |
+
{"current_steps": 1041, "total_steps": 1479, "loss": 0.413, "lr": 2.4423091345188244e-06, "epoch": 2.1115618661257605, "percentage": 70.39, "elapsed_time": "3:45:57", "remaining_time": "1:35:04"}
|
| 1042 |
+
{"current_steps": 1042, "total_steps": 1479, "loss": 0.4101, "lr": 2.432175597476912e-06, "epoch": 2.1135902636916835, "percentage": 70.45, "elapsed_time": "3:46:10", "remaining_time": "1:34:51"}
|
| 1043 |
+
{"current_steps": 1043, "total_steps": 1479, "loss": 0.4148, "lr": 2.4220563661231793e-06, "epoch": 2.1156186612576064, "percentage": 70.52, "elapsed_time": "3:46:23", "remaining_time": "1:34:38"}
|
| 1044 |
+
{"current_steps": 1044, "total_steps": 1479, "loss": 0.4318, "lr": 2.4119514968331994e-06, "epoch": 2.1176470588235294, "percentage": 70.59, "elapsed_time": "3:46:36", "remaining_time": "1:34:25"}
|
| 1045 |
+
{"current_steps": 1045, "total_steps": 1479, "loss": 0.4405, "lr": 2.4018610459025317e-06, "epoch": 2.1196754563894524, "percentage": 70.66, "elapsed_time": "3:46:49", "remaining_time": "1:34:11"}
|
| 1046 |
+
{"current_steps": 1046, "total_steps": 1479, "loss": 0.4326, "lr": 2.391785069546404e-06, "epoch": 2.1217038539553754, "percentage": 70.72, "elapsed_time": "3:47:01", "remaining_time": "1:33:58"}
|
| 1047 |
+
{"current_steps": 1047, "total_steps": 1479, "loss": 0.4103, "lr": 2.381723623899412e-06, "epoch": 2.123732251521298, "percentage": 70.79, "elapsed_time": "3:47:14", "remaining_time": "1:33:45"}
|
| 1048 |
+
{"current_steps": 1048, "total_steps": 1479, "loss": 0.4241, "lr": 2.3716767650151958e-06, "epoch": 2.125760649087221, "percentage": 70.86, "elapsed_time": "3:47:27", "remaining_time": "1:33:32"}
|
| 1049 |
+
{"current_steps": 1049, "total_steps": 1479, "loss": 0.4281, "lr": 2.361644548866127e-06, "epoch": 2.127789046653144, "percentage": 70.93, "elapsed_time": "3:47:40", "remaining_time": "1:33:19"}
|
| 1050 |
+
{"current_steps": 1050, "total_steps": 1479, "loss": 0.4096, "lr": 2.3516270313430085e-06, "epoch": 2.129817444219067, "percentage": 70.99, "elapsed_time": "3:47:52", "remaining_time": "1:33:06"}
|
| 1051 |
+
{"current_steps": 1051, "total_steps": 1479, "loss": 0.4191, "lr": 2.341624268254747e-06, "epoch": 2.13184584178499, "percentage": 71.06, "elapsed_time": "3:48:05", "remaining_time": "1:32:53"}
|
| 1052 |
+
{"current_steps": 1052, "total_steps": 1479, "loss": 0.4211, "lr": 2.3316363153280545e-06, "epoch": 2.133874239350913, "percentage": 71.13, "elapsed_time": "3:48:18", "remaining_time": "1:32:40"}
|
| 1053 |
+
{"current_steps": 1053, "total_steps": 1479, "loss": 0.4168, "lr": 2.3216632282071345e-06, "epoch": 2.135902636916836, "percentage": 71.2, "elapsed_time": "3:48:31", "remaining_time": "1:32:26"}
|
| 1054 |
+
{"current_steps": 1054, "total_steps": 1479, "loss": 0.4216, "lr": 2.3117050624533695e-06, "epoch": 2.1379310344827585, "percentage": 71.26, "elapsed_time": "3:48:43", "remaining_time": "1:32:13"}
|
| 1055 |
+
{"current_steps": 1055, "total_steps": 1479, "loss": 0.4189, "lr": 2.3017618735450142e-06, "epoch": 2.1399594320486814, "percentage": 71.33, "elapsed_time": "3:48:56", "remaining_time": "1:32:00"}
|
| 1056 |
+
{"current_steps": 1056, "total_steps": 1479, "loss": 0.4235, "lr": 2.291833716876882e-06, "epoch": 2.1419878296146044, "percentage": 71.4, "elapsed_time": "3:49:09", "remaining_time": "1:31:47"}
|
| 1057 |
+
{"current_steps": 1057, "total_steps": 1479, "loss": 0.4189, "lr": 2.2819206477600462e-06, "epoch": 2.1440162271805274, "percentage": 71.47, "elapsed_time": "3:49:22", "remaining_time": "1:31:34"}
|
| 1058 |
+
{"current_steps": 1058, "total_steps": 1479, "loss": 0.4135, "lr": 2.272022721421517e-06, "epoch": 2.1460446247464504, "percentage": 71.53, "elapsed_time": "3:49:34", "remaining_time": "1:31:21"}
|
| 1059 |
+
{"current_steps": 1059, "total_steps": 1479, "loss": 0.4341, "lr": 2.2621399930039493e-06, "epoch": 2.1480730223123734, "percentage": 71.6, "elapsed_time": "3:49:47", "remaining_time": "1:31:08"}
|
| 1060 |
+
{"current_steps": 1060, "total_steps": 1479, "loss": 0.4181, "lr": 2.252272517565324e-06, "epoch": 2.150101419878296, "percentage": 71.67, "elapsed_time": "3:50:00", "remaining_time": "1:30:55"}
|
| 1061 |
+
{"current_steps": 1061, "total_steps": 1479, "loss": 0.4337, "lr": 2.2424203500786473e-06, "epoch": 2.152129817444219, "percentage": 71.74, "elapsed_time": "3:50:13", "remaining_time": "1:30:41"}
|
| 1062 |
+
{"current_steps": 1062, "total_steps": 1479, "loss": 0.4218, "lr": 2.232583545431646e-06, "epoch": 2.154158215010142, "percentage": 71.81, "elapsed_time": "3:50:25", "remaining_time": "1:30:28"}
|
| 1063 |
+
{"current_steps": 1063, "total_steps": 1479, "loss": 0.419, "lr": 2.2227621584264505e-06, "epoch": 2.156186612576065, "percentage": 71.87, "elapsed_time": "3:50:38", "remaining_time": "1:30:15"}
|
| 1064 |
+
{"current_steps": 1064, "total_steps": 1479, "loss": 0.4247, "lr": 2.2129562437793038e-06, "epoch": 2.158215010141988, "percentage": 71.94, "elapsed_time": "3:50:51", "remaining_time": "1:30:02"}
|
| 1065 |
+
{"current_steps": 1065, "total_steps": 1479, "loss": 0.4224, "lr": 2.203165856120251e-06, "epoch": 2.160243407707911, "percentage": 72.01, "elapsed_time": "3:51:04", "remaining_time": "1:29:49"}
|
| 1066 |
+
{"current_steps": 1066, "total_steps": 1479, "loss": 0.4341, "lr": 2.193391049992831e-06, "epoch": 2.162271805273834, "percentage": 72.08, "elapsed_time": "3:51:17", "remaining_time": "1:29:36"}
|
| 1067 |
+
{"current_steps": 1067, "total_steps": 1479, "loss": 0.4425, "lr": 2.183631879853776e-06, "epoch": 2.1643002028397564, "percentage": 72.14, "elapsed_time": "3:51:29", "remaining_time": "1:29:23"}
|
| 1068 |
+
{"current_steps": 1068, "total_steps": 1479, "loss": 0.4147, "lr": 2.173888400072709e-06, "epoch": 2.1663286004056794, "percentage": 72.21, "elapsed_time": "3:51:42", "remaining_time": "1:29:10"}
|
| 1069 |
+
{"current_steps": 1069, "total_steps": 1479, "loss": 0.4245, "lr": 2.164160664931843e-06, "epoch": 2.1683569979716024, "percentage": 72.28, "elapsed_time": "3:51:55", "remaining_time": "1:28:57"}
|
| 1070 |
+
{"current_steps": 1070, "total_steps": 1479, "loss": 0.4378, "lr": 2.1544487286256683e-06, "epoch": 2.1703853955375254, "percentage": 72.35, "elapsed_time": "3:52:08", "remaining_time": "1:28:43"}
|
| 1071 |
+
{"current_steps": 1071, "total_steps": 1479, "loss": 0.4118, "lr": 2.1447526452606658e-06, "epoch": 2.1724137931034484, "percentage": 72.41, "elapsed_time": "3:52:20", "remaining_time": "1:28:30"}
|
| 1072 |
+
{"current_steps": 1072, "total_steps": 1479, "loss": 0.4163, "lr": 2.1350724688549906e-06, "epoch": 2.1744421906693714, "percentage": 72.48, "elapsed_time": "3:52:33", "remaining_time": "1:28:17"}
|
| 1073 |
+
{"current_steps": 1073, "total_steps": 1479, "loss": 0.4409, "lr": 2.125408253338183e-06, "epoch": 2.176470588235294, "percentage": 72.55, "elapsed_time": "3:52:46", "remaining_time": "1:28:04"}
|
| 1074 |
+
{"current_steps": 1074, "total_steps": 1479, "loss": 0.4189, "lr": 2.1157600525508607e-06, "epoch": 2.178498985801217, "percentage": 72.62, "elapsed_time": "3:52:59", "remaining_time": "1:27:51"}
|
| 1075 |
+
{"current_steps": 1075, "total_steps": 1479, "loss": 0.4164, "lr": 2.106127920244423e-06, "epoch": 2.18052738336714, "percentage": 72.68, "elapsed_time": "3:53:11", "remaining_time": "1:27:38"}
|
| 1076 |
+
{"current_steps": 1076, "total_steps": 1479, "loss": 0.426, "lr": 2.096511910080749e-06, "epoch": 2.182555780933063, "percentage": 72.75, "elapsed_time": "3:53:24", "remaining_time": "1:27:25"}
|
| 1077 |
+
{"current_steps": 1077, "total_steps": 1479, "loss": 0.4194, "lr": 2.086912075631896e-06, "epoch": 2.184584178498986, "percentage": 72.82, "elapsed_time": "3:53:37", "remaining_time": "1:27:12"}
|
| 1078 |
+
{"current_steps": 1078, "total_steps": 1479, "loss": 0.4146, "lr": 2.0773284703798106e-06, "epoch": 2.186612576064909, "percentage": 72.89, "elapsed_time": "3:53:50", "remaining_time": "1:26:58"}
|
| 1079 |
+
{"current_steps": 1079, "total_steps": 1479, "loss": 0.426, "lr": 2.067761147716017e-06, "epoch": 2.1886409736308314, "percentage": 72.95, "elapsed_time": "3:54:02", "remaining_time": "1:26:45"}
|
| 1080 |
+
{"current_steps": 1080, "total_steps": 1479, "loss": 0.4253, "lr": 2.0582101609413336e-06, "epoch": 2.1906693711967544, "percentage": 73.02, "elapsed_time": "3:54:15", "remaining_time": "1:26:32"}
|
| 1081 |
+
{"current_steps": 1081, "total_steps": 1479, "loss": 0.4181, "lr": 2.0486755632655643e-06, "epoch": 2.1926977687626774, "percentage": 73.09, "elapsed_time": "3:54:28", "remaining_time": "1:26:19"}
|
| 1082 |
+
{"current_steps": 1082, "total_steps": 1479, "loss": 0.4338, "lr": 2.0391574078072098e-06, "epoch": 2.1947261663286004, "percentage": 73.16, "elapsed_time": "3:54:41", "remaining_time": "1:26:06"}
|
| 1083 |
+
{"current_steps": 1083, "total_steps": 1479, "loss": 0.4325, "lr": 2.029655747593169e-06, "epoch": 2.1967545638945234, "percentage": 73.23, "elapsed_time": "3:54:53", "remaining_time": "1:25:53"}
|
| 1084 |
+
{"current_steps": 1084, "total_steps": 1479, "loss": 0.4427, "lr": 2.0201706355584438e-06, "epoch": 2.1987829614604464, "percentage": 73.29, "elapsed_time": "3:55:06", "remaining_time": "1:25:40"}
|
| 1085 |
+
{"current_steps": 1085, "total_steps": 1479, "loss": 0.4379, "lr": 2.010702124545845e-06, "epoch": 2.2008113590263694, "percentage": 73.36, "elapsed_time": "3:55:19", "remaining_time": "1:25:27"}
|
| 1086 |
+
{"current_steps": 1086, "total_steps": 1479, "loss": 0.4312, "lr": 2.0012502673056916e-06, "epoch": 2.202839756592292, "percentage": 73.43, "elapsed_time": "3:55:32", "remaining_time": "1:25:14"}
|
| 1087 |
+
{"current_steps": 1087, "total_steps": 1479, "loss": 0.4054, "lr": 1.9918151164955303e-06, "epoch": 2.204868154158215, "percentage": 73.5, "elapsed_time": "3:55:44", "remaining_time": "1:25:01"}
|
| 1088 |
+
{"current_steps": 1088, "total_steps": 1479, "loss": 0.4208, "lr": 1.9823967246798247e-06, "epoch": 2.206896551724138, "percentage": 73.56, "elapsed_time": "3:55:57", "remaining_time": "1:24:47"}
|
| 1089 |
+
{"current_steps": 1089, "total_steps": 1479, "loss": 0.4193, "lr": 1.9729951443296823e-06, "epoch": 2.208924949290061, "percentage": 73.63, "elapsed_time": "3:56:10", "remaining_time": "1:24:34"}
|
| 1090 |
+
{"current_steps": 1090, "total_steps": 1479, "loss": 0.4146, "lr": 1.9636104278225414e-06, "epoch": 2.210953346855984, "percentage": 73.7, "elapsed_time": "3:56:23", "remaining_time": "1:24:21"}
|
| 1091 |
+
{"current_steps": 1091, "total_steps": 1479, "loss": 0.4472, "lr": 1.9542426274418975e-06, "epoch": 2.212981744421907, "percentage": 73.77, "elapsed_time": "3:56:36", "remaining_time": "1:24:08"}
|
| 1092 |
+
{"current_steps": 1092, "total_steps": 1479, "loss": 0.4297, "lr": 1.9448917953769997e-06, "epoch": 2.2150101419878294, "percentage": 73.83, "elapsed_time": "3:56:48", "remaining_time": "1:23:55"}
|
| 1093 |
+
{"current_steps": 1093, "total_steps": 1479, "loss": 0.4216, "lr": 1.9355579837225673e-06, "epoch": 2.2170385395537524, "percentage": 73.9, "elapsed_time": "3:57:01", "remaining_time": "1:23:42"}
|
| 1094 |
+
{"current_steps": 1094, "total_steps": 1479, "loss": 0.4016, "lr": 1.926241244478496e-06, "epoch": 2.2190669371196754, "percentage": 73.97, "elapsed_time": "3:57:14", "remaining_time": "1:23:29"}
|
| 1095 |
+
{"current_steps": 1095, "total_steps": 1479, "loss": 0.4339, "lr": 1.916941629549565e-06, "epoch": 2.2210953346855984, "percentage": 74.04, "elapsed_time": "3:57:27", "remaining_time": "1:23:16"}
|
| 1096 |
+
{"current_steps": 1096, "total_steps": 1479, "loss": 0.4187, "lr": 1.9076591907451585e-06, "epoch": 2.2231237322515214, "percentage": 74.1, "elapsed_time": "3:57:39", "remaining_time": "1:23:03"}
|
| 1097 |
+
{"current_steps": 1097, "total_steps": 1479, "loss": 0.4272, "lr": 1.8983939797789624e-06, "epoch": 2.2251521298174444, "percentage": 74.17, "elapsed_time": "3:57:52", "remaining_time": "1:22:50"}
|
| 1098 |
+
{"current_steps": 1098, "total_steps": 1479, "loss": 0.4135, "lr": 1.8891460482686903e-06, "epoch": 2.227180527383367, "percentage": 74.24, "elapsed_time": "3:58:05", "remaining_time": "1:22:37"}
|
| 1099 |
+
{"current_steps": 1099, "total_steps": 1479, "loss": 0.4317, "lr": 1.8799154477357883e-06, "epoch": 2.22920892494929, "percentage": 74.31, "elapsed_time": "3:58:18", "remaining_time": "1:22:23"}
|
| 1100 |
+
{"current_steps": 1100, "total_steps": 1479, "loss": 0.4149, "lr": 1.8707022296051463e-06, "epoch": 2.231237322515213, "percentage": 74.37, "elapsed_time": "3:58:31", "remaining_time": "1:22:10"}
|
| 1101 |
+
{"current_steps": 1101, "total_steps": 1479, "loss": 0.4148, "lr": 1.8615064452048181e-06, "epoch": 2.233265720081136, "percentage": 74.44, "elapsed_time": "3:58:44", "remaining_time": "1:21:57"}
|
| 1102 |
+
{"current_steps": 1102, "total_steps": 1479, "loss": 0.4309, "lr": 1.8523281457657304e-06, "epoch": 2.235294117647059, "percentage": 74.51, "elapsed_time": "3:58:56", "remaining_time": "1:21:44"}
|
| 1103 |
+
{"current_steps": 1103, "total_steps": 1479, "loss": 0.4286, "lr": 1.8431673824214013e-06, "epoch": 2.237322515212982, "percentage": 74.58, "elapsed_time": "3:59:09", "remaining_time": "1:21:31"}
|
| 1104 |
+
{"current_steps": 1104, "total_steps": 1479, "loss": 0.4436, "lr": 1.8340242062076464e-06, "epoch": 2.239350912778905, "percentage": 74.65, "elapsed_time": "3:59:23", "remaining_time": "1:21:18"}
|
| 1105 |
+
{"current_steps": 1105, "total_steps": 1479, "loss": 0.4265, "lr": 1.8248986680623077e-06, "epoch": 2.2413793103448274, "percentage": 74.71, "elapsed_time": "3:59:36", "remaining_time": "1:21:05"}
|
| 1106 |
+
{"current_steps": 1106, "total_steps": 1479, "loss": 0.4205, "lr": 1.8157908188249629e-06, "epoch": 2.2434077079107504, "percentage": 74.78, "elapsed_time": "3:59:49", "remaining_time": "1:20:52"}
|
| 1107 |
+
{"current_steps": 1107, "total_steps": 1479, "loss": 0.4177, "lr": 1.8067007092366368e-06, "epoch": 2.2454361054766734, "percentage": 74.85, "elapsed_time": "4:00:03", "remaining_time": "1:20:40"}
|
| 1108 |
+
{"current_steps": 1108, "total_steps": 1479, "loss": 0.4272, "lr": 1.7976283899395314e-06, "epoch": 2.2474645030425964, "percentage": 74.92, "elapsed_time": "4:00:16", "remaining_time": "1:20:27"}
|
| 1109 |
+
{"current_steps": 1109, "total_steps": 1479, "loss": 0.4159, "lr": 1.7885739114767292e-06, "epoch": 2.2494929006085194, "percentage": 74.98, "elapsed_time": "4:00:30", "remaining_time": "1:20:14"}
|
| 1110 |
+
{"current_steps": 1110, "total_steps": 1479, "loss": 0.4165, "lr": 1.7795373242919262e-06, "epoch": 2.2515212981744424, "percentage": 75.05, "elapsed_time": "4:00:43", "remaining_time": "1:20:01"}
|
| 1111 |
+
{"current_steps": 1111, "total_steps": 1479, "loss": 0.4105, "lr": 1.770518678729139e-06, "epoch": 2.2535496957403653, "percentage": 75.12, "elapsed_time": "4:00:56", "remaining_time": "1:19:48"}
|
| 1112 |
+
{"current_steps": 1112, "total_steps": 1479, "loss": 0.4032, "lr": 1.761518025032432e-06, "epoch": 2.255578093306288, "percentage": 75.19, "elapsed_time": "4:01:09", "remaining_time": "1:19:35"}
|
| 1113 |
+
{"current_steps": 1113, "total_steps": 1479, "loss": 0.4296, "lr": 1.752535413345634e-06, "epoch": 2.257606490872211, "percentage": 75.25, "elapsed_time": "4:01:22", "remaining_time": "1:19:22"}
|
| 1114 |
+
{"current_steps": 1114, "total_steps": 1479, "loss": 0.4357, "lr": 1.743570893712056e-06, "epoch": 2.259634888438134, "percentage": 75.32, "elapsed_time": "4:01:35", "remaining_time": "1:19:09"}
|
| 1115 |
+
{"current_steps": 1115, "total_steps": 1479, "loss": 0.435, "lr": 1.734624516074221e-06, "epoch": 2.261663286004057, "percentage": 75.39, "elapsed_time": "4:01:48", "remaining_time": "1:18:56"}
|
| 1116 |
+
{"current_steps": 1116, "total_steps": 1479, "loss": 0.4317, "lr": 1.7256963302735752e-06, "epoch": 2.26369168356998, "percentage": 75.46, "elapsed_time": "4:02:00", "remaining_time": "1:18:43"}
|
| 1117 |
+
{"current_steps": 1117, "total_steps": 1479, "loss": 0.424, "lr": 1.716786386050221e-06, "epoch": 2.2657200811359024, "percentage": 75.52, "elapsed_time": "4:02:13", "remaining_time": "1:18:30"}
|
| 1118 |
+
{"current_steps": 1118, "total_steps": 1479, "loss": 0.412, "lr": 1.7078947330426293e-06, "epoch": 2.2677484787018254, "percentage": 75.59, "elapsed_time": "4:02:26", "remaining_time": "1:18:16"}
|
| 1119 |
+
{"current_steps": 1119, "total_steps": 1479, "loss": 0.4152, "lr": 1.6990214207873723e-06, "epoch": 2.2697768762677484, "percentage": 75.66, "elapsed_time": "4:02:39", "remaining_time": "1:18:03"}
|
| 1120 |
+
{"current_steps": 1120, "total_steps": 1479, "loss": 0.4251, "lr": 1.6901664987188427e-06, "epoch": 2.2718052738336714, "percentage": 75.73, "elapsed_time": "4:02:51", "remaining_time": "1:17:50"}
|
| 1121 |
+
{"current_steps": 1121, "total_steps": 1479, "loss": 0.4217, "lr": 1.681330016168977e-06, "epoch": 2.2738336713995944, "percentage": 75.79, "elapsed_time": "4:03:04", "remaining_time": "1:17:37"}
|
| 1122 |
+
{"current_steps": 1122, "total_steps": 1479, "loss": 0.4201, "lr": 1.6725120223669873e-06, "epoch": 2.2758620689655173, "percentage": 75.86, "elapsed_time": "4:03:17", "remaining_time": "1:17:24"}
|
| 1123 |
+
{"current_steps": 1123, "total_steps": 1479, "loss": 0.4334, "lr": 1.6637125664390747e-06, "epoch": 2.2778904665314403, "percentage": 75.93, "elapsed_time": "4:03:30", "remaining_time": "1:17:11"}
|
| 1124 |
+
{"current_steps": 1124, "total_steps": 1479, "loss": 0.4025, "lr": 1.654931697408172e-06, "epoch": 2.279918864097363, "percentage": 76.0, "elapsed_time": "4:03:43", "remaining_time": "1:16:58"}
|
| 1125 |
+
{"current_steps": 1125, "total_steps": 1479, "loss": 0.4247, "lr": 1.6461694641936544e-06, "epoch": 2.281947261663286, "percentage": 76.06, "elapsed_time": "4:03:55", "remaining_time": "1:16:45"}
|
| 1126 |
+
{"current_steps": 1126, "total_steps": 1479, "loss": 0.4176, "lr": 1.6374259156110812e-06, "epoch": 2.283975659229209, "percentage": 76.13, "elapsed_time": "4:04:08", "remaining_time": "1:16:32"}
|
| 1127 |
+
{"current_steps": 1127, "total_steps": 1479, "loss": 0.4218, "lr": 1.6287011003719105e-06, "epoch": 2.286004056795132, "percentage": 76.2, "elapsed_time": "4:04:21", "remaining_time": "1:16:19"}
|
| 1128 |
+
{"current_steps": 1128, "total_steps": 1479, "loss": 0.433, "lr": 1.6199950670832404e-06, "epoch": 2.288032454361055, "percentage": 76.27, "elapsed_time": "4:04:34", "remaining_time": "1:16:06"}
|
| 1129 |
+
{"current_steps": 1129, "total_steps": 1479, "loss": 0.4141, "lr": 1.61130786424753e-06, "epoch": 2.290060851926978, "percentage": 76.34, "elapsed_time": "4:04:46", "remaining_time": "1:15:53"}
|
| 1130 |
+
{"current_steps": 1130, "total_steps": 1479, "loss": 0.4049, "lr": 1.6026395402623274e-06, "epoch": 2.292089249492901, "percentage": 76.4, "elapsed_time": "4:04:59", "remaining_time": "1:15:39"}
|
| 1131 |
+
{"current_steps": 1131, "total_steps": 1479, "loss": 0.4346, "lr": 1.5939901434200145e-06, "epoch": 2.2941176470588234, "percentage": 76.47, "elapsed_time": "4:05:12", "remaining_time": "1:15:26"}
|
| 1132 |
+
{"current_steps": 1132, "total_steps": 1479, "loss": 0.4295, "lr": 1.5853597219075155e-06, "epoch": 2.2961460446247464, "percentage": 76.54, "elapsed_time": "4:05:25", "remaining_time": "1:15:13"}
|
| 1133 |
+
{"current_steps": 1133, "total_steps": 1479, "loss": 0.4261, "lr": 1.5767483238060498e-06, "epoch": 2.2981744421906694, "percentage": 76.61, "elapsed_time": "4:05:38", "remaining_time": "1:15:00"}
|
| 1134 |
+
{"current_steps": 1134, "total_steps": 1479, "loss": 0.4279, "lr": 1.5681559970908483e-06, "epoch": 2.3002028397565923, "percentage": 76.67, "elapsed_time": "4:05:50", "remaining_time": "1:14:47"}
|
| 1135 |
+
{"current_steps": 1135, "total_steps": 1479, "loss": 0.4284, "lr": 1.5595827896308968e-06, "epoch": 2.3022312373225153, "percentage": 76.74, "elapsed_time": "4:06:03", "remaining_time": "1:14:34"}
|
| 1136 |
+
{"current_steps": 1136, "total_steps": 1479, "loss": 0.4346, "lr": 1.5510287491886656e-06, "epoch": 2.3042596348884383, "percentage": 76.81, "elapsed_time": "4:06:16", "remaining_time": "1:14:21"}
|
| 1137 |
+
{"current_steps": 1137, "total_steps": 1479, "loss": 0.4138, "lr": 1.5424939234198377e-06, "epoch": 2.306288032454361, "percentage": 76.88, "elapsed_time": "4:06:29", "remaining_time": "1:14:08"}
|
| 1138 |
+
{"current_steps": 1138, "total_steps": 1479, "loss": 0.4017, "lr": 1.5339783598730568e-06, "epoch": 2.308316430020284, "percentage": 76.94, "elapsed_time": "4:06:41", "remaining_time": "1:13:55"}
|
| 1139 |
+
{"current_steps": 1139, "total_steps": 1479, "loss": 0.4303, "lr": 1.5254821059896452e-06, "epoch": 2.310344827586207, "percentage": 77.01, "elapsed_time": "4:06:54", "remaining_time": "1:13:42"}
|
| 1140 |
+
{"current_steps": 1140, "total_steps": 1479, "loss": 0.4342, "lr": 1.5170052091033554e-06, "epoch": 2.31237322515213, "percentage": 77.08, "elapsed_time": "4:07:07", "remaining_time": "1:13:29"}
|
| 1141 |
+
{"current_steps": 1141, "total_steps": 1479, "loss": 0.4289, "lr": 1.5085477164400975e-06, "epoch": 2.314401622718053, "percentage": 77.15, "elapsed_time": "4:07:20", "remaining_time": "1:13:16"}
|
| 1142 |
+
{"current_steps": 1142, "total_steps": 1479, "loss": 0.4298, "lr": 1.500109675117677e-06, "epoch": 2.316430020283976, "percentage": 77.21, "elapsed_time": "4:07:32", "remaining_time": "1:13:03"}
|
| 1143 |
+
{"current_steps": 1143, "total_steps": 1479, "loss": 0.4194, "lr": 1.4916911321455362e-06, "epoch": 2.3184584178498984, "percentage": 77.28, "elapsed_time": "4:07:45", "remaining_time": "1:12:49"}
|
| 1144 |
+
{"current_steps": 1144, "total_steps": 1479, "loss": 0.4272, "lr": 1.4832921344244843e-06, "epoch": 2.3204868154158214, "percentage": 77.35, "elapsed_time": "4:07:58", "remaining_time": "1:12:36"}
|
| 1145 |
+
{"current_steps": 1145, "total_steps": 1479, "loss": 0.4235, "lr": 1.4749127287464483e-06, "epoch": 2.3225152129817443, "percentage": 77.42, "elapsed_time": "4:08:11", "remaining_time": "1:12:23"}
|
| 1146 |
+
{"current_steps": 1146, "total_steps": 1479, "loss": 0.4298, "lr": 1.4665529617941976e-06, "epoch": 2.3245436105476673, "percentage": 77.48, "elapsed_time": "4:08:23", "remaining_time": "1:12:10"}
|
| 1147 |
+
{"current_steps": 1147, "total_steps": 1479, "loss": 0.411, "lr": 1.458212880141099e-06, "epoch": 2.3265720081135903, "percentage": 77.55, "elapsed_time": "4:08:36", "remaining_time": "1:11:57"}
|
| 1148 |
+
{"current_steps": 1148, "total_steps": 1479, "loss": 0.4424, "lr": 1.4498925302508438e-06, "epoch": 2.3286004056795133, "percentage": 77.62, "elapsed_time": "4:08:49", "remaining_time": "1:11:44"}
|
| 1149 |
+
{"current_steps": 1149, "total_steps": 1479, "loss": 0.4248, "lr": 1.4415919584771999e-06, "epoch": 2.3306288032454363, "percentage": 77.69, "elapsed_time": "4:09:02", "remaining_time": "1:11:31"}
|
| 1150 |
+
{"current_steps": 1150, "total_steps": 1479, "loss": 0.4082, "lr": 1.4333112110637454e-06, "epoch": 2.332657200811359, "percentage": 77.76, "elapsed_time": "4:09:14", "remaining_time": "1:11:18"}
|
| 1151 |
+
{"current_steps": 1151, "total_steps": 1479, "loss": 0.459, "lr": 1.425050334143616e-06, "epoch": 2.334685598377282, "percentage": 77.82, "elapsed_time": "4:09:27", "remaining_time": "1:11:05"}
|
| 1152 |
+
{"current_steps": 1152, "total_steps": 1479, "loss": 0.4367, "lr": 1.416809373739248e-06, "epoch": 2.336713995943205, "percentage": 77.89, "elapsed_time": "4:09:40", "remaining_time": "1:10:52"}
|
| 1153 |
+
{"current_steps": 1153, "total_steps": 1479, "loss": 0.4347, "lr": 1.408588375762114e-06, "epoch": 2.338742393509128, "percentage": 77.96, "elapsed_time": "4:09:53", "remaining_time": "1:10:39"}
|
| 1154 |
+
{"current_steps": 1154, "total_steps": 1479, "loss": 0.4244, "lr": 1.4003873860124806e-06, "epoch": 2.340770791075051, "percentage": 78.03, "elapsed_time": "4:10:05", "remaining_time": "1:10:26"}
|
| 1155 |
+
{"current_steps": 1155, "total_steps": 1479, "loss": 0.4154, "lr": 1.39220645017914e-06, "epoch": 2.342799188640974, "percentage": 78.09, "elapsed_time": "4:10:18", "remaining_time": "1:10:13"}
|
| 1156 |
+
{"current_steps": 1156, "total_steps": 1479, "loss": 0.4124, "lr": 1.3840456138391644e-06, "epoch": 2.344827586206897, "percentage": 78.16, "elapsed_time": "4:10:31", "remaining_time": "1:09:59"}
|
| 1157 |
+
{"current_steps": 1157, "total_steps": 1479, "loss": 0.4166, "lr": 1.3759049224576516e-06, "epoch": 2.3468559837728193, "percentage": 78.23, "elapsed_time": "4:10:44", "remaining_time": "1:09:46"}
|
| 1158 |
+
{"current_steps": 1158, "total_steps": 1479, "loss": 0.4345, "lr": 1.3677844213874619e-06, "epoch": 2.3488843813387423, "percentage": 78.3, "elapsed_time": "4:10:57", "remaining_time": "1:09:33"}
|
| 1159 |
+
{"current_steps": 1159, "total_steps": 1479, "loss": 0.4385, "lr": 1.3596841558689788e-06, "epoch": 2.3509127789046653, "percentage": 78.36, "elapsed_time": "4:11:09", "remaining_time": "1:09:20"}
|
| 1160 |
+
{"current_steps": 1160, "total_steps": 1479, "loss": 0.4376, "lr": 1.35160417102985e-06, "epoch": 2.3529411764705883, "percentage": 78.43, "elapsed_time": "4:11:22", "remaining_time": "1:09:07"}
|
| 1161 |
+
{"current_steps": 1161, "total_steps": 1479, "loss": 0.4285, "lr": 1.3435445118847362e-06, "epoch": 2.3549695740365113, "percentage": 78.5, "elapsed_time": "4:11:35", "remaining_time": "1:08:54"}
|
| 1162 |
+
{"current_steps": 1162, "total_steps": 1479, "loss": 0.4329, "lr": 1.3355052233350584e-06, "epoch": 2.356997971602434, "percentage": 78.57, "elapsed_time": "4:11:48", "remaining_time": "1:08:41"}
|
| 1163 |
+
{"current_steps": 1163, "total_steps": 1479, "loss": 0.424, "lr": 1.3274863501687546e-06, "epoch": 2.359026369168357, "percentage": 78.63, "elapsed_time": "4:12:00", "remaining_time": "1:08:28"}
|
| 1164 |
+
{"current_steps": 1164, "total_steps": 1479, "loss": 0.4178, "lr": 1.3194879370600244e-06, "epoch": 2.36105476673428, "percentage": 78.7, "elapsed_time": "4:12:13", "remaining_time": "1:08:15"}
|
| 1165 |
+
{"current_steps": 1165, "total_steps": 1479, "loss": 0.434, "lr": 1.3115100285690795e-06, "epoch": 2.363083164300203, "percentage": 78.77, "elapsed_time": "4:12:26", "remaining_time": "1:08:02"}
|
| 1166 |
+
{"current_steps": 1166, "total_steps": 1479, "loss": 0.4261, "lr": 1.3035526691419026e-06, "epoch": 2.365111561866126, "percentage": 78.84, "elapsed_time": "4:12:39", "remaining_time": "1:07:49"}
|
| 1167 |
+
{"current_steps": 1167, "total_steps": 1479, "loss": 0.4423, "lr": 1.2956159031099874e-06, "epoch": 2.367139959432049, "percentage": 78.9, "elapsed_time": "4:12:52", "remaining_time": "1:07:36"}
|
| 1168 |
+
{"current_steps": 1168, "total_steps": 1479, "loss": 0.4231, "lr": 1.2876997746901072e-06, "epoch": 2.369168356997972, "percentage": 78.97, "elapsed_time": "4:13:04", "remaining_time": "1:07:23"}
|
| 1169 |
+
{"current_steps": 1169, "total_steps": 1479, "loss": 0.4205, "lr": 1.2798043279840544e-06, "epoch": 2.3711967545638943, "percentage": 79.04, "elapsed_time": "4:13:17", "remaining_time": "1:07:10"}
|
| 1170 |
+
{"current_steps": 1170, "total_steps": 1479, "loss": 0.4194, "lr": 1.2719296069784066e-06, "epoch": 2.3732251521298173, "percentage": 79.11, "elapsed_time": "4:13:30", "remaining_time": "1:06:57"}
|
| 1171 |
+
{"current_steps": 1171, "total_steps": 1479, "loss": 0.4175, "lr": 1.2640756555442684e-06, "epoch": 2.3752535496957403, "percentage": 79.18, "elapsed_time": "4:13:43", "remaining_time": "1:06:44"}
|
| 1172 |
+
{"current_steps": 1172, "total_steps": 1479, "loss": 0.4075, "lr": 1.25624251743704e-06, "epoch": 2.3772819472616633, "percentage": 79.24, "elapsed_time": "4:13:55", "remaining_time": "1:06:30"}
|
| 1173 |
+
{"current_steps": 1173, "total_steps": 1479, "loss": 0.4108, "lr": 1.248430236296168e-06, "epoch": 2.3793103448275863, "percentage": 79.31, "elapsed_time": "4:14:08", "remaining_time": "1:06:17"}
|
| 1174 |
+
{"current_steps": 1174, "total_steps": 1479, "loss": 0.4231, "lr": 1.2406388556448973e-06, "epoch": 2.3813387423935093, "percentage": 79.38, "elapsed_time": "4:14:21", "remaining_time": "1:06:04"}
|
| 1175 |
+
{"current_steps": 1175, "total_steps": 1479, "loss": 0.4196, "lr": 1.2328684188900392e-06, "epoch": 2.3833671399594323, "percentage": 79.45, "elapsed_time": "4:14:34", "remaining_time": "1:05:51"}
|
| 1176 |
+
{"current_steps": 1176, "total_steps": 1479, "loss": 0.4279, "lr": 1.2251189693217175e-06, "epoch": 2.385395537525355, "percentage": 79.51, "elapsed_time": "4:14:46", "remaining_time": "1:05:38"}
|
| 1177 |
+
{"current_steps": 1177, "total_steps": 1479, "loss": 0.4184, "lr": 1.2173905501131395e-06, "epoch": 2.387423935091278, "percentage": 79.58, "elapsed_time": "4:14:59", "remaining_time": "1:05:25"}
|
| 1178 |
+
{"current_steps": 1178, "total_steps": 1479, "loss": 0.4208, "lr": 1.2096832043203467e-06, "epoch": 2.389452332657201, "percentage": 79.65, "elapsed_time": "4:15:12", "remaining_time": "1:05:12"}
|
| 1179 |
+
{"current_steps": 1179, "total_steps": 1479, "loss": 0.4329, "lr": 1.2019969748819783e-06, "epoch": 2.391480730223124, "percentage": 79.72, "elapsed_time": "4:15:25", "remaining_time": "1:04:59"}
|
| 1180 |
+
{"current_steps": 1180, "total_steps": 1479, "loss": 0.4094, "lr": 1.1943319046190333e-06, "epoch": 2.393509127789047, "percentage": 79.78, "elapsed_time": "4:15:37", "remaining_time": "1:04:46"}
|
| 1181 |
+
{"current_steps": 1181, "total_steps": 1479, "loss": 0.4286, "lr": 1.186688036234625e-06, "epoch": 2.3955375253549693, "percentage": 79.85, "elapsed_time": "4:15:50", "remaining_time": "1:04:33"}
|
| 1182 |
+
{"current_steps": 1182, "total_steps": 1479, "loss": 0.439, "lr": 1.1790654123137552e-06, "epoch": 2.3975659229208923, "percentage": 79.92, "elapsed_time": "4:16:03", "remaining_time": "1:04:20"}
|
| 1183 |
+
{"current_steps": 1183, "total_steps": 1479, "loss": 0.4293, "lr": 1.1714640753230628e-06, "epoch": 2.3995943204868153, "percentage": 79.99, "elapsed_time": "4:16:16", "remaining_time": "1:04:07"}
|
| 1184 |
+
{"current_steps": 1184, "total_steps": 1479, "loss": 0.4402, "lr": 1.1638840676106012e-06, "epoch": 2.4016227180527383, "percentage": 80.05, "elapsed_time": "4:16:28", "remaining_time": "1:03:54"}
|
| 1185 |
+
{"current_steps": 1185, "total_steps": 1479, "loss": 0.4298, "lr": 1.1563254314055893e-06, "epoch": 2.4036511156186613, "percentage": 80.12, "elapsed_time": "4:16:41", "remaining_time": "1:03:41"}
|
| 1186 |
+
{"current_steps": 1186, "total_steps": 1479, "loss": 0.4375, "lr": 1.1487882088181878e-06, "epoch": 2.4056795131845843, "percentage": 80.19, "elapsed_time": "4:16:54", "remaining_time": "1:03:28"}
|
| 1187 |
+
{"current_steps": 1187, "total_steps": 1479, "loss": 0.4128, "lr": 1.1412724418392562e-06, "epoch": 2.4077079107505073, "percentage": 80.26, "elapsed_time": "4:17:07", "remaining_time": "1:03:15"}
|
| 1188 |
+
{"current_steps": 1188, "total_steps": 1479, "loss": 0.4259, "lr": 1.1337781723401236e-06, "epoch": 2.40973630831643, "percentage": 80.32, "elapsed_time": "4:17:19", "remaining_time": "1:03:01"}
|
| 1189 |
+
{"current_steps": 1189, "total_steps": 1479, "loss": 0.4291, "lr": 1.126305442072354e-06, "epoch": 2.411764705882353, "percentage": 80.39, "elapsed_time": "4:17:32", "remaining_time": "1:02:48"}
|
| 1190 |
+
{"current_steps": 1190, "total_steps": 1479, "loss": 0.4434, "lr": 1.1188542926675105e-06, "epoch": 2.413793103448276, "percentage": 80.46, "elapsed_time": "4:17:45", "remaining_time": "1:02:35"}
|
| 1191 |
+
{"current_steps": 1191, "total_steps": 1479, "loss": 0.4196, "lr": 1.1114247656369305e-06, "epoch": 2.415821501014199, "percentage": 80.53, "elapsed_time": "4:17:58", "remaining_time": "1:02:22"}
|
| 1192 |
+
{"current_steps": 1192, "total_steps": 1479, "loss": 0.4233, "lr": 1.1040169023714852e-06, "epoch": 2.417849898580122, "percentage": 80.59, "elapsed_time": "4:18:10", "remaining_time": "1:02:09"}
|
| 1193 |
+
{"current_steps": 1193, "total_steps": 1479, "loss": 0.4175, "lr": 1.0966307441413598e-06, "epoch": 2.4198782961460448, "percentage": 80.66, "elapsed_time": "4:18:23", "remaining_time": "1:01:56"}
|
| 1194 |
+
{"current_steps": 1194, "total_steps": 1479, "loss": 0.434, "lr": 1.0892663320958159e-06, "epoch": 2.4219066937119678, "percentage": 80.73, "elapsed_time": "4:18:36", "remaining_time": "1:01:43"}
|
| 1195 |
+
{"current_steps": 1195, "total_steps": 1479, "loss": 0.4333, "lr": 1.0819237072629606e-06, "epoch": 2.4239350912778903, "percentage": 80.8, "elapsed_time": "4:18:49", "remaining_time": "1:01:30"}
|
| 1196 |
+
{"current_steps": 1196, "total_steps": 1479, "loss": 0.4293, "lr": 1.074602910549527e-06, "epoch": 2.4259634888438133, "percentage": 80.87, "elapsed_time": "4:19:01", "remaining_time": "1:01:17"}
|
| 1197 |
+
{"current_steps": 1197, "total_steps": 1479, "loss": 0.4196, "lr": 1.0673039827406373e-06, "epoch": 2.4279918864097363, "percentage": 80.93, "elapsed_time": "4:19:14", "remaining_time": "1:01:04"}
|
| 1198 |
+
{"current_steps": 1198, "total_steps": 1479, "loss": 0.4257, "lr": 1.0600269644995826e-06, "epoch": 2.4300202839756593, "percentage": 81.0, "elapsed_time": "4:19:27", "remaining_time": "1:00:51"}
|
| 1199 |
+
{"current_steps": 1199, "total_steps": 1479, "loss": 0.4191, "lr": 1.0527718963675871e-06, "epoch": 2.4320486815415823, "percentage": 81.07, "elapsed_time": "4:19:40", "remaining_time": "1:00:38"}
|
| 1200 |
+
{"current_steps": 1200, "total_steps": 1479, "loss": 0.4343, "lr": 1.0455388187635934e-06, "epoch": 2.4340770791075053, "percentage": 81.14, "elapsed_time": "4:19:52", "remaining_time": "1:00:25"}
|
| 1201 |
+
{"current_steps": 1201, "total_steps": 1479, "loss": 0.4157, "lr": 1.0383277719840318e-06, "epoch": 2.436105476673428, "percentage": 81.2, "elapsed_time": "4:20:05", "remaining_time": "1:00:12"}
|
| 1202 |
+
{"current_steps": 1202, "total_steps": 1479, "loss": 0.4215, "lr": 1.0311387962025909e-06, "epoch": 2.438133874239351, "percentage": 81.27, "elapsed_time": "4:20:18", "remaining_time": "0:59:59"}
|
| 1203 |
+
{"current_steps": 1203, "total_steps": 1479, "loss": 0.4195, "lr": 1.0239719314700052e-06, "epoch": 2.440162271805274, "percentage": 81.34, "elapsed_time": "4:20:31", "remaining_time": "0:59:46"}
|
| 1204 |
+
{"current_steps": 1204, "total_steps": 1479, "loss": 0.4515, "lr": 1.01682721771382e-06, "epoch": 2.4421906693711968, "percentage": 81.41, "elapsed_time": "4:20:43", "remaining_time": "0:59:33"}
|
| 1205 |
+
{"current_steps": 1205, "total_steps": 1479, "loss": 0.4251, "lr": 1.0097046947381805e-06, "epoch": 2.4442190669371198, "percentage": 81.47, "elapsed_time": "4:20:56", "remaining_time": "0:59:20"}
|
| 1206 |
+
{"current_steps": 1206, "total_steps": 1479, "loss": 0.4215, "lr": 1.002604402223597e-06, "epoch": 2.4462474645030428, "percentage": 81.54, "elapsed_time": "4:21:09", "remaining_time": "0:59:07"}
|
| 1207 |
+
{"current_steps": 1207, "total_steps": 1479, "loss": 0.4265, "lr": 9.955263797267379e-07, "epoch": 2.4482758620689653, "percentage": 81.61, "elapsed_time": "4:21:22", "remaining_time": "0:58:54"}
|
| 1208 |
+
{"current_steps": 1208, "total_steps": 1479, "loss": 0.4131, "lr": 9.88470666680198e-07, "epoch": 2.4503042596348883, "percentage": 81.68, "elapsed_time": "4:21:34", "remaining_time": "0:58:40"}
|
| 1209 |
+
{"current_steps": 1209, "total_steps": 1479, "loss": 0.4236, "lr": 9.814373023922851e-07, "epoch": 2.4523326572008113, "percentage": 81.74, "elapsed_time": "4:21:47", "remaining_time": "0:58:27"}
|
| 1210 |
+
{"current_steps": 1210, "total_steps": 1479, "loss": 0.435, "lr": 9.744263260468006e-07, "epoch": 2.4543610547667343, "percentage": 81.81, "elapsed_time": "4:22:00", "remaining_time": "0:58:14"}
|
| 1211 |
+
{"current_steps": 1211, "total_steps": 1479, "loss": 0.4172, "lr": 9.674377767028142e-07, "epoch": 2.4563894523326573, "percentage": 81.88, "elapsed_time": "4:22:13", "remaining_time": "0:58:01"}
|
| 1212 |
+
{"current_steps": 1212, "total_steps": 1479, "loss": 0.4134, "lr": 9.604716932944586e-07, "epoch": 2.4584178498985803, "percentage": 81.95, "elapsed_time": "4:22:25", "remaining_time": "0:57:48"}
|
| 1213 |
+
{"current_steps": 1213, "total_steps": 1479, "loss": 0.4234, "lr": 9.53528114630699e-07, "epoch": 2.4604462474645032, "percentage": 82.01, "elapsed_time": "4:22:38", "remaining_time": "0:57:35"}
|
| 1214 |
+
{"current_steps": 1214, "total_steps": 1479, "loss": 0.412, "lr": 9.466070793951309e-07, "epoch": 2.462474645030426, "percentage": 82.08, "elapsed_time": "4:22:51", "remaining_time": "0:57:22"}
|
| 1215 |
+
{"current_steps": 1215, "total_steps": 1479, "loss": 0.4068, "lr": 9.397086261457511e-07, "epoch": 2.464503042596349, "percentage": 82.15, "elapsed_time": "4:23:04", "remaining_time": "0:57:09"}
|
| 1216 |
+
{"current_steps": 1216, "total_steps": 1479, "loss": 0.4288, "lr": 9.328327933147529e-07, "epoch": 2.4665314401622718, "percentage": 82.22, "elapsed_time": "4:23:17", "remaining_time": "0:56:56"}
|
| 1217 |
+
{"current_steps": 1217, "total_steps": 1479, "loss": 0.4365, "lr": 9.259796192083071e-07, "epoch": 2.4685598377281948, "percentage": 82.29, "elapsed_time": "4:23:29", "remaining_time": "0:56:43"}
|
| 1218 |
+
{"current_steps": 1218, "total_steps": 1479, "loss": 0.4201, "lr": 9.191491420063498e-07, "epoch": 2.4705882352941178, "percentage": 82.35, "elapsed_time": "4:23:42", "remaining_time": "0:56:30"}
|
| 1219 |
+
{"current_steps": 1219, "total_steps": 1479, "loss": 0.433, "lr": 9.123413997623714e-07, "epoch": 2.4726166328600407, "percentage": 82.42, "elapsed_time": "4:23:55", "remaining_time": "0:56:17"}
|
| 1220 |
+
{"current_steps": 1220, "total_steps": 1479, "loss": 0.4177, "lr": 9.055564304031983e-07, "epoch": 2.4746450304259637, "percentage": 82.49, "elapsed_time": "4:24:08", "remaining_time": "0:56:04"}
|
| 1221 |
+
{"current_steps": 1221, "total_steps": 1479, "loss": 0.4073, "lr": 8.987942717287923e-07, "epoch": 2.4766734279918863, "percentage": 82.56, "elapsed_time": "4:24:20", "remaining_time": "0:55:51"}
|
| 1222 |
+
{"current_steps": 1222, "total_steps": 1479, "loss": 0.4113, "lr": 8.920549614120272e-07, "epoch": 2.4787018255578093, "percentage": 82.62, "elapsed_time": "4:24:33", "remaining_time": "0:55:38"}
|
| 1223 |
+
{"current_steps": 1223, "total_steps": 1479, "loss": 0.4285, "lr": 8.853385369984901e-07, "epoch": 2.4807302231237323, "percentage": 82.69, "elapsed_time": "4:24:46", "remaining_time": "0:55:25"}
|
| 1224 |
+
{"current_steps": 1224, "total_steps": 1479, "loss": 0.4098, "lr": 8.786450359062693e-07, "epoch": 2.4827586206896552, "percentage": 82.76, "elapsed_time": "4:24:59", "remaining_time": "0:55:12"}
|
| 1225 |
+
{"current_steps": 1225, "total_steps": 1479, "loss": 0.4235, "lr": 8.719744954257375e-07, "epoch": 2.4847870182555782, "percentage": 82.83, "elapsed_time": "4:25:12", "remaining_time": "0:54:59"}
|
| 1226 |
+
{"current_steps": 1226, "total_steps": 1479, "loss": 0.4112, "lr": 8.65326952719357e-07, "epoch": 2.486815415821501, "percentage": 82.89, "elapsed_time": "4:25:24", "remaining_time": "0:54:46"}
|
| 1227 |
+
{"current_steps": 1227, "total_steps": 1479, "loss": 0.4235, "lr": 8.587024448214637e-07, "epoch": 2.4888438133874238, "percentage": 82.96, "elapsed_time": "4:25:37", "remaining_time": "0:54:33"}
|
| 1228 |
+
{"current_steps": 1228, "total_steps": 1479, "loss": 0.4349, "lr": 8.521010086380665e-07, "epoch": 2.4908722109533468, "percentage": 83.03, "elapsed_time": "4:25:50", "remaining_time": "0:54:20"}
|
| 1229 |
+
{"current_steps": 1229, "total_steps": 1479, "loss": 0.4397, "lr": 8.455226809466327e-07, "epoch": 2.4929006085192698, "percentage": 83.1, "elapsed_time": "4:26:03", "remaining_time": "0:54:07"}
|
| 1230 |
+
{"current_steps": 1230, "total_steps": 1479, "loss": 0.4215, "lr": 8.389674983958951e-07, "epoch": 2.4949290060851927, "percentage": 83.16, "elapsed_time": "4:26:15", "remaining_time": "0:53:54"}
|
| 1231 |
+
{"current_steps": 1231, "total_steps": 1479, "loss": 0.4432, "lr": 8.324354975056403e-07, "epoch": 2.4969574036511157, "percentage": 83.23, "elapsed_time": "4:26:28", "remaining_time": "0:53:41"}
|
| 1232 |
+
{"current_steps": 1232, "total_steps": 1479, "loss": 0.4171, "lr": 8.25926714666504e-07, "epoch": 2.4989858012170387, "percentage": 83.3, "elapsed_time": "4:26:41", "remaining_time": "0:53:28"}
|
| 1233 |
+
{"current_steps": 1233, "total_steps": 1479, "loss": 0.4151, "lr": 8.19441186139776e-07, "epoch": 2.5010141987829613, "percentage": 83.37, "elapsed_time": "4:26:54", "remaining_time": "0:53:15"}
|
| 1234 |
+
{"current_steps": 1234, "total_steps": 1479, "loss": 0.4375, "lr": 8.129789480571871e-07, "epoch": 2.5030425963488843, "percentage": 83.43, "elapsed_time": "4:27:06", "remaining_time": "0:53:02"}
|
| 1235 |
+
{"current_steps": 1235, "total_steps": 1479, "loss": 0.4204, "lr": 8.065400364207194e-07, "epoch": 2.5050709939148073, "percentage": 83.5, "elapsed_time": "4:27:19", "remaining_time": "0:52:48"}
|
| 1236 |
+
{"current_steps": 1236, "total_steps": 1479, "loss": 0.4215, "lr": 8.001244871023978e-07, "epoch": 2.5070993914807302, "percentage": 83.57, "elapsed_time": "4:27:32", "remaining_time": "0:52:35"}
|
| 1237 |
+
{"current_steps": 1237, "total_steps": 1479, "loss": 0.436, "lr": 7.937323358440935e-07, "epoch": 2.5091277890466532, "percentage": 83.64, "elapsed_time": "4:27:45", "remaining_time": "0:52:22"}
|
| 1238 |
+
{"current_steps": 1238, "total_steps": 1479, "loss": 0.4269, "lr": 7.873636182573246e-07, "epoch": 2.5111561866125762, "percentage": 83.71, "elapsed_time": "4:27:58", "remaining_time": "0:52:09"}
|
| 1239 |
+
{"current_steps": 1239, "total_steps": 1479, "loss": 0.4162, "lr": 7.810183698230539e-07, "epoch": 2.513184584178499, "percentage": 83.77, "elapsed_time": "4:28:10", "remaining_time": "0:51:56"}
|
| 1240 |
+
{"current_steps": 1240, "total_steps": 1479, "loss": 0.4455, "lr": 7.74696625891499e-07, "epoch": 2.5152129817444218, "percentage": 83.84, "elapsed_time": "4:28:23", "remaining_time": "0:51:43"}
|
| 1241 |
+
{"current_steps": 1241, "total_steps": 1479, "loss": 0.4199, "lr": 7.683984216819262e-07, "epoch": 2.5172413793103448, "percentage": 83.91, "elapsed_time": "4:28:36", "remaining_time": "0:51:30"}
|
| 1242 |
+
{"current_steps": 1242, "total_steps": 1479, "loss": 0.4043, "lr": 7.621237922824637e-07, "epoch": 2.5192697768762677, "percentage": 83.98, "elapsed_time": "4:28:49", "remaining_time": "0:51:17"}
|
| 1243 |
+
{"current_steps": 1243, "total_steps": 1479, "loss": 0.4218, "lr": 7.55872772649896e-07, "epoch": 2.5212981744421907, "percentage": 84.04, "elapsed_time": "4:29:01", "remaining_time": "0:51:04"}
|
| 1244 |
+
{"current_steps": 1244, "total_steps": 1479, "loss": 0.4217, "lr": 7.496453976094792e-07, "epoch": 2.5233265720081137, "percentage": 84.11, "elapsed_time": "4:29:14", "remaining_time": "0:50:51"}
|
| 1245 |
+
{"current_steps": 1245, "total_steps": 1479, "loss": 0.4104, "lr": 7.434417018547396e-07, "epoch": 2.5253549695740363, "percentage": 84.18, "elapsed_time": "4:29:27", "remaining_time": "0:50:38"}
|
| 1246 |
+
{"current_steps": 1246, "total_steps": 1479, "loss": 0.4201, "lr": 7.372617199472854e-07, "epoch": 2.5273833671399597, "percentage": 84.25, "elapsed_time": "4:29:40", "remaining_time": "0:50:25"}
|
| 1247 |
+
{"current_steps": 1247, "total_steps": 1479, "loss": 0.4343, "lr": 7.311054863166095e-07, "epoch": 2.5294117647058822, "percentage": 84.31, "elapsed_time": "4:29:52", "remaining_time": "0:50:12"}
|
| 1248 |
+
{"current_steps": 1248, "total_steps": 1479, "loss": 0.4455, "lr": 7.249730352599e-07, "epoch": 2.5314401622718052, "percentage": 84.38, "elapsed_time": "4:30:05", "remaining_time": "0:49:59"}
|
| 1249 |
+
{"current_steps": 1249, "total_steps": 1479, "loss": 0.4181, "lr": 7.188644009418517e-07, "epoch": 2.5334685598377282, "percentage": 84.45, "elapsed_time": "4:30:18", "remaining_time": "0:49:46"}
|
| 1250 |
+
{"current_steps": 1250, "total_steps": 1479, "loss": 0.415, "lr": 7.127796173944695e-07, "epoch": 2.535496957403651, "percentage": 84.52, "elapsed_time": "4:30:31", "remaining_time": "0:49:33"}
|
| 1251 |
+
{"current_steps": 1251, "total_steps": 1479, "loss": 0.4112, "lr": 7.067187185168862e-07, "epoch": 2.537525354969574, "percentage": 84.58, "elapsed_time": "4:30:44", "remaining_time": "0:49:20"}
|
| 1252 |
+
{"current_steps": 1252, "total_steps": 1479, "loss": 0.415, "lr": 7.006817380751663e-07, "epoch": 2.5395537525354968, "percentage": 84.65, "elapsed_time": "4:30:56", "remaining_time": "0:49:07"}
|
| 1253 |
+
{"current_steps": 1253, "total_steps": 1479, "loss": 0.4249, "lr": 6.946687097021249e-07, "epoch": 2.5415821501014197, "percentage": 84.72, "elapsed_time": "4:31:09", "remaining_time": "0:48:54"}
|
| 1254 |
+
{"current_steps": 1254, "total_steps": 1479, "loss": 0.4141, "lr": 6.886796668971357e-07, "epoch": 2.5436105476673427, "percentage": 84.79, "elapsed_time": "4:31:22", "remaining_time": "0:48:41"}
|
| 1255 |
+
{"current_steps": 1255, "total_steps": 1479, "loss": 0.4127, "lr": 6.827146430259446e-07, "epoch": 2.5456389452332657, "percentage": 84.85, "elapsed_time": "4:31:35", "remaining_time": "0:48:28"}
|
| 1256 |
+
{"current_steps": 1256, "total_steps": 1479, "loss": 0.4175, "lr": 6.767736713204875e-07, "epoch": 2.5476673427991887, "percentage": 84.92, "elapsed_time": "4:31:47", "remaining_time": "0:48:15"}
|
| 1257 |
+
{"current_steps": 1257, "total_steps": 1479, "loss": 0.4128, "lr": 6.70856784878699e-07, "epoch": 2.5496957403651117, "percentage": 84.99, "elapsed_time": "4:32:00", "remaining_time": "0:48:02"}
|
| 1258 |
+
{"current_steps": 1258, "total_steps": 1479, "loss": 0.4182, "lr": 6.649640166643345e-07, "epoch": 2.5517241379310347, "percentage": 85.06, "elapsed_time": "4:32:13", "remaining_time": "0:47:49"}
|
| 1259 |
+
{"current_steps": 1259, "total_steps": 1479, "loss": 0.4204, "lr": 6.590953995067812e-07, "epoch": 2.5537525354969572, "percentage": 85.13, "elapsed_time": "4:32:25", "remaining_time": "0:47:36"}
|
| 1260 |
+
{"current_steps": 1260, "total_steps": 1479, "loss": 0.4322, "lr": 6.53250966100879e-07, "epoch": 2.5557809330628802, "percentage": 85.19, "elapsed_time": "4:32:38", "remaining_time": "0:47:23"}
|
| 1261 |
+
{"current_steps": 1261, "total_steps": 1479, "loss": 0.4141, "lr": 6.474307490067383e-07, "epoch": 2.5578093306288032, "percentage": 85.26, "elapsed_time": "4:32:51", "remaining_time": "0:47:10"}
|
| 1262 |
+
{"current_steps": 1262, "total_steps": 1479, "loss": 0.4304, "lr": 6.416347806495532e-07, "epoch": 2.559837728194726, "percentage": 85.33, "elapsed_time": "4:33:04", "remaining_time": "0:46:57"}
|
| 1263 |
+
{"current_steps": 1263, "total_steps": 1479, "loss": 0.4189, "lr": 6.358630933194282e-07, "epoch": 2.561866125760649, "percentage": 85.4, "elapsed_time": "4:33:17", "remaining_time": "0:46:44"}
|
| 1264 |
+
{"current_steps": 1264, "total_steps": 1479, "loss": 0.4174, "lr": 6.301157191711949e-07, "epoch": 2.5638945233265718, "percentage": 85.46, "elapsed_time": "4:33:29", "remaining_time": "0:46:31"}
|
| 1265 |
+
{"current_steps": 1265, "total_steps": 1479, "loss": 0.4393, "lr": 6.24392690224232e-07, "epoch": 2.565922920892495, "percentage": 85.53, "elapsed_time": "4:33:42", "remaining_time": "0:46:18"}
|
| 1266 |
+
{"current_steps": 1266, "total_steps": 1479, "loss": 0.4271, "lr": 6.186940383622875e-07, "epoch": 2.5679513184584177, "percentage": 85.6, "elapsed_time": "4:33:55", "remaining_time": "0:46:05"}
|
| 1267 |
+
{"current_steps": 1267, "total_steps": 1479, "loss": 0.4199, "lr": 6.130197953333017e-07, "epoch": 2.5699797160243407, "percentage": 85.67, "elapsed_time": "4:34:08", "remaining_time": "0:45:52"}
|
| 1268 |
+
{"current_steps": 1268, "total_steps": 1479, "loss": 0.4221, "lr": 6.073699927492322e-07, "epoch": 2.5720081135902637, "percentage": 85.73, "elapsed_time": "4:34:20", "remaining_time": "0:45:39"}
|
| 1269 |
+
{"current_steps": 1269, "total_steps": 1479, "loss": 0.4302, "lr": 6.017446620858708e-07, "epoch": 2.5740365111561867, "percentage": 85.8, "elapsed_time": "4:34:33", "remaining_time": "0:45:26"}
|
| 1270 |
+
{"current_steps": 1270, "total_steps": 1479, "loss": 0.4064, "lr": 5.961438346826792e-07, "epoch": 2.5760649087221097, "percentage": 85.87, "elapsed_time": "4:34:46", "remaining_time": "0:45:13"}
|
| 1271 |
+
{"current_steps": 1271, "total_steps": 1479, "loss": 0.4096, "lr": 5.905675417426027e-07, "epoch": 2.5780933062880322, "percentage": 85.94, "elapsed_time": "4:34:59", "remaining_time": "0:45:00"}
|
| 1272 |
+
{"current_steps": 1272, "total_steps": 1479, "loss": 0.42, "lr": 5.850158143319062e-07, "epoch": 2.5801217038539552, "percentage": 86.0, "elapsed_time": "4:35:11", "remaining_time": "0:44:47"}
|
| 1273 |
+
{"current_steps": 1273, "total_steps": 1479, "loss": 0.4165, "lr": 5.794886833799923e-07, "epoch": 2.582150101419878, "percentage": 86.07, "elapsed_time": "4:35:24", "remaining_time": "0:44:34"}
|
| 1274 |
+
{"current_steps": 1274, "total_steps": 1479, "loss": 0.4251, "lr": 5.739861796792373e-07, "epoch": 2.584178498985801, "percentage": 86.14, "elapsed_time": "4:35:37", "remaining_time": "0:44:21"}
|
| 1275 |
+
{"current_steps": 1275, "total_steps": 1479, "loss": 0.4219, "lr": 5.685083338848152e-07, "epoch": 2.586206896551724, "percentage": 86.21, "elapsed_time": "4:35:50", "remaining_time": "0:44:08"}
|
| 1276 |
+
{"current_steps": 1276, "total_steps": 1479, "loss": 0.4226, "lr": 5.630551765145259e-07, "epoch": 2.588235294117647, "percentage": 86.27, "elapsed_time": "4:36:02", "remaining_time": "0:43:54"}
|
| 1277 |
+
{"current_steps": 1277, "total_steps": 1479, "loss": 0.4204, "lr": 5.576267379486294e-07, "epoch": 2.59026369168357, "percentage": 86.34, "elapsed_time": "4:36:15", "remaining_time": "0:43:41"}
|
| 1278 |
+
{"current_steps": 1278, "total_steps": 1479, "loss": 0.4407, "lr": 5.522230484296698e-07, "epoch": 2.5922920892494927, "percentage": 86.41, "elapsed_time": "4:36:28", "remaining_time": "0:43:28"}
|
| 1279 |
+
{"current_steps": 1279, "total_steps": 1479, "loss": 0.4238, "lr": 5.468441380623169e-07, "epoch": 2.5943204868154157, "percentage": 86.48, "elapsed_time": "4:36:41", "remaining_time": "0:43:15"}
|
| 1280 |
+
{"current_steps": 1280, "total_steps": 1479, "loss": 0.42, "lr": 5.414900368131854e-07, "epoch": 2.5963488843813387, "percentage": 86.54, "elapsed_time": "4:36:53", "remaining_time": "0:43:02"}
|
| 1281 |
+
{"current_steps": 1281, "total_steps": 1479, "loss": 0.4488, "lr": 5.361607745106817e-07, "epoch": 2.5983772819472617, "percentage": 86.61, "elapsed_time": "4:37:06", "remaining_time": "0:42:49"}
|
| 1282 |
+
{"current_steps": 1282, "total_steps": 1479, "loss": 0.4329, "lr": 5.308563808448286e-07, "epoch": 2.6004056795131847, "percentage": 86.68, "elapsed_time": "4:37:19", "remaining_time": "0:42:36"}
|
| 1283 |
+
{"current_steps": 1283, "total_steps": 1479, "loss": 0.4166, "lr": 5.255768853671011e-07, "epoch": 2.6024340770791072, "percentage": 86.75, "elapsed_time": "4:37:32", "remaining_time": "0:42:23"}
|
| 1284 |
+
{"current_steps": 1284, "total_steps": 1479, "loss": 0.4344, "lr": 5.203223174902644e-07, "epoch": 2.6044624746450307, "percentage": 86.82, "elapsed_time": "4:37:44", "remaining_time": "0:42:10"}
|
| 1285 |
+
{"current_steps": 1285, "total_steps": 1479, "loss": 0.4229, "lr": 5.150927064882089e-07, "epoch": 2.606490872210953, "percentage": 86.88, "elapsed_time": "4:37:57", "remaining_time": "0:41:57"}
|
| 1286 |
+
{"current_steps": 1286, "total_steps": 1479, "loss": 0.439, "lr": 5.098880814957879e-07, "epoch": 2.608519269776876, "percentage": 86.95, "elapsed_time": "4:38:10", "remaining_time": "0:41:44"}
|
| 1287 |
+
{"current_steps": 1287, "total_steps": 1479, "loss": 0.4245, "lr": 5.047084715086515e-07, "epoch": 2.610547667342799, "percentage": 87.02, "elapsed_time": "4:38:23", "remaining_time": "0:41:31"}
|
| 1288 |
+
{"current_steps": 1288, "total_steps": 1479, "loss": 0.4376, "lr": 4.995539053830901e-07, "epoch": 2.612576064908722, "percentage": 87.09, "elapsed_time": "4:38:35", "remaining_time": "0:41:18"}
|
| 1289 |
+
{"current_steps": 1289, "total_steps": 1479, "loss": 0.436, "lr": 4.944244118358721e-07, "epoch": 2.614604462474645, "percentage": 87.15, "elapsed_time": "4:38:48", "remaining_time": "0:41:05"}
|
| 1290 |
+
{"current_steps": 1290, "total_steps": 1479, "loss": 0.4097, "lr": 4.8932001944408e-07, "epoch": 2.6166328600405677, "percentage": 87.22, "elapsed_time": "4:39:01", "remaining_time": "0:40:52"}
|
| 1291 |
+
{"current_steps": 1291, "total_steps": 1479, "loss": 0.4344, "lr": 4.842407566449591e-07, "epoch": 2.6186612576064907, "percentage": 87.29, "elapsed_time": "4:39:14", "remaining_time": "0:40:39"}
|
| 1292 |
+
{"current_steps": 1292, "total_steps": 1479, "loss": 0.4311, "lr": 4.791866517357491e-07, "epoch": 2.6206896551724137, "percentage": 87.36, "elapsed_time": "4:39:26", "remaining_time": "0:40:26"}
|
| 1293 |
+
{"current_steps": 1293, "total_steps": 1479, "loss": 0.4124, "lr": 4.741577328735364e-07, "epoch": 2.6227180527383367, "percentage": 87.42, "elapsed_time": "4:39:39", "remaining_time": "0:40:13"}
|
| 1294 |
+
{"current_steps": 1294, "total_steps": 1479, "loss": 0.4193, "lr": 4.6915402807509004e-07, "epoch": 2.6247464503042597, "percentage": 87.49, "elapsed_time": "4:39:52", "remaining_time": "0:40:00"}
|
| 1295 |
+
{"current_steps": 1295, "total_steps": 1479, "loss": 0.422, "lr": 4.641755652167107e-07, "epoch": 2.6267748478701827, "percentage": 87.56, "elapsed_time": "4:40:05", "remaining_time": "0:39:47"}
|
| 1296 |
+
{"current_steps": 1296, "total_steps": 1479, "loss": 0.4204, "lr": 4.592223720340683e-07, "epoch": 2.6288032454361057, "percentage": 87.63, "elapsed_time": "4:40:17", "remaining_time": "0:39:34"}
|
| 1297 |
+
{"current_steps": 1297, "total_steps": 1479, "loss": 0.4262, "lr": 4.5429447612205635e-07, "epoch": 2.630831643002028, "percentage": 87.69, "elapsed_time": "4:40:30", "remaining_time": "0:39:21"}
|
| 1298 |
+
{"current_steps": 1298, "total_steps": 1479, "loss": 0.4297, "lr": 4.4939190493463347e-07, "epoch": 2.632860040567951, "percentage": 87.76, "elapsed_time": "4:40:43", "remaining_time": "0:39:08"}
|
| 1299 |
+
{"current_steps": 1299, "total_steps": 1479, "loss": 0.4123, "lr": 4.445146857846672e-07, "epoch": 2.634888438133874, "percentage": 87.83, "elapsed_time": "4:40:56", "remaining_time": "0:38:55"}
|
| 1300 |
+
{"current_steps": 1300, "total_steps": 1479, "loss": 0.4207, "lr": 4.3966284584379125e-07, "epoch": 2.636916835699797, "percentage": 87.9, "elapsed_time": "4:41:09", "remaining_time": "0:38:42"}
|
| 1301 |
+
{"current_steps": 1301, "total_steps": 1479, "loss": 0.4214, "lr": 4.3483641214224325e-07, "epoch": 2.63894523326572, "percentage": 87.96, "elapsed_time": "4:41:21", "remaining_time": "0:38:29"}
|
| 1302 |
+
{"current_steps": 1302, "total_steps": 1479, "loss": 0.4066, "lr": 4.300354115687216e-07, "epoch": 2.640973630831643, "percentage": 88.03, "elapsed_time": "4:41:34", "remaining_time": "0:38:16"}
|
| 1303 |
+
{"current_steps": 1303, "total_steps": 1479, "loss": 0.4278, "lr": 4.2525987087023433e-07, "epoch": 2.643002028397566, "percentage": 88.1, "elapsed_time": "4:41:47", "remaining_time": "0:38:03"}
|
| 1304 |
+
{"current_steps": 1304, "total_steps": 1479, "loss": 0.4106, "lr": 4.2050981665194725e-07, "epoch": 2.6450304259634887, "percentage": 88.17, "elapsed_time": "4:42:00", "remaining_time": "0:37:50"}
|
| 1305 |
+
{"current_steps": 1305, "total_steps": 1479, "loss": 0.4162, "lr": 4.1578527537703973e-07, "epoch": 2.6470588235294117, "percentage": 88.24, "elapsed_time": "4:42:13", "remaining_time": "0:37:37"}
|
| 1306 |
+
{"current_steps": 1306, "total_steps": 1479, "loss": 0.4274, "lr": 4.110862733665522e-07, "epoch": 2.6490872210953347, "percentage": 88.3, "elapsed_time": "4:42:25", "remaining_time": "0:37:24"}
|
| 1307 |
+
{"current_steps": 1307, "total_steps": 1479, "loss": 0.401, "lr": 4.064128367992459e-07, "epoch": 2.6511156186612577, "percentage": 88.37, "elapsed_time": "4:42:38", "remaining_time": "0:37:11"}
|
| 1308 |
+
{"current_steps": 1308, "total_steps": 1479, "loss": 0.4322, "lr": 4.0176499171144967e-07, "epoch": 2.6531440162271807, "percentage": 88.44, "elapsed_time": "4:42:51", "remaining_time": "0:36:58"}
|
| 1309 |
+
{"current_steps": 1309, "total_steps": 1479, "loss": 0.4116, "lr": 3.971427639969233e-07, "epoch": 2.655172413793103, "percentage": 88.51, "elapsed_time": "4:43:03", "remaining_time": "0:36:45"}
|
| 1310 |
+
{"current_steps": 1310, "total_steps": 1479, "loss": 0.4282, "lr": 3.925461794067048e-07, "epoch": 2.6572008113590266, "percentage": 88.57, "elapsed_time": "4:43:16", "remaining_time": "0:36:32"}
|
| 1311 |
+
{"current_steps": 1311, "total_steps": 1479, "loss": 0.4242, "lr": 3.879752635489736e-07, "epoch": 2.659229208924949, "percentage": 88.64, "elapsed_time": "4:43:29", "remaining_time": "0:36:19"}
|
| 1312 |
+
{"current_steps": 1312, "total_steps": 1479, "loss": 0.4086, "lr": 3.834300418889042e-07, "epoch": 2.661257606490872, "percentage": 88.71, "elapsed_time": "4:43:42", "remaining_time": "0:36:06"}
|
| 1313 |
+
{"current_steps": 1313, "total_steps": 1479, "loss": 0.4355, "lr": 3.7891053974852597e-07, "epoch": 2.663286004056795, "percentage": 88.78, "elapsed_time": "4:43:55", "remaining_time": "0:35:53"}
|
| 1314 |
+
{"current_steps": 1314, "total_steps": 1479, "loss": 0.4132, "lr": 3.744167823065814e-07, "epoch": 2.665314401622718, "percentage": 88.84, "elapsed_time": "4:44:07", "remaining_time": "0:35:40"}
|
| 1315 |
+
{"current_steps": 1315, "total_steps": 1479, "loss": 0.4246, "lr": 3.6994879459838375e-07, "epoch": 2.667342799188641, "percentage": 88.91, "elapsed_time": "4:44:20", "remaining_time": "0:35:27"}
|
| 1316 |
+
{"current_steps": 1316, "total_steps": 1479, "loss": 0.433, "lr": 3.655066015156833e-07, "epoch": 2.6693711967545637, "percentage": 88.98, "elapsed_time": "4:44:33", "remaining_time": "0:35:14"}
|
| 1317 |
+
{"current_steps": 1317, "total_steps": 1479, "loss": 0.4117, "lr": 3.6109022780652147e-07, "epoch": 2.6713995943204867, "percentage": 89.05, "elapsed_time": "4:44:46", "remaining_time": "0:35:01"}
|
| 1318 |
+
{"current_steps": 1318, "total_steps": 1479, "loss": 0.4377, "lr": 3.566996980750992e-07, "epoch": 2.6734279918864097, "percentage": 89.11, "elapsed_time": "4:44:58", "remaining_time": "0:34:48"}
|
| 1319 |
+
{"current_steps": 1319, "total_steps": 1479, "loss": 0.408, "lr": 3.5233503678163696e-07, "epoch": 2.6754563894523327, "percentage": 89.18, "elapsed_time": "4:45:11", "remaining_time": "0:34:35"}
|
| 1320 |
+
{"current_steps": 1320, "total_steps": 1479, "loss": 0.4324, "lr": 3.4799626824223666e-07, "epoch": 2.6774847870182557, "percentage": 89.25, "elapsed_time": "4:45:24", "remaining_time": "0:34:22"}
|
| 1321 |
+
{"current_steps": 1321, "total_steps": 1479, "loss": 0.4222, "lr": 3.4368341662875004e-07, "epoch": 2.6795131845841786, "percentage": 89.32, "elapsed_time": "4:45:37", "remaining_time": "0:34:09"}
|
| 1322 |
+
{"current_steps": 1322, "total_steps": 1479, "loss": 0.4083, "lr": 3.3939650596864216e-07, "epoch": 2.6815415821501016, "percentage": 89.38, "elapsed_time": "4:45:49", "remaining_time": "0:33:56"}
|
| 1323 |
+
{"current_steps": 1323, "total_steps": 1479, "loss": 0.4316, "lr": 3.3513556014485805e-07, "epoch": 2.683569979716024, "percentage": 89.45, "elapsed_time": "4:46:02", "remaining_time": "0:33:43"}
|
| 1324 |
+
{"current_steps": 1324, "total_steps": 1479, "loss": 0.4078, "lr": 3.3090060289568683e-07, "epoch": 2.685598377281947, "percentage": 89.52, "elapsed_time": "4:46:15", "remaining_time": "0:33:30"}
|
| 1325 |
+
{"current_steps": 1325, "total_steps": 1479, "loss": 0.4204, "lr": 3.26691657814634e-07, "epoch": 2.68762677484787, "percentage": 89.59, "elapsed_time": "4:46:28", "remaining_time": "0:33:17"}
|
| 1326 |
+
{"current_steps": 1326, "total_steps": 1479, "loss": 0.4223, "lr": 3.225087483502892e-07, "epoch": 2.689655172413793, "percentage": 89.66, "elapsed_time": "4:46:40", "remaining_time": "0:33:04"}
|
| 1327 |
+
{"current_steps": 1327, "total_steps": 1479, "loss": 0.399, "lr": 3.183518978061895e-07, "epoch": 2.691683569979716, "percentage": 89.72, "elapsed_time": "4:46:53", "remaining_time": "0:32:51"}
|
| 1328 |
+
{"current_steps": 1328, "total_steps": 1479, "loss": 0.4154, "lr": 3.1422112934069993e-07, "epoch": 2.6937119675456387, "percentage": 89.79, "elapsed_time": "4:47:06", "remaining_time": "0:32:38"}
|
| 1329 |
+
{"current_steps": 1329, "total_steps": 1479, "loss": 0.4494, "lr": 3.101164659668732e-07, "epoch": 2.695740365111562, "percentage": 89.86, "elapsed_time": "4:47:19", "remaining_time": "0:32:25"}
|
| 1330 |
+
{"current_steps": 1330, "total_steps": 1479, "loss": 0.4236, "lr": 3.06037930552332e-07, "epoch": 2.6977687626774847, "percentage": 89.93, "elapsed_time": "4:47:31", "remaining_time": "0:32:12"}
|
| 1331 |
+
{"current_steps": 1331, "total_steps": 1479, "loss": 0.4168, "lr": 3.0198554581913343e-07, "epoch": 2.6997971602434077, "percentage": 89.99, "elapsed_time": "4:47:44", "remaining_time": "0:31:59"}
|
| 1332 |
+
{"current_steps": 1332, "total_steps": 1479, "loss": 0.4357, "lr": 2.9795933434364764e-07, "epoch": 2.7018255578093306, "percentage": 90.06, "elapsed_time": "4:47:57", "remaining_time": "0:31:46"}
|
| 1333 |
+
{"current_steps": 1333, "total_steps": 1479, "loss": 0.4065, "lr": 2.9395931855643043e-07, "epoch": 2.7038539553752536, "percentage": 90.13, "elapsed_time": "4:48:10", "remaining_time": "0:31:33"}
|
| 1334 |
+
{"current_steps": 1334, "total_steps": 1479, "loss": 0.4541, "lr": 2.8998552074209485e-07, "epoch": 2.7058823529411766, "percentage": 90.2, "elapsed_time": "4:48:24", "remaining_time": "0:31:20"}
|
| 1335 |
+
{"current_steps": 1335, "total_steps": 1479, "loss": 0.4265, "lr": 2.860379630391935e-07, "epoch": 2.707910750507099, "percentage": 90.26, "elapsed_time": "4:48:37", "remaining_time": "0:31:07"}
|
| 1336 |
+
{"current_steps": 1336, "total_steps": 1479, "loss": 0.4289, "lr": 2.821166674400905e-07, "epoch": 2.709939148073022, "percentage": 90.33, "elapsed_time": "4:48:50", "remaining_time": "0:30:55"}
|
| 1337 |
+
{"current_steps": 1337, "total_steps": 1479, "loss": 0.4289, "lr": 2.7822165579084013e-07, "epoch": 2.711967545638945, "percentage": 90.4, "elapsed_time": "4:49:04", "remaining_time": "0:30:42"}
|
| 1338 |
+
{"current_steps": 1338, "total_steps": 1479, "loss": 0.4149, "lr": 2.7435294979106574e-07, "epoch": 2.713995943204868, "percentage": 90.47, "elapsed_time": "4:49:17", "remaining_time": "0:30:29"}
|
| 1339 |
+
{"current_steps": 1339, "total_steps": 1479, "loss": 0.4269, "lr": 2.705105709938388e-07, "epoch": 2.716024340770791, "percentage": 90.53, "elapsed_time": "4:49:30", "remaining_time": "0:30:16"}
|
| 1340 |
+
{"current_steps": 1340, "total_steps": 1479, "loss": 0.4154, "lr": 2.666945408055571e-07, "epoch": 2.718052738336714, "percentage": 90.6, "elapsed_time": "4:49:43", "remaining_time": "0:30:03"}
|
| 1341 |
+
{"current_steps": 1341, "total_steps": 1479, "loss": 0.4427, "lr": 2.629048804858275e-07, "epoch": 2.720081135902637, "percentage": 90.67, "elapsed_time": "4:49:57", "remaining_time": "0:29:50"}
|
| 1342 |
+
{"current_steps": 1342, "total_steps": 1479, "loss": 0.4293, "lr": 2.5914161114734937e-07, "epoch": 2.7221095334685597, "percentage": 90.74, "elapsed_time": "4:50:10", "remaining_time": "0:29:37"}
|
| 1343 |
+
{"current_steps": 1343, "total_steps": 1479, "loss": 0.4252, "lr": 2.5540475375578967e-07, "epoch": 2.7241379310344827, "percentage": 90.8, "elapsed_time": "4:50:22", "remaining_time": "0:29:24"}
|
| 1344 |
+
{"current_steps": 1344, "total_steps": 1479, "loss": 0.428, "lr": 2.5169432912967527e-07, "epoch": 2.7261663286004056, "percentage": 90.87, "elapsed_time": "4:50:35", "remaining_time": "0:29:11"}
|
| 1345 |
+
{"current_steps": 1345, "total_steps": 1479, "loss": 0.4218, "lr": 2.4801035794026987e-07, "epoch": 2.7281947261663286, "percentage": 90.94, "elapsed_time": "4:50:48", "remaining_time": "0:28:58"}
|
| 1346 |
+
{"current_steps": 1346, "total_steps": 1479, "loss": 0.4449, "lr": 2.4435286071146256e-07, "epoch": 2.7302231237322516, "percentage": 91.01, "elapsed_time": "4:51:01", "remaining_time": "0:28:45"}
|
| 1347 |
+
{"current_steps": 1347, "total_steps": 1479, "loss": 0.4162, "lr": 2.407218578196524e-07, "epoch": 2.732251521298174, "percentage": 91.08, "elapsed_time": "4:51:14", "remaining_time": "0:28:32"}
|
| 1348 |
+
{"current_steps": 1348, "total_steps": 1479, "loss": 0.4381, "lr": 2.3711736949363516e-07, "epoch": 2.7342799188640976, "percentage": 91.14, "elapsed_time": "4:51:27", "remaining_time": "0:28:19"}
|
| 1349 |
+
{"current_steps": 1349, "total_steps": 1479, "loss": 0.4057, "lr": 2.3353941581449048e-07, "epoch": 2.73630831643002, "percentage": 91.21, "elapsed_time": "4:51:40", "remaining_time": "0:28:06"}
|
| 1350 |
+
{"current_steps": 1350, "total_steps": 1479, "loss": 0.4347, "lr": 2.2998801671546945e-07, "epoch": 2.738336713995943, "percentage": 91.28, "elapsed_time": "4:51:52", "remaining_time": "0:27:53"}
|
| 1351 |
+
{"current_steps": 1351, "total_steps": 1479, "loss": 0.4141, "lr": 2.2646319198188495e-07, "epoch": 2.740365111561866, "percentage": 91.35, "elapsed_time": "4:52:05", "remaining_time": "0:27:40"}
|
| 1352 |
+
{"current_steps": 1352, "total_steps": 1479, "loss": 0.4343, "lr": 2.2296496125099987e-07, "epoch": 2.742393509127789, "percentage": 91.41, "elapsed_time": "4:52:18", "remaining_time": "0:27:27"}
|
| 1353 |
+
{"current_steps": 1353, "total_steps": 1479, "loss": 0.427, "lr": 2.1949334401192013e-07, "epoch": 2.744421906693712, "percentage": 91.48, "elapsed_time": "4:52:31", "remaining_time": "0:27:14"}
|
| 1354 |
+
{"current_steps": 1354, "total_steps": 1479, "loss": 0.4103, "lr": 2.160483596054802e-07, "epoch": 2.7464503042596347, "percentage": 91.55, "elapsed_time": "4:52:44", "remaining_time": "0:27:01"}
|
| 1355 |
+
{"current_steps": 1355, "total_steps": 1479, "loss": 0.414, "lr": 2.1263002722414383e-07, "epoch": 2.7484787018255576, "percentage": 91.62, "elapsed_time": "4:52:56", "remaining_time": "0:26:48"}
|
| 1356 |
+
{"current_steps": 1356, "total_steps": 1479, "loss": 0.4107, "lr": 2.0923836591189183e-07, "epoch": 2.7505070993914806, "percentage": 91.68, "elapsed_time": "4:53:09", "remaining_time": "0:26:35"}
|
| 1357 |
+
{"current_steps": 1357, "total_steps": 1479, "loss": 0.4262, "lr": 2.0587339456411503e-07, "epoch": 2.7525354969574036, "percentage": 91.75, "elapsed_time": "4:53:22", "remaining_time": "0:26:22"}
|
| 1358 |
+
{"current_steps": 1358, "total_steps": 1479, "loss": 0.4188, "lr": 2.0253513192751374e-07, "epoch": 2.7545638945233266, "percentage": 91.82, "elapsed_time": "4:53:35", "remaining_time": "0:26:09"}
|
| 1359 |
+
{"current_steps": 1359, "total_steps": 1479, "loss": 0.4207, "lr": 1.9922359659998724e-07, "epoch": 2.7565922920892496, "percentage": 91.89, "elapsed_time": "4:53:47", "remaining_time": "0:25:56"}
|
| 1360 |
+
{"current_steps": 1360, "total_steps": 1479, "loss": 0.4101, "lr": 1.9593880703053681e-07, "epoch": 2.7586206896551726, "percentage": 91.95, "elapsed_time": "4:54:00", "remaining_time": "0:25:43"}
|
| 1361 |
+
{"current_steps": 1361, "total_steps": 1479, "loss": 0.4118, "lr": 1.9268078151915724e-07, "epoch": 2.760649087221095, "percentage": 92.02, "elapsed_time": "4:54:13", "remaining_time": "0:25:30"}
|
| 1362 |
+
{"current_steps": 1362, "total_steps": 1479, "loss": 0.4209, "lr": 1.8944953821673827e-07, "epoch": 2.762677484787018, "percentage": 92.09, "elapsed_time": "4:54:26", "remaining_time": "0:25:17"}
|
| 1363 |
+
{"current_steps": 1363, "total_steps": 1479, "loss": 0.4021, "lr": 1.8624509512496336e-07, "epoch": 2.764705882352941, "percentage": 92.16, "elapsed_time": "4:54:38", "remaining_time": "0:25:04"}
|
| 1364 |
+
{"current_steps": 1364, "total_steps": 1479, "loss": 0.4262, "lr": 1.830674700962054e-07, "epoch": 2.766734279918864, "percentage": 92.22, "elapsed_time": "4:54:51", "remaining_time": "0:24:51"}
|
| 1365 |
+
{"current_steps": 1365, "total_steps": 1479, "loss": 0.417, "lr": 1.799166808334335e-07, "epoch": 2.768762677484787, "percentage": 92.29, "elapsed_time": "4:55:04", "remaining_time": "0:24:38"}
|
| 1366 |
+
{"current_steps": 1366, "total_steps": 1479, "loss": 0.4175, "lr": 1.767927448901091e-07, "epoch": 2.77079107505071, "percentage": 92.36, "elapsed_time": "4:55:17", "remaining_time": "0:24:25"}
|
| 1367 |
+
{"current_steps": 1367, "total_steps": 1479, "loss": 0.4189, "lr": 1.7369567967009226e-07, "epoch": 2.772819472616633, "percentage": 92.43, "elapsed_time": "4:55:30", "remaining_time": "0:24:12"}
|
| 1368 |
+
{"current_steps": 1368, "total_steps": 1479, "loss": 0.446, "lr": 1.7062550242753994e-07, "epoch": 2.7748478701825556, "percentage": 92.49, "elapsed_time": "4:55:42", "remaining_time": "0:23:59"}
|
| 1369 |
+
{"current_steps": 1369, "total_steps": 1479, "loss": 0.4288, "lr": 1.6758223026681507e-07, "epoch": 2.7768762677484786, "percentage": 92.56, "elapsed_time": "4:55:55", "remaining_time": "0:23:46"}
|
| 1370 |
+
{"current_steps": 1370, "total_steps": 1479, "loss": 0.4386, "lr": 1.6456588014238828e-07, "epoch": 2.7789046653144016, "percentage": 92.63, "elapsed_time": "4:56:08", "remaining_time": "0:23:33"}
|
| 1371 |
+
{"current_steps": 1371, "total_steps": 1479, "loss": 0.4215, "lr": 1.615764688587429e-07, "epoch": 2.7809330628803246, "percentage": 92.7, "elapsed_time": "4:56:21", "remaining_time": "0:23:20"}
|
| 1372 |
+
{"current_steps": 1372, "total_steps": 1479, "loss": 0.425, "lr": 1.58614013070284e-07, "epoch": 2.7829614604462476, "percentage": 92.77, "elapsed_time": "4:56:33", "remaining_time": "0:23:07"}
|
| 1373 |
+
{"current_steps": 1373, "total_steps": 1479, "loss": 0.4179, "lr": 1.5567852928124237e-07, "epoch": 2.78498985801217, "percentage": 92.83, "elapsed_time": "4:56:46", "remaining_time": "0:22:54"}
|
| 1374 |
+
{"current_steps": 1374, "total_steps": 1479, "loss": 0.4171, "lr": 1.5277003384558619e-07, "epoch": 2.7870182555780936, "percentage": 92.9, "elapsed_time": "4:56:59", "remaining_time": "0:22:41"}
|
| 1375 |
+
{"current_steps": 1375, "total_steps": 1479, "loss": 0.4294, "lr": 1.4988854296692557e-07, "epoch": 2.789046653144016, "percentage": 92.97, "elapsed_time": "4:57:12", "remaining_time": "0:22:28"}
|
| 1376 |
+
{"current_steps": 1376, "total_steps": 1479, "loss": 0.4351, "lr": 1.4703407269842707e-07, "epoch": 2.791075050709939, "percentage": 93.04, "elapsed_time": "4:57:24", "remaining_time": "0:22:15"}
|
| 1377 |
+
{"current_steps": 1377, "total_steps": 1479, "loss": 0.41, "lr": 1.442066389427199e-07, "epoch": 2.793103448275862, "percentage": 93.1, "elapsed_time": "4:57:37", "remaining_time": "0:22:02"}
|
| 1378 |
+
{"current_steps": 1378, "total_steps": 1479, "loss": 0.4091, "lr": 1.414062574518099e-07, "epoch": 2.795131845841785, "percentage": 93.17, "elapsed_time": "4:57:50", "remaining_time": "0:21:49"}
|
| 1379 |
+
{"current_steps": 1379, "total_steps": 1479, "loss": 0.4213, "lr": 1.386329438269929e-07, "epoch": 2.797160243407708, "percentage": 93.24, "elapsed_time": "4:58:03", "remaining_time": "0:21:36"}
|
| 1380 |
+
{"current_steps": 1380, "total_steps": 1479, "loss": 0.4376, "lr": 1.358867135187636e-07, "epoch": 2.7991886409736306, "percentage": 93.31, "elapsed_time": "4:58:16", "remaining_time": "0:21:23"}
|
| 1381 |
+
{"current_steps": 1381, "total_steps": 1479, "loss": 0.4252, "lr": 1.3316758182673307e-07, "epoch": 2.8012170385395536, "percentage": 93.37, "elapsed_time": "4:58:28", "remaining_time": "0:21:10"}
|
| 1382 |
+
{"current_steps": 1382, "total_steps": 1479, "loss": 0.412, "lr": 1.3047556389954252e-07, "epoch": 2.8032454361054766, "percentage": 93.44, "elapsed_time": "4:58:41", "remaining_time": "0:20:57"}
|
| 1383 |
+
{"current_steps": 1383, "total_steps": 1479, "loss": 0.4287, "lr": 1.2781067473477905e-07, "epoch": 2.8052738336713996, "percentage": 93.51, "elapsed_time": "4:58:54", "remaining_time": "0:20:44"}
|
| 1384 |
+
{"current_steps": 1384, "total_steps": 1479, "loss": 0.4321, "lr": 1.2517292917889057e-07, "epoch": 2.8073022312373226, "percentage": 93.58, "elapsed_time": "4:59:07", "remaining_time": "0:20:31"}
|
| 1385 |
+
{"current_steps": 1385, "total_steps": 1479, "loss": 0.4329, "lr": 1.225623419271055e-07, "epoch": 2.8093306288032456, "percentage": 93.64, "elapsed_time": "4:59:19", "remaining_time": "0:20:18"}
|
| 1386 |
+
{"current_steps": 1386, "total_steps": 1479, "loss": 0.4272, "lr": 1.1997892752334983e-07, "epoch": 2.8113590263691686, "percentage": 93.71, "elapsed_time": "4:59:32", "remaining_time": "0:20:05"}
|
| 1387 |
+
{"current_steps": 1387, "total_steps": 1479, "loss": 0.4253, "lr": 1.1742270036016523e-07, "epoch": 2.813387423935091, "percentage": 93.78, "elapsed_time": "4:59:45", "remaining_time": "0:19:52"}
|
| 1388 |
+
{"current_steps": 1388, "total_steps": 1479, "loss": 0.4155, "lr": 1.1489367467862999e-07, "epoch": 2.815415821501014, "percentage": 93.85, "elapsed_time": "4:59:58", "remaining_time": "0:19:39"}
|
| 1389 |
+
{"current_steps": 1389, "total_steps": 1479, "loss": 0.4127, "lr": 1.1239186456828033e-07, "epoch": 2.817444219066937, "percentage": 93.91, "elapsed_time": "5:00:10", "remaining_time": "0:19:27"}
|
| 1390 |
+
{"current_steps": 1390, "total_steps": 1479, "loss": 0.4161, "lr": 1.0991728396702983e-07, "epoch": 2.81947261663286, "percentage": 93.98, "elapsed_time": "5:00:23", "remaining_time": "0:19:14"}
|
| 1391 |
+
{"current_steps": 1391, "total_steps": 1479, "loss": 0.4036, "lr": 1.0746994666109234e-07, "epoch": 2.821501014198783, "percentage": 94.05, "elapsed_time": "5:00:36", "remaining_time": "0:19:01"}
|
| 1392 |
+
{"current_steps": 1392, "total_steps": 1479, "loss": 0.4094, "lr": 1.0504986628490755e-07, "epoch": 2.8235294117647056, "percentage": 94.12, "elapsed_time": "5:00:49", "remaining_time": "0:18:48"}
|
| 1393 |
+
{"current_steps": 1393, "total_steps": 1479, "loss": 0.4266, "lr": 1.0265705632106216e-07, "epoch": 2.825557809330629, "percentage": 94.19, "elapsed_time": "5:01:01", "remaining_time": "0:18:35"}
|
| 1394 |
+
{"current_steps": 1394, "total_steps": 1479, "loss": 0.4327, "lr": 1.0029153010021497e-07, "epoch": 2.8275862068965516, "percentage": 94.25, "elapsed_time": "5:01:14", "remaining_time": "0:18:22"}
|
| 1395 |
+
{"current_steps": 1395, "total_steps": 1479, "loss": 0.4235, "lr": 9.795330080102527e-08, "epoch": 2.8296146044624746, "percentage": 94.32, "elapsed_time": "5:01:27", "remaining_time": "0:18:09"}
|
| 1396 |
+
{"current_steps": 1396, "total_steps": 1479, "loss": 0.4076, "lr": 9.564238145007621e-08, "epoch": 2.8316430020283976, "percentage": 94.39, "elapsed_time": "5:01:40", "remaining_time": "0:17:56"}
|
| 1397 |
+
{"current_steps": 1397, "total_steps": 1479, "loss": 0.4197, "lr": 9.335878492180373e-08, "epoch": 2.8336713995943206, "percentage": 94.46, "elapsed_time": "5:01:52", "remaining_time": "0:17:43"}
|
| 1398 |
+
{"current_steps": 1398, "total_steps": 1479, "loss": 0.4209, "lr": 9.110252393842556e-08, "epoch": 2.8356997971602436, "percentage": 94.52, "elapsed_time": "5:02:05", "remaining_time": "0:17:30"}
|
| 1399 |
+
{"current_steps": 1399, "total_steps": 1479, "loss": 0.4159, "lr": 8.887361106986848e-08, "epoch": 2.837728194726166, "percentage": 94.59, "elapsed_time": "5:02:18", "remaining_time": "0:17:17"}
|
| 1400 |
+
{"current_steps": 1400, "total_steps": 1479, "loss": 0.4276, "lr": 8.66720587337011e-08, "epoch": 2.839756592292089, "percentage": 94.66, "elapsed_time": "5:02:31", "remaining_time": "0:17:04"}
|
| 1401 |
+
{"current_steps": 1401, "total_steps": 1479, "loss": 0.4296, "lr": 8.44978791950607e-08, "epoch": 2.841784989858012, "percentage": 94.73, "elapsed_time": "5:02:44", "remaining_time": "0:16:51"}
|
| 1402 |
+
{"current_steps": 1402, "total_steps": 1479, "loss": 0.4428, "lr": 8.235108456658814e-08, "epoch": 2.843813387423935, "percentage": 94.79, "elapsed_time": "5:02:56", "remaining_time": "0:16:38"}
|
| 1403 |
+
{"current_steps": 1403, "total_steps": 1479, "loss": 0.423, "lr": 8.023168680835913e-08, "epoch": 2.845841784989858, "percentage": 94.86, "elapsed_time": "5:03:09", "remaining_time": "0:16:25"}
|
| 1404 |
+
{"current_steps": 1404, "total_steps": 1479, "loss": 0.4337, "lr": 7.813969772781815e-08, "epoch": 2.847870182555781, "percentage": 94.93, "elapsed_time": "5:03:22", "remaining_time": "0:16:12"}
|
| 1405 |
+
{"current_steps": 1405, "total_steps": 1479, "loss": 0.4188, "lr": 7.60751289797118e-08, "epoch": 2.849898580121704, "percentage": 95.0, "elapsed_time": "5:03:35", "remaining_time": "0:15:59"}
|
| 1406 |
+
{"current_steps": 1406, "total_steps": 1479, "loss": 0.4268, "lr": 7.403799206602447e-08, "epoch": 2.8519269776876266, "percentage": 95.06, "elapsed_time": "5:03:47", "remaining_time": "0:15:46"}
|
| 1407 |
+
{"current_steps": 1407, "total_steps": 1479, "loss": 0.412, "lr": 7.202829833591496e-08, "epoch": 2.8539553752535496, "percentage": 95.13, "elapsed_time": "5:04:00", "remaining_time": "0:15:33"}
|
| 1408 |
+
{"current_steps": 1408, "total_steps": 1479, "loss": 0.4119, "lr": 7.004605898565164e-08, "epoch": 2.8559837728194726, "percentage": 95.2, "elapsed_time": "5:04:13", "remaining_time": "0:15:20"}
|
| 1409 |
+
{"current_steps": 1409, "total_steps": 1479, "loss": 0.4186, "lr": 6.809128505855189e-08, "epoch": 2.8580121703853956, "percentage": 95.27, "elapsed_time": "5:04:26", "remaining_time": "0:15:07"}
|
| 1410 |
+
{"current_steps": 1410, "total_steps": 1479, "loss": 0.4301, "lr": 6.616398744491826e-08, "epoch": 2.8600405679513186, "percentage": 95.33, "elapsed_time": "5:04:38", "remaining_time": "0:14:54"}
|
| 1411 |
+
{"current_steps": 1411, "total_steps": 1479, "loss": 0.4306, "lr": 6.426417688197961e-08, "epoch": 2.862068965517241, "percentage": 95.4, "elapsed_time": "5:04:51", "remaining_time": "0:14:41"}
|
| 1412 |
+
{"current_steps": 1412, "total_steps": 1479, "loss": 0.4129, "lr": 6.239186395383067e-08, "epoch": 2.8640973630831645, "percentage": 95.47, "elapsed_time": "5:05:04", "remaining_time": "0:14:28"}
|
| 1413 |
+
{"current_steps": 1413, "total_steps": 1479, "loss": 0.4126, "lr": 6.054705909137426e-08, "epoch": 2.866125760649087, "percentage": 95.54, "elapsed_time": "5:05:17", "remaining_time": "0:14:15"}
|
| 1414 |
+
{"current_steps": 1414, "total_steps": 1479, "loss": 0.4377, "lr": 5.872977257226187e-08, "epoch": 2.86815415821501, "percentage": 95.61, "elapsed_time": "5:05:29", "remaining_time": "0:14:02"}
|
| 1415 |
+
{"current_steps": 1415, "total_steps": 1479, "loss": 0.4256, "lr": 5.6940014520834865e-08, "epoch": 2.870182555780933, "percentage": 95.67, "elapsed_time": "5:05:42", "remaining_time": "0:13:49"}
|
| 1416 |
+
{"current_steps": 1416, "total_steps": 1479, "loss": 0.4165, "lr": 5.5177794908071736e-08, "epoch": 2.872210953346856, "percentage": 95.74, "elapsed_time": "5:05:55", "remaining_time": "0:13:36"}
|
| 1417 |
+
{"current_steps": 1417, "total_steps": 1479, "loss": 0.417, "lr": 5.344312355153036e-08, "epoch": 2.874239350912779, "percentage": 95.81, "elapsed_time": "5:06:08", "remaining_time": "0:13:23"}
|
| 1418 |
+
{"current_steps": 1418, "total_steps": 1479, "loss": 0.4265, "lr": 5.173601011529361e-08, "epoch": 2.8762677484787016, "percentage": 95.88, "elapsed_time": "5:06:21", "remaining_time": "0:13:10"}
|
| 1419 |
+
{"current_steps": 1419, "total_steps": 1479, "loss": 0.4266, "lr": 5.005646410991549e-08, "epoch": 2.8782961460446246, "percentage": 95.94, "elapsed_time": "5:06:33", "remaining_time": "0:12:57"}
|
| 1420 |
+
{"current_steps": 1420, "total_steps": 1479, "loss": 0.4217, "lr": 4.840449489236787e-08, "epoch": 2.8803245436105476, "percentage": 96.01, "elapsed_time": "5:06:46", "remaining_time": "0:12:44"}
|
| 1421 |
+
{"current_steps": 1421, "total_steps": 1479, "loss": 0.426, "lr": 4.678011166598884e-08, "epoch": 2.8823529411764706, "percentage": 96.08, "elapsed_time": "5:06:59", "remaining_time": "0:12:31"}
|
| 1422 |
+
{"current_steps": 1422, "total_steps": 1479, "loss": 0.4245, "lr": 4.518332348043219e-08, "epoch": 2.8843813387423936, "percentage": 96.15, "elapsed_time": "5:07:12", "remaining_time": "0:12:18"}
|
| 1423 |
+
{"current_steps": 1423, "total_steps": 1479, "loss": 0.4026, "lr": 4.3614139231614725e-08, "epoch": 2.8864097363083165, "percentage": 96.21, "elapsed_time": "5:07:24", "remaining_time": "0:12:05"}
|
| 1424 |
+
{"current_steps": 1424, "total_steps": 1479, "loss": 0.4195, "lr": 4.207256766166845e-08, "epoch": 2.8884381338742395, "percentage": 96.28, "elapsed_time": "5:07:37", "remaining_time": "0:11:52"}
|
| 1425 |
+
{"current_steps": 1425, "total_steps": 1479, "loss": 0.4182, "lr": 4.0558617358892326e-08, "epoch": 2.890466531440162, "percentage": 96.35, "elapsed_time": "5:07:50", "remaining_time": "0:11:39"}
|
| 1426 |
+
{"current_steps": 1426, "total_steps": 1479, "loss": 0.4327, "lr": 3.9072296757702857e-08, "epoch": 2.892494929006085, "percentage": 96.42, "elapsed_time": "5:08:03", "remaining_time": "0:11:26"}
|
| 1427 |
+
{"current_steps": 1427, "total_steps": 1479, "loss": 0.4171, "lr": 3.7613614138587995e-08, "epoch": 2.894523326572008, "percentage": 96.48, "elapsed_time": "5:08:15", "remaining_time": "0:11:13"}
|
| 1428 |
+
{"current_steps": 1428, "total_steps": 1479, "loss": 0.4238, "lr": 3.61825776280611e-08, "epoch": 2.896551724137931, "percentage": 96.55, "elapsed_time": "5:08:28", "remaining_time": "0:11:01"}
|
| 1429 |
+
{"current_steps": 1429, "total_steps": 1479, "loss": 0.4217, "lr": 3.477919519861428e-08, "epoch": 2.898580121703854, "percentage": 96.62, "elapsed_time": "5:08:41", "remaining_time": "0:10:48"}
|
| 1430 |
+
{"current_steps": 1430, "total_steps": 1479, "loss": 0.4157, "lr": 3.3403474668677326e-08, "epoch": 2.900608519269777, "percentage": 96.69, "elapsed_time": "5:08:54", "remaining_time": "0:10:35"}
|
| 1431 |
+
{"current_steps": 1431, "total_steps": 1479, "loss": 0.4104, "lr": 3.205542370256997e-08, "epoch": 2.9026369168357, "percentage": 96.75, "elapsed_time": "5:09:06", "remaining_time": "0:10:22"}
|
| 1432 |
+
{"current_steps": 1432, "total_steps": 1479, "loss": 0.428, "lr": 3.073504981046138e-08, "epoch": 2.9046653144016226, "percentage": 96.82, "elapsed_time": "5:09:19", "remaining_time": "0:10:09"}
|
| 1433 |
+
{"current_steps": 1433, "total_steps": 1479, "loss": 0.4163, "lr": 2.944236034832959e-08, "epoch": 2.9066937119675456, "percentage": 96.89, "elapsed_time": "5:09:32", "remaining_time": "0:09:56"}
|
| 1434 |
+
{"current_steps": 1434, "total_steps": 1479, "loss": 0.4266, "lr": 2.817736251791714e-08, "epoch": 2.9087221095334685, "percentage": 96.96, "elapsed_time": "5:09:45", "remaining_time": "0:09:43"}
|
| 1435 |
+
{"current_steps": 1435, "total_steps": 1479, "loss": 0.428, "lr": 2.6940063366693303e-08, "epoch": 2.9107505070993915, "percentage": 97.03, "elapsed_time": "5:09:58", "remaining_time": "0:09:30"}
|
| 1436 |
+
{"current_steps": 1436, "total_steps": 1479, "loss": 0.4334, "lr": 2.5730469787815792e-08, "epoch": 2.9127789046653145, "percentage": 97.09, "elapsed_time": "5:10:10", "remaining_time": "0:09:17"}
|
| 1437 |
+
{"current_steps": 1437, "total_steps": 1479, "loss": 0.4259, "lr": 2.4548588520089123e-08, "epoch": 2.914807302231237, "percentage": 97.16, "elapsed_time": "5:10:23", "remaining_time": "0:09:04"}
|
| 1438 |
+
{"current_steps": 1438, "total_steps": 1479, "loss": 0.4196, "lr": 2.339442614792964e-08, "epoch": 2.9168356997971605, "percentage": 97.23, "elapsed_time": "5:10:36", "remaining_time": "0:08:51"}
|
| 1439 |
+
{"current_steps": 1439, "total_steps": 1479, "loss": 0.4268, "lr": 2.2267989101328878e-08, "epoch": 2.918864097363083, "percentage": 97.3, "elapsed_time": "5:10:49", "remaining_time": "0:08:38"}
|
| 1440 |
+
{"current_steps": 1440, "total_steps": 1479, "loss": 0.4173, "lr": 2.1169283655815276e-08, "epoch": 2.920892494929006, "percentage": 97.36, "elapsed_time": "5:11:01", "remaining_time": "0:08:25"}
|
| 1441 |
+
{"current_steps": 1441, "total_steps": 1479, "loss": 0.4306, "lr": 2.0098315932421952e-08, "epoch": 2.922920892494929, "percentage": 97.43, "elapsed_time": "5:11:14", "remaining_time": "0:08:12"}
|
| 1442 |
+
{"current_steps": 1442, "total_steps": 1479, "loss": 0.4109, "lr": 1.9055091897650647e-08, "epoch": 2.924949290060852, "percentage": 97.5, "elapsed_time": "5:11:27", "remaining_time": "0:07:59"}
|
| 1443 |
+
{"current_steps": 1443, "total_steps": 1479, "loss": 0.4313, "lr": 1.803961736344062e-08, "epoch": 2.926977687626775, "percentage": 97.57, "elapsed_time": "5:11:40", "remaining_time": "0:07:46"}
|
| 1444 |
+
{"current_steps": 1444, "total_steps": 1479, "loss": 0.4219, "lr": 1.7051897987134248e-08, "epoch": 2.9290060851926976, "percentage": 97.63, "elapsed_time": "5:11:52", "remaining_time": "0:07:33"}
|
| 1445 |
+
{"current_steps": 1445, "total_steps": 1479, "loss": 0.4216, "lr": 1.6091939271446478e-08, "epoch": 2.9310344827586206, "percentage": 97.7, "elapsed_time": "5:12:05", "remaining_time": "0:07:20"}
|
| 1446 |
+
{"current_steps": 1446, "total_steps": 1479, "loss": 0.418, "lr": 1.51597465644332e-08, "epoch": 2.9330628803245435, "percentage": 97.77, "elapsed_time": "5:12:18", "remaining_time": "0:07:07"}
|
| 1447 |
+
{"current_steps": 1447, "total_steps": 1479, "loss": 0.4159, "lr": 1.4255325059463477e-08, "epoch": 2.9350912778904665, "percentage": 97.84, "elapsed_time": "5:12:31", "remaining_time": "0:06:54"}
|
| 1448 |
+
{"current_steps": 1448, "total_steps": 1479, "loss": 0.4313, "lr": 1.337867979518903e-08, "epoch": 2.9371196754563895, "percentage": 97.9, "elapsed_time": "5:12:43", "remaining_time": "0:06:41"}
|
| 1449 |
+
{"current_steps": 1449, "total_steps": 1479, "loss": 0.4374, "lr": 1.252981565551481e-08, "epoch": 2.9391480730223125, "percentage": 97.97, "elapsed_time": "5:12:56", "remaining_time": "0:06:28"}
|
| 1450 |
+
{"current_steps": 1450, "total_steps": 1479, "loss": 0.4075, "lr": 1.1708737369576229e-08, "epoch": 2.9411764705882355, "percentage": 98.04, "elapsed_time": "5:13:09", "remaining_time": "0:06:15"}
|
| 1451 |
+
{"current_steps": 1451, "total_steps": 1479, "loss": 0.4343, "lr": 1.0915449511708088e-08, "epoch": 2.943204868154158, "percentage": 98.11, "elapsed_time": "5:13:22", "remaining_time": "0:06:02"}
|
| 1452 |
+
{"current_steps": 1452, "total_steps": 1479, "loss": 0.4508, "lr": 1.0149956501421254e-08, "epoch": 2.945233265720081, "percentage": 98.17, "elapsed_time": "5:13:34", "remaining_time": "0:05:49"}
|
| 1453 |
+
{"current_steps": 1453, "total_steps": 1479, "loss": 0.4328, "lr": 9.412262603378797e-09, "epoch": 2.947261663286004, "percentage": 98.24, "elapsed_time": "5:13:47", "remaining_time": "0:05:36"}
|
| 1454 |
+
{"current_steps": 1454, "total_steps": 1479, "loss": 0.3979, "lr": 8.70237192736989e-09, "epoch": 2.949290060851927, "percentage": 98.31, "elapsed_time": "5:14:00", "remaining_time": "0:05:23"}
|
| 1455 |
+
{"current_steps": 1455, "total_steps": 1479, "loss": 0.4287, "lr": 8.020288428289836e-09, "epoch": 2.95131845841785, "percentage": 98.38, "elapsed_time": "5:14:13", "remaining_time": "0:05:10"}
|
| 1456 |
+
{"current_steps": 1456, "total_steps": 1479, "loss": 0.4133, "lr": 7.366015906115076e-09, "epoch": 2.9533468559837726, "percentage": 98.44, "elapsed_time": "5:14:25", "remaining_time": "0:04:58"}
|
| 1457 |
+
{"current_steps": 1457, "total_steps": 1479, "loss": 0.4431, "lr": 6.739558005884883e-09, "epoch": 2.955375253549696, "percentage": 98.51, "elapsed_time": "5:14:38", "remaining_time": "0:04:45"}
|
| 1458 |
+
{"current_steps": 1458, "total_steps": 1479, "loss": 0.4309, "lr": 6.140918217678038e-09, "epoch": 2.9574036511156185, "percentage": 98.58, "elapsed_time": "5:14:51", "remaining_time": "0:04:32"}
|
| 1459 |
+
{"current_steps": 1459, "total_steps": 1479, "loss": 0.4192, "lr": 5.570099876595625e-09, "epoch": 2.9594320486815415, "percentage": 98.65, "elapsed_time": "5:15:04", "remaining_time": "0:04:19"}
|
| 1460 |
+
{"current_steps": 1460, "total_steps": 1479, "loss": 0.4182, "lr": 5.027106162742712e-09, "epoch": 2.9614604462474645, "percentage": 98.72, "elapsed_time": "5:15:16", "remaining_time": "0:04:06"}
|
| 1461 |
+
{"current_steps": 1461, "total_steps": 1479, "loss": 0.4309, "lr": 4.511940101207812e-09, "epoch": 2.9634888438133875, "percentage": 98.78, "elapsed_time": "5:15:29", "remaining_time": "0:03:53"}
|
| 1462 |
+
{"current_steps": 1462, "total_steps": 1479, "loss": 0.4134, "lr": 4.024604562049561e-09, "epoch": 2.9655172413793105, "percentage": 98.85, "elapsed_time": "5:15:42", "remaining_time": "0:03:40"}
|
| 1463 |
+
{"current_steps": 1463, "total_steps": 1479, "loss": 0.4383, "lr": 3.565102260278397e-09, "epoch": 2.967545638945233, "percentage": 98.92, "elapsed_time": "5:15:55", "remaining_time": "0:03:27"}
|
| 1464 |
+
{"current_steps": 1464, "total_steps": 1479, "loss": 0.4357, "lr": 3.133435755842129e-09, "epoch": 2.969574036511156, "percentage": 98.99, "elapsed_time": "5:16:08", "remaining_time": "0:03:14"}
|
| 1465 |
+
{"current_steps": 1465, "total_steps": 1479, "loss": 0.4222, "lr": 2.72960745361206e-09, "epoch": 2.971602434077079, "percentage": 99.05, "elapsed_time": "5:16:20", "remaining_time": "0:03:01"}
|
| 1466 |
+
{"current_steps": 1466, "total_steps": 1479, "loss": 0.4395, "lr": 2.353619603368551e-09, "epoch": 2.973630831643002, "percentage": 99.12, "elapsed_time": "5:16:33", "remaining_time": "0:02:48"}
|
| 1467 |
+
{"current_steps": 1467, "total_steps": 1479, "loss": 0.4198, "lr": 2.0054742997893674e-09, "epoch": 2.975659229208925, "percentage": 99.19, "elapsed_time": "5:16:46", "remaining_time": "0:02:35"}
|
| 1468 |
+
{"current_steps": 1468, "total_steps": 1479, "loss": 0.4238, "lr": 1.6851734824380184e-09, "epoch": 2.977687626774848, "percentage": 99.26, "elapsed_time": "5:16:59", "remaining_time": "0:02:22"}
|
| 1469 |
+
{"current_steps": 1469, "total_steps": 1479, "loss": 0.4338, "lr": 1.392718935752102e-09, "epoch": 2.979716024340771, "percentage": 99.32, "elapsed_time": "5:17:12", "remaining_time": "0:02:09"}
|
| 1470 |
+
{"current_steps": 1470, "total_steps": 1479, "loss": 0.4292, "lr": 1.1281122890355322e-09, "epoch": 2.9817444219066935, "percentage": 99.39, "elapsed_time": "5:17:25", "remaining_time": "0:01:56"}
|
| 1471 |
+
{"current_steps": 1471, "total_steps": 1479, "loss": 0.413, "lr": 8.913550164463269e-10, "epoch": 2.9837728194726165, "percentage": 99.46, "elapsed_time": "5:17:37", "remaining_time": "0:01:43"}
|
| 1472 |
+
{"current_steps": 1472, "total_steps": 1479, "loss": 0.4042, "lr": 6.824484369899464e-10, "epoch": 2.9858012170385395, "percentage": 99.53, "elapsed_time": "5:17:50", "remaining_time": "0:01:30"}
|
| 1473 |
+
{"current_steps": 1473, "total_steps": 1479, "loss": 0.4073, "lr": 5.013937145131875e-10, "epoch": 2.9878296146044625, "percentage": 99.59, "elapsed_time": "5:18:03", "remaining_time": "0:01:17"}
|
| 1474 |
+
{"current_steps": 1474, "total_steps": 1479, "loss": 0.4005, "lr": 3.481918576953014e-10, "epoch": 2.9898580121703855, "percentage": 99.66, "elapsed_time": "5:18:16", "remaining_time": "0:01:04"}
|
| 1475 |
+
{"current_steps": 1475, "total_steps": 1479, "loss": 0.4232, "lr": 2.2284372004410804e-10, "epoch": 2.991886409736308, "percentage": 99.73, "elapsed_time": "5:18:29", "remaining_time": "0:00:51"}
|
| 1476 |
+
{"current_steps": 1476, "total_steps": 1479, "loss": 0.4214, "lr": 1.2534999989044506e-10, "epoch": 2.9939148073022315, "percentage": 99.8, "elapsed_time": "5:18:41", "remaining_time": "0:00:38"}
|
| 1477 |
+
{"current_steps": 1477, "total_steps": 1479, "loss": 0.4295, "lr": 5.5711240385392106e-11, "epoch": 2.995943204868154, "percentage": 99.86, "elapsed_time": "5:18:54", "remaining_time": "0:00:25"}
|
| 1478 |
+
{"current_steps": 1478, "total_steps": 1479, "loss": 0.4385, "lr": 1.3927829494719825e-11, "epoch": 2.997971602434077, "percentage": 99.93, "elapsed_time": "5:19:07", "remaining_time": "0:00:12"}
|
| 1479 |
+
{"current_steps": 1479, "total_steps": 1479, "loss": 0.4267, "lr": 0.0, "epoch": 3.0, "percentage": 100.0, "elapsed_time": "5:19:20", "remaining_time": "0:00:00"}
|
| 1480 |
+
{"current_steps": 1479, "total_steps": 1479, "epoch": 3.0, "percentage": 100.0, "elapsed_time": "5:20:50", "remaining_time": "0:00:00"}
|