Training in progress, epoch 2
Browse files
model-00001-of-00004.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 4877660776
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:c807f0b5f67096c1bc9209cc789f867cb5c174c67e4ea2e3b355fa3b7e8935df
|
| 3 |
size 4877660776
|
model-00002-of-00004.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 4932751008
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:909a64aa460c63e5115befc5fa13e48155b39799d0b9cccbc89491f009320874
|
| 3 |
size 4932751008
|
model-00003-of-00004.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 4330865200
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:7ed83ae7515ae0985eca9ab1594d067d0b4f12dc76c7730bcfb757310e48206c
|
| 3 |
size 4330865200
|
model-00004-of-00004.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 1089994880
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:ec1f7297f2b3aa6ee68791ff320eabd14ccf296ff820bff72df73007e0ad9ed0
|
| 3 |
size 1089994880
|
trainer_log.jsonl
CHANGED
|
@@ -1054,3 +1054,508 @@
|
|
| 1054 |
{"current_steps": 1054, "total_steps": 1560, "loss": 0.2911, "lr": 2.876774210937843e-06, "epoch": 2.0256, "percentage": 67.56, "elapsed_time": "2:32:55", "remaining_time": "1:13:24"}
|
| 1055 |
{"current_steps": 1055, "total_steps": 1560, "loss": 0.2849, "lr": 2.866650361271023e-06, "epoch": 2.02752, "percentage": 67.63, "elapsed_time": "2:33:04", "remaining_time": "1:13:16"}
|
| 1056 |
{"current_steps": 1056, "total_steps": 1560, "loss": 0.3168, "lr": 2.8565371929847286e-06, "epoch": 2.02944, "percentage": 67.69, "elapsed_time": "2:33:12", "remaining_time": "1:13:07"}
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1054 |
{"current_steps": 1054, "total_steps": 1560, "loss": 0.2911, "lr": 2.876774210937843e-06, "epoch": 2.0256, "percentage": 67.56, "elapsed_time": "2:32:55", "remaining_time": "1:13:24"}
|
| 1055 |
{"current_steps": 1055, "total_steps": 1560, "loss": 0.2849, "lr": 2.866650361271023e-06, "epoch": 2.02752, "percentage": 67.63, "elapsed_time": "2:33:04", "remaining_time": "1:13:16"}
|
| 1056 |
{"current_steps": 1056, "total_steps": 1560, "loss": 0.3168, "lr": 2.8565371929847286e-06, "epoch": 2.02944, "percentage": 67.69, "elapsed_time": "2:33:12", "remaining_time": "1:13:07"}
|
| 1057 |
+
{"current_steps": 1057, "total_steps": 1560, "loss": 0.2785, "lr": 2.84643475671417e-06, "epoch": 2.03136, "percentage": 67.76, "elapsed_time": "2:33:21", "remaining_time": "1:12:58"}
|
| 1058 |
+
{"current_steps": 1058, "total_steps": 1560, "loss": 0.3336, "lr": 2.836343103040819e-06, "epoch": 2.03328, "percentage": 67.82, "elapsed_time": "2:33:29", "remaining_time": "1:12:49"}
|
| 1059 |
+
{"current_steps": 1059, "total_steps": 1560, "loss": 0.2702, "lr": 2.8262622824921593e-06, "epoch": 2.0352, "percentage": 67.88, "elapsed_time": "2:33:37", "remaining_time": "1:12:40"}
|
| 1060 |
+
{"current_steps": 1060, "total_steps": 1560, "loss": 0.2651, "lr": 2.816192345541437e-06, "epoch": 2.03712, "percentage": 67.95, "elapsed_time": "2:33:46", "remaining_time": "1:12:31"}
|
| 1061 |
+
{"current_steps": 1061, "total_steps": 1560, "loss": 0.2777, "lr": 2.8061333426074054e-06, "epoch": 2.03904, "percentage": 68.01, "elapsed_time": "2:33:54", "remaining_time": "1:12:23"}
|
| 1062 |
+
{"current_steps": 1062, "total_steps": 1560, "loss": 0.3002, "lr": 2.7960853240540703e-06, "epoch": 2.04096, "percentage": 68.08, "elapsed_time": "2:34:02", "remaining_time": "1:12:14"}
|
| 1063 |
+
{"current_steps": 1063, "total_steps": 1560, "loss": 0.3205, "lr": 2.7860483401904483e-06, "epoch": 2.04288, "percentage": 68.14, "elapsed_time": "2:34:10", "remaining_time": "1:12:05"}
|
| 1064 |
+
{"current_steps": 1064, "total_steps": 1560, "loss": 0.2825, "lr": 2.776022441270295e-06, "epoch": 2.0448, "percentage": 68.21, "elapsed_time": "2:34:19", "remaining_time": "1:11:56"}
|
| 1065 |
+
{"current_steps": 1065, "total_steps": 1560, "loss": 0.27, "lr": 2.766007677491871e-06, "epoch": 2.04672, "percentage": 68.27, "elapsed_time": "2:34:27", "remaining_time": "1:11:47"}
|
| 1066 |
+
{"current_steps": 1066, "total_steps": 1560, "loss": 0.2519, "lr": 2.7560040989976894e-06, "epoch": 2.04864, "percentage": 68.33, "elapsed_time": "2:34:35", "remaining_time": "1:11:38"}
|
| 1067 |
+
{"current_steps": 1067, "total_steps": 1560, "loss": 0.2817, "lr": 2.7460117558742532e-06, "epoch": 2.05056, "percentage": 68.4, "elapsed_time": "2:34:43", "remaining_time": "1:11:29"}
|
| 1068 |
+
{"current_steps": 1068, "total_steps": 1560, "loss": 0.3113, "lr": 2.736030698151815e-06, "epoch": 2.05248, "percentage": 68.46, "elapsed_time": "2:34:52", "remaining_time": "1:11:20"}
|
| 1069 |
+
{"current_steps": 1069, "total_steps": 1560, "loss": 0.3104, "lr": 2.72606097580412e-06, "epoch": 2.0544, "percentage": 68.53, "elapsed_time": "2:35:00", "remaining_time": "1:11:11"}
|
| 1070 |
+
{"current_steps": 1070, "total_steps": 1560, "loss": 0.2682, "lr": 2.7161026387481636e-06, "epoch": 2.05632, "percentage": 68.59, "elapsed_time": "2:35:08", "remaining_time": "1:11:02"}
|
| 1071 |
+
{"current_steps": 1071, "total_steps": 1560, "loss": 0.3398, "lr": 2.7061557368439294e-06, "epoch": 2.05824, "percentage": 68.65, "elapsed_time": "2:35:16", "remaining_time": "1:10:53"}
|
| 1072 |
+
{"current_steps": 1072, "total_steps": 1560, "loss": 0.2547, "lr": 2.6962203198941587e-06, "epoch": 2.06016, "percentage": 68.72, "elapsed_time": "2:35:25", "remaining_time": "1:10:44"}
|
| 1073 |
+
{"current_steps": 1073, "total_steps": 1560, "loss": 0.2593, "lr": 2.686296437644074e-06, "epoch": 2.06208, "percentage": 68.78, "elapsed_time": "2:35:33", "remaining_time": "1:10:36"}
|
| 1074 |
+
{"current_steps": 1074, "total_steps": 1560, "loss": 0.2548, "lr": 2.6763841397811576e-06, "epoch": 2.064, "percentage": 68.85, "elapsed_time": "2:35:41", "remaining_time": "1:10:27"}
|
| 1075 |
+
{"current_steps": 1075, "total_steps": 1560, "loss": 0.2779, "lr": 2.666483475934885e-06, "epoch": 2.06592, "percentage": 68.91, "elapsed_time": "2:35:49", "remaining_time": "1:10:18"}
|
| 1076 |
+
{"current_steps": 1076, "total_steps": 1560, "loss": 0.3047, "lr": 2.656594495676482e-06, "epoch": 2.06784, "percentage": 68.97, "elapsed_time": "2:35:57", "remaining_time": "1:10:09"}
|
| 1077 |
+
{"current_steps": 1077, "total_steps": 1560, "loss": 0.263, "lr": 2.6467172485186775e-06, "epoch": 2.06976, "percentage": 69.04, "elapsed_time": "2:36:06", "remaining_time": "1:10:00"}
|
| 1078 |
+
{"current_steps": 1078, "total_steps": 1560, "loss": 0.2966, "lr": 2.636851783915454e-06, "epoch": 2.07168, "percentage": 69.1, "elapsed_time": "2:36:14", "remaining_time": "1:09:51"}
|
| 1079 |
+
{"current_steps": 1079, "total_steps": 1560, "loss": 0.2769, "lr": 2.626998151261798e-06, "epoch": 2.0736, "percentage": 69.17, "elapsed_time": "2:36:22", "remaining_time": "1:09:42"}
|
| 1080 |
+
{"current_steps": 1080, "total_steps": 1560, "loss": 0.4097, "lr": 2.6171563998934605e-06, "epoch": 2.07552, "percentage": 69.23, "elapsed_time": "2:36:30", "remaining_time": "1:09:33"}
|
| 1081 |
+
{"current_steps": 1081, "total_steps": 1560, "loss": 0.2686, "lr": 2.607326579086701e-06, "epoch": 2.07744, "percentage": 69.29, "elapsed_time": "2:36:38", "remaining_time": "1:09:24"}
|
| 1082 |
+
{"current_steps": 1082, "total_steps": 1560, "loss": 0.2711, "lr": 2.5975087380580445e-06, "epoch": 2.07936, "percentage": 69.36, "elapsed_time": "2:36:47", "remaining_time": "1:09:15"}
|
| 1083 |
+
{"current_steps": 1083, "total_steps": 1560, "loss": 0.3293, "lr": 2.587702925964034e-06, "epoch": 2.08128, "percentage": 69.42, "elapsed_time": "2:36:55", "remaining_time": "1:09:06"}
|
| 1084 |
+
{"current_steps": 1084, "total_steps": 1560, "loss": 0.2487, "lr": 2.577909191900988e-06, "epoch": 2.0832, "percentage": 69.49, "elapsed_time": "2:37:03", "remaining_time": "1:08:58"}
|
| 1085 |
+
{"current_steps": 1085, "total_steps": 1560, "loss": 0.2513, "lr": 2.5681275849047482e-06, "epoch": 2.08512, "percentage": 69.55, "elapsed_time": "2:37:11", "remaining_time": "1:08:49"}
|
| 1086 |
+
{"current_steps": 1086, "total_steps": 1560, "loss": 0.291, "lr": 2.5583581539504464e-06, "epoch": 2.08704, "percentage": 69.62, "elapsed_time": "2:37:20", "remaining_time": "1:08:40"}
|
| 1087 |
+
{"current_steps": 1087, "total_steps": 1560, "loss": 0.311, "lr": 2.5486009479522355e-06, "epoch": 2.08896, "percentage": 69.68, "elapsed_time": "2:37:28", "remaining_time": "1:08:31"}
|
| 1088 |
+
{"current_steps": 1088, "total_steps": 1560, "loss": 0.2578, "lr": 2.5388560157630765e-06, "epoch": 2.09088, "percentage": 69.74, "elapsed_time": "2:37:36", "remaining_time": "1:08:22"}
|
| 1089 |
+
{"current_steps": 1089, "total_steps": 1560, "loss": 0.2865, "lr": 2.5291234061744655e-06, "epoch": 2.0928, "percentage": 69.81, "elapsed_time": "2:37:44", "remaining_time": "1:08:13"}
|
| 1090 |
+
{"current_steps": 1090, "total_steps": 1560, "loss": 0.2577, "lr": 2.519403167916207e-06, "epoch": 2.09472, "percentage": 69.87, "elapsed_time": "2:37:53", "remaining_time": "1:08:04"}
|
| 1091 |
+
{"current_steps": 1091, "total_steps": 1560, "loss": 0.3064, "lr": 2.50969534965616e-06, "epoch": 2.09664, "percentage": 69.94, "elapsed_time": "2:38:01", "remaining_time": "1:07:55"}
|
| 1092 |
+
{"current_steps": 1092, "total_steps": 1560, "loss": 0.3994, "lr": 2.5000000000000015e-06, "epoch": 2.09856, "percentage": 70.0, "elapsed_time": "2:38:09", "remaining_time": "1:07:46"}
|
| 1093 |
+
{"current_steps": 1093, "total_steps": 1560, "loss": 0.3051, "lr": 2.490317167490976e-06, "epoch": 2.10048, "percentage": 70.06, "elapsed_time": "2:38:17", "remaining_time": "1:07:38"}
|
| 1094 |
+
{"current_steps": 1094, "total_steps": 1560, "loss": 0.2609, "lr": 2.480646900609664e-06, "epoch": 2.1024, "percentage": 70.13, "elapsed_time": "2:38:26", "remaining_time": "1:07:29"}
|
| 1095 |
+
{"current_steps": 1095, "total_steps": 1560, "loss": 0.3303, "lr": 2.4709892477737263e-06, "epoch": 2.10432, "percentage": 70.19, "elapsed_time": "2:38:34", "remaining_time": "1:07:20"}
|
| 1096 |
+
{"current_steps": 1096, "total_steps": 1560, "loss": 0.2656, "lr": 2.4613442573376625e-06, "epoch": 2.10624, "percentage": 70.26, "elapsed_time": "2:38:42", "remaining_time": "1:07:11"}
|
| 1097 |
+
{"current_steps": 1097, "total_steps": 1560, "loss": 0.3097, "lr": 2.4517119775925824e-06, "epoch": 2.10816, "percentage": 70.32, "elapsed_time": "2:38:50", "remaining_time": "1:07:02"}
|
| 1098 |
+
{"current_steps": 1098, "total_steps": 1560, "loss": 0.2538, "lr": 2.4420924567659508e-06, "epoch": 2.11008, "percentage": 70.38, "elapsed_time": "2:39:00", "remaining_time": "1:06:54"}
|
| 1099 |
+
{"current_steps": 1099, "total_steps": 1560, "loss": 0.2214, "lr": 2.4324857430213504e-06, "epoch": 2.112, "percentage": 70.45, "elapsed_time": "2:39:09", "remaining_time": "1:06:45"}
|
| 1100 |
+
{"current_steps": 1100, "total_steps": 1560, "loss": 0.3502, "lr": 2.422891884458241e-06, "epoch": 2.11392, "percentage": 70.51, "elapsed_time": "2:39:17", "remaining_time": "1:06:36"}
|
| 1101 |
+
{"current_steps": 1101, "total_steps": 1560, "loss": 0.2679, "lr": 2.4133109291117156e-06, "epoch": 2.11584, "percentage": 70.58, "elapsed_time": "2:39:25", "remaining_time": "1:06:27"}
|
| 1102 |
+
{"current_steps": 1102, "total_steps": 1560, "loss": 0.3096, "lr": 2.4037429249522702e-06, "epoch": 2.11776, "percentage": 70.64, "elapsed_time": "2:39:33", "remaining_time": "1:06:18"}
|
| 1103 |
+
{"current_steps": 1103, "total_steps": 1560, "loss": 0.301, "lr": 2.394187919885548e-06, "epoch": 2.11968, "percentage": 70.71, "elapsed_time": "2:39:41", "remaining_time": "1:06:10"}
|
| 1104 |
+
{"current_steps": 1104, "total_steps": 1560, "loss": 0.3019, "lr": 2.384645961752113e-06, "epoch": 2.1216, "percentage": 70.77, "elapsed_time": "2:39:50", "remaining_time": "1:06:01"}
|
| 1105 |
+
{"current_steps": 1105, "total_steps": 1560, "loss": 0.2944, "lr": 2.3751170983272e-06, "epoch": 2.12352, "percentage": 70.83, "elapsed_time": "2:39:58", "remaining_time": "1:05:52"}
|
| 1106 |
+
{"current_steps": 1106, "total_steps": 1560, "loss": 0.2824, "lr": 2.3656013773204843e-06, "epoch": 2.12544, "percentage": 70.9, "elapsed_time": "2:40:06", "remaining_time": "1:05:43"}
|
| 1107 |
+
{"current_steps": 1107, "total_steps": 1560, "loss": 0.3638, "lr": 2.3560988463758366e-06, "epoch": 2.12736, "percentage": 70.96, "elapsed_time": "2:40:14", "remaining_time": "1:05:34"}
|
| 1108 |
+
{"current_steps": 1108, "total_steps": 1560, "loss": 0.3119, "lr": 2.346609553071093e-06, "epoch": 2.12928, "percentage": 71.03, "elapsed_time": "2:40:22", "remaining_time": "1:05:25"}
|
| 1109 |
+
{"current_steps": 1109, "total_steps": 1560, "loss": 0.255, "lr": 2.3371335449178006e-06, "epoch": 2.1312, "percentage": 71.09, "elapsed_time": "2:40:31", "remaining_time": "1:05:16"}
|
| 1110 |
+
{"current_steps": 1110, "total_steps": 1560, "loss": 0.3121, "lr": 2.3276708693609947e-06, "epoch": 2.13312, "percentage": 71.15, "elapsed_time": "2:40:39", "remaining_time": "1:05:07"}
|
| 1111 |
+
{"current_steps": 1111, "total_steps": 1560, "loss": 0.3135, "lr": 2.3182215737789593e-06, "epoch": 2.13504, "percentage": 71.22, "elapsed_time": "2:40:47", "remaining_time": "1:04:58"}
|
| 1112 |
+
{"current_steps": 1112, "total_steps": 1560, "loss": 0.2823, "lr": 2.308785705482982e-06, "epoch": 2.13696, "percentage": 71.28, "elapsed_time": "2:40:55", "remaining_time": "1:04:50"}
|
| 1113 |
+
{"current_steps": 1113, "total_steps": 1560, "loss": 0.3009, "lr": 2.2993633117171243e-06, "epoch": 2.13888, "percentage": 71.35, "elapsed_time": "2:41:03", "remaining_time": "1:04:41"}
|
| 1114 |
+
{"current_steps": 1114, "total_steps": 1560, "loss": 0.3318, "lr": 2.289954439657981e-06, "epoch": 2.1408, "percentage": 71.41, "elapsed_time": "2:41:12", "remaining_time": "1:04:32"}
|
| 1115 |
+
{"current_steps": 1115, "total_steps": 1560, "loss": 0.2629, "lr": 2.2805591364144446e-06, "epoch": 2.14272, "percentage": 71.47, "elapsed_time": "2:41:20", "remaining_time": "1:04:23"}
|
| 1116 |
+
{"current_steps": 1116, "total_steps": 1560, "loss": 0.3054, "lr": 2.2711774490274767e-06, "epoch": 2.14464, "percentage": 71.54, "elapsed_time": "2:41:28", "remaining_time": "1:04:14"}
|
| 1117 |
+
{"current_steps": 1117, "total_steps": 1560, "loss": 0.2922, "lr": 2.2618094244698614e-06, "epoch": 2.14656, "percentage": 71.6, "elapsed_time": "2:41:36", "remaining_time": "1:04:05"}
|
| 1118 |
+
{"current_steps": 1118, "total_steps": 1560, "loss": 0.2313, "lr": 2.2524551096459703e-06, "epoch": 2.14848, "percentage": 71.67, "elapsed_time": "2:41:44", "remaining_time": "1:03:56"}
|
| 1119 |
+
{"current_steps": 1119, "total_steps": 1560, "loss": 0.2797, "lr": 2.243114551391542e-06, "epoch": 2.1504, "percentage": 71.73, "elapsed_time": "2:41:52", "remaining_time": "1:03:47"}
|
| 1120 |
+
{"current_steps": 1120, "total_steps": 1560, "loss": 0.2728, "lr": 2.2337877964734324e-06, "epoch": 2.15232, "percentage": 71.79, "elapsed_time": "2:42:01", "remaining_time": "1:03:38"}
|
| 1121 |
+
{"current_steps": 1121, "total_steps": 1560, "loss": 0.2748, "lr": 2.224474891589386e-06, "epoch": 2.15424, "percentage": 71.86, "elapsed_time": "2:42:09", "remaining_time": "1:03:30"}
|
| 1122 |
+
{"current_steps": 1122, "total_steps": 1560, "loss": 0.2783, "lr": 2.2151758833678044e-06, "epoch": 2.15616, "percentage": 71.92, "elapsed_time": "2:42:17", "remaining_time": "1:03:21"}
|
| 1123 |
+
{"current_steps": 1123, "total_steps": 1560, "loss": 0.3185, "lr": 2.205890818367508e-06, "epoch": 2.15808, "percentage": 71.99, "elapsed_time": "2:42:25", "remaining_time": "1:03:12"}
|
| 1124 |
+
{"current_steps": 1124, "total_steps": 1560, "loss": 0.2804, "lr": 2.1966197430775056e-06, "epoch": 2.16, "percentage": 72.05, "elapsed_time": "2:42:33", "remaining_time": "1:03:03"}
|
| 1125 |
+
{"current_steps": 1125, "total_steps": 1560, "loss": 0.2699, "lr": 2.187362703916766e-06, "epoch": 2.16192, "percentage": 72.12, "elapsed_time": "2:42:41", "remaining_time": "1:02:54"}
|
| 1126 |
+
{"current_steps": 1126, "total_steps": 1560, "loss": 0.2749, "lr": 2.178119747233976e-06, "epoch": 2.16384, "percentage": 72.18, "elapsed_time": "2:42:49", "remaining_time": "1:02:45"}
|
| 1127 |
+
{"current_steps": 1127, "total_steps": 1560, "loss": 0.3258, "lr": 2.168890919307315e-06, "epoch": 2.16576, "percentage": 72.24, "elapsed_time": "2:42:58", "remaining_time": "1:02:36"}
|
| 1128 |
+
{"current_steps": 1128, "total_steps": 1560, "loss": 0.2573, "lr": 2.159676266344222e-06, "epoch": 2.16768, "percentage": 72.31, "elapsed_time": "2:43:06", "remaining_time": "1:02:27"}
|
| 1129 |
+
{"current_steps": 1129, "total_steps": 1560, "loss": 0.308, "lr": 2.1504758344811615e-06, "epoch": 2.1696, "percentage": 72.37, "elapsed_time": "2:43:14", "remaining_time": "1:02:19"}
|
| 1130 |
+
{"current_steps": 1130, "total_steps": 1560, "loss": 0.2809, "lr": 2.141289669783401e-06, "epoch": 2.17152, "percentage": 72.44, "elapsed_time": "2:43:22", "remaining_time": "1:02:10"}
|
| 1131 |
+
{"current_steps": 1131, "total_steps": 1560, "loss": 0.289, "lr": 2.132117818244771e-06, "epoch": 2.17344, "percentage": 72.5, "elapsed_time": "2:43:30", "remaining_time": "1:02:01"}
|
| 1132 |
+
{"current_steps": 1132, "total_steps": 1560, "loss": 0.2888, "lr": 2.122960325787432e-06, "epoch": 2.17536, "percentage": 72.56, "elapsed_time": "2:43:38", "remaining_time": "1:01:52"}
|
| 1133 |
+
{"current_steps": 1133, "total_steps": 1560, "loss": 0.3649, "lr": 2.1138172382616612e-06, "epoch": 2.17728, "percentage": 72.63, "elapsed_time": "2:43:47", "remaining_time": "1:01:43"}
|
| 1134 |
+
{"current_steps": 1134, "total_steps": 1560, "loss": 0.2731, "lr": 2.104688601445606e-06, "epoch": 2.1792, "percentage": 72.69, "elapsed_time": "2:43:55", "remaining_time": "1:01:34"}
|
| 1135 |
+
{"current_steps": 1135, "total_steps": 1560, "loss": 0.2618, "lr": 2.0955744610450616e-06, "epoch": 2.18112, "percentage": 72.76, "elapsed_time": "2:44:03", "remaining_time": "1:01:25"}
|
| 1136 |
+
{"current_steps": 1136, "total_steps": 1560, "loss": 0.3187, "lr": 2.086474862693244e-06, "epoch": 2.18304, "percentage": 72.82, "elapsed_time": "2:44:11", "remaining_time": "1:01:17"}
|
| 1137 |
+
{"current_steps": 1137, "total_steps": 1560, "loss": 0.3175, "lr": 2.077389851950557e-06, "epoch": 2.1849600000000002, "percentage": 72.88, "elapsed_time": "2:44:20", "remaining_time": "1:01:08"}
|
| 1138 |
+
{"current_steps": 1138, "total_steps": 1560, "loss": 0.2749, "lr": 2.068319474304365e-06, "epoch": 2.18688, "percentage": 72.95, "elapsed_time": "2:44:28", "remaining_time": "1:00:59"}
|
| 1139 |
+
{"current_steps": 1139, "total_steps": 1560, "loss": 0.3081, "lr": 2.059263775168773e-06, "epoch": 2.1888, "percentage": 73.01, "elapsed_time": "2:44:36", "remaining_time": "1:00:50"}
|
| 1140 |
+
{"current_steps": 1140, "total_steps": 1560, "loss": 0.2454, "lr": 2.050222799884387e-06, "epoch": 2.19072, "percentage": 73.08, "elapsed_time": "2:44:45", "remaining_time": "1:00:41"}
|
| 1141 |
+
{"current_steps": 1141, "total_steps": 1560, "loss": 0.3034, "lr": 2.0411965937180907e-06, "epoch": 2.19264, "percentage": 73.14, "elapsed_time": "2:44:53", "remaining_time": "1:00:33"}
|
| 1142 |
+
{"current_steps": 1142, "total_steps": 1560, "loss": 0.283, "lr": 2.0321852018628278e-06, "epoch": 2.19456, "percentage": 73.21, "elapsed_time": "2:45:01", "remaining_time": "1:00:24"}
|
| 1143 |
+
{"current_steps": 1143, "total_steps": 1560, "loss": 0.3406, "lr": 2.0231886694373653e-06, "epoch": 2.19648, "percentage": 73.27, "elapsed_time": "2:45:09", "remaining_time": "1:00:15"}
|
| 1144 |
+
{"current_steps": 1144, "total_steps": 1560, "loss": 0.2602, "lr": 2.0142070414860704e-06, "epoch": 2.1984, "percentage": 73.33, "elapsed_time": "2:45:18", "remaining_time": "1:00:06"}
|
| 1145 |
+
{"current_steps": 1145, "total_steps": 1560, "loss": 0.2424, "lr": 2.005240362978686e-06, "epoch": 2.20032, "percentage": 73.4, "elapsed_time": "2:45:26", "remaining_time": "0:59:57"}
|
| 1146 |
+
{"current_steps": 1146, "total_steps": 1560, "loss": 0.2879, "lr": 1.996288678810105e-06, "epoch": 2.20224, "percentage": 73.46, "elapsed_time": "2:45:34", "remaining_time": "0:59:49"}
|
| 1147 |
+
{"current_steps": 1147, "total_steps": 1560, "loss": 0.3131, "lr": 1.98735203380015e-06, "epoch": 2.20416, "percentage": 73.53, "elapsed_time": "2:45:43", "remaining_time": "0:59:40"}
|
| 1148 |
+
{"current_steps": 1148, "total_steps": 1560, "loss": 0.2607, "lr": 1.9784304726933384e-06, "epoch": 2.20608, "percentage": 73.59, "elapsed_time": "2:45:51", "remaining_time": "0:59:31"}
|
| 1149 |
+
{"current_steps": 1149, "total_steps": 1560, "loss": 0.2674, "lr": 1.9695240401586687e-06, "epoch": 2.208, "percentage": 73.65, "elapsed_time": "2:45:59", "remaining_time": "0:59:22"}
|
| 1150 |
+
{"current_steps": 1150, "total_steps": 1560, "loss": 0.2672, "lr": 1.9606327807893905e-06, "epoch": 2.20992, "percentage": 73.72, "elapsed_time": "2:46:07", "remaining_time": "0:59:13"}
|
| 1151 |
+
{"current_steps": 1151, "total_steps": 1560, "loss": 0.4047, "lr": 1.9517567391027853e-06, "epoch": 2.21184, "percentage": 73.78, "elapsed_time": "2:46:16", "remaining_time": "0:59:04"}
|
| 1152 |
+
{"current_steps": 1152, "total_steps": 1560, "loss": 0.275, "lr": 1.942895959539939e-06, "epoch": 2.21376, "percentage": 73.85, "elapsed_time": "2:46:24", "remaining_time": "0:58:56"}
|
| 1153 |
+
{"current_steps": 1153, "total_steps": 1560, "loss": 0.263, "lr": 1.934050486465529e-06, "epoch": 2.21568, "percentage": 73.91, "elapsed_time": "2:46:32", "remaining_time": "0:58:47"}
|
| 1154 |
+
{"current_steps": 1154, "total_steps": 1560, "loss": 0.2913, "lr": 1.9252203641675854e-06, "epoch": 2.2176, "percentage": 73.97, "elapsed_time": "2:46:40", "remaining_time": "0:58:38"}
|
| 1155 |
+
{"current_steps": 1155, "total_steps": 1560, "loss": 0.2891, "lr": 1.9164056368572847e-06, "epoch": 2.21952, "percentage": 74.04, "elapsed_time": "2:46:48", "remaining_time": "0:58:29"}
|
| 1156 |
+
{"current_steps": 1156, "total_steps": 1560, "loss": 0.33, "lr": 1.9076063486687256e-06, "epoch": 2.22144, "percentage": 74.1, "elapsed_time": "2:46:57", "remaining_time": "0:58:20"}
|
| 1157 |
+
{"current_steps": 1157, "total_steps": 1560, "loss": 0.2687, "lr": 1.8988225436587005e-06, "epoch": 2.22336, "percentage": 74.17, "elapsed_time": "2:47:05", "remaining_time": "0:58:11"}
|
| 1158 |
+
{"current_steps": 1158, "total_steps": 1560, "loss": 0.2582, "lr": 1.8900542658064807e-06, "epoch": 2.22528, "percentage": 74.23, "elapsed_time": "2:47:13", "remaining_time": "0:58:03"}
|
| 1159 |
+
{"current_steps": 1159, "total_steps": 1560, "loss": 0.284, "lr": 1.8813015590135963e-06, "epoch": 2.2272, "percentage": 74.29, "elapsed_time": "2:47:21", "remaining_time": "0:57:54"}
|
| 1160 |
+
{"current_steps": 1160, "total_steps": 1560, "loss": 0.2894, "lr": 1.8725644671036125e-06, "epoch": 2.22912, "percentage": 74.36, "elapsed_time": "2:47:29", "remaining_time": "0:57:45"}
|
| 1161 |
+
{"current_steps": 1161, "total_steps": 1560, "loss": 0.3655, "lr": 1.8638430338219199e-06, "epoch": 2.23104, "percentage": 74.42, "elapsed_time": "2:47:38", "remaining_time": "0:57:36"}
|
| 1162 |
+
{"current_steps": 1162, "total_steps": 1560, "loss": 0.316, "lr": 1.8551373028355013e-06, "epoch": 2.23296, "percentage": 74.49, "elapsed_time": "2:47:46", "remaining_time": "0:57:27"}
|
| 1163 |
+
{"current_steps": 1163, "total_steps": 1560, "loss": 0.3216, "lr": 1.846447317732723e-06, "epoch": 2.23488, "percentage": 74.55, "elapsed_time": "2:47:54", "remaining_time": "0:57:18"}
|
| 1164 |
+
{"current_steps": 1164, "total_steps": 1560, "loss": 0.2345, "lr": 1.8377731220231144e-06, "epoch": 2.2368, "percentage": 74.62, "elapsed_time": "2:48:02", "remaining_time": "0:57:10"}
|
| 1165 |
+
{"current_steps": 1165, "total_steps": 1560, "loss": 0.3002, "lr": 1.8291147591371482e-06, "epoch": 2.23872, "percentage": 74.68, "elapsed_time": "2:48:10", "remaining_time": "0:57:01"}
|
| 1166 |
+
{"current_steps": 1166, "total_steps": 1560, "loss": 0.2879, "lr": 1.8204722724260266e-06, "epoch": 2.24064, "percentage": 74.74, "elapsed_time": "2:48:18", "remaining_time": "0:56:52"}
|
| 1167 |
+
{"current_steps": 1167, "total_steps": 1560, "loss": 0.2928, "lr": 1.8118457051614591e-06, "epoch": 2.24256, "percentage": 74.81, "elapsed_time": "2:48:27", "remaining_time": "0:56:43"}
|
| 1168 |
+
{"current_steps": 1168, "total_steps": 1560, "loss": 0.2776, "lr": 1.803235100535452e-06, "epoch": 2.24448, "percentage": 74.87, "elapsed_time": "2:48:35", "remaining_time": "0:56:34"}
|
| 1169 |
+
{"current_steps": 1169, "total_steps": 1560, "loss": 0.3407, "lr": 1.7946405016600843e-06, "epoch": 2.2464, "percentage": 74.94, "elapsed_time": "2:48:43", "remaining_time": "0:56:26"}
|
| 1170 |
+
{"current_steps": 1170, "total_steps": 1560, "loss": 0.2727, "lr": 1.7860619515673034e-06, "epoch": 2.24832, "percentage": 75.0, "elapsed_time": "2:48:51", "remaining_time": "0:56:17"}
|
| 1171 |
+
{"current_steps": 1171, "total_steps": 1560, "loss": 0.2804, "lr": 1.7774994932086976e-06, "epoch": 2.25024, "percentage": 75.06, "elapsed_time": "2:48:59", "remaining_time": "0:56:08"}
|
| 1172 |
+
{"current_steps": 1172, "total_steps": 1560, "loss": 0.2944, "lr": 1.7689531694552863e-06, "epoch": 2.25216, "percentage": 75.13, "elapsed_time": "2:49:08", "remaining_time": "0:55:59"}
|
| 1173 |
+
{"current_steps": 1173, "total_steps": 1560, "loss": 0.306, "lr": 1.7604230230973068e-06, "epoch": 2.25408, "percentage": 75.19, "elapsed_time": "2:49:16", "remaining_time": "0:55:50"}
|
| 1174 |
+
{"current_steps": 1174, "total_steps": 1560, "loss": 0.2572, "lr": 1.7519090968439966e-06, "epoch": 2.2560000000000002, "percentage": 75.26, "elapsed_time": "2:49:24", "remaining_time": "0:55:41"}
|
| 1175 |
+
{"current_steps": 1175, "total_steps": 1560, "loss": 0.3028, "lr": 1.7434114333233853e-06, "epoch": 2.25792, "percentage": 75.32, "elapsed_time": "2:49:32", "remaining_time": "0:55:33"}
|
| 1176 |
+
{"current_steps": 1176, "total_steps": 1560, "loss": 0.2762, "lr": 1.7349300750820758e-06, "epoch": 2.25984, "percentage": 75.38, "elapsed_time": "2:49:40", "remaining_time": "0:55:24"}
|
| 1177 |
+
{"current_steps": 1177, "total_steps": 1560, "loss": 0.2836, "lr": 1.7264650645850256e-06, "epoch": 2.2617599999999998, "percentage": 75.45, "elapsed_time": "2:49:48", "remaining_time": "0:55:15"}
|
| 1178 |
+
{"current_steps": 1178, "total_steps": 1560, "loss": 0.2297, "lr": 1.7180164442153529e-06, "epoch": 2.26368, "percentage": 75.51, "elapsed_time": "2:49:57", "remaining_time": "0:55:06"}
|
| 1179 |
+
{"current_steps": 1179, "total_steps": 1560, "loss": 0.3069, "lr": 1.709584256274106e-06, "epoch": 2.2656, "percentage": 75.58, "elapsed_time": "2:50:05", "remaining_time": "0:54:57"}
|
| 1180 |
+
{"current_steps": 1180, "total_steps": 1560, "loss": 0.3167, "lr": 1.7011685429800596e-06, "epoch": 2.26752, "percentage": 75.64, "elapsed_time": "2:50:13", "remaining_time": "0:54:49"}
|
| 1181 |
+
{"current_steps": 1181, "total_steps": 1560, "loss": 0.2595, "lr": 1.6927693464695022e-06, "epoch": 2.26944, "percentage": 75.71, "elapsed_time": "2:50:21", "remaining_time": "0:54:40"}
|
| 1182 |
+
{"current_steps": 1182, "total_steps": 1560, "loss": 0.3076, "lr": 1.6843867087960252e-06, "epoch": 2.27136, "percentage": 75.77, "elapsed_time": "2:50:29", "remaining_time": "0:54:31"}
|
| 1183 |
+
{"current_steps": 1183, "total_steps": 1560, "loss": 0.2961, "lr": 1.6760206719303107e-06, "epoch": 2.27328, "percentage": 75.83, "elapsed_time": "2:50:38", "remaining_time": "0:54:22"}
|
| 1184 |
+
{"current_steps": 1184, "total_steps": 1560, "loss": 0.2758, "lr": 1.6676712777599275e-06, "epoch": 2.2752, "percentage": 75.9, "elapsed_time": "2:50:46", "remaining_time": "0:54:13"}
|
| 1185 |
+
{"current_steps": 1185, "total_steps": 1560, "loss": 0.3264, "lr": 1.6593385680891139e-06, "epoch": 2.27712, "percentage": 75.96, "elapsed_time": "2:50:54", "remaining_time": "0:54:05"}
|
| 1186 |
+
{"current_steps": 1186, "total_steps": 1560, "loss": 0.2672, "lr": 1.6510225846385668e-06, "epoch": 2.27904, "percentage": 76.03, "elapsed_time": "2:51:02", "remaining_time": "0:53:56"}
|
| 1187 |
+
{"current_steps": 1187, "total_steps": 1560, "loss": 0.2934, "lr": 1.6427233690452455e-06, "epoch": 2.28096, "percentage": 76.09, "elapsed_time": "2:51:10", "remaining_time": "0:53:47"}
|
| 1188 |
+
{"current_steps": 1188, "total_steps": 1560, "loss": 0.2354, "lr": 1.6344409628621482e-06, "epoch": 2.28288, "percentage": 76.15, "elapsed_time": "2:51:18", "remaining_time": "0:53:38"}
|
| 1189 |
+
{"current_steps": 1189, "total_steps": 1560, "loss": 0.2571, "lr": 1.6261754075581187e-06, "epoch": 2.2848, "percentage": 76.22, "elapsed_time": "2:51:27", "remaining_time": "0:53:29"}
|
| 1190 |
+
{"current_steps": 1190, "total_steps": 1560, "loss": 0.2754, "lr": 1.6179267445176206e-06, "epoch": 2.28672, "percentage": 76.28, "elapsed_time": "2:51:35", "remaining_time": "0:53:21"}
|
| 1191 |
+
{"current_steps": 1191, "total_steps": 1560, "loss": 0.2847, "lr": 1.6096950150405454e-06, "epoch": 2.28864, "percentage": 76.35, "elapsed_time": "2:51:43", "remaining_time": "0:53:12"}
|
| 1192 |
+
{"current_steps": 1192, "total_steps": 1560, "loss": 0.2203, "lr": 1.6014802603420044e-06, "epoch": 2.29056, "percentage": 76.41, "elapsed_time": "2:51:51", "remaining_time": "0:53:03"}
|
| 1193 |
+
{"current_steps": 1193, "total_steps": 1560, "loss": 0.2612, "lr": 1.593282521552113e-06, "epoch": 2.29248, "percentage": 76.47, "elapsed_time": "2:51:59", "remaining_time": "0:52:54"}
|
| 1194 |
+
{"current_steps": 1194, "total_steps": 1560, "loss": 0.2722, "lr": 1.5851018397157918e-06, "epoch": 2.2944, "percentage": 76.54, "elapsed_time": "2:52:07", "remaining_time": "0:52:45"}
|
| 1195 |
+
{"current_steps": 1195, "total_steps": 1560, "loss": 0.2623, "lr": 1.5769382557925612e-06, "epoch": 2.29632, "percentage": 76.6, "elapsed_time": "2:52:16", "remaining_time": "0:52:37"}
|
| 1196 |
+
{"current_steps": 1196, "total_steps": 1560, "loss": 0.2762, "lr": 1.5687918106563326e-06, "epoch": 2.29824, "percentage": 76.67, "elapsed_time": "2:52:24", "remaining_time": "0:52:28"}
|
| 1197 |
+
{"current_steps": 1197, "total_steps": 1560, "loss": 0.3863, "lr": 1.5606625450952062e-06, "epoch": 2.30016, "percentage": 76.73, "elapsed_time": "2:52:32", "remaining_time": "0:52:19"}
|
| 1198 |
+
{"current_steps": 1198, "total_steps": 1560, "loss": 0.2837, "lr": 1.5525504998112717e-06, "epoch": 2.30208, "percentage": 76.79, "elapsed_time": "2:52:40", "remaining_time": "0:52:10"}
|
| 1199 |
+
{"current_steps": 1199, "total_steps": 1560, "loss": 0.271, "lr": 1.5444557154203892e-06, "epoch": 2.304, "percentage": 76.86, "elapsed_time": "2:52:48", "remaining_time": "0:52:01"}
|
| 1200 |
+
{"current_steps": 1200, "total_steps": 1560, "loss": 0.3548, "lr": 1.5363782324520033e-06, "epoch": 2.30592, "percentage": 76.92, "elapsed_time": "2:52:57", "remaining_time": "0:51:53"}
|
| 1201 |
+
{"current_steps": 1201, "total_steps": 1560, "loss": 0.2822, "lr": 1.5283180913489326e-06, "epoch": 2.30784, "percentage": 76.99, "elapsed_time": "2:53:05", "remaining_time": "0:51:44"}
|
| 1202 |
+
{"current_steps": 1202, "total_steps": 1560, "loss": 0.275, "lr": 1.520275332467166e-06, "epoch": 2.30976, "percentage": 77.05, "elapsed_time": "2:53:13", "remaining_time": "0:51:35"}
|
| 1203 |
+
{"current_steps": 1203, "total_steps": 1560, "loss": 0.2794, "lr": 1.5122499960756604e-06, "epoch": 2.31168, "percentage": 77.12, "elapsed_time": "2:53:21", "remaining_time": "0:51:26"}
|
| 1204 |
+
{"current_steps": 1204, "total_steps": 1560, "loss": 0.3468, "lr": 1.504242122356143e-06, "epoch": 2.3136, "percentage": 77.18, "elapsed_time": "2:53:29", "remaining_time": "0:51:18"}
|
| 1205 |
+
{"current_steps": 1205, "total_steps": 1560, "loss": 0.4115, "lr": 1.4962517514029069e-06, "epoch": 2.3155200000000002, "percentage": 77.24, "elapsed_time": "2:53:38", "remaining_time": "0:51:09"}
|
| 1206 |
+
{"current_steps": 1206, "total_steps": 1560, "loss": 0.3043, "lr": 1.4882789232226124e-06, "epoch": 2.31744, "percentage": 77.31, "elapsed_time": "2:53:46", "remaining_time": "0:51:00"}
|
| 1207 |
+
{"current_steps": 1207, "total_steps": 1560, "loss": 0.282, "lr": 1.4803236777340856e-06, "epoch": 2.31936, "percentage": 77.37, "elapsed_time": "2:53:54", "remaining_time": "0:50:51"}
|
| 1208 |
+
{"current_steps": 1208, "total_steps": 1560, "loss": 0.3147, "lr": 1.4723860547681163e-06, "epoch": 2.32128, "percentage": 77.44, "elapsed_time": "2:54:02", "remaining_time": "0:50:42"}
|
| 1209 |
+
{"current_steps": 1209, "total_steps": 1560, "loss": 0.2561, "lr": 1.4644660940672628e-06, "epoch": 2.3232, "percentage": 77.5, "elapsed_time": "2:54:10", "remaining_time": "0:50:34"}
|
| 1210 |
+
{"current_steps": 1210, "total_steps": 1560, "loss": 0.2906, "lr": 1.4565638352856504e-06, "epoch": 2.32512, "percentage": 77.56, "elapsed_time": "2:54:19", "remaining_time": "0:50:25"}
|
| 1211 |
+
{"current_steps": 1211, "total_steps": 1560, "loss": 0.2662, "lr": 1.4486793179887738e-06, "epoch": 2.32704, "percentage": 77.63, "elapsed_time": "2:54:27", "remaining_time": "0:50:16"}
|
| 1212 |
+
{"current_steps": 1212, "total_steps": 1560, "loss": 0.3095, "lr": 1.4408125816532981e-06, "epoch": 2.32896, "percentage": 77.69, "elapsed_time": "2:54:36", "remaining_time": "0:50:07"}
|
| 1213 |
+
{"current_steps": 1213, "total_steps": 1560, "loss": 0.2799, "lr": 1.4329636656668617e-06, "epoch": 2.33088, "percentage": 77.76, "elapsed_time": "2:54:44", "remaining_time": "0:49:59"}
|
| 1214 |
+
{"current_steps": 1214, "total_steps": 1560, "loss": 0.3195, "lr": 1.4251326093278773e-06, "epoch": 2.3327999999999998, "percentage": 77.82, "elapsed_time": "2:54:53", "remaining_time": "0:49:50"}
|
| 1215 |
+
{"current_steps": 1215, "total_steps": 1560, "loss": 0.3173, "lr": 1.4173194518453415e-06, "epoch": 2.33472, "percentage": 77.88, "elapsed_time": "2:55:01", "remaining_time": "0:49:42"}
|
| 1216 |
+
{"current_steps": 1216, "total_steps": 1560, "loss": 0.2497, "lr": 1.4095242323386305e-06, "epoch": 2.33664, "percentage": 77.95, "elapsed_time": "2:55:10", "remaining_time": "0:49:33"}
|
| 1217 |
+
{"current_steps": 1217, "total_steps": 1560, "loss": 0.2535, "lr": 1.4017469898373077e-06, "epoch": 2.33856, "percentage": 78.01, "elapsed_time": "2:55:19", "remaining_time": "0:49:24"}
|
| 1218 |
+
{"current_steps": 1218, "total_steps": 1560, "loss": 0.2698, "lr": 1.3939877632809279e-06, "epoch": 2.34048, "percentage": 78.08, "elapsed_time": "2:55:27", "remaining_time": "0:49:16"}
|
| 1219 |
+
{"current_steps": 1219, "total_steps": 1560, "loss": 0.312, "lr": 1.3862465915188427e-06, "epoch": 2.3424, "percentage": 78.14, "elapsed_time": "2:55:36", "remaining_time": "0:49:07"}
|
| 1220 |
+
{"current_steps": 1220, "total_steps": 1560, "loss": 0.2763, "lr": 1.3785235133100088e-06, "epoch": 2.34432, "percentage": 78.21, "elapsed_time": "2:55:44", "remaining_time": "0:48:58"}
|
| 1221 |
+
{"current_steps": 1221, "total_steps": 1560, "loss": 0.2413, "lr": 1.3708185673227896e-06, "epoch": 2.34624, "percentage": 78.27, "elapsed_time": "2:55:53", "remaining_time": "0:48:50"}
|
| 1222 |
+
{"current_steps": 1222, "total_steps": 1560, "loss": 0.2995, "lr": 1.3631317921347564e-06, "epoch": 2.34816, "percentage": 78.33, "elapsed_time": "2:56:02", "remaining_time": "0:48:41"}
|
| 1223 |
+
{"current_steps": 1223, "total_steps": 1560, "loss": 0.2836, "lr": 1.3554632262325129e-06, "epoch": 2.35008, "percentage": 78.4, "elapsed_time": "2:56:10", "remaining_time": "0:48:32"}
|
| 1224 |
+
{"current_steps": 1224, "total_steps": 1560, "loss": 0.2801, "lr": 1.347812908011485e-06, "epoch": 2.352, "percentage": 78.46, "elapsed_time": "2:56:19", "remaining_time": "0:48:24"}
|
| 1225 |
+
{"current_steps": 1225, "total_steps": 1560, "loss": 0.2558, "lr": 1.340180875775735e-06, "epoch": 2.35392, "percentage": 78.53, "elapsed_time": "2:56:28", "remaining_time": "0:48:15"}
|
| 1226 |
+
{"current_steps": 1226, "total_steps": 1560, "loss": 0.2635, "lr": 1.3325671677377727e-06, "epoch": 2.35584, "percentage": 78.59, "elapsed_time": "2:56:36", "remaining_time": "0:48:06"}
|
| 1227 |
+
{"current_steps": 1227, "total_steps": 1560, "loss": 0.3403, "lr": 1.3249718220183583e-06, "epoch": 2.35776, "percentage": 78.65, "elapsed_time": "2:56:44", "remaining_time": "0:47:58"}
|
| 1228 |
+
{"current_steps": 1228, "total_steps": 1560, "loss": 0.2354, "lr": 1.3173948766463146e-06, "epoch": 2.35968, "percentage": 78.72, "elapsed_time": "2:56:53", "remaining_time": "0:47:49"}
|
| 1229 |
+
{"current_steps": 1229, "total_steps": 1560, "loss": 0.2497, "lr": 1.309836369558341e-06, "epoch": 2.3616, "percentage": 78.78, "elapsed_time": "2:57:01", "remaining_time": "0:47:40"}
|
| 1230 |
+
{"current_steps": 1230, "total_steps": 1560, "loss": 0.3405, "lr": 1.3022963385988153e-06, "epoch": 2.36352, "percentage": 78.85, "elapsed_time": "2:57:10", "remaining_time": "0:47:31"}
|
| 1231 |
+
{"current_steps": 1231, "total_steps": 1560, "loss": 0.2827, "lr": 1.2947748215196038e-06, "epoch": 2.36544, "percentage": 78.91, "elapsed_time": "2:57:18", "remaining_time": "0:47:23"}
|
| 1232 |
+
{"current_steps": 1232, "total_steps": 1560, "loss": 0.3192, "lr": 1.2872718559798852e-06, "epoch": 2.36736, "percentage": 78.97, "elapsed_time": "2:57:26", "remaining_time": "0:47:14"}
|
| 1233 |
+
{"current_steps": 1233, "total_steps": 1560, "loss": 0.2211, "lr": 1.2797874795459464e-06, "epoch": 2.36928, "percentage": 79.04, "elapsed_time": "2:57:35", "remaining_time": "0:47:05"}
|
| 1234 |
+
{"current_steps": 1234, "total_steps": 1560, "loss": 0.2737, "lr": 1.2723217296910078e-06, "epoch": 2.3712, "percentage": 79.1, "elapsed_time": "2:57:43", "remaining_time": "0:46:57"}
|
| 1235 |
+
{"current_steps": 1235, "total_steps": 1560, "loss": 0.2977, "lr": 1.264874643795021e-06, "epoch": 2.37312, "percentage": 79.17, "elapsed_time": "2:57:51", "remaining_time": "0:46:48"}
|
| 1236 |
+
{"current_steps": 1236, "total_steps": 1560, "loss": 0.2462, "lr": 1.257446259144494e-06, "epoch": 2.37504, "percentage": 79.23, "elapsed_time": "2:58:00", "remaining_time": "0:46:39"}
|
| 1237 |
+
{"current_steps": 1237, "total_steps": 1560, "loss": 0.2923, "lr": 1.2500366129323039e-06, "epoch": 2.37696, "percentage": 79.29, "elapsed_time": "2:58:08", "remaining_time": "0:46:30"}
|
| 1238 |
+
{"current_steps": 1238, "total_steps": 1560, "loss": 0.2326, "lr": 1.2426457422575e-06, "epoch": 2.37888, "percentage": 79.36, "elapsed_time": "2:58:16", "remaining_time": "0:46:22"}
|
| 1239 |
+
{"current_steps": 1239, "total_steps": 1560, "loss": 0.308, "lr": 1.2352736841251306e-06, "epoch": 2.3808, "percentage": 79.42, "elapsed_time": "2:58:25", "remaining_time": "0:46:13"}
|
| 1240 |
+
{"current_steps": 1240, "total_steps": 1560, "loss": 0.3104, "lr": 1.2279204754460494e-06, "epoch": 2.38272, "percentage": 79.49, "elapsed_time": "2:58:34", "remaining_time": "0:46:05"}
|
| 1241 |
+
{"current_steps": 1241, "total_steps": 1560, "loss": 0.292, "lr": 1.2205861530367342e-06, "epoch": 2.38464, "percentage": 79.55, "elapsed_time": "2:58:43", "remaining_time": "0:45:56"}
|
| 1242 |
+
{"current_steps": 1242, "total_steps": 1560, "loss": 0.232, "lr": 1.2132707536191008e-06, "epoch": 2.3865600000000002, "percentage": 79.62, "elapsed_time": "2:58:52", "remaining_time": "0:45:47"}
|
| 1243 |
+
{"current_steps": 1243, "total_steps": 1560, "loss": 0.2677, "lr": 1.2059743138203256e-06, "epoch": 2.38848, "percentage": 79.68, "elapsed_time": "2:59:00", "remaining_time": "0:45:39"}
|
| 1244 |
+
{"current_steps": 1244, "total_steps": 1560, "loss": 0.312, "lr": 1.1986968701726492e-06, "epoch": 2.3904, "percentage": 79.74, "elapsed_time": "2:59:09", "remaining_time": "0:45:30"}
|
| 1245 |
+
{"current_steps": 1245, "total_steps": 1560, "loss": 0.3074, "lr": 1.1914384591132045e-06, "epoch": 2.39232, "percentage": 79.81, "elapsed_time": "2:59:18", "remaining_time": "0:45:21"}
|
| 1246 |
+
{"current_steps": 1246, "total_steps": 1560, "loss": 0.291, "lr": 1.184199116983834e-06, "epoch": 2.39424, "percentage": 79.87, "elapsed_time": "2:59:26", "remaining_time": "0:45:13"}
|
| 1247 |
+
{"current_steps": 1247, "total_steps": 1560, "loss": 0.2913, "lr": 1.1769788800309001e-06, "epoch": 2.39616, "percentage": 79.94, "elapsed_time": "2:59:35", "remaining_time": "0:45:04"}
|
| 1248 |
+
{"current_steps": 1248, "total_steps": 1560, "loss": 0.3379, "lr": 1.1697777844051105e-06, "epoch": 2.39808, "percentage": 80.0, "elapsed_time": "2:59:46", "remaining_time": "0:44:56"}
|
| 1249 |
+
{"current_steps": 1249, "total_steps": 1560, "loss": 0.2928, "lr": 1.1625958661613345e-06, "epoch": 2.4, "percentage": 80.06, "elapsed_time": "2:59:55", "remaining_time": "0:44:47"}
|
| 1250 |
+
{"current_steps": 1250, "total_steps": 1560, "loss": 0.3514, "lr": 1.1554331612584218e-06, "epoch": 2.40192, "percentage": 80.13, "elapsed_time": "3:00:03", "remaining_time": "0:44:39"}
|
| 1251 |
+
{"current_steps": 1251, "total_steps": 1560, "loss": 0.2611, "lr": 1.1482897055590275e-06, "epoch": 2.4038399999999998, "percentage": 80.19, "elapsed_time": "3:00:12", "remaining_time": "0:44:30"}
|
| 1252 |
+
{"current_steps": 1252, "total_steps": 1560, "loss": 0.2871, "lr": 1.141165534829425e-06, "epoch": 2.40576, "percentage": 80.26, "elapsed_time": "3:00:20", "remaining_time": "0:44:21"}
|
| 1253 |
+
{"current_steps": 1253, "total_steps": 1560, "loss": 0.2827, "lr": 1.134060684739331e-06, "epoch": 2.40768, "percentage": 80.32, "elapsed_time": "3:00:29", "remaining_time": "0:44:13"}
|
| 1254 |
+
{"current_steps": 1254, "total_steps": 1560, "loss": 0.3143, "lr": 1.1269751908617277e-06, "epoch": 2.4096, "percentage": 80.38, "elapsed_time": "3:00:37", "remaining_time": "0:44:04"}
|
| 1255 |
+
{"current_steps": 1255, "total_steps": 1560, "loss": 0.2936, "lr": 1.119909088672682e-06, "epoch": 2.41152, "percentage": 80.45, "elapsed_time": "3:00:46", "remaining_time": "0:43:55"}
|
| 1256 |
+
{"current_steps": 1256, "total_steps": 1560, "loss": 0.2658, "lr": 1.1128624135511712e-06, "epoch": 2.41344, "percentage": 80.51, "elapsed_time": "3:00:54", "remaining_time": "0:43:47"}
|
| 1257 |
+
{"current_steps": 1257, "total_steps": 1560, "loss": 0.3018, "lr": 1.105835200778902e-06, "epoch": 2.41536, "percentage": 80.58, "elapsed_time": "3:01:02", "remaining_time": "0:43:38"}
|
| 1258 |
+
{"current_steps": 1258, "total_steps": 1560, "loss": 0.2974, "lr": 1.0988274855401377e-06, "epoch": 2.41728, "percentage": 80.64, "elapsed_time": "3:01:11", "remaining_time": "0:43:29"}
|
| 1259 |
+
{"current_steps": 1259, "total_steps": 1560, "loss": 0.2799, "lr": 1.091839302921518e-06, "epoch": 2.4192, "percentage": 80.71, "elapsed_time": "3:01:19", "remaining_time": "0:43:21"}
|
| 1260 |
+
{"current_steps": 1260, "total_steps": 1560, "loss": 0.2926, "lr": 1.0848706879118893e-06, "epoch": 2.42112, "percentage": 80.77, "elapsed_time": "3:01:27", "remaining_time": "0:43:12"}
|
| 1261 |
+
{"current_steps": 1261, "total_steps": 1560, "loss": 0.2738, "lr": 1.0779216754021215e-06, "epoch": 2.42304, "percentage": 80.83, "elapsed_time": "3:01:36", "remaining_time": "0:43:03"}
|
| 1262 |
+
{"current_steps": 1262, "total_steps": 1560, "loss": 0.2623, "lr": 1.070992300184941e-06, "epoch": 2.42496, "percentage": 80.9, "elapsed_time": "3:01:44", "remaining_time": "0:42:54"}
|
| 1263 |
+
{"current_steps": 1263, "total_steps": 1560, "loss": 0.2811, "lr": 1.0640825969547498e-06, "epoch": 2.42688, "percentage": 80.96, "elapsed_time": "3:01:53", "remaining_time": "0:42:46"}
|
| 1264 |
+
{"current_steps": 1264, "total_steps": 1560, "loss": 0.3692, "lr": 1.057192600307456e-06, "epoch": 2.4288, "percentage": 81.03, "elapsed_time": "3:02:01", "remaining_time": "0:42:37"}
|
| 1265 |
+
{"current_steps": 1265, "total_steps": 1560, "loss": 0.247, "lr": 1.0503223447403033e-06, "epoch": 2.43072, "percentage": 81.09, "elapsed_time": "3:02:09", "remaining_time": "0:42:28"}
|
| 1266 |
+
{"current_steps": 1266, "total_steps": 1560, "loss": 0.3301, "lr": 1.0434718646516917e-06, "epoch": 2.43264, "percentage": 81.15, "elapsed_time": "3:02:18", "remaining_time": "0:42:20"}
|
| 1267 |
+
{"current_steps": 1267, "total_steps": 1560, "loss": 0.3254, "lr": 1.0366411943410033e-06, "epoch": 2.43456, "percentage": 81.22, "elapsed_time": "3:02:26", "remaining_time": "0:42:11"}
|
| 1268 |
+
{"current_steps": 1268, "total_steps": 1560, "loss": 0.2392, "lr": 1.0298303680084448e-06, "epoch": 2.43648, "percentage": 81.28, "elapsed_time": "3:02:34", "remaining_time": "0:42:02"}
|
| 1269 |
+
{"current_steps": 1269, "total_steps": 1560, "loss": 0.2541, "lr": 1.0230394197548605e-06, "epoch": 2.4384, "percentage": 81.35, "elapsed_time": "3:02:43", "remaining_time": "0:41:54"}
|
| 1270 |
+
{"current_steps": 1270, "total_steps": 1560, "loss": 0.28, "lr": 1.0162683835815706e-06, "epoch": 2.44032, "percentage": 81.41, "elapsed_time": "3:02:51", "remaining_time": "0:41:45"}
|
| 1271 |
+
{"current_steps": 1271, "total_steps": 1560, "loss": 0.2788, "lr": 1.009517293390197e-06, "epoch": 2.44224, "percentage": 81.47, "elapsed_time": "3:02:59", "remaining_time": "0:41:36"}
|
| 1272 |
+
{"current_steps": 1272, "total_steps": 1560, "loss": 0.2315, "lr": 1.0027861829824953e-06, "epoch": 2.44416, "percentage": 81.54, "elapsed_time": "3:03:08", "remaining_time": "0:41:28"}
|
| 1273 |
+
{"current_steps": 1273, "total_steps": 1560, "loss": 0.3374, "lr": 9.960750860601842e-07, "epoch": 2.44608, "percentage": 81.6, "elapsed_time": "3:03:17", "remaining_time": "0:41:19"}
|
| 1274 |
+
{"current_steps": 1274, "total_steps": 1560, "loss": 0.2754, "lr": 9.893840362247809e-07, "epoch": 2.448, "percentage": 81.67, "elapsed_time": "3:03:26", "remaining_time": "0:41:10"}
|
| 1275 |
+
{"current_steps": 1275, "total_steps": 1560, "loss": 0.2415, "lr": 9.82713066977427e-07, "epoch": 2.44992, "percentage": 81.73, "elapsed_time": "3:03:34", "remaining_time": "0:41:02"}
|
| 1276 |
+
{"current_steps": 1276, "total_steps": 1560, "loss": 0.3354, "lr": 9.760622117187234e-07, "epoch": 2.45184, "percentage": 81.79, "elapsed_time": "3:03:43", "remaining_time": "0:40:53"}
|
| 1277 |
+
{"current_steps": 1277, "total_steps": 1560, "loss": 0.3129, "lr": 9.694315037485635e-07, "epoch": 2.45376, "percentage": 81.86, "elapsed_time": "3:03:52", "remaining_time": "0:40:44"}
|
| 1278 |
+
{"current_steps": 1278, "total_steps": 1560, "loss": 0.2824, "lr": 9.628209762659658e-07, "epoch": 2.45568, "percentage": 81.92, "elapsed_time": "3:04:01", "remaining_time": "0:40:36"}
|
| 1279 |
+
{"current_steps": 1279, "total_steps": 1560, "loss": 0.2411, "lr": 9.562306623689111e-07, "epoch": 2.4576000000000002, "percentage": 81.99, "elapsed_time": "3:04:09", "remaining_time": "0:40:27"}
|
| 1280 |
+
{"current_steps": 1280, "total_steps": 1560, "loss": 0.2719, "lr": 9.496605950541676e-07, "epoch": 2.45952, "percentage": 82.05, "elapsed_time": "3:04:18", "remaining_time": "0:40:18"}
|
| 1281 |
+
{"current_steps": 1281, "total_steps": 1560, "loss": 0.2166, "lr": 9.431108072171346e-07, "epoch": 2.46144, "percentage": 82.12, "elapsed_time": "3:04:26", "remaining_time": "0:40:10"}
|
| 1282 |
+
{"current_steps": 1282, "total_steps": 1560, "loss": 0.2718, "lr": 9.365813316516787e-07, "epoch": 2.4633599999999998, "percentage": 82.18, "elapsed_time": "3:04:34", "remaining_time": "0:40:01"}
|
| 1283 |
+
{"current_steps": 1283, "total_steps": 1560, "loss": 0.2605, "lr": 9.300722010499608e-07, "epoch": 2.46528, "percentage": 82.24, "elapsed_time": "3:04:43", "remaining_time": "0:39:52"}
|
| 1284 |
+
{"current_steps": 1284, "total_steps": 1560, "loss": 0.2125, "lr": 9.235834480022788e-07, "epoch": 2.4672, "percentage": 82.31, "elapsed_time": "3:04:51", "remaining_time": "0:39:44"}
|
| 1285 |
+
{"current_steps": 1285, "total_steps": 1560, "loss": 0.2827, "lr": 9.17115104996903e-07, "epoch": 2.46912, "percentage": 82.37, "elapsed_time": "3:05:00", "remaining_time": "0:39:35"}
|
| 1286 |
+
{"current_steps": 1286, "total_steps": 1560, "loss": 0.2683, "lr": 9.10667204419915e-07, "epoch": 2.47104, "percentage": 82.44, "elapsed_time": "3:05:08", "remaining_time": "0:39:26"}
|
| 1287 |
+
{"current_steps": 1287, "total_steps": 1560, "loss": 0.2793, "lr": 9.042397785550405e-07, "epoch": 2.47296, "percentage": 82.5, "elapsed_time": "3:05:17", "remaining_time": "0:39:18"}
|
| 1288 |
+
{"current_steps": 1288, "total_steps": 1560, "loss": 0.2677, "lr": 8.978328595834984e-07, "epoch": 2.47488, "percentage": 82.56, "elapsed_time": "3:05:25", "remaining_time": "0:39:09"}
|
| 1289 |
+
{"current_steps": 1289, "total_steps": 1560, "loss": 0.2874, "lr": 8.91446479583823e-07, "epoch": 2.4768, "percentage": 82.63, "elapsed_time": "3:05:33", "remaining_time": "0:39:00"}
|
| 1290 |
+
{"current_steps": 1290, "total_steps": 1560, "loss": 0.3385, "lr": 8.850806705317183e-07, "epoch": 2.47872, "percentage": 82.69, "elapsed_time": "3:05:42", "remaining_time": "0:38:52"}
|
| 1291 |
+
{"current_steps": 1291, "total_steps": 1560, "loss": 0.2252, "lr": 8.787354642998936e-07, "epoch": 2.48064, "percentage": 82.76, "elapsed_time": "3:05:50", "remaining_time": "0:38:43"}
|
| 1292 |
+
{"current_steps": 1292, "total_steps": 1560, "loss": 0.2483, "lr": 8.724108926579e-07, "epoch": 2.48256, "percentage": 82.82, "elapsed_time": "3:05:58", "remaining_time": "0:38:34"}
|
| 1293 |
+
{"current_steps": 1293, "total_steps": 1560, "loss": 0.2993, "lr": 8.661069872719746e-07, "epoch": 2.48448, "percentage": 82.88, "elapsed_time": "3:06:06", "remaining_time": "0:38:25"}
|
| 1294 |
+
{"current_steps": 1294, "total_steps": 1560, "loss": 0.303, "lr": 8.598237797048825e-07, "epoch": 2.4864, "percentage": 82.95, "elapsed_time": "3:06:15", "remaining_time": "0:38:17"}
|
| 1295 |
+
{"current_steps": 1295, "total_steps": 1560, "loss": 0.2687, "lr": 8.535613014157556e-07, "epoch": 2.48832, "percentage": 83.01, "elapsed_time": "3:06:23", "remaining_time": "0:38:08"}
|
| 1296 |
+
{"current_steps": 1296, "total_steps": 1560, "loss": 0.3153, "lr": 8.473195837599419e-07, "epoch": 2.49024, "percentage": 83.08, "elapsed_time": "3:06:31", "remaining_time": "0:37:59"}
|
| 1297 |
+
{"current_steps": 1297, "total_steps": 1560, "loss": 0.3159, "lr": 8.410986579888381e-07, "epoch": 2.49216, "percentage": 83.14, "elapsed_time": "3:06:40", "remaining_time": "0:37:51"}
|
| 1298 |
+
{"current_steps": 1298, "total_steps": 1560, "loss": 0.2983, "lr": 8.348985552497424e-07, "epoch": 2.49408, "percentage": 83.21, "elapsed_time": "3:06:48", "remaining_time": "0:37:42"}
|
| 1299 |
+
{"current_steps": 1299, "total_steps": 1560, "loss": 0.6145, "lr": 8.287193065856936e-07, "epoch": 2.496, "percentage": 83.27, "elapsed_time": "3:06:58", "remaining_time": "0:37:34"}
|
| 1300 |
+
{"current_steps": 1300, "total_steps": 1560, "loss": 0.301, "lr": 8.225609429353187e-07, "epoch": 2.49792, "percentage": 83.33, "elapsed_time": "3:07:06", "remaining_time": "0:37:25"}
|
| 1301 |
+
{"current_steps": 1301, "total_steps": 1560, "loss": 0.2985, "lr": 8.164234951326727e-07, "epoch": 2.49984, "percentage": 83.4, "elapsed_time": "3:07:14", "remaining_time": "0:37:16"}
|
| 1302 |
+
{"current_steps": 1302, "total_steps": 1560, "loss": 0.2781, "lr": 8.103069939070945e-07, "epoch": 2.50176, "percentage": 83.46, "elapsed_time": "3:07:23", "remaining_time": "0:37:07"}
|
| 1303 |
+
{"current_steps": 1303, "total_steps": 1560, "loss": 0.3129, "lr": 8.042114698830394e-07, "epoch": 2.50368, "percentage": 83.53, "elapsed_time": "3:07:31", "remaining_time": "0:36:59"}
|
| 1304 |
+
{"current_steps": 1304, "total_steps": 1560, "loss": 0.2879, "lr": 7.981369535799354e-07, "epoch": 2.5056000000000003, "percentage": 83.59, "elapsed_time": "3:07:39", "remaining_time": "0:36:50"}
|
| 1305 |
+
{"current_steps": 1305, "total_steps": 1560, "loss": 0.2931, "lr": 7.920834754120305e-07, "epoch": 2.50752, "percentage": 83.65, "elapsed_time": "3:07:47", "remaining_time": "0:36:41"}
|
| 1306 |
+
{"current_steps": 1306, "total_steps": 1560, "loss": 0.2951, "lr": 7.860510656882342e-07, "epoch": 2.50944, "percentage": 83.72, "elapsed_time": "3:07:56", "remaining_time": "0:36:33"}
|
| 1307 |
+
{"current_steps": 1307, "total_steps": 1560, "loss": 0.2996, "lr": 7.800397546119709e-07, "epoch": 2.51136, "percentage": 83.78, "elapsed_time": "3:08:04", "remaining_time": "0:36:24"}
|
| 1308 |
+
{"current_steps": 1308, "total_steps": 1560, "loss": 0.2703, "lr": 7.740495722810271e-07, "epoch": 2.51328, "percentage": 83.85, "elapsed_time": "3:08:12", "remaining_time": "0:36:15"}
|
| 1309 |
+
{"current_steps": 1309, "total_steps": 1560, "loss": 0.2872, "lr": 7.680805486873977e-07, "epoch": 2.5152, "percentage": 83.91, "elapsed_time": "3:08:21", "remaining_time": "0:36:06"}
|
| 1310 |
+
{"current_steps": 1310, "total_steps": 1560, "loss": 0.2583, "lr": 7.621327137171447e-07, "epoch": 2.5171200000000002, "percentage": 83.97, "elapsed_time": "3:08:29", "remaining_time": "0:35:58"}
|
| 1311 |
+
{"current_steps": 1311, "total_steps": 1560, "loss": 0.2762, "lr": 7.562060971502383e-07, "epoch": 2.51904, "percentage": 84.04, "elapsed_time": "3:08:38", "remaining_time": "0:35:49"}
|
| 1312 |
+
{"current_steps": 1312, "total_steps": 1560, "loss": 0.286, "lr": 7.50300728660407e-07, "epoch": 2.52096, "percentage": 84.1, "elapsed_time": "3:08:46", "remaining_time": "0:35:41"}
|
| 1313 |
+
{"current_steps": 1313, "total_steps": 1560, "loss": 0.3246, "lr": 7.444166378150014e-07, "epoch": 2.52288, "percentage": 84.17, "elapsed_time": "3:08:55", "remaining_time": "0:35:32"}
|
| 1314 |
+
{"current_steps": 1314, "total_steps": 1560, "loss": 0.2946, "lr": 7.385538540748327e-07, "epoch": 2.5248, "percentage": 84.23, "elapsed_time": "3:09:04", "remaining_time": "0:35:23"}
|
| 1315 |
+
{"current_steps": 1315, "total_steps": 1560, "loss": 0.2669, "lr": 7.327124067940311e-07, "epoch": 2.52672, "percentage": 84.29, "elapsed_time": "3:09:12", "remaining_time": "0:35:15"}
|
| 1316 |
+
{"current_steps": 1316, "total_steps": 1560, "loss": 0.2914, "lr": 7.26892325219899e-07, "epoch": 2.52864, "percentage": 84.36, "elapsed_time": "3:09:21", "remaining_time": "0:35:06"}
|
| 1317 |
+
{"current_steps": 1317, "total_steps": 1560, "loss": 0.2699, "lr": 7.210936384927631e-07, "epoch": 2.53056, "percentage": 84.42, "elapsed_time": "3:09:30", "remaining_time": "0:34:57"}
|
| 1318 |
+
{"current_steps": 1318, "total_steps": 1560, "loss": 0.3096, "lr": 7.153163756458287e-07, "epoch": 2.53248, "percentage": 84.49, "elapsed_time": "3:09:38", "remaining_time": "0:34:49"}
|
| 1319 |
+
{"current_steps": 1319, "total_steps": 1560, "loss": 0.3501, "lr": 7.09560565605037e-07, "epoch": 2.5343999999999998, "percentage": 84.55, "elapsed_time": "3:09:47", "remaining_time": "0:34:40"}
|
| 1320 |
+
{"current_steps": 1320, "total_steps": 1560, "loss": 0.2785, "lr": 7.03826237188916e-07, "epoch": 2.53632, "percentage": 84.62, "elapsed_time": "3:09:56", "remaining_time": "0:34:32"}
|
| 1321 |
+
{"current_steps": 1321, "total_steps": 1560, "loss": 0.2399, "lr": 6.981134191084388e-07, "epoch": 2.53824, "percentage": 84.68, "elapsed_time": "3:10:04", "remaining_time": "0:34:23"}
|
| 1322 |
+
{"current_steps": 1322, "total_steps": 1560, "loss": 0.2983, "lr": 6.924221399668785e-07, "epoch": 2.54016, "percentage": 84.74, "elapsed_time": "3:10:13", "remaining_time": "0:34:14"}
|
| 1323 |
+
{"current_steps": 1323, "total_steps": 1560, "loss": 0.2601, "lr": 6.867524282596655e-07, "epoch": 2.54208, "percentage": 84.81, "elapsed_time": "3:10:22", "remaining_time": "0:34:06"}
|
| 1324 |
+
{"current_steps": 1324, "total_steps": 1560, "loss": 0.2602, "lr": 6.811043123742494e-07, "epoch": 2.544, "percentage": 84.87, "elapsed_time": "3:10:30", "remaining_time": "0:33:57"}
|
| 1325 |
+
{"current_steps": 1325, "total_steps": 1560, "loss": 0.2978, "lr": 6.754778205899465e-07, "epoch": 2.5459199999999997, "percentage": 84.94, "elapsed_time": "3:10:39", "remaining_time": "0:33:48"}
|
| 1326 |
+
{"current_steps": 1326, "total_steps": 1560, "loss": 0.324, "lr": 6.698729810778065e-07, "epoch": 2.54784, "percentage": 85.0, "elapsed_time": "3:10:48", "remaining_time": "0:33:40"}
|
| 1327 |
+
{"current_steps": 1327, "total_steps": 1560, "loss": 0.2633, "lr": 6.642898219004723e-07, "epoch": 2.54976, "percentage": 85.06, "elapsed_time": "3:10:57", "remaining_time": "0:33:31"}
|
| 1328 |
+
{"current_steps": 1328, "total_steps": 1560, "loss": 0.2985, "lr": 6.587283710120324e-07, "epoch": 2.55168, "percentage": 85.13, "elapsed_time": "3:11:05", "remaining_time": "0:33:23"}
|
| 1329 |
+
{"current_steps": 1329, "total_steps": 1560, "loss": 0.3101, "lr": 6.531886562578859e-07, "epoch": 2.5536, "percentage": 85.19, "elapsed_time": "3:11:14", "remaining_time": "0:33:14"}
|
| 1330 |
+
{"current_steps": 1330, "total_steps": 1560, "loss": 0.2532, "lr": 6.47670705374604e-07, "epoch": 2.55552, "percentage": 85.26, "elapsed_time": "3:11:23", "remaining_time": "0:33:05"}
|
| 1331 |
+
{"current_steps": 1331, "total_steps": 1560, "loss": 0.3051, "lr": 6.421745459897871e-07, "epoch": 2.55744, "percentage": 85.32, "elapsed_time": "3:11:31", "remaining_time": "0:32:57"}
|
| 1332 |
+
{"current_steps": 1332, "total_steps": 1560, "loss": 0.2968, "lr": 6.367002056219285e-07, "epoch": 2.55936, "percentage": 85.38, "elapsed_time": "3:11:40", "remaining_time": "0:32:48"}
|
| 1333 |
+
{"current_steps": 1333, "total_steps": 1560, "loss": 0.2767, "lr": 6.312477116802807e-07, "epoch": 2.56128, "percentage": 85.45, "elapsed_time": "3:11:49", "remaining_time": "0:32:39"}
|
| 1334 |
+
{"current_steps": 1334, "total_steps": 1560, "loss": 0.2826, "lr": 6.258170914647077e-07, "epoch": 2.5632, "percentage": 85.51, "elapsed_time": "3:11:57", "remaining_time": "0:32:31"}
|
| 1335 |
+
{"current_steps": 1335, "total_steps": 1560, "loss": 0.3224, "lr": 6.204083721655607e-07, "epoch": 2.56512, "percentage": 85.58, "elapsed_time": "3:12:06", "remaining_time": "0:32:22"}
|
| 1336 |
+
{"current_steps": 1336, "total_steps": 1560, "loss": 0.2776, "lr": 6.150215808635334e-07, "epoch": 2.56704, "percentage": 85.64, "elapsed_time": "3:12:14", "remaining_time": "0:32:14"}
|
| 1337 |
+
{"current_steps": 1337, "total_steps": 1560, "loss": 0.2826, "lr": 6.096567445295298e-07, "epoch": 2.56896, "percentage": 85.71, "elapsed_time": "3:12:23", "remaining_time": "0:32:05"}
|
| 1338 |
+
{"current_steps": 1338, "total_steps": 1560, "loss": 0.2232, "lr": 6.043138900245277e-07, "epoch": 2.57088, "percentage": 85.77, "elapsed_time": "3:12:31", "remaining_time": "0:31:56"}
|
| 1339 |
+
{"current_steps": 1339, "total_steps": 1560, "loss": 0.2845, "lr": 5.989930440994451e-07, "epoch": 2.5728, "percentage": 85.83, "elapsed_time": "3:12:40", "remaining_time": "0:31:47"}
|
| 1340 |
+
{"current_steps": 1340, "total_steps": 1560, "loss": 0.2993, "lr": 5.936942333950063e-07, "epoch": 2.57472, "percentage": 85.9, "elapsed_time": "3:12:48", "remaining_time": "0:31:39"}
|
| 1341 |
+
{"current_steps": 1341, "total_steps": 1560, "loss": 0.2803, "lr": 5.884174844416102e-07, "epoch": 2.5766400000000003, "percentage": 85.96, "elapsed_time": "3:12:56", "remaining_time": "0:31:30"}
|
| 1342 |
+
{"current_steps": 1342, "total_steps": 1560, "loss": 0.2458, "lr": 5.831628236591929e-07, "epoch": 2.57856, "percentage": 86.03, "elapsed_time": "3:13:04", "remaining_time": "0:31:21"}
|
| 1343 |
+
{"current_steps": 1343, "total_steps": 1560, "loss": 0.2852, "lr": 5.779302773570994e-07, "epoch": 2.58048, "percentage": 86.09, "elapsed_time": "3:13:13", "remaining_time": "0:31:13"}
|
| 1344 |
+
{"current_steps": 1344, "total_steps": 1560, "loss": 0.3027, "lr": 5.727198717339511e-07, "epoch": 2.5824, "percentage": 86.15, "elapsed_time": "3:13:21", "remaining_time": "0:31:04"}
|
| 1345 |
+
{"current_steps": 1345, "total_steps": 1560, "loss": 0.2425, "lr": 5.675316328775126e-07, "epoch": 2.58432, "percentage": 86.22, "elapsed_time": "3:13:29", "remaining_time": "0:30:55"}
|
| 1346 |
+
{"current_steps": 1346, "total_steps": 1560, "loss": 0.355, "lr": 5.623655867645628e-07, "epoch": 2.58624, "percentage": 86.28, "elapsed_time": "3:13:38", "remaining_time": "0:30:47"}
|
| 1347 |
+
{"current_steps": 1347, "total_steps": 1560, "loss": 0.2744, "lr": 5.572217592607687e-07, "epoch": 2.5881600000000002, "percentage": 86.35, "elapsed_time": "3:13:46", "remaining_time": "0:30:38"}
|
| 1348 |
+
{"current_steps": 1348, "total_steps": 1560, "loss": 0.2609, "lr": 5.521001761205441e-07, "epoch": 2.59008, "percentage": 86.41, "elapsed_time": "3:13:54", "remaining_time": "0:30:29"}
|
| 1349 |
+
{"current_steps": 1349, "total_steps": 1560, "loss": 0.2862, "lr": 5.470008629869367e-07, "epoch": 2.592, "percentage": 86.47, "elapsed_time": "3:14:02", "remaining_time": "0:30:21"}
|
| 1350 |
+
{"current_steps": 1350, "total_steps": 1560, "loss": 0.2896, "lr": 5.41923845391486e-07, "epoch": 2.59392, "percentage": 86.54, "elapsed_time": "3:14:11", "remaining_time": "0:30:12"}
|
| 1351 |
+
{"current_steps": 1351, "total_steps": 1560, "loss": 0.3037, "lr": 5.368691487541027e-07, "epoch": 2.59584, "percentage": 86.6, "elapsed_time": "3:14:19", "remaining_time": "0:30:03"}
|
| 1352 |
+
{"current_steps": 1352, "total_steps": 1560, "loss": 0.2981, "lr": 5.318367983829393e-07, "epoch": 2.59776, "percentage": 86.67, "elapsed_time": "3:14:28", "remaining_time": "0:29:55"}
|
| 1353 |
+
{"current_steps": 1353, "total_steps": 1560, "loss": 0.2787, "lr": 5.268268194742638e-07, "epoch": 2.59968, "percentage": 86.73, "elapsed_time": "3:14:36", "remaining_time": "0:29:46"}
|
| 1354 |
+
{"current_steps": 1354, "total_steps": 1560, "loss": 0.322, "lr": 5.218392371123326e-07, "epoch": 2.6016, "percentage": 86.79, "elapsed_time": "3:14:44", "remaining_time": "0:29:37"}
|
| 1355 |
+
{"current_steps": 1355, "total_steps": 1560, "loss": 0.2344, "lr": 5.168740762692681e-07, "epoch": 2.60352, "percentage": 86.86, "elapsed_time": "3:14:52", "remaining_time": "0:29:29"}
|
| 1356 |
+
{"current_steps": 1356, "total_steps": 1560, "loss": 0.2516, "lr": 5.119313618049309e-07, "epoch": 2.6054399999999998, "percentage": 86.92, "elapsed_time": "3:15:01", "remaining_time": "0:29:20"}
|
| 1357 |
+
{"current_steps": 1357, "total_steps": 1560, "loss": 0.2877, "lr": 5.070111184667908e-07, "epoch": 2.60736, "percentage": 86.99, "elapsed_time": "3:15:09", "remaining_time": "0:29:11"}
|
| 1358 |
+
{"current_steps": 1358, "total_steps": 1560, "loss": 0.2753, "lr": 5.021133708898146e-07, "epoch": 2.60928, "percentage": 87.05, "elapsed_time": "3:15:17", "remaining_time": "0:29:03"}
|
| 1359 |
+
{"current_steps": 1359, "total_steps": 1560, "loss": 0.29, "lr": 4.972381435963331e-07, "epoch": 2.6112, "percentage": 87.12, "elapsed_time": "3:15:26", "remaining_time": "0:28:54"}
|
| 1360 |
+
{"current_steps": 1360, "total_steps": 1560, "loss": 0.3648, "lr": 4.9238546099592e-07, "epoch": 2.61312, "percentage": 87.18, "elapsed_time": "3:15:34", "remaining_time": "0:28:45"}
|
| 1361 |
+
{"current_steps": 1361, "total_steps": 1560, "loss": 0.247, "lr": 4.875553473852735e-07, "epoch": 2.61504, "percentage": 87.24, "elapsed_time": "3:15:43", "remaining_time": "0:28:37"}
|
| 1362 |
+
{"current_steps": 1362, "total_steps": 1560, "loss": 0.2632, "lr": 4.827478269480895e-07, "epoch": 2.6169599999999997, "percentage": 87.31, "elapsed_time": "3:15:51", "remaining_time": "0:28:28"}
|
| 1363 |
+
{"current_steps": 1363, "total_steps": 1560, "loss": 0.325, "lr": 4.779629237549438e-07, "epoch": 2.61888, "percentage": 87.37, "elapsed_time": "3:15:59", "remaining_time": "0:28:19"}
|
| 1364 |
+
{"current_steps": 1364, "total_steps": 1560, "loss": 0.2376, "lr": 4.732006617631729e-07, "epoch": 2.6208, "percentage": 87.44, "elapsed_time": "3:16:08", "remaining_time": "0:28:11"}
|
| 1365 |
+
{"current_steps": 1365, "total_steps": 1560, "loss": 0.2601, "lr": 4.6846106481675035e-07, "epoch": 2.62272, "percentage": 87.5, "elapsed_time": "3:16:16", "remaining_time": "0:28:02"}
|
| 1366 |
+
{"current_steps": 1366, "total_steps": 1560, "loss": 0.3528, "lr": 4.637441566461681e-07, "epoch": 2.62464, "percentage": 87.56, "elapsed_time": "3:16:24", "remaining_time": "0:27:53"}
|
| 1367 |
+
{"current_steps": 1367, "total_steps": 1560, "loss": 0.2692, "lr": 4.590499608683202e-07, "epoch": 2.62656, "percentage": 87.63, "elapsed_time": "3:16:32", "remaining_time": "0:27:44"}
|
| 1368 |
+
{"current_steps": 1368, "total_steps": 1560, "loss": 0.2869, "lr": 4.54378500986381e-07, "epoch": 2.62848, "percentage": 87.69, "elapsed_time": "3:16:41", "remaining_time": "0:27:36"}
|
| 1369 |
+
{"current_steps": 1369, "total_steps": 1560, "loss": 0.3423, "lr": 4.497298003896944e-07, "epoch": 2.6304, "percentage": 87.76, "elapsed_time": "3:16:49", "remaining_time": "0:27:27"}
|
| 1370 |
+
{"current_steps": 1370, "total_steps": 1560, "loss": 0.2561, "lr": 4.451038823536441e-07, "epoch": 2.63232, "percentage": 87.82, "elapsed_time": "3:16:57", "remaining_time": "0:27:18"}
|
| 1371 |
+
{"current_steps": 1371, "total_steps": 1560, "loss": 0.3867, "lr": 4.405007700395497e-07, "epoch": 2.63424, "percentage": 87.88, "elapsed_time": "3:17:05", "remaining_time": "0:27:10"}
|
| 1372 |
+
{"current_steps": 1372, "total_steps": 1560, "loss": 0.2746, "lr": 4.35920486494546e-07, "epoch": 2.63616, "percentage": 87.95, "elapsed_time": "3:17:14", "remaining_time": "0:27:01"}
|
| 1373 |
+
{"current_steps": 1373, "total_steps": 1560, "loss": 0.2777, "lr": 4.313630546514663e-07, "epoch": 2.63808, "percentage": 88.01, "elapsed_time": "3:17:22", "remaining_time": "0:26:52"}
|
| 1374 |
+
{"current_steps": 1374, "total_steps": 1560, "loss": 0.2655, "lr": 4.268284973287273e-07, "epoch": 2.64, "percentage": 88.08, "elapsed_time": "3:17:30", "remaining_time": "0:26:44"}
|
| 1375 |
+
{"current_steps": 1375, "total_steps": 1560, "loss": 0.2681, "lr": 4.223168372302189e-07, "epoch": 2.64192, "percentage": 88.14, "elapsed_time": "3:17:39", "remaining_time": "0:26:35"}
|
| 1376 |
+
{"current_steps": 1376, "total_steps": 1560, "loss": 0.274, "lr": 4.1782809694518533e-07, "epoch": 2.64384, "percentage": 88.21, "elapsed_time": "3:17:47", "remaining_time": "0:26:26"}
|
| 1377 |
+
{"current_steps": 1377, "total_steps": 1560, "loss": 0.3223, "lr": 4.1336229894811454e-07, "epoch": 2.64576, "percentage": 88.27, "elapsed_time": "3:17:55", "remaining_time": "0:26:18"}
|
| 1378 |
+
{"current_steps": 1378, "total_steps": 1560, "loss": 0.2572, "lr": 4.089194655986306e-07, "epoch": 2.6476800000000003, "percentage": 88.33, "elapsed_time": "3:18:04", "remaining_time": "0:26:09"}
|
| 1379 |
+
{"current_steps": 1379, "total_steps": 1560, "loss": 0.3832, "lr": 4.044996191413686e-07, "epoch": 2.6496, "percentage": 88.4, "elapsed_time": "3:18:12", "remaining_time": "0:26:00"}
|
| 1380 |
+
{"current_steps": 1380, "total_steps": 1560, "loss": 0.2897, "lr": 4.001027817058789e-07, "epoch": 2.65152, "percentage": 88.46, "elapsed_time": "3:18:21", "remaining_time": "0:25:52"}
|
| 1381 |
+
{"current_steps": 1381, "total_steps": 1560, "loss": 0.256, "lr": 3.957289753065052e-07, "epoch": 2.65344, "percentage": 88.53, "elapsed_time": "3:18:29", "remaining_time": "0:25:43"}
|
| 1382 |
+
{"current_steps": 1382, "total_steps": 1560, "loss": 0.3415, "lr": 3.9137822184227845e-07, "epoch": 2.65536, "percentage": 88.59, "elapsed_time": "3:18:38", "remaining_time": "0:25:35"}
|
| 1383 |
+
{"current_steps": 1383, "total_steps": 1560, "loss": 0.2727, "lr": 3.870505430968069e-07, "epoch": 2.65728, "percentage": 88.65, "elapsed_time": "3:18:46", "remaining_time": "0:25:26"}
|
| 1384 |
+
{"current_steps": 1384, "total_steps": 1560, "loss": 0.2784, "lr": 3.8274596073816784e-07, "epoch": 2.6592000000000002, "percentage": 88.72, "elapsed_time": "3:18:55", "remaining_time": "0:25:17"}
|
| 1385 |
+
{"current_steps": 1385, "total_steps": 1560, "loss": 0.3175, "lr": 3.7846449631879664e-07, "epoch": 2.66112, "percentage": 88.78, "elapsed_time": "3:19:04", "remaining_time": "0:25:09"}
|
| 1386 |
+
{"current_steps": 1386, "total_steps": 1560, "loss": 0.2732, "lr": 3.742061712753825e-07, "epoch": 2.66304, "percentage": 88.85, "elapsed_time": "3:19:12", "remaining_time": "0:25:00"}
|
| 1387 |
+
{"current_steps": 1387, "total_steps": 1560, "loss": 0.2872, "lr": 3.699710069287571e-07, "epoch": 2.6649599999999998, "percentage": 88.91, "elapsed_time": "3:19:20", "remaining_time": "0:24:51"}
|
| 1388 |
+
{"current_steps": 1388, "total_steps": 1560, "loss": 0.3075, "lr": 3.657590244837911e-07, "epoch": 2.66688, "percentage": 88.97, "elapsed_time": "3:19:29", "remaining_time": "0:24:43"}
|
| 1389 |
+
{"current_steps": 1389, "total_steps": 1560, "loss": 0.3204, "lr": 3.615702450292857e-07, "epoch": 2.6688, "percentage": 89.04, "elapsed_time": "3:19:37", "remaining_time": "0:24:34"}
|
| 1390 |
+
{"current_steps": 1390, "total_steps": 1560, "loss": 0.286, "lr": 3.5740468953786854e-07, "epoch": 2.67072, "percentage": 89.1, "elapsed_time": "3:19:45", "remaining_time": "0:24:25"}
|
| 1391 |
+
{"current_steps": 1391, "total_steps": 1560, "loss": 0.2731, "lr": 3.5326237886588734e-07, "epoch": 2.67264, "percentage": 89.17, "elapsed_time": "3:19:54", "remaining_time": "0:24:17"}
|
| 1392 |
+
{"current_steps": 1392, "total_steps": 1560, "loss": 0.2396, "lr": 3.49143333753309e-07, "epoch": 2.67456, "percentage": 89.23, "elapsed_time": "3:20:02", "remaining_time": "0:24:08"}
|
| 1393 |
+
{"current_steps": 1393, "total_steps": 1560, "loss": 0.2523, "lr": 3.4504757482360817e-07, "epoch": 2.6764799999999997, "percentage": 89.29, "elapsed_time": "3:20:11", "remaining_time": "0:24:00"}
|
| 1394 |
+
{"current_steps": 1394, "total_steps": 1560, "loss": 0.2735, "lr": 3.4097512258367385e-07, "epoch": 2.6784, "percentage": 89.36, "elapsed_time": "3:20:20", "remaining_time": "0:23:51"}
|
| 1395 |
+
{"current_steps": 1395, "total_steps": 1560, "loss": 0.3389, "lr": 3.369259974236988e-07, "epoch": 2.68032, "percentage": 89.42, "elapsed_time": "3:20:29", "remaining_time": "0:23:42"}
|
| 1396 |
+
{"current_steps": 1396, "total_steps": 1560, "loss": 0.2793, "lr": 3.3290021961708163e-07, "epoch": 2.68224, "percentage": 89.49, "elapsed_time": "3:20:38", "remaining_time": "0:23:34"}
|
| 1397 |
+
{"current_steps": 1397, "total_steps": 1560, "loss": 0.2739, "lr": 3.288978093203227e-07, "epoch": 2.68416, "percentage": 89.55, "elapsed_time": "3:20:47", "remaining_time": "0:23:25"}
|
| 1398 |
+
{"current_steps": 1398, "total_steps": 1560, "loss": 0.2666, "lr": 3.2491878657292643e-07, "epoch": 2.68608, "percentage": 89.62, "elapsed_time": "3:21:02", "remaining_time": "0:23:17"}
|
| 1399 |
+
{"current_steps": 1399, "total_steps": 1560, "loss": 0.2458, "lr": 3.209631712972966e-07, "epoch": 2.6879999999999997, "percentage": 89.68, "elapsed_time": "3:21:11", "remaining_time": "0:23:09"}
|
| 1400 |
+
{"current_steps": 1400, "total_steps": 1560, "loss": 0.3603, "lr": 3.1703098329864237e-07, "epoch": 2.68992, "percentage": 89.74, "elapsed_time": "3:21:19", "remaining_time": "0:23:00"}
|
| 1401 |
+
{"current_steps": 1401, "total_steps": 1560, "loss": 0.2672, "lr": 3.131222422648744e-07, "epoch": 2.69184, "percentage": 89.81, "elapsed_time": "3:21:28", "remaining_time": "0:22:51"}
|
| 1402 |
+
{"current_steps": 1402, "total_steps": 1560, "loss": 0.2813, "lr": 3.0923696776650414e-07, "epoch": 2.69376, "percentage": 89.87, "elapsed_time": "3:21:36", "remaining_time": "0:22:43"}
|
| 1403 |
+
{"current_steps": 1403, "total_steps": 1560, "loss": 0.3076, "lr": 3.0537517925655567e-07, "epoch": 2.69568, "percentage": 89.94, "elapsed_time": "3:21:45", "remaining_time": "0:22:34"}
|
| 1404 |
+
{"current_steps": 1404, "total_steps": 1560, "loss": 0.2849, "lr": 3.015368960704584e-07, "epoch": 2.6976, "percentage": 90.0, "elapsed_time": "3:21:53", "remaining_time": "0:22:25"}
|
| 1405 |
+
{"current_steps": 1405, "total_steps": 1560, "loss": 0.2707, "lr": 2.9772213742595367e-07, "epoch": 2.69952, "percentage": 90.06, "elapsed_time": "3:22:01", "remaining_time": "0:22:17"}
|
| 1406 |
+
{"current_steps": 1406, "total_steps": 1560, "loss": 0.2666, "lr": 2.9393092242300026e-07, "epoch": 2.70144, "percentage": 90.13, "elapsed_time": "3:22:10", "remaining_time": "0:22:08"}
|
| 1407 |
+
{"current_steps": 1407, "total_steps": 1560, "loss": 0.222, "lr": 2.901632700436757e-07, "epoch": 2.70336, "percentage": 90.19, "elapsed_time": "3:22:18", "remaining_time": "0:21:59"}
|
| 1408 |
+
{"current_steps": 1408, "total_steps": 1560, "loss": 0.2669, "lr": 2.864191991520848e-07, "epoch": 2.70528, "percentage": 90.26, "elapsed_time": "3:22:27", "remaining_time": "0:21:51"}
|
| 1409 |
+
{"current_steps": 1409, "total_steps": 1560, "loss": 0.2844, "lr": 2.8269872849426114e-07, "epoch": 2.7072000000000003, "percentage": 90.32, "elapsed_time": "3:22:35", "remaining_time": "0:21:42"}
|
| 1410 |
+
{"current_steps": 1410, "total_steps": 1560, "loss": 0.3051, "lr": 2.790018766980773e-07, "epoch": 2.70912, "percentage": 90.38, "elapsed_time": "3:22:43", "remaining_time": "0:21:34"}
|
| 1411 |
+
{"current_steps": 1411, "total_steps": 1560, "loss": 0.3082, "lr": 2.7532866227314714e-07, "epoch": 2.71104, "percentage": 90.45, "elapsed_time": "3:22:52", "remaining_time": "0:21:25"}
|
| 1412 |
+
{"current_steps": 1412, "total_steps": 1560, "loss": 0.2579, "lr": 2.71679103610738e-07, "epoch": 2.71296, "percentage": 90.51, "elapsed_time": "3:23:00", "remaining_time": "0:21:16"}
|
| 1413 |
+
{"current_steps": 1413, "total_steps": 1560, "loss": 0.2742, "lr": 2.6805321898367323e-07, "epoch": 2.71488, "percentage": 90.58, "elapsed_time": "3:23:08", "remaining_time": "0:21:08"}
|
| 1414 |
+
{"current_steps": 1414, "total_steps": 1560, "loss": 0.3105, "lr": 2.64451026546248e-07, "epoch": 2.7168, "percentage": 90.64, "elapsed_time": "3:23:17", "remaining_time": "0:20:59"}
|
| 1415 |
+
{"current_steps": 1415, "total_steps": 1560, "loss": 0.2877, "lr": 2.6087254433412924e-07, "epoch": 2.7187200000000002, "percentage": 90.71, "elapsed_time": "3:23:25", "remaining_time": "0:20:50"}
|
| 1416 |
+
{"current_steps": 1416, "total_steps": 1560, "loss": 0.3247, "lr": 2.573177902642726e-07, "epoch": 2.72064, "percentage": 90.77, "elapsed_time": "3:23:33", "remaining_time": "0:20:42"}
|
| 1417 |
+
{"current_steps": 1417, "total_steps": 1560, "loss": 0.2171, "lr": 2.5378678213483057e-07, "epoch": 2.72256, "percentage": 90.83, "elapsed_time": "3:23:42", "remaining_time": "0:20:33"}
|
| 1418 |
+
{"current_steps": 1418, "total_steps": 1560, "loss": 0.2512, "lr": 2.502795376250622e-07, "epoch": 2.72448, "percentage": 90.9, "elapsed_time": "3:23:50", "remaining_time": "0:20:24"}
|
| 1419 |
+
{"current_steps": 1419, "total_steps": 1560, "loss": 0.3139, "lr": 2.467960742952463e-07, "epoch": 2.7264, "percentage": 90.96, "elapsed_time": "3:23:59", "remaining_time": "0:20:16"}
|
| 1420 |
+
{"current_steps": 1420, "total_steps": 1560, "loss": 0.2856, "lr": 2.4333640958659144e-07, "epoch": 2.72832, "percentage": 91.03, "elapsed_time": "3:24:07", "remaining_time": "0:20:07"}
|
| 1421 |
+
{"current_steps": 1421, "total_steps": 1560, "loss": 0.343, "lr": 2.399005608211502e-07, "epoch": 2.7302400000000002, "percentage": 91.09, "elapsed_time": "3:24:15", "remaining_time": "0:19:58"}
|
| 1422 |
+
{"current_steps": 1422, "total_steps": 1560, "loss": 0.246, "lr": 2.3648854520173237e-07, "epoch": 2.73216, "percentage": 91.15, "elapsed_time": "3:24:24", "remaining_time": "0:19:50"}
|
| 1423 |
+
{"current_steps": 1423, "total_steps": 1560, "loss": 0.2787, "lr": 2.3310037981182088e-07, "epoch": 2.73408, "percentage": 91.22, "elapsed_time": "3:24:32", "remaining_time": "0:19:41"}
|
| 1424 |
+
{"current_steps": 1424, "total_steps": 1560, "loss": 0.2383, "lr": 2.2973608161547755e-07, "epoch": 2.7359999999999998, "percentage": 91.28, "elapsed_time": "3:24:40", "remaining_time": "0:19:32"}
|
| 1425 |
+
{"current_steps": 1425, "total_steps": 1560, "loss": 0.3292, "lr": 2.2639566745727203e-07, "epoch": 2.73792, "percentage": 91.35, "elapsed_time": "3:24:48", "remaining_time": "0:19:24"}
|
| 1426 |
+
{"current_steps": 1426, "total_steps": 1560, "loss": 0.2619, "lr": 2.2307915406218517e-07, "epoch": 2.73984, "percentage": 91.41, "elapsed_time": "3:24:57", "remaining_time": "0:19:15"}
|
| 1427 |
+
{"current_steps": 1427, "total_steps": 1560, "loss": 0.2525, "lr": 2.1978655803553128e-07, "epoch": 2.74176, "percentage": 91.47, "elapsed_time": "3:25:05", "remaining_time": "0:19:06"}
|
| 1428 |
+
{"current_steps": 1428, "total_steps": 1560, "loss": 0.3198, "lr": 2.1651789586287442e-07, "epoch": 2.74368, "percentage": 91.54, "elapsed_time": "3:25:14", "remaining_time": "0:18:58"}
|
| 1429 |
+
{"current_steps": 1429, "total_steps": 1560, "loss": 0.2885, "lr": 2.1327318390994445e-07, "epoch": 2.7456, "percentage": 91.6, "elapsed_time": "3:25:22", "remaining_time": "0:18:49"}
|
| 1430 |
+
{"current_steps": 1430, "total_steps": 1560, "loss": 0.2678, "lr": 2.1005243842255552e-07, "epoch": 2.7475199999999997, "percentage": 91.67, "elapsed_time": "3:25:30", "remaining_time": "0:18:40"}
|
| 1431 |
+
{"current_steps": 1431, "total_steps": 1560, "loss": 0.2777, "lr": 2.068556755265272e-07, "epoch": 2.74944, "percentage": 91.73, "elapsed_time": "3:25:39", "remaining_time": "0:18:32"}
|
| 1432 |
+
{"current_steps": 1432, "total_steps": 1560, "loss": 0.2672, "lr": 2.0368291122759898e-07, "epoch": 2.75136, "percentage": 91.79, "elapsed_time": "3:25:47", "remaining_time": "0:18:23"}
|
| 1433 |
+
{"current_steps": 1433, "total_steps": 1560, "loss": 0.3326, "lr": 2.005341614113543e-07, "epoch": 2.75328, "percentage": 91.86, "elapsed_time": "3:25:56", "remaining_time": "0:18:15"}
|
| 1434 |
+
{"current_steps": 1434, "total_steps": 1560, "loss": 0.3185, "lr": 1.9740944184313882e-07, "epoch": 2.7552, "percentage": 91.92, "elapsed_time": "3:26:04", "remaining_time": "0:18:06"}
|
| 1435 |
+
{"current_steps": 1435, "total_steps": 1560, "loss": 0.2864, "lr": 1.9430876816798228e-07, "epoch": 2.75712, "percentage": 91.99, "elapsed_time": "3:26:13", "remaining_time": "0:17:57"}
|
| 1436 |
+
{"current_steps": 1436, "total_steps": 1560, "loss": 0.2284, "lr": 1.9123215591052014e-07, "epoch": 2.75904, "percentage": 92.05, "elapsed_time": "3:26:21", "remaining_time": "0:17:49"}
|
| 1437 |
+
{"current_steps": 1437, "total_steps": 1560, "loss": 0.2776, "lr": 1.88179620474917e-07, "epoch": 2.76096, "percentage": 92.12, "elapsed_time": "3:26:29", "remaining_time": "0:17:40"}
|
| 1438 |
+
{"current_steps": 1438, "total_steps": 1560, "loss": 0.2955, "lr": 1.8515117714478447e-07, "epoch": 2.76288, "percentage": 92.18, "elapsed_time": "3:26:38", "remaining_time": "0:17:31"}
|
| 1439 |
+
{"current_steps": 1439, "total_steps": 1560, "loss": 0.2997, "lr": 1.8214684108311286e-07, "epoch": 2.7648, "percentage": 92.24, "elapsed_time": "3:26:46", "remaining_time": "0:17:23"}
|
| 1440 |
+
{"current_steps": 1440, "total_steps": 1560, "loss": 0.3018, "lr": 1.7916662733218848e-07, "epoch": 2.76672, "percentage": 92.31, "elapsed_time": "3:26:55", "remaining_time": "0:17:14"}
|
| 1441 |
+
{"current_steps": 1441, "total_steps": 1560, "loss": 0.2022, "lr": 1.762105508135198e-07, "epoch": 2.76864, "percentage": 92.37, "elapsed_time": "3:27:04", "remaining_time": "0:17:06"}
|
| 1442 |
+
{"current_steps": 1442, "total_steps": 1560, "loss": 0.3218, "lr": 1.7327862632776638e-07, "epoch": 2.77056, "percentage": 92.44, "elapsed_time": "3:27:12", "remaining_time": "0:16:57"}
|
| 1443 |
+
{"current_steps": 1443, "total_steps": 1560, "loss": 0.2894, "lr": 1.7037086855465902e-07, "epoch": 2.77248, "percentage": 92.5, "elapsed_time": "3:27:20", "remaining_time": "0:16:48"}
|
| 1444 |
+
{"current_steps": 1444, "total_steps": 1560, "loss": 0.282, "lr": 1.6748729205293024e-07, "epoch": 2.7744, "percentage": 92.56, "elapsed_time": "3:27:29", "remaining_time": "0:16:40"}
|
| 1445 |
+
{"current_steps": 1445, "total_steps": 1560, "loss": 0.3495, "lr": 1.646279112602417e-07, "epoch": 2.77632, "percentage": 92.63, "elapsed_time": "3:27:37", "remaining_time": "0:16:31"}
|
| 1446 |
+
{"current_steps": 1446, "total_steps": 1560, "loss": 0.2785, "lr": 1.6179274049310966e-07, "epoch": 2.7782400000000003, "percentage": 92.69, "elapsed_time": "3:27:45", "remaining_time": "0:16:22"}
|
| 1447 |
+
{"current_steps": 1447, "total_steps": 1560, "loss": 0.2385, "lr": 1.5898179394683244e-07, "epoch": 2.78016, "percentage": 92.76, "elapsed_time": "3:27:54", "remaining_time": "0:16:14"}
|
| 1448 |
+
{"current_steps": 1448, "total_steps": 1560, "loss": 0.2575, "lr": 1.5619508569542363e-07, "epoch": 2.78208, "percentage": 92.82, "elapsed_time": "3:28:02", "remaining_time": "0:16:05"}
|
| 1449 |
+
{"current_steps": 1449, "total_steps": 1560, "loss": 0.2531, "lr": 1.5343262969153781e-07, "epoch": 2.784, "percentage": 92.88, "elapsed_time": "3:28:10", "remaining_time": "0:15:56"}
|
| 1450 |
+
{"current_steps": 1450, "total_steps": 1560, "loss": 0.3086, "lr": 1.5069443976640287e-07, "epoch": 2.78592, "percentage": 92.95, "elapsed_time": "3:28:19", "remaining_time": "0:15:48"}
|
| 1451 |
+
{"current_steps": 1451, "total_steps": 1560, "loss": 0.2433, "lr": 1.4798052962974874e-07, "epoch": 2.78784, "percentage": 93.01, "elapsed_time": "3:28:27", "remaining_time": "0:15:39"}
|
| 1452 |
+
{"current_steps": 1452, "total_steps": 1560, "loss": 0.2636, "lr": 1.4529091286973994e-07, "epoch": 2.7897600000000002, "percentage": 93.08, "elapsed_time": "3:28:35", "remaining_time": "0:15:30"}
|
| 1453 |
+
{"current_steps": 1453, "total_steps": 1560, "loss": 0.26, "lr": 1.4262560295290884e-07, "epoch": 2.79168, "percentage": 93.14, "elapsed_time": "3:28:44", "remaining_time": "0:15:22"}
|
| 1454 |
+
{"current_steps": 1454, "total_steps": 1560, "loss": 0.2669, "lr": 1.3998461322408563e-07, "epoch": 2.7936, "percentage": 93.21, "elapsed_time": "3:28:52", "remaining_time": "0:15:13"}
|
| 1455 |
+
{"current_steps": 1455, "total_steps": 1560, "loss": 0.21, "lr": 1.3736795690633353e-07, "epoch": 2.79552, "percentage": 93.27, "elapsed_time": "3:29:00", "remaining_time": "0:15:05"}
|
| 1456 |
+
{"current_steps": 1456, "total_steps": 1560, "loss": 0.3053, "lr": 1.3477564710088097e-07, "epoch": 2.79744, "percentage": 93.33, "elapsed_time": "3:29:09", "remaining_time": "0:14:56"}
|
| 1457 |
+
{"current_steps": 1457, "total_steps": 1560, "loss": 0.3053, "lr": 1.3220769678705724e-07, "epoch": 2.79936, "percentage": 93.4, "elapsed_time": "3:29:17", "remaining_time": "0:14:47"}
|
| 1458 |
+
{"current_steps": 1458, "total_steps": 1560, "loss": 0.2055, "lr": 1.2966411882222695e-07, "epoch": 2.80128, "percentage": 93.46, "elapsed_time": "3:29:25", "remaining_time": "0:14:39"}
|
| 1459 |
+
{"current_steps": 1459, "total_steps": 1560, "loss": 0.3367, "lr": 1.271449259417268e-07, "epoch": 2.8032, "percentage": 93.53, "elapsed_time": "3:29:34", "remaining_time": "0:14:30"}
|
| 1460 |
+
{"current_steps": 1460, "total_steps": 1560, "loss": 0.2504, "lr": 1.2465013075879884e-07, "epoch": 2.80512, "percentage": 93.59, "elapsed_time": "3:29:42", "remaining_time": "0:14:21"}
|
| 1461 |
+
{"current_steps": 1461, "total_steps": 1560, "loss": 0.3333, "lr": 1.2217974576453072e-07, "epoch": 2.8070399999999998, "percentage": 93.65, "elapsed_time": "3:29:50", "remaining_time": "0:14:13"}
|
| 1462 |
+
{"current_steps": 1462, "total_steps": 1560, "loss": 0.2815, "lr": 1.1973378332779229e-07, "epoch": 2.80896, "percentage": 93.72, "elapsed_time": "3:29:59", "remaining_time": "0:14:04"}
|
| 1463 |
+
{"current_steps": 1463, "total_steps": 1560, "loss": 0.2363, "lr": 1.1731225569517113e-07, "epoch": 2.81088, "percentage": 93.78, "elapsed_time": "3:30:07", "remaining_time": "0:13:55"}
|
| 1464 |
+
{"current_steps": 1464, "total_steps": 1560, "loss": 0.2465, "lr": 1.1491517499091498e-07, "epoch": 2.8128, "percentage": 93.85, "elapsed_time": "3:30:15", "remaining_time": "0:13:47"}
|
| 1465 |
+
{"current_steps": 1465, "total_steps": 1560, "loss": 0.26, "lr": 1.1254255321686836e-07, "epoch": 2.81472, "percentage": 93.91, "elapsed_time": "3:30:24", "remaining_time": "0:13:38"}
|
| 1466 |
+
{"current_steps": 1466, "total_steps": 1560, "loss": 0.3018, "lr": 1.1019440225241317e-07, "epoch": 2.81664, "percentage": 93.97, "elapsed_time": "3:30:32", "remaining_time": "0:13:29"}
|
| 1467 |
+
{"current_steps": 1467, "total_steps": 1560, "loss": 0.2797, "lr": 1.078707338544105e-07, "epoch": 2.8185599999999997, "percentage": 94.04, "elapsed_time": "3:30:40", "remaining_time": "0:13:21"}
|
| 1468 |
+
{"current_steps": 1468, "total_steps": 1560, "loss": 0.2722, "lr": 1.055715596571405e-07, "epoch": 2.82048, "percentage": 94.1, "elapsed_time": "3:30:49", "remaining_time": "0:13:12"}
|
| 1469 |
+
{"current_steps": 1469, "total_steps": 1560, "loss": 0.2634, "lr": 1.0329689117224262e-07, "epoch": 2.8224, "percentage": 94.17, "elapsed_time": "3:30:57", "remaining_time": "0:13:04"}
|
| 1470 |
+
{"current_steps": 1470, "total_steps": 1560, "loss": 0.2736, "lr": 1.0104673978866164e-07, "epoch": 2.82432, "percentage": 94.23, "elapsed_time": "3:31:05", "remaining_time": "0:12:55"}
|
| 1471 |
+
{"current_steps": 1471, "total_steps": 1560, "loss": 0.2894, "lr": 9.882111677258777e-08, "epoch": 2.82624, "percentage": 94.29, "elapsed_time": "3:31:13", "remaining_time": "0:12:46"}
|
| 1472 |
+
{"current_steps": 1472, "total_steps": 1560, "loss": 0.2611, "lr": 9.662003326740166e-08, "epoch": 2.82816, "percentage": 94.36, "elapsed_time": "3:31:22", "remaining_time": "0:12:38"}
|
| 1473 |
+
{"current_steps": 1473, "total_steps": 1560, "loss": 0.3096, "lr": 9.444350029361671e-08, "epoch": 2.83008, "percentage": 94.42, "elapsed_time": "3:31:30", "remaining_time": "0:12:29"}
|
| 1474 |
+
{"current_steps": 1474, "total_steps": 1560, "loss": 0.2736, "lr": 9.22915287488274e-08, "epoch": 2.832, "percentage": 94.49, "elapsed_time": "3:31:38", "remaining_time": "0:12:20"}
|
| 1475 |
+
{"current_steps": 1475, "total_steps": 1560, "loss": 0.3118, "lr": 9.016412940765107e-08, "epoch": 2.83392, "percentage": 94.55, "elapsed_time": "3:31:47", "remaining_time": "0:12:12"}
|
| 1476 |
+
{"current_steps": 1476, "total_steps": 1560, "loss": 0.2668, "lr": 8.80613129216762e-08, "epoch": 2.83584, "percentage": 94.62, "elapsed_time": "3:31:55", "remaining_time": "0:12:03"}
|
| 1477 |
+
{"current_steps": 1477, "total_steps": 1560, "loss": 0.2873, "lr": 8.598308981940751e-08, "epoch": 2.83776, "percentage": 94.68, "elapsed_time": "3:32:04", "remaining_time": "0:11:55"}
|
| 1478 |
+
{"current_steps": 1478, "total_steps": 1560, "loss": 0.2246, "lr": 8.392947050621603e-08, "epoch": 2.83968, "percentage": 94.74, "elapsed_time": "3:32:12", "remaining_time": "0:11:46"}
|
| 1479 |
+
{"current_steps": 1479, "total_steps": 1560, "loss": 0.3324, "lr": 8.190046526428241e-08, "epoch": 2.8416, "percentage": 94.81, "elapsed_time": "3:32:20", "remaining_time": "0:11:37"}
|
| 1480 |
+
{"current_steps": 1480, "total_steps": 1560, "loss": 0.2426, "lr": 7.989608425254924e-08, "epoch": 2.84352, "percentage": 94.87, "elapsed_time": "3:32:28", "remaining_time": "0:11:29"}
|
| 1481 |
+
{"current_steps": 1481, "total_steps": 1560, "loss": 0.3047, "lr": 7.791633750667105e-08, "epoch": 2.84544, "percentage": 94.94, "elapsed_time": "3:32:37", "remaining_time": "0:11:20"}
|
| 1482 |
+
{"current_steps": 1482, "total_steps": 1560, "loss": 0.2377, "lr": 7.59612349389599e-08, "epoch": 2.84736, "percentage": 95.0, "elapsed_time": "3:32:45", "remaining_time": "0:11:11"}
|
| 1483 |
+
{"current_steps": 1483, "total_steps": 1560, "loss": 0.2649, "lr": 7.403078633833716e-08, "epoch": 2.8492800000000003, "percentage": 95.06, "elapsed_time": "3:32:53", "remaining_time": "0:11:03"}
|
| 1484 |
+
{"current_steps": 1484, "total_steps": 1560, "loss": 0.2953, "lr": 7.212500137028789e-08, "epoch": 2.8512, "percentage": 95.13, "elapsed_time": "3:33:02", "remaining_time": "0:10:54"}
|
| 1485 |
+
{"current_steps": 1485, "total_steps": 1560, "loss": 0.2578, "lr": 7.024388957680705e-08, "epoch": 2.85312, "percentage": 95.19, "elapsed_time": "3:33:10", "remaining_time": "0:10:45"}
|
| 1486 |
+
{"current_steps": 1486, "total_steps": 1560, "loss": 0.2729, "lr": 6.838746037635735e-08, "epoch": 2.85504, "percentage": 95.26, "elapsed_time": "3:33:18", "remaining_time": "0:10:37"}
|
| 1487 |
+
{"current_steps": 1487, "total_steps": 1560, "loss": 0.2415, "lr": 6.655572306381696e-08, "epoch": 2.85696, "percentage": 95.32, "elapsed_time": "3:33:26", "remaining_time": "0:10:28"}
|
| 1488 |
+
{"current_steps": 1488, "total_steps": 1560, "loss": 0.2602, "lr": 6.474868681043578e-08, "epoch": 2.85888, "percentage": 95.38, "elapsed_time": "3:33:35", "remaining_time": "0:10:20"}
|
| 1489 |
+
{"current_steps": 1489, "total_steps": 1560, "loss": 0.2683, "lr": 6.29663606637898e-08, "epoch": 2.8608000000000002, "percentage": 95.45, "elapsed_time": "3:33:43", "remaining_time": "0:10:11"}
|
| 1490 |
+
{"current_steps": 1490, "total_steps": 1560, "loss": 0.2973, "lr": 6.120875354773459e-08, "epoch": 2.86272, "percentage": 95.51, "elapsed_time": "3:33:51", "remaining_time": "0:10:02"}
|
| 1491 |
+
{"current_steps": 1491, "total_steps": 1560, "loss": 0.2668, "lr": 5.947587426236079e-08, "epoch": 2.86464, "percentage": 95.58, "elapsed_time": "3:33:59", "remaining_time": "0:09:54"}
|
| 1492 |
+
{"current_steps": 1492, "total_steps": 1560, "loss": 0.2855, "lr": 5.776773148394976e-08, "epoch": 2.8665599999999998, "percentage": 95.64, "elapsed_time": "3:34:08", "remaining_time": "0:09:45"}
|
| 1493 |
+
{"current_steps": 1493, "total_steps": 1560, "loss": 0.2714, "lr": 5.608433376493194e-08, "epoch": 2.86848, "percentage": 95.71, "elapsed_time": "3:34:16", "remaining_time": "0:09:36"}
|
| 1494 |
+
{"current_steps": 1494, "total_steps": 1560, "loss": 0.269, "lr": 5.4425689533841864e-08, "epoch": 2.8704, "percentage": 95.77, "elapsed_time": "3:34:24", "remaining_time": "0:09:28"}
|
| 1495 |
+
{"current_steps": 1495, "total_steps": 1560, "loss": 0.2956, "lr": 5.279180709527765e-08, "epoch": 2.87232, "percentage": 95.83, "elapsed_time": "3:34:33", "remaining_time": "0:09:19"}
|
| 1496 |
+
{"current_steps": 1496, "total_steps": 1560, "loss": 0.2759, "lr": 5.1182694629857145e-08, "epoch": 2.87424, "percentage": 95.9, "elapsed_time": "3:34:41", "remaining_time": "0:09:11"}
|
| 1497 |
+
{"current_steps": 1497, "total_steps": 1560, "loss": 0.2697, "lr": 4.959836019417963e-08, "epoch": 2.87616, "percentage": 95.96, "elapsed_time": "3:34:50", "remaining_time": "0:09:02"}
|
| 1498 |
+
{"current_steps": 1498, "total_steps": 1560, "loss": 0.2936, "lr": 4.803881172078473e-08, "epoch": 2.8780799999999997, "percentage": 96.03, "elapsed_time": "3:34:58", "remaining_time": "0:08:53"}
|
| 1499 |
+
{"current_steps": 1499, "total_steps": 1560, "loss": 0.269, "lr": 4.650405701811078e-08, "epoch": 2.88, "percentage": 96.09, "elapsed_time": "3:35:06", "remaining_time": "0:08:45"}
|
| 1500 |
+
{"current_steps": 1500, "total_steps": 1560, "loss": 0.2641, "lr": 4.499410377045765e-08, "epoch": 2.88192, "percentage": 96.15, "elapsed_time": "3:35:15", "remaining_time": "0:08:36"}
|
| 1501 |
+
{"current_steps": 1501, "total_steps": 1560, "loss": 0.318, "lr": 4.350895953794898e-08, "epoch": 2.88384, "percentage": 96.22, "elapsed_time": "3:35:23", "remaining_time": "0:08:27"}
|
| 1502 |
+
{"current_steps": 1502, "total_steps": 1560, "loss": 0.2875, "lr": 4.2048631756492206e-08, "epoch": 2.88576, "percentage": 96.28, "elapsed_time": "3:35:31", "remaining_time": "0:08:19"}
|
| 1503 |
+
{"current_steps": 1503, "total_steps": 1560, "loss": 0.2684, "lr": 4.0613127737741396e-08, "epoch": 2.88768, "percentage": 96.35, "elapsed_time": "3:35:40", "remaining_time": "0:08:10"}
|
| 1504 |
+
{"current_steps": 1504, "total_steps": 1560, "loss": 0.3114, "lr": 3.9202454669063915e-08, "epoch": 2.8895999999999997, "percentage": 96.41, "elapsed_time": "3:35:48", "remaining_time": "0:08:02"}
|
| 1505 |
+
{"current_steps": 1505, "total_steps": 1560, "loss": 0.2945, "lr": 3.781661961349992e-08, "epoch": 2.89152, "percentage": 96.47, "elapsed_time": "3:35:56", "remaining_time": "0:07:53"}
|
| 1506 |
+
{"current_steps": 1506, "total_steps": 1560, "loss": 0.2969, "lr": 3.645562950973014e-08, "epoch": 2.89344, "percentage": 96.54, "elapsed_time": "3:36:05", "remaining_time": "0:07:44"}
|
| 1507 |
+
{"current_steps": 1507, "total_steps": 1560, "loss": 0.2962, "lr": 3.5119491172039836e-08, "epoch": 2.89536, "percentage": 96.6, "elapsed_time": "3:36:13", "remaining_time": "0:07:36"}
|
| 1508 |
+
{"current_steps": 1508, "total_steps": 1560, "loss": 0.2868, "lr": 3.3808211290284886e-08, "epoch": 2.89728, "percentage": 96.67, "elapsed_time": "3:36:21", "remaining_time": "0:07:27"}
|
| 1509 |
+
{"current_steps": 1509, "total_steps": 1560, "loss": 0.3144, "lr": 3.252179642985909e-08, "epoch": 2.8992, "percentage": 96.73, "elapsed_time": "3:36:30", "remaining_time": "0:07:19"}
|
| 1510 |
+
{"current_steps": 1510, "total_steps": 1560, "loss": 0.2763, "lr": 3.1260253031660247e-08, "epoch": 2.90112, "percentage": 96.79, "elapsed_time": "3:36:38", "remaining_time": "0:07:10"}
|
| 1511 |
+
{"current_steps": 1511, "total_steps": 1560, "loss": 0.2916, "lr": 3.002358741205691e-08, "epoch": 2.90304, "percentage": 96.86, "elapsed_time": "3:36:47", "remaining_time": "0:07:01"}
|
| 1512 |
+
{"current_steps": 1512, "total_steps": 1560, "loss": 0.2705, "lr": 2.8811805762860578e-08, "epoch": 2.90496, "percentage": 96.92, "elapsed_time": "3:36:55", "remaining_time": "0:06:53"}
|
| 1513 |
+
{"current_steps": 1513, "total_steps": 1560, "loss": 0.2943, "lr": 2.762491415128965e-08, "epoch": 2.90688, "percentage": 96.99, "elapsed_time": "3:37:04", "remaining_time": "0:06:44"}
|
| 1514 |
+
{"current_steps": 1514, "total_steps": 1560, "loss": 0.2923, "lr": 2.6462918519944425e-08, "epoch": 2.9088000000000003, "percentage": 97.05, "elapsed_time": "3:37:12", "remaining_time": "0:06:35"}
|
| 1515 |
+
{"current_steps": 1515, "total_steps": 1560, "loss": 0.2735, "lr": 2.5325824686772138e-08, "epoch": 2.91072, "percentage": 97.12, "elapsed_time": "3:37:20", "remaining_time": "0:06:27"}
|
| 1516 |
+
{"current_steps": 1516, "total_steps": 1560, "loss": 0.3105, "lr": 2.4213638345040868e-08, "epoch": 2.91264, "percentage": 97.18, "elapsed_time": "3:37:28", "remaining_time": "0:06:18"}
|
| 1517 |
+
{"current_steps": 1517, "total_steps": 1560, "loss": 0.2912, "lr": 2.3126365063311228e-08, "epoch": 2.91456, "percentage": 97.24, "elapsed_time": "3:37:37", "remaining_time": "0:06:10"}
|
| 1518 |
+
{"current_steps": 1518, "total_steps": 1560, "loss": 0.3156, "lr": 2.206401028540639e-08, "epoch": 2.91648, "percentage": 97.31, "elapsed_time": "3:37:45", "remaining_time": "0:06:01"}
|
| 1519 |
+
{"current_steps": 1519, "total_steps": 1560, "loss": 0.2812, "lr": 2.1026579330387655e-08, "epoch": 2.9184, "percentage": 97.37, "elapsed_time": "3:37:53", "remaining_time": "0:05:52"}
|
| 1520 |
+
{"current_steps": 1520, "total_steps": 1560, "loss": 0.2399, "lr": 2.0014077392525035e-08, "epoch": 2.9203200000000002, "percentage": 97.44, "elapsed_time": "3:38:01", "remaining_time": "0:05:44"}
|
| 1521 |
+
{"current_steps": 1521, "total_steps": 1560, "loss": 0.3013, "lr": 1.9026509541272276e-08, "epoch": 2.92224, "percentage": 97.5, "elapsed_time": "3:38:09", "remaining_time": "0:05:35"}
|
| 1522 |
+
{"current_steps": 1522, "total_steps": 1560, "loss": 0.2988, "lr": 1.8063880721242986e-08, "epoch": 2.92416, "percentage": 97.56, "elapsed_time": "3:38:18", "remaining_time": "0:05:27"}
|
| 1523 |
+
{"current_steps": 1523, "total_steps": 1560, "loss": 0.258, "lr": 1.712619575218344e-08, "epoch": 2.92608, "percentage": 97.63, "elapsed_time": "3:38:26", "remaining_time": "0:05:18"}
|
| 1524 |
+
{"current_steps": 1524, "total_steps": 1560, "loss": 0.3094, "lr": 1.6213459328950355e-08, "epoch": 2.928, "percentage": 97.69, "elapsed_time": "3:38:34", "remaining_time": "0:05:09"}
|
| 1525 |
+
{"current_steps": 1525, "total_steps": 1560, "loss": 0.2191, "lr": 1.5325676021484826e-08, "epoch": 2.92992, "percentage": 97.76, "elapsed_time": "3:38:42", "remaining_time": "0:05:01"}
|
| 1526 |
+
{"current_steps": 1526, "total_steps": 1560, "loss": 0.2577, "lr": 1.4462850274794548e-08, "epoch": 2.9318400000000002, "percentage": 97.82, "elapsed_time": "3:38:51", "remaining_time": "0:04:52"}
|
| 1527 |
+
{"current_steps": 1527, "total_steps": 1560, "loss": 0.2951, "lr": 1.3624986408924956e-08, "epoch": 2.93376, "percentage": 97.88, "elapsed_time": "3:38:59", "remaining_time": "0:04:43"}
|
| 1528 |
+
{"current_steps": 1528, "total_steps": 1560, "loss": 0.2911, "lr": 1.2812088618942009e-08, "epoch": 2.93568, "percentage": 97.95, "elapsed_time": "3:39:07", "remaining_time": "0:04:35"}
|
| 1529 |
+
{"current_steps": 1529, "total_steps": 1560, "loss": 0.2812, "lr": 1.2024160974911103e-08, "epoch": 2.9375999999999998, "percentage": 98.01, "elapsed_time": "3:39:15", "remaining_time": "0:04:26"}
|
| 1530 |
+
{"current_steps": 1530, "total_steps": 1560, "loss": 0.2886, "lr": 1.1261207421874309e-08, "epoch": 2.93952, "percentage": 98.08, "elapsed_time": "3:39:23", "remaining_time": "0:04:18"}
|
| 1531 |
+
{"current_steps": 1531, "total_steps": 1560, "loss": 0.2786, "lr": 1.0523231779832055e-08, "epoch": 2.94144, "percentage": 98.14, "elapsed_time": "3:39:32", "remaining_time": "0:04:09"}
|
| 1532 |
+
{"current_steps": 1532, "total_steps": 1560, "loss": 0.2866, "lr": 9.810237743724805e-09, "epoch": 2.94336, "percentage": 98.21, "elapsed_time": "3:39:40", "remaining_time": "0:04:00"}
|
| 1533 |
+
{"current_steps": 1533, "total_steps": 1560, "loss": 0.2572, "lr": 9.12222888341252e-09, "epoch": 2.94528, "percentage": 98.27, "elapsed_time": "3:39:48", "remaining_time": "0:03:52"}
|
| 1534 |
+
{"current_steps": 1534, "total_steps": 1560, "loss": 0.2832, "lr": 8.459208643659122e-09, "epoch": 2.9472, "percentage": 98.33, "elapsed_time": "3:39:57", "remaining_time": "0:03:43"}
|
| 1535 |
+
{"current_steps": 1535, "total_steps": 1560, "loss": 0.2559, "lr": 7.8211803441125e-09, "epoch": 2.9491199999999997, "percentage": 98.4, "elapsed_time": "3:40:05", "remaining_time": "0:03:35"}
|
| 1536 |
+
{"current_steps": 1536, "total_steps": 1560, "loss": 0.3153, "lr": 7.2081471792911914e-09, "epoch": 2.95104, "percentage": 98.46, "elapsed_time": "3:40:13", "remaining_time": "0:03:26"}
|
| 1537 |
+
{"current_steps": 1537, "total_steps": 1560, "loss": 0.2619, "lr": 6.6201122185649555e-09, "epoch": 2.95296, "percentage": 98.53, "elapsed_time": "3:40:21", "remaining_time": "0:03:17"}
|
| 1538 |
+
{"current_steps": 1538, "total_steps": 1560, "loss": 0.3306, "lr": 6.057078406142003e-09, "epoch": 2.95488, "percentage": 98.59, "elapsed_time": "3:40:30", "remaining_time": "0:03:09"}
|
| 1539 |
+
{"current_steps": 1539, "total_steps": 1560, "loss": 0.2509, "lr": 5.519048561053453e-09, "epoch": 2.9568, "percentage": 98.65, "elapsed_time": "3:40:38", "remaining_time": "0:03:00"}
|
| 1540 |
+
{"current_steps": 1540, "total_steps": 1560, "loss": 0.266, "lr": 5.006025377138901e-09, "epoch": 2.95872, "percentage": 98.72, "elapsed_time": "3:40:46", "remaining_time": "0:02:52"}
|
| 1541 |
+
{"current_steps": 1541, "total_steps": 1560, "loss": 0.2688, "lr": 4.518011423032542e-09, "epoch": 2.96064, "percentage": 98.78, "elapsed_time": "3:40:54", "remaining_time": "0:02:43"}
|
| 1542 |
+
{"current_steps": 1542, "total_steps": 1560, "loss": 0.2879, "lr": 4.055009142152066e-09, "epoch": 2.96256, "percentage": 98.85, "elapsed_time": "3:41:02", "remaining_time": "0:02:34"}
|
| 1543 |
+
{"current_steps": 1543, "total_steps": 1560, "loss": 0.2997, "lr": 3.6170208526836724e-09, "epoch": 2.96448, "percentage": 98.91, "elapsed_time": "3:41:11", "remaining_time": "0:02:26"}
|
| 1544 |
+
{"current_steps": 1544, "total_steps": 1560, "loss": 0.3001, "lr": 3.204048747573185e-09, "epoch": 2.9664, "percentage": 98.97, "elapsed_time": "3:41:19", "remaining_time": "0:02:17"}
|
| 1545 |
+
{"current_steps": 1545, "total_steps": 1560, "loss": 0.265, "lr": 2.816094894513843e-09, "epoch": 2.96832, "percentage": 99.04, "elapsed_time": "3:41:27", "remaining_time": "0:02:09"}
|
| 1546 |
+
{"current_steps": 1546, "total_steps": 1560, "loss": 0.2547, "lr": 2.4531612359363077e-09, "epoch": 2.97024, "percentage": 99.1, "elapsed_time": "3:41:35", "remaining_time": "0:02:00"}
|
| 1547 |
+
{"current_steps": 1547, "total_steps": 1560, "loss": 0.267, "lr": 2.1152495889970035e-09, "epoch": 2.97216, "percentage": 99.17, "elapsed_time": "3:41:44", "remaining_time": "0:01:51"}
|
| 1548 |
+
{"current_steps": 1548, "total_steps": 1560, "loss": 0.2817, "lr": 1.8023616455731253e-09, "epoch": 2.97408, "percentage": 99.23, "elapsed_time": "3:41:52", "remaining_time": "0:01:43"}
|
| 1549 |
+
{"current_steps": 1549, "total_steps": 1560, "loss": 0.3095, "lr": 1.514498972249312e-09, "epoch": 2.976, "percentage": 99.29, "elapsed_time": "3:42:00", "remaining_time": "0:01:34"}
|
| 1550 |
+
{"current_steps": 1550, "total_steps": 1560, "loss": 0.3095, "lr": 1.2516630103137638e-09, "epoch": 2.97792, "percentage": 99.36, "elapsed_time": "3:42:08", "remaining_time": "0:01:25"}
|
| 1551 |
+
{"current_steps": 1551, "total_steps": 1560, "loss": 0.3246, "lr": 1.0138550757493592e-09, "epoch": 2.9798400000000003, "percentage": 99.42, "elapsed_time": "3:42:17", "remaining_time": "0:01:17"}
|
| 1552 |
+
{"current_steps": 1552, "total_steps": 1560, "loss": 0.26, "lr": 8.010763592264381e-10, "epoch": 2.98176, "percentage": 99.49, "elapsed_time": "3:42:25", "remaining_time": "0:01:08"}
|
| 1553 |
+
{"current_steps": 1553, "total_steps": 1560, "loss": 0.3251, "lr": 6.133279260983616e-10, "epoch": 2.98368, "percentage": 99.55, "elapsed_time": "3:42:33", "remaining_time": "0:01:00"}
|
| 1554 |
+
{"current_steps": 1554, "total_steps": 1560, "loss": 0.2451, "lr": 4.506107163948503e-10, "epoch": 2.9856, "percentage": 99.62, "elapsed_time": "3:42:41", "remaining_time": "0:00:51"}
|
| 1555 |
+
{"current_steps": 1555, "total_steps": 1560, "loss": 0.3267, "lr": 3.12925544818099e-10, "epoch": 2.98752, "percentage": 99.68, "elapsed_time": "3:42:50", "remaining_time": "0:00:42"}
|
| 1556 |
+
{"current_steps": 1556, "total_steps": 1560, "loss": 0.2593, "lr": 2.0027310073833516e-10, "epoch": 2.98944, "percentage": 99.74, "elapsed_time": "3:42:59", "remaining_time": "0:00:34"}
|
| 1557 |
+
{"current_steps": 1557, "total_steps": 1560, "loss": 0.3219, "lr": 1.1265394818993358e-10, "epoch": 2.9913600000000002, "percentage": 99.81, "elapsed_time": "3:43:07", "remaining_time": "0:00:25"}
|
| 1558 |
+
{"current_steps": 1558, "total_steps": 1560, "loss": 0.2918, "lr": 5.0068525870305974e-11, "epoch": 2.99328, "percentage": 99.87, "elapsed_time": "3:43:16", "remaining_time": "0:00:17"}
|
| 1559 |
+
{"current_steps": 1559, "total_steps": 1560, "loss": 0.3611, "lr": 1.251714713546015e-11, "epoch": 2.9952, "percentage": 99.94, "elapsed_time": "3:43:24", "remaining_time": "0:00:08"}
|
| 1560 |
+
{"current_steps": 1560, "total_steps": 1560, "loss": 0.2725, "lr": 0.0, "epoch": 2.99712, "percentage": 100.0, "elapsed_time": "3:43:33", "remaining_time": "0:00:00"}
|
| 1561 |
+
{"current_steps": 1560, "total_steps": 1560, "epoch": 2.99712, "percentage": 100.0, "elapsed_time": "3:45:19", "remaining_time": "0:00:00"}
|