sedrickkeh commited on
Commit
1661cf7
·
verified ·
1 Parent(s): b09c788

Training in progress, epoch 2

Browse files
model-00001-of-00004.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:299f01665f170bfa860d27dc12a5be0cf719f6687d52f2c5ee48d0e4fad9a7b8
3
  size 4877660776
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:fae6549f4a6e5e6fa6c2451c52a83aa70c844fd0604cceee70555843364efe33
3
  size 4877660776
model-00002-of-00004.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:b5d2c4a46f27ca9823c2049273721cf97fd61e2aaba9cf35e9a383b100ce95fe
3
  size 4932751008
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8528f99fc9d9f7810ba1c2da425be1d813d89a1b99af5f26f2e68ab690674301
3
  size 4932751008
model-00003-of-00004.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:280eca396cb8ac8aad179df85682726157eeecbe41a29ea13b9fa2ba08048c1b
3
  size 4330865200
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:3fd033e942c231af670f8d7d840c0e067ba6d9ea132a855fb7888ab5c8ef97b1
3
  size 4330865200
model-00004-of-00004.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:6535574faed94d320315d03d3460ab688c04488812c49b0ae0f48dc1833bdc33
3
  size 1089994880
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b10b4e50391c7c29e80f2d6a832d4d85b6a32356a3f35d6babca2d186d6ffac1
3
  size 1089994880
trainer_log.jsonl CHANGED
@@ -1055,3 +1055,507 @@
1055
  {"current_steps": 1055, "total_steps": 1560, "loss": 0.2, "lr": 2.866650361271023e-06, "epoch": 2.02752, "percentage": 67.63, "elapsed_time": "2:41:42", "remaining_time": "1:17:24"}
1056
  {"current_steps": 1056, "total_steps": 1560, "loss": 0.1395, "lr": 2.8565371929847286e-06, "epoch": 2.02944, "percentage": 67.69, "elapsed_time": "2:41:51", "remaining_time": "1:17:15"}
1057
  {"current_steps": 1057, "total_steps": 1560, "loss": 0.152, "lr": 2.84643475671417e-06, "epoch": 2.03136, "percentage": 67.76, "elapsed_time": "2:42:00", "remaining_time": "1:17:05"}
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1055
  {"current_steps": 1055, "total_steps": 1560, "loss": 0.2, "lr": 2.866650361271023e-06, "epoch": 2.02752, "percentage": 67.63, "elapsed_time": "2:41:42", "remaining_time": "1:17:24"}
1056
  {"current_steps": 1056, "total_steps": 1560, "loss": 0.1395, "lr": 2.8565371929847286e-06, "epoch": 2.02944, "percentage": 67.69, "elapsed_time": "2:41:51", "remaining_time": "1:17:15"}
1057
  {"current_steps": 1057, "total_steps": 1560, "loss": 0.152, "lr": 2.84643475671417e-06, "epoch": 2.03136, "percentage": 67.76, "elapsed_time": "2:42:00", "remaining_time": "1:17:05"}
1058
+ {"current_steps": 1058, "total_steps": 1560, "loss": 0.1685, "lr": 2.836343103040819e-06, "epoch": 2.03328, "percentage": 67.82, "elapsed_time": "2:42:09", "remaining_time": "1:16:56"}
1059
+ {"current_steps": 1059, "total_steps": 1560, "loss": 0.1692, "lr": 2.8262622824921593e-06, "epoch": 2.0352, "percentage": 67.88, "elapsed_time": "2:42:19", "remaining_time": "1:16:47"}
1060
+ {"current_steps": 1060, "total_steps": 1560, "loss": 0.1657, "lr": 2.816192345541437e-06, "epoch": 2.03712, "percentage": 67.95, "elapsed_time": "2:42:28", "remaining_time": "1:16:38"}
1061
+ {"current_steps": 1061, "total_steps": 1560, "loss": 0.2042, "lr": 2.8061333426074054e-06, "epoch": 2.03904, "percentage": 68.01, "elapsed_time": "2:42:38", "remaining_time": "1:16:29"}
1062
+ {"current_steps": 1062, "total_steps": 1560, "loss": 0.1747, "lr": 2.7960853240540703e-06, "epoch": 2.04096, "percentage": 68.08, "elapsed_time": "2:42:47", "remaining_time": "1:16:20"}
1063
+ {"current_steps": 1063, "total_steps": 1560, "loss": 0.175, "lr": 2.7860483401904483e-06, "epoch": 2.04288, "percentage": 68.14, "elapsed_time": "2:42:56", "remaining_time": "1:16:11"}
1064
+ {"current_steps": 1064, "total_steps": 1560, "loss": 0.1725, "lr": 2.776022441270295e-06, "epoch": 2.0448, "percentage": 68.21, "elapsed_time": "2:43:06", "remaining_time": "1:16:02"}
1065
+ {"current_steps": 1065, "total_steps": 1560, "loss": 0.2107, "lr": 2.766007677491871e-06, "epoch": 2.04672, "percentage": 68.27, "elapsed_time": "2:43:15", "remaining_time": "1:15:52"}
1066
+ {"current_steps": 1066, "total_steps": 1560, "loss": 0.1681, "lr": 2.7560040989976894e-06, "epoch": 2.04864, "percentage": 68.33, "elapsed_time": "2:43:25", "remaining_time": "1:15:43"}
1067
+ {"current_steps": 1067, "total_steps": 1560, "loss": 0.1706, "lr": 2.7460117558742532e-06, "epoch": 2.05056, "percentage": 68.4, "elapsed_time": "2:43:34", "remaining_time": "1:15:34"}
1068
+ {"current_steps": 1068, "total_steps": 1560, "loss": 0.1579, "lr": 2.736030698151815e-06, "epoch": 2.05248, "percentage": 68.46, "elapsed_time": "2:43:43", "remaining_time": "1:15:25"}
1069
+ {"current_steps": 1069, "total_steps": 1560, "loss": 0.1745, "lr": 2.72606097580412e-06, "epoch": 2.0544, "percentage": 68.53, "elapsed_time": "2:43:53", "remaining_time": "1:15:16"}
1070
+ {"current_steps": 1070, "total_steps": 1560, "loss": 0.1853, "lr": 2.7161026387481636e-06, "epoch": 2.05632, "percentage": 68.59, "elapsed_time": "2:44:02", "remaining_time": "1:15:07"}
1071
+ {"current_steps": 1071, "total_steps": 1560, "loss": 0.1697, "lr": 2.7061557368439294e-06, "epoch": 2.05824, "percentage": 68.65, "elapsed_time": "2:44:12", "remaining_time": "1:14:58"}
1072
+ {"current_steps": 1072, "total_steps": 1560, "loss": 0.2094, "lr": 2.6962203198941587e-06, "epoch": 2.06016, "percentage": 68.72, "elapsed_time": "2:44:21", "remaining_time": "1:14:49"}
1073
+ {"current_steps": 1073, "total_steps": 1560, "loss": 0.1661, "lr": 2.686296437644074e-06, "epoch": 2.06208, "percentage": 68.78, "elapsed_time": "2:44:30", "remaining_time": "1:14:39"}
1074
+ {"current_steps": 1074, "total_steps": 1560, "loss": 0.1804, "lr": 2.6763841397811576e-06, "epoch": 2.064, "percentage": 68.85, "elapsed_time": "2:44:40", "remaining_time": "1:14:30"}
1075
+ {"current_steps": 1075, "total_steps": 1560, "loss": 0.153, "lr": 2.666483475934885e-06, "epoch": 2.06592, "percentage": 68.91, "elapsed_time": "2:44:49", "remaining_time": "1:14:21"}
1076
+ {"current_steps": 1076, "total_steps": 1560, "loss": 0.1871, "lr": 2.656594495676482e-06, "epoch": 2.06784, "percentage": 68.97, "elapsed_time": "2:44:58", "remaining_time": "1:14:12"}
1077
+ {"current_steps": 1077, "total_steps": 1560, "loss": 0.1703, "lr": 2.6467172485186775e-06, "epoch": 2.06976, "percentage": 69.04, "elapsed_time": "2:45:07", "remaining_time": "1:14:03"}
1078
+ {"current_steps": 1078, "total_steps": 1560, "loss": 0.1498, "lr": 2.636851783915454e-06, "epoch": 2.07168, "percentage": 69.1, "elapsed_time": "2:45:17", "remaining_time": "1:13:54"}
1079
+ {"current_steps": 1079, "total_steps": 1560, "loss": 0.2051, "lr": 2.626998151261798e-06, "epoch": 2.0736, "percentage": 69.17, "elapsed_time": "2:45:26", "remaining_time": "1:13:45"}
1080
+ {"current_steps": 1080, "total_steps": 1560, "loss": 0.1706, "lr": 2.6171563998934605e-06, "epoch": 2.07552, "percentage": 69.23, "elapsed_time": "2:45:35", "remaining_time": "1:13:35"}
1081
+ {"current_steps": 1081, "total_steps": 1560, "loss": 0.1781, "lr": 2.607326579086701e-06, "epoch": 2.07744, "percentage": 69.29, "elapsed_time": "2:45:45", "remaining_time": "1:13:26"}
1082
+ {"current_steps": 1082, "total_steps": 1560, "loss": 0.1585, "lr": 2.5975087380580445e-06, "epoch": 2.07936, "percentage": 69.36, "elapsed_time": "2:45:54", "remaining_time": "1:13:17"}
1083
+ {"current_steps": 1083, "total_steps": 1560, "loss": 0.159, "lr": 2.587702925964034e-06, "epoch": 2.08128, "percentage": 69.42, "elapsed_time": "2:46:04", "remaining_time": "1:13:08"}
1084
+ {"current_steps": 1084, "total_steps": 1560, "loss": 0.1917, "lr": 2.577909191900988e-06, "epoch": 2.0832, "percentage": 69.49, "elapsed_time": "2:46:13", "remaining_time": "1:12:59"}
1085
+ {"current_steps": 1085, "total_steps": 1560, "loss": 0.1537, "lr": 2.5681275849047482e-06, "epoch": 2.08512, "percentage": 69.55, "elapsed_time": "2:46:22", "remaining_time": "1:12:50"}
1086
+ {"current_steps": 1086, "total_steps": 1560, "loss": 0.166, "lr": 2.5583581539504464e-06, "epoch": 2.08704, "percentage": 69.62, "elapsed_time": "2:46:32", "remaining_time": "1:12:41"}
1087
+ {"current_steps": 1087, "total_steps": 1560, "loss": 0.2267, "lr": 2.5486009479522355e-06, "epoch": 2.08896, "percentage": 69.68, "elapsed_time": "2:46:41", "remaining_time": "1:12:32"}
1088
+ {"current_steps": 1088, "total_steps": 1560, "loss": 0.194, "lr": 2.5388560157630765e-06, "epoch": 2.09088, "percentage": 69.74, "elapsed_time": "2:46:50", "remaining_time": "1:12:22"}
1089
+ {"current_steps": 1089, "total_steps": 1560, "loss": 0.2013, "lr": 2.5291234061744655e-06, "epoch": 2.0928, "percentage": 69.81, "elapsed_time": "2:46:59", "remaining_time": "1:12:13"}
1090
+ {"current_steps": 1090, "total_steps": 1560, "loss": 0.1547, "lr": 2.519403167916207e-06, "epoch": 2.09472, "percentage": 69.87, "elapsed_time": "2:47:09", "remaining_time": "1:12:04"}
1091
+ {"current_steps": 1091, "total_steps": 1560, "loss": 0.1897, "lr": 2.50969534965616e-06, "epoch": 2.09664, "percentage": 69.94, "elapsed_time": "2:47:18", "remaining_time": "1:11:55"}
1092
+ {"current_steps": 1092, "total_steps": 1560, "loss": 0.1562, "lr": 2.5000000000000015e-06, "epoch": 2.09856, "percentage": 70.0, "elapsed_time": "2:47:27", "remaining_time": "1:11:46"}
1093
+ {"current_steps": 1093, "total_steps": 1560, "loss": 0.1862, "lr": 2.490317167490976e-06, "epoch": 2.10048, "percentage": 70.06, "elapsed_time": "2:47:37", "remaining_time": "1:11:37"}
1094
+ {"current_steps": 1094, "total_steps": 1560, "loss": 0.1681, "lr": 2.480646900609664e-06, "epoch": 2.1024, "percentage": 70.13, "elapsed_time": "2:47:46", "remaining_time": "1:11:27"}
1095
+ {"current_steps": 1095, "total_steps": 1560, "loss": 0.2487, "lr": 2.4709892477737263e-06, "epoch": 2.10432, "percentage": 70.19, "elapsed_time": "2:47:55", "remaining_time": "1:11:18"}
1096
+ {"current_steps": 1096, "total_steps": 1560, "loss": 0.2103, "lr": 2.4613442573376625e-06, "epoch": 2.10624, "percentage": 70.26, "elapsed_time": "2:48:05", "remaining_time": "1:11:09"}
1097
+ {"current_steps": 1097, "total_steps": 1560, "loss": 0.1881, "lr": 2.4517119775925824e-06, "epoch": 2.10816, "percentage": 70.32, "elapsed_time": "2:48:13", "remaining_time": "1:11:00"}
1098
+ {"current_steps": 1098, "total_steps": 1560, "loss": 0.2005, "lr": 2.4420924567659508e-06, "epoch": 2.11008, "percentage": 70.38, "elapsed_time": "2:48:23", "remaining_time": "1:10:51"}
1099
+ {"current_steps": 1099, "total_steps": 1560, "loss": 0.1708, "lr": 2.4324857430213504e-06, "epoch": 2.112, "percentage": 70.45, "elapsed_time": "2:48:32", "remaining_time": "1:10:41"}
1100
+ {"current_steps": 1100, "total_steps": 1560, "loss": 0.1723, "lr": 2.422891884458241e-06, "epoch": 2.11392, "percentage": 70.51, "elapsed_time": "2:48:41", "remaining_time": "1:10:32"}
1101
+ {"current_steps": 1101, "total_steps": 1560, "loss": 0.175, "lr": 2.4133109291117156e-06, "epoch": 2.11584, "percentage": 70.58, "elapsed_time": "2:48:51", "remaining_time": "1:10:23"}
1102
+ {"current_steps": 1102, "total_steps": 1560, "loss": 0.1482, "lr": 2.4037429249522702e-06, "epoch": 2.11776, "percentage": 70.64, "elapsed_time": "2:49:00", "remaining_time": "1:10:14"}
1103
+ {"current_steps": 1103, "total_steps": 1560, "loss": 0.1948, "lr": 2.394187919885548e-06, "epoch": 2.11968, "percentage": 70.71, "elapsed_time": "2:49:09", "remaining_time": "1:10:05"}
1104
+ {"current_steps": 1104, "total_steps": 1560, "loss": 0.1912, "lr": 2.384645961752113e-06, "epoch": 2.1216, "percentage": 70.77, "elapsed_time": "2:49:18", "remaining_time": "1:09:56"}
1105
+ {"current_steps": 1105, "total_steps": 1560, "loss": 0.1742, "lr": 2.3751170983272e-06, "epoch": 2.12352, "percentage": 70.83, "elapsed_time": "2:49:28", "remaining_time": "1:09:46"}
1106
+ {"current_steps": 1106, "total_steps": 1560, "loss": 0.2181, "lr": 2.3656013773204843e-06, "epoch": 2.12544, "percentage": 70.9, "elapsed_time": "2:49:37", "remaining_time": "1:09:37"}
1107
+ {"current_steps": 1107, "total_steps": 1560, "loss": 0.1871, "lr": 2.3560988463758366e-06, "epoch": 2.12736, "percentage": 70.96, "elapsed_time": "2:49:46", "remaining_time": "1:09:28"}
1108
+ {"current_steps": 1108, "total_steps": 1560, "loss": 0.1632, "lr": 2.346609553071093e-06, "epoch": 2.12928, "percentage": 71.03, "elapsed_time": "2:49:55", "remaining_time": "1:09:19"}
1109
+ {"current_steps": 1109, "total_steps": 1560, "loss": 0.1822, "lr": 2.3371335449178006e-06, "epoch": 2.1312, "percentage": 71.09, "elapsed_time": "2:50:04", "remaining_time": "1:09:09"}
1110
+ {"current_steps": 1110, "total_steps": 1560, "loss": 0.1319, "lr": 2.3276708693609947e-06, "epoch": 2.13312, "percentage": 71.15, "elapsed_time": "2:50:13", "remaining_time": "1:09:00"}
1111
+ {"current_steps": 1111, "total_steps": 1560, "loss": 0.1526, "lr": 2.3182215737789593e-06, "epoch": 2.13504, "percentage": 71.22, "elapsed_time": "2:50:22", "remaining_time": "1:08:51"}
1112
+ {"current_steps": 1112, "total_steps": 1560, "loss": 0.186, "lr": 2.308785705482982e-06, "epoch": 2.13696, "percentage": 71.28, "elapsed_time": "2:50:31", "remaining_time": "1:08:41"}
1113
+ {"current_steps": 1113, "total_steps": 1560, "loss": 0.1468, "lr": 2.2993633117171243e-06, "epoch": 2.13888, "percentage": 71.35, "elapsed_time": "2:50:40", "remaining_time": "1:08:32"}
1114
+ {"current_steps": 1114, "total_steps": 1560, "loss": 0.1699, "lr": 2.289954439657981e-06, "epoch": 2.1408, "percentage": 71.41, "elapsed_time": "2:50:49", "remaining_time": "1:08:23"}
1115
+ {"current_steps": 1115, "total_steps": 1560, "loss": 0.173, "lr": 2.2805591364144446e-06, "epoch": 2.14272, "percentage": 71.47, "elapsed_time": "2:50:58", "remaining_time": "1:08:14"}
1116
+ {"current_steps": 1116, "total_steps": 1560, "loss": 0.1683, "lr": 2.2711774490274767e-06, "epoch": 2.14464, "percentage": 71.54, "elapsed_time": "2:51:07", "remaining_time": "1:08:04"}
1117
+ {"current_steps": 1117, "total_steps": 1560, "loss": 0.1664, "lr": 2.2618094244698614e-06, "epoch": 2.14656, "percentage": 71.6, "elapsed_time": "2:51:16", "remaining_time": "1:07:55"}
1118
+ {"current_steps": 1118, "total_steps": 1560, "loss": 0.1922, "lr": 2.2524551096459703e-06, "epoch": 2.14848, "percentage": 71.67, "elapsed_time": "2:51:25", "remaining_time": "1:07:46"}
1119
+ {"current_steps": 1119, "total_steps": 1560, "loss": 0.1836, "lr": 2.243114551391542e-06, "epoch": 2.1504, "percentage": 71.73, "elapsed_time": "2:51:34", "remaining_time": "1:07:37"}
1120
+ {"current_steps": 1120, "total_steps": 1560, "loss": 0.1524, "lr": 2.2337877964734324e-06, "epoch": 2.15232, "percentage": 71.79, "elapsed_time": "2:51:43", "remaining_time": "1:07:27"}
1121
+ {"current_steps": 1121, "total_steps": 1560, "loss": 0.1846, "lr": 2.224474891589386e-06, "epoch": 2.15424, "percentage": 71.86, "elapsed_time": "2:51:52", "remaining_time": "1:07:18"}
1122
+ {"current_steps": 1122, "total_steps": 1560, "loss": 0.1572, "lr": 2.2151758833678044e-06, "epoch": 2.15616, "percentage": 71.92, "elapsed_time": "2:52:01", "remaining_time": "1:07:09"}
1123
+ {"current_steps": 1123, "total_steps": 1560, "loss": 0.159, "lr": 2.205890818367508e-06, "epoch": 2.15808, "percentage": 71.99, "elapsed_time": "2:52:10", "remaining_time": "1:06:59"}
1124
+ {"current_steps": 1124, "total_steps": 1560, "loss": 0.1818, "lr": 2.1966197430775056e-06, "epoch": 2.16, "percentage": 72.05, "elapsed_time": "2:52:19", "remaining_time": "1:06:50"}
1125
+ {"current_steps": 1125, "total_steps": 1560, "loss": 0.1581, "lr": 2.187362703916766e-06, "epoch": 2.16192, "percentage": 72.12, "elapsed_time": "2:52:28", "remaining_time": "1:06:41"}
1126
+ {"current_steps": 1126, "total_steps": 1560, "loss": 0.1487, "lr": 2.178119747233976e-06, "epoch": 2.16384, "percentage": 72.18, "elapsed_time": "2:52:37", "remaining_time": "1:06:31"}
1127
+ {"current_steps": 1127, "total_steps": 1560, "loss": 0.2019, "lr": 2.168890919307315e-06, "epoch": 2.16576, "percentage": 72.24, "elapsed_time": "2:52:45", "remaining_time": "1:06:22"}
1128
+ {"current_steps": 1128, "total_steps": 1560, "loss": 0.2035, "lr": 2.159676266344222e-06, "epoch": 2.16768, "percentage": 72.31, "elapsed_time": "2:52:54", "remaining_time": "1:06:13"}
1129
+ {"current_steps": 1129, "total_steps": 1560, "loss": 0.2016, "lr": 2.1504758344811615e-06, "epoch": 2.1696, "percentage": 72.37, "elapsed_time": "2:53:03", "remaining_time": "1:06:04"}
1130
+ {"current_steps": 1130, "total_steps": 1560, "loss": 0.1917, "lr": 2.141289669783401e-06, "epoch": 2.17152, "percentage": 72.44, "elapsed_time": "2:53:13", "remaining_time": "1:05:54"}
1131
+ {"current_steps": 1131, "total_steps": 1560, "loss": 0.1589, "lr": 2.132117818244771e-06, "epoch": 2.17344, "percentage": 72.5, "elapsed_time": "2:53:22", "remaining_time": "1:05:45"}
1132
+ {"current_steps": 1132, "total_steps": 1560, "loss": 0.1919, "lr": 2.122960325787432e-06, "epoch": 2.17536, "percentage": 72.56, "elapsed_time": "2:53:31", "remaining_time": "1:05:36"}
1133
+ {"current_steps": 1133, "total_steps": 1560, "loss": 0.1646, "lr": 2.1138172382616612e-06, "epoch": 2.17728, "percentage": 72.63, "elapsed_time": "2:53:41", "remaining_time": "1:05:27"}
1134
+ {"current_steps": 1134, "total_steps": 1560, "loss": 0.1754, "lr": 2.104688601445606e-06, "epoch": 2.1792, "percentage": 72.69, "elapsed_time": "2:53:50", "remaining_time": "1:05:18"}
1135
+ {"current_steps": 1135, "total_steps": 1560, "loss": 0.1617, "lr": 2.0955744610450616e-06, "epoch": 2.18112, "percentage": 72.76, "elapsed_time": "2:53:59", "remaining_time": "1:05:09"}
1136
+ {"current_steps": 1136, "total_steps": 1560, "loss": 0.187, "lr": 2.086474862693244e-06, "epoch": 2.18304, "percentage": 72.82, "elapsed_time": "2:54:09", "remaining_time": "1:05:00"}
1137
+ {"current_steps": 1137, "total_steps": 1560, "loss": 0.172, "lr": 2.077389851950557e-06, "epoch": 2.1849600000000002, "percentage": 72.88, "elapsed_time": "2:54:18", "remaining_time": "1:04:50"}
1138
+ {"current_steps": 1138, "total_steps": 1560, "loss": 0.1654, "lr": 2.068319474304365e-06, "epoch": 2.18688, "percentage": 72.95, "elapsed_time": "2:54:27", "remaining_time": "1:04:41"}
1139
+ {"current_steps": 1139, "total_steps": 1560, "loss": 0.1702, "lr": 2.059263775168773e-06, "epoch": 2.1888, "percentage": 73.01, "elapsed_time": "2:54:37", "remaining_time": "1:04:32"}
1140
+ {"current_steps": 1140, "total_steps": 1560, "loss": 0.2147, "lr": 2.050222799884387e-06, "epoch": 2.19072, "percentage": 73.08, "elapsed_time": "2:54:46", "remaining_time": "1:04:23"}
1141
+ {"current_steps": 1141, "total_steps": 1560, "loss": 0.1798, "lr": 2.0411965937180907e-06, "epoch": 2.19264, "percentage": 73.14, "elapsed_time": "2:54:55", "remaining_time": "1:04:14"}
1142
+ {"current_steps": 1142, "total_steps": 1560, "loss": 0.1699, "lr": 2.0321852018628278e-06, "epoch": 2.19456, "percentage": 73.21, "elapsed_time": "2:55:05", "remaining_time": "1:04:05"}
1143
+ {"current_steps": 1143, "total_steps": 1560, "loss": 0.1741, "lr": 2.0231886694373653e-06, "epoch": 2.19648, "percentage": 73.27, "elapsed_time": "2:55:14", "remaining_time": "1:03:55"}
1144
+ {"current_steps": 1144, "total_steps": 1560, "loss": 0.1655, "lr": 2.0142070414860704e-06, "epoch": 2.1984, "percentage": 73.33, "elapsed_time": "2:55:23", "remaining_time": "1:03:46"}
1145
+ {"current_steps": 1145, "total_steps": 1560, "loss": 0.1669, "lr": 2.005240362978686e-06, "epoch": 2.20032, "percentage": 73.4, "elapsed_time": "2:55:32", "remaining_time": "1:03:37"}
1146
+ {"current_steps": 1146, "total_steps": 1560, "loss": 0.1701, "lr": 1.996288678810105e-06, "epoch": 2.20224, "percentage": 73.46, "elapsed_time": "2:55:42", "remaining_time": "1:03:28"}
1147
+ {"current_steps": 1147, "total_steps": 1560, "loss": 0.1817, "lr": 1.98735203380015e-06, "epoch": 2.20416, "percentage": 73.53, "elapsed_time": "2:55:51", "remaining_time": "1:03:19"}
1148
+ {"current_steps": 1148, "total_steps": 1560, "loss": 0.1741, "lr": 1.9784304726933384e-06, "epoch": 2.20608, "percentage": 73.59, "elapsed_time": "2:56:00", "remaining_time": "1:03:10"}
1149
+ {"current_steps": 1149, "total_steps": 1560, "loss": 0.1563, "lr": 1.9695240401586687e-06, "epoch": 2.208, "percentage": 73.65, "elapsed_time": "2:56:09", "remaining_time": "1:03:00"}
1150
+ {"current_steps": 1150, "total_steps": 1560, "loss": 0.2083, "lr": 1.9606327807893905e-06, "epoch": 2.20992, "percentage": 73.72, "elapsed_time": "2:56:18", "remaining_time": "1:02:51"}
1151
+ {"current_steps": 1151, "total_steps": 1560, "loss": 0.1601, "lr": 1.9517567391027853e-06, "epoch": 2.21184, "percentage": 73.78, "elapsed_time": "2:56:27", "remaining_time": "1:02:42"}
1152
+ {"current_steps": 1152, "total_steps": 1560, "loss": 0.1968, "lr": 1.942895959539939e-06, "epoch": 2.21376, "percentage": 73.85, "elapsed_time": "2:56:37", "remaining_time": "1:02:33"}
1153
+ {"current_steps": 1153, "total_steps": 1560, "loss": 0.1881, "lr": 1.934050486465529e-06, "epoch": 2.21568, "percentage": 73.91, "elapsed_time": "2:56:46", "remaining_time": "1:02:24"}
1154
+ {"current_steps": 1154, "total_steps": 1560, "loss": 0.2102, "lr": 1.9252203641675854e-06, "epoch": 2.2176, "percentage": 73.97, "elapsed_time": "2:56:55", "remaining_time": "1:02:14"}
1155
+ {"current_steps": 1155, "total_steps": 1560, "loss": 0.1762, "lr": 1.9164056368572847e-06, "epoch": 2.21952, "percentage": 74.04, "elapsed_time": "2:57:05", "remaining_time": "1:02:05"}
1156
+ {"current_steps": 1156, "total_steps": 1560, "loss": 0.1983, "lr": 1.9076063486687256e-06, "epoch": 2.22144, "percentage": 74.1, "elapsed_time": "2:57:14", "remaining_time": "1:01:56"}
1157
+ {"current_steps": 1157, "total_steps": 1560, "loss": 0.2091, "lr": 1.8988225436587005e-06, "epoch": 2.22336, "percentage": 74.17, "elapsed_time": "2:57:23", "remaining_time": "1:01:47"}
1158
+ {"current_steps": 1158, "total_steps": 1560, "loss": 0.2038, "lr": 1.8900542658064807e-06, "epoch": 2.22528, "percentage": 74.23, "elapsed_time": "2:57:33", "remaining_time": "1:01:38"}
1159
+ {"current_steps": 1159, "total_steps": 1560, "loss": 0.1815, "lr": 1.8813015590135963e-06, "epoch": 2.2272, "percentage": 74.29, "elapsed_time": "2:57:42", "remaining_time": "1:01:29"}
1160
+ {"current_steps": 1160, "total_steps": 1560, "loss": 0.1467, "lr": 1.8725644671036125e-06, "epoch": 2.22912, "percentage": 74.36, "elapsed_time": "2:57:51", "remaining_time": "1:01:19"}
1161
+ {"current_steps": 1161, "total_steps": 1560, "loss": 0.1708, "lr": 1.8638430338219199e-06, "epoch": 2.23104, "percentage": 74.42, "elapsed_time": "2:58:01", "remaining_time": "1:01:10"}
1162
+ {"current_steps": 1162, "total_steps": 1560, "loss": 0.2108, "lr": 1.8551373028355013e-06, "epoch": 2.23296, "percentage": 74.49, "elapsed_time": "2:58:10", "remaining_time": "1:01:01"}
1163
+ {"current_steps": 1163, "total_steps": 1560, "loss": 0.1477, "lr": 1.846447317732723e-06, "epoch": 2.23488, "percentage": 74.55, "elapsed_time": "2:58:19", "remaining_time": "1:00:52"}
1164
+ {"current_steps": 1164, "total_steps": 1560, "loss": 0.1838, "lr": 1.8377731220231144e-06, "epoch": 2.2368, "percentage": 74.62, "elapsed_time": "2:58:28", "remaining_time": "1:00:43"}
1165
+ {"current_steps": 1165, "total_steps": 1560, "loss": 0.2023, "lr": 1.8291147591371482e-06, "epoch": 2.23872, "percentage": 74.68, "elapsed_time": "2:58:37", "remaining_time": "1:00:33"}
1166
+ {"current_steps": 1166, "total_steps": 1560, "loss": 0.1574, "lr": 1.8204722724260266e-06, "epoch": 2.24064, "percentage": 74.74, "elapsed_time": "2:58:46", "remaining_time": "1:00:24"}
1167
+ {"current_steps": 1167, "total_steps": 1560, "loss": 0.1889, "lr": 1.8118457051614591e-06, "epoch": 2.24256, "percentage": 74.81, "elapsed_time": "2:58:56", "remaining_time": "1:00:15"}
1168
+ {"current_steps": 1168, "total_steps": 1560, "loss": 0.2189, "lr": 1.803235100535452e-06, "epoch": 2.24448, "percentage": 74.87, "elapsed_time": "2:59:05", "remaining_time": "1:00:06"}
1169
+ {"current_steps": 1169, "total_steps": 1560, "loss": 0.1932, "lr": 1.7946405016600843e-06, "epoch": 2.2464, "percentage": 74.94, "elapsed_time": "2:59:14", "remaining_time": "0:59:57"}
1170
+ {"current_steps": 1170, "total_steps": 1560, "loss": 0.1954, "lr": 1.7860619515673034e-06, "epoch": 2.24832, "percentage": 75.0, "elapsed_time": "2:59:23", "remaining_time": "0:59:47"}
1171
+ {"current_steps": 1171, "total_steps": 1560, "loss": 0.1427, "lr": 1.7774994932086976e-06, "epoch": 2.25024, "percentage": 75.06, "elapsed_time": "2:59:32", "remaining_time": "0:59:38"}
1172
+ {"current_steps": 1172, "total_steps": 1560, "loss": 0.1918, "lr": 1.7689531694552863e-06, "epoch": 2.25216, "percentage": 75.13, "elapsed_time": "2:59:41", "remaining_time": "0:59:29"}
1173
+ {"current_steps": 1173, "total_steps": 1560, "loss": 0.1919, "lr": 1.7604230230973068e-06, "epoch": 2.25408, "percentage": 75.19, "elapsed_time": "2:59:51", "remaining_time": "0:59:20"}
1174
+ {"current_steps": 1174, "total_steps": 1560, "loss": 0.1586, "lr": 1.7519090968439966e-06, "epoch": 2.2560000000000002, "percentage": 75.26, "elapsed_time": "3:00:00", "remaining_time": "0:59:11"}
1175
+ {"current_steps": 1175, "total_steps": 1560, "loss": 0.1854, "lr": 1.7434114333233853e-06, "epoch": 2.25792, "percentage": 75.32, "elapsed_time": "3:00:09", "remaining_time": "0:59:01"}
1176
+ {"current_steps": 1176, "total_steps": 1560, "loss": 0.2069, "lr": 1.7349300750820758e-06, "epoch": 2.25984, "percentage": 75.38, "elapsed_time": "3:00:18", "remaining_time": "0:58:52"}
1177
+ {"current_steps": 1177, "total_steps": 1560, "loss": 0.1975, "lr": 1.7264650645850256e-06, "epoch": 2.2617599999999998, "percentage": 75.45, "elapsed_time": "3:00:28", "remaining_time": "0:58:43"}
1178
+ {"current_steps": 1178, "total_steps": 1560, "loss": 0.2015, "lr": 1.7180164442153529e-06, "epoch": 2.26368, "percentage": 75.51, "elapsed_time": "3:00:37", "remaining_time": "0:58:34"}
1179
+ {"current_steps": 1179, "total_steps": 1560, "loss": 0.1651, "lr": 1.709584256274106e-06, "epoch": 2.2656, "percentage": 75.58, "elapsed_time": "3:00:46", "remaining_time": "0:58:25"}
1180
+ {"current_steps": 1180, "total_steps": 1560, "loss": 0.1951, "lr": 1.7011685429800596e-06, "epoch": 2.26752, "percentage": 75.64, "elapsed_time": "3:00:56", "remaining_time": "0:58:16"}
1181
+ {"current_steps": 1181, "total_steps": 1560, "loss": 0.1487, "lr": 1.6927693464695022e-06, "epoch": 2.26944, "percentage": 75.71, "elapsed_time": "3:01:05", "remaining_time": "0:58:06"}
1182
+ {"current_steps": 1182, "total_steps": 1560, "loss": 0.1682, "lr": 1.6843867087960252e-06, "epoch": 2.27136, "percentage": 75.77, "elapsed_time": "3:01:14", "remaining_time": "0:57:57"}
1183
+ {"current_steps": 1183, "total_steps": 1560, "loss": 0.1844, "lr": 1.6760206719303107e-06, "epoch": 2.27328, "percentage": 75.83, "elapsed_time": "3:01:24", "remaining_time": "0:57:48"}
1184
+ {"current_steps": 1184, "total_steps": 1560, "loss": 0.1746, "lr": 1.6676712777599275e-06, "epoch": 2.2752, "percentage": 75.9, "elapsed_time": "3:01:33", "remaining_time": "0:57:39"}
1185
+ {"current_steps": 1185, "total_steps": 1560, "loss": 0.1789, "lr": 1.6593385680891139e-06, "epoch": 2.27712, "percentage": 75.96, "elapsed_time": "3:01:42", "remaining_time": "0:57:30"}
1186
+ {"current_steps": 1186, "total_steps": 1560, "loss": 0.1578, "lr": 1.6510225846385668e-06, "epoch": 2.27904, "percentage": 76.03, "elapsed_time": "3:01:52", "remaining_time": "0:57:21"}
1187
+ {"current_steps": 1187, "total_steps": 1560, "loss": 0.1795, "lr": 1.6427233690452455e-06, "epoch": 2.28096, "percentage": 76.09, "elapsed_time": "3:02:01", "remaining_time": "0:57:11"}
1188
+ {"current_steps": 1188, "total_steps": 1560, "loss": 0.192, "lr": 1.6344409628621482e-06, "epoch": 2.28288, "percentage": 76.15, "elapsed_time": "3:02:10", "remaining_time": "0:57:02"}
1189
+ {"current_steps": 1189, "total_steps": 1560, "loss": 0.1432, "lr": 1.6261754075581187e-06, "epoch": 2.2848, "percentage": 76.22, "elapsed_time": "3:02:19", "remaining_time": "0:56:53"}
1190
+ {"current_steps": 1190, "total_steps": 1560, "loss": 0.1736, "lr": 1.6179267445176206e-06, "epoch": 2.28672, "percentage": 76.28, "elapsed_time": "3:02:29", "remaining_time": "0:56:44"}
1191
+ {"current_steps": 1191, "total_steps": 1560, "loss": 0.2014, "lr": 1.6096950150405454e-06, "epoch": 2.28864, "percentage": 76.35, "elapsed_time": "3:02:38", "remaining_time": "0:56:35"}
1192
+ {"current_steps": 1192, "total_steps": 1560, "loss": 0.2058, "lr": 1.6014802603420044e-06, "epoch": 2.29056, "percentage": 76.41, "elapsed_time": "3:02:47", "remaining_time": "0:56:26"}
1193
+ {"current_steps": 1193, "total_steps": 1560, "loss": 0.1781, "lr": 1.593282521552113e-06, "epoch": 2.29248, "percentage": 76.47, "elapsed_time": "3:02:57", "remaining_time": "0:56:16"}
1194
+ {"current_steps": 1194, "total_steps": 1560, "loss": 0.1575, "lr": 1.5851018397157918e-06, "epoch": 2.2944, "percentage": 76.54, "elapsed_time": "3:03:06", "remaining_time": "0:56:07"}
1195
+ {"current_steps": 1195, "total_steps": 1560, "loss": 0.1453, "lr": 1.5769382557925612e-06, "epoch": 2.29632, "percentage": 76.6, "elapsed_time": "3:03:15", "remaining_time": "0:55:58"}
1196
+ {"current_steps": 1196, "total_steps": 1560, "loss": 0.1638, "lr": 1.5687918106563326e-06, "epoch": 2.29824, "percentage": 76.67, "elapsed_time": "3:03:25", "remaining_time": "0:55:49"}
1197
+ {"current_steps": 1197, "total_steps": 1560, "loss": 0.1784, "lr": 1.5606625450952062e-06, "epoch": 2.30016, "percentage": 76.73, "elapsed_time": "3:03:34", "remaining_time": "0:55:40"}
1198
+ {"current_steps": 1198, "total_steps": 1560, "loss": 0.2021, "lr": 1.5525504998112717e-06, "epoch": 2.30208, "percentage": 76.79, "elapsed_time": "3:03:43", "remaining_time": "0:55:31"}
1199
+ {"current_steps": 1199, "total_steps": 1560, "loss": 0.1502, "lr": 1.5444557154203892e-06, "epoch": 2.304, "percentage": 76.86, "elapsed_time": "3:03:52", "remaining_time": "0:55:21"}
1200
+ {"current_steps": 1200, "total_steps": 1560, "loss": 0.1863, "lr": 1.5363782324520033e-06, "epoch": 2.30592, "percentage": 76.92, "elapsed_time": "3:04:02", "remaining_time": "0:55:12"}
1201
+ {"current_steps": 1201, "total_steps": 1560, "loss": 0.1483, "lr": 1.5283180913489326e-06, "epoch": 2.30784, "percentage": 76.99, "elapsed_time": "3:04:11", "remaining_time": "0:55:03"}
1202
+ {"current_steps": 1202, "total_steps": 1560, "loss": 0.1794, "lr": 1.520275332467166e-06, "epoch": 2.30976, "percentage": 77.05, "elapsed_time": "3:04:20", "remaining_time": "0:54:54"}
1203
+ {"current_steps": 1203, "total_steps": 1560, "loss": 0.1971, "lr": 1.5122499960756604e-06, "epoch": 2.31168, "percentage": 77.12, "elapsed_time": "3:04:30", "remaining_time": "0:54:45"}
1204
+ {"current_steps": 1204, "total_steps": 1560, "loss": 0.2118, "lr": 1.504242122356143e-06, "epoch": 2.3136, "percentage": 77.18, "elapsed_time": "3:04:39", "remaining_time": "0:54:35"}
1205
+ {"current_steps": 1205, "total_steps": 1560, "loss": 0.1738, "lr": 1.4962517514029069e-06, "epoch": 2.3155200000000002, "percentage": 77.24, "elapsed_time": "3:04:48", "remaining_time": "0:54:26"}
1206
+ {"current_steps": 1206, "total_steps": 1560, "loss": 0.1748, "lr": 1.4882789232226124e-06, "epoch": 2.31744, "percentage": 77.31, "elapsed_time": "3:04:58", "remaining_time": "0:54:17"}
1207
+ {"current_steps": 1207, "total_steps": 1560, "loss": 0.1687, "lr": 1.4803236777340856e-06, "epoch": 2.31936, "percentage": 77.37, "elapsed_time": "3:05:07", "remaining_time": "0:54:08"}
1208
+ {"current_steps": 1208, "total_steps": 1560, "loss": 0.1866, "lr": 1.4723860547681163e-06, "epoch": 2.32128, "percentage": 77.44, "elapsed_time": "3:05:16", "remaining_time": "0:53:59"}
1209
+ {"current_steps": 1209, "total_steps": 1560, "loss": 0.1679, "lr": 1.4644660940672628e-06, "epoch": 2.3232, "percentage": 77.5, "elapsed_time": "3:05:26", "remaining_time": "0:53:50"}
1210
+ {"current_steps": 1210, "total_steps": 1560, "loss": 0.2266, "lr": 1.4565638352856504e-06, "epoch": 2.32512, "percentage": 77.56, "elapsed_time": "3:05:35", "remaining_time": "0:53:40"}
1211
+ {"current_steps": 1211, "total_steps": 1560, "loss": 0.1577, "lr": 1.4486793179887738e-06, "epoch": 2.32704, "percentage": 77.63, "elapsed_time": "3:05:44", "remaining_time": "0:53:31"}
1212
+ {"current_steps": 1212, "total_steps": 1560, "loss": 0.1858, "lr": 1.4408125816532981e-06, "epoch": 2.32896, "percentage": 77.69, "elapsed_time": "3:05:53", "remaining_time": "0:53:22"}
1213
+ {"current_steps": 1213, "total_steps": 1560, "loss": 0.1839, "lr": 1.4329636656668617e-06, "epoch": 2.33088, "percentage": 77.76, "elapsed_time": "3:06:02", "remaining_time": "0:53:13"}
1214
+ {"current_steps": 1214, "total_steps": 1560, "loss": 0.16, "lr": 1.4251326093278773e-06, "epoch": 2.3327999999999998, "percentage": 77.82, "elapsed_time": "3:06:11", "remaining_time": "0:53:03"}
1215
+ {"current_steps": 1215, "total_steps": 1560, "loss": 0.2081, "lr": 1.4173194518453415e-06, "epoch": 2.33472, "percentage": 77.88, "elapsed_time": "3:06:20", "remaining_time": "0:52:54"}
1216
+ {"current_steps": 1216, "total_steps": 1560, "loss": 0.1749, "lr": 1.4095242323386305e-06, "epoch": 2.33664, "percentage": 77.95, "elapsed_time": "3:06:29", "remaining_time": "0:52:45"}
1217
+ {"current_steps": 1217, "total_steps": 1560, "loss": 0.1753, "lr": 1.4017469898373077e-06, "epoch": 2.33856, "percentage": 78.01, "elapsed_time": "3:06:38", "remaining_time": "0:52:36"}
1218
+ {"current_steps": 1218, "total_steps": 1560, "loss": 0.1606, "lr": 1.3939877632809279e-06, "epoch": 2.34048, "percentage": 78.08, "elapsed_time": "3:06:47", "remaining_time": "0:52:26"}
1219
+ {"current_steps": 1219, "total_steps": 1560, "loss": 0.1892, "lr": 1.3862465915188427e-06, "epoch": 2.3424, "percentage": 78.14, "elapsed_time": "3:06:56", "remaining_time": "0:52:17"}
1220
+ {"current_steps": 1220, "total_steps": 1560, "loss": 0.1535, "lr": 1.3785235133100088e-06, "epoch": 2.34432, "percentage": 78.21, "elapsed_time": "3:07:05", "remaining_time": "0:52:08"}
1221
+ {"current_steps": 1221, "total_steps": 1560, "loss": 0.1931, "lr": 1.3708185673227896e-06, "epoch": 2.34624, "percentage": 78.27, "elapsed_time": "3:07:15", "remaining_time": "0:51:59"}
1222
+ {"current_steps": 1222, "total_steps": 1560, "loss": 0.1527, "lr": 1.3631317921347564e-06, "epoch": 2.34816, "percentage": 78.33, "elapsed_time": "3:07:24", "remaining_time": "0:51:50"}
1223
+ {"current_steps": 1223, "total_steps": 1560, "loss": 0.2289, "lr": 1.3554632262325129e-06, "epoch": 2.35008, "percentage": 78.4, "elapsed_time": "3:07:33", "remaining_time": "0:51:41"}
1224
+ {"current_steps": 1224, "total_steps": 1560, "loss": 0.2013, "lr": 1.347812908011485e-06, "epoch": 2.352, "percentage": 78.46, "elapsed_time": "3:07:43", "remaining_time": "0:51:31"}
1225
+ {"current_steps": 1225, "total_steps": 1560, "loss": 0.1997, "lr": 1.340180875775735e-06, "epoch": 2.35392, "percentage": 78.53, "elapsed_time": "3:07:52", "remaining_time": "0:51:22"}
1226
+ {"current_steps": 1226, "total_steps": 1560, "loss": 0.2287, "lr": 1.3325671677377727e-06, "epoch": 2.35584, "percentage": 78.59, "elapsed_time": "3:08:01", "remaining_time": "0:51:13"}
1227
+ {"current_steps": 1227, "total_steps": 1560, "loss": 0.1698, "lr": 1.3249718220183583e-06, "epoch": 2.35776, "percentage": 78.65, "elapsed_time": "3:08:11", "remaining_time": "0:51:04"}
1228
+ {"current_steps": 1228, "total_steps": 1560, "loss": 0.1843, "lr": 1.3173948766463146e-06, "epoch": 2.35968, "percentage": 78.72, "elapsed_time": "3:08:20", "remaining_time": "0:50:55"}
1229
+ {"current_steps": 1229, "total_steps": 1560, "loss": 0.1748, "lr": 1.309836369558341e-06, "epoch": 2.3616, "percentage": 78.78, "elapsed_time": "3:08:29", "remaining_time": "0:50:46"}
1230
+ {"current_steps": 1230, "total_steps": 1560, "loss": 0.183, "lr": 1.3022963385988153e-06, "epoch": 2.36352, "percentage": 78.85, "elapsed_time": "3:08:39", "remaining_time": "0:50:36"}
1231
+ {"current_steps": 1231, "total_steps": 1560, "loss": 0.1539, "lr": 1.2947748215196038e-06, "epoch": 2.36544, "percentage": 78.91, "elapsed_time": "3:08:48", "remaining_time": "0:50:27"}
1232
+ {"current_steps": 1232, "total_steps": 1560, "loss": 0.1591, "lr": 1.2872718559798852e-06, "epoch": 2.36736, "percentage": 78.97, "elapsed_time": "3:08:57", "remaining_time": "0:50:18"}
1233
+ {"current_steps": 1233, "total_steps": 1560, "loss": 0.1559, "lr": 1.2797874795459464e-06, "epoch": 2.36928, "percentage": 79.04, "elapsed_time": "3:09:06", "remaining_time": "0:50:09"}
1234
+ {"current_steps": 1234, "total_steps": 1560, "loss": 0.2063, "lr": 1.2723217296910078e-06, "epoch": 2.3712, "percentage": 79.1, "elapsed_time": "3:09:16", "remaining_time": "0:50:00"}
1235
+ {"current_steps": 1235, "total_steps": 1560, "loss": 0.179, "lr": 1.264874643795021e-06, "epoch": 2.37312, "percentage": 79.17, "elapsed_time": "3:09:25", "remaining_time": "0:49:50"}
1236
+ {"current_steps": 1236, "total_steps": 1560, "loss": 0.1874, "lr": 1.257446259144494e-06, "epoch": 2.37504, "percentage": 79.23, "elapsed_time": "3:09:34", "remaining_time": "0:49:41"}
1237
+ {"current_steps": 1237, "total_steps": 1560, "loss": 0.2074, "lr": 1.2500366129323039e-06, "epoch": 2.37696, "percentage": 79.29, "elapsed_time": "3:09:43", "remaining_time": "0:49:32"}
1238
+ {"current_steps": 1238, "total_steps": 1560, "loss": 0.1563, "lr": 1.2426457422575e-06, "epoch": 2.37888, "percentage": 79.36, "elapsed_time": "3:09:53", "remaining_time": "0:49:23"}
1239
+ {"current_steps": 1239, "total_steps": 1560, "loss": 0.1504, "lr": 1.2352736841251306e-06, "epoch": 2.3808, "percentage": 79.42, "elapsed_time": "3:10:02", "remaining_time": "0:49:14"}
1240
+ {"current_steps": 1240, "total_steps": 1560, "loss": 0.1742, "lr": 1.2279204754460494e-06, "epoch": 2.38272, "percentage": 79.49, "elapsed_time": "3:10:11", "remaining_time": "0:49:04"}
1241
+ {"current_steps": 1241, "total_steps": 1560, "loss": 0.1509, "lr": 1.2205861530367342e-06, "epoch": 2.38464, "percentage": 79.55, "elapsed_time": "3:10:20", "remaining_time": "0:48:55"}
1242
+ {"current_steps": 1242, "total_steps": 1560, "loss": 0.1721, "lr": 1.2132707536191008e-06, "epoch": 2.3865600000000002, "percentage": 79.62, "elapsed_time": "3:10:29", "remaining_time": "0:48:46"}
1243
+ {"current_steps": 1243, "total_steps": 1560, "loss": 0.177, "lr": 1.2059743138203256e-06, "epoch": 2.38848, "percentage": 79.68, "elapsed_time": "3:10:38", "remaining_time": "0:48:37"}
1244
+ {"current_steps": 1244, "total_steps": 1560, "loss": 0.1787, "lr": 1.1986968701726492e-06, "epoch": 2.3904, "percentage": 79.74, "elapsed_time": "3:10:47", "remaining_time": "0:48:27"}
1245
+ {"current_steps": 1245, "total_steps": 1560, "loss": 0.1622, "lr": 1.1914384591132045e-06, "epoch": 2.39232, "percentage": 79.81, "elapsed_time": "3:10:56", "remaining_time": "0:48:18"}
1246
+ {"current_steps": 1246, "total_steps": 1560, "loss": 0.1736, "lr": 1.184199116983834e-06, "epoch": 2.39424, "percentage": 79.87, "elapsed_time": "3:11:05", "remaining_time": "0:48:09"}
1247
+ {"current_steps": 1247, "total_steps": 1560, "loss": 0.1706, "lr": 1.1769788800309001e-06, "epoch": 2.39616, "percentage": 79.94, "elapsed_time": "3:11:13", "remaining_time": "0:47:59"}
1248
+ {"current_steps": 1248, "total_steps": 1560, "loss": 0.1701, "lr": 1.1697777844051105e-06, "epoch": 2.39808, "percentage": 80.0, "elapsed_time": "3:11:22", "remaining_time": "0:47:50"}
1249
+ {"current_steps": 1249, "total_steps": 1560, "loss": 0.1979, "lr": 1.1625958661613345e-06, "epoch": 2.4, "percentage": 80.06, "elapsed_time": "3:11:31", "remaining_time": "0:47:41"}
1250
+ {"current_steps": 1250, "total_steps": 1560, "loss": 0.1698, "lr": 1.1554331612584218e-06, "epoch": 2.40192, "percentage": 80.13, "elapsed_time": "3:11:40", "remaining_time": "0:47:32"}
1251
+ {"current_steps": 1251, "total_steps": 1560, "loss": 0.1634, "lr": 1.1482897055590275e-06, "epoch": 2.4038399999999998, "percentage": 80.19, "elapsed_time": "3:11:49", "remaining_time": "0:47:22"}
1252
+ {"current_steps": 1252, "total_steps": 1560, "loss": 0.1681, "lr": 1.141165534829425e-06, "epoch": 2.40576, "percentage": 80.26, "elapsed_time": "3:11:58", "remaining_time": "0:47:13"}
1253
+ {"current_steps": 1253, "total_steps": 1560, "loss": 0.1549, "lr": 1.134060684739331e-06, "epoch": 2.40768, "percentage": 80.32, "elapsed_time": "3:12:06", "remaining_time": "0:47:04"}
1254
+ {"current_steps": 1254, "total_steps": 1560, "loss": 0.1864, "lr": 1.1269751908617277e-06, "epoch": 2.4096, "percentage": 80.38, "elapsed_time": "3:12:15", "remaining_time": "0:46:54"}
1255
+ {"current_steps": 1255, "total_steps": 1560, "loss": 0.1903, "lr": 1.119909088672682e-06, "epoch": 2.41152, "percentage": 80.45, "elapsed_time": "3:12:24", "remaining_time": "0:46:45"}
1256
+ {"current_steps": 1256, "total_steps": 1560, "loss": 0.1749, "lr": 1.1128624135511712e-06, "epoch": 2.41344, "percentage": 80.51, "elapsed_time": "3:12:33", "remaining_time": "0:46:36"}
1257
+ {"current_steps": 1257, "total_steps": 1560, "loss": 0.1718, "lr": 1.105835200778902e-06, "epoch": 2.41536, "percentage": 80.58, "elapsed_time": "3:12:42", "remaining_time": "0:46:27"}
1258
+ {"current_steps": 1258, "total_steps": 1560, "loss": 0.1859, "lr": 1.0988274855401377e-06, "epoch": 2.41728, "percentage": 80.64, "elapsed_time": "3:12:51", "remaining_time": "0:46:17"}
1259
+ {"current_steps": 1259, "total_steps": 1560, "loss": 0.1507, "lr": 1.091839302921518e-06, "epoch": 2.4192, "percentage": 80.71, "elapsed_time": "3:13:00", "remaining_time": "0:46:08"}
1260
+ {"current_steps": 1260, "total_steps": 1560, "loss": 0.169, "lr": 1.0848706879118893e-06, "epoch": 2.42112, "percentage": 80.77, "elapsed_time": "3:13:09", "remaining_time": "0:45:59"}
1261
+ {"current_steps": 1261, "total_steps": 1560, "loss": 0.1782, "lr": 1.0779216754021215e-06, "epoch": 2.42304, "percentage": 80.83, "elapsed_time": "3:13:18", "remaining_time": "0:45:50"}
1262
+ {"current_steps": 1262, "total_steps": 1560, "loss": 0.18, "lr": 1.070992300184941e-06, "epoch": 2.42496, "percentage": 80.9, "elapsed_time": "3:13:27", "remaining_time": "0:45:40"}
1263
+ {"current_steps": 1263, "total_steps": 1560, "loss": 0.171, "lr": 1.0640825969547498e-06, "epoch": 2.42688, "percentage": 80.96, "elapsed_time": "3:13:36", "remaining_time": "0:45:31"}
1264
+ {"current_steps": 1264, "total_steps": 1560, "loss": 0.1393, "lr": 1.057192600307456e-06, "epoch": 2.4288, "percentage": 81.03, "elapsed_time": "3:13:45", "remaining_time": "0:45:22"}
1265
+ {"current_steps": 1265, "total_steps": 1560, "loss": 0.2022, "lr": 1.0503223447403033e-06, "epoch": 2.43072, "percentage": 81.09, "elapsed_time": "3:13:54", "remaining_time": "0:45:13"}
1266
+ {"current_steps": 1266, "total_steps": 1560, "loss": 0.1644, "lr": 1.0434718646516917e-06, "epoch": 2.43264, "percentage": 81.15, "elapsed_time": "3:14:03", "remaining_time": "0:45:03"}
1267
+ {"current_steps": 1267, "total_steps": 1560, "loss": 0.1695, "lr": 1.0366411943410033e-06, "epoch": 2.43456, "percentage": 81.22, "elapsed_time": "3:14:12", "remaining_time": "0:44:54"}
1268
+ {"current_steps": 1268, "total_steps": 1560, "loss": 0.1985, "lr": 1.0298303680084448e-06, "epoch": 2.43648, "percentage": 81.28, "elapsed_time": "3:14:21", "remaining_time": "0:44:45"}
1269
+ {"current_steps": 1269, "total_steps": 1560, "loss": 0.1732, "lr": 1.0230394197548605e-06, "epoch": 2.4384, "percentage": 81.35, "elapsed_time": "3:14:31", "remaining_time": "0:44:36"}
1270
+ {"current_steps": 1270, "total_steps": 1560, "loss": 0.1813, "lr": 1.0162683835815706e-06, "epoch": 2.44032, "percentage": 81.41, "elapsed_time": "3:14:40", "remaining_time": "0:44:27"}
1271
+ {"current_steps": 1271, "total_steps": 1560, "loss": 0.1618, "lr": 1.009517293390197e-06, "epoch": 2.44224, "percentage": 81.47, "elapsed_time": "3:14:49", "remaining_time": "0:44:17"}
1272
+ {"current_steps": 1272, "total_steps": 1560, "loss": 0.1973, "lr": 1.0027861829824953e-06, "epoch": 2.44416, "percentage": 81.54, "elapsed_time": "3:14:58", "remaining_time": "0:44:08"}
1273
+ {"current_steps": 1273, "total_steps": 1560, "loss": 0.1623, "lr": 9.960750860601842e-07, "epoch": 2.44608, "percentage": 81.6, "elapsed_time": "3:15:07", "remaining_time": "0:43:59"}
1274
+ {"current_steps": 1274, "total_steps": 1560, "loss": 0.1964, "lr": 9.893840362247809e-07, "epoch": 2.448, "percentage": 81.67, "elapsed_time": "3:15:17", "remaining_time": "0:43:50"}
1275
+ {"current_steps": 1275, "total_steps": 1560, "loss": 0.2058, "lr": 9.82713066977427e-07, "epoch": 2.44992, "percentage": 81.73, "elapsed_time": "3:15:26", "remaining_time": "0:43:41"}
1276
+ {"current_steps": 1276, "total_steps": 1560, "loss": 0.1683, "lr": 9.760622117187234e-07, "epoch": 2.45184, "percentage": 81.79, "elapsed_time": "3:15:35", "remaining_time": "0:43:31"}
1277
+ {"current_steps": 1277, "total_steps": 1560, "loss": 0.1751, "lr": 9.694315037485635e-07, "epoch": 2.45376, "percentage": 81.86, "elapsed_time": "3:15:44", "remaining_time": "0:43:22"}
1278
+ {"current_steps": 1278, "total_steps": 1560, "loss": 0.1944, "lr": 9.628209762659658e-07, "epoch": 2.45568, "percentage": 81.92, "elapsed_time": "3:15:54", "remaining_time": "0:43:13"}
1279
+ {"current_steps": 1279, "total_steps": 1560, "loss": 0.1633, "lr": 9.562306623689111e-07, "epoch": 2.4576000000000002, "percentage": 81.99, "elapsed_time": "3:16:03", "remaining_time": "0:43:04"}
1280
+ {"current_steps": 1280, "total_steps": 1560, "loss": 0.2106, "lr": 9.496605950541676e-07, "epoch": 2.45952, "percentage": 82.05, "elapsed_time": "3:16:12", "remaining_time": "0:42:55"}
1281
+ {"current_steps": 1281, "total_steps": 1560, "loss": 0.1428, "lr": 9.431108072171346e-07, "epoch": 2.46144, "percentage": 82.12, "elapsed_time": "3:16:21", "remaining_time": "0:42:46"}
1282
+ {"current_steps": 1282, "total_steps": 1560, "loss": 0.176, "lr": 9.365813316516787e-07, "epoch": 2.4633599999999998, "percentage": 82.18, "elapsed_time": "3:16:30", "remaining_time": "0:42:36"}
1283
+ {"current_steps": 1283, "total_steps": 1560, "loss": 0.1923, "lr": 9.300722010499608e-07, "epoch": 2.46528, "percentage": 82.24, "elapsed_time": "3:16:40", "remaining_time": "0:42:27"}
1284
+ {"current_steps": 1284, "total_steps": 1560, "loss": 0.1636, "lr": 9.235834480022788e-07, "epoch": 2.4672, "percentage": 82.31, "elapsed_time": "3:16:49", "remaining_time": "0:42:18"}
1285
+ {"current_steps": 1285, "total_steps": 1560, "loss": 0.2038, "lr": 9.17115104996903e-07, "epoch": 2.46912, "percentage": 82.37, "elapsed_time": "3:16:58", "remaining_time": "0:42:09"}
1286
+ {"current_steps": 1286, "total_steps": 1560, "loss": 0.1624, "lr": 9.10667204419915e-07, "epoch": 2.47104, "percentage": 82.44, "elapsed_time": "3:17:07", "remaining_time": "0:42:00"}
1287
+ {"current_steps": 1287, "total_steps": 1560, "loss": 0.1381, "lr": 9.042397785550405e-07, "epoch": 2.47296, "percentage": 82.5, "elapsed_time": "3:17:16", "remaining_time": "0:41:50"}
1288
+ {"current_steps": 1288, "total_steps": 1560, "loss": 0.172, "lr": 8.978328595834984e-07, "epoch": 2.47488, "percentage": 82.56, "elapsed_time": "3:17:26", "remaining_time": "0:41:41"}
1289
+ {"current_steps": 1289, "total_steps": 1560, "loss": 0.1733, "lr": 8.91446479583823e-07, "epoch": 2.4768, "percentage": 82.63, "elapsed_time": "3:17:35", "remaining_time": "0:41:32"}
1290
+ {"current_steps": 1290, "total_steps": 1560, "loss": 0.1586, "lr": 8.850806705317183e-07, "epoch": 2.47872, "percentage": 82.69, "elapsed_time": "3:17:44", "remaining_time": "0:41:23"}
1291
+ {"current_steps": 1291, "total_steps": 1560, "loss": 0.2182, "lr": 8.787354642998936e-07, "epoch": 2.48064, "percentage": 82.76, "elapsed_time": "3:17:53", "remaining_time": "0:41:14"}
1292
+ {"current_steps": 1292, "total_steps": 1560, "loss": 0.1744, "lr": 8.724108926579e-07, "epoch": 2.48256, "percentage": 82.82, "elapsed_time": "3:18:02", "remaining_time": "0:41:04"}
1293
+ {"current_steps": 1293, "total_steps": 1560, "loss": 0.1735, "lr": 8.661069872719746e-07, "epoch": 2.48448, "percentage": 82.88, "elapsed_time": "3:18:11", "remaining_time": "0:40:55"}
1294
+ {"current_steps": 1294, "total_steps": 1560, "loss": 0.1682, "lr": 8.598237797048825e-07, "epoch": 2.4864, "percentage": 82.95, "elapsed_time": "3:18:21", "remaining_time": "0:40:46"}
1295
+ {"current_steps": 1295, "total_steps": 1560, "loss": 0.1546, "lr": 8.535613014157556e-07, "epoch": 2.48832, "percentage": 83.01, "elapsed_time": "3:18:30", "remaining_time": "0:40:37"}
1296
+ {"current_steps": 1296, "total_steps": 1560, "loss": 0.1697, "lr": 8.473195837599419e-07, "epoch": 2.49024, "percentage": 83.08, "elapsed_time": "3:18:39", "remaining_time": "0:40:28"}
1297
+ {"current_steps": 1297, "total_steps": 1560, "loss": 0.1807, "lr": 8.410986579888381e-07, "epoch": 2.49216, "percentage": 83.14, "elapsed_time": "3:18:48", "remaining_time": "0:40:18"}
1298
+ {"current_steps": 1298, "total_steps": 1560, "loss": 0.2005, "lr": 8.348985552497424e-07, "epoch": 2.49408, "percentage": 83.21, "elapsed_time": "3:18:58", "remaining_time": "0:40:09"}
1299
+ {"current_steps": 1299, "total_steps": 1560, "loss": 0.1784, "lr": 8.287193065856936e-07, "epoch": 2.496, "percentage": 83.27, "elapsed_time": "3:19:07", "remaining_time": "0:40:00"}
1300
+ {"current_steps": 1300, "total_steps": 1560, "loss": 0.1523, "lr": 8.225609429353187e-07, "epoch": 2.49792, "percentage": 83.33, "elapsed_time": "3:19:16", "remaining_time": "0:39:51"}
1301
+ {"current_steps": 1301, "total_steps": 1560, "loss": 0.161, "lr": 8.164234951326727e-07, "epoch": 2.49984, "percentage": 83.4, "elapsed_time": "3:19:25", "remaining_time": "0:39:42"}
1302
+ {"current_steps": 1302, "total_steps": 1560, "loss": 0.1666, "lr": 8.103069939070945e-07, "epoch": 2.50176, "percentage": 83.46, "elapsed_time": "3:19:35", "remaining_time": "0:39:32"}
1303
+ {"current_steps": 1303, "total_steps": 1560, "loss": 0.1914, "lr": 8.042114698830394e-07, "epoch": 2.50368, "percentage": 83.53, "elapsed_time": "3:19:44", "remaining_time": "0:39:23"}
1304
+ {"current_steps": 1304, "total_steps": 1560, "loss": 0.1803, "lr": 7.981369535799354e-07, "epoch": 2.5056000000000003, "percentage": 83.59, "elapsed_time": "3:19:53", "remaining_time": "0:39:14"}
1305
+ {"current_steps": 1305, "total_steps": 1560, "loss": 0.1926, "lr": 7.920834754120305e-07, "epoch": 2.50752, "percentage": 83.65, "elapsed_time": "3:20:02", "remaining_time": "0:39:05"}
1306
+ {"current_steps": 1306, "total_steps": 1560, "loss": 0.1782, "lr": 7.860510656882342e-07, "epoch": 2.50944, "percentage": 83.72, "elapsed_time": "3:20:11", "remaining_time": "0:38:56"}
1307
+ {"current_steps": 1307, "total_steps": 1560, "loss": 0.205, "lr": 7.800397546119709e-07, "epoch": 2.51136, "percentage": 83.78, "elapsed_time": "3:20:20", "remaining_time": "0:38:46"}
1308
+ {"current_steps": 1308, "total_steps": 1560, "loss": 0.1539, "lr": 7.740495722810271e-07, "epoch": 2.51328, "percentage": 83.85, "elapsed_time": "3:20:29", "remaining_time": "0:38:37"}
1309
+ {"current_steps": 1309, "total_steps": 1560, "loss": 0.2204, "lr": 7.680805486873977e-07, "epoch": 2.5152, "percentage": 83.91, "elapsed_time": "3:20:39", "remaining_time": "0:38:28"}
1310
+ {"current_steps": 1310, "total_steps": 1560, "loss": 0.1736, "lr": 7.621327137171447e-07, "epoch": 2.5171200000000002, "percentage": 83.97, "elapsed_time": "3:20:48", "remaining_time": "0:38:19"}
1311
+ {"current_steps": 1311, "total_steps": 1560, "loss": 0.1516, "lr": 7.562060971502383e-07, "epoch": 2.51904, "percentage": 84.04, "elapsed_time": "3:20:57", "remaining_time": "0:38:10"}
1312
+ {"current_steps": 1312, "total_steps": 1560, "loss": 0.146, "lr": 7.50300728660407e-07, "epoch": 2.52096, "percentage": 84.1, "elapsed_time": "3:21:06", "remaining_time": "0:38:00"}
1313
+ {"current_steps": 1313, "total_steps": 1560, "loss": 0.1752, "lr": 7.444166378150014e-07, "epoch": 2.52288, "percentage": 84.17, "elapsed_time": "3:21:15", "remaining_time": "0:37:51"}
1314
+ {"current_steps": 1314, "total_steps": 1560, "loss": 0.191, "lr": 7.385538540748327e-07, "epoch": 2.5248, "percentage": 84.23, "elapsed_time": "3:21:24", "remaining_time": "0:37:42"}
1315
+ {"current_steps": 1315, "total_steps": 1560, "loss": 0.1658, "lr": 7.327124067940311e-07, "epoch": 2.52672, "percentage": 84.29, "elapsed_time": "3:21:34", "remaining_time": "0:37:33"}
1316
+ {"current_steps": 1316, "total_steps": 1560, "loss": 0.1676, "lr": 7.26892325219899e-07, "epoch": 2.52864, "percentage": 84.36, "elapsed_time": "3:21:43", "remaining_time": "0:37:24"}
1317
+ {"current_steps": 1317, "total_steps": 1560, "loss": 0.1639, "lr": 7.210936384927631e-07, "epoch": 2.53056, "percentage": 84.42, "elapsed_time": "3:21:52", "remaining_time": "0:37:14"}
1318
+ {"current_steps": 1318, "total_steps": 1560, "loss": 0.2259, "lr": 7.153163756458287e-07, "epoch": 2.53248, "percentage": 84.49, "elapsed_time": "3:22:01", "remaining_time": "0:37:05"}
1319
+ {"current_steps": 1319, "total_steps": 1560, "loss": 0.1465, "lr": 7.09560565605037e-07, "epoch": 2.5343999999999998, "percentage": 84.55, "elapsed_time": "3:22:11", "remaining_time": "0:36:56"}
1320
+ {"current_steps": 1320, "total_steps": 1560, "loss": 0.1506, "lr": 7.03826237188916e-07, "epoch": 2.53632, "percentage": 84.62, "elapsed_time": "3:22:20", "remaining_time": "0:36:47"}
1321
+ {"current_steps": 1321, "total_steps": 1560, "loss": 0.1898, "lr": 6.981134191084388e-07, "epoch": 2.53824, "percentage": 84.68, "elapsed_time": "3:22:29", "remaining_time": "0:36:38"}
1322
+ {"current_steps": 1322, "total_steps": 1560, "loss": 0.1701, "lr": 6.924221399668785e-07, "epoch": 2.54016, "percentage": 84.74, "elapsed_time": "3:22:39", "remaining_time": "0:36:29"}
1323
+ {"current_steps": 1323, "total_steps": 1560, "loss": 0.1621, "lr": 6.867524282596655e-07, "epoch": 2.54208, "percentage": 84.81, "elapsed_time": "3:22:48", "remaining_time": "0:36:19"}
1324
+ {"current_steps": 1324, "total_steps": 1560, "loss": 0.1969, "lr": 6.811043123742494e-07, "epoch": 2.544, "percentage": 84.87, "elapsed_time": "3:22:57", "remaining_time": "0:36:10"}
1325
+ {"current_steps": 1325, "total_steps": 1560, "loss": 0.1629, "lr": 6.754778205899465e-07, "epoch": 2.5459199999999997, "percentage": 84.94, "elapsed_time": "3:23:07", "remaining_time": "0:36:01"}
1326
+ {"current_steps": 1326, "total_steps": 1560, "loss": 0.1657, "lr": 6.698729810778065e-07, "epoch": 2.54784, "percentage": 85.0, "elapsed_time": "3:23:16", "remaining_time": "0:35:52"}
1327
+ {"current_steps": 1327, "total_steps": 1560, "loss": 0.1427, "lr": 6.642898219004723e-07, "epoch": 2.54976, "percentage": 85.06, "elapsed_time": "3:23:25", "remaining_time": "0:35:43"}
1328
+ {"current_steps": 1328, "total_steps": 1560, "loss": 0.176, "lr": 6.587283710120324e-07, "epoch": 2.55168, "percentage": 85.13, "elapsed_time": "3:23:34", "remaining_time": "0:35:33"}
1329
+ {"current_steps": 1329, "total_steps": 1560, "loss": 0.1738, "lr": 6.531886562578859e-07, "epoch": 2.5536, "percentage": 85.19, "elapsed_time": "3:23:44", "remaining_time": "0:35:24"}
1330
+ {"current_steps": 1330, "total_steps": 1560, "loss": 0.1615, "lr": 6.47670705374604e-07, "epoch": 2.55552, "percentage": 85.26, "elapsed_time": "3:23:53", "remaining_time": "0:35:15"}
1331
+ {"current_steps": 1331, "total_steps": 1560, "loss": 0.191, "lr": 6.421745459897871e-07, "epoch": 2.55744, "percentage": 85.32, "elapsed_time": "3:24:02", "remaining_time": "0:35:06"}
1332
+ {"current_steps": 1332, "total_steps": 1560, "loss": 0.1524, "lr": 6.367002056219285e-07, "epoch": 2.55936, "percentage": 85.38, "elapsed_time": "3:24:12", "remaining_time": "0:34:57"}
1333
+ {"current_steps": 1333, "total_steps": 1560, "loss": 0.1524, "lr": 6.312477116802807e-07, "epoch": 2.56128, "percentage": 85.45, "elapsed_time": "3:24:21", "remaining_time": "0:34:48"}
1334
+ {"current_steps": 1334, "total_steps": 1560, "loss": 0.1785, "lr": 6.258170914647077e-07, "epoch": 2.5632, "percentage": 85.51, "elapsed_time": "3:24:30", "remaining_time": "0:34:38"}
1335
+ {"current_steps": 1335, "total_steps": 1560, "loss": 0.1471, "lr": 6.204083721655607e-07, "epoch": 2.56512, "percentage": 85.58, "elapsed_time": "3:24:39", "remaining_time": "0:34:29"}
1336
+ {"current_steps": 1336, "total_steps": 1560, "loss": 0.1926, "lr": 6.150215808635334e-07, "epoch": 2.56704, "percentage": 85.64, "elapsed_time": "3:24:49", "remaining_time": "0:34:20"}
1337
+ {"current_steps": 1337, "total_steps": 1560, "loss": 0.1954, "lr": 6.096567445295298e-07, "epoch": 2.56896, "percentage": 85.71, "elapsed_time": "3:24:58", "remaining_time": "0:34:11"}
1338
+ {"current_steps": 1338, "total_steps": 1560, "loss": 0.1583, "lr": 6.043138900245277e-07, "epoch": 2.57088, "percentage": 85.77, "elapsed_time": "3:25:07", "remaining_time": "0:34:02"}
1339
+ {"current_steps": 1339, "total_steps": 1560, "loss": 0.2119, "lr": 5.989930440994451e-07, "epoch": 2.5728, "percentage": 85.83, "elapsed_time": "3:25:16", "remaining_time": "0:33:52"}
1340
+ {"current_steps": 1340, "total_steps": 1560, "loss": 0.1751, "lr": 5.936942333950063e-07, "epoch": 2.57472, "percentage": 85.9, "elapsed_time": "3:25:26", "remaining_time": "0:33:43"}
1341
+ {"current_steps": 1341, "total_steps": 1560, "loss": 0.1477, "lr": 5.884174844416102e-07, "epoch": 2.5766400000000003, "percentage": 85.96, "elapsed_time": "3:25:35", "remaining_time": "0:33:34"}
1342
+ {"current_steps": 1342, "total_steps": 1560, "loss": 0.1379, "lr": 5.831628236591929e-07, "epoch": 2.57856, "percentage": 86.03, "elapsed_time": "3:25:44", "remaining_time": "0:33:25"}
1343
+ {"current_steps": 1343, "total_steps": 1560, "loss": 0.1613, "lr": 5.779302773570994e-07, "epoch": 2.58048, "percentage": 86.09, "elapsed_time": "3:25:53", "remaining_time": "0:33:15"}
1344
+ {"current_steps": 1344, "total_steps": 1560, "loss": 0.1595, "lr": 5.727198717339511e-07, "epoch": 2.5824, "percentage": 86.15, "elapsed_time": "3:26:02", "remaining_time": "0:33:06"}
1345
+ {"current_steps": 1345, "total_steps": 1560, "loss": 0.1748, "lr": 5.675316328775126e-07, "epoch": 2.58432, "percentage": 86.22, "elapsed_time": "3:26:11", "remaining_time": "0:32:57"}
1346
+ {"current_steps": 1346, "total_steps": 1560, "loss": 0.1841, "lr": 5.623655867645628e-07, "epoch": 2.58624, "percentage": 86.28, "elapsed_time": "3:26:20", "remaining_time": "0:32:48"}
1347
+ {"current_steps": 1347, "total_steps": 1560, "loss": 0.1304, "lr": 5.572217592607687e-07, "epoch": 2.5881600000000002, "percentage": 86.35, "elapsed_time": "3:26:29", "remaining_time": "0:32:39"}
1348
+ {"current_steps": 1348, "total_steps": 1560, "loss": 0.1983, "lr": 5.521001761205441e-07, "epoch": 2.59008, "percentage": 86.41, "elapsed_time": "3:26:38", "remaining_time": "0:32:29"}
1349
+ {"current_steps": 1349, "total_steps": 1560, "loss": 0.1854, "lr": 5.470008629869367e-07, "epoch": 2.592, "percentage": 86.47, "elapsed_time": "3:26:47", "remaining_time": "0:32:20"}
1350
+ {"current_steps": 1350, "total_steps": 1560, "loss": 0.1781, "lr": 5.41923845391486e-07, "epoch": 2.59392, "percentage": 86.54, "elapsed_time": "3:26:56", "remaining_time": "0:32:11"}
1351
+ {"current_steps": 1351, "total_steps": 1560, "loss": 0.1782, "lr": 5.368691487541027e-07, "epoch": 2.59584, "percentage": 86.6, "elapsed_time": "3:27:05", "remaining_time": "0:32:02"}
1352
+ {"current_steps": 1352, "total_steps": 1560, "loss": 0.1594, "lr": 5.318367983829393e-07, "epoch": 2.59776, "percentage": 86.67, "elapsed_time": "3:27:15", "remaining_time": "0:31:53"}
1353
+ {"current_steps": 1353, "total_steps": 1560, "loss": 0.1738, "lr": 5.268268194742638e-07, "epoch": 2.59968, "percentage": 86.73, "elapsed_time": "3:27:24", "remaining_time": "0:31:43"}
1354
+ {"current_steps": 1354, "total_steps": 1560, "loss": 0.1454, "lr": 5.218392371123326e-07, "epoch": 2.6016, "percentage": 86.79, "elapsed_time": "3:27:33", "remaining_time": "0:31:34"}
1355
+ {"current_steps": 1355, "total_steps": 1560, "loss": 0.1943, "lr": 5.168740762692681e-07, "epoch": 2.60352, "percentage": 86.86, "elapsed_time": "3:27:42", "remaining_time": "0:31:25"}
1356
+ {"current_steps": 1356, "total_steps": 1560, "loss": 0.2222, "lr": 5.119313618049309e-07, "epoch": 2.6054399999999998, "percentage": 86.92, "elapsed_time": "3:27:51", "remaining_time": "0:31:16"}
1357
+ {"current_steps": 1357, "total_steps": 1560, "loss": 0.1435, "lr": 5.070111184667908e-07, "epoch": 2.60736, "percentage": 86.99, "elapsed_time": "3:28:00", "remaining_time": "0:31:07"}
1358
+ {"current_steps": 1358, "total_steps": 1560, "loss": 0.2089, "lr": 5.021133708898146e-07, "epoch": 2.60928, "percentage": 87.05, "elapsed_time": "3:28:09", "remaining_time": "0:30:57"}
1359
+ {"current_steps": 1359, "total_steps": 1560, "loss": 0.1719, "lr": 4.972381435963331e-07, "epoch": 2.6112, "percentage": 87.12, "elapsed_time": "3:28:19", "remaining_time": "0:30:48"}
1360
+ {"current_steps": 1360, "total_steps": 1560, "loss": 0.1948, "lr": 4.9238546099592e-07, "epoch": 2.61312, "percentage": 87.18, "elapsed_time": "3:28:28", "remaining_time": "0:30:39"}
1361
+ {"current_steps": 1361, "total_steps": 1560, "loss": 0.1505, "lr": 4.875553473852735e-07, "epoch": 2.61504, "percentage": 87.24, "elapsed_time": "3:28:37", "remaining_time": "0:30:30"}
1362
+ {"current_steps": 1362, "total_steps": 1560, "loss": 0.2252, "lr": 4.827478269480895e-07, "epoch": 2.6169599999999997, "percentage": 87.31, "elapsed_time": "3:28:46", "remaining_time": "0:30:20"}
1363
+ {"current_steps": 1363, "total_steps": 1560, "loss": 0.1511, "lr": 4.779629237549438e-07, "epoch": 2.61888, "percentage": 87.37, "elapsed_time": "3:28:55", "remaining_time": "0:30:11"}
1364
+ {"current_steps": 1364, "total_steps": 1560, "loss": 0.1866, "lr": 4.732006617631729e-07, "epoch": 2.6208, "percentage": 87.44, "elapsed_time": "3:29:04", "remaining_time": "0:30:02"}
1365
+ {"current_steps": 1365, "total_steps": 1560, "loss": 0.1854, "lr": 4.6846106481675035e-07, "epoch": 2.62272, "percentage": 87.5, "elapsed_time": "3:29:13", "remaining_time": "0:29:53"}
1366
+ {"current_steps": 1366, "total_steps": 1560, "loss": 0.1552, "lr": 4.637441566461681e-07, "epoch": 2.62464, "percentage": 87.56, "elapsed_time": "3:29:22", "remaining_time": "0:29:44"}
1367
+ {"current_steps": 1367, "total_steps": 1560, "loss": 0.1757, "lr": 4.590499608683202e-07, "epoch": 2.62656, "percentage": 87.63, "elapsed_time": "3:29:31", "remaining_time": "0:29:34"}
1368
+ {"current_steps": 1368, "total_steps": 1560, "loss": 0.1628, "lr": 4.54378500986381e-07, "epoch": 2.62848, "percentage": 87.69, "elapsed_time": "3:29:40", "remaining_time": "0:29:25"}
1369
+ {"current_steps": 1369, "total_steps": 1560, "loss": 0.1782, "lr": 4.497298003896944e-07, "epoch": 2.6304, "percentage": 87.76, "elapsed_time": "3:29:50", "remaining_time": "0:29:16"}
1370
+ {"current_steps": 1370, "total_steps": 1560, "loss": 0.1365, "lr": 4.451038823536441e-07, "epoch": 2.63232, "percentage": 87.82, "elapsed_time": "3:29:59", "remaining_time": "0:29:07"}
1371
+ {"current_steps": 1371, "total_steps": 1560, "loss": 0.2089, "lr": 4.405007700395497e-07, "epoch": 2.63424, "percentage": 87.88, "elapsed_time": "3:30:08", "remaining_time": "0:28:58"}
1372
+ {"current_steps": 1372, "total_steps": 1560, "loss": 0.2094, "lr": 4.35920486494546e-07, "epoch": 2.63616, "percentage": 87.95, "elapsed_time": "3:30:17", "remaining_time": "0:28:48"}
1373
+ {"current_steps": 1373, "total_steps": 1560, "loss": 0.1891, "lr": 4.313630546514663e-07, "epoch": 2.63808, "percentage": 88.01, "elapsed_time": "3:30:26", "remaining_time": "0:28:39"}
1374
+ {"current_steps": 1374, "total_steps": 1560, "loss": 0.1878, "lr": 4.268284973287273e-07, "epoch": 2.64, "percentage": 88.08, "elapsed_time": "3:30:36", "remaining_time": "0:28:30"}
1375
+ {"current_steps": 1375, "total_steps": 1560, "loss": 0.2096, "lr": 4.223168372302189e-07, "epoch": 2.64192, "percentage": 88.14, "elapsed_time": "3:30:45", "remaining_time": "0:28:21"}
1376
+ {"current_steps": 1376, "total_steps": 1560, "loss": 0.168, "lr": 4.1782809694518533e-07, "epoch": 2.64384, "percentage": 88.21, "elapsed_time": "3:30:54", "remaining_time": "0:28:12"}
1377
+ {"current_steps": 1377, "total_steps": 1560, "loss": 0.1607, "lr": 4.1336229894811454e-07, "epoch": 2.64576, "percentage": 88.27, "elapsed_time": "3:31:03", "remaining_time": "0:28:02"}
1378
+ {"current_steps": 1378, "total_steps": 1560, "loss": 0.1888, "lr": 4.089194655986306e-07, "epoch": 2.6476800000000003, "percentage": 88.33, "elapsed_time": "3:31:12", "remaining_time": "0:27:53"}
1379
+ {"current_steps": 1379, "total_steps": 1560, "loss": 0.1846, "lr": 4.044996191413686e-07, "epoch": 2.6496, "percentage": 88.4, "elapsed_time": "3:31:21", "remaining_time": "0:27:44"}
1380
+ {"current_steps": 1380, "total_steps": 1560, "loss": 0.192, "lr": 4.001027817058789e-07, "epoch": 2.65152, "percentage": 88.46, "elapsed_time": "3:31:30", "remaining_time": "0:27:35"}
1381
+ {"current_steps": 1381, "total_steps": 1560, "loss": 0.1584, "lr": 3.957289753065052e-07, "epoch": 2.65344, "percentage": 88.53, "elapsed_time": "3:31:39", "remaining_time": "0:27:26"}
1382
+ {"current_steps": 1382, "total_steps": 1560, "loss": 0.1904, "lr": 3.9137822184227845e-07, "epoch": 2.65536, "percentage": 88.59, "elapsed_time": "3:31:48", "remaining_time": "0:27:16"}
1383
+ {"current_steps": 1383, "total_steps": 1560, "loss": 0.186, "lr": 3.870505430968069e-07, "epoch": 2.65728, "percentage": 88.65, "elapsed_time": "3:31:57", "remaining_time": "0:27:07"}
1384
+ {"current_steps": 1384, "total_steps": 1560, "loss": 0.1571, "lr": 3.8274596073816784e-07, "epoch": 2.6592000000000002, "percentage": 88.72, "elapsed_time": "3:32:06", "remaining_time": "0:26:58"}
1385
+ {"current_steps": 1385, "total_steps": 1560, "loss": 0.1616, "lr": 3.7846449631879664e-07, "epoch": 2.66112, "percentage": 88.78, "elapsed_time": "3:32:15", "remaining_time": "0:26:49"}
1386
+ {"current_steps": 1386, "total_steps": 1560, "loss": 0.1808, "lr": 3.742061712753825e-07, "epoch": 2.66304, "percentage": 88.85, "elapsed_time": "3:32:24", "remaining_time": "0:26:39"}
1387
+ {"current_steps": 1387, "total_steps": 1560, "loss": 0.1783, "lr": 3.699710069287571e-07, "epoch": 2.6649599999999998, "percentage": 88.91, "elapsed_time": "3:32:33", "remaining_time": "0:26:30"}
1388
+ {"current_steps": 1388, "total_steps": 1560, "loss": 0.1692, "lr": 3.657590244837911e-07, "epoch": 2.66688, "percentage": 88.97, "elapsed_time": "3:32:42", "remaining_time": "0:26:21"}
1389
+ {"current_steps": 1389, "total_steps": 1560, "loss": 0.1682, "lr": 3.615702450292857e-07, "epoch": 2.6688, "percentage": 89.04, "elapsed_time": "3:32:51", "remaining_time": "0:26:12"}
1390
+ {"current_steps": 1390, "total_steps": 1560, "loss": 0.1532, "lr": 3.5740468953786854e-07, "epoch": 2.67072, "percentage": 89.1, "elapsed_time": "3:33:00", "remaining_time": "0:26:03"}
1391
+ {"current_steps": 1391, "total_steps": 1560, "loss": 0.1546, "lr": 3.5326237886588734e-07, "epoch": 2.67264, "percentage": 89.17, "elapsed_time": "3:33:10", "remaining_time": "0:25:53"}
1392
+ {"current_steps": 1392, "total_steps": 1560, "loss": 0.1582, "lr": 3.49143333753309e-07, "epoch": 2.67456, "percentage": 89.23, "elapsed_time": "3:33:19", "remaining_time": "0:25:44"}
1393
+ {"current_steps": 1393, "total_steps": 1560, "loss": 0.1769, "lr": 3.4504757482360817e-07, "epoch": 2.6764799999999997, "percentage": 89.29, "elapsed_time": "3:33:29", "remaining_time": "0:25:35"}
1394
+ {"current_steps": 1394, "total_steps": 1560, "loss": 0.1734, "lr": 3.4097512258367385e-07, "epoch": 2.6784, "percentage": 89.36, "elapsed_time": "3:33:38", "remaining_time": "0:25:26"}
1395
+ {"current_steps": 1395, "total_steps": 1560, "loss": 0.189, "lr": 3.369259974236988e-07, "epoch": 2.68032, "percentage": 89.42, "elapsed_time": "3:33:48", "remaining_time": "0:25:17"}
1396
+ {"current_steps": 1396, "total_steps": 1560, "loss": 0.1375, "lr": 3.3290021961708163e-07, "epoch": 2.68224, "percentage": 89.49, "elapsed_time": "3:33:57", "remaining_time": "0:25:08"}
1397
+ {"current_steps": 1397, "total_steps": 1560, "loss": 0.1955, "lr": 3.288978093203227e-07, "epoch": 2.68416, "percentage": 89.55, "elapsed_time": "3:34:07", "remaining_time": "0:24:58"}
1398
+ {"current_steps": 1398, "total_steps": 1560, "loss": 0.1507, "lr": 3.2491878657292643e-07, "epoch": 2.68608, "percentage": 89.62, "elapsed_time": "3:34:16", "remaining_time": "0:24:49"}
1399
+ {"current_steps": 1399, "total_steps": 1560, "loss": 0.1933, "lr": 3.209631712972966e-07, "epoch": 2.6879999999999997, "percentage": 89.68, "elapsed_time": "3:34:26", "remaining_time": "0:24:40"}
1400
+ {"current_steps": 1400, "total_steps": 1560, "loss": 0.1592, "lr": 3.1703098329864237e-07, "epoch": 2.68992, "percentage": 89.74, "elapsed_time": "3:34:35", "remaining_time": "0:24:31"}
1401
+ {"current_steps": 1401, "total_steps": 1560, "loss": 0.1873, "lr": 3.131222422648744e-07, "epoch": 2.69184, "percentage": 89.81, "elapsed_time": "3:34:45", "remaining_time": "0:24:22"}
1402
+ {"current_steps": 1402, "total_steps": 1560, "loss": 0.1831, "lr": 3.0923696776650414e-07, "epoch": 2.69376, "percentage": 89.87, "elapsed_time": "3:34:54", "remaining_time": "0:24:13"}
1403
+ {"current_steps": 1403, "total_steps": 1560, "loss": 0.1712, "lr": 3.0537517925655567e-07, "epoch": 2.69568, "percentage": 89.94, "elapsed_time": "3:35:04", "remaining_time": "0:24:04"}
1404
+ {"current_steps": 1404, "total_steps": 1560, "loss": 0.1303, "lr": 3.015368960704584e-07, "epoch": 2.6976, "percentage": 90.0, "elapsed_time": "3:35:13", "remaining_time": "0:23:54"}
1405
+ {"current_steps": 1405, "total_steps": 1560, "loss": 0.2105, "lr": 2.9772213742595367e-07, "epoch": 2.69952, "percentage": 90.06, "elapsed_time": "3:35:22", "remaining_time": "0:23:45"}
1406
+ {"current_steps": 1406, "total_steps": 1560, "loss": 0.1611, "lr": 2.9393092242300026e-07, "epoch": 2.70144, "percentage": 90.13, "elapsed_time": "3:35:31", "remaining_time": "0:23:36"}
1407
+ {"current_steps": 1407, "total_steps": 1560, "loss": 0.2246, "lr": 2.901632700436757e-07, "epoch": 2.70336, "percentage": 90.19, "elapsed_time": "3:35:40", "remaining_time": "0:23:27"}
1408
+ {"current_steps": 1408, "total_steps": 1560, "loss": 0.1568, "lr": 2.864191991520848e-07, "epoch": 2.70528, "percentage": 90.26, "elapsed_time": "3:35:49", "remaining_time": "0:23:17"}
1409
+ {"current_steps": 1409, "total_steps": 1560, "loss": 0.1802, "lr": 2.8269872849426114e-07, "epoch": 2.7072000000000003, "percentage": 90.32, "elapsed_time": "3:35:58", "remaining_time": "0:23:08"}
1410
+ {"current_steps": 1410, "total_steps": 1560, "loss": 0.1584, "lr": 2.790018766980773e-07, "epoch": 2.70912, "percentage": 90.38, "elapsed_time": "3:36:08", "remaining_time": "0:22:59"}
1411
+ {"current_steps": 1411, "total_steps": 1560, "loss": 0.1802, "lr": 2.7532866227314714e-07, "epoch": 2.71104, "percentage": 90.45, "elapsed_time": "3:36:17", "remaining_time": "0:22:50"}
1412
+ {"current_steps": 1412, "total_steps": 1560, "loss": 0.1908, "lr": 2.71679103610738e-07, "epoch": 2.71296, "percentage": 90.51, "elapsed_time": "3:36:26", "remaining_time": "0:22:41"}
1413
+ {"current_steps": 1413, "total_steps": 1560, "loss": 0.1747, "lr": 2.6805321898367323e-07, "epoch": 2.71488, "percentage": 90.58, "elapsed_time": "3:36:35", "remaining_time": "0:22:31"}
1414
+ {"current_steps": 1414, "total_steps": 1560, "loss": 0.1825, "lr": 2.64451026546248e-07, "epoch": 2.7168, "percentage": 90.64, "elapsed_time": "3:36:44", "remaining_time": "0:22:22"}
1415
+ {"current_steps": 1415, "total_steps": 1560, "loss": 0.2024, "lr": 2.6087254433412924e-07, "epoch": 2.7187200000000002, "percentage": 90.71, "elapsed_time": "3:36:53", "remaining_time": "0:22:13"}
1416
+ {"current_steps": 1416, "total_steps": 1560, "loss": 0.1691, "lr": 2.573177902642726e-07, "epoch": 2.72064, "percentage": 90.77, "elapsed_time": "3:37:02", "remaining_time": "0:22:04"}
1417
+ {"current_steps": 1417, "total_steps": 1560, "loss": 0.1493, "lr": 2.5378678213483057e-07, "epoch": 2.72256, "percentage": 90.83, "elapsed_time": "3:37:12", "remaining_time": "0:21:55"}
1418
+ {"current_steps": 1418, "total_steps": 1560, "loss": 0.2316, "lr": 2.502795376250622e-07, "epoch": 2.72448, "percentage": 90.9, "elapsed_time": "3:37:21", "remaining_time": "0:21:46"}
1419
+ {"current_steps": 1419, "total_steps": 1560, "loss": 0.2066, "lr": 2.467960742952463e-07, "epoch": 2.7264, "percentage": 90.96, "elapsed_time": "3:37:30", "remaining_time": "0:21:36"}
1420
+ {"current_steps": 1420, "total_steps": 1560, "loss": 0.2062, "lr": 2.4333640958659144e-07, "epoch": 2.72832, "percentage": 91.03, "elapsed_time": "3:37:39", "remaining_time": "0:21:27"}
1421
+ {"current_steps": 1421, "total_steps": 1560, "loss": 0.1606, "lr": 2.399005608211502e-07, "epoch": 2.7302400000000002, "percentage": 91.09, "elapsed_time": "3:37:49", "remaining_time": "0:21:18"}
1422
+ {"current_steps": 1422, "total_steps": 1560, "loss": 0.1954, "lr": 2.3648854520173237e-07, "epoch": 2.73216, "percentage": 91.15, "elapsed_time": "3:37:58", "remaining_time": "0:21:09"}
1423
+ {"current_steps": 1423, "total_steps": 1560, "loss": 0.156, "lr": 2.3310037981182088e-07, "epoch": 2.73408, "percentage": 91.22, "elapsed_time": "3:38:07", "remaining_time": "0:21:00"}
1424
+ {"current_steps": 1424, "total_steps": 1560, "loss": 0.1781, "lr": 2.2973608161547755e-07, "epoch": 2.7359999999999998, "percentage": 91.28, "elapsed_time": "3:38:17", "remaining_time": "0:20:50"}
1425
+ {"current_steps": 1425, "total_steps": 1560, "loss": 0.2062, "lr": 2.2639566745727203e-07, "epoch": 2.73792, "percentage": 91.35, "elapsed_time": "3:38:26", "remaining_time": "0:20:41"}
1426
+ {"current_steps": 1426, "total_steps": 1560, "loss": 0.2092, "lr": 2.2307915406218517e-07, "epoch": 2.73984, "percentage": 91.41, "elapsed_time": "3:38:36", "remaining_time": "0:20:32"}
1427
+ {"current_steps": 1427, "total_steps": 1560, "loss": 0.1415, "lr": 2.1978655803553128e-07, "epoch": 2.74176, "percentage": 91.47, "elapsed_time": "3:38:45", "remaining_time": "0:20:23"}
1428
+ {"current_steps": 1428, "total_steps": 1560, "loss": 0.1949, "lr": 2.1651789586287442e-07, "epoch": 2.74368, "percentage": 91.54, "elapsed_time": "3:38:54", "remaining_time": "0:20:14"}
1429
+ {"current_steps": 1429, "total_steps": 1560, "loss": 0.1419, "lr": 2.1327318390994445e-07, "epoch": 2.7456, "percentage": 91.6, "elapsed_time": "3:39:04", "remaining_time": "0:20:04"}
1430
+ {"current_steps": 1430, "total_steps": 1560, "loss": 0.1668, "lr": 2.1005243842255552e-07, "epoch": 2.7475199999999997, "percentage": 91.67, "elapsed_time": "3:39:13", "remaining_time": "0:19:55"}
1431
+ {"current_steps": 1431, "total_steps": 1560, "loss": 0.2052, "lr": 2.068556755265272e-07, "epoch": 2.74944, "percentage": 91.73, "elapsed_time": "3:39:23", "remaining_time": "0:19:46"}
1432
+ {"current_steps": 1432, "total_steps": 1560, "loss": 0.1583, "lr": 2.0368291122759898e-07, "epoch": 2.75136, "percentage": 91.79, "elapsed_time": "3:39:32", "remaining_time": "0:19:37"}
1433
+ {"current_steps": 1433, "total_steps": 1560, "loss": 0.1847, "lr": 2.005341614113543e-07, "epoch": 2.75328, "percentage": 91.86, "elapsed_time": "3:39:41", "remaining_time": "0:19:28"}
1434
+ {"current_steps": 1434, "total_steps": 1560, "loss": 0.2009, "lr": 1.9740944184313882e-07, "epoch": 2.7552, "percentage": 91.92, "elapsed_time": "3:39:51", "remaining_time": "0:19:19"}
1435
+ {"current_steps": 1435, "total_steps": 1560, "loss": 0.1496, "lr": 1.9430876816798228e-07, "epoch": 2.75712, "percentage": 91.99, "elapsed_time": "3:40:00", "remaining_time": "0:19:09"}
1436
+ {"current_steps": 1436, "total_steps": 1560, "loss": 0.2015, "lr": 1.9123215591052014e-07, "epoch": 2.75904, "percentage": 92.05, "elapsed_time": "3:40:09", "remaining_time": "0:19:00"}
1437
+ {"current_steps": 1437, "total_steps": 1560, "loss": 0.1937, "lr": 1.88179620474917e-07, "epoch": 2.76096, "percentage": 92.12, "elapsed_time": "3:40:19", "remaining_time": "0:18:51"}
1438
+ {"current_steps": 1438, "total_steps": 1560, "loss": 0.179, "lr": 1.8515117714478447e-07, "epoch": 2.76288, "percentage": 92.18, "elapsed_time": "3:40:28", "remaining_time": "0:18:42"}
1439
+ {"current_steps": 1439, "total_steps": 1560, "loss": 0.1581, "lr": 1.8214684108311286e-07, "epoch": 2.7648, "percentage": 92.24, "elapsed_time": "3:40:37", "remaining_time": "0:18:33"}
1440
+ {"current_steps": 1440, "total_steps": 1560, "loss": 0.1594, "lr": 1.7916662733218848e-07, "epoch": 2.76672, "percentage": 92.31, "elapsed_time": "3:40:46", "remaining_time": "0:18:23"}
1441
+ {"current_steps": 1441, "total_steps": 1560, "loss": 0.1455, "lr": 1.762105508135198e-07, "epoch": 2.76864, "percentage": 92.37, "elapsed_time": "3:40:55", "remaining_time": "0:18:14"}
1442
+ {"current_steps": 1442, "total_steps": 1560, "loss": 0.1777, "lr": 1.7327862632776638e-07, "epoch": 2.77056, "percentage": 92.44, "elapsed_time": "3:41:04", "remaining_time": "0:18:05"}
1443
+ {"current_steps": 1443, "total_steps": 1560, "loss": 0.1908, "lr": 1.7037086855465902e-07, "epoch": 2.77248, "percentage": 92.5, "elapsed_time": "3:41:13", "remaining_time": "0:17:56"}
1444
+ {"current_steps": 1444, "total_steps": 1560, "loss": 0.1736, "lr": 1.6748729205293024e-07, "epoch": 2.7744, "percentage": 92.56, "elapsed_time": "3:41:22", "remaining_time": "0:17:47"}
1445
+ {"current_steps": 1445, "total_steps": 1560, "loss": 0.2112, "lr": 1.646279112602417e-07, "epoch": 2.77632, "percentage": 92.63, "elapsed_time": "3:41:32", "remaining_time": "0:17:37"}
1446
+ {"current_steps": 1446, "total_steps": 1560, "loss": 0.2041, "lr": 1.6179274049310966e-07, "epoch": 2.7782400000000003, "percentage": 92.69, "elapsed_time": "3:41:41", "remaining_time": "0:17:28"}
1447
+ {"current_steps": 1447, "total_steps": 1560, "loss": 0.1544, "lr": 1.5898179394683244e-07, "epoch": 2.78016, "percentage": 92.76, "elapsed_time": "3:41:50", "remaining_time": "0:17:19"}
1448
+ {"current_steps": 1448, "total_steps": 1560, "loss": 0.1862, "lr": 1.5619508569542363e-07, "epoch": 2.78208, "percentage": 92.82, "elapsed_time": "3:42:00", "remaining_time": "0:17:10"}
1449
+ {"current_steps": 1449, "total_steps": 1560, "loss": 0.1592, "lr": 1.5343262969153781e-07, "epoch": 2.784, "percentage": 92.88, "elapsed_time": "3:42:09", "remaining_time": "0:17:01"}
1450
+ {"current_steps": 1450, "total_steps": 1560, "loss": 0.1566, "lr": 1.5069443976640287e-07, "epoch": 2.78592, "percentage": 92.95, "elapsed_time": "3:42:19", "remaining_time": "0:16:51"}
1451
+ {"current_steps": 1451, "total_steps": 1560, "loss": 0.1682, "lr": 1.4798052962974874e-07, "epoch": 2.78784, "percentage": 93.01, "elapsed_time": "3:42:28", "remaining_time": "0:16:42"}
1452
+ {"current_steps": 1452, "total_steps": 1560, "loss": 0.1686, "lr": 1.4529091286973994e-07, "epoch": 2.7897600000000002, "percentage": 93.08, "elapsed_time": "3:42:37", "remaining_time": "0:16:33"}
1453
+ {"current_steps": 1453, "total_steps": 1560, "loss": 0.1615, "lr": 1.4262560295290884e-07, "epoch": 2.79168, "percentage": 93.14, "elapsed_time": "3:42:46", "remaining_time": "0:16:24"}
1454
+ {"current_steps": 1454, "total_steps": 1560, "loss": 0.1451, "lr": 1.3998461322408563e-07, "epoch": 2.7936, "percentage": 93.21, "elapsed_time": "3:42:56", "remaining_time": "0:16:15"}
1455
+ {"current_steps": 1455, "total_steps": 1560, "loss": 0.1868, "lr": 1.3736795690633353e-07, "epoch": 2.79552, "percentage": 93.27, "elapsed_time": "3:43:05", "remaining_time": "0:16:05"}
1456
+ {"current_steps": 1456, "total_steps": 1560, "loss": 0.186, "lr": 1.3477564710088097e-07, "epoch": 2.79744, "percentage": 93.33, "elapsed_time": "3:43:15", "remaining_time": "0:15:56"}
1457
+ {"current_steps": 1457, "total_steps": 1560, "loss": 0.1611, "lr": 1.3220769678705724e-07, "epoch": 2.79936, "percentage": 93.4, "elapsed_time": "3:43:24", "remaining_time": "0:15:47"}
1458
+ {"current_steps": 1458, "total_steps": 1560, "loss": 0.1783, "lr": 1.2966411882222695e-07, "epoch": 2.80128, "percentage": 93.46, "elapsed_time": "3:43:34", "remaining_time": "0:15:38"}
1459
+ {"current_steps": 1459, "total_steps": 1560, "loss": 0.1817, "lr": 1.271449259417268e-07, "epoch": 2.8032, "percentage": 93.53, "elapsed_time": "3:43:43", "remaining_time": "0:15:29"}
1460
+ {"current_steps": 1460, "total_steps": 1560, "loss": 0.1606, "lr": 1.2465013075879884e-07, "epoch": 2.80512, "percentage": 93.59, "elapsed_time": "3:43:53", "remaining_time": "0:15:20"}
1461
+ {"current_steps": 1461, "total_steps": 1560, "loss": 0.2111, "lr": 1.2217974576453072e-07, "epoch": 2.8070399999999998, "percentage": 93.65, "elapsed_time": "3:44:02", "remaining_time": "0:15:10"}
1462
+ {"current_steps": 1462, "total_steps": 1560, "loss": 0.1972, "lr": 1.1973378332779229e-07, "epoch": 2.80896, "percentage": 93.72, "elapsed_time": "3:44:11", "remaining_time": "0:15:01"}
1463
+ {"current_steps": 1463, "total_steps": 1560, "loss": 0.1656, "lr": 1.1731225569517113e-07, "epoch": 2.81088, "percentage": 93.78, "elapsed_time": "3:44:21", "remaining_time": "0:14:52"}
1464
+ {"current_steps": 1464, "total_steps": 1560, "loss": 0.1829, "lr": 1.1491517499091498e-07, "epoch": 2.8128, "percentage": 93.85, "elapsed_time": "3:44:30", "remaining_time": "0:14:43"}
1465
+ {"current_steps": 1465, "total_steps": 1560, "loss": 0.1816, "lr": 1.1254255321686836e-07, "epoch": 2.81472, "percentage": 93.91, "elapsed_time": "3:44:40", "remaining_time": "0:14:34"}
1466
+ {"current_steps": 1466, "total_steps": 1560, "loss": 0.1943, "lr": 1.1019440225241317e-07, "epoch": 2.81664, "percentage": 93.97, "elapsed_time": "3:44:49", "remaining_time": "0:14:24"}
1467
+ {"current_steps": 1467, "total_steps": 1560, "loss": 0.1796, "lr": 1.078707338544105e-07, "epoch": 2.8185599999999997, "percentage": 94.04, "elapsed_time": "3:44:59", "remaining_time": "0:14:15"}
1468
+ {"current_steps": 1468, "total_steps": 1560, "loss": 0.1613, "lr": 1.055715596571405e-07, "epoch": 2.82048, "percentage": 94.1, "elapsed_time": "3:45:08", "remaining_time": "0:14:06"}
1469
+ {"current_steps": 1469, "total_steps": 1560, "loss": 0.161, "lr": 1.0329689117224262e-07, "epoch": 2.8224, "percentage": 94.17, "elapsed_time": "3:45:18", "remaining_time": "0:13:57"}
1470
+ {"current_steps": 1470, "total_steps": 1560, "loss": 0.1619, "lr": 1.0104673978866164e-07, "epoch": 2.82432, "percentage": 94.23, "elapsed_time": "3:45:27", "remaining_time": "0:13:48"}
1471
+ {"current_steps": 1471, "total_steps": 1560, "loss": 0.1578, "lr": 9.882111677258777e-08, "epoch": 2.82624, "percentage": 94.29, "elapsed_time": "3:45:37", "remaining_time": "0:13:39"}
1472
+ {"current_steps": 1472, "total_steps": 1560, "loss": 0.1954, "lr": 9.662003326740166e-08, "epoch": 2.82816, "percentage": 94.36, "elapsed_time": "3:45:46", "remaining_time": "0:13:29"}
1473
+ {"current_steps": 1473, "total_steps": 1560, "loss": 0.1966, "lr": 9.444350029361671e-08, "epoch": 2.83008, "percentage": 94.42, "elapsed_time": "3:45:55", "remaining_time": "0:13:20"}
1474
+ {"current_steps": 1474, "total_steps": 1560, "loss": 0.1552, "lr": 9.22915287488274e-08, "epoch": 2.832, "percentage": 94.49, "elapsed_time": "3:46:05", "remaining_time": "0:13:11"}
1475
+ {"current_steps": 1475, "total_steps": 1560, "loss": 0.1694, "lr": 9.016412940765107e-08, "epoch": 2.83392, "percentage": 94.55, "elapsed_time": "3:46:14", "remaining_time": "0:13:02"}
1476
+ {"current_steps": 1476, "total_steps": 1560, "loss": 0.1703, "lr": 8.80613129216762e-08, "epoch": 2.83584, "percentage": 94.62, "elapsed_time": "3:46:24", "remaining_time": "0:12:53"}
1477
+ {"current_steps": 1477, "total_steps": 1560, "loss": 0.194, "lr": 8.598308981940751e-08, "epoch": 2.83776, "percentage": 94.68, "elapsed_time": "3:46:33", "remaining_time": "0:12:43"}
1478
+ {"current_steps": 1478, "total_steps": 1560, "loss": 0.1582, "lr": 8.392947050621603e-08, "epoch": 2.83968, "percentage": 94.74, "elapsed_time": "3:46:43", "remaining_time": "0:12:34"}
1479
+ {"current_steps": 1479, "total_steps": 1560, "loss": 0.171, "lr": 8.190046526428241e-08, "epoch": 2.8416, "percentage": 94.81, "elapsed_time": "3:46:52", "remaining_time": "0:12:25"}
1480
+ {"current_steps": 1480, "total_steps": 1560, "loss": 0.1786, "lr": 7.989608425254924e-08, "epoch": 2.84352, "percentage": 94.87, "elapsed_time": "3:47:02", "remaining_time": "0:12:16"}
1481
+ {"current_steps": 1481, "total_steps": 1560, "loss": 0.2625, "lr": 7.791633750667105e-08, "epoch": 2.84544, "percentage": 94.94, "elapsed_time": "3:47:11", "remaining_time": "0:12:07"}
1482
+ {"current_steps": 1482, "total_steps": 1560, "loss": 0.1805, "lr": 7.59612349389599e-08, "epoch": 2.84736, "percentage": 95.0, "elapsed_time": "3:47:21", "remaining_time": "0:11:57"}
1483
+ {"current_steps": 1483, "total_steps": 1560, "loss": 0.1691, "lr": 7.403078633833716e-08, "epoch": 2.8492800000000003, "percentage": 95.06, "elapsed_time": "3:47:30", "remaining_time": "0:11:48"}
1484
+ {"current_steps": 1484, "total_steps": 1560, "loss": 0.1578, "lr": 7.212500137028789e-08, "epoch": 2.8512, "percentage": 95.13, "elapsed_time": "3:47:39", "remaining_time": "0:11:39"}
1485
+ {"current_steps": 1485, "total_steps": 1560, "loss": 0.173, "lr": 7.024388957680705e-08, "epoch": 2.85312, "percentage": 95.19, "elapsed_time": "3:47:49", "remaining_time": "0:11:30"}
1486
+ {"current_steps": 1486, "total_steps": 1560, "loss": 0.1657, "lr": 6.838746037635735e-08, "epoch": 2.85504, "percentage": 95.26, "elapsed_time": "3:47:58", "remaining_time": "0:11:21"}
1487
+ {"current_steps": 1487, "total_steps": 1560, "loss": 0.2141, "lr": 6.655572306381696e-08, "epoch": 2.85696, "percentage": 95.32, "elapsed_time": "3:48:08", "remaining_time": "0:11:11"}
1488
+ {"current_steps": 1488, "total_steps": 1560, "loss": 0.165, "lr": 6.474868681043578e-08, "epoch": 2.85888, "percentage": 95.38, "elapsed_time": "3:48:17", "remaining_time": "0:11:02"}
1489
+ {"current_steps": 1489, "total_steps": 1560, "loss": 0.1544, "lr": 6.29663606637898e-08, "epoch": 2.8608000000000002, "percentage": 95.45, "elapsed_time": "3:48:27", "remaining_time": "0:10:53"}
1490
+ {"current_steps": 1490, "total_steps": 1560, "loss": 0.1625, "lr": 6.120875354773459e-08, "epoch": 2.86272, "percentage": 95.51, "elapsed_time": "3:48:36", "remaining_time": "0:10:44"}
1491
+ {"current_steps": 1491, "total_steps": 1560, "loss": 0.148, "lr": 5.947587426236079e-08, "epoch": 2.86464, "percentage": 95.58, "elapsed_time": "3:48:46", "remaining_time": "0:10:35"}
1492
+ {"current_steps": 1492, "total_steps": 1560, "loss": 0.1696, "lr": 5.776773148394976e-08, "epoch": 2.8665599999999998, "percentage": 95.64, "elapsed_time": "3:48:55", "remaining_time": "0:10:26"}
1493
+ {"current_steps": 1493, "total_steps": 1560, "loss": 0.2113, "lr": 5.608433376493194e-08, "epoch": 2.86848, "percentage": 95.71, "elapsed_time": "3:49:04", "remaining_time": "0:10:16"}
1494
+ {"current_steps": 1494, "total_steps": 1560, "loss": 0.1344, "lr": 5.4425689533841864e-08, "epoch": 2.8704, "percentage": 95.77, "elapsed_time": "3:49:14", "remaining_time": "0:10:07"}
1495
+ {"current_steps": 1495, "total_steps": 1560, "loss": 0.1629, "lr": 5.279180709527765e-08, "epoch": 2.87232, "percentage": 95.83, "elapsed_time": "3:49:23", "remaining_time": "0:09:58"}
1496
+ {"current_steps": 1496, "total_steps": 1560, "loss": 0.1808, "lr": 5.1182694629857145e-08, "epoch": 2.87424, "percentage": 95.9, "elapsed_time": "3:49:33", "remaining_time": "0:09:49"}
1497
+ {"current_steps": 1497, "total_steps": 1560, "loss": 0.1621, "lr": 4.959836019417963e-08, "epoch": 2.87616, "percentage": 95.96, "elapsed_time": "3:49:42", "remaining_time": "0:09:40"}
1498
+ {"current_steps": 1498, "total_steps": 1560, "loss": 0.202, "lr": 4.803881172078473e-08, "epoch": 2.8780799999999997, "percentage": 96.03, "elapsed_time": "3:49:52", "remaining_time": "0:09:30"}
1499
+ {"current_steps": 1499, "total_steps": 1560, "loss": 0.1601, "lr": 4.650405701811078e-08, "epoch": 2.88, "percentage": 96.09, "elapsed_time": "3:50:01", "remaining_time": "0:09:21"}
1500
+ {"current_steps": 1500, "total_steps": 1560, "loss": 0.1836, "lr": 4.499410377045765e-08, "epoch": 2.88192, "percentage": 96.15, "elapsed_time": "3:50:11", "remaining_time": "0:09:12"}
1501
+ {"current_steps": 1501, "total_steps": 1560, "loss": 0.1639, "lr": 4.350895953794898e-08, "epoch": 2.88384, "percentage": 96.22, "elapsed_time": "3:50:20", "remaining_time": "0:09:03"}
1502
+ {"current_steps": 1502, "total_steps": 1560, "loss": 0.1742, "lr": 4.2048631756492206e-08, "epoch": 2.88576, "percentage": 96.28, "elapsed_time": "3:50:30", "remaining_time": "0:08:54"}
1503
+ {"current_steps": 1503, "total_steps": 1560, "loss": 0.1528, "lr": 4.0613127737741396e-08, "epoch": 2.88768, "percentage": 96.35, "elapsed_time": "3:50:39", "remaining_time": "0:08:44"}
1504
+ {"current_steps": 1504, "total_steps": 1560, "loss": 0.1715, "lr": 3.9202454669063915e-08, "epoch": 2.8895999999999997, "percentage": 96.41, "elapsed_time": "3:50:49", "remaining_time": "0:08:35"}
1505
+ {"current_steps": 1505, "total_steps": 1560, "loss": 0.1609, "lr": 3.781661961349992e-08, "epoch": 2.89152, "percentage": 96.47, "elapsed_time": "3:50:58", "remaining_time": "0:08:26"}
1506
+ {"current_steps": 1506, "total_steps": 1560, "loss": 0.1722, "lr": 3.645562950973014e-08, "epoch": 2.89344, "percentage": 96.54, "elapsed_time": "3:51:08", "remaining_time": "0:08:17"}
1507
+ {"current_steps": 1507, "total_steps": 1560, "loss": 0.1864, "lr": 3.5119491172039836e-08, "epoch": 2.89536, "percentage": 96.6, "elapsed_time": "3:51:17", "remaining_time": "0:08:08"}
1508
+ {"current_steps": 1508, "total_steps": 1560, "loss": 0.1743, "lr": 3.3808211290284886e-08, "epoch": 2.89728, "percentage": 96.67, "elapsed_time": "3:51:27", "remaining_time": "0:07:58"}
1509
+ {"current_steps": 1509, "total_steps": 1560, "loss": 0.1713, "lr": 3.252179642985909e-08, "epoch": 2.8992, "percentage": 96.73, "elapsed_time": "3:51:36", "remaining_time": "0:07:49"}
1510
+ {"current_steps": 1510, "total_steps": 1560, "loss": 0.1795, "lr": 3.1260253031660247e-08, "epoch": 2.90112, "percentage": 96.79, "elapsed_time": "3:51:46", "remaining_time": "0:07:40"}
1511
+ {"current_steps": 1511, "total_steps": 1560, "loss": 0.1964, "lr": 3.002358741205691e-08, "epoch": 2.90304, "percentage": 96.86, "elapsed_time": "3:51:55", "remaining_time": "0:07:31"}
1512
+ {"current_steps": 1512, "total_steps": 1560, "loss": 0.2168, "lr": 2.8811805762860578e-08, "epoch": 2.90496, "percentage": 96.92, "elapsed_time": "3:52:05", "remaining_time": "0:07:22"}
1513
+ {"current_steps": 1513, "total_steps": 1560, "loss": 0.1595, "lr": 2.762491415128965e-08, "epoch": 2.90688, "percentage": 96.99, "elapsed_time": "3:52:14", "remaining_time": "0:07:12"}
1514
+ {"current_steps": 1514, "total_steps": 1560, "loss": 0.1905, "lr": 2.6462918519944425e-08, "epoch": 2.9088000000000003, "percentage": 97.05, "elapsed_time": "3:52:24", "remaining_time": "0:07:03"}
1515
+ {"current_steps": 1515, "total_steps": 1560, "loss": 0.1589, "lr": 2.5325824686772138e-08, "epoch": 2.91072, "percentage": 97.12, "elapsed_time": "3:52:33", "remaining_time": "0:06:54"}
1516
+ {"current_steps": 1516, "total_steps": 1560, "loss": 0.1667, "lr": 2.4213638345040868e-08, "epoch": 2.91264, "percentage": 97.18, "elapsed_time": "3:52:43", "remaining_time": "0:06:45"}
1517
+ {"current_steps": 1517, "total_steps": 1560, "loss": 0.1533, "lr": 2.3126365063311228e-08, "epoch": 2.91456, "percentage": 97.24, "elapsed_time": "3:52:52", "remaining_time": "0:06:36"}
1518
+ {"current_steps": 1518, "total_steps": 1560, "loss": 0.1731, "lr": 2.206401028540639e-08, "epoch": 2.91648, "percentage": 97.31, "elapsed_time": "3:53:02", "remaining_time": "0:06:26"}
1519
+ {"current_steps": 1519, "total_steps": 1560, "loss": 0.172, "lr": 2.1026579330387655e-08, "epoch": 2.9184, "percentage": 97.37, "elapsed_time": "3:53:11", "remaining_time": "0:06:17"}
1520
+ {"current_steps": 1520, "total_steps": 1560, "loss": 0.1827, "lr": 2.0014077392525035e-08, "epoch": 2.9203200000000002, "percentage": 97.44, "elapsed_time": "3:53:21", "remaining_time": "0:06:08"}
1521
+ {"current_steps": 1521, "total_steps": 1560, "loss": 0.1848, "lr": 1.9026509541272276e-08, "epoch": 2.92224, "percentage": 97.5, "elapsed_time": "3:53:30", "remaining_time": "0:05:59"}
1522
+ {"current_steps": 1522, "total_steps": 1560, "loss": 0.1876, "lr": 1.8063880721242986e-08, "epoch": 2.92416, "percentage": 97.56, "elapsed_time": "3:53:40", "remaining_time": "0:05:50"}
1523
+ {"current_steps": 1523, "total_steps": 1560, "loss": 0.1785, "lr": 1.712619575218344e-08, "epoch": 2.92608, "percentage": 97.63, "elapsed_time": "3:53:49", "remaining_time": "0:05:40"}
1524
+ {"current_steps": 1524, "total_steps": 1560, "loss": 0.1479, "lr": 1.6213459328950355e-08, "epoch": 2.928, "percentage": 97.69, "elapsed_time": "3:53:59", "remaining_time": "0:05:31"}
1525
+ {"current_steps": 1525, "total_steps": 1560, "loss": 0.1645, "lr": 1.5325676021484826e-08, "epoch": 2.92992, "percentage": 97.76, "elapsed_time": "3:54:08", "remaining_time": "0:05:22"}
1526
+ {"current_steps": 1526, "total_steps": 1560, "loss": 0.1678, "lr": 1.4462850274794548e-08, "epoch": 2.9318400000000002, "percentage": 97.82, "elapsed_time": "3:54:18", "remaining_time": "0:05:13"}
1527
+ {"current_steps": 1527, "total_steps": 1560, "loss": 0.2245, "lr": 1.3624986408924956e-08, "epoch": 2.93376, "percentage": 97.88, "elapsed_time": "3:54:27", "remaining_time": "0:05:04"}
1528
+ {"current_steps": 1528, "total_steps": 1560, "loss": 0.1749, "lr": 1.2812088618942009e-08, "epoch": 2.93568, "percentage": 97.95, "elapsed_time": "3:54:37", "remaining_time": "0:04:54"}
1529
+ {"current_steps": 1529, "total_steps": 1560, "loss": 0.1705, "lr": 1.2024160974911103e-08, "epoch": 2.9375999999999998, "percentage": 98.01, "elapsed_time": "3:54:46", "remaining_time": "0:04:45"}
1530
+ {"current_steps": 1530, "total_steps": 1560, "loss": 0.1539, "lr": 1.1261207421874309e-08, "epoch": 2.93952, "percentage": 98.08, "elapsed_time": "3:54:56", "remaining_time": "0:04:36"}
1531
+ {"current_steps": 1531, "total_steps": 1560, "loss": 0.2185, "lr": 1.0523231779832055e-08, "epoch": 2.94144, "percentage": 98.14, "elapsed_time": "3:55:05", "remaining_time": "0:04:27"}
1532
+ {"current_steps": 1532, "total_steps": 1560, "loss": 0.1676, "lr": 9.810237743724805e-09, "epoch": 2.94336, "percentage": 98.21, "elapsed_time": "3:55:15", "remaining_time": "0:04:17"}
1533
+ {"current_steps": 1533, "total_steps": 1560, "loss": 0.1926, "lr": 9.12222888341252e-09, "epoch": 2.94528, "percentage": 98.27, "elapsed_time": "3:55:24", "remaining_time": "0:04:08"}
1534
+ {"current_steps": 1534, "total_steps": 1560, "loss": 0.1922, "lr": 8.459208643659122e-09, "epoch": 2.9472, "percentage": 98.33, "elapsed_time": "3:55:33", "remaining_time": "0:03:59"}
1535
+ {"current_steps": 1535, "total_steps": 1560, "loss": 0.1648, "lr": 7.8211803441125e-09, "epoch": 2.9491199999999997, "percentage": 98.4, "elapsed_time": "3:55:43", "remaining_time": "0:03:50"}
1536
+ {"current_steps": 1536, "total_steps": 1560, "loss": 0.1484, "lr": 7.2081471792911914e-09, "epoch": 2.95104, "percentage": 98.46, "elapsed_time": "3:55:52", "remaining_time": "0:03:41"}
1537
+ {"current_steps": 1537, "total_steps": 1560, "loss": 0.1758, "lr": 6.6201122185649555e-09, "epoch": 2.95296, "percentage": 98.53, "elapsed_time": "3:56:01", "remaining_time": "0:03:31"}
1538
+ {"current_steps": 1538, "total_steps": 1560, "loss": 0.168, "lr": 6.057078406142003e-09, "epoch": 2.95488, "percentage": 98.59, "elapsed_time": "3:56:10", "remaining_time": "0:03:22"}
1539
+ {"current_steps": 1539, "total_steps": 1560, "loss": 0.1786, "lr": 5.519048561053453e-09, "epoch": 2.9568, "percentage": 98.65, "elapsed_time": "3:56:19", "remaining_time": "0:03:13"}
1540
+ {"current_steps": 1540, "total_steps": 1560, "loss": 0.1719, "lr": 5.006025377138901e-09, "epoch": 2.95872, "percentage": 98.72, "elapsed_time": "3:56:28", "remaining_time": "0:03:04"}
1541
+ {"current_steps": 1541, "total_steps": 1560, "loss": 0.17, "lr": 4.518011423032542e-09, "epoch": 2.96064, "percentage": 98.78, "elapsed_time": "3:56:37", "remaining_time": "0:02:55"}
1542
+ {"current_steps": 1542, "total_steps": 1560, "loss": 0.164, "lr": 4.055009142152066e-09, "epoch": 2.96256, "percentage": 98.85, "elapsed_time": "3:56:46", "remaining_time": "0:02:45"}
1543
+ {"current_steps": 1543, "total_steps": 1560, "loss": 0.1698, "lr": 3.6170208526836724e-09, "epoch": 2.96448, "percentage": 98.91, "elapsed_time": "3:56:55", "remaining_time": "0:02:36"}
1544
+ {"current_steps": 1544, "total_steps": 1560, "loss": 0.1625, "lr": 3.204048747573185e-09, "epoch": 2.9664, "percentage": 98.97, "elapsed_time": "3:57:04", "remaining_time": "0:02:27"}
1545
+ {"current_steps": 1545, "total_steps": 1560, "loss": 0.1712, "lr": 2.816094894513843e-09, "epoch": 2.96832, "percentage": 99.04, "elapsed_time": "3:57:14", "remaining_time": "0:02:18"}
1546
+ {"current_steps": 1546, "total_steps": 1560, "loss": 0.1783, "lr": 2.4531612359363077e-09, "epoch": 2.97024, "percentage": 99.1, "elapsed_time": "3:57:23", "remaining_time": "0:02:08"}
1547
+ {"current_steps": 1547, "total_steps": 1560, "loss": 0.1703, "lr": 2.1152495889970035e-09, "epoch": 2.97216, "percentage": 99.17, "elapsed_time": "3:57:33", "remaining_time": "0:01:59"}
1548
+ {"current_steps": 1548, "total_steps": 1560, "loss": 0.1651, "lr": 1.8023616455731253e-09, "epoch": 2.97408, "percentage": 99.23, "elapsed_time": "3:57:42", "remaining_time": "0:01:50"}
1549
+ {"current_steps": 1549, "total_steps": 1560, "loss": 0.1697, "lr": 1.514498972249312e-09, "epoch": 2.976, "percentage": 99.29, "elapsed_time": "3:57:52", "remaining_time": "0:01:41"}
1550
+ {"current_steps": 1550, "total_steps": 1560, "loss": 0.1932, "lr": 1.2516630103137638e-09, "epoch": 2.97792, "percentage": 99.36, "elapsed_time": "3:58:01", "remaining_time": "0:01:32"}
1551
+ {"current_steps": 1551, "total_steps": 1560, "loss": 0.1723, "lr": 1.0138550757493592e-09, "epoch": 2.9798400000000003, "percentage": 99.42, "elapsed_time": "3:58:10", "remaining_time": "0:01:22"}
1552
+ {"current_steps": 1552, "total_steps": 1560, "loss": 0.1621, "lr": 8.010763592264381e-10, "epoch": 2.98176, "percentage": 99.49, "elapsed_time": "3:58:20", "remaining_time": "0:01:13"}
1553
+ {"current_steps": 1553, "total_steps": 1560, "loss": 0.2144, "lr": 6.133279260983616e-10, "epoch": 2.98368, "percentage": 99.55, "elapsed_time": "3:58:29", "remaining_time": "0:01:04"}
1554
+ {"current_steps": 1554, "total_steps": 1560, "loss": 0.1725, "lr": 4.506107163948503e-10, "epoch": 2.9856, "percentage": 99.62, "elapsed_time": "3:58:39", "remaining_time": "0:00:55"}
1555
+ {"current_steps": 1555, "total_steps": 1560, "loss": 0.1489, "lr": 3.12925544818099e-10, "epoch": 2.98752, "percentage": 99.68, "elapsed_time": "3:58:48", "remaining_time": "0:00:46"}
1556
+ {"current_steps": 1556, "total_steps": 1560, "loss": 0.1884, "lr": 2.0027310073833516e-10, "epoch": 2.98944, "percentage": 99.74, "elapsed_time": "3:58:58", "remaining_time": "0:00:36"}
1557
+ {"current_steps": 1557, "total_steps": 1560, "loss": 0.1519, "lr": 1.1265394818993358e-10, "epoch": 2.9913600000000002, "percentage": 99.81, "elapsed_time": "3:59:07", "remaining_time": "0:00:27"}
1558
+ {"current_steps": 1558, "total_steps": 1560, "loss": 0.1611, "lr": 5.0068525870305974e-11, "epoch": 2.99328, "percentage": 99.87, "elapsed_time": "3:59:16", "remaining_time": "0:00:18"}
1559
+ {"current_steps": 1559, "total_steps": 1560, "loss": 0.1731, "lr": 1.251714713546015e-11, "epoch": 2.9952, "percentage": 99.94, "elapsed_time": "3:59:26", "remaining_time": "0:00:09"}
1560
+ {"current_steps": 1560, "total_steps": 1560, "loss": 0.1588, "lr": 0.0, "epoch": 2.99712, "percentage": 100.0, "elapsed_time": "3:59:35", "remaining_time": "0:00:00"}
1561
+ {"current_steps": 1560, "total_steps": 1560, "epoch": 2.99712, "percentage": 100.0, "elapsed_time": "4:01:21", "remaining_time": "0:00:00"}