yuzhounie commited on
Commit
61f03d1
·
verified ·
1 Parent(s): 6020c5e

Training in progress, step 1600

Browse files
model-00001-of-00004.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:141477d56c7dc6b88a976fc707e88dc20695fce810b7f380fa156fc68f16ec76
3
  size 4877660776
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:9be3b6a41b0ce05d80d6903f549e820472e0b908599e49b8dab71d6fee82275e
3
  size 4877660776
model-00002-of-00004.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:cc4caf783d6635cc98624be5290882818bc33794834a1e85b9cda5ecd5ff283d
3
  size 4932751008
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ce7c5ce0a2ea4c63c9a193414ee30f823d96c672e74ec475533255fef55cd2f4
3
  size 4932751008
model-00003-of-00004.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:35dfa44a8001f4d9e7cbb3e7b8685bde5dfc4f085a951354a10de0f891413faa
3
  size 4330865200
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:464de9af4b49a93b5aaedc9e30151b924ff14812684c6c8bbd71fecb534fa141
3
  size 4330865200
model-00004-of-00004.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:e3e83c92c7e62b377b3896576ede3701d478282c72da70191f5419cd9f4b41e3
3
  size 1089994880
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:73a708e88799b98c4c296d3a3c1cf1ed10d0cdbd940d62fa6203bf1d549cc3fc
3
  size 1089994880
trainer_log.jsonl CHANGED
@@ -1212,3 +1212,404 @@
1212
  {"current_steps": 1212, "total_steps": 2148, "loss": 0.4912, "lr": 4.7603686460252265e-06, "epoch": 1.6919321088119044, "percentage": 56.42, "elapsed_time": "2:49:38", "remaining_time": "2:11:00"}
1213
  {"current_steps": 1213, "total_steps": 2148, "loss": 0.464, "lr": 4.75225209444569e-06, "epoch": 1.6933271332248314, "percentage": 56.47, "elapsed_time": "2:49:44", "remaining_time": "2:10:50"}
1214
  {"current_steps": 1214, "total_steps": 2148, "loss": 0.5325, "lr": 4.744136197270135e-06, "epoch": 1.6947221576377587, "percentage": 56.52, "elapsed_time": "2:49:54", "remaining_time": "2:10:43"}
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1212
  {"current_steps": 1212, "total_steps": 2148, "loss": 0.4912, "lr": 4.7603686460252265e-06, "epoch": 1.6919321088119044, "percentage": 56.42, "elapsed_time": "2:49:38", "remaining_time": "2:11:00"}
1213
  {"current_steps": 1213, "total_steps": 2148, "loss": 0.464, "lr": 4.75225209444569e-06, "epoch": 1.6933271332248314, "percentage": 56.47, "elapsed_time": "2:49:44", "remaining_time": "2:10:50"}
1214
  {"current_steps": 1214, "total_steps": 2148, "loss": 0.5325, "lr": 4.744136197270135e-06, "epoch": 1.6947221576377587, "percentage": 56.52, "elapsed_time": "2:49:54", "remaining_time": "2:10:43"}
1215
+ {"current_steps": 1215, "total_steps": 2148, "loss": 0.4799, "lr": 4.736020975935981e-06, "epoch": 1.6961171820506857, "percentage": 56.56, "elapsed_time": "2:50:01", "remaining_time": "2:10:33"}
1216
+ {"current_steps": 1216, "total_steps": 2148, "loss": 0.4379, "lr": 4.72790645187886e-06, "epoch": 1.697512206463613, "percentage": 56.61, "elapsed_time": "2:50:08", "remaining_time": "2:10:24"}
1217
+ {"current_steps": 1217, "total_steps": 2148, "loss": 0.4568, "lr": 4.7197926465325626e-06, "epoch": 1.6989072308765403, "percentage": 56.66, "elapsed_time": "2:50:14", "remaining_time": "2:10:13"}
1218
+ {"current_steps": 1218, "total_steps": 2148, "loss": 0.4844, "lr": 4.711679581328983e-06, "epoch": 1.7003022552894675, "percentage": 56.7, "elapsed_time": "2:50:22", "remaining_time": "2:10:05"}
1219
+ {"current_steps": 1219, "total_steps": 2148, "loss": 0.5517, "lr": 4.703567277698058e-06, "epoch": 1.7016972797023948, "percentage": 56.75, "elapsed_time": "2:50:30", "remaining_time": "2:09:56"}
1220
+ {"current_steps": 1220, "total_steps": 2148, "loss": 0.4494, "lr": 4.695455757067712e-06, "epoch": 1.703092304115322, "percentage": 56.8, "elapsed_time": "2:50:39", "remaining_time": "2:09:48"}
1221
+ {"current_steps": 1221, "total_steps": 2148, "loss": 0.4841, "lr": 4.687345040863808e-06, "epoch": 1.7044873285282494, "percentage": 56.84, "elapsed_time": "2:50:47", "remaining_time": "2:09:39"}
1222
+ {"current_steps": 1222, "total_steps": 2148, "loss": 0.4329, "lr": 4.679235150510072e-06, "epoch": 1.7058823529411766, "percentage": 56.89, "elapsed_time": "2:50:55", "remaining_time": "2:09:31"}
1223
+ {"current_steps": 1223, "total_steps": 2148, "loss": 0.4774, "lr": 4.671126107428061e-06, "epoch": 1.7072773773541037, "percentage": 56.94, "elapsed_time": "2:51:02", "remaining_time": "2:09:22"}
1224
+ {"current_steps": 1224, "total_steps": 2148, "loss": 0.4623, "lr": 4.663017933037087e-06, "epoch": 1.708672401767031, "percentage": 56.98, "elapsed_time": "2:51:11", "remaining_time": "2:09:14"}
1225
+ {"current_steps": 1225, "total_steps": 2148, "loss": 0.4922, "lr": 4.6549106487541666e-06, "epoch": 1.710067426179958, "percentage": 57.03, "elapsed_time": "2:51:18", "remaining_time": "2:09:04"}
1226
+ {"current_steps": 1226, "total_steps": 2148, "loss": 0.4598, "lr": 4.646804275993971e-06, "epoch": 1.7114624505928853, "percentage": 57.08, "elapsed_time": "2:51:25", "remaining_time": "2:08:55"}
1227
+ {"current_steps": 1227, "total_steps": 2148, "loss": 0.4517, "lr": 4.63869883616876e-06, "epoch": 1.7128574750058125, "percentage": 57.12, "elapsed_time": "2:51:34", "remaining_time": "2:08:47"}
1228
+ {"current_steps": 1228, "total_steps": 2148, "loss": 0.4974, "lr": 4.630594350688327e-06, "epoch": 1.7142524994187398, "percentage": 57.17, "elapsed_time": "2:51:42", "remaining_time": "2:08:38"}
1229
+ {"current_steps": 1229, "total_steps": 2148, "loss": 0.464, "lr": 4.62249084095995e-06, "epoch": 1.715647523831667, "percentage": 57.22, "elapsed_time": "2:51:48", "remaining_time": "2:08:28"}
1230
+ {"current_steps": 1230, "total_steps": 2148, "loss": 0.5124, "lr": 4.614388328388327e-06, "epoch": 1.7170425482445943, "percentage": 57.26, "elapsed_time": "2:51:55", "remaining_time": "2:08:18"}
1231
+ {"current_steps": 1231, "total_steps": 2148, "loss": 0.498, "lr": 4.606286834375517e-06, "epoch": 1.7184375726575216, "percentage": 57.31, "elapsed_time": "2:52:03", "remaining_time": "2:08:10"}
1232
+ {"current_steps": 1232, "total_steps": 2148, "loss": 0.4357, "lr": 4.598186380320899e-06, "epoch": 1.7198325970704489, "percentage": 57.36, "elapsed_time": "2:52:14", "remaining_time": "2:08:03"}
1233
+ {"current_steps": 1233, "total_steps": 2148, "loss": 0.4807, "lr": 4.5900869876210986e-06, "epoch": 1.721227621483376, "percentage": 57.4, "elapsed_time": "2:52:20", "remaining_time": "2:07:53"}
1234
+ {"current_steps": 1234, "total_steps": 2148, "loss": 0.5156, "lr": 4.581988677669935e-06, "epoch": 1.7226226458963032, "percentage": 57.45, "elapsed_time": "2:52:29", "remaining_time": "2:07:45"}
1235
+ {"current_steps": 1235, "total_steps": 2148, "loss": 0.4841, "lr": 4.573891471858375e-06, "epoch": 1.7240176703092303, "percentage": 57.5, "elapsed_time": "2:52:38", "remaining_time": "2:07:37"}
1236
+ {"current_steps": 1236, "total_steps": 2148, "loss": 0.4742, "lr": 4.565795391574465e-06, "epoch": 1.7254126947221575, "percentage": 57.54, "elapsed_time": "2:52:48", "remaining_time": "2:07:30"}
1237
+ {"current_steps": 1237, "total_steps": 2148, "loss": 0.4483, "lr": 4.5577004582032745e-06, "epoch": 1.7268077191350848, "percentage": 57.59, "elapsed_time": "2:52:55", "remaining_time": "2:07:21"}
1238
+ {"current_steps": 1238, "total_steps": 2148, "loss": 0.464, "lr": 4.549606693126851e-06, "epoch": 1.728202743548012, "percentage": 57.64, "elapsed_time": "2:53:05", "remaining_time": "2:07:13"}
1239
+ {"current_steps": 1239, "total_steps": 2148, "loss": 0.5271, "lr": 4.541514117724155e-06, "epoch": 1.7295977679609393, "percentage": 57.68, "elapsed_time": "2:53:14", "remaining_time": "2:07:06"}
1240
+ {"current_steps": 1240, "total_steps": 2148, "loss": 0.4246, "lr": 4.533422753370995e-06, "epoch": 1.7309927923738666, "percentage": 57.73, "elapsed_time": "2:53:25", "remaining_time": "2:06:59"}
1241
+ {"current_steps": 1241, "total_steps": 2148, "loss": 0.4876, "lr": 4.525332621439995e-06, "epoch": 1.7323878167867939, "percentage": 57.77, "elapsed_time": "2:53:35", "remaining_time": "2:06:51"}
1242
+ {"current_steps": 1242, "total_steps": 2148, "loss": 0.4195, "lr": 4.517243743300513e-06, "epoch": 1.7337828411997211, "percentage": 57.82, "elapsed_time": "2:53:43", "remaining_time": "2:06:43"}
1243
+ {"current_steps": 1243, "total_steps": 2148, "loss": 0.5121, "lr": 4.5091561403185976e-06, "epoch": 1.7351778656126482, "percentage": 57.87, "elapsed_time": "2:53:53", "remaining_time": "2:06:36"}
1244
+ {"current_steps": 1244, "total_steps": 2148, "loss": 0.4635, "lr": 4.501069833856934e-06, "epoch": 1.7365728900255755, "percentage": 57.91, "elapsed_time": "2:54:00", "remaining_time": "2:06:27"}
1245
+ {"current_steps": 1245, "total_steps": 2148, "loss": 0.4337, "lr": 4.492984845274774e-06, "epoch": 1.7379679144385025, "percentage": 57.96, "elapsed_time": "2:54:07", "remaining_time": "2:06:17"}
1246
+ {"current_steps": 1246, "total_steps": 2148, "loss": 0.4648, "lr": 4.484901195927901e-06, "epoch": 1.7393629388514298, "percentage": 58.01, "elapsed_time": "2:54:14", "remaining_time": "2:06:08"}
1247
+ {"current_steps": 1247, "total_steps": 2148, "loss": 0.4183, "lr": 4.476818907168545e-06, "epoch": 1.740757963264357, "percentage": 58.05, "elapsed_time": "2:54:21", "remaining_time": "2:05:58"}
1248
+ {"current_steps": 1248, "total_steps": 2148, "loss": 0.4416, "lr": 4.4687380003453555e-06, "epoch": 1.7421529876772843, "percentage": 58.1, "elapsed_time": "2:54:30", "remaining_time": "2:05:50"}
1249
+ {"current_steps": 1249, "total_steps": 2148, "loss": 0.4772, "lr": 4.460658496803327e-06, "epoch": 1.7435480120902116, "percentage": 58.15, "elapsed_time": "2:54:39", "remaining_time": "2:05:43"}
1250
+ {"current_steps": 1250, "total_steps": 2148, "loss": 0.461, "lr": 4.4525804178837425e-06, "epoch": 1.7449430365031389, "percentage": 58.19, "elapsed_time": "2:54:53", "remaining_time": "2:05:38"}
1251
+ {"current_steps": 1251, "total_steps": 2148, "loss": 0.5024, "lr": 4.4445037849241305e-06, "epoch": 1.7463380609160661, "percentage": 58.24, "elapsed_time": "2:55:01", "remaining_time": "2:05:29"}
1252
+ {"current_steps": 1252, "total_steps": 2148, "loss": 0.4752, "lr": 4.436428619258196e-06, "epoch": 1.7477330853289934, "percentage": 58.29, "elapsed_time": "2:55:07", "remaining_time": "2:05:19"}
1253
+ {"current_steps": 1253, "total_steps": 2148, "loss": 0.4422, "lr": 4.428354942215766e-06, "epoch": 1.7491281097419205, "percentage": 58.33, "elapsed_time": "2:55:14", "remaining_time": "2:05:10"}
1254
+ {"current_steps": 1254, "total_steps": 2148, "loss": 0.4488, "lr": 4.42028277512274e-06, "epoch": 1.7505231341548477, "percentage": 58.38, "elapsed_time": "2:55:26", "remaining_time": "2:05:04"}
1255
+ {"current_steps": 1255, "total_steps": 2148, "loss": 0.4928, "lr": 4.412212139301027e-06, "epoch": 1.7519181585677748, "percentage": 58.43, "elapsed_time": "2:55:33", "remaining_time": "2:04:55"}
1256
+ {"current_steps": 1256, "total_steps": 2148, "loss": 0.4084, "lr": 4.404143056068489e-06, "epoch": 1.753313182980702, "percentage": 58.47, "elapsed_time": "2:55:41", "remaining_time": "2:04:46"}
1257
+ {"current_steps": 1257, "total_steps": 2148, "loss": 0.475, "lr": 4.3960755467388916e-06, "epoch": 1.7547082073936293, "percentage": 58.52, "elapsed_time": "2:55:51", "remaining_time": "2:04:39"}
1258
+ {"current_steps": 1258, "total_steps": 2148, "loss": 0.5112, "lr": 4.388009632621841e-06, "epoch": 1.7561032318065566, "percentage": 58.57, "elapsed_time": "2:56:02", "remaining_time": "2:04:33"}
1259
+ {"current_steps": 1259, "total_steps": 2148, "loss": 0.4698, "lr": 4.379945335022727e-06, "epoch": 1.7574982562194839, "percentage": 58.61, "elapsed_time": "2:56:10", "remaining_time": "2:04:23"}
1260
+ {"current_steps": 1260, "total_steps": 2148, "loss": 0.5002, "lr": 4.371882675242674e-06, "epoch": 1.7588932806324111, "percentage": 58.66, "elapsed_time": "2:56:23", "remaining_time": "2:04:19"}
1261
+ {"current_steps": 1261, "total_steps": 2148, "loss": 0.5113, "lr": 4.363821674578479e-06, "epoch": 1.7602883050453384, "percentage": 58.71, "elapsed_time": "2:56:34", "remaining_time": "2:04:12"}
1262
+ {"current_steps": 1262, "total_steps": 2148, "loss": 0.4511, "lr": 4.355762354322552e-06, "epoch": 1.7616833294582657, "percentage": 58.75, "elapsed_time": "2:56:42", "remaining_time": "2:04:03"}
1263
+ {"current_steps": 1263, "total_steps": 2148, "loss": 0.496, "lr": 4.347704735762872e-06, "epoch": 1.7630783538711927, "percentage": 58.8, "elapsed_time": "2:56:51", "remaining_time": "2:03:55"}
1264
+ {"current_steps": 1264, "total_steps": 2148, "loss": 0.4827, "lr": 4.339648840182919e-06, "epoch": 1.76447337828412, "percentage": 58.85, "elapsed_time": "2:57:03", "remaining_time": "2:03:49"}
1265
+ {"current_steps": 1265, "total_steps": 2148, "loss": 0.4674, "lr": 4.331594688861619e-06, "epoch": 1.765868402697047, "percentage": 58.89, "elapsed_time": "2:57:12", "remaining_time": "2:03:41"}
1266
+ {"current_steps": 1266, "total_steps": 2148, "loss": 0.4453, "lr": 4.323542303073297e-06, "epoch": 1.7672634271099743, "percentage": 58.94, "elapsed_time": "2:57:18", "remaining_time": "2:03:31"}
1267
+ {"current_steps": 1267, "total_steps": 2148, "loss": 0.4546, "lr": 4.315491704087613e-06, "epoch": 1.7686584515229016, "percentage": 58.99, "elapsed_time": "2:57:26", "remaining_time": "2:03:22"}
1268
+ {"current_steps": 1268, "total_steps": 2148, "loss": 0.4644, "lr": 4.3074429131695e-06, "epoch": 1.7700534759358288, "percentage": 59.03, "elapsed_time": "2:57:34", "remaining_time": "2:03:14"}
1269
+ {"current_steps": 1269, "total_steps": 2148, "loss": 0.468, "lr": 4.299395951579126e-06, "epoch": 1.7714485003487561, "percentage": 59.08, "elapsed_time": "2:57:40", "remaining_time": "2:03:04"}
1270
+ {"current_steps": 1270, "total_steps": 2148, "loss": 0.4304, "lr": 4.291350840571821e-06, "epoch": 1.7728435247616834, "percentage": 59.12, "elapsed_time": "2:57:47", "remaining_time": "2:02:55"}
1271
+ {"current_steps": 1271, "total_steps": 2148, "loss": 0.4824, "lr": 4.283307601398026e-06, "epoch": 1.7742385491746107, "percentage": 59.17, "elapsed_time": "2:57:54", "remaining_time": "2:02:45"}
1272
+ {"current_steps": 1272, "total_steps": 2148, "loss": 0.4915, "lr": 4.275266255303238e-06, "epoch": 1.775633573587538, "percentage": 59.22, "elapsed_time": "2:58:01", "remaining_time": "2:02:36"}
1273
+ {"current_steps": 1273, "total_steps": 2148, "loss": 0.4629, "lr": 4.2672268235279616e-06, "epoch": 1.777028598000465, "percentage": 59.26, "elapsed_time": "2:58:12", "remaining_time": "2:02:29"}
1274
+ {"current_steps": 1274, "total_steps": 2148, "loss": 0.4784, "lr": 4.259189327307632e-06, "epoch": 1.7784236224133922, "percentage": 59.31, "elapsed_time": "2:58:18", "remaining_time": "2:02:19"}
1275
+ {"current_steps": 1275, "total_steps": 2148, "loss": 0.4803, "lr": 4.251153787872579e-06, "epoch": 1.7798186468263193, "percentage": 59.36, "elapsed_time": "2:58:25", "remaining_time": "2:02:10"}
1276
+ {"current_steps": 1276, "total_steps": 2148, "loss": 0.4586, "lr": 4.2431202264479665e-06, "epoch": 1.7812136712392466, "percentage": 59.4, "elapsed_time": "2:58:32", "remaining_time": "2:02:01"}
1277
+ {"current_steps": 1277, "total_steps": 2148, "loss": 0.5089, "lr": 4.235088664253726e-06, "epoch": 1.7826086956521738, "percentage": 59.45, "elapsed_time": "2:58:42", "remaining_time": "2:01:53"}
1278
+ {"current_steps": 1278, "total_steps": 2148, "loss": 0.485, "lr": 4.227059122504514e-06, "epoch": 1.784003720065101, "percentage": 59.5, "elapsed_time": "2:58:50", "remaining_time": "2:01:45"}
1279
+ {"current_steps": 1279, "total_steps": 2148, "loss": 0.4446, "lr": 4.21903162240965e-06, "epoch": 1.7853987444780284, "percentage": 59.54, "elapsed_time": "2:58:57", "remaining_time": "2:01:35"}
1280
+ {"current_steps": 1280, "total_steps": 2148, "loss": 0.5088, "lr": 4.211006185173056e-06, "epoch": 1.7867937688909556, "percentage": 59.59, "elapsed_time": "2:59:04", "remaining_time": "2:01:25"}
1281
+ {"current_steps": 1281, "total_steps": 2148, "loss": 0.425, "lr": 4.20298283199321e-06, "epoch": 1.788188793303883, "percentage": 59.64, "elapsed_time": "2:59:11", "remaining_time": "2:01:16"}
1282
+ {"current_steps": 1282, "total_steps": 2148, "loss": 0.4653, "lr": 4.1949615840630845e-06, "epoch": 1.7895838177168102, "percentage": 59.68, "elapsed_time": "2:59:18", "remaining_time": "2:01:07"}
1283
+ {"current_steps": 1283, "total_steps": 2148, "loss": 0.5048, "lr": 4.186942462570087e-06, "epoch": 1.7909788421297372, "percentage": 59.73, "elapsed_time": "2:59:26", "remaining_time": "2:00:58"}
1284
+ {"current_steps": 1284, "total_steps": 2148, "loss": 0.4903, "lr": 4.178925488696012e-06, "epoch": 1.7923738665426645, "percentage": 59.78, "elapsed_time": "2:59:32", "remaining_time": "2:00:49"}
1285
+ {"current_steps": 1285, "total_steps": 2148, "loss": 0.4688, "lr": 4.170910683616985e-06, "epoch": 1.7937688909555918, "percentage": 59.82, "elapsed_time": "2:59:41", "remaining_time": "2:00:40"}
1286
+ {"current_steps": 1286, "total_steps": 2148, "loss": 0.5185, "lr": 4.1628980685033914e-06, "epoch": 1.7951639153685188, "percentage": 59.87, "elapsed_time": "2:59:51", "remaining_time": "2:00:33"}
1287
+ {"current_steps": 1287, "total_steps": 2148, "loss": 0.4881, "lr": 4.154887664519842e-06, "epoch": 1.796558939781446, "percentage": 59.92, "elapsed_time": "3:00:01", "remaining_time": "2:00:26"}
1288
+ {"current_steps": 1288, "total_steps": 2148, "loss": 0.4673, "lr": 4.1468794928251064e-06, "epoch": 1.7979539641943734, "percentage": 59.96, "elapsed_time": "3:00:09", "remaining_time": "2:00:17"}
1289
+ {"current_steps": 1289, "total_steps": 2148, "loss": 0.4747, "lr": 4.138873574572053e-06, "epoch": 1.7993489886073006, "percentage": 60.01, "elapsed_time": "3:00:15", "remaining_time": "2:00:07"}
1290
+ {"current_steps": 1290, "total_steps": 2148, "loss": 0.4159, "lr": 4.130869930907599e-06, "epoch": 1.800744013020228, "percentage": 60.06, "elapsed_time": "3:00:22", "remaining_time": "1:59:58"}
1291
+ {"current_steps": 1291, "total_steps": 2148, "loss": 0.469, "lr": 4.122868582972659e-06, "epoch": 1.8021390374331552, "percentage": 60.1, "elapsed_time": "3:00:29", "remaining_time": "1:59:48"}
1292
+ {"current_steps": 1292, "total_steps": 2148, "loss": 0.4282, "lr": 4.114869551902075e-06, "epoch": 1.8035340618460824, "percentage": 60.15, "elapsed_time": "3:00:38", "remaining_time": "1:59:40"}
1293
+ {"current_steps": 1293, "total_steps": 2148, "loss": 0.4554, "lr": 4.106872858824576e-06, "epoch": 1.8049290862590095, "percentage": 60.2, "elapsed_time": "3:00:44", "remaining_time": "1:59:31"}
1294
+ {"current_steps": 1294, "total_steps": 2148, "loss": 0.4981, "lr": 4.098878524862715e-06, "epoch": 1.8063241106719368, "percentage": 60.24, "elapsed_time": "3:00:53", "remaining_time": "1:59:23"}
1295
+ {"current_steps": 1295, "total_steps": 2148, "loss": 0.5648, "lr": 4.090886571132807e-06, "epoch": 1.807719135084864, "percentage": 60.29, "elapsed_time": "3:01:02", "remaining_time": "1:59:15"}
1296
+ {"current_steps": 1296, "total_steps": 2148, "loss": 0.4966, "lr": 4.082897018744887e-06, "epoch": 1.809114159497791, "percentage": 60.34, "elapsed_time": "3:01:09", "remaining_time": "1:59:05"}
1297
+ {"current_steps": 1297, "total_steps": 2148, "loss": 0.5033, "lr": 4.074909888802648e-06, "epoch": 1.8105091839107184, "percentage": 60.38, "elapsed_time": "3:01:15", "remaining_time": "1:58:55"}
1298
+ {"current_steps": 1298, "total_steps": 2148, "loss": 0.4183, "lr": 4.066925202403374e-06, "epoch": 1.8119042083236456, "percentage": 60.43, "elapsed_time": "3:01:23", "remaining_time": "1:58:46"}
1299
+ {"current_steps": 1299, "total_steps": 2148, "loss": 0.4835, "lr": 4.058942980637906e-06, "epoch": 1.813299232736573, "percentage": 60.47, "elapsed_time": "3:01:29", "remaining_time": "1:58:37"}
1300
+ {"current_steps": 1300, "total_steps": 2148, "loss": 0.4369, "lr": 4.050963244590571e-06, "epoch": 1.8146942571495002, "percentage": 60.52, "elapsed_time": "3:01:37", "remaining_time": "1:58:28"}
1301
+ {"current_steps": 1301, "total_steps": 2148, "loss": 0.4705, "lr": 4.042986015339126e-06, "epoch": 1.8160892815624274, "percentage": 60.57, "elapsed_time": "3:01:46", "remaining_time": "1:58:20"}
1302
+ {"current_steps": 1302, "total_steps": 2148, "loss": 0.4826, "lr": 4.035011313954713e-06, "epoch": 1.8174843059753547, "percentage": 60.61, "elapsed_time": "3:01:53", "remaining_time": "1:58:11"}
1303
+ {"current_steps": 1303, "total_steps": 2148, "loss": 0.4077, "lr": 4.027039161501795e-06, "epoch": 1.8188793303882818, "percentage": 60.66, "elapsed_time": "3:01:59", "remaining_time": "1:58:01"}
1304
+ {"current_steps": 1304, "total_steps": 2148, "loss": 0.4615, "lr": 4.019069579038096e-06, "epoch": 1.820274354801209, "percentage": 60.71, "elapsed_time": "3:02:07", "remaining_time": "1:57:52"}
1305
+ {"current_steps": 1305, "total_steps": 2148, "loss": 0.427, "lr": 4.011102587614563e-06, "epoch": 1.8216693792141363, "percentage": 60.75, "elapsed_time": "3:02:15", "remaining_time": "1:57:44"}
1306
+ {"current_steps": 1306, "total_steps": 2148, "loss": 0.4925, "lr": 4.00313820827529e-06, "epoch": 1.8230644036270633, "percentage": 60.8, "elapsed_time": "3:02:28", "remaining_time": "1:57:38"}
1307
+ {"current_steps": 1307, "total_steps": 2148, "loss": 0.5266, "lr": 3.995176462057473e-06, "epoch": 1.8244594280399906, "percentage": 60.85, "elapsed_time": "3:02:42", "remaining_time": "1:57:33"}
1308
+ {"current_steps": 1308, "total_steps": 2148, "loss": 0.4703, "lr": 3.987217369991357e-06, "epoch": 1.8258544524529179, "percentage": 60.89, "elapsed_time": "3:02:51", "remaining_time": "1:57:25"}
1309
+ {"current_steps": 1309, "total_steps": 2148, "loss": 0.4721, "lr": 3.979260953100169e-06, "epoch": 1.8272494768658452, "percentage": 60.94, "elapsed_time": "3:02:59", "remaining_time": "1:57:17"}
1310
+ {"current_steps": 1310, "total_steps": 2148, "loss": 0.4539, "lr": 3.97130723240008e-06, "epoch": 1.8286445012787724, "percentage": 60.99, "elapsed_time": "3:03:06", "remaining_time": "1:57:08"}
1311
+ {"current_steps": 1311, "total_steps": 2148, "loss": 0.4988, "lr": 3.96335622890013e-06, "epoch": 1.8300395256916997, "percentage": 61.03, "elapsed_time": "3:03:17", "remaining_time": "1:57:01"}
1312
+ {"current_steps": 1312, "total_steps": 2148, "loss": 0.4765, "lr": 3.955407963602184e-06, "epoch": 1.831434550104627, "percentage": 61.08, "elapsed_time": "3:03:24", "remaining_time": "1:56:52"}
1313
+ {"current_steps": 1313, "total_steps": 2148, "loss": 0.4583, "lr": 3.94746245750088e-06, "epoch": 1.832829574517554, "percentage": 61.13, "elapsed_time": "3:03:32", "remaining_time": "1:56:43"}
1314
+ {"current_steps": 1314, "total_steps": 2148, "loss": 0.4851, "lr": 3.939519731583557e-06, "epoch": 1.8342245989304813, "percentage": 61.17, "elapsed_time": "3:03:39", "remaining_time": "1:56:34"}
1315
+ {"current_steps": 1315, "total_steps": 2148, "loss": 0.4367, "lr": 3.9315798068302214e-06, "epoch": 1.8356196233434086, "percentage": 61.22, "elapsed_time": "3:03:49", "remaining_time": "1:56:26"}
1316
+ {"current_steps": 1316, "total_steps": 2148, "loss": 0.4948, "lr": 3.923642704213475e-06, "epoch": 1.8370146477563356, "percentage": 61.27, "elapsed_time": "3:03:59", "remaining_time": "1:56:19"}
1317
+ {"current_steps": 1317, "total_steps": 2148, "loss": 0.4911, "lr": 3.915708444698465e-06, "epoch": 1.8384096721692629, "percentage": 61.31, "elapsed_time": "3:04:06", "remaining_time": "1:56:10"}
1318
+ {"current_steps": 1318, "total_steps": 2148, "loss": 0.4578, "lr": 3.907777049242828e-06, "epoch": 1.8398046965821901, "percentage": 61.36, "elapsed_time": "3:04:14", "remaining_time": "1:56:01"}
1319
+ {"current_steps": 1319, "total_steps": 2148, "loss": 0.4772, "lr": 3.899848538796643e-06, "epoch": 1.8411997209951174, "percentage": 61.41, "elapsed_time": "3:04:21", "remaining_time": "1:55:52"}
1320
+ {"current_steps": 1320, "total_steps": 2148, "loss": 0.4897, "lr": 3.891922934302356e-06, "epoch": 1.8425947454080447, "percentage": 61.45, "elapsed_time": "3:04:33", "remaining_time": "1:55:46"}
1321
+ {"current_steps": 1321, "total_steps": 2148, "loss": 0.4872, "lr": 3.884000256694749e-06, "epoch": 1.843989769820972, "percentage": 61.5, "elapsed_time": "3:04:40", "remaining_time": "1:55:36"}
1322
+ {"current_steps": 1322, "total_steps": 2148, "loss": 0.5054, "lr": 3.876080526900867e-06, "epoch": 1.8453847942338992, "percentage": 61.55, "elapsed_time": "3:04:46", "remaining_time": "1:55:27"}
1323
+ {"current_steps": 1323, "total_steps": 2148, "loss": 0.4731, "lr": 3.868163765839966e-06, "epoch": 1.8467798186468263, "percentage": 61.59, "elapsed_time": "3:04:53", "remaining_time": "1:55:17"}
1324
+ {"current_steps": 1324, "total_steps": 2148, "loss": 0.4723, "lr": 3.860249994423467e-06, "epoch": 1.8481748430597535, "percentage": 61.64, "elapsed_time": "3:05:01", "remaining_time": "1:55:08"}
1325
+ {"current_steps": 1325, "total_steps": 2148, "loss": 0.4587, "lr": 3.852339233554891e-06, "epoch": 1.8495698674726808, "percentage": 61.69, "elapsed_time": "3:05:11", "remaining_time": "1:55:01"}
1326
+ {"current_steps": 1326, "total_steps": 2148, "loss": 0.5112, "lr": 3.844431504129804e-06, "epoch": 1.8509648918856079, "percentage": 61.73, "elapsed_time": "3:05:19", "remaining_time": "1:54:52"}
1327
+ {"current_steps": 1327, "total_steps": 2148, "loss": 0.4793, "lr": 3.8365268270357715e-06, "epoch": 1.8523599162985351, "percentage": 61.78, "elapsed_time": "3:05:30", "remaining_time": "1:54:46"}
1328
+ {"current_steps": 1328, "total_steps": 2148, "loss": 0.4653, "lr": 3.828625223152291e-06, "epoch": 1.8537549407114624, "percentage": 61.82, "elapsed_time": "3:05:37", "remaining_time": "1:54:36"}
1329
+ {"current_steps": 1329, "total_steps": 2148, "loss": 0.4625, "lr": 3.820726713350742e-06, "epoch": 1.8551499651243897, "percentage": 61.87, "elapsed_time": "3:05:47", "remaining_time": "1:54:29"}
1330
+ {"current_steps": 1330, "total_steps": 2148, "loss": 0.4897, "lr": 3.812831318494335e-06, "epoch": 1.856544989537317, "percentage": 61.92, "elapsed_time": "3:05:53", "remaining_time": "1:54:20"}
1331
+ {"current_steps": 1331, "total_steps": 2148, "loss": 0.4686, "lr": 3.804939059438052e-06, "epoch": 1.8579400139502442, "percentage": 61.96, "elapsed_time": "3:06:00", "remaining_time": "1:54:10"}
1332
+ {"current_steps": 1332, "total_steps": 2148, "loss": 0.4763, "lr": 3.797049957028588e-06, "epoch": 1.8593350383631715, "percentage": 62.01, "elapsed_time": "3:06:06", "remaining_time": "1:54:00"}
1333
+ {"current_steps": 1333, "total_steps": 2148, "loss": 0.421, "lr": 3.7891640321043054e-06, "epoch": 1.8607300627760985, "percentage": 62.06, "elapsed_time": "3:06:15", "remaining_time": "1:53:52"}
1334
+ {"current_steps": 1334, "total_steps": 2148, "loss": 0.419, "lr": 3.781281305495171e-06, "epoch": 1.8621250871890258, "percentage": 62.1, "elapsed_time": "3:06:21", "remaining_time": "1:53:43"}
1335
+ {"current_steps": 1335, "total_steps": 2148, "loss": 0.4321, "lr": 3.773401798022701e-06, "epoch": 1.863520111601953, "percentage": 62.15, "elapsed_time": "3:06:30", "remaining_time": "1:53:34"}
1336
+ {"current_steps": 1336, "total_steps": 2148, "loss": 0.4628, "lr": 3.765525530499915e-06, "epoch": 1.8649151360148801, "percentage": 62.2, "elapsed_time": "3:06:36", "remaining_time": "1:53:24"}
1337
+ {"current_steps": 1337, "total_steps": 2148, "loss": 0.4195, "lr": 3.757652523731269e-06, "epoch": 1.8663101604278074, "percentage": 62.24, "elapsed_time": "3:06:42", "remaining_time": "1:53:15"}
1338
+ {"current_steps": 1338, "total_steps": 2148, "loss": 0.4481, "lr": 3.7497827985126054e-06, "epoch": 1.8677051848407347, "percentage": 62.29, "elapsed_time": "3:06:54", "remaining_time": "1:53:09"}
1339
+ {"current_steps": 1339, "total_steps": 2148, "loss": 0.4319, "lr": 3.741916375631105e-06, "epoch": 1.869100209253662, "percentage": 62.34, "elapsed_time": "3:07:02", "remaining_time": "1:53:00"}
1340
+ {"current_steps": 1340, "total_steps": 2148, "loss": 0.5306, "lr": 3.7340532758652217e-06, "epoch": 1.8704952336665892, "percentage": 62.38, "elapsed_time": "3:07:10", "remaining_time": "1:52:52"}
1341
+ {"current_steps": 1341, "total_steps": 2148, "loss": 0.4423, "lr": 3.7261935199846266e-06, "epoch": 1.8718902580795165, "percentage": 62.43, "elapsed_time": "3:07:16", "remaining_time": "1:52:42"}
1342
+ {"current_steps": 1342, "total_steps": 2148, "loss": 0.4592, "lr": 3.7183371287501684e-06, "epoch": 1.8732852824924437, "percentage": 62.48, "elapsed_time": "3:07:24", "remaining_time": "1:52:33"}
1343
+ {"current_steps": 1343, "total_steps": 2148, "loss": 0.4831, "lr": 3.7104841229138034e-06, "epoch": 1.8746803069053708, "percentage": 62.52, "elapsed_time": "3:07:31", "remaining_time": "1:52:24"}
1344
+ {"current_steps": 1344, "total_steps": 2148, "loss": 0.4368, "lr": 3.7026345232185416e-06, "epoch": 1.876075331318298, "percentage": 62.57, "elapsed_time": "3:07:39", "remaining_time": "1:52:15"}
1345
+ {"current_steps": 1345, "total_steps": 2148, "loss": 0.4429, "lr": 3.6947883503984037e-06, "epoch": 1.8774703557312253, "percentage": 62.62, "elapsed_time": "3:07:49", "remaining_time": "1:52:08"}
1346
+ {"current_steps": 1346, "total_steps": 2148, "loss": 0.4477, "lr": 3.686945625178356e-06, "epoch": 1.8788653801441524, "percentage": 62.66, "elapsed_time": "3:08:00", "remaining_time": "1:52:01"}
1347
+ {"current_steps": 1347, "total_steps": 2148, "loss": 0.4897, "lr": 3.6791063682742535e-06, "epoch": 1.8802604045570797, "percentage": 62.71, "elapsed_time": "3:08:06", "remaining_time": "1:51:51"}
1348
+ {"current_steps": 1348, "total_steps": 2148, "loss": 0.464, "lr": 3.6712706003927937e-06, "epoch": 1.881655428970007, "percentage": 62.76, "elapsed_time": "3:08:13", "remaining_time": "1:51:42"}
1349
+ {"current_steps": 1349, "total_steps": 2148, "loss": 0.4415, "lr": 3.6634383422314622e-06, "epoch": 1.8830504533829342, "percentage": 62.8, "elapsed_time": "3:08:24", "remaining_time": "1:51:35"}
1350
+ {"current_steps": 1350, "total_steps": 2148, "loss": 0.5069, "lr": 3.655609614478467e-06, "epoch": 1.8844454777958615, "percentage": 62.85, "elapsed_time": "3:08:32", "remaining_time": "1:51:27"}
1351
+ {"current_steps": 1351, "total_steps": 2148, "loss": 0.4889, "lr": 3.647784437812693e-06, "epoch": 1.8858405022087887, "percentage": 62.9, "elapsed_time": "3:08:41", "remaining_time": "1:51:18"}
1352
+ {"current_steps": 1352, "total_steps": 2148, "loss": 0.4978, "lr": 3.6399628329036496e-06, "epoch": 1.887235526621716, "percentage": 62.94, "elapsed_time": "3:08:50", "remaining_time": "1:51:10"}
1353
+ {"current_steps": 1353, "total_steps": 2148, "loss": 0.4004, "lr": 3.632144820411405e-06, "epoch": 1.888630551034643, "percentage": 62.99, "elapsed_time": "3:08:56", "remaining_time": "1:51:00"}
1354
+ {"current_steps": 1354, "total_steps": 2148, "loss": 0.4244, "lr": 3.624330420986541e-06, "epoch": 1.8900255754475703, "percentage": 63.04, "elapsed_time": "3:09:02", "remaining_time": "1:50:51"}
1355
+ {"current_steps": 1355, "total_steps": 2148, "loss": 0.4697, "lr": 3.6165196552701e-06, "epoch": 1.8914205998604976, "percentage": 63.08, "elapsed_time": "3:09:09", "remaining_time": "1:50:41"}
1356
+ {"current_steps": 1356, "total_steps": 2148, "loss": 0.4624, "lr": 3.6087125438935187e-06, "epoch": 1.8928156242734246, "percentage": 63.13, "elapsed_time": "3:09:16", "remaining_time": "1:50:32"}
1357
+ {"current_steps": 1357, "total_steps": 2148, "loss": 0.4629, "lr": 3.6009091074785853e-06, "epoch": 1.894210648686352, "percentage": 63.18, "elapsed_time": "3:09:23", "remaining_time": "1:50:23"}
1358
+ {"current_steps": 1358, "total_steps": 2148, "loss": 0.513, "lr": 3.5931093666373845e-06, "epoch": 1.8956056730992792, "percentage": 63.22, "elapsed_time": "3:09:31", "remaining_time": "1:50:15"}
1359
+ {"current_steps": 1359, "total_steps": 2148, "loss": 0.4522, "lr": 3.585313341972232e-06, "epoch": 1.8970006975122065, "percentage": 63.27, "elapsed_time": "3:09:37", "remaining_time": "1:50:05"}
1360
+ {"current_steps": 1360, "total_steps": 2148, "loss": 0.4274, "lr": 3.577521054075631e-06, "epoch": 1.8983957219251337, "percentage": 63.31, "elapsed_time": "3:09:45", "remaining_time": "1:49:56"}
1361
+ {"current_steps": 1361, "total_steps": 2148, "loss": 0.4201, "lr": 3.5697325235302183e-06, "epoch": 1.899790746338061, "percentage": 63.36, "elapsed_time": "3:09:51", "remaining_time": "1:49:47"}
1362
+ {"current_steps": 1362, "total_steps": 2148, "loss": 0.4297, "lr": 3.5619477709086982e-06, "epoch": 1.9011857707509883, "percentage": 63.41, "elapsed_time": "3:09:58", "remaining_time": "1:49:38"}
1363
+ {"current_steps": 1363, "total_steps": 2148, "loss": 0.5433, "lr": 3.5541668167738003e-06, "epoch": 1.9025807951639153, "percentage": 63.45, "elapsed_time": "3:10:06", "remaining_time": "1:49:29"}
1364
+ {"current_steps": 1364, "total_steps": 2148, "loss": 0.4562, "lr": 3.546389681678224e-06, "epoch": 1.9039758195768426, "percentage": 63.5, "elapsed_time": "3:10:12", "remaining_time": "1:49:19"}
1365
+ {"current_steps": 1365, "total_steps": 2148, "loss": 0.4618, "lr": 3.538616386164575e-06, "epoch": 1.9053708439897699, "percentage": 63.55, "elapsed_time": "3:10:19", "remaining_time": "1:49:10"}
1366
+ {"current_steps": 1366, "total_steps": 2148, "loss": 0.4771, "lr": 3.530846950765318e-06, "epoch": 1.906765868402697, "percentage": 63.59, "elapsed_time": "3:10:27", "remaining_time": "1:49:01"}
1367
+ {"current_steps": 1367, "total_steps": 2148, "loss": 0.4773, "lr": 3.5230813960027275e-06, "epoch": 1.9081608928156242, "percentage": 63.64, "elapsed_time": "3:10:34", "remaining_time": "1:48:52"}
1368
+ {"current_steps": 1368, "total_steps": 2148, "loss": 0.4975, "lr": 3.5153197423888206e-06, "epoch": 1.9095559172285514, "percentage": 63.69, "elapsed_time": "3:10:41", "remaining_time": "1:48:43"}
1369
+ {"current_steps": 1369, "total_steps": 2148, "loss": 0.4375, "lr": 3.5075620104253123e-06, "epoch": 1.9109509416414787, "percentage": 63.73, "elapsed_time": "3:10:48", "remaining_time": "1:48:34"}
1370
+ {"current_steps": 1370, "total_steps": 2148, "loss": 0.4481, "lr": 3.4998082206035606e-06, "epoch": 1.912345966054406, "percentage": 63.78, "elapsed_time": "3:10:55", "remaining_time": "1:48:25"}
1371
+ {"current_steps": 1371, "total_steps": 2148, "loss": 0.5112, "lr": 3.492058393404509e-06, "epoch": 1.9137409904673333, "percentage": 63.83, "elapsed_time": "3:11:05", "remaining_time": "1:48:17"}
1372
+ {"current_steps": 1372, "total_steps": 2148, "loss": 0.4213, "lr": 3.4843125492986345e-06, "epoch": 1.9151360148802605, "percentage": 63.87, "elapsed_time": "3:11:11", "remaining_time": "1:48:08"}
1373
+ {"current_steps": 1373, "total_steps": 2148, "loss": 0.493, "lr": 3.4765707087458912e-06, "epoch": 1.9165310392931876, "percentage": 63.92, "elapsed_time": "3:11:21", "remaining_time": "1:48:00"}
1374
+ {"current_steps": 1374, "total_steps": 2148, "loss": 0.4985, "lr": 3.468832892195664e-06, "epoch": 1.9179260637061148, "percentage": 63.97, "elapsed_time": "3:11:29", "remaining_time": "1:47:51"}
1375
+ {"current_steps": 1375, "total_steps": 2148, "loss": 0.4735, "lr": 3.4610991200867006e-06, "epoch": 1.9193210881190421, "percentage": 64.01, "elapsed_time": "3:11:38", "remaining_time": "1:47:44"}
1376
+ {"current_steps": 1376, "total_steps": 2148, "loss": 0.4061, "lr": 3.453369412847071e-06, "epoch": 1.9207161125319692, "percentage": 64.06, "elapsed_time": "3:11:48", "remaining_time": "1:47:36"}
1377
+ {"current_steps": 1377, "total_steps": 2148, "loss": 0.4451, "lr": 3.445643790894109e-06, "epoch": 1.9221111369448964, "percentage": 64.11, "elapsed_time": "3:11:55", "remaining_time": "1:47:27"}
1378
+ {"current_steps": 1378, "total_steps": 2148, "loss": 0.4679, "lr": 3.4379222746343534e-06, "epoch": 1.9235061613578237, "percentage": 64.15, "elapsed_time": "3:12:02", "remaining_time": "1:47:18"}
1379
+ {"current_steps": 1379, "total_steps": 2148, "loss": 0.4776, "lr": 3.4302048844634995e-06, "epoch": 1.924901185770751, "percentage": 64.2, "elapsed_time": "3:12:13", "remaining_time": "1:47:11"}
1380
+ {"current_steps": 1380, "total_steps": 2148, "loss": 0.427, "lr": 3.4224916407663484e-06, "epoch": 1.9262962101836782, "percentage": 64.25, "elapsed_time": "3:12:19", "remaining_time": "1:47:01"}
1381
+ {"current_steps": 1381, "total_steps": 2148, "loss": 0.5011, "lr": 3.414782563916742e-06, "epoch": 1.9276912345966055, "percentage": 64.29, "elapsed_time": "3:12:26", "remaining_time": "1:46:52"}
1382
+ {"current_steps": 1382, "total_steps": 2148, "loss": 0.4716, "lr": 3.407077674277518e-06, "epoch": 1.9290862590095328, "percentage": 64.34, "elapsed_time": "3:12:36", "remaining_time": "1:46:45"}
1383
+ {"current_steps": 1383, "total_steps": 2148, "loss": 0.5317, "lr": 3.3993769922004584e-06, "epoch": 1.93048128342246, "percentage": 64.39, "elapsed_time": "3:12:42", "remaining_time": "1:46:35"}
1384
+ {"current_steps": 1384, "total_steps": 2148, "loss": 0.4242, "lr": 3.391680538026224e-06, "epoch": 1.931876307835387, "percentage": 64.43, "elapsed_time": "3:12:51", "remaining_time": "1:46:27"}
1385
+ {"current_steps": 1385, "total_steps": 2148, "loss": 0.4513, "lr": 3.3839883320843125e-06, "epoch": 1.9332713322483144, "percentage": 64.48, "elapsed_time": "3:12:58", "remaining_time": "1:46:18"}
1386
+ {"current_steps": 1386, "total_steps": 2148, "loss": 0.4656, "lr": 3.3763003946930023e-06, "epoch": 1.9346663566612414, "percentage": 64.53, "elapsed_time": "3:13:06", "remaining_time": "1:46:10"}
1387
+ {"current_steps": 1387, "total_steps": 2148, "loss": 0.4548, "lr": 3.36861674615929e-06, "epoch": 1.9360613810741687, "percentage": 64.57, "elapsed_time": "3:13:12", "remaining_time": "1:46:00"}
1388
+ {"current_steps": 1388, "total_steps": 2148, "loss": 0.5095, "lr": 3.360937406778849e-06, "epoch": 1.937456405487096, "percentage": 64.62, "elapsed_time": "3:13:20", "remaining_time": "1:45:51"}
1389
+ {"current_steps": 1389, "total_steps": 2148, "loss": 0.4221, "lr": 3.35326239683597e-06, "epoch": 1.9388514299000232, "percentage": 64.66, "elapsed_time": "3:13:27", "remaining_time": "1:45:42"}
1390
+ {"current_steps": 1390, "total_steps": 2148, "loss": 0.4702, "lr": 3.3455917366035058e-06, "epoch": 1.9402464543129505, "percentage": 64.71, "elapsed_time": "3:13:34", "remaining_time": "1:45:33"}
1391
+ {"current_steps": 1391, "total_steps": 2148, "loss": 0.4391, "lr": 3.337925446342819e-06, "epoch": 1.9416414787258778, "percentage": 64.76, "elapsed_time": "3:13:41", "remaining_time": "1:45:24"}
1392
+ {"current_steps": 1392, "total_steps": 2148, "loss": 0.3957, "lr": 3.3302635463037352e-06, "epoch": 1.943036503138805, "percentage": 64.8, "elapsed_time": "3:13:49", "remaining_time": "1:45:15"}
1393
+ {"current_steps": 1393, "total_steps": 2148, "loss": 0.479, "lr": 3.3226060567244767e-06, "epoch": 1.9444315275517323, "percentage": 64.85, "elapsed_time": "3:13:55", "remaining_time": "1:45:06"}
1394
+ {"current_steps": 1394, "total_steps": 2148, "loss": 0.4221, "lr": 3.314952997831618e-06, "epoch": 1.9458265519646594, "percentage": 64.9, "elapsed_time": "3:14:03", "remaining_time": "1:44:57"}
1395
+ {"current_steps": 1395, "total_steps": 2148, "loss": 0.4339, "lr": 3.307304389840036e-06, "epoch": 1.9472215763775866, "percentage": 64.94, "elapsed_time": "3:14:11", "remaining_time": "1:44:49"}
1396
+ {"current_steps": 1396, "total_steps": 2148, "loss": 0.447, "lr": 3.29966025295284e-06, "epoch": 1.9486166007905137, "percentage": 64.99, "elapsed_time": "3:14:18", "remaining_time": "1:44:40"}
1397
+ {"current_steps": 1397, "total_steps": 2148, "loss": 0.5655, "lr": 3.292020607361337e-06, "epoch": 1.950011625203441, "percentage": 65.04, "elapsed_time": "3:14:24", "remaining_time": "1:44:30"}
1398
+ {"current_steps": 1398, "total_steps": 2148, "loss": 0.4208, "lr": 3.284385473244974e-06, "epoch": 1.9514066496163682, "percentage": 65.08, "elapsed_time": "3:14:32", "remaining_time": "1:44:22"}
1399
+ {"current_steps": 1399, "total_steps": 2148, "loss": 0.4854, "lr": 3.2767548707712693e-06, "epoch": 1.9528016740292955, "percentage": 65.13, "elapsed_time": "3:14:40", "remaining_time": "1:44:13"}
1400
+ {"current_steps": 1400, "total_steps": 2148, "loss": 0.4792, "lr": 3.2691288200957826e-06, "epoch": 1.9541966984422228, "percentage": 65.18, "elapsed_time": "3:14:51", "remaining_time": "1:44:06"}
1401
+ {"current_steps": 1401, "total_steps": 2148, "loss": 0.4976, "lr": 3.2615073413620467e-06, "epoch": 1.95559172285515, "percentage": 65.22, "elapsed_time": "3:14:59", "remaining_time": "1:43:57"}
1402
+ {"current_steps": 1402, "total_steps": 2148, "loss": 0.4719, "lr": 3.2538904547015137e-06, "epoch": 1.9569867472680773, "percentage": 65.27, "elapsed_time": "3:15:08", "remaining_time": "1:43:50"}
1403
+ {"current_steps": 1403, "total_steps": 2148, "loss": 0.4655, "lr": 3.2462781802335124e-06, "epoch": 1.9583817716810046, "percentage": 65.32, "elapsed_time": "3:15:16", "remaining_time": "1:43:41"}
1404
+ {"current_steps": 1404, "total_steps": 2148, "loss": 0.4686, "lr": 3.2386705380651877e-06, "epoch": 1.9597767960939316, "percentage": 65.36, "elapsed_time": "3:15:24", "remaining_time": "1:43:32"}
1405
+ {"current_steps": 1405, "total_steps": 2148, "loss": 0.4681, "lr": 3.2310675482914444e-06, "epoch": 1.961171820506859, "percentage": 65.41, "elapsed_time": "3:15:32", "remaining_time": "1:43:24"}
1406
+ {"current_steps": 1406, "total_steps": 2148, "loss": 0.4678, "lr": 3.2234692309949034e-06, "epoch": 1.962566844919786, "percentage": 65.46, "elapsed_time": "3:15:41", "remaining_time": "1:43:16"}
1407
+ {"current_steps": 1407, "total_steps": 2148, "loss": 0.4722, "lr": 3.2158756062458422e-06, "epoch": 1.9639618693327132, "percentage": 65.5, "elapsed_time": "3:15:49", "remaining_time": "1:43:08"}
1408
+ {"current_steps": 1408, "total_steps": 2148, "loss": 0.4994, "lr": 3.208286694102141e-06, "epoch": 1.9653568937456405, "percentage": 65.55, "elapsed_time": "3:16:02", "remaining_time": "1:43:02"}
1409
+ {"current_steps": 1409, "total_steps": 2148, "loss": 0.4398, "lr": 3.2007025146092345e-06, "epoch": 1.9667519181585678, "percentage": 65.6, "elapsed_time": "3:16:09", "remaining_time": "1:42:52"}
1410
+ {"current_steps": 1410, "total_steps": 2148, "loss": 0.45, "lr": 3.1931230878000586e-06, "epoch": 1.968146942571495, "percentage": 65.64, "elapsed_time": "3:16:16", "remaining_time": "1:42:43"}
1411
+ {"current_steps": 1411, "total_steps": 2148, "loss": 0.4568, "lr": 3.1855484336949876e-06, "epoch": 1.9695419669844223, "percentage": 65.69, "elapsed_time": "3:16:24", "remaining_time": "1:42:35"}
1412
+ {"current_steps": 1412, "total_steps": 2148, "loss": 0.5065, "lr": 3.1779785723017988e-06, "epoch": 1.9709369913973496, "percentage": 65.74, "elapsed_time": "3:16:30", "remaining_time": "1:42:25"}
1413
+ {"current_steps": 1413, "total_steps": 2148, "loss": 0.441, "lr": 3.170413523615605e-06, "epoch": 1.9723320158102768, "percentage": 65.78, "elapsed_time": "3:16:37", "remaining_time": "1:42:16"}
1414
+ {"current_steps": 1414, "total_steps": 2148, "loss": 0.402, "lr": 3.162853307618805e-06, "epoch": 1.9737270402232039, "percentage": 65.83, "elapsed_time": "3:16:44", "remaining_time": "1:42:07"}
1415
+ {"current_steps": 1415, "total_steps": 2148, "loss": 0.4518, "lr": 3.155297944281036e-06, "epoch": 1.9751220646361312, "percentage": 65.88, "elapsed_time": "3:16:51", "remaining_time": "1:41:58"}
1416
+ {"current_steps": 1416, "total_steps": 2148, "loss": 0.4618, "lr": 3.1477474535591167e-06, "epoch": 1.9765170890490582, "percentage": 65.92, "elapsed_time": "3:16:57", "remaining_time": "1:41:49"}
1417
+ {"current_steps": 1417, "total_steps": 2148, "loss": 0.5035, "lr": 3.1402018553969917e-06, "epoch": 1.9779121134619855, "percentage": 65.97, "elapsed_time": "3:17:10", "remaining_time": "1:41:43"}
1418
+ {"current_steps": 1418, "total_steps": 2148, "loss": 0.4757, "lr": 3.132661169725688e-06, "epoch": 1.9793071378749127, "percentage": 66.01, "elapsed_time": "3:17:22", "remaining_time": "1:41:36"}
1419
+ {"current_steps": 1419, "total_steps": 2148, "loss": 0.4332, "lr": 3.125125416463254e-06, "epoch": 1.98070216228784, "percentage": 66.06, "elapsed_time": "3:17:35", "remaining_time": "1:41:30"}
1420
+ {"current_steps": 1420, "total_steps": 2148, "loss": 0.4633, "lr": 3.1175946155147064e-06, "epoch": 1.9820971867007673, "percentage": 66.11, "elapsed_time": "3:17:46", "remaining_time": "1:41:23"}
1421
+ {"current_steps": 1421, "total_steps": 2148, "loss": 0.4709, "lr": 3.110068786771987e-06, "epoch": 1.9834922111136946, "percentage": 66.15, "elapsed_time": "3:17:56", "remaining_time": "1:41:16"}
1422
+ {"current_steps": 1422, "total_steps": 2148, "loss": 0.4934, "lr": 3.1025479501139e-06, "epoch": 1.9848872355266218, "percentage": 66.2, "elapsed_time": "3:18:04", "remaining_time": "1:41:07"}
1423
+ {"current_steps": 1423, "total_steps": 2148, "loss": 0.4469, "lr": 3.095032125406062e-06, "epoch": 1.986282259939549, "percentage": 66.25, "elapsed_time": "3:18:10", "remaining_time": "1:40:58"}
1424
+ {"current_steps": 1424, "total_steps": 2148, "loss": 0.5061, "lr": 3.0875213325008548e-06, "epoch": 1.9876772843524761, "percentage": 66.29, "elapsed_time": "3:18:18", "remaining_time": "1:40:49"}
1425
+ {"current_steps": 1425, "total_steps": 2148, "loss": 0.4703, "lr": 3.0800155912373696e-06, "epoch": 1.9890723087654034, "percentage": 66.34, "elapsed_time": "3:18:25", "remaining_time": "1:40:40"}
1426
+ {"current_steps": 1426, "total_steps": 2148, "loss": 0.4196, "lr": 3.0725149214413487e-06, "epoch": 1.9904673331783305, "percentage": 66.39, "elapsed_time": "3:18:32", "remaining_time": "1:40:31"}
1427
+ {"current_steps": 1427, "total_steps": 2148, "loss": 0.4886, "lr": 3.065019342925143e-06, "epoch": 1.9918623575912577, "percentage": 66.43, "elapsed_time": "3:18:39", "remaining_time": "1:40:22"}
1428
+ {"current_steps": 1428, "total_steps": 2148, "loss": 0.4786, "lr": 3.0575288754876565e-06, "epoch": 1.993257382004185, "percentage": 66.48, "elapsed_time": "3:18:45", "remaining_time": "1:40:12"}
1429
+ {"current_steps": 1429, "total_steps": 2148, "loss": 0.4108, "lr": 3.0500435389142867e-06, "epoch": 1.9946524064171123, "percentage": 66.53, "elapsed_time": "3:18:54", "remaining_time": "1:40:04"}
1430
+ {"current_steps": 1430, "total_steps": 2148, "loss": 0.4564, "lr": 3.042563352976884e-06, "epoch": 1.9960474308300395, "percentage": 66.57, "elapsed_time": "3:19:02", "remaining_time": "1:39:56"}
1431
+ {"current_steps": 1431, "total_steps": 2148, "loss": 0.4773, "lr": 3.035088337433694e-06, "epoch": 1.9974424552429668, "percentage": 66.62, "elapsed_time": "3:19:11", "remaining_time": "1:39:48"}
1432
+ {"current_steps": 1432, "total_steps": 2148, "loss": 0.4866, "lr": 3.0276185120292996e-06, "epoch": 1.998837479655894, "percentage": 66.67, "elapsed_time": "3:19:22", "remaining_time": "1:39:41"}
1433
+ {"current_steps": 1433, "total_steps": 2148, "loss": 0.7126, "lr": 3.0201538964945787e-06, "epoch": 2.0013950244129273, "percentage": 66.71, "elapsed_time": "3:19:36", "remaining_time": "1:39:35"}
1434
+ {"current_steps": 1434, "total_steps": 2148, "loss": 0.2665, "lr": 3.0126945105466486e-06, "epoch": 2.0027900488258545, "percentage": 66.76, "elapsed_time": "3:19:43", "remaining_time": "1:39:26"}
1435
+ {"current_steps": 1435, "total_steps": 2148, "loss": 0.2909, "lr": 3.005240373888812e-06, "epoch": 2.004185073238782, "percentage": 66.81, "elapsed_time": "3:19:51", "remaining_time": "1:39:18"}
1436
+ {"current_steps": 1436, "total_steps": 2148, "loss": 0.2668, "lr": 2.9977915062105023e-06, "epoch": 2.005580097651709, "percentage": 66.85, "elapsed_time": "3:19:59", "remaining_time": "1:39:09"}
1437
+ {"current_steps": 1437, "total_steps": 2148, "loss": 0.2382, "lr": 2.9903479271872416e-06, "epoch": 2.0069751220646364, "percentage": 66.9, "elapsed_time": "3:20:06", "remaining_time": "1:39:00"}
1438
+ {"current_steps": 1438, "total_steps": 2148, "loss": 0.2321, "lr": 2.9829096564805804e-06, "epoch": 2.008370146477563, "percentage": 66.95, "elapsed_time": "3:20:15", "remaining_time": "1:38:52"}
1439
+ {"current_steps": 1439, "total_steps": 2148, "loss": 0.2496, "lr": 2.975476713738043e-06, "epoch": 2.0097651708904904, "percentage": 66.99, "elapsed_time": "3:20:23", "remaining_time": "1:38:43"}
1440
+ {"current_steps": 1440, "total_steps": 2148, "loss": 0.2556, "lr": 2.9680491185930877e-06, "epoch": 2.0111601953034177, "percentage": 67.04, "elapsed_time": "3:20:29", "remaining_time": "1:38:34"}
1441
+ {"current_steps": 1441, "total_steps": 2148, "loss": 0.2429, "lr": 2.960626890665044e-06, "epoch": 2.012555219716345, "percentage": 67.09, "elapsed_time": "3:20:36", "remaining_time": "1:38:25"}
1442
+ {"current_steps": 1442, "total_steps": 2148, "loss": 0.2149, "lr": 2.953210049559062e-06, "epoch": 2.0139502441292723, "percentage": 67.13, "elapsed_time": "3:20:43", "remaining_time": "1:38:16"}
1443
+ {"current_steps": 1443, "total_steps": 2148, "loss": 0.2684, "lr": 2.945798614866068e-06, "epoch": 2.0153452685421995, "percentage": 67.18, "elapsed_time": "3:20:51", "remaining_time": "1:38:07"}
1444
+ {"current_steps": 1444, "total_steps": 2148, "loss": 0.2407, "lr": 2.9383926061627055e-06, "epoch": 2.016740292955127, "percentage": 67.23, "elapsed_time": "3:20:58", "remaining_time": "1:37:58"}
1445
+ {"current_steps": 1445, "total_steps": 2148, "loss": 0.2713, "lr": 2.9309920430112825e-06, "epoch": 2.018135317368054, "percentage": 67.27, "elapsed_time": "3:21:13", "remaining_time": "1:37:53"}
1446
+ {"current_steps": 1446, "total_steps": 2148, "loss": 0.2561, "lr": 2.92359694495973e-06, "epoch": 2.0195303417809813, "percentage": 67.32, "elapsed_time": "3:21:21", "remaining_time": "1:37:45"}
1447
+ {"current_steps": 1447, "total_steps": 2148, "loss": 0.2361, "lr": 2.9162073315415384e-06, "epoch": 2.0209253661939086, "percentage": 67.36, "elapsed_time": "3:21:29", "remaining_time": "1:37:36"}
1448
+ {"current_steps": 1448, "total_steps": 2148, "loss": 0.2539, "lr": 2.9088232222757085e-06, "epoch": 2.0223203906068354, "percentage": 67.41, "elapsed_time": "3:21:36", "remaining_time": "1:37:27"}
1449
+ {"current_steps": 1449, "total_steps": 2148, "loss": 0.2677, "lr": 2.9014446366667115e-06, "epoch": 2.0237154150197627, "percentage": 67.46, "elapsed_time": "3:21:43", "remaining_time": "1:37:18"}
1450
+ {"current_steps": 1450, "total_steps": 2148, "loss": 0.2583, "lr": 2.8940715942044204e-06, "epoch": 2.02511043943269, "percentage": 67.5, "elapsed_time": "3:21:55", "remaining_time": "1:37:12"}
1451
+ {"current_steps": 1451, "total_steps": 2148, "loss": 0.2395, "lr": 2.8867041143640663e-06, "epoch": 2.0265054638456172, "percentage": 67.55, "elapsed_time": "3:22:04", "remaining_time": "1:37:04"}
1452
+ {"current_steps": 1452, "total_steps": 2148, "loss": 0.2821, "lr": 2.8793422166061918e-06, "epoch": 2.0279004882585445, "percentage": 67.6, "elapsed_time": "3:22:11", "remaining_time": "1:36:55"}
1453
+ {"current_steps": 1453, "total_steps": 2148, "loss": 0.2263, "lr": 2.8719859203765955e-06, "epoch": 2.029295512671472, "percentage": 67.64, "elapsed_time": "3:22:18", "remaining_time": "1:36:46"}
1454
+ {"current_steps": 1454, "total_steps": 2148, "loss": 0.2427, "lr": 2.864635245106272e-06, "epoch": 2.030690537084399, "percentage": 67.69, "elapsed_time": "3:22:28", "remaining_time": "1:36:38"}
1455
+ {"current_steps": 1455, "total_steps": 2148, "loss": 0.2339, "lr": 2.8572902102113788e-06, "epoch": 2.0320855614973263, "percentage": 67.74, "elapsed_time": "3:22:35", "remaining_time": "1:36:29"}
1456
+ {"current_steps": 1456, "total_steps": 2148, "loss": 0.2417, "lr": 2.849950835093168e-06, "epoch": 2.0334805859102536, "percentage": 67.78, "elapsed_time": "3:22:42", "remaining_time": "1:36:20"}
1457
+ {"current_steps": 1457, "total_steps": 2148, "loss": 0.2492, "lr": 2.8426171391379433e-06, "epoch": 2.034875610323181, "percentage": 67.83, "elapsed_time": "3:22:48", "remaining_time": "1:36:11"}
1458
+ {"current_steps": 1458, "total_steps": 2148, "loss": 0.2158, "lr": 2.835289141717008e-06, "epoch": 2.0362706347361077, "percentage": 67.88, "elapsed_time": "3:22:58", "remaining_time": "1:36:03"}
1459
+ {"current_steps": 1459, "total_steps": 2148, "loss": 0.2362, "lr": 2.827966862186616e-06, "epoch": 2.037665659149035, "percentage": 67.92, "elapsed_time": "3:23:07", "remaining_time": "1:35:55"}
1460
+ {"current_steps": 1460, "total_steps": 2148, "loss": 0.2375, "lr": 2.820650319887911e-06, "epoch": 2.0390606835619622, "percentage": 67.97, "elapsed_time": "3:23:14", "remaining_time": "1:35:46"}
1461
+ {"current_steps": 1461, "total_steps": 2148, "loss": 0.2487, "lr": 2.8133395341468915e-06, "epoch": 2.0404557079748895, "percentage": 68.02, "elapsed_time": "3:23:24", "remaining_time": "1:35:38"}
1462
+ {"current_steps": 1462, "total_steps": 2148, "loss": 0.2321, "lr": 2.8060345242743427e-06, "epoch": 2.041850732387817, "percentage": 68.06, "elapsed_time": "3:23:30", "remaining_time": "1:35:29"}
1463
+ {"current_steps": 1463, "total_steps": 2148, "loss": 0.2666, "lr": 2.7987353095657944e-06, "epoch": 2.043245756800744, "percentage": 68.11, "elapsed_time": "3:23:39", "remaining_time": "1:35:21"}
1464
+ {"current_steps": 1464, "total_steps": 2148, "loss": 0.2418, "lr": 2.7914419093014734e-06, "epoch": 2.0446407812136713, "percentage": 68.16, "elapsed_time": "3:23:47", "remaining_time": "1:35:12"}
1465
+ {"current_steps": 1465, "total_steps": 2148, "loss": 0.246, "lr": 2.784154342746246e-06, "epoch": 2.0460358056265986, "percentage": 68.2, "elapsed_time": "3:23:54", "remaining_time": "1:35:03"}
1466
+ {"current_steps": 1466, "total_steps": 2148, "loss": 0.2616, "lr": 2.7768726291495667e-06, "epoch": 2.047430830039526, "percentage": 68.25, "elapsed_time": "3:24:02", "remaining_time": "1:34:55"}
1467
+ {"current_steps": 1467, "total_steps": 2148, "loss": 0.2644, "lr": 2.7695967877454356e-06, "epoch": 2.048825854452453, "percentage": 68.3, "elapsed_time": "3:24:12", "remaining_time": "1:34:47"}
1468
+ {"current_steps": 1468, "total_steps": 2148, "loss": 0.2136, "lr": 2.7623268377523356e-06, "epoch": 2.05022087886538, "percentage": 68.34, "elapsed_time": "3:24:23", "remaining_time": "1:34:40"}
1469
+ {"current_steps": 1469, "total_steps": 2148, "loss": 0.2454, "lr": 2.755062798373189e-06, "epoch": 2.0516159032783072, "percentage": 68.39, "elapsed_time": "3:24:32", "remaining_time": "1:34:32"}
1470
+ {"current_steps": 1470, "total_steps": 2148, "loss": 0.2572, "lr": 2.747804688795311e-06, "epoch": 2.0530109276912345, "percentage": 68.44, "elapsed_time": "3:24:40", "remaining_time": "1:34:24"}
1471
+ {"current_steps": 1471, "total_steps": 2148, "loss": 0.2095, "lr": 2.7405525281903506e-06, "epoch": 2.0544059521041618, "percentage": 68.48, "elapsed_time": "3:24:47", "remaining_time": "1:34:14"}
1472
+ {"current_steps": 1472, "total_steps": 2148, "loss": 0.2398, "lr": 2.7333063357142414e-06, "epoch": 2.055800976517089, "percentage": 68.53, "elapsed_time": "3:24:55", "remaining_time": "1:34:06"}
1473
+ {"current_steps": 1473, "total_steps": 2148, "loss": 0.2217, "lr": 2.7260661305071523e-06, "epoch": 2.0571960009300163, "percentage": 68.58, "elapsed_time": "3:25:04", "remaining_time": "1:33:58"}
1474
+ {"current_steps": 1474, "total_steps": 2148, "loss": 0.2492, "lr": 2.718831931693443e-06, "epoch": 2.0585910253429436, "percentage": 68.62, "elapsed_time": "3:25:11", "remaining_time": "1:33:49"}
1475
+ {"current_steps": 1475, "total_steps": 2148, "loss": 0.2498, "lr": 2.7116037583816e-06, "epoch": 2.059986049755871, "percentage": 68.67, "elapsed_time": "3:25:20", "remaining_time": "1:33:41"}
1476
+ {"current_steps": 1476, "total_steps": 2148, "loss": 0.2331, "lr": 2.7043816296642005e-06, "epoch": 2.061381074168798, "percentage": 68.72, "elapsed_time": "3:25:26", "remaining_time": "1:33:32"}
1477
+ {"current_steps": 1477, "total_steps": 2148, "loss": 0.2612, "lr": 2.6971655646178544e-06, "epoch": 2.0627760985817254, "percentage": 68.76, "elapsed_time": "3:25:35", "remaining_time": "1:33:23"}
1478
+ {"current_steps": 1478, "total_steps": 2148, "loss": 0.2165, "lr": 2.689955582303152e-06, "epoch": 2.064171122994652, "percentage": 68.81, "elapsed_time": "3:25:41", "remaining_time": "1:33:14"}
1479
+ {"current_steps": 1479, "total_steps": 2148, "loss": 0.2245, "lr": 2.6827517017646154e-06, "epoch": 2.0655661474075795, "percentage": 68.85, "elapsed_time": "3:25:49", "remaining_time": "1:33:06"}
1480
+ {"current_steps": 1480, "total_steps": 2148, "loss": 0.2258, "lr": 2.6755539420306565e-06, "epoch": 2.0669611718205068, "percentage": 68.9, "elapsed_time": "3:25:56", "remaining_time": "1:32:57"}
1481
+ {"current_steps": 1481, "total_steps": 2148, "loss": 0.2451, "lr": 2.668362322113512e-06, "epoch": 2.068356196233434, "percentage": 68.95, "elapsed_time": "3:26:05", "remaining_time": "1:32:49"}
1482
+ {"current_steps": 1482, "total_steps": 2148, "loss": 0.2406, "lr": 2.661176861009205e-06, "epoch": 2.0697512206463613, "percentage": 68.99, "elapsed_time": "3:26:11", "remaining_time": "1:32:39"}
1483
+ {"current_steps": 1483, "total_steps": 2148, "loss": 0.2306, "lr": 2.6539975776974926e-06, "epoch": 2.0711462450592886, "percentage": 69.04, "elapsed_time": "3:26:19", "remaining_time": "1:32:31"}
1484
+ {"current_steps": 1484, "total_steps": 2148, "loss": 0.2211, "lr": 2.646824491141807e-06, "epoch": 2.072541269472216, "percentage": 69.09, "elapsed_time": "3:26:25", "remaining_time": "1:32:21"}
1485
+ {"current_steps": 1485, "total_steps": 2148, "loss": 0.2207, "lr": 2.6396576202892176e-06, "epoch": 2.073936293885143, "percentage": 69.13, "elapsed_time": "3:26:31", "remaining_time": "1:32:12"}
1486
+ {"current_steps": 1486, "total_steps": 2148, "loss": 0.2144, "lr": 2.632496984070375e-06, "epoch": 2.0753313182980704, "percentage": 69.18, "elapsed_time": "3:26:45", "remaining_time": "1:32:06"}
1487
+ {"current_steps": 1487, "total_steps": 2148, "loss": 0.2523, "lr": 2.6253426013994586e-06, "epoch": 2.0767263427109977, "percentage": 69.23, "elapsed_time": "3:26:51", "remaining_time": "1:31:57"}
1488
+ {"current_steps": 1488, "total_steps": 2148, "loss": 0.2525, "lr": 2.6181944911741333e-06, "epoch": 2.0781213671239245, "percentage": 69.27, "elapsed_time": "3:26:59", "remaining_time": "1:31:48"}
1489
+ {"current_steps": 1489, "total_steps": 2148, "loss": 0.2679, "lr": 2.6110526722754955e-06, "epoch": 2.0795163915368517, "percentage": 69.32, "elapsed_time": "3:27:06", "remaining_time": "1:31:39"}
1490
+ {"current_steps": 1490, "total_steps": 2148, "loss": 0.2487, "lr": 2.603917163568021e-06, "epoch": 2.080911415949779, "percentage": 69.37, "elapsed_time": "3:27:18", "remaining_time": "1:31:32"}
1491
+ {"current_steps": 1491, "total_steps": 2148, "loss": 0.2268, "lr": 2.5967879838995176e-06, "epoch": 2.0823064403627063, "percentage": 69.41, "elapsed_time": "3:27:26", "remaining_time": "1:31:24"}
1492
+ {"current_steps": 1492, "total_steps": 2148, "loss": 0.2444, "lr": 2.589665152101081e-06, "epoch": 2.0837014647756336, "percentage": 69.46, "elapsed_time": "3:27:36", "remaining_time": "1:31:17"}
1493
+ {"current_steps": 1493, "total_steps": 2148, "loss": 0.233, "lr": 2.582548686987031e-06, "epoch": 2.085096489188561, "percentage": 69.51, "elapsed_time": "3:27:45", "remaining_time": "1:31:08"}
1494
+ {"current_steps": 1494, "total_steps": 2148, "loss": 0.2245, "lr": 2.5754386073548775e-06, "epoch": 2.086491513601488, "percentage": 69.55, "elapsed_time": "3:27:53", "remaining_time": "1:31:00"}
1495
+ {"current_steps": 1495, "total_steps": 2148, "loss": 0.2411, "lr": 2.5683349319852647e-06, "epoch": 2.0878865380144154, "percentage": 69.6, "elapsed_time": "3:28:01", "remaining_time": "1:30:51"}
1496
+ {"current_steps": 1496, "total_steps": 2148, "loss": 0.2382, "lr": 2.5612376796419126e-06, "epoch": 2.0892815624273426, "percentage": 69.65, "elapsed_time": "3:28:09", "remaining_time": "1:30:43"}
1497
+ {"current_steps": 1497, "total_steps": 2148, "loss": 0.2461, "lr": 2.5541468690715797e-06, "epoch": 2.09067658684027, "percentage": 69.69, "elapsed_time": "3:28:19", "remaining_time": "1:30:35"}
1498
+ {"current_steps": 1498, "total_steps": 2148, "loss": 0.249, "lr": 2.5470625190040105e-06, "epoch": 2.0920716112531967, "percentage": 69.74, "elapsed_time": "3:28:28", "remaining_time": "1:30:27"}
1499
+ {"current_steps": 1499, "total_steps": 2148, "loss": 0.2499, "lr": 2.5399846481518857e-06, "epoch": 2.093466635666124, "percentage": 69.79, "elapsed_time": "3:28:36", "remaining_time": "1:30:19"}
1500
+ {"current_steps": 1500, "total_steps": 2148, "loss": 0.2621, "lr": 2.5329132752107675e-06, "epoch": 2.0948616600790513, "percentage": 69.83, "elapsed_time": "3:28:45", "remaining_time": "1:30:11"}
1501
+ {"current_steps": 1501, "total_steps": 2148, "loss": 0.2521, "lr": 2.525848418859055e-06, "epoch": 2.0962566844919786, "percentage": 69.88, "elapsed_time": "3:28:52", "remaining_time": "1:30:01"}
1502
+ {"current_steps": 1502, "total_steps": 2148, "loss": 0.2204, "lr": 2.518790097757938e-06, "epoch": 2.097651708904906, "percentage": 69.93, "elapsed_time": "3:28:59", "remaining_time": "1:29:53"}
1503
+ {"current_steps": 1503, "total_steps": 2148, "loss": 0.2212, "lr": 2.51173833055134e-06, "epoch": 2.099046733317833, "percentage": 69.97, "elapsed_time": "3:29:06", "remaining_time": "1:29:44"}
1504
+ {"current_steps": 1504, "total_steps": 2148, "loss": 0.2621, "lr": 2.504693135865875e-06, "epoch": 2.1004417577307604, "percentage": 70.02, "elapsed_time": "3:29:13", "remaining_time": "1:29:35"}
1505
+ {"current_steps": 1505, "total_steps": 2148, "loss": 0.2454, "lr": 2.497654532310799e-06, "epoch": 2.1018367821436876, "percentage": 70.07, "elapsed_time": "3:29:19", "remaining_time": "1:29:25"}
1506
+ {"current_steps": 1506, "total_steps": 2148, "loss": 0.2406, "lr": 2.490622538477952e-06, "epoch": 2.103231806556615, "percentage": 70.11, "elapsed_time": "3:29:27", "remaining_time": "1:29:17"}
1507
+ {"current_steps": 1507, "total_steps": 2148, "loss": 0.2375, "lr": 2.483597172941718e-06, "epoch": 2.104626830969542, "percentage": 70.16, "elapsed_time": "3:29:35", "remaining_time": "1:29:08"}
1508
+ {"current_steps": 1508, "total_steps": 2148, "loss": 0.2492, "lr": 2.4765784542589754e-06, "epoch": 2.106021855382469, "percentage": 70.2, "elapsed_time": "3:29:45", "remaining_time": "1:29:01"}
1509
+ {"current_steps": 1509, "total_steps": 2148, "loss": 0.2073, "lr": 2.46956640096904e-06, "epoch": 2.1074168797953963, "percentage": 70.25, "elapsed_time": "3:29:53", "remaining_time": "1:28:52"}
1510
+ {"current_steps": 1510, "total_steps": 2148, "loss": 0.2454, "lr": 2.4625610315936267e-06, "epoch": 2.1088119042083235, "percentage": 70.3, "elapsed_time": "3:30:03", "remaining_time": "1:28:45"}
1511
+ {"current_steps": 1511, "total_steps": 2148, "loss": 0.2756, "lr": 2.4555623646367952e-06, "epoch": 2.110206928621251, "percentage": 70.34, "elapsed_time": "3:30:10", "remaining_time": "1:28:36"}
1512
+ {"current_steps": 1512, "total_steps": 2148, "loss": 0.2461, "lr": 2.448570418584898e-06, "epoch": 2.111601953034178, "percentage": 70.39, "elapsed_time": "3:30:20", "remaining_time": "1:28:28"}
1513
+ {"current_steps": 1513, "total_steps": 2148, "loss": 0.247, "lr": 2.4415852119065343e-06, "epoch": 2.1129969774471054, "percentage": 70.44, "elapsed_time": "3:30:26", "remaining_time": "1:28:19"}
1514
+ {"current_steps": 1514, "total_steps": 2148, "loss": 0.24, "lr": 2.4346067630525084e-06, "epoch": 2.1143920018600326, "percentage": 70.48, "elapsed_time": "3:30:34", "remaining_time": "1:28:10"}
1515
+ {"current_steps": 1515, "total_steps": 2148, "loss": 0.229, "lr": 2.427635090455766e-06, "epoch": 2.11578702627296, "percentage": 70.53, "elapsed_time": "3:30:40", "remaining_time": "1:28:01"}
1516
+ {"current_steps": 1516, "total_steps": 2148, "loss": 0.2339, "lr": 2.42067021253136e-06, "epoch": 2.117182050685887, "percentage": 70.58, "elapsed_time": "3:30:46", "remaining_time": "1:27:52"}
1517
+ {"current_steps": 1517, "total_steps": 2148, "loss": 0.2071, "lr": 2.4137121476763965e-06, "epoch": 2.1185770750988144, "percentage": 70.62, "elapsed_time": "3:30:53", "remaining_time": "1:27:43"}
1518
+ {"current_steps": 1518, "total_steps": 2148, "loss": 0.2215, "lr": 2.4067609142699798e-06, "epoch": 2.1199720995117413, "percentage": 70.67, "elapsed_time": "3:31:01", "remaining_time": "1:27:34"}
1519
+ {"current_steps": 1519, "total_steps": 2148, "loss": 0.2444, "lr": 2.3998165306731713e-06, "epoch": 2.1213671239246685, "percentage": 70.72, "elapsed_time": "3:31:07", "remaining_time": "1:27:25"}
1520
+ {"current_steps": 1520, "total_steps": 2148, "loss": 0.2116, "lr": 2.3928790152289443e-06, "epoch": 2.122762148337596, "percentage": 70.76, "elapsed_time": "3:31:13", "remaining_time": "1:27:16"}
1521
+ {"current_steps": 1521, "total_steps": 2148, "loss": 0.2602, "lr": 2.385948386262123e-06, "epoch": 2.124157172750523, "percentage": 70.81, "elapsed_time": "3:31:22", "remaining_time": "1:27:07"}
1522
+ {"current_steps": 1522, "total_steps": 2148, "loss": 0.2457, "lr": 2.3790246620793466e-06, "epoch": 2.1255521971634503, "percentage": 70.86, "elapsed_time": "3:31:29", "remaining_time": "1:26:59"}
1523
+ {"current_steps": 1523, "total_steps": 2148, "loss": 0.2306, "lr": 2.372107860969019e-06, "epoch": 2.1269472215763776, "percentage": 70.9, "elapsed_time": "3:31:37", "remaining_time": "1:26:50"}
1524
+ {"current_steps": 1524, "total_steps": 2148, "loss": 0.2166, "lr": 2.3651980012012454e-06, "epoch": 2.128342245989305, "percentage": 70.95, "elapsed_time": "3:31:46", "remaining_time": "1:26:42"}
1525
+ {"current_steps": 1525, "total_steps": 2148, "loss": 0.2249, "lr": 2.358295101027807e-06, "epoch": 2.129737270402232, "percentage": 71.0, "elapsed_time": "3:31:52", "remaining_time": "1:26:33"}
1526
+ {"current_steps": 1526, "total_steps": 2148, "loss": 0.2284, "lr": 2.351399178682101e-06, "epoch": 2.1311322948151594, "percentage": 71.04, "elapsed_time": "3:31:59", "remaining_time": "1:26:24"}
1527
+ {"current_steps": 1527, "total_steps": 2148, "loss": 0.2198, "lr": 2.3445102523790876e-06, "epoch": 2.1325273192280867, "percentage": 71.09, "elapsed_time": "3:32:07", "remaining_time": "1:26:15"}
1528
+ {"current_steps": 1528, "total_steps": 2148, "loss": 0.2256, "lr": 2.3376283403152527e-06, "epoch": 2.1339223436410135, "percentage": 71.14, "elapsed_time": "3:32:16", "remaining_time": "1:26:08"}
1529
+ {"current_steps": 1529, "total_steps": 2148, "loss": 0.2393, "lr": 2.330753460668553e-06, "epoch": 2.135317368053941, "percentage": 71.18, "elapsed_time": "3:32:22", "remaining_time": "1:25:58"}
1530
+ {"current_steps": 1530, "total_steps": 2148, "loss": 0.2396, "lr": 2.323885631598366e-06, "epoch": 2.136712392466868, "percentage": 71.23, "elapsed_time": "3:32:31", "remaining_time": "1:25:50"}
1531
+ {"current_steps": 1531, "total_steps": 2148, "loss": 0.2461, "lr": 2.3170248712454525e-06, "epoch": 2.1381074168797953, "percentage": 71.28, "elapsed_time": "3:32:42", "remaining_time": "1:25:43"}
1532
+ {"current_steps": 1532, "total_steps": 2148, "loss": 0.2642, "lr": 2.3101711977318995e-06, "epoch": 2.1395024412927226, "percentage": 71.32, "elapsed_time": "3:32:53", "remaining_time": "1:25:35"}
1533
+ {"current_steps": 1533, "total_steps": 2148, "loss": 0.2291, "lr": 2.3033246291610717e-06, "epoch": 2.14089746570565, "percentage": 71.37, "elapsed_time": "3:33:04", "remaining_time": "1:25:28"}
1534
+ {"current_steps": 1534, "total_steps": 2148, "loss": 0.2508, "lr": 2.2964851836175705e-06, "epoch": 2.142292490118577, "percentage": 71.42, "elapsed_time": "3:33:11", "remaining_time": "1:25:19"}
1535
+ {"current_steps": 1535, "total_steps": 2148, "loss": 0.2301, "lr": 2.2896528791671807e-06, "epoch": 2.1436875145315044, "percentage": 71.46, "elapsed_time": "3:33:18", "remaining_time": "1:25:10"}
1536
+ {"current_steps": 1536, "total_steps": 2148, "loss": 0.2316, "lr": 2.2828277338568226e-06, "epoch": 2.1450825389444317, "percentage": 71.51, "elapsed_time": "3:33:28", "remaining_time": "1:25:03"}
1537
+ {"current_steps": 1537, "total_steps": 2148, "loss": 0.2404, "lr": 2.2760097657145096e-06, "epoch": 2.146477563357359, "percentage": 71.55, "elapsed_time": "3:33:34", "remaining_time": "1:24:54"}
1538
+ {"current_steps": 1538, "total_steps": 2148, "loss": 0.2594, "lr": 2.2691989927492984e-06, "epoch": 2.147872587770286, "percentage": 71.6, "elapsed_time": "3:33:42", "remaining_time": "1:24:45"}
1539
+ {"current_steps": 1539, "total_steps": 2148, "loss": 0.264, "lr": 2.262395432951235e-06, "epoch": 2.149267612183213, "percentage": 71.65, "elapsed_time": "3:33:51", "remaining_time": "1:24:37"}
1540
+ {"current_steps": 1540, "total_steps": 2148, "loss": 0.2277, "lr": 2.2555991042913177e-06, "epoch": 2.1506626365961403, "percentage": 71.69, "elapsed_time": "3:33:57", "remaining_time": "1:24:28"}
1541
+ {"current_steps": 1541, "total_steps": 2148, "loss": 0.2245, "lr": 2.248810024721441e-06, "epoch": 2.1520576610090676, "percentage": 71.74, "elapsed_time": "3:34:04", "remaining_time": "1:24:19"}
1542
+ {"current_steps": 1542, "total_steps": 2148, "loss": 0.2384, "lr": 2.2420282121743513e-06, "epoch": 2.153452685421995, "percentage": 71.79, "elapsed_time": "3:34:11", "remaining_time": "1:24:10"}
1543
+ {"current_steps": 1543, "total_steps": 2148, "loss": 0.225, "lr": 2.235253684563602e-06, "epoch": 2.154847709834922, "percentage": 71.83, "elapsed_time": "3:34:20", "remaining_time": "1:24:02"}
1544
+ {"current_steps": 1544, "total_steps": 2148, "loss": 0.2204, "lr": 2.228486459783506e-06, "epoch": 2.1562427342478494, "percentage": 71.88, "elapsed_time": "3:34:27", "remaining_time": "1:23:53"}
1545
+ {"current_steps": 1545, "total_steps": 2148, "loss": 0.2332, "lr": 2.221726555709079e-06, "epoch": 2.1576377586607767, "percentage": 71.93, "elapsed_time": "3:34:33", "remaining_time": "1:23:44"}
1546
+ {"current_steps": 1546, "total_steps": 2148, "loss": 0.2502, "lr": 2.2149739901960088e-06, "epoch": 2.159032783073704, "percentage": 71.97, "elapsed_time": "3:34:40", "remaining_time": "1:23:35"}
1547
+ {"current_steps": 1547, "total_steps": 2148, "loss": 0.2278, "lr": 2.208228781080592e-06, "epoch": 2.160427807486631, "percentage": 72.02, "elapsed_time": "3:34:47", "remaining_time": "1:23:26"}
1548
+ {"current_steps": 1548, "total_steps": 2148, "loss": 0.2222, "lr": 2.201490946179696e-06, "epoch": 2.161822831899558, "percentage": 72.07, "elapsed_time": "3:34:54", "remaining_time": "1:23:17"}
1549
+ {"current_steps": 1549, "total_steps": 2148, "loss": 0.2152, "lr": 2.19476050329071e-06, "epoch": 2.1632178563124853, "percentage": 72.11, "elapsed_time": "3:35:03", "remaining_time": "1:23:09"}
1550
+ {"current_steps": 1550, "total_steps": 2148, "loss": 0.2288, "lr": 2.188037470191502e-06, "epoch": 2.1646128807254126, "percentage": 72.16, "elapsed_time": "3:35:14", "remaining_time": "1:23:02"}
1551
+ {"current_steps": 1551, "total_steps": 2148, "loss": 0.229, "lr": 2.181321864640362e-06, "epoch": 2.16600790513834, "percentage": 72.21, "elapsed_time": "3:35:20", "remaining_time": "1:22:53"}
1552
+ {"current_steps": 1552, "total_steps": 2148, "loss": 0.2098, "lr": 2.1746137043759594e-06, "epoch": 2.167402929551267, "percentage": 72.25, "elapsed_time": "3:35:32", "remaining_time": "1:22:46"}
1553
+ {"current_steps": 1553, "total_steps": 2148, "loss": 0.2245, "lr": 2.167913007117306e-06, "epoch": 2.1687979539641944, "percentage": 72.3, "elapsed_time": "3:35:43", "remaining_time": "1:22:39"}
1554
+ {"current_steps": 1554, "total_steps": 2148, "loss": 0.2544, "lr": 2.1612197905636913e-06, "epoch": 2.1701929783771217, "percentage": 72.35, "elapsed_time": "3:35:52", "remaining_time": "1:22:31"}
1555
+ {"current_steps": 1555, "total_steps": 2148, "loss": 0.235, "lr": 2.154534072394651e-06, "epoch": 2.171588002790049, "percentage": 72.39, "elapsed_time": "3:36:05", "remaining_time": "1:22:24"}
1556
+ {"current_steps": 1556, "total_steps": 2148, "loss": 0.2493, "lr": 2.147855870269916e-06, "epoch": 2.172983027202976, "percentage": 72.44, "elapsed_time": "3:36:15", "remaining_time": "1:22:16"}
1557
+ {"current_steps": 1557, "total_steps": 2148, "loss": 0.2737, "lr": 2.1411852018293583e-06, "epoch": 2.1743780516159035, "percentage": 72.49, "elapsed_time": "3:36:21", "remaining_time": "1:22:07"}
1558
+ {"current_steps": 1558, "total_steps": 2148, "loss": 0.2296, "lr": 2.1345220846929514e-06, "epoch": 2.1757730760288303, "percentage": 72.53, "elapsed_time": "3:36:28", "remaining_time": "1:21:58"}
1559
+ {"current_steps": 1559, "total_steps": 2148, "loss": 0.2306, "lr": 2.127866536460727e-06, "epoch": 2.1771681004417576, "percentage": 72.58, "elapsed_time": "3:36:35", "remaining_time": "1:21:49"}
1560
+ {"current_steps": 1560, "total_steps": 2148, "loss": 0.2397, "lr": 2.1212185747127235e-06, "epoch": 2.178563124854685, "percentage": 72.63, "elapsed_time": "3:36:43", "remaining_time": "1:21:41"}
1561
+ {"current_steps": 1561, "total_steps": 2148, "loss": 0.226, "lr": 2.1145782170089346e-06, "epoch": 2.179958149267612, "percentage": 72.67, "elapsed_time": "3:36:53", "remaining_time": "1:21:33"}
1562
+ {"current_steps": 1562, "total_steps": 2148, "loss": 0.2211, "lr": 2.107945480889276e-06, "epoch": 2.1813531736805394, "percentage": 72.72, "elapsed_time": "3:37:02", "remaining_time": "1:21:25"}
1563
+ {"current_steps": 1563, "total_steps": 2148, "loss": 0.2313, "lr": 2.1013203838735273e-06, "epoch": 2.1827481980934667, "percentage": 72.77, "elapsed_time": "3:37:12", "remaining_time": "1:21:17"}
1564
+ {"current_steps": 1564, "total_steps": 2148, "loss": 0.2265, "lr": 2.094702943461289e-06, "epoch": 2.184143222506394, "percentage": 72.81, "elapsed_time": "3:37:19", "remaining_time": "1:21:09"}
1565
+ {"current_steps": 1565, "total_steps": 2148, "loss": 0.2606, "lr": 2.0880931771319395e-06, "epoch": 2.185538246919321, "percentage": 72.86, "elapsed_time": "3:37:33", "remaining_time": "1:21:02"}
1566
+ {"current_steps": 1566, "total_steps": 2148, "loss": 0.2067, "lr": 2.0814911023445904e-06, "epoch": 2.1869332713322485, "percentage": 72.91, "elapsed_time": "3:37:42", "remaining_time": "1:20:54"}
1567
+ {"current_steps": 1567, "total_steps": 2148, "loss": 0.229, "lr": 2.0748967365380292e-06, "epoch": 2.1883282957451757, "percentage": 72.95, "elapsed_time": "3:37:50", "remaining_time": "1:20:46"}
1568
+ {"current_steps": 1568, "total_steps": 2148, "loss": 0.2482, "lr": 2.0683100971306873e-06, "epoch": 2.1897233201581026, "percentage": 73.0, "elapsed_time": "3:37:57", "remaining_time": "1:20:37"}
1569
+ {"current_steps": 1569, "total_steps": 2148, "loss": 0.2629, "lr": 2.0617312015205844e-06, "epoch": 2.19111834457103, "percentage": 73.04, "elapsed_time": "3:38:03", "remaining_time": "1:20:28"}
1570
+ {"current_steps": 1570, "total_steps": 2148, "loss": 0.2224, "lr": 2.055160067085283e-06, "epoch": 2.192513368983957, "percentage": 73.09, "elapsed_time": "3:38:10", "remaining_time": "1:20:19"}
1571
+ {"current_steps": 1571, "total_steps": 2148, "loss": 0.2465, "lr": 2.0485967111818506e-06, "epoch": 2.1939083933968844, "percentage": 73.14, "elapsed_time": "3:38:17", "remaining_time": "1:20:10"}
1572
+ {"current_steps": 1572, "total_steps": 2148, "loss": 0.2231, "lr": 2.0420411511468086e-06, "epoch": 2.1953034178098116, "percentage": 73.18, "elapsed_time": "3:38:24", "remaining_time": "1:20:01"}
1573
+ {"current_steps": 1573, "total_steps": 2148, "loss": 0.266, "lr": 2.0354934042960804e-06, "epoch": 2.196698442222739, "percentage": 73.23, "elapsed_time": "3:38:31", "remaining_time": "1:19:52"}
1574
+ {"current_steps": 1574, "total_steps": 2148, "loss": 0.2215, "lr": 2.0289534879249544e-06, "epoch": 2.198093466635666, "percentage": 73.28, "elapsed_time": "3:38:39", "remaining_time": "1:19:44"}
1575
+ {"current_steps": 1575, "total_steps": 2148, "loss": 0.2411, "lr": 2.0224214193080394e-06, "epoch": 2.1994884910485935, "percentage": 73.32, "elapsed_time": "3:38:49", "remaining_time": "1:19:36"}
1576
+ {"current_steps": 1576, "total_steps": 2148, "loss": 0.2407, "lr": 2.015897215699208e-06, "epoch": 2.2008835154615207, "percentage": 73.37, "elapsed_time": "3:39:00", "remaining_time": "1:19:29"}
1577
+ {"current_steps": 1577, "total_steps": 2148, "loss": 0.213, "lr": 2.0093808943315636e-06, "epoch": 2.202278539874448, "percentage": 73.42, "elapsed_time": "3:39:06", "remaining_time": "1:19:20"}
1578
+ {"current_steps": 1578, "total_steps": 2148, "loss": 0.2199, "lr": 2.0028724724173886e-06, "epoch": 2.2036735642873753, "percentage": 73.46, "elapsed_time": "3:39:17", "remaining_time": "1:19:12"}
1579
+ {"current_steps": 1579, "total_steps": 2148, "loss": 0.2255, "lr": 1.996371967148098e-06, "epoch": 2.205068588700302, "percentage": 73.51, "elapsed_time": "3:39:23", "remaining_time": "1:19:03"}
1580
+ {"current_steps": 1580, "total_steps": 2148, "loss": 0.2711, "lr": 1.989879395694194e-06, "epoch": 2.2064636131132294, "percentage": 73.56, "elapsed_time": "3:39:34", "remaining_time": "1:18:56"}
1581
+ {"current_steps": 1581, "total_steps": 2148, "loss": 0.2191, "lr": 1.9833947752052286e-06, "epoch": 2.2078586375261566, "percentage": 73.6, "elapsed_time": "3:39:40", "remaining_time": "1:18:47"}
1582
+ {"current_steps": 1582, "total_steps": 2148, "loss": 0.2423, "lr": 1.976918122809744e-06, "epoch": 2.209253661939084, "percentage": 73.65, "elapsed_time": "3:39:53", "remaining_time": "1:18:40"}
1583
+ {"current_steps": 1583, "total_steps": 2148, "loss": 0.2364, "lr": 1.9704494556152413e-06, "epoch": 2.210648686352011, "percentage": 73.7, "elapsed_time": "3:40:00", "remaining_time": "1:18:31"}
1584
+ {"current_steps": 1584, "total_steps": 2148, "loss": 0.2101, "lr": 1.9639887907081297e-06, "epoch": 2.2120437107649384, "percentage": 73.74, "elapsed_time": "3:40:08", "remaining_time": "1:18:22"}
1585
+ {"current_steps": 1585, "total_steps": 2148, "loss": 0.2528, "lr": 1.9575361451536772e-06, "epoch": 2.2134387351778657, "percentage": 73.79, "elapsed_time": "3:40:15", "remaining_time": "1:18:14"}
1586
+ {"current_steps": 1586, "total_steps": 2148, "loss": 0.2052, "lr": 1.9510915359959694e-06, "epoch": 2.214833759590793, "percentage": 73.84, "elapsed_time": "3:40:22", "remaining_time": "1:18:05"}
1587
+ {"current_steps": 1587, "total_steps": 2148, "loss": 0.2248, "lr": 1.944654980257869e-06, "epoch": 2.2162287840037203, "percentage": 73.88, "elapsed_time": "3:40:30", "remaining_time": "1:17:57"}
1588
+ {"current_steps": 1588, "total_steps": 2148, "loss": 0.2334, "lr": 1.9382264949409614e-06, "epoch": 2.217623808416647, "percentage": 73.93, "elapsed_time": "3:40:36", "remaining_time": "1:17:47"}
1589
+ {"current_steps": 1589, "total_steps": 2148, "loss": 0.2512, "lr": 1.931806097025517e-06, "epoch": 2.2190188328295744, "percentage": 73.98, "elapsed_time": "3:40:45", "remaining_time": "1:17:39"}
1590
+ {"current_steps": 1590, "total_steps": 2148, "loss": 0.2132, "lr": 1.925393803470447e-06, "epoch": 2.2204138572425016, "percentage": 74.02, "elapsed_time": "3:40:51", "remaining_time": "1:17:30"}
1591
+ {"current_steps": 1591, "total_steps": 2148, "loss": 0.2341, "lr": 1.9189896312132506e-06, "epoch": 2.221808881655429, "percentage": 74.07, "elapsed_time": "3:40:58", "remaining_time": "1:17:21"}
1592
+ {"current_steps": 1592, "total_steps": 2148, "loss": 0.2081, "lr": 1.912593597169975e-06, "epoch": 2.223203906068356, "percentage": 74.12, "elapsed_time": "3:41:06", "remaining_time": "1:17:13"}
1593
+ {"current_steps": 1593, "total_steps": 2148, "loss": 0.2374, "lr": 1.9062057182351768e-06, "epoch": 2.2245989304812834, "percentage": 74.16, "elapsed_time": "3:41:12", "remaining_time": "1:17:04"}
1594
+ {"current_steps": 1594, "total_steps": 2148, "loss": 0.2551, "lr": 1.899826011281865e-06, "epoch": 2.2259939548942107, "percentage": 74.21, "elapsed_time": "3:41:18", "remaining_time": "1:16:55"}
1595
+ {"current_steps": 1595, "total_steps": 2148, "loss": 0.2208, "lr": 1.893454493161468e-06, "epoch": 2.227388979307138, "percentage": 74.26, "elapsed_time": "3:41:25", "remaining_time": "1:16:46"}
1596
+ {"current_steps": 1596, "total_steps": 2148, "loss": 0.2283, "lr": 1.8870911807037856e-06, "epoch": 2.2287840037200652, "percentage": 74.3, "elapsed_time": "3:41:31", "remaining_time": "1:16:37"}
1597
+ {"current_steps": 1597, "total_steps": 2148, "loss": 0.2577, "lr": 1.8807360907169326e-06, "epoch": 2.2301790281329925, "percentage": 74.35, "elapsed_time": "3:41:38", "remaining_time": "1:16:28"}
1598
+ {"current_steps": 1598, "total_steps": 2148, "loss": 0.2252, "lr": 1.8743892399873154e-06, "epoch": 2.23157405254592, "percentage": 74.39, "elapsed_time": "3:41:44", "remaining_time": "1:16:19"}
1599
+ {"current_steps": 1599, "total_steps": 2148, "loss": 0.2368, "lr": 1.868050645279576e-06, "epoch": 2.2329690769588466, "percentage": 74.44, "elapsed_time": "3:41:51", "remaining_time": "1:16:10"}
1600
+ {"current_steps": 1600, "total_steps": 2148, "loss": 0.2306, "lr": 1.8617203233365427e-06, "epoch": 2.234364101371774, "percentage": 74.49, "elapsed_time": "3:42:01", "remaining_time": "1:16:02"}
1601
+ {"current_steps": 1601, "total_steps": 2148, "loss": 0.2372, "lr": 1.8553982908792e-06, "epoch": 2.235759125784701, "percentage": 74.53, "elapsed_time": "3:43:56", "remaining_time": "1:16:30"}
1602
+ {"current_steps": 1602, "total_steps": 2148, "loss": 0.2783, "lr": 1.8490845646066303e-06, "epoch": 2.2371541501976284, "percentage": 74.58, "elapsed_time": "3:44:03", "remaining_time": "1:16:21"}
1603
+ {"current_steps": 1603, "total_steps": 2148, "loss": 0.2567, "lr": 1.8427791611959762e-06, "epoch": 2.2385491746105557, "percentage": 74.63, "elapsed_time": "3:44:12", "remaining_time": "1:16:13"}
1604
+ {"current_steps": 1604, "total_steps": 2148, "loss": 0.2154, "lr": 1.8364820973024e-06, "epoch": 2.239944199023483, "percentage": 74.67, "elapsed_time": "3:44:19", "remaining_time": "1:16:04"}
1605
+ {"current_steps": 1605, "total_steps": 2148, "loss": 0.2522, "lr": 1.8301933895590362e-06, "epoch": 2.2413392234364102, "percentage": 74.72, "elapsed_time": "3:44:30", "remaining_time": "1:15:57"}
1606
+ {"current_steps": 1606, "total_steps": 2148, "loss": 0.2189, "lr": 1.8239130545769408e-06, "epoch": 2.2427342478493375, "percentage": 74.77, "elapsed_time": "3:44:38", "remaining_time": "1:15:48"}
1607
+ {"current_steps": 1607, "total_steps": 2148, "loss": 0.2524, "lr": 1.8176411089450618e-06, "epoch": 2.2441292722622648, "percentage": 74.81, "elapsed_time": "3:44:50", "remaining_time": "1:15:41"}
1608
+ {"current_steps": 1608, "total_steps": 2148, "loss": 0.2342, "lr": 1.8113775692301822e-06, "epoch": 2.2455242966751916, "percentage": 74.86, "elapsed_time": "3:44:58", "remaining_time": "1:15:33"}
1609
+ {"current_steps": 1609, "total_steps": 2148, "loss": 0.2391, "lr": 1.8051224519768817e-06, "epoch": 2.246919321088119, "percentage": 74.91, "elapsed_time": "3:45:06", "remaining_time": "1:15:24"}
1610
+ {"current_steps": 1610, "total_steps": 2148, "loss": 0.2179, "lr": 1.7988757737074959e-06, "epoch": 2.248314345501046, "percentage": 74.95, "elapsed_time": "3:45:17", "remaining_time": "1:15:16"}
1611
+ {"current_steps": 1611, "total_steps": 2148, "loss": 0.2222, "lr": 1.7926375509220695e-06, "epoch": 2.2497093699139734, "percentage": 75.0, "elapsed_time": "3:45:25", "remaining_time": "1:15:08"}
1612
+ {"current_steps": 1612, "total_steps": 2148, "loss": 0.2109, "lr": 1.7864078000983076e-06, "epoch": 2.2511043943269007, "percentage": 75.05, "elapsed_time": "3:45:32", "remaining_time": "1:14:59"}
1613
+ {"current_steps": 1613, "total_steps": 2148, "loss": 0.2215, "lr": 1.7801865376915451e-06, "epoch": 2.252499418739828, "percentage": 75.09, "elapsed_time": "3:45:42", "remaining_time": "1:14:51"}
1614
+ {"current_steps": 1614, "total_steps": 2148, "loss": 0.2469, "lr": 1.7739737801346895e-06, "epoch": 2.2538944431527552, "percentage": 75.14, "elapsed_time": "3:45:49", "remaining_time": "1:14:42"}
1615
+ {"current_steps": 1615, "total_steps": 2148, "loss": 0.2573, "lr": 1.7677695438381831e-06, "epoch": 2.2552894675656825, "percentage": 75.19, "elapsed_time": "3:45:57", "remaining_time": "1:14:34"}