sedrickkeh commited on
Commit
9010722
·
verified ·
1 Parent(s): bebbe4e

Training in progress, epoch 2

Browse files
model-00001-of-00004.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:237405c321e8fb32c45e847b3fd7b833aa92b89f9202ee5498a19e6f9aedb693
3
  size 4877660776
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b354fffd7b84e79ac895bc8a1117f46139d240975a924c31cff85f21174fb0b7
3
  size 4877660776
model-00002-of-00004.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:63caeb827b8d149bda2a0c77ebe50aea5cf4e98257bf2f3dad59ccbed8ff87d9
3
  size 4932751008
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:603e7982ef56e879785c28122dd2cfcccbb6e1d5dafd78a841530357816d2f12
3
  size 4932751008
model-00003-of-00004.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:ed3c289f79efc9e05edb820f76ee1667d528cb745069c034d98b7f71e24fe502
3
  size 4330865200
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a5a3a686c96166a8f129125ee394d5e5b0f323682f7f58ed26439fb0b6b31dac
3
  size 4330865200
model-00004-of-00004.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:12bbbc06c63f2359be5dcc1ad1e4bfcf6ab770923cee3db5da2e834584666049
3
  size 1089994880
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:198cc902e4eb81777ae407cb42df9ea1c16386f0183fda869ab0f639d8a0c09d
3
  size 1089994880
trainer_log.jsonl CHANGED
@@ -212,3 +212,102 @@
212
  {"current_steps": 212, "total_steps": 312, "loss": 0.3009, "lr": 1.132232521764884e-05, "epoch": 2.0319488817891376, "percentage": 67.95, "elapsed_time": "1:54:43", "remaining_time": "0:54:07"}
213
  {"current_steps": 213, "total_steps": 312, "loss": 0.3387, "lr": 1.1120698719390362e-05, "epoch": 2.0415335463258786, "percentage": 68.27, "elapsed_time": "1:55:18", "remaining_time": "0:53:35"}
214
  {"current_steps": 214, "total_steps": 312, "loss": 0.3105, "lr": 1.0920190005209066e-05, "epoch": 2.0511182108626196, "percentage": 68.59, "elapsed_time": "1:55:50", "remaining_time": "0:53:02"}
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
212
  {"current_steps": 212, "total_steps": 312, "loss": 0.3009, "lr": 1.132232521764884e-05, "epoch": 2.0319488817891376, "percentage": 67.95, "elapsed_time": "1:54:43", "remaining_time": "0:54:07"}
213
  {"current_steps": 213, "total_steps": 312, "loss": 0.3387, "lr": 1.1120698719390362e-05, "epoch": 2.0415335463258786, "percentage": 68.27, "elapsed_time": "1:55:18", "remaining_time": "0:53:35"}
214
  {"current_steps": 214, "total_steps": 312, "loss": 0.3105, "lr": 1.0920190005209066e-05, "epoch": 2.0511182108626196, "percentage": 68.59, "elapsed_time": "1:55:50", "remaining_time": "0:53:02"}
215
+ {"current_steps": 215, "total_steps": 312, "loss": 0.2901, "lr": 1.0720824316443321e-05, "epoch": 2.060702875399361, "percentage": 68.91, "elapsed_time": "1:56:25", "remaining_time": "0:52:31"}
216
+ {"current_steps": 216, "total_steps": 312, "loss": 0.3493, "lr": 1.0522626750540029e-05, "epoch": 2.070287539936102, "percentage": 69.23, "elapsed_time": "1:56:53", "remaining_time": "0:51:57"}
217
+ {"current_steps": 217, "total_steps": 312, "loss": 0.2985, "lr": 1.0325622257895205e-05, "epoch": 2.0798722044728435, "percentage": 69.55, "elapsed_time": "1:57:23", "remaining_time": "0:51:23"}
218
+ {"current_steps": 218, "total_steps": 312, "loss": 0.3166, "lr": 1.0129835638713064e-05, "epoch": 2.0894568690095845, "percentage": 69.87, "elapsed_time": "1:57:50", "remaining_time": "0:50:48"}
219
+ {"current_steps": 219, "total_steps": 312, "loss": 0.2843, "lr": 9.935291539884e-06, "epoch": 2.099041533546326, "percentage": 70.19, "elapsed_time": "1:58:25", "remaining_time": "0:50:17"}
220
+ {"current_steps": 220, "total_steps": 312, "loss": 0.3163, "lr": 9.74201445188188e-06, "epoch": 2.108626198083067, "percentage": 70.51, "elapsed_time": "1:58:54", "remaining_time": "0:49:43"}
221
+ {"current_steps": 221, "total_steps": 312, "loss": 0.3222, "lr": 9.550028705681024e-06, "epoch": 2.1182108626198084, "percentage": 70.83, "elapsed_time": "1:59:29", "remaining_time": "0:49:12"}
222
+ {"current_steps": 222, "total_steps": 312, "loss": 0.2909, "lr": 9.359358469693272e-06, "epoch": 2.1277955271565494, "percentage": 71.15, "elapsed_time": "1:59:56", "remaining_time": "0:48:37"}
223
+ {"current_steps": 223, "total_steps": 312, "loss": 0.3146, "lr": 9.170027746725487e-06, "epoch": 2.137380191693291, "percentage": 71.47, "elapsed_time": "2:00:32", "remaining_time": "0:48:06"}
224
+ {"current_steps": 224, "total_steps": 312, "loss": 0.3017, "lr": 8.982060370957953e-06, "epoch": 2.146964856230032, "percentage": 71.79, "elapsed_time": "2:01:02", "remaining_time": "0:47:33"}
225
+ {"current_steps": 225, "total_steps": 312, "loss": 0.3456, "lr": 8.795480004943946e-06, "epoch": 2.1565495207667733, "percentage": 72.12, "elapsed_time": "2:01:37", "remaining_time": "0:47:01"}
226
+ {"current_steps": 226, "total_steps": 312, "loss": 0.2761, "lr": 8.610310136630962e-06, "epoch": 2.1661341853035143, "percentage": 72.44, "elapsed_time": "2:02:10", "remaining_time": "0:46:29"}
227
+ {"current_steps": 227, "total_steps": 312, "loss": 0.302, "lr": 8.426574076403887e-06, "epoch": 2.1757188498402558, "percentage": 72.76, "elapsed_time": "2:02:37", "remaining_time": "0:45:54"}
228
+ {"current_steps": 228, "total_steps": 312, "loss": 0.338, "lr": 8.24429495415054e-06, "epoch": 2.1853035143769968, "percentage": 73.08, "elapsed_time": "2:03:10", "remaining_time": "0:45:22"}
229
+ {"current_steps": 229, "total_steps": 312, "loss": 0.3081, "lr": 8.063495716349929e-06, "epoch": 2.194888178913738, "percentage": 73.4, "elapsed_time": "2:03:39", "remaining_time": "0:44:49"}
230
+ {"current_steps": 230, "total_steps": 312, "loss": 0.3419, "lr": 7.884199123183604e-06, "epoch": 2.2044728434504792, "percentage": 73.72, "elapsed_time": "2:04:11", "remaining_time": "0:44:16"}
231
+ {"current_steps": 231, "total_steps": 312, "loss": 0.2749, "lr": 7.706427745670458e-06, "epoch": 2.2140575079872207, "percentage": 74.04, "elapsed_time": "2:04:46", "remaining_time": "0:43:44"}
232
+ {"current_steps": 232, "total_steps": 312, "loss": 0.3365, "lr": 7.530203962825331e-06, "epoch": 2.2236421725239617, "percentage": 74.36, "elapsed_time": "2:05:15", "remaining_time": "0:43:11"}
233
+ {"current_steps": 233, "total_steps": 312, "loss": 0.3282, "lr": 7.355549958841808e-06, "epoch": 2.2332268370607027, "percentage": 74.68, "elapsed_time": "2:05:51", "remaining_time": "0:42:40"}
234
+ {"current_steps": 234, "total_steps": 312, "loss": 0.2943, "lr": 7.182487720299518e-06, "epoch": 2.242811501597444, "percentage": 75.0, "elapsed_time": "2:06:20", "remaining_time": "0:42:06"}
235
+ {"current_steps": 235, "total_steps": 312, "loss": 0.3252, "lr": 7.01103903339633e-06, "epoch": 2.252396166134185, "percentage": 75.32, "elapsed_time": "2:06:52", "remaining_time": "0:41:34"}
236
+ {"current_steps": 236, "total_steps": 312, "loss": 0.2755, "lr": 6.841225481205749e-06, "epoch": 2.2619808306709266, "percentage": 75.64, "elapsed_time": "2:07:25", "remaining_time": "0:41:02"}
237
+ {"current_steps": 237, "total_steps": 312, "loss": 0.2962, "lr": 6.6730684409599225e-06, "epoch": 2.2715654952076676, "percentage": 75.96, "elapsed_time": "2:08:01", "remaining_time": "0:40:30"}
238
+ {"current_steps": 238, "total_steps": 312, "loss": 0.2951, "lr": 6.5065890813585145e-06, "epoch": 2.281150159744409, "percentage": 76.28, "elapsed_time": "2:08:37", "remaining_time": "0:39:59"}
239
+ {"current_steps": 239, "total_steps": 312, "loss": 0.317, "lr": 6.3418083599038624e-06, "epoch": 2.29073482428115, "percentage": 76.6, "elapsed_time": "2:09:10", "remaining_time": "0:39:27"}
240
+ {"current_steps": 240, "total_steps": 312, "loss": 0.2881, "lr": 6.178747020262708e-06, "epoch": 2.3003194888178915, "percentage": 76.92, "elapsed_time": "2:09:40", "remaining_time": "0:38:54"}
241
+ {"current_steps": 241, "total_steps": 312, "loss": 0.2595, "lr": 6.017425589654853e-06, "epoch": 2.3099041533546325, "percentage": 77.24, "elapsed_time": "2:10:13", "remaining_time": "0:38:21"}
242
+ {"current_steps": 242, "total_steps": 312, "loss": 0.326, "lr": 5.857864376269051e-06, "epoch": 2.319488817891374, "percentage": 77.56, "elapsed_time": "2:10:45", "remaining_time": "0:37:49"}
243
+ {"current_steps": 243, "total_steps": 312, "loss": 0.2744, "lr": 5.700083466706494e-06, "epoch": 2.329073482428115, "percentage": 77.88, "elapsed_time": "2:11:16", "remaining_time": "0:37:16"}
244
+ {"current_steps": 244, "total_steps": 312, "loss": 0.3105, "lr": 5.544102723452171e-06, "epoch": 2.3386581469648564, "percentage": 78.21, "elapsed_time": "2:11:47", "remaining_time": "0:36:43"}
245
+ {"current_steps": 245, "total_steps": 312, "loss": 0.316, "lr": 5.38994178237445e-06, "epoch": 2.3482428115015974, "percentage": 78.53, "elapsed_time": "2:12:22", "remaining_time": "0:36:11"}
246
+ {"current_steps": 246, "total_steps": 312, "loss": 0.3226, "lr": 5.237620050253189e-06, "epoch": 2.357827476038339, "percentage": 78.85, "elapsed_time": "2:12:56", "remaining_time": "0:35:40"}
247
+ {"current_steps": 247, "total_steps": 312, "loss": 0.2614, "lr": 5.087156702336689e-06, "epoch": 2.36741214057508, "percentage": 79.17, "elapsed_time": "2:13:26", "remaining_time": "0:35:07"}
248
+ {"current_steps": 248, "total_steps": 312, "loss": 0.3123, "lr": 4.938570679927784e-06, "epoch": 2.376996805111821, "percentage": 79.49, "elapsed_time": "2:14:01", "remaining_time": "0:34:35"}
249
+ {"current_steps": 249, "total_steps": 312, "loss": 0.3123, "lr": 4.791880687999382e-06, "epoch": 2.3865814696485623, "percentage": 79.81, "elapsed_time": "2:14:35", "remaining_time": "0:34:03"}
250
+ {"current_steps": 250, "total_steps": 312, "loss": 0.3176, "lr": 4.647105192839778e-06, "epoch": 2.3961661341853033, "percentage": 80.13, "elapsed_time": "2:15:06", "remaining_time": "0:33:30"}
251
+ {"current_steps": 251, "total_steps": 312, "loss": 0.3144, "lr": 4.504262419727983e-06, "epoch": 2.405750798722045, "percentage": 80.45, "elapsed_time": "2:15:34", "remaining_time": "0:32:56"}
252
+ {"current_steps": 252, "total_steps": 312, "loss": 0.34, "lr": 4.363370350639405e-06, "epoch": 2.415335463258786, "percentage": 80.77, "elapsed_time": "2:16:07", "remaining_time": "0:32:24"}
253
+ {"current_steps": 253, "total_steps": 312, "loss": 0.2955, "lr": 4.2244467219821806e-06, "epoch": 2.4249201277955272, "percentage": 81.09, "elapsed_time": "2:16:36", "remaining_time": "0:31:51"}
254
+ {"current_steps": 254, "total_steps": 312, "loss": 0.283, "lr": 4.087509022364382e-06, "epoch": 2.4345047923322682, "percentage": 81.41, "elapsed_time": "2:17:08", "remaining_time": "0:31:18"}
255
+ {"current_steps": 255, "total_steps": 312, "loss": 0.3177, "lr": 3.952574490392443e-06, "epoch": 2.4440894568690097, "percentage": 81.73, "elapsed_time": "2:17:43", "remaining_time": "0:30:47"}
256
+ {"current_steps": 256, "total_steps": 312, "loss": 0.302, "lr": 3.819660112501053e-06, "epoch": 2.4536741214057507, "percentage": 82.05, "elapsed_time": "2:18:16", "remaining_time": "0:30:14"}
257
+ {"current_steps": 257, "total_steps": 312, "loss": 0.302, "lr": 3.6887826208147968e-06, "epoch": 2.463258785942492, "percentage": 82.37, "elapsed_time": "2:18:47", "remaining_time": "0:29:42"}
258
+ {"current_steps": 258, "total_steps": 312, "loss": 0.2646, "lr": 3.5599584910418037e-06, "epoch": 2.472843450479233, "percentage": 82.69, "elapsed_time": "2:19:18", "remaining_time": "0:29:09"}
259
+ {"current_steps": 259, "total_steps": 312, "loss": 0.3084, "lr": 3.433203940399672e-06, "epoch": 2.4824281150159746, "percentage": 83.01, "elapsed_time": "2:19:48", "remaining_time": "0:28:36"}
260
+ {"current_steps": 260, "total_steps": 312, "loss": 0.3469, "lr": 3.3085349255739475e-06, "epoch": 2.4920127795527156, "percentage": 83.33, "elapsed_time": "2:20:21", "remaining_time": "0:28:04"}
261
+ {"current_steps": 261, "total_steps": 312, "loss": 0.3093, "lr": 3.1859671407093984e-06, "epoch": 2.501597444089457, "percentage": 83.65, "elapsed_time": "2:20:54", "remaining_time": "0:27:32"}
262
+ {"current_steps": 262, "total_steps": 312, "loss": 0.2979, "lr": 3.0655160154343177e-06, "epoch": 2.511182108626198, "percentage": 83.97, "elapsed_time": "2:21:28", "remaining_time": "0:26:59"}
263
+ {"current_steps": 263, "total_steps": 312, "loss": 0.3047, "lr": 2.947196712918157e-06, "epoch": 2.520766773162939, "percentage": 84.29, "elapsed_time": "2:21:55", "remaining_time": "0:26:26"}
264
+ {"current_steps": 264, "total_steps": 312, "loss": 0.2969, "lr": 2.8310241279626784e-06, "epoch": 2.5303514376996805, "percentage": 84.62, "elapsed_time": "2:22:24", "remaining_time": "0:25:53"}
265
+ {"current_steps": 265, "total_steps": 312, "loss": 0.2981, "lr": 2.7170128851269084e-06, "epoch": 2.539936102236422, "percentage": 84.94, "elapsed_time": "2:22:54", "remaining_time": "0:25:20"}
266
+ {"current_steps": 266, "total_steps": 312, "loss": 0.3308, "lr": 2.6051773368860935e-06, "epoch": 2.549520766773163, "percentage": 85.26, "elapsed_time": "2:23:22", "remaining_time": "0:24:47"}
267
+ {"current_steps": 267, "total_steps": 312, "loss": 0.3134, "lr": 2.4955315618249263e-06, "epoch": 2.559105431309904, "percentage": 85.58, "elapsed_time": "2:23:50", "remaining_time": "0:24:14"}
268
+ {"current_steps": 268, "total_steps": 312, "loss": 0.2988, "lr": 2.38808936286524e-06, "epoch": 2.5686900958466454, "percentage": 85.9, "elapsed_time": "2:24:19", "remaining_time": "0:23:41"}
269
+ {"current_steps": 269, "total_steps": 312, "loss": 0.275, "lr": 2.2828642655284038e-06, "epoch": 2.5782747603833864, "percentage": 86.22, "elapsed_time": "2:24:49", "remaining_time": "0:23:09"}
270
+ {"current_steps": 270, "total_steps": 312, "loss": 0.2913, "lr": 2.1798695162326444e-06, "epoch": 2.587859424920128, "percentage": 86.54, "elapsed_time": "2:25:22", "remaining_time": "0:22:36"}
271
+ {"current_steps": 271, "total_steps": 312, "loss": 0.3142, "lr": 2.0791180806254975e-06, "epoch": 2.597444089456869, "percentage": 86.86, "elapsed_time": "2:25:53", "remaining_time": "0:22:04"}
272
+ {"current_steps": 272, "total_steps": 312, "loss": 0.2994, "lr": 1.9806226419516195e-06, "epoch": 2.6070287539936103, "percentage": 87.18, "elapsed_time": "2:26:23", "remaining_time": "0:21:31"}
273
+ {"current_steps": 273, "total_steps": 312, "loss": 0.3301, "lr": 1.8843955994561191e-06, "epoch": 2.6166134185303513, "percentage": 87.5, "elapsed_time": "2:26:57", "remaining_time": "0:20:59"}
274
+ {"current_steps": 274, "total_steps": 312, "loss": 0.3136, "lr": 1.790449066823683e-06, "epoch": 2.626198083067093, "percentage": 87.82, "elapsed_time": "2:27:31", "remaining_time": "0:20:27"}
275
+ {"current_steps": 275, "total_steps": 312, "loss": 0.3265, "lr": 1.6987948706536038e-06, "epoch": 2.635782747603834, "percentage": 88.14, "elapsed_time": "2:28:06", "remaining_time": "0:19:55"}
276
+ {"current_steps": 276, "total_steps": 312, "loss": 0.3116, "lr": 1.6094445489709886e-06, "epoch": 2.6453674121405752, "percentage": 88.46, "elapsed_time": "2:28:39", "remaining_time": "0:19:23"}
277
+ {"current_steps": 277, "total_steps": 312, "loss": 0.3081, "lr": 1.5224093497742654e-06, "epoch": 2.6549520766773163, "percentage": 88.78, "elapsed_time": "2:29:12", "remaining_time": "0:18:51"}
278
+ {"current_steps": 278, "total_steps": 312, "loss": 0.2914, "lr": 1.4377002296192233e-06, "epoch": 2.6645367412140573, "percentage": 89.1, "elapsed_time": "2:29:48", "remaining_time": "0:18:19"}
279
+ {"current_steps": 279, "total_steps": 312, "loss": 0.3398, "lr": 1.3553278522397162e-06, "epoch": 2.6741214057507987, "percentage": 89.42, "elapsed_time": "2:30:21", "remaining_time": "0:17:47"}
280
+ {"current_steps": 280, "total_steps": 312, "loss": 0.2895, "lr": 1.275302587205256e-06, "epoch": 2.68370607028754, "percentage": 89.74, "elapsed_time": "2:30:52", "remaining_time": "0:17:14"}
281
+ {"current_steps": 281, "total_steps": 312, "loss": 0.3205, "lr": 1.1976345086156193e-06, "epoch": 2.693290734824281, "percentage": 90.06, "elapsed_time": "2:31:22", "remaining_time": "0:16:41"}
282
+ {"current_steps": 282, "total_steps": 312, "loss": 0.307, "lr": 1.1223333938326486e-06, "epoch": 2.702875399361022, "percentage": 90.38, "elapsed_time": "2:31:56", "remaining_time": "0:16:09"}
283
+ {"current_steps": 283, "total_steps": 312, "loss": 0.2977, "lr": 1.0494087222494253e-06, "epoch": 2.7124600638977636, "percentage": 90.71, "elapsed_time": "2:32:31", "remaining_time": "0:15:37"}
284
+ {"current_steps": 284, "total_steps": 312, "loss": 0.2727, "lr": 9.788696740969295e-07, "epoch": 2.722044728434505, "percentage": 91.03, "elapsed_time": "2:33:04", "remaining_time": "0:15:05"}
285
+ {"current_steps": 285, "total_steps": 312, "loss": 0.3241, "lr": 9.107251292883856e-07, "epoch": 2.731629392971246, "percentage": 91.35, "elapsed_time": "2:33:37", "remaining_time": "0:14:33"}
286
+ {"current_steps": 286, "total_steps": 312, "loss": 0.2888, "lr": 8.44983666301391e-07, "epoch": 2.741214057507987, "percentage": 91.67, "elapsed_time": "2:34:10", "remaining_time": "0:14:00"}
287
+ {"current_steps": 287, "total_steps": 312, "loss": 0.3236, "lr": 7.816535610980103e-07, "epoch": 2.7507987220447285, "percentage": 91.99, "elapsed_time": "2:34:46", "remaining_time": "0:13:28"}
288
+ {"current_steps": 288, "total_steps": 312, "loss": 0.3293, "lr": 7.207427860829352e-07, "epoch": 2.7603833865814695, "percentage": 92.31, "elapsed_time": "2:35:13", "remaining_time": "0:12:56"}
289
+ {"current_steps": 289, "total_steps": 312, "loss": 0.2896, "lr": 6.622590090998727e-07, "epoch": 2.769968051118211, "percentage": 92.63, "elapsed_time": "2:35:42", "remaining_time": "0:12:23"}
290
+ {"current_steps": 290, "total_steps": 312, "loss": 0.2977, "lr": 6.062095924662625e-07, "epoch": 2.779552715654952, "percentage": 92.95, "elapsed_time": "2:36:16", "remaining_time": "0:11:51"}
291
+ {"current_steps": 291, "total_steps": 312, "loss": 0.3527, "lr": 5.526015920464689e-07, "epoch": 2.7891373801916934, "percentage": 93.27, "elapsed_time": "2:36:48", "remaining_time": "0:11:18"}
292
+ {"current_steps": 292, "total_steps": 312, "loss": 0.2575, "lr": 5.014417563635276e-07, "epoch": 2.7987220447284344, "percentage": 93.59, "elapsed_time": "2:37:17", "remaining_time": "0:10:46"}
293
+ {"current_steps": 293, "total_steps": 312, "loss": 0.3026, "lr": 4.5273652574961745e-07, "epoch": 2.8083067092651754, "percentage": 93.91, "elapsed_time": "2:37:46", "remaining_time": "0:10:13"}
294
+ {"current_steps": 294, "total_steps": 312, "loss": 0.2953, "lr": 4.064920315352905e-07, "epoch": 2.817891373801917, "percentage": 94.23, "elapsed_time": "2:38:18", "remaining_time": "0:09:41"}
295
+ {"current_steps": 295, "total_steps": 312, "loss": 0.3698, "lr": 3.62714095277632e-07, "epoch": 2.8274760383386583, "percentage": 94.55, "elapsed_time": "2:38:53", "remaining_time": "0:09:09"}
296
+ {"current_steps": 296, "total_steps": 312, "loss": 0.2709, "lr": 3.214082280274067e-07, "epoch": 2.8370607028753994, "percentage": 94.87, "elapsed_time": "2:39:26", "remaining_time": "0:08:37"}
297
+ {"current_steps": 297, "total_steps": 312, "loss": 0.3268, "lr": 2.825796296352823e-07, "epoch": 2.8466453674121404, "percentage": 95.19, "elapsed_time": "2:40:01", "remaining_time": "0:08:04"}
298
+ {"current_steps": 298, "total_steps": 312, "loss": 0.3032, "lr": 2.462331880972468e-07, "epoch": 2.856230031948882, "percentage": 95.51, "elapsed_time": "2:40:29", "remaining_time": "0:07:32"}
299
+ {"current_steps": 299, "total_steps": 312, "loss": 0.3539, "lr": 2.123734789392673e-07, "epoch": 2.8658146964856233, "percentage": 95.83, "elapsed_time": "2:41:01", "remaining_time": "0:07:00"}
300
+ {"current_steps": 300, "total_steps": 312, "loss": 0.2696, "lr": 1.81004764641306e-07, "epoch": 2.8753993610223643, "percentage": 96.15, "elapsed_time": "2:41:38", "remaining_time": "0:06:27"}
301
+ {"current_steps": 301, "total_steps": 312, "loss": 0.3199, "lr": 1.5213099410071873e-07, "epoch": 2.8849840255591053, "percentage": 96.47, "elapsed_time": "2:42:09", "remaining_time": "0:05:55"}
302
+ {"current_steps": 302, "total_steps": 312, "loss": 0.3403, "lr": 1.2575580213514792e-07, "epoch": 2.8945686900958467, "percentage": 96.79, "elapsed_time": "2:42:41", "remaining_time": "0:05:23"}
303
+ {"current_steps": 303, "total_steps": 312, "loss": 0.3211, "lr": 1.0188250902495312e-07, "epoch": 2.9041533546325877, "percentage": 97.12, "elapsed_time": "2:43:18", "remaining_time": "0:04:51"}
304
+ {"current_steps": 304, "total_steps": 312, "loss": 0.3422, "lr": 8.051412009521864e-08, "epoch": 2.913738019169329, "percentage": 97.44, "elapsed_time": "2:43:48", "remaining_time": "0:04:18"}
305
+ {"current_steps": 305, "total_steps": 312, "loss": 0.2635, "lr": 6.165332533744072e-08, "epoch": 2.92332268370607, "percentage": 97.76, "elapsed_time": "2:44:16", "remaining_time": "0:03:46"}
306
+ {"current_steps": 306, "total_steps": 312, "loss": 0.2942, "lr": 4.530249907087836e-08, "epoch": 2.9329073482428116, "percentage": 98.08, "elapsed_time": "2:44:50", "remaining_time": "0:03:13"}
307
+ {"current_steps": 307, "total_steps": 312, "loss": 0.3829, "lr": 3.146369964366791e-08, "epoch": 2.9424920127795526, "percentage": 98.4, "elapsed_time": "2:45:20", "remaining_time": "0:02:41"}
308
+ {"current_steps": 308, "total_steps": 312, "loss": 0.2838, "lr": 2.0138669173708213e-08, "epoch": 2.952076677316294, "percentage": 98.72, "elapsed_time": "2:45:54", "remaining_time": "0:02:09"}
309
+ {"current_steps": 309, "total_steps": 312, "loss": 0.3031, "lr": 1.1328833329333767e-08, "epoch": 2.961661341853035, "percentage": 99.04, "elapsed_time": "2:46:27", "remaining_time": "0:01:36"}
310
+ {"current_steps": 310, "total_steps": 312, "loss": 0.3185, "lr": 5.0353011498693875e-09, "epoch": 2.9712460063897765, "percentage": 99.36, "elapsed_time": "2:46:59", "remaining_time": "0:01:04"}
311
+ {"current_steps": 311, "total_steps": 312, "loss": 0.2968, "lr": 1.2588649059885883e-09, "epoch": 2.9808306709265175, "percentage": 99.68, "elapsed_time": "2:47:31", "remaining_time": "0:00:32"}
312
+ {"current_steps": 312, "total_steps": 312, "loss": 0.3009, "lr": 0.0, "epoch": 2.9904153354632586, "percentage": 100.0, "elapsed_time": "2:48:07", "remaining_time": "0:00:00"}
313
+ {"current_steps": 312, "total_steps": 312, "epoch": 2.9904153354632586, "percentage": 100.0, "elapsed_time": "2:49:40", "remaining_time": "0:00:00"}