penfever commited on
Commit
9369d05
·
verified ·
1 Parent(s): bafa165

Training in progress, step 1600

Browse files
model-00001-of-00004.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:2d253181c37bf2f9c403229890e52a8e06885829d38eee0fe85fb2f42969b232
3
  size 4902257696
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:520369d91a5fc56b95b5282a07a650e7e203baa659069316b53a1cfe1a547813
3
  size 4902257696
model-00002-of-00004.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:43e9064a7b64df5d5d1d3d76744db6e5ce885697bbdaee82feab961e3f630752
3
  size 4915960368
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:1c5d69dd5c66cbbed45827521ef97b332bae7e791e0a2e5051b2b8b2c6a8a9c1
3
  size 4915960368
model-00003-of-00004.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:54128798e4f3a663324713a3fcbb65d4a0e4d4f5461a1bb1203f759ddedd63dd
3
  size 4983068496
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:4007d4f5275ff76e2c6f0998c3726c8a767dd6b8fd762d2dc22fb54a5a1cae50
3
  size 4983068496
model-00004-of-00004.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:314452e5b8fc6222c6513b9009a09d61055afadc7b12b37a0a04cb86bea683a7
3
  size 1580230264
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:04cca09a1ce98372867c0ac1a146a550665ab6d8ebd1f439a5ef124dad568f04
3
  size 1580230264
trainer_log.jsonl CHANGED
@@ -278,3 +278,43 @@
278
  {"current_steps": 1390, "total_steps": 1652, "loss": 0.1604, "lr": 3.0127010028405303e-06, "epoch": 5.89171974522293, "percentage": 84.14, "elapsed_time": "14:40:49", "remaining_time": "2:46:01"}
279
  {"current_steps": 1395, "total_steps": 1652, "loss": 0.1683, "lr": 2.9020672473919107e-06, "epoch": 5.912951167728238, "percentage": 84.44, "elapsed_time": "14:43:58", "remaining_time": "2:42:51"}
280
  {"current_steps": 1400, "total_steps": 1652, "loss": 0.1706, "lr": 2.7933439684253616e-06, "epoch": 5.934182590233545, "percentage": 84.75, "elapsed_time": "14:47:07", "remaining_time": "2:39:41"}
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
278
  {"current_steps": 1390, "total_steps": 1652, "loss": 0.1604, "lr": 3.0127010028405303e-06, "epoch": 5.89171974522293, "percentage": 84.14, "elapsed_time": "14:40:49", "remaining_time": "2:46:01"}
279
  {"current_steps": 1395, "total_steps": 1652, "loss": 0.1683, "lr": 2.9020672473919107e-06, "epoch": 5.912951167728238, "percentage": 84.44, "elapsed_time": "14:43:58", "remaining_time": "2:42:51"}
280
  {"current_steps": 1400, "total_steps": 1652, "loss": 0.1706, "lr": 2.7933439684253616e-06, "epoch": 5.934182590233545, "percentage": 84.75, "elapsed_time": "14:47:07", "remaining_time": "2:39:41"}
281
+ {"current_steps": 1405, "total_steps": 1652, "loss": 0.1693, "lr": 2.6865433143842356e-06, "epoch": 5.955414012738854, "percentage": 85.05, "elapsed_time": "14:51:27", "remaining_time": "2:36:43"}
282
+ {"current_steps": 1410, "total_steps": 1652, "loss": 0.165, "lr": 2.5816772188830098e-06, "epoch": 5.976645435244161, "percentage": 85.35, "elapsed_time": "14:54:36", "remaining_time": "2:33:32"}
283
+ {"current_steps": 1415, "total_steps": 1652, "loss": 0.1631, "lr": 2.4787573993738524e-06, "epoch": 5.997876857749469, "percentage": 85.65, "elapsed_time": "14:57:46", "remaining_time": "2:30:22"}
284
+ {"current_steps": 1420, "total_steps": 1652, "loss": 0.1523, "lr": 2.377795355837349e-06, "epoch": 6.016985138004246, "percentage": 85.96, "elapsed_time": "15:00:37", "remaining_time": "2:27:08"}
285
+ {"current_steps": 1425, "total_steps": 1652, "loss": 0.1663, "lr": 2.2788023694975236e-06, "epoch": 6.038216560509555, "percentage": 86.26, "elapsed_time": "15:03:44", "remaining_time": "2:23:57"}
286
+ {"current_steps": 1430, "total_steps": 1652, "loss": 0.1575, "lr": 2.1817895015613134e-06, "epoch": 6.059447983014862, "percentage": 86.56, "elapsed_time": "15:06:53", "remaining_time": "2:20:47"}
287
+ {"current_steps": 1435, "total_steps": 1652, "loss": 0.1529, "lr": 2.086767591982608e-06, "epoch": 6.08067940552017, "percentage": 86.86, "elapsed_time": "15:10:02", "remaining_time": "2:17:36"}
288
+ {"current_steps": 1440, "total_steps": 1652, "loss": 0.1684, "lr": 1.9937472582510243e-06, "epoch": 6.101910828025478, "percentage": 87.17, "elapsed_time": "15:13:09", "remaining_time": "2:14:26"}
289
+ {"current_steps": 1445, "total_steps": 1652, "loss": 0.1554, "lr": 1.902738894205547e-06, "epoch": 6.123142250530786, "percentage": 87.47, "elapsed_time": "15:16:18", "remaining_time": "2:11:15"}
290
+ {"current_steps": 1450, "total_steps": 1652, "loss": 0.1596, "lr": 1.8137526688731365e-06, "epoch": 6.144373673036093, "percentage": 87.77, "elapsed_time": "15:19:27", "remaining_time": "2:08:05"}
291
+ {"current_steps": 1455, "total_steps": 1652, "loss": 0.1534, "lr": 1.7267985253324803e-06, "epoch": 6.165605095541402, "percentage": 88.08, "elapsed_time": "15:22:35", "remaining_time": "2:04:54"}
292
+ {"current_steps": 1460, "total_steps": 1652, "loss": 0.1738, "lr": 1.641886179602974e-06, "epoch": 6.186836518046709, "percentage": 88.38, "elapsed_time": "15:25:44", "remaining_time": "2:01:44"}
293
+ {"current_steps": 1465, "total_steps": 1652, "loss": 0.1723, "lr": 1.5590251195590811e-06, "epoch": 6.208067940552017, "percentage": 88.68, "elapsed_time": "15:28:53", "remaining_time": "1:58:34"}
294
+ {"current_steps": 1470, "total_steps": 1652, "loss": 0.1708, "lr": 1.4782246038701865e-06, "epoch": 6.229299363057325, "percentage": 88.98, "elapsed_time": "15:32:02", "remaining_time": "1:55:23"}
295
+ {"current_steps": 1475, "total_steps": 1652, "loss": 0.1735, "lr": 1.3994936609660493e-06, "epoch": 6.250530785562633, "percentage": 89.29, "elapsed_time": "15:35:11", "remaining_time": "1:52:13"}
296
+ {"current_steps": 1480, "total_steps": 1652, "loss": 0.1719, "lr": 1.3228410880280084e-06, "epoch": 6.2717622080679405, "percentage": 89.59, "elapsed_time": "15:38:20", "remaining_time": "1:49:03"}
297
+ {"current_steps": 1485, "total_steps": 1652, "loss": 0.158, "lr": 1.248275450005987e-06, "epoch": 6.292993630573249, "percentage": 89.89, "elapsed_time": "15:41:29", "remaining_time": "1:45:52"}
298
+ {"current_steps": 1490, "total_steps": 1652, "loss": 0.1674, "lr": 1.1758050786614872e-06, "epoch": 6.314225053078556, "percentage": 90.19, "elapsed_time": "15:44:37", "remaining_time": "1:42:42"}
299
+ {"current_steps": 1495, "total_steps": 1652, "loss": 0.1698, "lr": 1.1054380716366064e-06, "epoch": 6.3354564755838645, "percentage": 90.5, "elapsed_time": "15:47:46", "remaining_time": "1:39:31"}
300
+ {"current_steps": 1500, "total_steps": 1652, "loss": 0.1568, "lr": 1.0371822915492414e-06, "epoch": 6.356687898089172, "percentage": 90.8, "elapsed_time": "15:50:55", "remaining_time": "1:36:21"}
301
+ {"current_steps": 1505, "total_steps": 1652, "loss": 0.1634, "lr": 9.710453651145335e-07, "epoch": 6.37791932059448, "percentage": 91.1, "elapsed_time": "15:54:05", "remaining_time": "1:33:11"}
302
+ {"current_steps": 1510, "total_steps": 1652, "loss": 0.1658, "lr": 9.070346822926846e-07, "epoch": 6.399150743099788, "percentage": 91.4, "elapsed_time": "15:57:15", "remaining_time": "1:30:01"}
303
+ {"current_steps": 1515, "total_steps": 1652, "loss": 0.1619, "lr": 8.451573954632186e-07, "epoch": 6.420382165605096, "percentage": 91.71, "elapsed_time": "16:00:24", "remaining_time": "1:26:50"}
304
+ {"current_steps": 1520, "total_steps": 1652, "loss": 0.1543, "lr": 7.854204186257952e-07, "epoch": 6.441613588110403, "percentage": 92.01, "elapsed_time": "16:03:33", "remaining_time": "1:23:40"}
305
+ {"current_steps": 1525, "total_steps": 1652, "loss": 0.1555, "lr": 7.278304266276625e-07, "epoch": 6.462845010615712, "percentage": 92.31, "elapsed_time": "16:06:41", "remaining_time": "1:20:30"}
306
+ {"current_steps": 1530, "total_steps": 1652, "loss": 0.1524, "lr": 6.723938544178232e-07, "epoch": 6.484076433121019, "percentage": 92.62, "elapsed_time": "16:09:50", "remaining_time": "1:17:19"}
307
+ {"current_steps": 1535, "total_steps": 1652, "loss": 0.1545, "lr": 6.191168963280136e-07, "epoch": 6.505307855626327, "percentage": 92.92, "elapsed_time": "16:12:58", "remaining_time": "1:14:09"}
308
+ {"current_steps": 1540, "total_steps": 1652, "loss": 0.1439, "lr": 5.680055053805622e-07, "epoch": 6.526539278131635, "percentage": 93.22, "elapsed_time": "16:16:08", "remaining_time": "1:10:59"}
309
+ {"current_steps": 1545, "total_steps": 1652, "loss": 0.1787, "lr": 5.190653926232169e-07, "epoch": 6.547770700636943, "percentage": 93.52, "elapsed_time": "16:19:16", "remaining_time": "1:07:49"}
310
+ {"current_steps": 1550, "total_steps": 1652, "loss": 0.1493, "lr": 4.723020264910139e-07, "epoch": 6.56900212314225, "percentage": 93.83, "elapsed_time": "16:22:25", "remaining_time": "1:04:38"}
311
+ {"current_steps": 1555, "total_steps": 1652, "loss": 0.1871, "lr": 4.2772063219523875e-07, "epoch": 6.590233545647559, "percentage": 94.13, "elapsed_time": "16:25:33", "remaining_time": "1:01:28"}
312
+ {"current_steps": 1560, "total_steps": 1652, "loss": 0.162, "lr": 3.853261911395834e-07, "epoch": 6.611464968152866, "percentage": 94.43, "elapsed_time": "16:28:41", "remaining_time": "0:58:18"}
313
+ {"current_steps": 1565, "total_steps": 1652, "loss": 0.1771, "lr": 3.4512344036353727e-07, "epoch": 6.632696390658174, "percentage": 94.73, "elapsed_time": "16:31:50", "remaining_time": "0:55:08"}
314
+ {"current_steps": 1570, "total_steps": 1652, "loss": 0.1496, "lr": 3.071168720130779e-07, "epoch": 6.653927813163482, "percentage": 95.04, "elapsed_time": "16:34:58", "remaining_time": "0:51:58"}
315
+ {"current_steps": 1575, "total_steps": 1652, "loss": 0.1573, "lr": 2.7131073283873654e-07, "epoch": 6.67515923566879, "percentage": 95.34, "elapsed_time": "16:38:07", "remaining_time": "0:48:47"}
316
+ {"current_steps": 1580, "total_steps": 1652, "loss": 0.1609, "lr": 2.3770902372107772e-07, "epoch": 6.6963906581740975, "percentage": 95.64, "elapsed_time": "16:41:16", "remaining_time": "0:45:37"}
317
+ {"current_steps": 1585, "total_steps": 1652, "loss": 0.1427, "lr": 2.0631549922364824e-07, "epoch": 6.717622080679406, "percentage": 95.94, "elapsed_time": "16:44:25", "remaining_time": "0:42:27"}
318
+ {"current_steps": 1590, "total_steps": 1652, "loss": 0.1706, "lr": 1.7713366717344803e-07, "epoch": 6.738853503184713, "percentage": 96.25, "elapsed_time": "16:47:33", "remaining_time": "0:39:17"}
319
+ {"current_steps": 1595, "total_steps": 1652, "loss": 0.1495, "lr": 1.5016678826899055e-07, "epoch": 6.7600849256900215, "percentage": 96.55, "elapsed_time": "16:50:42", "remaining_time": "0:36:07"}
320
+ {"current_steps": 1600, "total_steps": 1652, "loss": 0.1599, "lr": 1.2541787571594522e-07, "epoch": 6.781316348195329, "percentage": 96.85, "elapsed_time": "16:53:51", "remaining_time": "0:32:57"}