penfever commited on
Commit
52ca4df
·
verified ·
1 Parent(s): a83b0d3

Training in progress, step 9000

Browse files
model-00001-of-00004.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:3678c246b0c544502d09d0df8232b622361f8d445e369a5bd9563fdc6afec285
3
  size 4902257696
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:223860e7f0179d9b6f3a24284210c62ec12ff943301c6f04bf27490ebf37c972
3
  size 4902257696
model-00002-of-00004.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:30f5add51c1c220daf2aacad6a2104153f2106052fa2a3d2a20884dce75a4501
3
  size 4915960368
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:663265eda9d0fdd3446e87ac96535bf6ba220655641d1777144ea270cc29654f
3
  size 4915960368
model-00003-of-00004.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:1c77b57898eedc3c19f6227aa1c8d7f35c538960e12a3b70ff81847eb3575beb
3
  size 4983068496
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:16939b5ddffa96e7bbe6b784746cc09c1a947b996e2b2e7869aaef88eecde3c1
3
  size 4983068496
model-00004-of-00004.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:6db990d8b83ec36ba7c747815fb996569b3b3348ec2f378fa5157c4ebbfcb157
3
  size 1580230264
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:dde6aa392da7ce8d96abe0ca8d4a3ad3c0c20704c47dc2c6b5eeeace82065c24
3
  size 1580230264
trainer_log.jsonl CHANGED
@@ -1772,3 +1772,43 @@
1772
  {"current_steps": 8790, "total_steps": 9625, "loss": 0.1791, "lr": 9.12317883214886e-07, "epoch": 6.393597671880684, "percentage": 91.32, "elapsed_time": "10:29:34", "remaining_time": "0:59:48"}
1773
  {"current_steps": 8795, "total_steps": 9625, "loss": 0.1781, "lr": 9.015201149614427e-07, "epoch": 6.3972353583121135, "percentage": 91.38, "elapsed_time": "10:32:36", "remaining_time": "0:59:42"}
1774
  {"current_steps": 8800, "total_steps": 9625, "loss": 0.1657, "lr": 8.907851528443734e-07, "epoch": 6.400873044743543, "percentage": 91.43, "elapsed_time": "10:35:27", "remaining_time": "0:59:34"}
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1772
  {"current_steps": 8790, "total_steps": 9625, "loss": 0.1791, "lr": 9.12317883214886e-07, "epoch": 6.393597671880684, "percentage": 91.32, "elapsed_time": "10:29:34", "remaining_time": "0:59:48"}
1773
  {"current_steps": 8795, "total_steps": 9625, "loss": 0.1781, "lr": 9.015201149614427e-07, "epoch": 6.3972353583121135, "percentage": 91.38, "elapsed_time": "10:32:36", "remaining_time": "0:59:42"}
1774
  {"current_steps": 8800, "total_steps": 9625, "loss": 0.1657, "lr": 8.907851528443734e-07, "epoch": 6.400873044743543, "percentage": 91.43, "elapsed_time": "10:35:27", "remaining_time": "0:59:34"}
1775
+ {"current_steps": 8805, "total_steps": 9625, "loss": 0.1531, "lr": 8.801130321660411e-07, "epoch": 6.404510731174973, "percentage": 91.48, "elapsed_time": "10:39:18", "remaining_time": "0:59:32"}
1776
+ {"current_steps": 8810, "total_steps": 9625, "loss": 0.1525, "lr": 8.695037880221569e-07, "epoch": 6.4081484176064025, "percentage": 91.53, "elapsed_time": "10:42:06", "remaining_time": "0:59:24"}
1777
+ {"current_steps": 8815, "total_steps": 9625, "loss": 0.1632, "lr": 8.589574553016545e-07, "epoch": 6.411786104037832, "percentage": 91.58, "elapsed_time": "10:44:53", "remaining_time": "0:59:15"}
1778
+ {"current_steps": 8820, "total_steps": 9625, "loss": 0.1589, "lr": 8.484740686865778e-07, "epoch": 6.415423790469261, "percentage": 91.64, "elapsed_time": "10:47:40", "remaining_time": "0:59:06"}
1779
+ {"current_steps": 8825, "total_steps": 9625, "loss": 0.1631, "lr": 8.380536626519809e-07, "epoch": 6.4190614769006915, "percentage": 91.69, "elapsed_time": "10:50:28", "remaining_time": "0:58:57"}
1780
+ {"current_steps": 8830, "total_steps": 9625, "loss": 0.1524, "lr": 8.276962714657922e-07, "epoch": 6.422699163332121, "percentage": 91.74, "elapsed_time": "10:53:20", "remaining_time": "0:58:49"}
1781
+ {"current_steps": 8835, "total_steps": 9625, "loss": 0.1603, "lr": 8.174019291887258e-07, "epoch": 6.42633684976355, "percentage": 91.79, "elapsed_time": "10:56:01", "remaining_time": "0:58:39"}
1782
+ {"current_steps": 8840, "total_steps": 9625, "loss": 0.1629, "lr": 8.071706696741466e-07, "epoch": 6.42997453619498, "percentage": 91.84, "elapsed_time": "10:58:43", "remaining_time": "0:58:29"}
1783
+ {"current_steps": 8845, "total_steps": 9625, "loss": 0.1579, "lr": 7.970025265679648e-07, "epoch": 6.43361222262641, "percentage": 91.9, "elapsed_time": "11:01:33", "remaining_time": "0:58:20"}
1784
+ {"current_steps": 8850, "total_steps": 9625, "loss": 0.1646, "lr": 7.868975333085483e-07, "epoch": 6.437249909057839, "percentage": 91.95, "elapsed_time": "11:04:25", "remaining_time": "0:58:11"}
1785
+ {"current_steps": 8855, "total_steps": 9625, "loss": 0.1785, "lr": 7.76855723126575e-07, "epoch": 6.440887595489269, "percentage": 92.0, "elapsed_time": "11:07:14", "remaining_time": "0:58:01"}
1786
+ {"current_steps": 8860, "total_steps": 9625, "loss": 0.1346, "lr": 7.668771290449539e-07, "epoch": 6.444525281920699, "percentage": 92.05, "elapsed_time": "11:09:42", "remaining_time": "0:57:49"}
1787
+ {"current_steps": 8865, "total_steps": 9625, "loss": 0.1501, "lr": 7.569617838787024e-07, "epoch": 6.448162968352128, "percentage": 92.1, "elapsed_time": "11:12:32", "remaining_time": "0:57:39"}
1788
+ {"current_steps": 8870, "total_steps": 9625, "loss": 0.1558, "lr": 7.471097202348377e-07, "epoch": 6.451800654783558, "percentage": 92.16, "elapsed_time": "11:15:27", "remaining_time": "0:57:29"}
1789
+ {"current_steps": 8875, "total_steps": 9625, "loss": 0.1631, "lr": 7.373209705122808e-07, "epoch": 6.455438341214987, "percentage": 92.21, "elapsed_time": "11:18:11", "remaining_time": "0:57:18"}
1790
+ {"current_steps": 8880, "total_steps": 9625, "loss": 0.1606, "lr": 7.275955669017332e-07, "epoch": 6.459076027646417, "percentage": 92.26, "elapsed_time": "11:21:08", "remaining_time": "0:57:08"}
1791
+ {"current_steps": 8885, "total_steps": 9625, "loss": 0.1585, "lr": 7.179335413855893e-07, "epoch": 6.462713714077847, "percentage": 92.31, "elapsed_time": "11:24:11", "remaining_time": "0:56:59"}
1792
+ {"current_steps": 8890, "total_steps": 9625, "loss": 0.1391, "lr": 7.083349257378125e-07, "epoch": 6.466351400509276, "percentage": 92.36, "elapsed_time": "11:27:11", "remaining_time": "0:56:48"}
1793
+ {"current_steps": 8895, "total_steps": 9625, "loss": 0.1427, "lr": 6.987997515238443e-07, "epoch": 6.469989086940705, "percentage": 92.42, "elapsed_time": "11:30:10", "remaining_time": "0:56:38"}
1794
+ {"current_steps": 8900, "total_steps": 9625, "loss": 0.1375, "lr": 6.89328050100504e-07, "epoch": 6.4736267733721355, "percentage": 92.47, "elapsed_time": "11:33:02", "remaining_time": "0:56:27"}
1795
+ {"current_steps": 8905, "total_steps": 9625, "loss": 0.1554, "lr": 6.799198526158668e-07, "epoch": 6.477264459803565, "percentage": 92.52, "elapsed_time": "11:35:31", "remaining_time": "0:56:14"}
1796
+ {"current_steps": 8910, "total_steps": 9625, "loss": 0.1518, "lr": 6.705751900091773e-07, "epoch": 6.480902146234994, "percentage": 92.57, "elapsed_time": "11:38:07", "remaining_time": "0:56:01"}
1797
+ {"current_steps": 8915, "total_steps": 9625, "loss": 0.1646, "lr": 6.612940930107381e-07, "epoch": 6.4845398326664245, "percentage": 92.62, "elapsed_time": "11:40:56", "remaining_time": "0:55:49"}
1798
+ {"current_steps": 8920, "total_steps": 9625, "loss": 0.1665, "lr": 6.520765921418259e-07, "epoch": 6.488177519097854, "percentage": 92.68, "elapsed_time": "11:43:51", "remaining_time": "0:55:37"}
1799
+ {"current_steps": 8925, "total_steps": 9625, "loss": 0.164, "lr": 6.429227177145669e-07, "epoch": 6.491815205529283, "percentage": 92.73, "elapsed_time": "11:46:43", "remaining_time": "0:55:25"}
1800
+ {"current_steps": 8930, "total_steps": 9625, "loss": 0.1604, "lr": 6.33832499831859e-07, "epoch": 6.495452891960713, "percentage": 92.78, "elapsed_time": "11:49:43", "remaining_time": "0:55:14"}
1801
+ {"current_steps": 8935, "total_steps": 9625, "loss": 0.1651, "lr": 6.248059683872476e-07, "epoch": 6.499090578392143, "percentage": 92.83, "elapsed_time": "11:52:42", "remaining_time": "0:55:02"}
1802
+ {"current_steps": 8940, "total_steps": 9625, "loss": 0.1587, "lr": 6.158431530648612e-07, "epoch": 6.502728264823572, "percentage": 92.88, "elapsed_time": "11:55:40", "remaining_time": "0:54:50"}
1803
+ {"current_steps": 8945, "total_steps": 9625, "loss": 0.1631, "lr": 6.069440833392848e-07, "epoch": 6.506365951255002, "percentage": 92.94, "elapsed_time": "11:58:40", "remaining_time": "0:54:38"}
1804
+ {"current_steps": 8950, "total_steps": 9625, "loss": 0.1613, "lr": 5.981087884754711e-07, "epoch": 6.510003637686431, "percentage": 92.99, "elapsed_time": "12:01:40", "remaining_time": "0:54:25"}
1805
+ {"current_steps": 8955, "total_steps": 9625, "loss": 0.1615, "lr": 5.89337297528656e-07, "epoch": 6.513641324117861, "percentage": 93.04, "elapsed_time": "12:04:36", "remaining_time": "0:54:12"}
1806
+ {"current_steps": 8960, "total_steps": 9625, "loss": 0.1584, "lr": 5.806296393442412e-07, "epoch": 6.517279010549291, "percentage": 93.09, "elapsed_time": "12:07:17", "remaining_time": "0:53:58"}
1807
+ {"current_steps": 8965, "total_steps": 9625, "loss": 0.1562, "lr": 5.719858425577251e-07, "epoch": 6.52091669698072, "percentage": 93.14, "elapsed_time": "12:09:59", "remaining_time": "0:53:44"}
1808
+ {"current_steps": 8970, "total_steps": 9625, "loss": 0.1282, "lr": 5.634059355945876e-07, "epoch": 6.52455438341215, "percentage": 93.19, "elapsed_time": "12:12:03", "remaining_time": "0:53:27"}
1809
+ {"current_steps": 8975, "total_steps": 9625, "loss": 0.1566, "lr": 5.548899466702029e-07, "epoch": 6.52819206984358, "percentage": 93.25, "elapsed_time": "12:14:56", "remaining_time": "0:53:13"}
1810
+ {"current_steps": 8980, "total_steps": 9625, "loss": 0.1565, "lr": 5.464379037897539e-07, "epoch": 6.531829756275009, "percentage": 93.3, "elapsed_time": "12:17:35", "remaining_time": "0:52:58"}
1811
+ {"current_steps": 8985, "total_steps": 9625, "loss": 0.1588, "lr": 5.380498347481266e-07, "epoch": 6.535467442706439, "percentage": 93.35, "elapsed_time": "12:20:29", "remaining_time": "0:52:44"}
1812
+ {"current_steps": 8990, "total_steps": 9625, "loss": 0.1531, "lr": 5.297257671298384e-07, "epoch": 6.539105129137869, "percentage": 93.4, "elapsed_time": "12:23:28", "remaining_time": "0:52:30"}
1813
+ {"current_steps": 8995, "total_steps": 9625, "loss": 0.1595, "lr": 5.214657283089208e-07, "epoch": 6.542742815569298, "percentage": 93.45, "elapsed_time": "12:26:22", "remaining_time": "0:52:16"}
1814
+ {"current_steps": 9000, "total_steps": 9625, "loss": 0.1599, "lr": 5.132697454488545e-07, "epoch": 6.546380502000727, "percentage": 93.51, "elapsed_time": "12:29:10", "remaining_time": "0:52:01"}