penfever commited on
Commit
bcb74ba
·
verified ·
1 Parent(s): f286ddf

Training in progress, step 6600

Browse files
model-00001-of-00004.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:73b80334b2ac74a3be2a997b330af5ed9a7d660a0ebd7b0f25124a29ce83f9f4
3
  size 4902257696
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:86a7d3a3786b2889a78008f687dd50e17c09fb1a08270fd2e40a2f7bcb0fd39d
3
  size 4902257696
model-00002-of-00004.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:c68cbc0ba62c7e3baa8437d0abb9a00cfdd32ad94dcc2c79bddb702656a79c2f
3
  size 4915960368
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f208e6773ca8a295829bd603da52d02e02132d7641f668b325d4acba7a1053e4
3
  size 4915960368
model-00003-of-00004.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:5b832ad2b0e4cb9d347f47b307f2485247a2c962cb34cd503777dbf0d2f963d8
3
  size 4983068496
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:20adcceb360a32c51d9ed77bf6a3ed1b2b33ada1b5f215ce39ef1dac9ff20e39
3
  size 4983068496
model-00004-of-00004.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:1923752abb8851fd785728827d67c921df08a7abafcddb89158bd2b33d285d12
3
  size 1580230264
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5791c4e76d0b449f70f344bde7fa2be0021c61745263a26431b084af26d4e99c
3
  size 1580230264
trainer_log.jsonl CHANGED
@@ -1285,3 +1285,42 @@
1285
  {"current_steps": 6425, "total_steps": 7140, "loss": 0.0738, "lr": 1.2128449453724556e-06, "epoch": 6.299019607843137, "percentage": 89.99, "elapsed_time": "8:32:33", "remaining_time": "0:57:02"}
1286
  {"current_steps": 6430, "total_steps": 7140, "loss": 0.066, "lr": 1.1961352342025135e-06, "epoch": 6.303921568627451, "percentage": 90.06, "elapsed_time": "8:32:50", "remaining_time": "0:56:37"}
1287
  {"current_steps": 6435, "total_steps": 7140, "loss": 0.075, "lr": 1.1795378813467727e-06, "epoch": 6.3088235294117645, "percentage": 90.13, "elapsed_time": "8:33:12", "remaining_time": "0:56:13"}
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1285
  {"current_steps": 6425, "total_steps": 7140, "loss": 0.0738, "lr": 1.2128449453724556e-06, "epoch": 6.299019607843137, "percentage": 89.99, "elapsed_time": "8:32:33", "remaining_time": "0:57:02"}
1286
  {"current_steps": 6430, "total_steps": 7140, "loss": 0.066, "lr": 1.1961352342025135e-06, "epoch": 6.303921568627451, "percentage": 90.06, "elapsed_time": "8:32:50", "remaining_time": "0:56:37"}
1287
  {"current_steps": 6435, "total_steps": 7140, "loss": 0.075, "lr": 1.1795378813467727e-06, "epoch": 6.3088235294117645, "percentage": 90.13, "elapsed_time": "8:33:12", "remaining_time": "0:56:13"}
1288
+ {"current_steps": 6440, "total_steps": 7140, "loss": 0.0926, "lr": 1.1630529859790318e-06, "epoch": 6.313725490196078, "percentage": 90.2, "elapsed_time": "8:33:42", "remaining_time": "0:55:50"}
1289
+ {"current_steps": 6445, "total_steps": 7140, "loss": 0.0882, "lr": 1.1466806466011127e-06, "epoch": 6.318627450980392, "percentage": 90.27, "elapsed_time": "8:34:09", "remaining_time": "0:55:26"}
1290
+ {"current_steps": 6450, "total_steps": 7140, "loss": 0.0675, "lr": 1.1304209610422933e-06, "epoch": 6.323529411764706, "percentage": 90.34, "elapsed_time": "8:34:32", "remaining_time": "0:55:02"}
1291
+ {"current_steps": 6455, "total_steps": 7140, "loss": 0.0654, "lr": 1.1142740264587104e-06, "epoch": 6.328431372549019, "percentage": 90.41, "elapsed_time": "8:34:55", "remaining_time": "0:54:38"}
1292
+ {"current_steps": 6460, "total_steps": 7140, "loss": 0.0736, "lr": 1.0982399393327813e-06, "epoch": 6.333333333333333, "percentage": 90.48, "elapsed_time": "8:35:22", "remaining_time": "0:54:14"}
1293
+ {"current_steps": 6465, "total_steps": 7140, "loss": 0.0786, "lr": 1.0823187954726322e-06, "epoch": 6.338235294117647, "percentage": 90.55, "elapsed_time": "8:35:46", "remaining_time": "0:53:51"}
1294
+ {"current_steps": 6470, "total_steps": 7140, "loss": 0.0706, "lr": 1.0665106900115174e-06, "epoch": 6.3431372549019605, "percentage": 90.62, "elapsed_time": "8:36:12", "remaining_time": "0:53:27"}
1295
+ {"current_steps": 6475, "total_steps": 7140, "loss": 0.072, "lr": 1.0508157174072563e-06, "epoch": 6.348039215686274, "percentage": 90.69, "elapsed_time": "8:36:31", "remaining_time": "0:53:02"}
1296
+ {"current_steps": 6480, "total_steps": 7140, "loss": 0.0792, "lr": 1.0352339714416715e-06, "epoch": 6.352941176470588, "percentage": 90.76, "elapsed_time": "8:36:57", "remaining_time": "0:52:39"}
1297
+ {"current_steps": 6485, "total_steps": 7140, "loss": 0.0916, "lr": 1.0197655452200172e-06, "epoch": 6.357843137254902, "percentage": 90.83, "elapsed_time": "8:37:17", "remaining_time": "0:52:14"}
1298
+ {"current_steps": 6490, "total_steps": 7140, "loss": 0.0762, "lr": 1.0044105311704455e-06, "epoch": 6.362745098039215, "percentage": 90.9, "elapsed_time": "8:37:40", "remaining_time": "0:51:50"}
1299
+ {"current_steps": 6495, "total_steps": 7140, "loss": 0.0756, "lr": 9.891690210434235e-07, "epoch": 6.367647058823529, "percentage": 90.97, "elapsed_time": "8:37:55", "remaining_time": "0:51:26"}
1300
+ {"current_steps": 6500, "total_steps": 7140, "loss": 0.0996, "lr": 9.740411059112031e-07, "epoch": 6.372549019607844, "percentage": 91.04, "elapsed_time": "8:38:20", "remaining_time": "0:51:02"}
1301
+ {"current_steps": 6505, "total_steps": 7140, "loss": 0.0713, "lr": 9.590268761672838e-07, "epoch": 6.377450980392156, "percentage": 91.11, "elapsed_time": "8:38:44", "remaining_time": "0:50:38"}
1302
+ {"current_steps": 6510, "total_steps": 7140, "loss": 0.0798, "lr": 9.441264215258595e-07, "epoch": 6.382352941176471, "percentage": 91.18, "elapsed_time": "8:39:07", "remaining_time": "0:50:14"}
1303
+ {"current_steps": 6515, "total_steps": 7140, "loss": 0.0781, "lr": 9.293398310212831e-07, "epoch": 6.387254901960785, "percentage": 91.25, "elapsed_time": "8:39:22", "remaining_time": "0:49:49"}
1304
+ {"current_steps": 6520, "total_steps": 7140, "loss": 0.0792, "lr": 9.146671930075412e-07, "epoch": 6.392156862745098, "percentage": 91.32, "elapsed_time": "8:39:47", "remaining_time": "0:49:25"}
1305
+ {"current_steps": 6525, "total_steps": 7140, "loss": 0.0713, "lr": 9.00108595157716e-07, "epoch": 6.397058823529412, "percentage": 91.39, "elapsed_time": "8:40:03", "remaining_time": "0:49:01"}
1306
+ {"current_steps": 6530, "total_steps": 7140, "loss": 0.0764, "lr": 8.856641244634767e-07, "epoch": 6.401960784313726, "percentage": 91.46, "elapsed_time": "8:40:23", "remaining_time": "0:48:36"}
1307
+ {"current_steps": 6535, "total_steps": 7140, "loss": 0.0709, "lr": 8.713338672345451e-07, "epoch": 6.4068627450980395, "percentage": 91.53, "elapsed_time": "8:40:45", "remaining_time": "0:48:12"}
1308
+ {"current_steps": 6540, "total_steps": 7140, "loss": 0.0751, "lr": 8.571179090981885e-07, "epoch": 6.411764705882353, "percentage": 91.6, "elapsed_time": "8:41:02", "remaining_time": "0:47:48"}
1309
+ {"current_steps": 6545, "total_steps": 7140, "loss": 0.0851, "lr": 8.430163349987075e-07, "epoch": 6.416666666666667, "percentage": 91.67, "elapsed_time": "8:41:21", "remaining_time": "0:47:23"}
1310
+ {"current_steps": 6550, "total_steps": 7140, "loss": 0.0824, "lr": 8.290292291969226e-07, "epoch": 6.421568627450981, "percentage": 91.74, "elapsed_time": "8:41:44", "remaining_time": "0:46:59"}
1311
+ {"current_steps": 6555, "total_steps": 7140, "loss": 0.0776, "lr": 8.151566752696704e-07, "epoch": 6.426470588235294, "percentage": 91.81, "elapsed_time": "8:42:11", "remaining_time": "0:46:36"}
1312
+ {"current_steps": 6560, "total_steps": 7140, "loss": 0.0795, "lr": 8.013987561093217e-07, "epoch": 6.431372549019608, "percentage": 91.88, "elapsed_time": "8:42:35", "remaining_time": "0:46:12"}
1313
+ {"current_steps": 6565, "total_steps": 7140, "loss": 0.0777, "lr": 7.877555539232551e-07, "epoch": 6.436274509803922, "percentage": 91.95, "elapsed_time": "8:42:53", "remaining_time": "0:45:47"}
1314
+ {"current_steps": 6570, "total_steps": 7140, "loss": 0.0738, "lr": 7.742271502333998e-07, "epoch": 6.4411764705882355, "percentage": 92.02, "elapsed_time": "8:43:14", "remaining_time": "0:45:23"}
1315
+ {"current_steps": 6575, "total_steps": 7140, "loss": 0.0748, "lr": 7.608136258757248e-07, "epoch": 6.446078431372549, "percentage": 92.09, "elapsed_time": "8:43:31", "remaining_time": "0:44:59"}
1316
+ {"current_steps": 6580, "total_steps": 7140, "loss": 0.0766, "lr": 7.475150609997595e-07, "epoch": 6.450980392156863, "percentage": 92.16, "elapsed_time": "8:43:58", "remaining_time": "0:44:35"}
1317
+ {"current_steps": 6585, "total_steps": 7140, "loss": 0.0809, "lr": 7.343315350681246e-07, "epoch": 6.455882352941177, "percentage": 92.23, "elapsed_time": "8:44:20", "remaining_time": "0:44:11"}
1318
+ {"current_steps": 6590, "total_steps": 7140, "loss": 0.0737, "lr": 7.212631268560466e-07, "epoch": 6.46078431372549, "percentage": 92.3, "elapsed_time": "8:44:40", "remaining_time": "0:43:47"}
1319
+ {"current_steps": 6595, "total_steps": 7140, "loss": 0.07, "lr": 7.083099144508976e-07, "epoch": 6.465686274509804, "percentage": 92.37, "elapsed_time": "8:44:57", "remaining_time": "0:43:22"}
1320
+ {"current_steps": 6600, "total_steps": 7140, "loss": 0.0676, "lr": 6.95471975251718e-07, "epoch": 6.470588235294118, "percentage": 92.44, "elapsed_time": "8:45:17", "remaining_time": "0:42:58"}
1321
+ {"current_steps": 6605, "total_steps": 7140, "loss": 0.0685, "lr": 6.827493859687572e-07, "epoch": 6.4754901960784315, "percentage": 92.51, "elapsed_time": "8:46:34", "remaining_time": "0:42:39"}
1322
+ {"current_steps": 6610, "total_steps": 7140, "loss": 0.0721, "lr": 6.701422226230225e-07, "epoch": 6.480392156862745, "percentage": 92.58, "elapsed_time": "8:46:59", "remaining_time": "0:42:15"}
1323
+ {"current_steps": 6615, "total_steps": 7140, "loss": 0.0744, "lr": 6.57650560545815e-07, "epoch": 6.485294117647059, "percentage": 92.65, "elapsed_time": "8:47:27", "remaining_time": "0:41:51"}
1324
+ {"current_steps": 6620, "total_steps": 7140, "loss": 0.0733, "lr": 6.452744743782835e-07, "epoch": 6.490196078431373, "percentage": 92.72, "elapsed_time": "8:47:42", "remaining_time": "0:41:27"}
1325
+ {"current_steps": 6625, "total_steps": 7140, "loss": 0.0712, "lr": 6.330140380709826e-07, "epoch": 6.495098039215686, "percentage": 92.79, "elapsed_time": "8:48:03", "remaining_time": "0:41:02"}
1326
+ {"current_steps": 6630, "total_steps": 7140, "loss": 0.0828, "lr": 6.208693248834241e-07, "epoch": 6.5, "percentage": 92.86, "elapsed_time": "8:48:25", "remaining_time": "0:40:38"}