penfever commited on
Commit
86b27fe
·
verified ·
1 Parent(s): 6f6ccd9

Training in progress, step 7140

Browse files
model-00001-of-00004.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:e2cb317cc96bcc57b04a9c2601cdfbc2c8bc9be9727d6c2d98ebbbd69c120f48
3
  size 4902257696
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b649e1931e5a91c597ad961e8916767634ff3dbda93c1df435500de889e7cc02
3
  size 4902257696
model-00002-of-00004.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:f082d03c737a10944c4631d3cfa75cd73dd8d5705a106aeef0541a1a5ea3059e
3
  size 4915960368
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0e54e0168e6d72b7671a2e54ac50bd5366d68634694ee35220d14ddfaa411d5b
3
  size 4915960368
model-00003-of-00004.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:0d45669fcaf1ebfb6f3f202497c0dcfe4a382e76aaa73a19bc6c4be067d2e3ee
3
  size 4983068496
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:cddbf690c9a0a6adc3f66d7c744e86f15c4d373bf7e303742d81d2da31e2e303
3
  size 4983068496
model-00004-of-00004.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:1ee4b5d127cbb138b272466b41f64e5ecca80769fdcdbab6c314c7bbe5603c77
3
  size 1580230264
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:6114d729a4cc91441e7e95cb5910afe18e509bde87b09173a1f35a952fe810b1
3
  size 1580230264
trainer_log.jsonl CHANGED
@@ -1404,3 +1404,26 @@
1404
  {"current_steps": 7020, "total_steps": 7140, "loss": 0.0831, "lr": 3.4983430440149733e-08, "epoch": 6.882352941176471, "percentage": 98.32, "elapsed_time": "9:20:27", "remaining_time": "0:09:34"}
1405
  {"current_steps": 7025, "total_steps": 7140, "loss": 0.0764, "lr": 3.215273213988734e-08, "epoch": 6.887254901960784, "percentage": 98.39, "elapsed_time": "9:20:48", "remaining_time": "0:09:10"}
1406
  {"current_steps": 7030, "total_steps": 7140, "loss": 0.0719, "lr": 2.9441347272543e-08, "epoch": 6.892156862745098, "percentage": 98.46, "elapsed_time": "9:21:05", "remaining_time": "0:08:46"}
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1404
  {"current_steps": 7020, "total_steps": 7140, "loss": 0.0831, "lr": 3.4983430440149733e-08, "epoch": 6.882352941176471, "percentage": 98.32, "elapsed_time": "9:20:27", "remaining_time": "0:09:34"}
1405
  {"current_steps": 7025, "total_steps": 7140, "loss": 0.0764, "lr": 3.215273213988734e-08, "epoch": 6.887254901960784, "percentage": 98.39, "elapsed_time": "9:20:48", "remaining_time": "0:09:10"}
1406
  {"current_steps": 7030, "total_steps": 7140, "loss": 0.0719, "lr": 2.9441347272543e-08, "epoch": 6.892156862745098, "percentage": 98.46, "elapsed_time": "9:21:05", "remaining_time": "0:08:46"}
1407
+ {"current_steps": 7035, "total_steps": 7140, "loss": 0.0685, "lr": 2.6849292039390352e-08, "epoch": 6.897058823529412, "percentage": 98.53, "elapsed_time": "9:21:28", "remaining_time": "0:08:22"}
1408
+ {"current_steps": 7040, "total_steps": 7140, "loss": 0.0931, "lr": 2.4376581928682307e-08, "epoch": 6.901960784313726, "percentage": 98.6, "elapsed_time": "9:21:43", "remaining_time": "0:07:58"}
1409
+ {"current_steps": 7045, "total_steps": 7140, "loss": 0.0721, "lr": 2.2023231715546655e-08, "epoch": 6.9068627450980395, "percentage": 98.67, "elapsed_time": "9:22:05", "remaining_time": "0:07:34"}
1410
+ {"current_steps": 7050, "total_steps": 7140, "loss": 0.0809, "lr": 1.9789255461906132e-08, "epoch": 6.911764705882353, "percentage": 98.74, "elapsed_time": "9:22:29", "remaining_time": "0:07:10"}
1411
+ {"current_steps": 7055, "total_steps": 7140, "loss": 0.0718, "lr": 1.7674666516387383e-08, "epoch": 6.916666666666667, "percentage": 98.81, "elapsed_time": "9:22:55", "remaining_time": "0:06:46"}
1412
+ {"current_steps": 7060, "total_steps": 7140, "loss": 0.0735, "lr": 1.56794775142477e-08, "epoch": 6.921568627450981, "percentage": 98.88, "elapsed_time": "9:23:16", "remaining_time": "0:06:22"}
1413
+ {"current_steps": 7065, "total_steps": 7140, "loss": 0.0717, "lr": 1.380370037729728e-08, "epoch": 6.926470588235294, "percentage": 98.95, "elapsed_time": "9:23:33", "remaining_time": "0:05:58"}
1414
+ {"current_steps": 7070, "total_steps": 7140, "loss": 0.0862, "lr": 1.204734631382154e-08, "epoch": 6.931372549019608, "percentage": 99.02, "elapsed_time": "9:23:58", "remaining_time": "0:05:35"}
1415
+ {"current_steps": 7075, "total_steps": 7140, "loss": 0.0749, "lr": 1.0410425818525582e-08, "epoch": 6.936274509803922, "percentage": 99.09, "elapsed_time": "9:24:21", "remaining_time": "0:05:11"}
1416
+ {"current_steps": 7080, "total_steps": 7140, "loss": 0.078, "lr": 8.892948672465373e-09, "epoch": 6.9411764705882355, "percentage": 99.16, "elapsed_time": "9:24:46", "remaining_time": "0:04:47"}
1417
+ {"current_steps": 7085, "total_steps": 7140, "loss": 0.0689, "lr": 7.494923942985566e-09, "epoch": 6.946078431372549, "percentage": 99.23, "elapsed_time": "9:25:08", "remaining_time": "0:04:23"}
1418
+ {"current_steps": 7090, "total_steps": 7140, "loss": 0.0725, "lr": 6.216359983675091e-09, "epoch": 6.950980392156863, "percentage": 99.3, "elapsed_time": "9:25:33", "remaining_time": "0:03:59"}
1419
+ {"current_steps": 7095, "total_steps": 7140, "loss": 0.0747, "lr": 5.057264434307208e-09, "epoch": 6.955882352941177, "percentage": 99.37, "elapsed_time": "9:25:50", "remaining_time": "0:03:35"}
1420
+ {"current_steps": 7100, "total_steps": 7140, "loss": 0.0685, "lr": 4.017644220797312e-09, "epoch": 6.96078431372549, "percentage": 99.44, "elapsed_time": "9:26:08", "remaining_time": "0:03:11"}
1421
+ {"current_steps": 7105, "total_steps": 7140, "loss": 0.071, "lr": 3.097505555169633e-09, "epoch": 6.965686274509804, "percentage": 99.51, "elapsed_time": "9:26:29", "remaining_time": "0:02:47"}
1422
+ {"current_steps": 7110, "total_steps": 7140, "loss": 0.0641, "lr": 2.2968539355061603e-09, "epoch": 6.970588235294118, "percentage": 99.58, "elapsed_time": "9:26:52", "remaining_time": "0:02:23"}
1423
+ {"current_steps": 7115, "total_steps": 7140, "loss": 0.0748, "lr": 1.6156941459222197e-09, "epoch": 6.9754901960784315, "percentage": 99.65, "elapsed_time": "9:27:14", "remaining_time": "0:01:59"}
1424
+ {"current_steps": 7120, "total_steps": 7140, "loss": 0.0655, "lr": 1.0540302565376081e-09, "epoch": 6.980392156862745, "percentage": 99.72, "elapsed_time": "9:27:43", "remaining_time": "0:01:35"}
1425
+ {"current_steps": 7125, "total_steps": 7140, "loss": 0.071, "lr": 6.118656234499476e-10, "epoch": 6.985294117647059, "percentage": 99.79, "elapsed_time": "9:28:20", "remaining_time": "0:01:11"}
1426
+ {"current_steps": 7130, "total_steps": 7140, "loss": 0.0717, "lr": 2.892028887147014e-10, "epoch": 6.990196078431373, "percentage": 99.86, "elapsed_time": "9:28:45", "remaining_time": "0:00:47"}
1427
+ {"current_steps": 7135, "total_steps": 7140, "loss": 0.0967, "lr": 8.604398032963091e-11, "epoch": 6.995098039215686, "percentage": 99.93, "elapsed_time": "9:29:11", "remaining_time": "0:00:23"}
1428
+ {"current_steps": 7140, "total_steps": 7140, "loss": 0.0753, "lr": 2.3901122303549018e-12, "epoch": 7.0, "percentage": 100.0, "elapsed_time": "9:29:30", "remaining_time": "0:00:00"}
1429
+ {"current_steps": 7140, "total_steps": 7140, "epoch": 7.0, "percentage": 100.0, "elapsed_time": "9:30:31", "remaining_time": "0:00:00"}