sedrickkeh commited on
Commit
8d21006
·
verified ·
1 Parent(s): d8b4047

Training in progress, epoch 1

Browse files
model-00001-of-00004.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:8b1465c11b2c99d4b6b474dbd8dfabc5434db1adc30fe36edb02593560b872f1
3
  size 4877660776
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e1f26d066bb6cf52c187390bc0d9f284deae93d17fb3f6d1d50dc2ba798f8b2b
3
  size 4877660776
model-00002-of-00004.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:996f637530d5b5b4ca55139c41f3c918698db39ced6bc6fb62eadc0307346358
3
  size 4932751008
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0f3cd73dbe75492e0217884a456f781a074cdcc315257f8144fde0fc462dfe59
3
  size 4932751008
model-00003-of-00004.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:0906c1ce2f0d9a6c488f777b0494e64f13811f71f4659f1dee3129c693b2f3a9
3
  size 4330865200
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ae016ecd6a3e80e702c7c025705017e8ab2224265952dc652bbb49c7b1ba033a
3
  size 4330865200
model-00004-of-00004.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:ea9c7a0ec004d138aa155b6892ec30ffb623478291ac235d69055c541f7730c3
3
  size 1089994880
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:7a34edd4b5b1e690f2f0f38a809d60a94d3a635af44523b39cdfb38e99545065
3
  size 1089994880
trainer_log.jsonl CHANGED
@@ -14,3 +14,13 @@
14
  {"current_steps": 14, "total_steps": 30, "loss": 0.7208, "lr": 6.434016163555452e-06, "epoch": 1.34375, "percentage": 46.67, "elapsed_time": "0:07:06", "remaining_time": "0:08:07"}
15
  {"current_steps": 15, "total_steps": 30, "loss": 0.768, "lr": 5.8682408883346535e-06, "epoch": 1.4375, "percentage": 50.0, "elapsed_time": "0:07:37", "remaining_time": "0:07:37"}
16
  {"current_steps": 16, "total_steps": 30, "loss": 0.7986, "lr": 5.290724144552379e-06, "epoch": 1.53125, "percentage": 53.33, "elapsed_time": "0:08:06", "remaining_time": "0:07:05"}
 
 
 
 
 
 
 
 
 
 
 
14
  {"current_steps": 14, "total_steps": 30, "loss": 0.7208, "lr": 6.434016163555452e-06, "epoch": 1.34375, "percentage": 46.67, "elapsed_time": "0:07:06", "remaining_time": "0:08:07"}
15
  {"current_steps": 15, "total_steps": 30, "loss": 0.768, "lr": 5.8682408883346535e-06, "epoch": 1.4375, "percentage": 50.0, "elapsed_time": "0:07:37", "remaining_time": "0:07:37"}
16
  {"current_steps": 16, "total_steps": 30, "loss": 0.7986, "lr": 5.290724144552379e-06, "epoch": 1.53125, "percentage": 53.33, "elapsed_time": "0:08:06", "remaining_time": "0:07:05"}
17
+ {"current_steps": 17, "total_steps": 30, "loss": 0.6939, "lr": 4.7092758554476215e-06, "epoch": 1.625, "percentage": 56.67, "elapsed_time": "0:08:41", "remaining_time": "0:06:38"}
18
+ {"current_steps": 18, "total_steps": 30, "loss": 0.7287, "lr": 4.131759111665349e-06, "epoch": 1.71875, "percentage": 60.0, "elapsed_time": "0:09:09", "remaining_time": "0:06:06"}
19
+ {"current_steps": 19, "total_steps": 30, "loss": 0.7368, "lr": 3.5659838364445505e-06, "epoch": 1.8125, "percentage": 63.33, "elapsed_time": "0:09:34", "remaining_time": "0:05:32"}
20
+ {"current_steps": 20, "total_steps": 30, "loss": 0.6756, "lr": 3.019601169804216e-06, "epoch": 1.90625, "percentage": 66.67, "elapsed_time": "0:10:01", "remaining_time": "0:05:00"}
21
+ {"current_steps": 21, "total_steps": 30, "loss": 1.1922, "lr": 2.5000000000000015e-06, "epoch": 2.03125, "percentage": 70.0, "elapsed_time": "0:11:14", "remaining_time": "0:04:48"}
22
+ {"current_steps": 22, "total_steps": 30, "loss": 0.6695, "lr": 2.0142070414860704e-06, "epoch": 2.125, "percentage": 73.33, "elapsed_time": "0:11:46", "remaining_time": "0:04:16"}
23
+ {"current_steps": 23, "total_steps": 30, "loss": 0.6786, "lr": 1.5687918106563326e-06, "epoch": 2.21875, "percentage": 76.67, "elapsed_time": "0:12:09", "remaining_time": "0:03:42"}
24
+ {"current_steps": 24, "total_steps": 30, "loss": 0.7032, "lr": 1.1697777844051105e-06, "epoch": 2.3125, "percentage": 80.0, "elapsed_time": "0:12:35", "remaining_time": "0:03:08"}
25
+ {"current_steps": 25, "total_steps": 30, "loss": 0.6561, "lr": 8.225609429353187e-07, "epoch": 2.40625, "percentage": 83.33, "elapsed_time": "0:13:07", "remaining_time": "0:02:37"}
26
+ {"current_steps": 26, "total_steps": 30, "loss": 0.6628, "lr": 5.318367983829393e-07, "epoch": 2.5, "percentage": 86.67, "elapsed_time": "0:13:30", "remaining_time": "0:02:04"}