sedrickkeh commited on
Commit
dd54e27
·
verified ·
1 Parent(s): 2258d57

Training in progress, epoch 2

Browse files
model-00001-of-00004.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:7ed477c72cc1abf6015c6938cf617942a495bdbe2c779bd3eed4c337cb8fb1c8
3
  size 4877660776
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:88d9853b50fedfd085a56b8b5c514828e632b3623fc1032220551e1e02f933e5
3
  size 4877660776
model-00002-of-00004.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:3e316ce6697c0bc17df2a9dfa956d42db895f81c1d7168ef5225cd92d1391332
3
  size 4932751008
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8cf86c6179a5a59d0018e7f3c1eefa8ebeda3cb3743a1104c9749e046b7c43fa
3
  size 4932751008
model-00003-of-00004.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:9c2c6dbed97356bb08e2eef1e7f9a4fe62bade042de87d27ea24831163c5e40b
3
  size 4330865200
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0d4bd59dfac413584c46ea6da76e22303f6710ada932795fa8637807f1441781
3
  size 4330865200
model-00004-of-00004.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:e5c079f18c85ff23962a0b6598fcdefcafb0b50547d5ee434be69dbf78a80058
3
  size 1089994880
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:13067522065f80d18728ddd25e1bcd6cee7e8ae73579daa5a64bdcb0e8351483
3
  size 1089994880
trainer_log.jsonl CHANGED
@@ -19,3 +19,19 @@
19
  {"current_steps": 19, "total_steps": 48, "loss": 0.7302, "lr": 7.604701702439652e-06, "epoch": 1.1875, "percentage": 39.58, "elapsed_time": "0:10:05", "remaining_time": "0:15:24"}
20
  {"current_steps": 20, "total_steps": 48, "loss": 0.8066, "lr": 7.286211616523193e-06, "epoch": 1.25, "percentage": 41.67, "elapsed_time": "0:10:32", "remaining_time": "0:14:45"}
21
  {"current_steps": 21, "total_steps": 48, "loss": 0.7155, "lr": 6.95552360245078e-06, "epoch": 1.3125, "percentage": 43.75, "elapsed_time": "0:10:58", "remaining_time": "0:14:07"}
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
19
  {"current_steps": 19, "total_steps": 48, "loss": 0.7302, "lr": 7.604701702439652e-06, "epoch": 1.1875, "percentage": 39.58, "elapsed_time": "0:10:05", "remaining_time": "0:15:24"}
20
  {"current_steps": 20, "total_steps": 48, "loss": 0.8066, "lr": 7.286211616523193e-06, "epoch": 1.25, "percentage": 41.67, "elapsed_time": "0:10:32", "remaining_time": "0:14:45"}
21
  {"current_steps": 21, "total_steps": 48, "loss": 0.7155, "lr": 6.95552360245078e-06, "epoch": 1.3125, "percentage": 43.75, "elapsed_time": "0:10:58", "remaining_time": "0:14:07"}
22
+ {"current_steps": 22, "total_steps": 48, "loss": 0.7416, "lr": 6.614402023857231e-06, "epoch": 1.375, "percentage": 45.83, "elapsed_time": "0:11:27", "remaining_time": "0:13:32"}
23
+ {"current_steps": 23, "total_steps": 48, "loss": 0.7355, "lr": 6.264666911958404e-06, "epoch": 1.4375, "percentage": 47.92, "elapsed_time": "0:12:00", "remaining_time": "0:13:02"}
24
+ {"current_steps": 24, "total_steps": 48, "loss": 0.7514, "lr": 5.908184254897183e-06, "epoch": 1.5, "percentage": 50.0, "elapsed_time": "0:12:29", "remaining_time": "0:12:29"}
25
+ {"current_steps": 25, "total_steps": 48, "loss": 0.7772, "lr": 5.546856041889374e-06, "epoch": 1.5625, "percentage": 52.08, "elapsed_time": "0:12:57", "remaining_time": "0:11:55"}
26
+ {"current_steps": 26, "total_steps": 48, "loss": 0.7391, "lr": 5.182610115288296e-06, "epoch": 1.625, "percentage": 54.17, "elapsed_time": "0:13:23", "remaining_time": "0:11:19"}
27
+ {"current_steps": 27, "total_steps": 48, "loss": 0.7486, "lr": 4.817389884711706e-06, "epoch": 1.6875, "percentage": 56.25, "elapsed_time": "0:13:54", "remaining_time": "0:10:49"}
28
+ {"current_steps": 28, "total_steps": 48, "loss": 0.7909, "lr": 4.4531439581106295e-06, "epoch": 1.75, "percentage": 58.33, "elapsed_time": "0:14:25", "remaining_time": "0:10:18"}
29
+ {"current_steps": 29, "total_steps": 48, "loss": 0.7535, "lr": 4.091815745102818e-06, "epoch": 1.8125, "percentage": 60.42, "elapsed_time": "0:14:51", "remaining_time": "0:09:44"}
30
+ {"current_steps": 30, "total_steps": 48, "loss": 0.7276, "lr": 3.7353330880415963e-06, "epoch": 1.875, "percentage": 62.5, "elapsed_time": "0:15:15", "remaining_time": "0:09:09"}
31
+ {"current_steps": 31, "total_steps": 48, "loss": 0.7982, "lr": 3.3855979761427705e-06, "epoch": 1.9375, "percentage": 64.58, "elapsed_time": "0:15:43", "remaining_time": "0:08:37"}
32
+ {"current_steps": 32, "total_steps": 48, "loss": 0.7689, "lr": 3.044476397549221e-06, "epoch": 2.0, "percentage": 66.67, "elapsed_time": "0:16:18", "remaining_time": "0:08:09"}
33
+ {"current_steps": 33, "total_steps": 48, "loss": 0.735, "lr": 2.7137883834768076e-06, "epoch": 2.0625, "percentage": 68.75, "elapsed_time": "0:17:38", "remaining_time": "0:08:01"}
34
+ {"current_steps": 34, "total_steps": 48, "loss": 0.772, "lr": 2.3952982975603494e-06, "epoch": 2.125, "percentage": 70.83, "elapsed_time": "0:18:03", "remaining_time": "0:07:26"}
35
+ {"current_steps": 35, "total_steps": 48, "loss": 0.7111, "lr": 2.0907054222102367e-06, "epoch": 2.1875, "percentage": 72.92, "elapsed_time": "0:18:41", "remaining_time": "0:06:56"}
36
+ {"current_steps": 36, "total_steps": 48, "loss": 0.6825, "lr": 1.8016348922055448e-06, "epoch": 2.25, "percentage": 75.0, "elapsed_time": "0:19:13", "remaining_time": "0:06:24"}
37
+ {"current_steps": 37, "total_steps": 48, "loss": 0.6869, "lr": 1.5296290238968303e-06, "epoch": 2.3125, "percentage": 77.08, "elapsed_time": "0:19:45", "remaining_time": "0:05:52"}