ryanmarten commited on
Commit
a9ed480
·
verified ·
1 Parent(s): 9a0e411

Training in progress, epoch 1

Browse files
model-00001-of-00004.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:457453d8185955d638851af464724c8bbea6f4c3c3bd0ac6734abc942501e4dd
3
  size 4877660776
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:6a303b84070f5c585fec3e860afcc199c8d0cb9200ce1330b95d45c4fd843e9c
3
  size 4877660776
model-00002-of-00004.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:b5a6fa90b330a0a2b6f5a20bc75af1871b3b96ffab0e4e75a4762450c0453b9c
3
  size 4932751008
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:51169d2bf398480aa6e78672e22ee4466c4185a658afadbeffb83bc9531ab598
3
  size 4932751008
model-00003-of-00004.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:111f0eaaaf91145f5674aaf17e1996a41c8b9af7e61be7479d27e22175eda013
3
  size 4330865200
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:4f45d2c5f626a8672934eacf676d79331a6827b62168fe6d8036cf154baeab91
3
  size 4330865200
model-00004-of-00004.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:f5e1aa8993b82e1656b98b84d1fa0b10a222c848cd4ddc61721ef7fdc6a449f4
3
  size 1089994880
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0eaf0c6a76b771275b1305d9d7b5d9c7fd2f33a1071727f9943be04cfe9bfbe2
3
  size 1089994880
trainer_log.jsonl CHANGED
@@ -16,3 +16,13 @@
16
  {"current_steps": 16, "total_steps": 117, "loss": 0.5685, "lr": 9.964234631709188e-06, "epoch": 1.6582278481012658, "percentage": 13.68, "elapsed_time": "0:06:38", "remaining_time": "0:41:56"}
17
  {"current_steps": 17, "total_steps": 117, "loss": 0.5271, "lr": 9.944154131125643e-06, "epoch": 1.759493670886076, "percentage": 14.53, "elapsed_time": "0:06:55", "remaining_time": "0:40:44"}
18
  {"current_steps": 18, "total_steps": 117, "loss": 0.4994, "lr": 9.91964794299315e-06, "epoch": 1.8607594936708862, "percentage": 15.38, "elapsed_time": "0:07:15", "remaining_time": "0:39:53"}
 
 
 
 
 
 
 
 
 
 
 
16
  {"current_steps": 16, "total_steps": 117, "loss": 0.5685, "lr": 9.964234631709188e-06, "epoch": 1.6582278481012658, "percentage": 13.68, "elapsed_time": "0:06:38", "remaining_time": "0:41:56"}
17
  {"current_steps": 17, "total_steps": 117, "loss": 0.5271, "lr": 9.944154131125643e-06, "epoch": 1.759493670886076, "percentage": 14.53, "elapsed_time": "0:06:55", "remaining_time": "0:40:44"}
18
  {"current_steps": 18, "total_steps": 117, "loss": 0.4994, "lr": 9.91964794299315e-06, "epoch": 1.8607594936708862, "percentage": 15.38, "elapsed_time": "0:07:15", "remaining_time": "0:39:53"}
19
+ {"current_steps": 19, "total_steps": 117, "loss": 0.5071, "lr": 9.890738003669029e-06, "epoch": 1.9620253164556962, "percentage": 16.24, "elapsed_time": "0:07:45", "remaining_time": "0:40:01"}
20
+ {"current_steps": 20, "total_steps": 117, "loss": 0.4746, "lr": 9.857450191464337e-06, "epoch": 2.1012658227848102, "percentage": 17.09, "elapsed_time": "0:08:55", "remaining_time": "0:43:17"}
21
+ {"current_steps": 21, "total_steps": 117, "loss": 0.4618, "lr": 9.819814303479268e-06, "epoch": 2.2025316455696204, "percentage": 17.95, "elapsed_time": "0:09:24", "remaining_time": "0:43:02"}
22
+ {"current_steps": 22, "total_steps": 117, "loss": 0.4508, "lr": 9.777864028930705e-06, "epoch": 2.3037974683544302, "percentage": 18.8, "elapsed_time": "0:09:52", "remaining_time": "0:42:39"}
23
+ {"current_steps": 23, "total_steps": 117, "loss": 0.3964, "lr": 9.731636918995821e-06, "epoch": 2.4050632911392404, "percentage": 19.66, "elapsed_time": "0:10:09", "remaining_time": "0:41:29"}
24
+ {"current_steps": 24, "total_steps": 117, "loss": 0.4052, "lr": 9.681174353198687e-06, "epoch": 2.5063291139240507, "percentage": 20.51, "elapsed_time": "0:10:26", "remaining_time": "0:40:29"}
25
+ {"current_steps": 25, "total_steps": 117, "loss": 0.4393, "lr": 9.626521502369984e-06, "epoch": 2.607594936708861, "percentage": 21.37, "elapsed_time": "0:10:53", "remaining_time": "0:40:05"}
26
+ {"current_steps": 26, "total_steps": 117, "loss": 0.4439, "lr": 9.567727288213005e-06, "epoch": 2.708860759493671, "percentage": 22.22, "elapsed_time": "0:11:13", "remaining_time": "0:39:16"}
27
+ {"current_steps": 27, "total_steps": 117, "loss": 0.3915, "lr": 9.504844339512096e-06, "epoch": 2.810126582278481, "percentage": 23.08, "elapsed_time": "0:11:33", "remaining_time": "0:38:31"}
28
+ {"current_steps": 28, "total_steps": 117, "loss": 0.391, "lr": 9.437928945022772e-06, "epoch": 2.911392405063291, "percentage": 23.93, "elapsed_time": "0:11:50", "remaining_time": "0:37:37"}