ryanmarten commited on
Commit
b55794f
·
verified ·
1 Parent(s): 18a37c9

Training in progress, epoch 1

Browse files
model-00001-of-00004.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:2a9ab982f9b869d2d8a186da68dc8c55c22d245964f43a78ceedb0828f8da23e
3
  size 4877660776
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c047aceced617b70ad4855be47a2c5a5f79882fcb21774e5e8731631c71bd2c8
3
  size 4877660776
model-00002-of-00004.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:52a1e81747f739e8175be42aec6e6248b9270bc069426321556e9fb5db94dc02
3
  size 4932751008
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:179c627c37e4aa8bd199be3e8c60fda72e1907aea286a9c27397460d7142d31c
3
  size 4932751008
model-00003-of-00004.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:4324e908d8bc6d501e8e44782129061b85a29e0a0457c1c241147c532662676a
3
  size 4330865200
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c32e0fe08179101bf2b9c9d4c4a90105454867d96017c1908632fcb3de1e3734
3
  size 4330865200
model-00004-of-00004.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:6ef15342e33894b3ce9ce86a8289bbde59a24b8156782f9be49014a3a4a46ae0
3
  size 1089994880
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:7f90345b36c6ae1c17287ca6d330458e77b86edb42866e2d9be3e11d38ef32ac
3
  size 1089994880
trainer_log.jsonl CHANGED
@@ -16,3 +16,13 @@
16
  {"current_steps": 16, "total_steps": 117, "loss": 0.6258, "lr": 9.964234631709188e-06, "epoch": 1.6582278481012658, "percentage": 13.68, "elapsed_time": "0:07:00", "remaining_time": "0:44:12"}
17
  {"current_steps": 17, "total_steps": 117, "loss": 0.6115, "lr": 9.944154131125643e-06, "epoch": 1.759493670886076, "percentage": 14.53, "elapsed_time": "0:07:20", "remaining_time": "0:43:13"}
18
  {"current_steps": 18, "total_steps": 117, "loss": 0.6621, "lr": 9.91964794299315e-06, "epoch": 1.8607594936708862, "percentage": 15.38, "elapsed_time": "0:07:54", "remaining_time": "0:43:30"}
 
 
 
 
 
 
 
 
 
 
 
16
  {"current_steps": 16, "total_steps": 117, "loss": 0.6258, "lr": 9.964234631709188e-06, "epoch": 1.6582278481012658, "percentage": 13.68, "elapsed_time": "0:07:00", "remaining_time": "0:44:12"}
17
  {"current_steps": 17, "total_steps": 117, "loss": 0.6115, "lr": 9.944154131125643e-06, "epoch": 1.759493670886076, "percentage": 14.53, "elapsed_time": "0:07:20", "remaining_time": "0:43:13"}
18
  {"current_steps": 18, "total_steps": 117, "loss": 0.6621, "lr": 9.91964794299315e-06, "epoch": 1.8607594936708862, "percentage": 15.38, "elapsed_time": "0:07:54", "remaining_time": "0:43:30"}
19
+ {"current_steps": 19, "total_steps": 117, "loss": 0.6426, "lr": 9.890738003669029e-06, "epoch": 1.9620253164556962, "percentage": 16.24, "elapsed_time": "0:08:25", "remaining_time": "0:43:29"}
20
+ {"current_steps": 20, "total_steps": 117, "loss": 0.5377, "lr": 9.857450191464337e-06, "epoch": 2.1012658227848102, "percentage": 17.09, "elapsed_time": "0:09:39", "remaining_time": "0:46:51"}
21
+ {"current_steps": 21, "total_steps": 117, "loss": 0.6157, "lr": 9.819814303479268e-06, "epoch": 2.2025316455696204, "percentage": 17.95, "elapsed_time": "0:10:03", "remaining_time": "0:45:59"}
22
+ {"current_steps": 22, "total_steps": 117, "loss": 0.5267, "lr": 9.777864028930705e-06, "epoch": 2.3037974683544302, "percentage": 18.8, "elapsed_time": "0:10:30", "remaining_time": "0:45:22"}
23
+ {"current_steps": 23, "total_steps": 117, "loss": 0.5002, "lr": 9.731636918995821e-06, "epoch": 2.4050632911392404, "percentage": 19.66, "elapsed_time": "0:10:50", "remaining_time": "0:44:19"}
24
+ {"current_steps": 24, "total_steps": 117, "loss": 0.4973, "lr": 9.681174353198687e-06, "epoch": 2.5063291139240507, "percentage": 20.51, "elapsed_time": "0:11:13", "remaining_time": "0:43:30"}
25
+ {"current_steps": 25, "total_steps": 117, "loss": 0.5686, "lr": 9.626521502369984e-06, "epoch": 2.607594936708861, "percentage": 21.37, "elapsed_time": "0:11:44", "remaining_time": "0:43:13"}
26
+ {"current_steps": 26, "total_steps": 117, "loss": 0.453, "lr": 9.567727288213005e-06, "epoch": 2.708860759493671, "percentage": 22.22, "elapsed_time": "0:12:14", "remaining_time": "0:42:52"}
27
+ {"current_steps": 27, "total_steps": 117, "loss": 0.5362, "lr": 9.504844339512096e-06, "epoch": 2.810126582278481, "percentage": 23.08, "elapsed_time": "0:12:38", "remaining_time": "0:42:09"}
28
+ {"current_steps": 28, "total_steps": 117, "loss": 0.4751, "lr": 9.437928945022772e-06, "epoch": 2.911392405063291, "percentage": 23.93, "elapsed_time": "0:12:57", "remaining_time": "0:41:12"}