sedrickkeh commited on
Commit
9e6937c
·
verified ·
1 Parent(s): 3a84096

Training in progress, epoch 1

Browse files
model-00001-of-00004.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:e52c085950f524d749e9bea93d8dfe77432b7f70a71d49ede9350c4d7e4df4c2
3
  size 4976698672
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:4eaae1741a1d0234c89719a2643feadbc868e24f09b0c31241c0d57ac7aebbbe
3
  size 4976698672
model-00002-of-00004.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:724ce38a1eb76d9a4ec0f1a4cc34e8bba57e8be9fde9dc8f0443c210546d7f9a
3
  size 4999802720
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:537c0ba8796466458d7b994096971d4603aac003b0788ba9d8c5cfddf73bdf57
3
  size 4999802720
model-00003-of-00004.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:72f37d71aef6cbee24ba71f7f98cde35edfdf8c8a8b4bd664ac9cf83a76642a9
3
  size 4915916176
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:90b827c366e55055ef35cd22b7289e353919f343bc7d35ed07277fb956750a81
3
  size 4915916176
model-00004-of-00004.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:3634bab91f03c697e8eda9d65bc5373deb7ec7678882c7ad643c83c6d30d9ae6
3
  size 1168138808
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a9ab0769c89106d4b7b4bb69507b68aa558166bed24b174ff6b2e07f33b4f399
3
  size 1168138808
trainer_log.jsonl CHANGED
@@ -2,3 +2,7 @@
2
  {"current_steps": 20, "total_steps": 87, "loss": 1.1183, "lr": 5e-06, "epoch": 0.6866952789699571, "percentage": 22.99, "elapsed_time": "0:19:12", "remaining_time": "1:04:20"}
3
  {"current_steps": 29, "total_steps": 87, "eval_loss": 1.0753060579299927, "epoch": 0.9957081545064378, "percentage": 33.33, "elapsed_time": "0:28:29", "remaining_time": "0:56:58"}
4
  {"current_steps": 30, "total_steps": 87, "loss": 1.1737, "lr": 5e-06, "epoch": 1.0300429184549356, "percentage": 34.48, "elapsed_time": "0:30:27", "remaining_time": "0:57:51"}
 
 
 
 
 
2
  {"current_steps": 20, "total_steps": 87, "loss": 1.1183, "lr": 5e-06, "epoch": 0.6866952789699571, "percentage": 22.99, "elapsed_time": "0:19:12", "remaining_time": "1:04:20"}
3
  {"current_steps": 29, "total_steps": 87, "eval_loss": 1.0753060579299927, "epoch": 0.9957081545064378, "percentage": 33.33, "elapsed_time": "0:28:29", "remaining_time": "0:56:58"}
4
  {"current_steps": 30, "total_steps": 87, "loss": 1.1737, "lr": 5e-06, "epoch": 1.0300429184549356, "percentage": 34.48, "elapsed_time": "0:30:27", "remaining_time": "0:57:51"}
5
+ {"current_steps": 40, "total_steps": 87, "loss": 1.0339, "lr": 5e-06, "epoch": 1.3733905579399142, "percentage": 45.98, "elapsed_time": "0:40:03", "remaining_time": "0:47:03"}
6
+ {"current_steps": 50, "total_steps": 87, "loss": 1.0128, "lr": 5e-06, "epoch": 1.7167381974248928, "percentage": 57.47, "elapsed_time": "0:49:39", "remaining_time": "0:36:44"}
7
+ {"current_steps": 58, "total_steps": 87, "eval_loss": 1.036221981048584, "epoch": 1.9914163090128756, "percentage": 66.67, "elapsed_time": "0:58:04", "remaining_time": "0:29:02"}
8
+ {"current_steps": 60, "total_steps": 87, "loss": 1.0832, "lr": 5e-06, "epoch": 2.060085836909871, "percentage": 68.97, "elapsed_time": "1:00:57", "remaining_time": "0:27:25"}