esfrankel17 committed on
Commit
d302fcc
·
verified ·
1 Parent(s): 5b44f17

Training in progress, epoch 1

Browse files
model-00001-of-00004.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:b695628be09a643508e52039fa60ef5a85a27ed1211ccf2eece774d03aab7cef
3
  size 4976698672
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:69d34209399e25d8b8bb35a8da61e53a8a64c34bfc0c610309ec772543e7c328
3
  size 4976698672
model-00002-of-00004.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:9d5313703da7b83ddbff33c3a681204ee8ef616a71d4e628fa1c24c69abd7d51
3
  size 4999802720
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a282f30ca1bf34c31d98e7f8aec8605cf9e61dc560571423c7ef1c8fcc1e6b46
3
  size 4999802720
model-00003-of-00004.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:2fa3e4c5a3c16a2016eba49f0f7c43638c11997bf7d7eca038d4b9a9e3c28ff2
3
  size 4915916176
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:76c399cffe60a696d7c46c7cd77ea20f4c5b35376680bf5446d4338a1ad00c87
3
  size 4915916176
model-00004-of-00004.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:117839d6ff043f40f59f225d6a9759c08c62c74d2cc640c62b3207e140856160
3
  size 1168138808
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0d6b869e0c40e2f864fb88d7494640d654b7b7a7288dd158c23a3a8289d21342
3
  size 1168138808
trainer_log.jsonl CHANGED
@@ -2,3 +2,8 @@
2
  {"current_steps": 20, "total_steps": 99, "loss": 0.5275, "learning_rate": 5e-06, "epoch": 0.599250936329588, "percentage": 20.2, "elapsed_time": "0:10:21", "remaining_time": "0:40:53"}
3
  {"current_steps": 30, "total_steps": 99, "loss": 0.4984, "learning_rate": 5e-06, "epoch": 0.898876404494382, "percentage": 30.3, "elapsed_time": "0:15:28", "remaining_time": "0:35:34"}
4
  {"current_steps": 33, "total_steps": 99, "eval_loss": 0.4796934723854065, "epoch": 0.9887640449438202, "percentage": 33.33, "elapsed_time": "0:17:34", "remaining_time": "0:35:09"}
 
 
 
 
 
 
2
  {"current_steps": 20, "total_steps": 99, "loss": 0.5275, "learning_rate": 5e-06, "epoch": 0.599250936329588, "percentage": 20.2, "elapsed_time": "0:10:21", "remaining_time": "0:40:53"}
3
  {"current_steps": 30, "total_steps": 99, "loss": 0.4984, "learning_rate": 5e-06, "epoch": 0.898876404494382, "percentage": 30.3, "elapsed_time": "0:15:28", "remaining_time": "0:35:34"}
4
  {"current_steps": 33, "total_steps": 99, "eval_loss": 0.4796934723854065, "epoch": 0.9887640449438202, "percentage": 33.33, "elapsed_time": "0:17:34", "remaining_time": "0:35:09"}
5
+ {"current_steps": 40, "total_steps": 99, "loss": 0.5026, "learning_rate": 5e-06, "epoch": 1.198501872659176, "percentage": 40.4, "elapsed_time": "0:21:58", "remaining_time": "0:32:24"}
6
+ {"current_steps": 50, "total_steps": 99, "loss": 0.4573, "learning_rate": 5e-06, "epoch": 1.4981273408239701, "percentage": 50.51, "elapsed_time": "0:27:19", "remaining_time": "0:26:46"}
7
+ {"current_steps": 60, "total_steps": 99, "loss": 0.4507, "learning_rate": 5e-06, "epoch": 1.797752808988764, "percentage": 60.61, "elapsed_time": "0:32:30", "remaining_time": "0:21:07"}
8
+ {"current_steps": 66, "total_steps": 99, "eval_loss": 0.4573969542980194, "epoch": 1.9775280898876404, "percentage": 66.67, "elapsed_time": "0:36:19", "remaining_time": "0:18:09"}
9
+ {"current_steps": 70, "total_steps": 99, "loss": 0.4661, "learning_rate": 5e-06, "epoch": 2.097378277153558, "percentage": 70.71, "elapsed_time": "0:39:02", "remaining_time": "0:16:10"}