rbelanec commited on
Commit
567a556
verified
1 Parent(s): cf07cc7

Training in progress, step 221

Browse files
Files changed (2) hide show
  1. adapter_model.safetensors +1 -1
  2. trainer_log.jsonl +3 -0
adapter_model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:997774bf8b11eca81554198a1869b51edceac75e57ee798aee8c37dc441eeafe
3
  size 312947112
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c1f41d907e743b9486bd6bdd45c5b3600a59054e65f165c52b7f8cf15e44577b
3
  size 312947112
trainer_log.jsonl CHANGED
@@ -58,3 +58,6 @@
58
  {"current_steps": 210, "total_steps": 249, "loss": 0.553, "lr": 3.831895019292897e-06, "epoch": 0.8433734939759037, "percentage": 84.34, "elapsed_time": "0:00:57", "remaining_time": "0:00:10", "throughput": 643.63, "total_tokens": 36848}
59
  {"current_steps": 215, "total_steps": 249, "loss": 0.5892, "lr": 2.9519683912911266e-06, "epoch": 0.8634538152610441, "percentage": 86.35, "elapsed_time": "0:00:57", "remaining_time": "0:00:09", "throughput": 655.44, "total_tokens": 37888}
60
  {"current_steps": 220, "total_steps": 249, "loss": 0.5174, "lr": 2.1804183734670277e-06, "epoch": 0.8835341365461847, "percentage": 88.35, "elapsed_time": "0:00:58", "remaining_time": "0:00:07", "throughput": 664.72, "total_tokens": 38768}
 
 
 
 
58
  {"current_steps": 210, "total_steps": 249, "loss": 0.553, "lr": 3.831895019292897e-06, "epoch": 0.8433734939759037, "percentage": 84.34, "elapsed_time": "0:00:57", "remaining_time": "0:00:10", "throughput": 643.63, "total_tokens": 36848}
59
  {"current_steps": 215, "total_steps": 249, "loss": 0.5892, "lr": 2.9519683912911266e-06, "epoch": 0.8634538152610441, "percentage": 86.35, "elapsed_time": "0:00:57", "remaining_time": "0:00:09", "throughput": 655.44, "total_tokens": 37888}
60
  {"current_steps": 220, "total_steps": 249, "loss": 0.5174, "lr": 2.1804183734670277e-06, "epoch": 0.8835341365461847, "percentage": 88.35, "elapsed_time": "0:00:58", "remaining_time": "0:00:07", "throughput": 664.72, "total_tokens": 38768}
61
+ {"current_steps": 221, "total_steps": 249, "eval_loss": 0.4947091042995453, "epoch": 0.8875502008032129, "percentage": 88.76, "elapsed_time": "0:00:59", "remaining_time": "0:00:07", "throughput": 654.97, "total_tokens": 38912}
62
+ {"current_steps": 225, "total_steps": 249, "loss": 0.6159, "lr": 1.5210375028143097e-06, "epoch": 0.9036144578313253, "percentage": 90.36, "elapsed_time": "0:01:01", "remaining_time": "0:00:06", "throughput": 645.49, "total_tokens": 39488}
63
+ {"current_steps": 230, "total_steps": 249, "loss": 0.5318, "lr": 9.770669513725128e-07, "epoch": 0.9236947791164659, "percentage": 92.37, "elapsed_time": "0:01:01", "remaining_time": "0:00:05", "throughput": 654.32, "total_tokens": 40336}