rbelanec committed on
Commit
86ef5da
·
verified ·
1 Parent(s): 9a9dff2

Training in progress, step 250

Browse files
Files changed (2) hide show
  1. adapter_model.safetensors +1 -1
  2. trainer_log.jsonl +3 -0
adapter_model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:51ff13d7c0f9f3c84d5a0e7ac194d769d4f52a358e9402de5cec5ecbb30608b6
3
  size 8388736
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:1bbe65086ab6ebbf11a17e3e59a9d020148eed4adc0be84a5b8f187cf682a190
3
  size 8388736
trainer_log.jsonl CHANGED
@@ -55,3 +55,6 @@
55
  {"current_steps": 230, "total_steps": 250, "loss": 0.1016, "lr": 2.134025123396638e-07, "epoch": 4.6, "percentage": 92.0, "elapsed_time": "0:01:10", "remaining_time": "0:00:06", "throughput": 2051.18, "total_tokens": 144960}
56
  {"current_steps": 235, "total_steps": 250, "loss": 0.1449, "lr": 1.2425322847218368e-07, "epoch": 4.7, "percentage": 94.0, "elapsed_time": "0:01:11", "remaining_time": "0:00:04", "throughput": 2068.53, "total_tokens": 147936}
57
  {"current_steps": 240, "total_steps": 250, "loss": 0.1232, "lr": 5.8858092767236084e-08, "epoch": 4.8, "percentage": 96.0, "elapsed_time": "0:01:12", "remaining_time": "0:00:03", "throughput": 2090.66, "total_tokens": 151392}
 
 
 
 
55
  {"current_steps": 230, "total_steps": 250, "loss": 0.1016, "lr": 2.134025123396638e-07, "epoch": 4.6, "percentage": 92.0, "elapsed_time": "0:01:10", "remaining_time": "0:00:06", "throughput": 2051.18, "total_tokens": 144960}
56
  {"current_steps": 235, "total_steps": 250, "loss": 0.1449, "lr": 1.2425322847218368e-07, "epoch": 4.7, "percentage": 94.0, "elapsed_time": "0:01:11", "remaining_time": "0:00:04", "throughput": 2068.53, "total_tokens": 147936}
57
  {"current_steps": 240, "total_steps": 250, "loss": 0.1232, "lr": 5.8858092767236084e-08, "epoch": 4.8, "percentage": 96.0, "elapsed_time": "0:01:12", "remaining_time": "0:00:03", "throughput": 2090.66, "total_tokens": 151392}
58
+ {"current_steps": 245, "total_steps": 250, "loss": 0.1831, "lr": 1.753570375247815e-08, "epoch": 4.9, "percentage": 98.0, "elapsed_time": "0:01:13", "remaining_time": "0:00:01", "throughput": 2107.95, "total_tokens": 154624}
59
+ {"current_steps": 250, "total_steps": 250, "loss": 0.1208, "lr": 4.87379953478806e-10, "epoch": 5.0, "percentage": 100.0, "elapsed_time": "0:01:14", "remaining_time": "0:00:00", "throughput": 2130.97, "total_tokens": 158656}
60
+ {"current_steps": 250, "total_steps": 250, "eval_loss": 0.21456226706504822, "epoch": 5.0, "percentage": 100.0, "elapsed_time": "0:01:15", "remaining_time": "0:00:00", "throughput": 2095.61, "total_tokens": 158656}