rbelanec commited on
Commit
acbab24
·
verified ·
1 Parent(s): 8ed6013

Training in progress, step 570

Browse files
Files changed (2) hide show
  1. adapter_model.safetensors +1 -1
  2. trainer_log.jsonl +4 -0
adapter_model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:01829a788bf14537ae6a2717e7cac9de7449292558f3ce12cfd60560f70e4461
3
  size 819328
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:969cc9352ffc9154386dd5904f924bf167d0e8d5c56d417975fee09a659c6a21
3
  size 819328
trainer_log.jsonl CHANGED
@@ -128,3 +128,7 @@
128
  {"current_steps": 550, "total_steps": 570, "loss": 0.0748, "lr": 2.064500424599436e-07, "epoch": 9.649122807017545, "percentage": 96.49, "elapsed_time": "0:02:36", "remaining_time": "0:00:05", "throughput": 2270.36, "total_tokens": 355432}
129
  {"current_steps": 551, "total_steps": 570, "eval_loss": 0.16427111625671387, "epoch": 9.666666666666666, "percentage": 96.67, "elapsed_time": "0:02:37", "remaining_time": "0:00:05", "throughput": 2260.66, "total_tokens": 356456}
130
  {"current_steps": 555, "total_steps": 570, "loss": 0.0861, "lr": 1.1991334092484318e-07, "epoch": 9.736842105263158, "percentage": 97.37, "elapsed_time": "0:02:39", "remaining_time": "0:00:04", "throughput": 2251.5, "total_tokens": 358760}
 
 
 
 
 
128
  {"current_steps": 550, "total_steps": 570, "loss": 0.0748, "lr": 2.064500424599436e-07, "epoch": 9.649122807017545, "percentage": 96.49, "elapsed_time": "0:02:36", "remaining_time": "0:00:05", "throughput": 2270.36, "total_tokens": 355432}
129
  {"current_steps": 551, "total_steps": 570, "eval_loss": 0.16427111625671387, "epoch": 9.666666666666666, "percentage": 96.67, "elapsed_time": "0:02:37", "remaining_time": "0:00:05", "throughput": 2260.66, "total_tokens": 356456}
130
  {"current_steps": 555, "total_steps": 570, "loss": 0.0861, "lr": 1.1991334092484318e-07, "epoch": 9.736842105263158, "percentage": 97.37, "elapsed_time": "0:02:39", "remaining_time": "0:00:04", "throughput": 2251.5, "total_tokens": 358760}
131
+ {"current_steps": 560, "total_steps": 570, "loss": 0.2105, "lr": 5.6701710711626334e-08, "epoch": 9.824561403508772, "percentage": 98.25, "elapsed_time": "0:02:40", "remaining_time": "0:00:02", "throughput": 2256.25, "total_tokens": 362088}
132
+ {"current_steps": 565, "total_steps": 570, "loss": 0.2063, "lr": 1.6874412698408836e-08, "epoch": 9.912280701754385, "percentage": 99.12, "elapsed_time": "0:02:41", "remaining_time": "0:00:01", "throughput": 2261.43, "total_tokens": 365544}
133
+ {"current_steps": 570, "total_steps": 570, "loss": 0.0874, "lr": 4.687849611939576e-10, "epoch": 10.0, "percentage": 100.0, "elapsed_time": "0:02:42", "remaining_time": "0:00:00", "throughput": 2261.78, "total_tokens": 367864}
134
+ {"current_steps": 570, "total_steps": 570, "epoch": 10.0, "percentage": 100.0, "elapsed_time": "0:02:43", "remaining_time": "0:00:00", "throughput": 2250.45, "total_tokens": 367864}