rbelanec committed on
Commit
cd622dd
·
verified ·
1 Parent(s): 6760379

Training in progress, step 247

Browse files
Files changed (2) hide show
  1. adapter_model.safetensors +1 -1
  2. trainer_log.jsonl +4 -0
adapter_model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:f39a4d0181d83b75bea8d35343fe99264d206f013217af96252cad24c34eccdb
3
  size 335717200
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:7598b118796b1a30bbf291b15efef6a1ddf11a79a29338c929248412495fa19c
3
  size 335717200
trainer_log.jsonl CHANGED
@@ -63,3 +63,7 @@
63
  {"current_steps": 230, "total_steps": 249, "loss": 0.3419, "lr": 9.770669513725128e-07, "epoch": 0.9236947791164659, "percentage": 92.37, "elapsed_time": "0:00:56", "remaining_time": "0:00:04", "throughput": 710.8, "total_tokens": 40336}
64
  {"current_steps": 234, "total_steps": 249, "eval_loss": 0.3496658504009247, "epoch": 0.9397590361445783, "percentage": 93.98, "elapsed_time": "0:00:57", "remaining_time": "0:00:03", "throughput": 710.15, "total_tokens": 41120}
65
  {"current_steps": 235, "total_steps": 249, "loss": 0.3635, "lr": 5.5118059431781e-07, "epoch": 0.9437751004016064, "percentage": 94.38, "elapsed_time": "0:00:59", "remaining_time": "0:00:03", "throughput": 697.74, "total_tokens": 41328}
 
 
 
 
 
63
  {"current_steps": 230, "total_steps": 249, "loss": 0.3419, "lr": 9.770669513725128e-07, "epoch": 0.9236947791164659, "percentage": 92.37, "elapsed_time": "0:00:56", "remaining_time": "0:00:04", "throughput": 710.8, "total_tokens": 40336}
64
  {"current_steps": 234, "total_steps": 249, "eval_loss": 0.3496658504009247, "epoch": 0.9397590361445783, "percentage": 93.98, "elapsed_time": "0:00:57", "remaining_time": "0:00:03", "throughput": 710.15, "total_tokens": 41120}
65
  {"current_steps": 235, "total_steps": 249, "loss": 0.3635, "lr": 5.5118059431781e-07, "epoch": 0.9437751004016064, "percentage": 94.38, "elapsed_time": "0:00:59", "remaining_time": "0:00:03", "throughput": 697.74, "total_tokens": 41328}
66
+ {"current_steps": 240, "total_steps": 249, "loss": 0.3463, "lr": 2.454718665888589e-07, "epoch": 0.963855421686747, "percentage": 96.39, "elapsed_time": "0:00:59", "remaining_time": "0:00:02", "throughput": 707.56, "total_tokens": 42176}
67
+ {"current_steps": 245, "total_steps": 249, "loss": 0.3311, "lr": 6.14434726538493e-08, "epoch": 0.9839357429718876, "percentage": 98.39, "elapsed_time": "0:01:00", "remaining_time": "0:00:00", "throughput": 721.52, "total_tokens": 43312}
68
+ {"current_steps": 247, "total_steps": 249, "eval_loss": 0.3558541238307953, "epoch": 0.9919678714859438, "percentage": 99.2, "elapsed_time": "0:01:00", "remaining_time": "0:00:00", "throughput": 714.9, "total_tokens": 43600}
69
+ {"current_steps": 249, "total_steps": 249, "epoch": 1.0, "percentage": 100.0, "elapsed_time": "0:01:03", "remaining_time": "0:00:00", "throughput": 686.86, "total_tokens": 43904}