rbelanec commited on
Commit
221d28e
·
verified ·
1 Parent(s): e486c2a

Training in progress, step 182

Browse files
Files changed (2) hide show
  1. adapter_model.safetensors +1 -1
  2. trainer_log.jsonl +4 -0
adapter_model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:7bcc6a76bf23dfba6cf601356c3f71909bef09a3af7da0d5008818996b8e4e2a
3
  size 312947112
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b4a73541b3fea040bb83694114c6ef5245d7da0e04edabe3972eb02c93e74026
3
  size 312947112
trainer_log.jsonl CHANGED
@@ -48,3 +48,7 @@
48
  {"current_steps": 175, "total_steps": 249, "loss": 0.494, "lr": 1.2601352710458313e-05, "epoch": 0.7028112449799196, "percentage": 70.28, "elapsed_time": "0:00:46", "remaining_time": "0:00:19", "throughput": 665.81, "total_tokens": 30976}
49
  {"current_steps": 180, "total_steps": 249, "loss": 0.4958, "lr": 1.1110744174509952e-05, "epoch": 0.7228915662650602, "percentage": 72.29, "elapsed_time": "0:00:46", "remaining_time": "0:00:18", "throughput": 676.56, "total_tokens": 31776}
50
  {"current_steps": 182, "total_steps": 249, "eval_loss": 0.5050697922706604, "epoch": 0.7309236947791165, "percentage": 73.09, "elapsed_time": "0:00:48", "remaining_time": "0:00:17", "throughput": 665.65, "total_tokens": 32080}
 
 
 
 
 
48
  {"current_steps": 175, "total_steps": 249, "loss": 0.494, "lr": 1.2601352710458313e-05, "epoch": 0.7028112449799196, "percentage": 70.28, "elapsed_time": "0:00:46", "remaining_time": "0:00:19", "throughput": 665.81, "total_tokens": 30976}
49
  {"current_steps": 180, "total_steps": 249, "loss": 0.4958, "lr": 1.1110744174509952e-05, "epoch": 0.7228915662650602, "percentage": 72.29, "elapsed_time": "0:00:46", "remaining_time": "0:00:18", "throughput": 676.56, "total_tokens": 31776}
50
  {"current_steps": 182, "total_steps": 249, "eval_loss": 0.5050697922706604, "epoch": 0.7309236947791165, "percentage": 73.09, "elapsed_time": "0:00:48", "remaining_time": "0:00:17", "throughput": 665.65, "total_tokens": 32080}
51
+ {"current_steps": 185, "total_steps": 249, "loss": 0.6199, "lr": 9.688407967401248e-06, "epoch": 0.7429718875502008, "percentage": 74.3, "elapsed_time": "0:00:49", "remaining_time": "0:00:17", "throughput": 652.8, "total_tokens": 32608}
52
+ {"current_steps": 190, "total_steps": 249, "loss": 0.6049, "lr": 8.341335551199902e-06, "epoch": 0.7630522088353414, "percentage": 76.31, "elapsed_time": "0:00:50", "remaining_time": "0:00:15", "throughput": 661.82, "total_tokens": 33360}
53
+ {"current_steps": 195, "total_steps": 249, "loss": 0.6547, "lr": 7.076148430479321e-06, "epoch": 0.7831325301204819, "percentage": 78.31, "elapsed_time": "0:00:50", "remaining_time": "0:00:14", "throughput": 671.85, "total_tokens": 34176}
54
+ {"current_steps": 195, "total_steps": 249, "eval_loss": 0.5061560273170471, "epoch": 0.7831325301204819, "percentage": 78.31, "elapsed_time": "0:00:51", "remaining_time": "0:00:14", "throughput": 659.28, "total_tokens": 34176}