rbelanec
/

train_cb_42_1760636478

Model card · Files and versions

rbelanec committed on Oct 16, 2025

Commit

86ef5da

·

verified ·

1 Parent(s): 9a9dff2

Training in progress, step 250

Files changed (2) hide show

adapter_model.safetensors +1 -1
trainer_log.jsonl +3 -0

adapter_model.safetensors CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:51ff13d7c0f9f3c84d5a0e7ac194d769d4f52a358e9402de5cec5ecbb30608b6
 size 8388736

 version https://git-lfs.github.com/spec/v1
+oid sha256:1bbe65086ab6ebbf11a17e3e59a9d020148eed4adc0be84a5b8f187cf682a190
 size 8388736

trainer_log.jsonl CHANGED Viewed

@@ -55,3 +55,6 @@
 {"current_steps": 230, "total_steps": 250, "loss": 0.1016, "lr": 2.134025123396638e-07, "epoch": 4.6, "percentage": 92.0, "elapsed_time": "0:01:10", "remaining_time": "0:00:06", "throughput": 2051.18, "total_tokens": 144960}
 {"current_steps": 235, "total_steps": 250, "loss": 0.1449, "lr": 1.2425322847218368e-07, "epoch": 4.7, "percentage": 94.0, "elapsed_time": "0:01:11", "remaining_time": "0:00:04", "throughput": 2068.53, "total_tokens": 147936}
 {"current_steps": 240, "total_steps": 250, "loss": 0.1232, "lr": 5.8858092767236084e-08, "epoch": 4.8, "percentage": 96.0, "elapsed_time": "0:01:12", "remaining_time": "0:00:03", "throughput": 2090.66, "total_tokens": 151392}

 {"current_steps": 230, "total_steps": 250, "loss": 0.1016, "lr": 2.134025123396638e-07, "epoch": 4.6, "percentage": 92.0, "elapsed_time": "0:01:10", "remaining_time": "0:00:06", "throughput": 2051.18, "total_tokens": 144960}
 {"current_steps": 235, "total_steps": 250, "loss": 0.1449, "lr": 1.2425322847218368e-07, "epoch": 4.7, "percentage": 94.0, "elapsed_time": "0:01:11", "remaining_time": "0:00:04", "throughput": 2068.53, "total_tokens": 147936}
 {"current_steps": 240, "total_steps": 250, "loss": 0.1232, "lr": 5.8858092767236084e-08, "epoch": 4.8, "percentage": 96.0, "elapsed_time": "0:01:12", "remaining_time": "0:00:03", "throughput": 2090.66, "total_tokens": 151392}
+{"current_steps": 245, "total_steps": 250, "loss": 0.1831, "lr": 1.753570375247815e-08, "epoch": 4.9, "percentage": 98.0, "elapsed_time": "0:01:13", "remaining_time": "0:00:01", "throughput": 2107.95, "total_tokens": 154624}
+{"current_steps": 250, "total_steps": 250, "loss": 0.1208, "lr": 4.87379953478806e-10, "epoch": 5.0, "percentage": 100.0, "elapsed_time": "0:01:14", "remaining_time": "0:00:00", "throughput": 2130.97, "total_tokens": 158656}
+{"current_steps": 250, "total_steps": 250, "eval_loss": 0.21456226706504822, "epoch": 5.0, "percentage": 100.0, "elapsed_time": "0:01:15", "remaining_time": "0:00:00", "throughput": 2095.61, "total_tokens": 158656}