Training in progress, step 250
Browse files- adapter_model.safetensors +1 -1
- trainer_log.jsonl +3 -0
adapter_model.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 8388736
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:1bbe65086ab6ebbf11a17e3e59a9d020148eed4adc0be84a5b8f187cf682a190
|
| 3 |
size 8388736
|
trainer_log.jsonl
CHANGED
|
@@ -55,3 +55,6 @@
|
|
| 55 |
{"current_steps": 230, "total_steps": 250, "loss": 0.1016, "lr": 2.134025123396638e-07, "epoch": 4.6, "percentage": 92.0, "elapsed_time": "0:01:10", "remaining_time": "0:00:06", "throughput": 2051.18, "total_tokens": 144960}
|
| 56 |
{"current_steps": 235, "total_steps": 250, "loss": 0.1449, "lr": 1.2425322847218368e-07, "epoch": 4.7, "percentage": 94.0, "elapsed_time": "0:01:11", "remaining_time": "0:00:04", "throughput": 2068.53, "total_tokens": 147936}
|
| 57 |
{"current_steps": 240, "total_steps": 250, "loss": 0.1232, "lr": 5.8858092767236084e-08, "epoch": 4.8, "percentage": 96.0, "elapsed_time": "0:01:12", "remaining_time": "0:00:03", "throughput": 2090.66, "total_tokens": 151392}
|
|
|
|
|
|
|
|
|
|
|
|
| 55 |
{"current_steps": 230, "total_steps": 250, "loss": 0.1016, "lr": 2.134025123396638e-07, "epoch": 4.6, "percentage": 92.0, "elapsed_time": "0:01:10", "remaining_time": "0:00:06", "throughput": 2051.18, "total_tokens": 144960}
|
| 56 |
{"current_steps": 235, "total_steps": 250, "loss": 0.1449, "lr": 1.2425322847218368e-07, "epoch": 4.7, "percentage": 94.0, "elapsed_time": "0:01:11", "remaining_time": "0:00:04", "throughput": 2068.53, "total_tokens": 147936}
|
| 57 |
{"current_steps": 240, "total_steps": 250, "loss": 0.1232, "lr": 5.8858092767236084e-08, "epoch": 4.8, "percentage": 96.0, "elapsed_time": "0:01:12", "remaining_time": "0:00:03", "throughput": 2090.66, "total_tokens": 151392}
|
| 58 |
+
{"current_steps": 245, "total_steps": 250, "loss": 0.1831, "lr": 1.753570375247815e-08, "epoch": 4.9, "percentage": 98.0, "elapsed_time": "0:01:13", "remaining_time": "0:00:01", "throughput": 2107.95, "total_tokens": 154624}
|
| 59 |
+
{"current_steps": 250, "total_steps": 250, "loss": 0.1208, "lr": 4.87379953478806e-10, "epoch": 5.0, "percentage": 100.0, "elapsed_time": "0:01:14", "remaining_time": "0:00:00", "throughput": 2130.97, "total_tokens": 158656}
|
| 60 |
+
{"current_steps": 250, "total_steps": 250, "eval_loss": 0.21456226706504822, "epoch": 5.0, "percentage": 100.0, "elapsed_time": "0:01:15", "remaining_time": "0:00:00", "throughput": 2095.61, "total_tokens": 158656}
|