Training in progress, step 20
Browse files- adapter_model.safetensors +1 -1
- trainer_log.jsonl +11 -0
adapter_model.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 80792096
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:9f0e0fce800cc49131846f1b0d9a7867ae8c807f4daae816a80c1c413d8ec058
|
| 3 |
size 80792096
|
trainer_log.jsonl
CHANGED
|
@@ -9,3 +9,14 @@
|
|
| 9 |
{"current_steps": 9, "total_steps": 125, "loss": 0.1318, "lr": 6.923076923076924e-05, "epoch": 0.35555555555555557, "percentage": 7.2, "elapsed_time": "0:05:54", "remaining_time": "1:16:10"}
|
| 10 |
{"current_steps": 10, "total_steps": 125, "loss": 0.1222, "lr": 7.692307692307693e-05, "epoch": 0.3950617283950617, "percentage": 8.0, "elapsed_time": "0:06:30", "remaining_time": "1:14:48"}
|
| 11 |
{"current_steps": 10, "total_steps": 125, "eval_loss": 0.1259034425020218, "epoch": 0.3950617283950617, "percentage": 8.0, "elapsed_time": "0:06:58", "remaining_time": "1:20:09"}
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 9 |
{"current_steps": 9, "total_steps": 125, "loss": 0.1318, "lr": 6.923076923076924e-05, "epoch": 0.35555555555555557, "percentage": 7.2, "elapsed_time": "0:05:54", "remaining_time": "1:16:10"}
|
| 10 |
{"current_steps": 10, "total_steps": 125, "loss": 0.1222, "lr": 7.692307692307693e-05, "epoch": 0.3950617283950617, "percentage": 8.0, "elapsed_time": "0:06:30", "remaining_time": "1:14:48"}
|
| 11 |
{"current_steps": 10, "total_steps": 125, "eval_loss": 0.1259034425020218, "epoch": 0.3950617283950617, "percentage": 8.0, "elapsed_time": "0:06:58", "remaining_time": "1:20:09"}
|
| 12 |
+
{"current_steps": 11, "total_steps": 125, "loss": 0.1177, "lr": 8.461538461538461e-05, "epoch": 0.4345679012345679, "percentage": 8.8, "elapsed_time": "0:07:32", "remaining_time": "1:18:08"}
|
| 13 |
+
{"current_steps": 12, "total_steps": 125, "loss": 0.0781, "lr": 9.230769230769232e-05, "epoch": 0.4740740740740741, "percentage": 9.6, "elapsed_time": "0:08:28", "remaining_time": "1:19:47"}
|
| 14 |
+
{"current_steps": 13, "total_steps": 125, "loss": 0.0794, "lr": 0.0001, "epoch": 0.5135802469135803, "percentage": 10.4, "elapsed_time": "0:09:01", "remaining_time": "1:17:46"}
|
| 15 |
+
{"current_steps": 14, "total_steps": 125, "loss": 0.0857, "lr": 9.998033131915266e-05, "epoch": 0.5530864197530864, "percentage": 11.2, "elapsed_time": "0:09:34", "remaining_time": "1:15:53"}
|
| 16 |
+
{"current_steps": 15, "total_steps": 125, "loss": 0.0733, "lr": 9.992134075089084e-05, "epoch": 0.5925925925925926, "percentage": 12.0, "elapsed_time": "0:10:11", "remaining_time": "1:14:47"}
|
| 17 |
+
{"current_steps": 16, "total_steps": 125, "loss": 0.0601, "lr": 9.982307470588098e-05, "epoch": 0.6320987654320988, "percentage": 12.8, "elapsed_time": "0:11:01", "remaining_time": "1:15:03"}
|
| 18 |
+
{"current_steps": 17, "total_steps": 125, "loss": 0.0619, "lr": 9.968561049466214e-05, "epoch": 0.671604938271605, "percentage": 13.6, "elapsed_time": "0:11:41", "remaining_time": "1:14:13"}
|
| 19 |
+
{"current_steps": 18, "total_steps": 125, "loss": 0.0641, "lr": 9.950905626682228e-05, "epoch": 0.7111111111111111, "percentage": 14.4, "elapsed_time": "0:12:10", "remaining_time": "1:12:24"}
|
| 20 |
+
{"current_steps": 19, "total_steps": 125, "loss": 0.061, "lr": 9.92935509259118e-05, "epoch": 0.7506172839506173, "percentage": 15.2, "elapsed_time": "0:12:51", "remaining_time": "1:11:44"}
|
| 21 |
+
{"current_steps": 20, "total_steps": 125, "loss": 0.0678, "lr": 9.903926402016153e-05, "epoch": 0.7901234567901234, "percentage": 16.0, "elapsed_time": "0:13:18", "remaining_time": "1:09:52"}
|
| 22 |
+
{"current_steps": 20, "total_steps": 125, "eval_loss": 0.06134464964270592, "epoch": 0.7901234567901234, "percentage": 16.0, "elapsed_time": "0:13:46", "remaining_time": "1:12:18"}
|