Training in progress, step 70
Browse files- adapter_model.safetensors +1 -1
- trainer_log.jsonl +11 -0
adapter_model.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 80792096
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:84b4fa685f278e4b0469c1382e427a1e53d767a517e55c9b88cb97401250e954
|
| 3 |
size 80792096
|
trainer_log.jsonl
CHANGED
|
@@ -64,3 +64,14 @@
|
|
| 64 |
{"current_steps": 59, "total_steps": 125, "loss": 0.0401, "lr": 6.384177557124247e-05, "epoch": 2.330864197530864, "percentage": 47.2, "elapsed_time": "0:26:56", "remaining_time": "0:30:07"}
|
| 65 |
{"current_steps": 60, "total_steps": 125, "loss": 0.0763, "lr": 6.248882390836135e-05, "epoch": 2.3703703703703702, "percentage": 48.0, "elapsed_time": "0:27:22", "remaining_time": "0:29:39"}
|
| 66 |
{"current_steps": 60, "total_steps": 125, "eval_loss": 0.07488537579774857, "epoch": 2.3703703703703702, "percentage": 48.0, "elapsed_time": "0:27:44", "remaining_time": "0:30:02"}
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 64 |
{"current_steps": 59, "total_steps": 125, "loss": 0.0401, "lr": 6.384177557124247e-05, "epoch": 2.330864197530864, "percentage": 47.2, "elapsed_time": "0:26:56", "remaining_time": "0:30:07"}
|
| 65 |
{"current_steps": 60, "total_steps": 125, "loss": 0.0763, "lr": 6.248882390836135e-05, "epoch": 2.3703703703703702, "percentage": 48.0, "elapsed_time": "0:27:22", "remaining_time": "0:29:39"}
|
| 66 |
{"current_steps": 60, "total_steps": 125, "eval_loss": 0.07488537579774857, "epoch": 2.3703703703703702, "percentage": 48.0, "elapsed_time": "0:27:44", "remaining_time": "0:30:02"}
|
| 67 |
+
{"current_steps": 61, "total_steps": 125, "loss": 0.0948, "lr": 6.112604669781572e-05, "epoch": 2.4098765432098768, "percentage": 48.8, "elapsed_time": "0:28:13", "remaining_time": "0:29:36"}
|
| 68 |
+
{"current_steps": 62, "total_steps": 125, "loss": 0.0565, "lr": 5.9754516100806423e-05, "epoch": 2.449382716049383, "percentage": 49.6, "elapsed_time": "0:28:37", "remaining_time": "0:29:05"}
|
| 69 |
+
{"current_steps": 63, "total_steps": 125, "loss": 0.0929, "lr": 5.837531116523682e-05, "epoch": 2.488888888888889, "percentage": 50.4, "elapsed_time": "0:29:03", "remaining_time": "0:28:35"}
|
| 70 |
+
{"current_steps": 64, "total_steps": 125, "loss": 0.0439, "lr": 5.698951697677498e-05, "epoch": 2.528395061728395, "percentage": 51.2, "elapsed_time": "0:29:27", "remaining_time": "0:28:04"}
|
| 71 |
+
{"current_steps": 65, "total_steps": 125, "loss": 0.0784, "lr": 5.559822380516539e-05, "epoch": 2.567901234567901, "percentage": 52.0, "elapsed_time": "0:29:52", "remaining_time": "0:27:34"}
|
| 72 |
+
{"current_steps": 66, "total_steps": 125, "loss": 0.062, "lr": 5.420252624646238e-05, "epoch": 2.6074074074074076, "percentage": 52.8, "elapsed_time": "0:30:18", "remaining_time": "0:27:05"}
|
| 73 |
+
{"current_steps": 67, "total_steps": 125, "loss": 0.1083, "lr": 5.2803522361859594e-05, "epoch": 2.6469135802469137, "percentage": 53.6, "elapsed_time": "0:30:43", "remaining_time": "0:26:35"}
|
| 74 |
+
{"current_steps": 68, "total_steps": 125, "loss": 0.0661, "lr": 5.140231281379345e-05, "epoch": 2.68641975308642, "percentage": 54.4, "elapsed_time": "0:31:06", "remaining_time": "0:26:04"}
|
| 75 |
+
{"current_steps": 69, "total_steps": 125, "loss": 0.0883, "lr": 5e-05, "epoch": 2.725925925925926, "percentage": 55.2, "elapsed_time": "0:31:31", "remaining_time": "0:25:35"}
|
| 76 |
+
{"current_steps": 70, "total_steps": 125, "loss": 0.0509, "lr": 4.859768718620656e-05, "epoch": 2.765432098765432, "percentage": 56.0, "elapsed_time": "0:31:56", "remaining_time": "0:25:05"}
|
| 77 |
+
{"current_steps": 70, "total_steps": 125, "eval_loss": 0.07292327284812927, "epoch": 2.765432098765432, "percentage": 56.0, "elapsed_time": "0:32:18", "remaining_time": "0:25:23"}
|