Training in progress, step 70
Browse files- adapter_model.safetensors +1 -1
- trainer_log.jsonl +11 -0
adapter_model.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 80792096
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:4819a1ef093d8de22f1066b2d2d4102e5ebd599b946193aeaee1f16e15ad5e16
|
| 3 |
size 80792096
|
trainer_log.jsonl
CHANGED
|
@@ -64,3 +64,14 @@
|
|
| 64 |
{"current_steps": 59, "total_steps": 125, "loss": 0.1048, "lr": 6.384177557124247e-05, "epoch": 2.330864197530864, "percentage": 47.2, "elapsed_time": "0:27:36", "remaining_time": "0:30:53"}
|
| 65 |
{"current_steps": 60, "total_steps": 125, "loss": 0.0496, "lr": 6.248882390836135e-05, "epoch": 2.3703703703703702, "percentage": 48.0, "elapsed_time": "0:28:02", "remaining_time": "0:30:22"}
|
| 66 |
{"current_steps": 60, "total_steps": 125, "eval_loss": 0.07066290825605392, "epoch": 2.3703703703703702, "percentage": 48.0, "elapsed_time": "0:28:24", "remaining_time": "0:30:46"}
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 64 |
{"current_steps": 59, "total_steps": 125, "loss": 0.1048, "lr": 6.384177557124247e-05, "epoch": 2.330864197530864, "percentage": 47.2, "elapsed_time": "0:27:36", "remaining_time": "0:30:53"}
|
| 65 |
{"current_steps": 60, "total_steps": 125, "loss": 0.0496, "lr": 6.248882390836135e-05, "epoch": 2.3703703703703702, "percentage": 48.0, "elapsed_time": "0:28:02", "remaining_time": "0:30:22"}
|
| 66 |
{"current_steps": 60, "total_steps": 125, "eval_loss": 0.07066290825605392, "epoch": 2.3703703703703702, "percentage": 48.0, "elapsed_time": "0:28:24", "remaining_time": "0:30:46"}
|
| 67 |
+
{"current_steps": 61, "total_steps": 125, "loss": 0.0301, "lr": 6.112604669781572e-05, "epoch": 2.4098765432098768, "percentage": 48.8, "elapsed_time": "0:28:54", "remaining_time": "0:30:20"}
|
| 68 |
+
{"current_steps": 62, "total_steps": 125, "loss": 0.0887, "lr": 5.9754516100806423e-05, "epoch": 2.449382716049383, "percentage": 49.6, "elapsed_time": "0:29:19", "remaining_time": "0:29:48"}
|
| 69 |
+
{"current_steps": 63, "total_steps": 125, "loss": 0.052, "lr": 5.837531116523682e-05, "epoch": 2.488888888888889, "percentage": 50.4, "elapsed_time": "0:29:44", "remaining_time": "0:29:15"}
|
| 70 |
+
{"current_steps": 64, "total_steps": 125, "loss": 0.0575, "lr": 5.698951697677498e-05, "epoch": 2.528395061728395, "percentage": 51.2, "elapsed_time": "0:30:10", "remaining_time": "0:28:45"}
|
| 71 |
+
{"current_steps": 65, "total_steps": 125, "loss": 0.1102, "lr": 5.559822380516539e-05, "epoch": 2.567901234567901, "percentage": 52.0, "elapsed_time": "0:30:35", "remaining_time": "0:28:14"}
|
| 72 |
+
{"current_steps": 66, "total_steps": 125, "loss": 0.0616, "lr": 5.420252624646238e-05, "epoch": 2.6074074074074076, "percentage": 52.8, "elapsed_time": "0:31:00", "remaining_time": "0:27:42"}
|
| 73 |
+
{"current_steps": 67, "total_steps": 125, "loss": 0.0695, "lr": 5.2803522361859594e-05, "epoch": 2.6469135802469137, "percentage": 53.6, "elapsed_time": "0:31:27", "remaining_time": "0:27:13"}
|
| 74 |
+
{"current_steps": 68, "total_steps": 125, "loss": 0.1095, "lr": 5.140231281379345e-05, "epoch": 2.68641975308642, "percentage": 54.4, "elapsed_time": "0:31:52", "remaining_time": "0:26:42"}
|
| 75 |
+
{"current_steps": 69, "total_steps": 125, "loss": 0.0992, "lr": 5e-05, "epoch": 2.725925925925926, "percentage": 55.2, "elapsed_time": "0:32:15", "remaining_time": "0:26:11"}
|
| 76 |
+
{"current_steps": 70, "total_steps": 125, "loss": 0.1027, "lr": 4.859768718620656e-05, "epoch": 2.765432098765432, "percentage": 56.0, "elapsed_time": "0:32:42", "remaining_time": "0:25:41"}
|
| 77 |
+
{"current_steps": 70, "total_steps": 125, "eval_loss": 0.06911057978868484, "epoch": 2.765432098765432, "percentage": 56.0, "elapsed_time": "0:33:04", "remaining_time": "0:25:59"}
|