Training in progress, step 70
Browse files- adapter_model.safetensors +1 -1
- trainer_log.jsonl +11 -0
adapter_model.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 83945296
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:10b8490335e7c7e43f93ed3b6919b984c54b06a52522364c3f4ac4191797d344
|
| 3 |
size 83945296
|
trainer_log.jsonl
CHANGED
|
@@ -64,3 +64,14 @@
|
|
| 64 |
{"current_steps": 59, "total_steps": 125, "loss": 0.012, "lr": 6.384177557124247e-05, "epoch": 2.330864197530864, "percentage": 47.2, "elapsed_time": "0:43:10", "remaining_time": "0:48:17"}
|
| 65 |
{"current_steps": 60, "total_steps": 125, "loss": 0.0168, "lr": 6.248882390836135e-05, "epoch": 2.3703703703703702, "percentage": 48.0, "elapsed_time": "0:43:52", "remaining_time": "0:47:31"}
|
| 66 |
{"current_steps": 60, "total_steps": 125, "eval_loss": 0.020698141306638718, "epoch": 2.3703703703703702, "percentage": 48.0, "elapsed_time": "0:44:21", "remaining_time": "0:48:03"}
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 64 |
{"current_steps": 59, "total_steps": 125, "loss": 0.012, "lr": 6.384177557124247e-05, "epoch": 2.330864197530864, "percentage": 47.2, "elapsed_time": "0:43:10", "remaining_time": "0:48:17"}
|
| 65 |
{"current_steps": 60, "total_steps": 125, "loss": 0.0168, "lr": 6.248882390836135e-05, "epoch": 2.3703703703703702, "percentage": 48.0, "elapsed_time": "0:43:52", "remaining_time": "0:47:31"}
|
| 66 |
{"current_steps": 60, "total_steps": 125, "eval_loss": 0.020698141306638718, "epoch": 2.3703703703703702, "percentage": 48.0, "elapsed_time": "0:44:21", "remaining_time": "0:48:03"}
|
| 67 |
+
{"current_steps": 61, "total_steps": 125, "loss": 0.0141, "lr": 6.112604669781572e-05, "epoch": 2.4098765432098768, "percentage": 48.8, "elapsed_time": "0:45:07", "remaining_time": "0:47:20"}
|
| 68 |
+
{"current_steps": 62, "total_steps": 125, "loss": 0.0164, "lr": 5.9754516100806423e-05, "epoch": 2.449382716049383, "percentage": 49.6, "elapsed_time": "0:45:44", "remaining_time": "0:46:28"}
|
| 69 |
+
{"current_steps": 63, "total_steps": 125, "loss": 0.0149, "lr": 5.837531116523682e-05, "epoch": 2.488888888888889, "percentage": 50.4, "elapsed_time": "0:46:24", "remaining_time": "0:45:40"}
|
| 70 |
+
{"current_steps": 64, "total_steps": 125, "loss": 0.0138, "lr": 5.698951697677498e-05, "epoch": 2.528395061728395, "percentage": 51.2, "elapsed_time": "0:46:55", "remaining_time": "0:44:43"}
|
| 71 |
+
{"current_steps": 65, "total_steps": 125, "loss": 0.0179, "lr": 5.559822380516539e-05, "epoch": 2.567901234567901, "percentage": 52.0, "elapsed_time": "0:48:04", "remaining_time": "0:44:22"}
|
| 72 |
+
{"current_steps": 66, "total_steps": 125, "loss": 0.012, "lr": 5.420252624646238e-05, "epoch": 2.6074074074074076, "percentage": 52.8, "elapsed_time": "0:48:36", "remaining_time": "0:43:27"}
|
| 73 |
+
{"current_steps": 67, "total_steps": 125, "loss": 0.0169, "lr": 5.2803522361859594e-05, "epoch": 2.6469135802469137, "percentage": 53.6, "elapsed_time": "0:49:20", "remaining_time": "0:42:43"}
|
| 74 |
+
{"current_steps": 68, "total_steps": 125, "loss": 0.0154, "lr": 5.140231281379345e-05, "epoch": 2.68641975308642, "percentage": 54.4, "elapsed_time": "0:49:54", "remaining_time": "0:41:50"}
|
| 75 |
+
{"current_steps": 69, "total_steps": 125, "loss": 0.0114, "lr": 5e-05, "epoch": 2.725925925925926, "percentage": 55.2, "elapsed_time": "0:50:22", "remaining_time": "0:40:53"}
|
| 76 |
+
{"current_steps": 70, "total_steps": 125, "loss": 0.0153, "lr": 4.859768718620656e-05, "epoch": 2.765432098765432, "percentage": 56.0, "elapsed_time": "0:50:52", "remaining_time": "0:39:58"}
|
| 77 |
+
{"current_steps": 70, "total_steps": 125, "eval_loss": 0.01982175186276436, "epoch": 2.765432098765432, "percentage": 56.0, "elapsed_time": "0:51:21", "remaining_time": "0:40:21"}
|