Training in progress, step 100
Browse files- adapter_model.safetensors +1 -1
- trainer_log.jsonl +11 -0
adapter_model.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 80792096
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:4b12a0b2dde71f2f4391d1996d3bfcc5b3c561d3a4f46cc771c57bd045b47224
|
| 3 |
size 80792096
|
trainer_log.jsonl
CHANGED
|
@@ -4,3 +4,14 @@
|
|
| 4 |
{"current_steps": 40, "total_steps": 3245, "loss": 1.3791, "lr": 1.230769230769231e-05, "epoch": 0.06156213928434013, "percentage": 1.23, "elapsed_time": "0:05:28", "remaining_time": "7:18:20"}
|
| 5 |
{"current_steps": 50, "total_steps": 3245, "loss": 0.8754, "lr": 1.5384615384615387e-05, "epoch": 0.07695267410542517, "percentage": 1.54, "elapsed_time": "0:06:50", "remaining_time": "7:16:46"}
|
| 6 |
{"current_steps": 50, "total_steps": 3245, "eval_loss": 0.6955563426017761, "epoch": 0.07695267410542517, "percentage": 1.54, "elapsed_time": "0:09:25", "remaining_time": "10:02:43"}
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 4 |
{"current_steps": 40, "total_steps": 3245, "loss": 1.3791, "lr": 1.230769230769231e-05, "epoch": 0.06156213928434013, "percentage": 1.23, "elapsed_time": "0:05:28", "remaining_time": "7:18:20"}
|
| 5 |
{"current_steps": 50, "total_steps": 3245, "loss": 0.8754, "lr": 1.5384615384615387e-05, "epoch": 0.07695267410542517, "percentage": 1.54, "elapsed_time": "0:06:50", "remaining_time": "7:16:46"}
|
| 6 |
{"current_steps": 50, "total_steps": 3245, "eval_loss": 0.6955563426017761, "epoch": 0.07695267410542517, "percentage": 1.54, "elapsed_time": "0:09:25", "remaining_time": "10:02:43"}
|
| 7 |
+
{"current_steps": 60, "total_steps": 3245, "loss": 0.5912, "lr": 1.8461538461538465e-05, "epoch": 0.0923432089265102, "percentage": 1.85, "elapsed_time": "0:10:51", "remaining_time": "9:36:38"}
|
| 8 |
+
{"current_steps": 70, "total_steps": 3245, "loss": 0.4086, "lr": 2.1538461538461542e-05, "epoch": 0.10773374374759523, "percentage": 2.16, "elapsed_time": "0:12:13", "remaining_time": "9:14:13"}
|
| 9 |
+
{"current_steps": 80, "total_steps": 3245, "loss": 0.2136, "lr": 2.461538461538462e-05, "epoch": 0.12312427856868026, "percentage": 2.47, "elapsed_time": "0:13:35", "remaining_time": "8:57:27"}
|
| 10 |
+
{"current_steps": 90, "total_steps": 3245, "loss": 0.2183, "lr": 2.7692307692307694e-05, "epoch": 0.1385148133897653, "percentage": 2.77, "elapsed_time": "0:14:56", "remaining_time": "8:44:01"}
|
| 11 |
+
{"current_steps": 100, "total_steps": 3245, "loss": 0.1571, "lr": 3.0769230769230774e-05, "epoch": 0.15390534821085033, "percentage": 3.08, "elapsed_time": "0:16:18", "remaining_time": "8:33:05"}
|
| 12 |
+
{"current_steps": 100, "total_steps": 3245, "eval_loss": 0.10784146934747696, "epoch": 0.15390534821085033, "percentage": 3.08, "elapsed_time": "0:18:54", "remaining_time": "9:54:46"}
|
| 13 |
+
{"current_steps": 110, "total_steps": 3245, "loss": 0.1103, "lr": 3.384615384615385e-05, "epoch": 0.16929588303193535, "percentage": 3.39, "elapsed_time": "0:20:21", "remaining_time": "9:40:04"}
|
| 14 |
+
{"current_steps": 120, "total_steps": 3245, "loss": 0.1089, "lr": 3.692307692307693e-05, "epoch": 0.1846864178530204, "percentage": 3.7, "elapsed_time": "0:21:43", "remaining_time": "9:25:40"}
|
| 15 |
+
{"current_steps": 130, "total_steps": 3245, "loss": 0.078, "lr": 4e-05, "epoch": 0.2000769526741054, "percentage": 4.01, "elapsed_time": "0:23:05", "remaining_time": "9:13:11"}
|
| 16 |
+
{"current_steps": 140, "total_steps": 3245, "loss": 0.0833, "lr": 4.3076923076923084e-05, "epoch": 0.21546748749519046, "percentage": 4.31, "elapsed_time": "0:24:27", "remaining_time": "9:02:22"}
|
| 17 |
+
{"current_steps": 150, "total_steps": 3245, "loss": 0.0871, "lr": 4.615384615384616e-05, "epoch": 0.2308580223162755, "percentage": 4.62, "elapsed_time": "0:25:48", "remaining_time": "8:52:40"}
|