Training in progress, step 80
Browse files- adapter_model.safetensors +1 -1
- trainer_log.jsonl +11 -0
adapter_model.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 80792096
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:92ab4689480caf32dfc9a916cac7a88b18134bce72a945abd6f997431c7e6105
|
| 3 |
size 80792096
|
trainer_log.jsonl
CHANGED
|
@@ -75,3 +75,14 @@
|
|
| 75 |
{"current_steps": 69, "total_steps": 125, "loss": 0.0992, "lr": 5e-05, "epoch": 2.725925925925926, "percentage": 55.2, "elapsed_time": "0:32:15", "remaining_time": "0:26:11"}
|
| 76 |
{"current_steps": 70, "total_steps": 125, "loss": 0.1027, "lr": 4.859768718620656e-05, "epoch": 2.765432098765432, "percentage": 56.0, "elapsed_time": "0:32:42", "remaining_time": "0:25:41"}
|
| 77 |
{"current_steps": 70, "total_steps": 125, "eval_loss": 0.06911057978868484, "epoch": 2.765432098765432, "percentage": 56.0, "elapsed_time": "0:33:04", "remaining_time": "0:25:59"}
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 75 |
{"current_steps": 69, "total_steps": 125, "loss": 0.0992, "lr": 5e-05, "epoch": 2.725925925925926, "percentage": 55.2, "elapsed_time": "0:32:15", "remaining_time": "0:26:11"}
|
| 76 |
{"current_steps": 70, "total_steps": 125, "loss": 0.1027, "lr": 4.859768718620656e-05, "epoch": 2.765432098765432, "percentage": 56.0, "elapsed_time": "0:32:42", "remaining_time": "0:25:41"}
|
| 77 |
{"current_steps": 70, "total_steps": 125, "eval_loss": 0.06911057978868484, "epoch": 2.765432098765432, "percentage": 56.0, "elapsed_time": "0:33:04", "remaining_time": "0:25:59"}
|
| 78 |
+
{"current_steps": 71, "total_steps": 125, "loss": 0.0677, "lr": 4.7196477638140404e-05, "epoch": 2.8049382716049385, "percentage": 56.8, "elapsed_time": "0:33:34", "remaining_time": "0:25:32"}
|
| 79 |
+
{"current_steps": 72, "total_steps": 125, "loss": 0.1371, "lr": 4.579747375353763e-05, "epoch": 2.8444444444444446, "percentage": 57.6, "elapsed_time": "0:34:01", "remaining_time": "0:25:02"}
|
| 80 |
+
{"current_steps": 73, "total_steps": 125, "loss": 0.0889, "lr": 4.4401776194834613e-05, "epoch": 2.8839506172839506, "percentage": 58.4, "elapsed_time": "0:34:27", "remaining_time": "0:24:32"}
|
| 81 |
+
{"current_steps": 74, "total_steps": 125, "loss": 0.0707, "lr": 4.3010483023225045e-05, "epoch": 2.9234567901234567, "percentage": 59.2, "elapsed_time": "0:34:54", "remaining_time": "0:24:03"}
|
| 82 |
+
{"current_steps": 75, "total_steps": 125, "loss": 0.0512, "lr": 4.162468883476319e-05, "epoch": 2.962962962962963, "percentage": 60.0, "elapsed_time": "0:35:20", "remaining_time": "0:23:33"}
|
| 83 |
+
{"current_steps": 76, "total_steps": 125, "loss": 0.0939, "lr": 4.0245483899193595e-05, "epoch": 3.0024691358024693, "percentage": 60.8, "elapsed_time": "0:35:45", "remaining_time": "0:23:03"}
|
| 84 |
+
{"current_steps": 77, "total_steps": 125, "loss": 0.1218, "lr": 3.887395330218429e-05, "epoch": 3.0419753086419754, "percentage": 61.6, "elapsed_time": "0:36:11", "remaining_time": "0:22:33"}
|
| 85 |
+
{"current_steps": 78, "total_steps": 125, "loss": 0.1469, "lr": 3.7511176091638653e-05, "epoch": 3.0814814814814815, "percentage": 62.4, "elapsed_time": "0:36:36", "remaining_time": "0:22:03"}
|
| 86 |
+
{"current_steps": 79, "total_steps": 125, "loss": 0.0381, "lr": 3.6158224428757535e-05, "epoch": 3.1209876543209876, "percentage": 63.2, "elapsed_time": "0:37:03", "remaining_time": "0:21:34"}
|
| 87 |
+
{"current_steps": 80, "total_steps": 125, "loss": 0.0985, "lr": 3.4816162744519263e-05, "epoch": 3.1604938271604937, "percentage": 64.0, "elapsed_time": "0:37:26", "remaining_time": "0:21:03"}
|
| 88 |
+
{"current_steps": 80, "total_steps": 125, "eval_loss": 0.06823357194662094, "epoch": 3.1604938271604937, "percentage": 64.0, "elapsed_time": "0:37:49", "remaining_time": "0:21:16"}
|