Training in progress, step 12600
Browse files- adapter_config.json +5 -5
- adapter_model.safetensors +1 -1
- trainer_log.jsonl +2 -11
- training_args.bin +1 -1
adapter_config.json
CHANGED
|
@@ -23,13 +23,13 @@
|
|
| 23 |
"rank_pattern": {},
|
| 24 |
"revision": null,
|
| 25 |
"target_modules": [
|
| 26 |
-
"gate_proj",
|
| 27 |
-
"q_proj",
|
| 28 |
"o_proj",
|
| 29 |
-
"
|
| 30 |
-
"
|
| 31 |
"k_proj",
|
| 32 |
-
"
|
|
|
|
|
|
|
| 33 |
],
|
| 34 |
"task_type": "CAUSAL_LM",
|
| 35 |
"use_dora": false,
|
|
|
|
| 23 |
"rank_pattern": {},
|
| 24 |
"revision": null,
|
| 25 |
"target_modules": [
|
|
|
|
|
|
|
| 26 |
"o_proj",
|
| 27 |
+
"down_proj",
|
| 28 |
+
"q_proj",
|
| 29 |
"k_proj",
|
| 30 |
+
"v_proj",
|
| 31 |
+
"gate_proj",
|
| 32 |
+
"up_proj"
|
| 33 |
],
|
| 34 |
"task_type": "CAUSAL_LM",
|
| 35 |
"use_dora": false,
|
adapter_model.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 161533160
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:366c6b6fac1cdd0e18cf44acfca9bdaee8477bb25d98740a7f9f89e4f4ba07d2
|
| 3 |
size 161533160
|
trainer_log.jsonl
CHANGED
|
@@ -1,11 +1,2 @@
|
|
| 1 |
-
{"current_steps":
|
| 2 |
-
{"current_steps":
|
| 3 |
-
{"current_steps": 12100, "total_steps": 18120, "loss": 0.3221, "lr": 3.0028102791373535e-05, "epoch": 2.0033112582781456, "percentage": 66.78, "elapsed_time": "0:37:49", "remaining_time": "0:18:48"}
|
| 4 |
-
{"current_steps": 12150, "total_steps": 18120, "loss": 0.281, "lr": 2.9587521598880573e-05, "epoch": 2.01158940397351, "percentage": 67.05, "elapsed_time": "0:41:00", "remaining_time": "0:20:08"}
|
| 5 |
-
{"current_steps": 12200, "total_steps": 18120, "loss": 0.2824, "lr": 2.914883419163475e-05, "epoch": 2.019867549668874, "percentage": 67.33, "elapsed_time": "0:44:12", "remaining_time": "0:21:27"}
|
| 6 |
-
{"current_steps": 12250, "total_steps": 18120, "loss": 0.2986, "lr": 2.871208126923771e-05, "epoch": 2.0281456953642385, "percentage": 67.6, "elapsed_time": "0:47:14", "remaining_time": "0:22:38"}
|
| 7 |
-
{"current_steps": 12300, "total_steps": 18120, "loss": 0.2852, "lr": 2.827730335181765e-05, "epoch": 2.0364238410596025, "percentage": 67.88, "elapsed_time": "0:50:32", "remaining_time": "0:23:54"}
|
| 8 |
-
{"current_steps": 12350, "total_steps": 18120, "loss": 0.2905, "lr": 2.7844540776269924e-05, "epoch": 2.044701986754967, "percentage": 68.16, "elapsed_time": "0:53:57", "remaining_time": "0:25:12"}
|
| 9 |
-
{"current_steps": 12400, "total_steps": 18120, "loss": 0.2791, "lr": 2.7413833692514844e-05, "epoch": 2.052980132450331, "percentage": 68.43, "elapsed_time": "0:57:06", "remaining_time": "0:26:20"}
|
| 10 |
-
{"current_steps": 12450, "total_steps": 18120, "loss": 0.2887, "lr": 2.698522205977273e-05, "epoch": 2.0612582781456954, "percentage": 68.71, "elapsed_time": "1:00:18", "remaining_time": "0:27:27"}
|
| 11 |
-
{"current_steps": 12500, "total_steps": 18120, "loss": 0.2845, "lr": 2.655874564285656e-05, "epoch": 2.0695364238410594, "percentage": 68.98, "elapsed_time": "1:03:33", "remaining_time": "0:28:34"}
|
|
|
|
| 1 |
+
{"current_steps": 12550, "total_steps": 18120, "loss": 0.284, "lr": 2.613444400848287e-05, "epoch": 2.077814569536424, "percentage": 69.26, "elapsed_time": "0:03:10", "remaining_time": "0:01:24"}
|
| 2 |
+
{"current_steps": 12600, "total_steps": 18120, "loss": 0.2852, "lr": 2.571235652160091e-05, "epoch": 2.0860927152317883, "percentage": 69.54, "elapsed_time": "0:06:12", "remaining_time": "0:02:43"}
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
training_args.bin
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 5752
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:03460364198bac94559385f580ca233415d6d940ccd70edd3903925ee0255ba2
|
| 3 |
size 5752
|