Training in progress, step 2
Browse files
adapter_config.json
CHANGED
|
@@ -29,27 +29,27 @@
|
|
| 29 |
"rank_pattern": {},
|
| 30 |
"revision": null,
|
| 31 |
"target_modules": [
|
| 32 |
-
"layers.
|
| 33 |
"layers.0.mlp.down_proj",
|
| 34 |
-
"layers.12.mlp.down_proj",
|
| 35 |
"q_proj",
|
| 36 |
-
"layers.
|
| 37 |
-
"o_proj",
|
| 38 |
-
"k_proj",
|
| 39 |
-
"layers.15.mlp.down_proj",
|
| 40 |
-
"layers.1.mlp.down_proj",
|
| 41 |
-
"layers.5.mlp.down_proj",
|
| 42 |
-
"layers.3.mlp.down_proj",
|
| 43 |
-
"gate_up_proj",
|
| 44 |
-
"layers.2.mlp.down_proj",
|
| 45 |
-
"layers.13.mlp.down_proj",
|
| 46 |
"layers.6.mlp.down_proj",
|
| 47 |
-
"v_proj",
|
| 48 |
-
"layers.10.mlp.down_proj",
|
| 49 |
"layers.11.mlp.down_proj",
|
| 50 |
-
"layers.
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 51 |
"layers.7.mlp.down_proj",
|
| 52 |
-
"layers.
|
|
|
|
|
|
|
|
|
|
| 53 |
],
|
| 54 |
"target_parameters": null,
|
| 55 |
"task_type": "CAUSAL_LM",
|
|
|
|
| 29 |
"rank_pattern": {},
|
| 30 |
"revision": null,
|
| 31 |
"target_modules": [
|
| 32 |
+
"layers.2.mlp.down_proj",
|
| 33 |
"layers.0.mlp.down_proj",
|
|
|
|
| 34 |
"q_proj",
|
| 35 |
+
"layers.9.mlp.down_proj",
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 36 |
"layers.6.mlp.down_proj",
|
|
|
|
|
|
|
| 37 |
"layers.11.mlp.down_proj",
|
| 38 |
+
"layers.10.mlp.down_proj",
|
| 39 |
+
"layers.15.mlp.down_proj",
|
| 40 |
+
"v_proj",
|
| 41 |
+
"gate_up_proj",
|
| 42 |
+
"layers.12.mlp.down_proj",
|
| 43 |
+
"layers.3.mlp.down_proj",
|
| 44 |
+
"o_proj",
|
| 45 |
+
"layers.14.mlp.down_proj",
|
| 46 |
+
"layers.8.mlp.down_proj",
|
| 47 |
+
"layers.5.mlp.down_proj",
|
| 48 |
"layers.7.mlp.down_proj",
|
| 49 |
+
"layers.1.mlp.down_proj",
|
| 50 |
+
"k_proj",
|
| 51 |
+
"layers.4.mlp.down_proj",
|
| 52 |
+
"layers.13.mlp.down_proj"
|
| 53 |
],
|
| 54 |
"target_parameters": null,
|
| 55 |
"task_type": "CAUSAL_LM",
|
adapter_model.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 29912904
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:64df0764bfe053c84726c27244f3a4f48ca2824cda34102ebae5b1f6c142f440
|
| 3 |
size 29912904
|
runs/Apr09_05-18-42_cs-01knr8f8jy7kcvx4v0ce8jkn3q-1tpz/events.out.tfevents.1775711922.cs-01knr8f8jy7kcvx4v0ce8jkn3q-1tpz.131664.0
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:80c23f3743cb3b30817c27ef57b88c9bc1587927e18ae9962d38b99b9e5862ff
|
| 3 |
+
size 6645
|
trainer_log.jsonl
CHANGED
|
@@ -1,8 +1,3 @@
|
|
| 1 |
{"current_steps": 1, "total_steps": 5, "loss": 2.965193033218384, "lr": 0.0, "epoch": 0.3076923076923077, "percentage": 20.0, "elapsed_time": "0:00:02", "remaining_time": "0:00:10"}
|
| 2 |
{"current_steps": 2, "total_steps": 5, "loss": 2.7841198444366455, "lr": 0.0001, "epoch": 0.6153846153846154, "percentage": 40.0, "elapsed_time": "0:00:03", "remaining_time": "0:00:05"}
|
| 3 |
{"current_steps": 2, "total_steps": 5, "eval_loss": 2.749584436416626, "epoch": 0.6153846153846154, "percentage": 40.0, "elapsed_time": "0:00:05", "remaining_time": "0:00:08"}
|
| 4 |
-
{"current_steps": 3, "total_steps": 5, "loss": 2.890326499938965, "lr": 8.535533905932738e-05, "epoch": 0.9230769230769231, "percentage": 60.0, "elapsed_time": "0:00:08", "remaining_time": "0:00:05"}
|
| 5 |
-
{"current_steps": 4, "total_steps": 5, "loss": 2.643332004547119, "lr": 5e-05, "epoch": 1.0, "percentage": 80.0, "elapsed_time": "0:00:08", "remaining_time": "0:00:02"}
|
| 6 |
-
{"current_steps": 4, "total_steps": 5, "eval_loss": 2.586768388748169, "epoch": 1.0, "percentage": 80.0, "elapsed_time": "0:00:10", "remaining_time": "0:00:02"}
|
| 7 |
-
{"current_steps": 5, "total_steps": 5, "loss": 2.5542030334472656, "lr": 1.4644660940672627e-05, "epoch": 1.3076923076923077, "percentage": 100.0, "elapsed_time": "0:00:13", "remaining_time": "0:00:00"}
|
| 8 |
-
{"current_steps": 5, "total_steps": 5, "epoch": 1.3076923076923077, "percentage": 100.0, "elapsed_time": "0:00:14", "remaining_time": "0:00:00"}
|
|
|
|
| 1 |
{"current_steps": 1, "total_steps": 5, "loss": 2.965193033218384, "lr": 0.0, "epoch": 0.3076923076923077, "percentage": 20.0, "elapsed_time": "0:00:02", "remaining_time": "0:00:10"}
|
| 2 |
{"current_steps": 2, "total_steps": 5, "loss": 2.7841198444366455, "lr": 0.0001, "epoch": 0.6153846153846154, "percentage": 40.0, "elapsed_time": "0:00:03", "remaining_time": "0:00:05"}
|
| 3 |
{"current_steps": 2, "total_steps": 5, "eval_loss": 2.749584436416626, "epoch": 0.6153846153846154, "percentage": 40.0, "elapsed_time": "0:00:05", "remaining_time": "0:00:08"}
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|