Upload folder using huggingface_hub
Browse files
README.md
CHANGED
|
@@ -199,4 +199,4 @@ Carbon emissions can be estimated using the [Machine Learning Impact calculator]
|
|
| 199 |
[More Information Needed]
|
| 200 |
### Framework versions
|
| 201 |
|
| 202 |
-
- PEFT 0.
|
|
|
|
| 199 |
[More Information Needed]
|
| 200 |
### Framework versions
|
| 201 |
|
| 202 |
+
- PEFT 0.13.2
|
adapter_config.json
CHANGED
|
@@ -10,20 +10,25 @@
|
|
| 10 |
"layers_pattern": null,
|
| 11 |
"layers_to_transform": null,
|
| 12 |
"loftq_config": {},
|
| 13 |
-
"lora_alpha":
|
| 14 |
-
"lora_dropout": 0.
|
| 15 |
"megatron_config": null,
|
| 16 |
"megatron_core": "megatron.core",
|
| 17 |
"modules_to_save": null,
|
| 18 |
"peft_type": "LORA",
|
| 19 |
-
"r":
|
| 20 |
"rank_pattern": {},
|
| 21 |
"revision": null,
|
| 22 |
"target_modules": [
|
|
|
|
|
|
|
|
|
|
|
|
|
| 23 |
"o_proj",
|
| 24 |
-
"
|
| 25 |
"down_proj",
|
| 26 |
-
"
|
|
|
|
| 27 |
],
|
| 28 |
"task_type": "CAUSAL_LM",
|
| 29 |
"use_dora": false,
|
|
|
|
| 10 |
"layers_pattern": null,
|
| 11 |
"layers_to_transform": null,
|
| 12 |
"loftq_config": {},
|
| 13 |
+
"lora_alpha": 64,
|
| 14 |
+
"lora_dropout": 0.0,
|
| 15 |
"megatron_config": null,
|
| 16 |
"megatron_core": "megatron.core",
|
| 17 |
"modules_to_save": null,
|
| 18 |
"peft_type": "LORA",
|
| 19 |
+
"r": 32,
|
| 20 |
"rank_pattern": {},
|
| 21 |
"revision": null,
|
| 22 |
"target_modules": [
|
| 23 |
+
"gate_up_proj",
|
| 24 |
+
"up_proj",
|
| 25 |
+
"k_proj",
|
| 26 |
+
"gate_proj",
|
| 27 |
"o_proj",
|
| 28 |
+
"q_proj",
|
| 29 |
"down_proj",
|
| 30 |
+
"qkv_proj",
|
| 31 |
+
"v_proj"
|
| 32 |
],
|
| 33 |
"task_type": "CAUSAL_LM",
|
| 34 |
"use_dora": false,
|
adapter_model.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
-
size
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:1ca99efb978f25f66cb4568ab6e4ba1d0ebc7d9c68346a5fa8bcc29ff98666e4
|
| 3 |
+
size 201361312
|
runs/Jan28_14-20-00_t-20250128221901-wrvdh-worker-0/events.out.tfevents.1738074025.t-20250128221901-wrvdh-worker-0.617.0
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:996bb700c9e6f7c0832251fe626a7517ef4667be642c438fa7b34c0df58c3218
|
| 3 |
+
size 16636
|
training_args.bin
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 5432
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:12efcd57b6a8086e328681cd6ac683048e2ee3e8c2f6af00cdf51a0190b0d8f3
|
| 3 |
size 5432
|