Instructions to use MF0619/SFTv18 with libraries, inference providers, notebooks, and local apps. Follow these links to get started.
- Libraries
- PEFT
How to use MF0619/SFTv18 with PEFT:
from peft import PeftModel
from transformers import AutoModelForCausalLM

base_model = AutoModelForCausalLM.from_pretrained("unsloth/qwen3-4b-instruct-2507-unsloth-bnb-4bit")
model = PeftModel.from_pretrained(base_model, "MF0619/SFTv18")
- Notebooks
- Google Colab
- Kaggle
Upload 8 files
Browse files
- README.md +3 -3
- adapter_config.json +3 -3
- adapter_model.safetensors +2 -2
README.md
CHANGED
|
@@ -1,7 +1,7 @@
|
|
| 1 |
---
|
| 2 |
base_model: Qwen/Qwen3-4B-Instruct-2507
|
| 3 |
datasets:
|
| 4 |
-
- u-10bei/
|
| 5 |
language:
|
| 6 |
- en
|
| 7 |
license: apache-2.0
|
|
@@ -36,7 +36,7 @@ while intermediate reasoning (Chain-of-Thought) is masked.
|
|
| 36 |
- Max sequence length: 2048
|
| 37 |
- Epochs: 2
|
| 38 |
- Learning rate: 2e-05
|
| 39 |
-
- LoRA: r=
|
| 40 |
|
| 41 |
## Usage
|
| 42 |
|
|
@@ -59,7 +59,7 @@ model = PeftModel.from_pretrained(model, adapter)
|
|
| 59 |
|
| 60 |
## Sources & Terms (IMPORTANT)
|
| 61 |
|
| 62 |
-
Training data: u-10bei/
|
| 63 |
|
| 64 |
Dataset License: MIT License. This dataset is used and distributed under the terms of the MIT License.
|
| 65 |
Compliance: Users must comply with the MIT license (including copyright notice) and the base model's original terms of use.
|
|
|
|
| 1 |
---
|
| 2 |
base_model: Qwen/Qwen3-4B-Instruct-2507
|
| 3 |
datasets:
|
| 4 |
+
- u-10bei/structured_data_with_cot_dataset_512_v5
|
| 5 |
language:
|
| 6 |
- en
|
| 7 |
license: apache-2.0
|
|
|
|
| 36 |
- Max sequence length: 2048
|
| 37 |
- Epochs: 2
|
| 38 |
- Learning rate: 2e-05
|
| 39 |
+
- LoRA: r=32, alpha=64
|
| 40 |
|
| 41 |
## Usage
|
| 42 |
|
|
|
|
| 59 |
|
| 60 |
## Sources & Terms (IMPORTANT)
|
| 61 |
|
| 62 |
+
Training data: u-10bei/structured_data_with_cot_dataset_512_v5
|
| 63 |
|
| 64 |
Dataset License: MIT License. This dataset is used and distributed under the terms of the MIT License.
|
| 65 |
Compliance: Users must comply with the MIT license (including copyright notice) and the base model's original terms of use.
|
adapter_config.json
CHANGED
|
@@ -20,16 +20,16 @@
|
|
| 20 |
"layers_pattern": null,
|
| 21 |
"layers_to_transform": null,
|
| 22 |
"loftq_config": {},
|
| 23 |
-
"lora_alpha":
|
| 24 |
"lora_bias": false,
|
| 25 |
-
"lora_dropout": 0.
|
| 26 |
"megatron_config": null,
|
| 27 |
"megatron_core": "megatron.core",
|
| 28 |
"modules_to_save": null,
|
| 29 |
"peft_type": "LORA",
|
| 30 |
"peft_version": "0.18.1",
|
| 31 |
"qalora_group_size": 16,
|
| 32 |
-
"r":
|
| 33 |
"rank_pattern": {},
|
| 34 |
"revision": null,
|
| 35 |
"target_modules": [
|
|
|
|
| 20 |
"layers_pattern": null,
|
| 21 |
"layers_to_transform": null,
|
| 22 |
"loftq_config": {},
|
| 23 |
+
"lora_alpha": 64,
|
| 24 |
"lora_bias": false,
|
| 25 |
+
"lora_dropout": 0.05,
|
| 26 |
"megatron_config": null,
|
| 27 |
"megatron_core": "megatron.core",
|
| 28 |
"modules_to_save": null,
|
| 29 |
"peft_type": "LORA",
|
| 30 |
"peft_version": "0.18.1",
|
| 31 |
"qalora_group_size": 16,
|
| 32 |
+
"r": 32,
|
| 33 |
"rank_pattern": {},
|
| 34 |
"revision": null,
|
| 35 |
"target_modules": [
|
adapter_model.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
-
size
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:b691675d975607c342b28d8000efb8351664544a04ed80643eba37ea51c891cd
|
| 3 |
+
size 264308896
|