Tentoumaru committed on
Commit
100129f
·
verified ·
1 Parent(s): 95065c5

Upload LoRA adapter (README written by author)

Browse files
Files changed (3) hide show
  1. README.md +5 -5
  2. adapter_config.json +5 -5
  3. adapter_model.safetensors +1 -1
README.md CHANGED
@@ -1,5 +1,5 @@
1
  ---
2
- base_model: Qwen/Qwen3-4B-Instruct-2507
3
  datasets:
4
  - Tentoumaru/structured_data_with_cot_dataset_512_v2_nocot_whit_rules
5
  language:
@@ -13,10 +13,10 @@ tags:
13
  - structured-output
14
  ---
15
 
16
- <qwen3-4b-dataset_512_v2_nocot_whit_rules
17
 
18
  This repository provides a **LoRA adapter** fine-tuned from
19
- **Qwen/Qwen3-4B-Instruct-2507** using **QLoRA (4-bit, Unsloth)**.
20
 
21
  This repository contains **LoRA adapter weights only**.
22
  The base model must be loaded separately.
@@ -31,7 +31,7 @@ while intermediate reasoning (Chain-of-Thought) is masked.
31
 
32
  ## Training Configuration
33
 
34
- - Base model: Qwen/Qwen3-4B-Instruct-2507
35
  - Method: QLoRA (4-bit)
36
  - Max sequence length: 512
37
  - Epochs: 1
@@ -45,7 +45,7 @@ from transformers import AutoModelForCausalLM, AutoTokenizer
45
  from peft import PeftModel
46
  import torch
47
 
48
- base = "Qwen/Qwen3-4B-Instruct-2507"
49
  adapter = "Tentoumaru/structured_data_with_cot_dataset_512_v2_nocot"
50
 
51
  tokenizer = AutoTokenizer.from_pretrained(base)
 
1
  ---
2
+ base_model: unsloth/Qwen3-4B-Instruct-2507
3
  datasets:
4
  - Tentoumaru/structured_data_with_cot_dataset_512_v2_nocot_whit_rules
5
  language:
 
13
  - structured-output
14
  ---
15
 
16
+ <qwen3-4b-dataset_512_v2_nocot_whit_rules2
17
 
18
  This repository provides a **LoRA adapter** fine-tuned from
19
+ **unsloth/Qwen3-4B-Instruct-2507** using **QLoRA (4-bit, Unsloth)**.
20
 
21
  This repository contains **LoRA adapter weights only**.
22
  The base model must be loaded separately.
 
31
 
32
  ## Training Configuration
33
 
34
+ - Base model: unsloth/Qwen3-4B-Instruct-2507
35
  - Method: QLoRA (4-bit)
36
  - Max sequence length: 512
37
  - Epochs: 1
 
45
  from peft import PeftModel
46
  import torch
47
 
48
+ base = "unsloth/Qwen3-4B-Instruct-2507"
49
  adapter = "Tentoumaru/structured_data_with_cot_dataset_512_v2_nocot"
50
 
51
  tokenizer = AutoTokenizer.from_pretrained(base)
adapter_config.json CHANGED
@@ -34,12 +34,12 @@
34
  "revision": null,
35
  "target_modules": [
36
  "up_proj",
37
- "v_proj",
38
- "q_proj",
39
- "gate_proj",
40
- "down_proj",
41
  "k_proj",
42
- "o_proj"
 
 
 
 
43
  ],
44
  "target_parameters": null,
45
  "task_type": "CAUSAL_LM",
 
34
  "revision": null,
35
  "target_modules": [
36
  "up_proj",
 
 
 
 
37
  "k_proj",
38
+ "down_proj",
39
+ "gate_proj",
40
+ "o_proj",
41
+ "v_proj",
42
+ "q_proj"
43
  ],
44
  "target_parameters": null,
45
  "task_type": "CAUSAL_LM",
adapter_model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:b62f497b65be420e19e0d5cddf4661132ab8b41e39fafec09e676ef36b1647c9
3
  size 528550256
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a3b1d6af081c9fedf7a86ee1fc9c8a255c5041e7a4afa6e5111817bce4d30fc3
3
  size 528550256