innoku committed on
Commit b581555 · verified · 1 Parent(s): d118f04

Upload LoRA adapter (README written by author)

Files changed (3)
  1. README.md +5 -17
  2. adapter_config.json +5 -5
  3. adapter_model.safetensors +2 -2
README.md CHANGED
@@ -13,19 +13,7 @@ tags:
 - structured-output
 ---
 
-## Model Description
-
-This adapter was trained for the StructEval competition
-to improve structured data generation accuracy.
-
-## Base Model License
-
-The base model follows the Apache 2.0 license.
-
-
-
-
-
+<[Assignment] Please fill this section in yourself>
 
 This repository provides a **LoRA adapter** fine-tuned from
 **Qwen/Qwen3-4B-Instruct-2507** using **QLoRA (4-bit, Unsloth)**.
@@ -45,10 +33,10 @@ while intermediate reasoning (Chain-of-Thought) is masked.
 
 - Base model: Qwen/Qwen3-4B-Instruct-2507
 - Method: QLoRA (4-bit)
-- Max sequence length: 2048
-- Epochs: 3
-- Learning rate: 2e-06
-- LoRA: r=64, alpha=128
+- Max sequence length: 3072
+- Epochs: 6
+- Learning rate: 1e-05
+- LoRA: r=128, alpha=128
 
 ## Usage
 
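The README's Usage section is referenced in this hunk but its contents are not part of the diff. As a minimal sketch, assuming the standard transformers + peft loading path for a LoRA adapter on top of Qwen/Qwen3-4B-Instruct-2507 (the adapter repo id below is a placeholder, not taken from this commit):

```python
# Minimal sketch, not the repository's own Usage code: load the base model
# named in the README and attach this LoRA adapter with PEFT.
from transformers import AutoModelForCausalLM, AutoTokenizer
from peft import PeftModel

BASE_ID = "Qwen/Qwen3-4B-Instruct-2507"   # base model stated in the README
ADAPTER_ID = "path/to/this-lora-adapter"  # placeholder: replace with this repo's id

tokenizer = AutoTokenizer.from_pretrained(BASE_ID)
base = AutoModelForCausalLM.from_pretrained(BASE_ID, torch_dtype="auto", device_map="auto")
model = PeftModel.from_pretrained(base, ADAPTER_ID)  # applies the adapter weights

# Structured-output style prompt, matching the adapter's stated purpose.
messages = [{"role": "user", "content": "List three primary colors as a JSON array."}]
input_ids = tokenizer.apply_chat_template(
    messages, add_generation_prompt=True, return_tensors="pt"
).to(model.device)
output_ids = model.generate(input_ids, max_new_tokens=128)
print(tokenizer.decode(output_ids[0][input_ids.shape[-1]:], skip_special_tokens=True))
```

If a standalone checkpoint is preferred, the adapter can typically be merged into the base weights with `model.merge_and_unload()`.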
adapter_config.json CHANGED
@@ -29,17 +29,17 @@
   "peft_type": "LORA",
   "peft_version": "0.18.1",
   "qalora_group_size": 16,
-  "r": 64,
+  "r": 128,
   "rank_pattern": {},
   "revision": null,
   "target_modules": [
-    "k_proj",
-    "q_proj",
     "v_proj",
+    "down_proj",
+    "o_proj",
+    "k_proj",
     "up_proj",
     "gate_proj",
-    "down_proj",
-    "o_proj"
+    "q_proj"
   ],
   "target_parameters": null,
   "task_type": "CAUSAL_LM",
adapter_model.safetensors CHANGED
@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:969c15d2e63ee5b70dfc48fd3777b06a4faa740a63e41cfcdce4ffcd1d50e4bd
-size 528550256
+oid sha256:a69d8a5e5919266f0170395d0285e4a05db652dd4766f153d77c5a92213f1c60
+size 1057033224