Akira1101
/

lora-structeval-Ver14

Text Generation

structured-output

Model card Files Files and versions

Akira1101 committed on Feb 21

Commit

5ec47bf

·

verified ·

1 Parent(s): 8dc7b19

Update README.md

Files changed (1) hide show

README.md +3 -1

README.md CHANGED Viewed

@@ -37,6 +37,8 @@ while intermediate reasoning (Chain-of-Thought) is masked.
 - Epochs: 1
 - Learning rate: 5e-05
 - LoRA: r=2, alpha=2
 ## Usage
@@ -46,7 +48,7 @@ from peft import PeftModel
 import torch
 base = "Qwen/Qwen3-4B-Instruct-2507"
-adapter = "your_id/your-repo"
 tokenizer = AutoTokenizer.from_pretrained(base)
 model = AutoModelForCausalLM.from_pretrained(

 - Epochs: 1
 - Learning rate: 5e-05
 - LoRA: r=2, alpha=2
+- SFT_WARMUP_RATIO = 0.5
+- SFT_WEIGHT_DECAY = 0.1
 ## Usage
 import torch
 base = "Qwen/Qwen3-4B-Instruct-2507"
+adapter = "Akira1101/lora-structeval-Ver14"
 tokenizer = AutoTokenizer.from_pretrained(base)
 model = AutoModelForCausalLM.from_pretrained(