File size: 805 Bytes
acf77ab | 1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24 25 | # LoRA config (proven in DriftCall)
LORA_R = 16
LORA_ALPHA = 32
LORA_DROPOUT = 0.05
BASE_MODEL = "unsloth/Qwen2.5-Coder-1.5B-Instruct"
def load_model(max_seq_len=2048):
from unsloth import FastLanguageModel
model, tokenizer = FastLanguageModel.from_pretrained(
model_name=BASE_MODEL,
max_seq_length=max_seq_len,
load_in_4bit=False, # Standard unsloth behavior, space uses fp16/bf16
dtype="bfloat16",
)
model = FastLanguageModel.get_peft_model(
model, r=LORA_R, lora_alpha=LORA_ALPHA,
lora_dropout=LORA_DROPOUT,
target_modules=["q_proj","k_proj","v_proj","o_proj",
"gate_proj","up_proj","down_proj"],
bias="none",
use_gradient_checkpointing="unsloth",
)
return model, tokenizer
|