arasaltan committed on
Commit
12f607d
·
verified ·
1 Parent(s): 540a424

Update app.py

Browse files
Files changed (1) hide show
  1. app.py +6 -8
app.py CHANGED
@@ -11,20 +11,18 @@ tokenizer = AutoTokenizer.from_pretrained(BASE_MODEL)
11
  tokenizer.pad_token = tokenizer.eos_token
12
 
13
  # Base model (CPU)
 
14
  model = AutoModelForCausalLM.from_pretrained(
15
  BASE_MODEL,
16
  torch_dtype=torch.float32,
17
- offload_folder="offload",
18
- device_map={"": "cpu"},
 
19
  low_cpu_mem_usage=True
20
  )
21
 
22
- # Load LoRA
23
- model = PeftModel.from_pretrained(
24
- model,
25
- LORA_PATH,
26
- is_trainable=False
27
- )
28
  model.eval()
29
 
30
 
 
11
  tokenizer.pad_token = tokenizer.eos_token
12
 
13
  # Base model (CPU)
14
+ # 1. Base model (disk offload aktif)
15
  model = AutoModelForCausalLM.from_pretrained(
16
  BASE_MODEL,
17
  torch_dtype=torch.float32,
18
+ device_map="auto",
19
+ offload_dir="offload",
20
+ offload_state_dict=True,
21
  low_cpu_mem_usage=True
22
  )
23
 
24
+ # 2. LoRA (RAM'de kalır)
25
+ model = PeftModel.from_pretrained(model, LORA_PATH)
 
 
 
 
26
  model.eval()
27
 
28