GilbertAkham committed on
Commit
4b8bb26
·
verified ·
1 Parent(s): d3cb356

Update handler.py

Browse files
Files changed (1) hide show
  1. handler.py +10 -6
handler.py CHANGED
@@ -1,21 +1,25 @@
1
  # handler.py
2
  import torch
3
  from transformers import AutoTokenizer, AutoModelForCausalLM
 
4
 
5
- MODEL_PATH = "GilbertAkham/deepseek-R1-multitask-lora"
 
6
 
7
  class EndpointHandler:
8
  def __init__(self, path=""):
9
- print("Loading merged model...")
10
- self.tokenizer = AutoTokenizer.from_pretrained(MODEL_PATH, trust_remote_code=True)
11
- self.model = AutoModelForCausalLM.from_pretrained(
12
- MODEL_PATH,
13
  torch_dtype=torch.float16,
14
  device_map="auto",
15
  trust_remote_code=True
16
  )
 
 
17
  self.model.eval()
18
- print("✅ Model loaded successfully.")
19
 
20
  def __call__(self, data):
21
  prompt = data.get("inputs", "")
 
1
  # handler.py
2
  import torch
3
  from transformers import AutoTokenizer, AutoModelForCausalLM
4
+ from peft import PeftModel
5
 
6
+ BASE_MODEL = "deepseek-ai/deepseek-coder-6.7b-instruct" # or your real base
7
+ ADAPTER_PATH = "GilbertAkham/deepseek-R1-multitask-lora"
8
 
9
  class EndpointHandler:
10
  def __init__(self, path=""):
11
+ print("Loading base model...")
12
+ self.tokenizer = AutoTokenizer.from_pretrained(BASE_MODEL, trust_remote_code=True)
13
+ base_model = AutoModelForCausalLM.from_pretrained(
14
+ BASE_MODEL,
15
  torch_dtype=torch.float16,
16
  device_map="auto",
17
  trust_remote_code=True
18
  )
19
+ print("Attaching LoRA adapter...")
20
+ self.model = PeftModel.from_pretrained(base_model, ADAPTER_PATH)
21
  self.model.eval()
22
+ print("✅ LoRA adapter loaded successfully.")
23
 
24
  def __call__(self, data):
25
  prompt = data.get("inputs", "")