MudassirFayaz committed on
Commit
6ef538a
·
verified ·
1 Parent(s): 270cdf9

added the handler

Browse files
Files changed (1) hide show
  1. handler.py +16 -0
handler.py ADDED
@@ -0,0 +1,16 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ from transformers import AutoTokenizer, AutoModelForCausalLM
2
+ import torch
3
+
4
class EndpointHandler:
    """Text-generation handler wrapping a causal language model.

    The tokenizer and model are loaded once from ``path`` at construction
    time; each call tokenizes the prompt found in the request payload,
    generates a continuation and returns the decoded text.
    """

    # Generation length used when the request does not override it.
    DEFAULT_MAX_NEW_TOKENS = 200

    def __init__(self, path=""):
        """Load the tokenizer and the float16 model stored at ``path``.

        Args:
            path: Location handed to ``from_pretrained`` for both the
                tokenizer and the model.
        """
        self.tokenizer = AutoTokenizer.from_pretrained(path)
        self.model = AutoModelForCausalLM.from_pretrained(
            path, torch_dtype=torch.float16
        )
        # The weights are loaded in half precision; place them on the GPU
        # when one is present so generation does not run on the CPU.
        # NOTE(review): on CPU-only hosts float16 may be slow or unsupported
        # for some ops depending on the torch version -- confirm the target.
        if torch.cuda.is_available():
            self.model.to("cuda")
        self.model.eval()

    def __call__(self, inputs):
        """Generate text for the prompt contained in the request payload.

        Args:
            inputs: Request payload. ``inputs["inputs"]`` is the prompt
                (defaults to ``""``). An optional ``inputs["parameters"]``
                mapping is forwarded as keyword arguments to
                ``model.generate`` and may override ``max_new_tokens``.

        Returns:
            A dict ``{"generated_text": <decoded first output sequence>}``.
        """
        prompt = inputs.get("inputs", "")

        # Start from the default and let request parameters override it.
        generation_kwargs = {"max_new_tokens": self.DEFAULT_MAX_NEW_TOKENS}
        generation_kwargs.update(inputs.get("parameters") or {})

        # Keep the encoded batch under its own name instead of rebinding
        # the ``inputs`` parameter.
        encoded = self.tokenizer(prompt, return_tensors="pt").to(self.model.device)
        with torch.no_grad():
            outputs = self.model.generate(**encoded, **generation_kwargs)

        response = self.tokenizer.decode(outputs[0], skip_special_tokens=True)
        return {"generated_text": response}