Reyad-Ahmmed committed on
Commit
cacb98b
·
verified ·
1 Parent(s): 97349c3

Update handler.py

Browse files
Files changed (1) hide show
  1. handler.py +8 -1
handler.py CHANGED
@@ -25,7 +25,14 @@ class EndpointHandler:
25
  model_name = model_dir2 #"./json_extraction_all" # Pretrained model for sentiment analysis
26
  self.tokenizer = T5Tokenizer.from_pretrained(model_name)
27
 
28
- self.model = T5ForConditionalGeneration.from_pretrained(model_name, device_map="auto")
 
 
 
 
 
 
 
29
  self.model.eval() # Set model to evaluation mode (no training)
30
 
31
  # Check if the model is on GPU
 
25
  model_name = model_dir2 #"./json_extraction_all" # Pretrained model for sentiment analysis
26
  self.tokenizer = T5Tokenizer.from_pretrained(model_name)
27
 
28
+ #self.model = T5ForConditionalGeneration.from_pretrained(model_name, device_map="auto")
29
+ # Load model in float16 for faster inference
30
+ self.model = T5ForConditionalGeneration.from_pretrained(
31
+ model_name,
32
+ torch_dtype=torch.float16, # Use float16 for faster computation
33
+ device_map="auto" # Automatically uses GPU if available
34
+ )
35
+
36
  self.model.eval() # Set model to evaluation mode (no training)
37
 
38
  # Check if the model is on GPU