RanjithaRuttala committed on
Commit
c4ffa19
·
verified ·
1 Parent(s): 4791ca0

Update handler.py

Browse files
Files changed (1) hide show
  1. handler.py +1 -1
handler.py CHANGED
@@ -20,7 +20,7 @@ class EndpointHandler:
20
  torch_dtype=torch.bfloat16, # ✅ Changed to bfloat16
21
  trust_remote_code=True,
22
  device_map="auto",
23
- attn_implementation="flash_attention_2" # ✅ Faster + stable
24
  )
25
  self.model.eval()
26
  print("✅ Model loaded successfully!")
 
20
  torch_dtype=torch.bfloat16, # ✅ Changed to bfloat16
21
  trust_remote_code=True,
22
  device_map="auto",
23
+ # attn_implementation="flash_attention_2" # ✅ Faster + stable
24
  )
25
  self.model.eval()
26
  print("✅ Model loaded successfully!")