Update handler.py
Browse files - handler.py (+1 -1)
handler.py
CHANGED
|
@@ -20,7 +20,7 @@ class EndpointHandler:
|
|
| 20 |
torch_dtype=torch.bfloat16, # ✅ Changed to bfloat16
|
| 21 |
trust_remote_code=True,
|
| 22 |
device_map="auto",
|
| 23 |
-
attn_implementation="flash_attention_2" # ✅ Faster + stable
|
| 24 |
)
|
| 25 |
self.model.eval()
|
| 26 |
print("✅ Model loaded successfully!")
|
|
|
|
| 20 |
torch_dtype=torch.bfloat16, # ✅ Changed to bfloat16
|
| 21 |
trust_remote_code=True,
|
| 22 |
device_map="auto",
|
| 23 |
+
# attn_implementation="flash_attention_2" # ✅ Faster + stable
|
| 24 |
)
|
| 25 |
self.model.eval()
|
| 26 |
print("✅ Model loaded successfully!")
|