Update handler.py
Browse files
- handler.py +1 -1
handler.py
CHANGED
|
@@ -57,7 +57,7 @@ class EndpointHandler:
|
|
| 57 |
model_id,
|
| 58 |
trust_remote_code=True,
|
| 59 |
torch_dtype=torch.bfloat16 if torch.cuda.is_available() else torch.float32,
|
| 60 |
-
attn_implementation="
|
| 61 |
device_map="auto" if torch.cuda.is_available() else None,
|
| 62 |
token=hf_token,
|
| 63 |
)
|
|
|
|
| 57 |
model_id,
|
| 58 |
trust_remote_code=True,
|
| 59 |
torch_dtype=torch.bfloat16 if torch.cuda.is_available() else torch.float32,
|
| 60 |
+
attn_implementation="sdpa", # Use SDPA - flash_attn not installed in HF containers
|
| 61 |
device_map="auto" if torch.cuda.is_available() else None,
|
| 62 |
token=hf_token,
|
| 63 |
)
|