Spaces:
Running
on
Zero
Running
on
Zero
Upload folder using huggingface_hub
Browse files
app.py
CHANGED
|
@@ -72,7 +72,8 @@ class ModelHandler:
|
|
| 72 |
self.model_path,
|
| 73 |
torch_dtype=torch.bfloat16 if torch.cuda.is_available() else torch.float32,
|
| 74 |
device_map="auto",
|
| 75 |
-
attn_implementation="flash_attention_2" if use_flash_attention else "sdpa",
|
|
|
|
| 76 |
trust_remote_code=True
|
| 77 |
)
|
| 78 |
print("✅ Model loaded successfully!")
|
|
|
|
| 72 |
self.model_path,
|
| 73 |
torch_dtype=torch.bfloat16 if torch.cuda.is_available() else torch.float32,
|
| 74 |
device_map="auto",
|
| 75 |
+
# attn_implementation="flash_attention_2" if use_flash_attention else "sdpa",
|
| 76 |
+
attn_implementation="sdpa",
|
| 77 |
trust_remote_code=True
|
| 78 |
)
|
| 79 |
print("✅ Model loaded successfully!")
|