Spaces:
Running
Running
Update app.py
Browse files
app.py
CHANGED
|
@@ -32,6 +32,7 @@ def load_model():
|
|
| 32 |
attn_implementation="sdpa", # SDPA is fine on CPU; avoid flash-attn on CPU
|
| 33 |
torch_dtype=torch.float32, # Safer default for CPU
|
| 34 |
device_map="cpu" # Ensure CPU execution
|
|
|
|
| 35 |
)
|
| 36 |
model.eval()
|
| 37 |
|
|
|
|
| 32 |
attn_implementation="sdpa", # SDPA is fine on CPU; avoid flash-attn on CPU
|
| 33 |
torch_dtype=torch.float32, # Safer default for CPU
|
| 34 |
device_map="cpu" # Ensure CPU execution
|
| 35 |
+
quantization_config=None,
|
| 36 |
)
|
| 37 |
model.eval()
|
| 38 |
|