Spaces:
Paused
Paused
zR committed on
Commit ·
5cecc58
1
Parent(s): 85c524d
cuda
Browse files
app.py
CHANGED
|
@@ -38,6 +38,7 @@ model = AutoModelForCausalLM.from_pretrained(
|
|
| 38 |
model_name,
|
| 39 |
torch_dtype=torch.bfloat16,
|
| 40 |
trust_remote_code=True,
|
|
|
|
| 41 |
attn_implementation="flash_attention_2",
|
| 42 |
)
|
| 43 |
|
|
|
|
| 38 |
model_name,
|
| 39 |
torch_dtype=torch.bfloat16,
|
| 40 |
trust_remote_code=True,
|
| 41 |
+
device="cuda",
|
| 42 |
attn_implementation="flash_attention_2",
|
| 43 |
)
|
| 44 |
|