Update app.py
Browse files
app.py
CHANGED
|
@@ -27,7 +27,7 @@ model = AutoModelForCausalLM.from_pretrained(model_id,
|
|
| 27 |
)
|
| 28 |
|
| 29 |
replace_linears_in_hf(model)
|
| 30 |
-
model
|
| 31 |
@spaces.GPU
|
| 32 |
def generate_response(user_input, max_new_tokens, temperature):
|
| 33 |
os.system("nvidia-smi")
|
|
|
|
| 27 |
)
|
| 28 |
|
| 29 |
replace_linears_in_hf(model)
|
| 30 |
+
model.to('cuda').eval()
|
| 31 |
@spaces.GPU
|
| 32 |
def generate_response(user_input, max_new_tokens, temperature):
|
| 33 |
os.system("nvidia-smi")
|