Update app.py
Browse files
app.py
CHANGED
|
@@ -14,8 +14,8 @@ def load_model():
|
|
| 14 |
model = AutoModelForCausalLM.from_pretrained(
|
| 15 |
"umar141/Gemma_1B_Baro_v2_vllm",
|
| 16 |
torch_dtype=torch.float16 if torch.cuda.is_available() else torch.float32,
|
| 17 |
-
|
| 18 |
-
)
|
| 19 |
return tokenizer, model
|
| 20 |
|
| 21 |
tokenizer, model = load_model()
|
|
|
|
| 14 |
model = AutoModelForCausalLM.from_pretrained(
|
| 15 |
"umar141/Gemma_1B_Baro_v2_vllm",
|
| 16 |
torch_dtype=torch.float16 if torch.cuda.is_available() else torch.float32,
|
| 17 |
+
|
| 18 |
+
).to("cuda" if torch.cuda.is_available() else "cpu")
|
| 19 |
return tokenizer, model
|
| 20 |
|
| 21 |
tokenizer, model = load_model()
|