Spaces:
Runtime error
Runtime error
Update app.py
Browse files
app.py
CHANGED
|
@@ -33,7 +33,7 @@ def load_model():
|
|
| 33 |
base_model = AutoModelForCausalLM.from_pretrained(
|
| 34 |
BASE_MODEL,
|
| 35 |
quantization_config = bnb_config,
|
| 36 |
-
|
| 37 |
device_map="auto",
|
| 38 |
trust_remote_code=True,
|
| 39 |
offload_folder="./offload_base" # === Specify a folder for disk offloading since we are using free CPU not GPU===
|
|
|
|
| 33 |
base_model = AutoModelForCausalLM.from_pretrained(
|
| 34 |
BASE_MODEL,
|
| 35 |
quantization_config = bnb_config,
|
| 36 |
+
dtype=torch.float16, # Use half precision for faster GPU inference
|
| 37 |
device_map="auto",
|
| 38 |
trust_remote_code=True,
|
| 39 |
offload_folder="./offload_base" # === Specify a folder for disk offloading since we are using free CPU not GPU===
|