dynamodenis254 committed on
Commit
7b70643
·
verified ·
1 Parent(s): 3197abd

Update app.py

Browse files
Files changed (1) hide show
  1. app.py +1 -1
app.py CHANGED
@@ -33,7 +33,7 @@ def load_model():
33
  base_model = AutoModelForCausalLM.from_pretrained(
34
  BASE_MODEL,
35
  quantization_config = bnb_config,
36
- torch_dtype=torch.float16, # Use half precision for faster GPU inference
37
  device_map="auto",
38
  trust_remote_code=True,
39
  offload_folder="./offload_base" # === Specify a folder for disk offloading since we are using free CPU not GPU===
 
33
  base_model = AutoModelForCausalLM.from_pretrained(
34
  BASE_MODEL,
35
  quantization_config = bnb_config,
36
+ dtype=torch.float16, # Use half precision for faster GPU inference
37
  device_map="auto",
38
  trust_remote_code=True,
39
  offload_folder="./offload_base" # === Specify a folder for disk offloading since we are using free CPU not GPU===