Shahbazakbar committed on
Commit
fffa177
·
verified ·
1 Parent(s): 5afc8e2

Update app.py

Browse files
Files changed (1) hide show
  1. app.py +2 -2
app.py CHANGED
@@ -5,8 +5,8 @@ import torch
5
  zephyr_tokenizer = AutoTokenizer.from_pretrained("HuggingFaceH4/zephyr-7b-alpha")
6
  zephyr_model = AutoModelForCausalLM.from_pretrained(
7
  "HuggingFaceH4/zephyr-7b-alpha",
8
- #torch_dtype=torch.float16, # Use half-precision for faster inference
9
- #device_map="auto" # Automatically loads the model on GPU if available
10
  )
11
 
12
  def generate_response(prompt):
 
5
  zephyr_tokenizer = AutoTokenizer.from_pretrained("HuggingFaceH4/zephyr-7b-alpha")
6
  zephyr_model = AutoModelForCausalLM.from_pretrained(
7
  "HuggingFaceH4/zephyr-7b-alpha",
8
+ torch_dtype=torch.float16, # Use half-precision for faster inference
9
+ device_map="auto" # Automatically loads the model on GPU if available
10
  )
11
 
12
  def generate_response(prompt):