handaru2002 committed on
Commit
14cf7fa
·
verified ·
1 Parent(s): 4a20f56

Update app.py

Browse files
Files changed (1) hide show
  1. app.py +3 -2
app.py CHANGED
@@ -42,11 +42,12 @@ LLM_MODEL = "mistralai/Mistral-7B-Instruct-v0.2"
42
  # "Qwen/Qwen2.5-7B-Instruct"
43
 
44
  llm_tokenizer = AutoTokenizer.from_pretrained(LLM_MODEL)
 
45
  llm_model = AutoModelForCausalLM.from_pretrained(
46
  LLM_MODEL,
47
- device_map="auto",
48
  torch_dtype=torch.float16 if device == "cuda" else torch.float32
49
- )
 
50
  llm_model.eval()
51
 
52
  # ============================================================
 
42
  # "Qwen/Qwen2.5-7B-Instruct"
43
 
44
  llm_tokenizer = AutoTokenizer.from_pretrained(LLM_MODEL)
45
+
46
  llm_model = AutoModelForCausalLM.from_pretrained(
47
  LLM_MODEL,
 
48
  torch_dtype=torch.float16 if device == "cuda" else torch.float32
49
+ ).to(device)
50
+
51
  llm_model.eval()
52
 
53
  # ============================================================