TymaaHammouda committed on
Commit
9d495ed
·
verified ·
1 Parent(s): a4960af

Update app.py

Browse files
Files changed (1) hide show
  1. app.py +5 -2
app.py CHANGED
@@ -49,12 +49,15 @@ def load_models():
49
  model_name = "deepseek-ai/DeepSeek-R1-Distill-Llama-8B"
50
  app.state.deepseek_tokenizer = AutoTokenizer.from_pretrained(model_name)
51
  app.state.deepseek_tokenizer.pad_token = app.state.deepseek_tokenizer.eos_token
52
-
53
  app.state.deepseek_model = AutoModelForCausalLM.from_pretrained(
54
  model_name,
55
- load_in_8bit=True, # requires bitsandbytes device_map="auto"
 
 
56
  )
57
 
 
58
  # -----------------------------
59
  # Model handlers
60
  # -----------------------------
 
49
  model_name = "deepseek-ai/DeepSeek-R1-Distill-Llama-8B"
50
  app.state.deepseek_tokenizer = AutoTokenizer.from_pretrained(model_name)
51
  app.state.deepseek_tokenizer.pad_token = app.state.deepseek_tokenizer.eos_token
52
+
53
  app.state.deepseek_model = AutoModelForCausalLM.from_pretrained(
54
  model_name,
55
+ torch_dtype="auto",
56
+ device_map="auto",
57
+ offload_folder="offload"
58
  )
59
 
60
+
61
  # -----------------------------
62
  # Model handlers
63
  # -----------------------------