TymaaHammouda committed on
Commit
24eadb0
·
verified ·
1 Parent(s): c3dacfc

Update app.py

Browse files
Files changed (1) hide show
  1. app.py +2 -1
app.py CHANGED
@@ -46,7 +46,7 @@ def build_prompt(req1, req2, prompt_type="zero-shot"):
46
  @app.on_event("startup")
47
  def load_models():
48
  print("Loading smaller DeepSeek model into memory...")
49
- deepseek_name = "deepseek-ai/deepseek-vl2-small" # smaller model
50
  app.state.deepseek_tokenizer = AutoTokenizer.from_pretrained(deepseek_name)
51
  app.state.deepseek_tokenizer.pad_token = app.state.deepseek_tokenizer.eos_token
52
  app.state.deepseek_model = AutoModelForCausalLM.from_pretrained(
@@ -54,6 +54,7 @@ def load_models():
54
  torch_dtype=torch.float32 # CPU only
55
  )
56
 
 
57
  # -----------------------------
58
  # Model handlers
59
  # -----------------------------
 
46
  @app.on_event("startup")
47
  def load_models():
48
  print("Loading smaller DeepSeek model into memory...")
49
+ deepseek_name = "deepseek-ai/deepseek-coder-1.3b-base" # smaller, supported model
50
  app.state.deepseek_tokenizer = AutoTokenizer.from_pretrained(deepseek_name)
51
  app.state.deepseek_tokenizer.pad_token = app.state.deepseek_tokenizer.eos_token
52
  app.state.deepseek_model = AutoModelForCausalLM.from_pretrained(
 
54
  torch_dtype=torch.float32 # CPU only
55
  )
56
 
57
+
58
  # -----------------------------
59
  # Model handlers
60
  # -----------------------------