Valtry committed on
Commit
6fc208d
·
verified ·
1 Parent(s): bdc78db

Update app.py

Browse files
Files changed (1) hide show
  1. app.py +3 -2
app.py CHANGED
@@ -17,7 +17,8 @@ tokenizer = AutoTokenizer.from_pretrained(model_name)
17
  print("Loading model...")
18
  model = AutoModelForCausalLM.from_pretrained(
19
  model_name,
20
- dtype=torch.float32
 
21
  ).to("cpu")
22
 
23
  print("Model loaded successfully!")
@@ -122,4 +123,4 @@ async def chat(req: ChatRequest):
122
 
123
  # Required for HuggingFace Spaces
124
  if __name__ == "__main__":
125
- uvicorn.run(app, host="0.0.0.0", port=7860)
 
17
  print("Loading model...")
18
  model = AutoModelForCausalLM.from_pretrained(
19
  model_name,
20
+ dtype=torch.float32,
21
+ low_cpu_mem_usage=True
22
  ).to("cpu")
23
 
24
  print("Model loaded successfully!")
 
123
 
124
  # Required for HuggingFace Spaces
125
  if __name__ == "__main__":
126
+ uvicorn.run(app, host="0.0.0.0", port=7860, workers=3)