CGQN committed on
Commit
71021b9
·
verified ·
1 Parent(s): 547dee4

Update app.py

Browse files
Files changed (1) hide show
  1. app.py +1 -0
app.py CHANGED
@@ -32,6 +32,7 @@ def load_model():
32
  attn_implementation="sdpa", # SDPA is fine on CPU; avoid flash-attn on CPU
33
  torch_dtype=torch.float32, # Safer default for CPU
34
  device_map="cpu" # Ensure CPU execution
 
35
  )
36
  model.eval()
37
 
 
32
  attn_implementation="sdpa", # SDPA is fine on CPU; avoid flash-attn on CPU
33
  torch_dtype=torch.float32, # Safer default for CPU
34
  device_map="cpu" # Ensure CPU execution
35
+ quantization_config=None,
36
  )
37
  model.eval()
38