newtechdevng committed on
Commit
48c2c2d
·
verified ·
1 Parent(s): 01f27e4

Update app.py

Browse files
Files changed (1) hide show
  1. app.py +7 -4
app.py CHANGED
@@ -7,16 +7,19 @@ MODEL_ID = "newtechdevng/qwen-math-tutor"
7
 
8
  tokenizer = AutoTokenizer.from_pretrained(MODEL_ID)
9
 
10
- # Load config and strip quantization settings
11
  config = AutoConfig.from_pretrained(MODEL_ID)
12
- config.quantization_config = {} # ← remove baked-in quantization
 
13
 
14
  model = AutoModelForCausalLM.from_pretrained(
15
  MODEL_ID,
16
- config = config,
17
- dtype = torch.float32, # ← fixed from torch_dtype
 
18
  )
19
  model = model.to("cpu")
 
20
  print("Model loaded!")
21
 
22
  def solve(question, history):
 
7
 
8
  tokenizer = AutoTokenizer.from_pretrained(MODEL_ID)
9
 
10
+ # Load the config and remove its quantization settings completely
11
  config = AutoConfig.from_pretrained(MODEL_ID)
12
+ if hasattr(config, "quantization_config"):
13
+ delattr(config, "quantization_config") # ← delete it entirely
14
 
15
  model = AutoModelForCausalLM.from_pretrained(
16
  MODEL_ID,
17
+ config = config,
18
+ torch_dtype = torch.float32,
19
+ low_cpu_mem_usage = True,
20
  )
21
  model = model.to("cpu")
22
+ model.eval()
23
  print("Model loaded!")
24
 
25
  def solve(question, history):