newtechdevng committed on
Commit
139a6d6
·
verified ·
1 Parent(s): 48c2c2d

Update app.py

Browse files
Files changed (1) hide show
  1. app.py +4 -12
app.py CHANGED
@@ -1,26 +1,18 @@
1
  import gradio as gr
2
- from transformers import AutoTokenizer, AutoModelForCausalLM, AutoConfig
3
  import torch
4
 
5
  print("Loading model...")
6
  MODEL_ID = "newtechdevng/qwen-math-tutor"
7
 
8
  tokenizer = AutoTokenizer.from_pretrained(MODEL_ID)
9
-
10
- # Load and fix config — remove quantization completely
11
- config = AutoConfig.from_pretrained(MODEL_ID)
12
- if hasattr(config, "quantization_config"):
13
- delattr(config, "quantization_config") # ← delete it entirely
14
-
15
  model = AutoModelForCausalLM.from_pretrained(
16
  MODEL_ID,
17
- config = config,
18
- torch_dtype = torch.float32,
19
- low_cpu_mem_usage = True,
20
  )
21
- model = model.to("cpu")
22
  model.eval()
23
- print("Model loaded!")
24
 
25
  def solve(question, history):
26
  messages = [
 
1
  import gradio as gr
2
+ from transformers import AutoTokenizer, AutoModelForCausalLM
3
  import torch
4
 
5
  print("Loading model...")
6
  MODEL_ID = "newtechdevng/qwen-math-tutor"
7
 
8
  tokenizer = AutoTokenizer.from_pretrained(MODEL_ID)
 
 
 
 
 
 
9
  model = AutoModelForCausalLM.from_pretrained(
10
  MODEL_ID,
11
+ torch_dtype = torch.float16,
12
+ device_map = "cpu",
 
13
  )
 
14
  model.eval()
15
+ print("Model loaded!")
16
 
17
  def solve(question, history):
18
  messages = [