Files changed (1) hide show
  1. app.py +2 -2
app.py CHANGED
@@ -12,11 +12,11 @@ import torch
12
  # torch_dtype=torch.float16, # Reduce memory usage
13
  # )
14
 
15
- from optimum.intel import OVModelForCausalLM
16
  from transformers import AutoTokenizer
17
 
18
  model_name = "abhifdsdf/good_disease_8bit"
19
- model = OVModelForCausalLM.from_pretrained(model_name)
20
  tokenizer = AutoTokenizer.from_pretrained(model_name)
21
 
22
 
 
12
  # torch_dtype=torch.float16, # Reduce memory usage
13
  # )
14
 
15
+ from auto_gptq import AutoGPTQForCausalLM
16
  from transformers import AutoTokenizer
17
 
18
  model_name = "abhifdsdf/good_disease_8bit"
19
+ model = AutoGPTQForCausalLM.from_quantized(model_name)  # from_pretrained() needs a quantize_config and targets un-quantized weights; assumes this repo holds a GPTQ checkpoint - TODO confirm
20
  tokenizer = AutoTokenizer.from_pretrained(model_name)
21
 
22