anthonyfang committed on
Commit
b47b6d7
·
1 Parent(s): 67abd31

Update app.py

Browse files
Files changed (1) hide show
  1. app.py +2 -2
app.py CHANGED
@@ -1,8 +1,8 @@
1
  from transformers import AutoModel, AutoTokenizer
2
  import gradio as gr
3
 
4
- tokenizer = AutoTokenizer.from_pretrained("anthonyfang/myllm3", trust_remote_code=True)
5
- model = AutoModel.from_pretrained("anthonyfang/myllm3", trust_remote_code=True).half()
6
  model = model.eval()
7
 
8
  def predict(input, history=None):
 
1
  from transformers import AutoModel, AutoTokenizer
2
  import gradio as gr
3
 
4
+ tokenizer = AutoTokenizer.from_pretrained("THUDM/chatglm-6b", trust_remote_code=True)
5
+ model = AutoModel.from_pretrained("anthonyfang/myllm3", trust_remote_code=True).quantize(bits=4, compile_parallel_kernel=True, parallel_num=2).cpu().float()
6
  model = model.eval()
7
 
8
  def predict(input, history=None):