tcml-chatglm-chat

Runtime error

Heng666 committed on Jan 17, 2024

Commit

97208c2

verified ·

1 Parent(s): df5154d

Update app.py

Files changed (1) hide show

app.py CHANGED Viewed

@@ -2,14 +2,21 @@ import gradio as gr
 import torch
 from transformers import AutoModelForCausalLM, AutoTokenizer, AutoModel
 from transformers import StoppingCriteria, StoppingCriteriaList, TextIteratorStreamer
 from threading import Thread
 # Loading the tokenizer and model from Hugging Face's model hub.
 # model_name_or_path = "TinyLlama/TinyLlama-1.1B-Chat-v1.0"
 model_name_or_path = "Flmc/DISC-MedLLM"
-tokenizer = AutoTokenizer.from_pretrained(model_name_or_path,trust_remote_code=True)
 # model = AutoModelForCausalLM.from_pretrained(model_name,trust_remote_code=True)
-model = AutoModel.from_pretrained(model_name_or_path, trust_remote_code=True)
 # using CUDA for an optimal experience
 device = torch.device('cuda' if torch.cuda.is_available() else 'cpu')

 import torch
 from transformers import AutoModelForCausalLM, AutoTokenizer, AutoModel
 from transformers import StoppingCriteria, StoppingCriteriaList, TextIteratorStreamer
+from transformers.generation.utils import GenerationConfig
 from threading import Thread
 # Loading the tokenizer and model from Hugging Face's model hub.
 # model_name_or_path = "TinyLlama/TinyLlama-1.1B-Chat-v1.0"
 model_name_or_path = "Flmc/DISC-MedLLM"
+# tokenizer = AutoTokenizer.from_pretrained(model_name_or_path,trust_remote_code=True)
 # model = AutoModelForCausalLM.from_pretrained(model_name,trust_remote_code=True)
+# model = AutoModel.from_pretrained(model_name_or_path, trust_remote_code=True)
+tokenizer = AutoTokenizer.from_pretrained(model_name_or_path, use_fast=False, trust_remote_code=True)
+model = AutoModelForCausalLM.from_pretrained(model_name_or_path, device_map="auto", torch_dtype=torch.float16, trust_remote_code=True)
+model.generation_config = GenerationConfig.from_pretrained(model_name_or_path)
 # using CUDA for an optimal experience
 device = torch.device('cuda' if torch.cuda.is_available() else 'cpu')