Spaces:
Runtime error
Runtime error
| import gradio as gr | |
| import torch | |
| from transformers import AutoModel, AutoTokenizer, AutoConfig | |
| import mdtex2html | |
| # ------------------- 模型加载 ------------------- | |
| device = "cuda" if torch.cuda.is_available() else "cpu" | |
| model_name_or_path = "THUDM/chatglm2-6b" | |
| config = AutoConfig.from_pretrained(model_name_or_path, trust_remote_code=True) | |
| config.pre_seq_len = 128 | |
| config.prefix_projection = False | |
| tokenizer = AutoTokenizer.from_pretrained(model_name_or_path, trust_remote_code=True) | |
| model = AutoModel.from_pretrained(model_name_or_path, config=config, trust_remote_code=True).float() | |
| # 加载 Prefix 参数 | |
| prefix_state_dict = torch.load("pytorch_model.bin", map_location="cpu") | |
| new_prefix_state_dict = {} | |
| for k, v in prefix_state_dict.items(): | |
| if k.startswith("transformer.prefix_encoder."): | |
| new_prefix_state_dict[k[len("transformer.prefix_encoder."):]] = v | |
| model.transformer.prefix_encoder.load_state_dict(new_prefix_state_dict) | |
| model = model.to(device) | |
| model.eval() | |
| # ------------------- Markdown 渲染 ------------------- | |
| def postprocess(self, y): | |
| if y is None: return [] | |
| for i, (message, response) in enumerate(y): | |
| y[i] = ( | |
| None if message is None else mdtex2html.convert(message), | |
| None if response is None else mdtex2html.convert(response), | |
| ) | |
| return y | |
| gr.Chatbot.postprocess = postprocess | |
| def parse_text(text): | |
| lines = [line for line in text.split("\n") if line] | |
| count = 0 | |
| for i, line in enumerate(lines): | |
| if "```" in line: | |
| count += 1 | |
| lines[i] = "<pre><code>" if count % 2 == 1 else "</code></pre>" | |
| else: | |
| if count % 2 == 1: | |
| line = (line.replace("&", "&").replace("<", "<") | |
| .replace(">", ">").replace(" ", " ")) | |
| lines[i] = "<br>" + line | |
| return "".join(lines) | |
| # ------------------- 推理函数 ------------------- | |
| def predict(input, chatbot, history, past_key_values): | |
| chatbot.append((parse_text(input), "")) | |
| history = [] # 清空历史(如需保留记忆,请改为保留) | |
| for response, history, past_key_values in model.stream_chat( | |
| tokenizer, input, history, | |
| return_past_key_values=True, | |
| past_key_values=past_key_values | |
| ): | |
| chatbot[-1] = (parse_text(input), parse_text(response)) | |
| yield chatbot, history, past_key_values | |
| def reset_user_input(): return gr.update(value='') | |
| def reset_state(): return [], [], None | |
| # ------------------- Gradio UI ------------------- | |
| with gr.Blocks(css="#chatbot .overflow-y-auto{height:400px}") as demo: | |
| gr.HTML("<h1 align='center'>DaiyuLM 🌸<br><small>林黛玉式情绪对话生成模型</small></h1>") | |
| chatbot = gr.Chatbot(elem_id="chatbot") | |
| user_input = gr.Textbox(show_label=False, placeholder="请输入一句话...", lines=2) | |
| with gr.Row(): | |
| submitBtn = gr.Button("发送", variant="primary") | |
| clearBtn = gr.Button("清空对话") | |
| history = gr.State([]) | |
| past_key_values = gr.State(None) | |
| submitBtn.click(predict, [user_input, chatbot, history, past_key_values], | |
| [chatbot, history, past_key_values]) | |
| submitBtn.click(reset_user_input, [], [user_input]) | |
| clearBtn.click(reset_state, outputs=[chatbot, history, past_key_values]) | |
| demo.queue().launch(share=True) | |