Spaces:

caixiaoshun
/

DaiyuLM

Runtime error

App Files Files Community

DaiyuLM / app.py

caixiaoshun

Update app.py

4c6dac5 verified 10 months ago

raw

history blame contribute delete

3.35 kB

	import gradio as gr
	import torch
	from transformers import AutoModel, AutoTokenizer, AutoConfig
	import mdtex2html

	# ------------------- 模型加载 -------------------
	device = "cuda" if torch.cuda.is_available() else "cpu"
	model_name_or_path = "THUDM/chatglm2-6b"

	config = AutoConfig.from_pretrained(model_name_or_path, trust_remote_code=True)
	config.pre_seq_len = 128
	config.prefix_projection = False

	tokenizer = AutoTokenizer.from_pretrained(model_name_or_path, trust_remote_code=True)
	model = AutoModel.from_pretrained(model_name_or_path, config=config, trust_remote_code=True).float()

	# 加载 Prefix 参数
	prefix_state_dict = torch.load("pytorch_model.bin", map_location="cpu")
	new_prefix_state_dict = {}
	for k, v in prefix_state_dict.items():
	if k.startswith("transformer.prefix_encoder."):
	new_prefix_state_dict[k[len("transformer.prefix_encoder."):]] = v
	model.transformer.prefix_encoder.load_state_dict(new_prefix_state_dict)

	model = model.to(device)
	model.eval()

	# ------------------- Markdown 渲染 -------------------
	def postprocess(self, y):
	if y is None: return []
	for i, (message, response) in enumerate(y):
	y[i] = (
	None if message is None else mdtex2html.convert(message),
	None if response is None else mdtex2html.convert(response),
	)
	return y

	gr.Chatbot.postprocess = postprocess

	def parse_text(text):
	lines = [line for line in text.split("\n") if line]
	count = 0
	for i, line in enumerate(lines):
	if "```" in line:
	count += 1
	lines[i] = "<pre><code>" if count % 2 == 1 else "</code></pre>"
	else:
	if count % 2 == 1:
	line = (line.replace("&", "&").replace("<", "<")
	.replace(">", ">").replace(" ", " "))
	lines[i] = "<br>" + line
	return "".join(lines)

	# ------------------- 推理函数 -------------------
	def predict(input, chatbot, history, past_key_values):
	chatbot.append((parse_text(input), ""))
	history = [] # 清空历史（如需保留记忆，请改为保留）

	for response, history, past_key_values in model.stream_chat(
	tokenizer, input, history,
	return_past_key_values=True,
	past_key_values=past_key_values
	):
	chatbot[-1] = (parse_text(input), parse_text(response))
	yield chatbot, history, past_key_values

	def reset_user_input(): return gr.update(value='')
	def reset_state(): return [], [], None

	# ------------------- Gradio UI -------------------
	with gr.Blocks(css="#chatbot .overflow-y-auto{height:400px}") as demo:
	gr.HTML("<h1 align='center'>DaiyuLM 🌸<br><small>林黛玉式情绪对话生成模型</small></h1>")
	chatbot = gr.Chatbot(elem_id="chatbot")
	user_input = gr.Textbox(show_label=False, placeholder="请输入一句话...", lines=2)

	with gr.Row():
	submitBtn = gr.Button("发送", variant="primary")
	clearBtn = gr.Button("清空对话")

	history = gr.State([])
	past_key_values = gr.State(None)

	submitBtn.click(predict, [user_input, chatbot, history, past_key_values],
	[chatbot, history, past_key_values])
	submitBtn.click(reset_user_input, [], [user_input])
	clearBtn.click(reset_state, outputs=[chatbot, history, past_key_values])

	demo.queue().launch(share=True)