Spaces:
Sleeping
Sleeping
Update app.py
Browse files
app.py
CHANGED
|
@@ -89,10 +89,7 @@ def append_log(logs: str, msg: str) -> str:
|
|
| 89 |
# ==========================================
|
| 90 |
|
| 91 |
def ensure_model(model_state: Dict, repo_id: str, device_map: str, dtype_name: str, logs: str):
|
| 92 |
-
|
| 93 |
-
Only (re)load when repo_id changes or model_state is empty.
|
| 94 |
-
device_map/dtype_name 变更不会触发重新加载(按你的要求)。
|
| 95 |
-
"""
|
| 96 |
ms = model_state or {"repo_id": None, "tok": None, "model": None}
|
| 97 |
if ms.get("repo_id") != repo_id or ms.get("model") is None:
|
| 98 |
logs = append_log(logs, f"加载模型 {repo_id}(触发:repo 变更)…")
|
|
@@ -114,10 +111,7 @@ def predict(user_text: str,
|
|
| 114 |
max_new_token: int, top_k: int,
|
| 115 |
logs_state: str,
|
| 116 |
model_state: Dict):
|
| 117 |
-
|
| 118 |
-
Only reload when repo_id changes.
|
| 119 |
-
Expects custom model.chat(conversations, tokenizer, max_new_token=..., top_k=...).
|
| 120 |
-
"""
|
| 121 |
messages_state = messages_state or []
|
| 122 |
logs_state = logs_state or ""
|
| 123 |
|
|
@@ -181,11 +175,6 @@ def preload_on_repo_change(repo_id: str, device_map: str, dtype_name: str, logs_
|
|
| 181 |
# Gradio UI
|
| 182 |
# ==========================================
|
| 183 |
with gr.Blocks(title="mini-moe Chat (Gradio)") as demo:
|
| 184 |
-
gr.Markdown("""
|
| 185 |
-
# 🤖 mini-moe Chat UI (Gradio)
|
| 186 |
-
仅在 **repo 变更** 时重新加载模型;设备/精度变更不会触发重新加载(按你的要求)。
|
| 187 |
-
右侧含 **日志面板**,实时显示加载与推理步骤;**不使用 system prompt**。
|
| 188 |
-
""")
|
| 189 |
|
| 190 |
messages_state = gr.State([]) # 保存 role/content 历史
|
| 191 |
logs_state = gr.State("") # 保存日志文本
|
|
|
|
| 89 |
# ==========================================
|
| 90 |
|
| 91 |
def ensure_model(model_state: Dict, repo_id: str, device_map: str, dtype_name: str, logs: str):
|
| 92 |
+
|
|
|
|
|
|
|
|
|
|
| 93 |
ms = model_state or {"repo_id": None, "tok": None, "model": None}
|
| 94 |
if ms.get("repo_id") != repo_id or ms.get("model") is None:
|
| 95 |
logs = append_log(logs, f"加载模型 {repo_id}(触发:repo 变更)…")
|
|
|
|
| 111 |
max_new_token: int, top_k: int,
|
| 112 |
logs_state: str,
|
| 113 |
model_state: Dict):
|
| 114 |
+
|
|
|
|
|
|
|
|
|
|
| 115 |
messages_state = messages_state or []
|
| 116 |
logs_state = logs_state or ""
|
| 117 |
|
|
|
|
| 175 |
# Gradio UI
|
| 176 |
# ==========================================
|
| 177 |
with gr.Blocks(title="mini-moe Chat (Gradio)") as demo:
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 178 |
|
| 179 |
messages_state = gr.State([]) # 保存 role/content 历史
|
| 180 |
logs_state = gr.State("") # 保存日志文本
|