Spaces:

sshenai
/

DPLproject

Runtime error

App Files Files Community

sshenai committed on May 20, 2025

Commit

d32f0b3

verified ·

1 Parent(s): e164259

Update app.py

Browse files

Files changed (1) hide show

app.py +82 -51

app.py CHANGED Viewed

@@ -1,73 +1,99 @@
 # -*- coding: utf-8 -*-
 """
-鸟类知识科普系统（Qwen3优化版） by [你的名字]
 ISOM5240 Group Project
 """
 import gradio as gr
-from transformers import pipeline, AutoModelForCausalLM, AutoTokenizer
 from PIL import Image
 import torch
-# 强制清理旧版缓存
-from transformers.utils import move_cache
-move_cache()
# Model initialisation (Qwen text generator)
def init_models():
    """Build the three Hugging Face pipelines used by the app.

    Returns:
        tuple: ``(classifier, text_generator, tts)`` -- an image-classification
        pipeline, a text-generation pipeline and a text-to-speech pipeline,
        in that order.
    """
    # GPU 0 when CUDA is available, otherwise -1 (CPU).
    device = 0 if torch.cuda.is_available() else -1

    # Bird species classifier.
    classifier = pipeline(
        "image-classification",
        model="chriamue/bird-species-classifier",
        device=device,
    )

    # Text generator. `revision` is a top-level pipeline() argument:
    # pipeline() forwards its own `revision` to from_pretrained() together
    # with `model_kwargs`, so repeating the key inside `model_kwargs`
    # supplies it twice (duplicate keyword argument).
    text_generator = pipeline(
        "text-generation",
        model="Qwen/Qwen-7B-Chat",
        revision="main",
        device_map="auto",
        torch_dtype=torch.bfloat16,
        trust_remote_code=True,  # required for this checkpoint
        model_kwargs={
            # Request a fresh download instead of reusing cached files.
            "force_download": True,
        },
    )

    # Speech synthesis.
    tts = pipeline(
        "text-to-speech",
        model="facebook/mms-tts-eng",
        device=device,
    )
    return classifier, text_generator, tts
# Generate a child-friendly bird description
def generate_child_friendly_text(bird_name, generator=None):
    """Return a short, child-friendly description of ``bird_name``.

    Args:
        bird_name: Species label to describe; interpolated into the prompt.
        generator: Optional callable with the text-generation pipeline call
            signature ``generator(prompt, **generation_kwargs)`` returning
            ``[{"generated_text": str}]``. Defaults to the module-level
            ``text_generator``.

    Returns:
        str: The generated text with the echoed prompt removed and
        surrounding whitespace stripped.
    """
    PROMPT = f"""以6-12岁儿童能理解的方式描述{bird_name}：
1. 用比喻手法（如：羽毛像彩虹糖纸）
2. 包含一个趣味冷知识（例如：每天吃相当于自身体重30%的食物）
3. 语句长度不超过15个英文单词
4. 避免使用专业术语"""
    generate = text_generator if generator is None else generator
    response = generate(
        PROMPT,
        max_new_tokens=150,
        temperature=0.7,
        do_sample=True
    )
    full_text = response[0]['generated_text']
    # The generated text normally starts with the prompt itself. Picking a
    # fixed line index would then return one of the prompt's own rules (and
    # raise IndexError on short output), so drop the prompt prefix instead.
    if full_text.startswith(PROMPT):
        full_text = full_text[len(PROMPT):]
    return full_text.strip()
-# 主处理流程
 def process_image(image):
     try:
         classification = classifier(image)
         bird_name = classification[0]['label']
         description = generate_child_friendly_text(bird_name)
-        speech = tts(description, forward_params={"speaker_id": 6})
         return {
             "bird_name": bird_name,
@@ -77,33 +103,38 @@ def process_image(image):
     except Exception as e:
         return f"处理错误: {str(e)}"
# Load the pipelines once at import time; the handlers read them as globals.
classifier, text_generator, tts = init_models()

# Gradio UI: static settings first, then the layout.
page_css = ".gradio-container {max-width: 800px}"
sample_images = ["eagle.jpg", "penguin.jpg", "peacock.jpg"]

with gr.Blocks(theme=gr.themes.Soft(), css=page_css) as demo:
    gr.Markdown("# 🐦 鸟类知识小课堂（Qwen3版）")

    # Row: uploaded picture next to the spoken explanation.
    with gr.Row():
        image_input = gr.Image(type="pil", label="上传鸟类图片", height=300)
        audio_output = gr.Audio(label="语音讲解", autoplay=True)

    # Column: recognised species and the generated fun fact.
    with gr.Column():
        name_output = gr.Textbox(label="识别到的鸟类")
        text_output = gr.Textbox(label="趣味知识", lines=4)

    examples = gr.Examples(
        examples=sample_images,
        inputs=image_input,
        label="示例图片",
    )

    # Re-run the whole pipeline whenever the image changes.
    result_components = [name_output, text_output, audio_output]
    image_input.change(
        process_image,
        inputs=image_input,
        outputs=result_components,
    )

# Deployment: listen on all interfaces, port 7860.
if __name__ == "__main__":
    launch_options = {"server_name": "0.0.0.0", "server_port": 7860}
    demo.launch(**launch_options)

 # -*- coding: utf-8 -*-
 """
+鸟类知识科普系统（兼容版）by [你的名字]
 ISOM5240 Group Project
 """
 import gradio as gr
+from transformers import pipeline, AutoModelForCausalLM
 from PIL import Image
 import torch
+import shutil
+import os
+from pathlib import Path
# ---- Cache cleanup (independent of the transformers version) ----
def clear_hf_cache():
    """Delete the known Hugging Face cache directories, if they exist.

    Candidates, in order: ``~/.cache/huggingface/hub``, the directory named
    by the ``TRANSFORMERS_CACHE`` environment variable (only when it is set
    to a non-empty value), and a ``transformers`` directory relative to the
    current working directory.

    A candidate is never deleted when it resolves to the current working
    directory, one of its ancestors, or the user's home directory. Without
    this guard an unset ``TRANSFORMERS_CACHE`` becomes ``Path("")`` -- i.e.
    ``.`` -- and the application's own directory would be removed.

    Deletion is best-effort: errors raised while removing a tree are ignored.
    """
    candidates = [Path("~/.cache/huggingface/hub")]  # Linux/macOS default
    custom_cache = os.environ.get("TRANSFORMERS_CACHE", "").strip()
    if custom_cache:
        candidates.append(Path(custom_cache))  # user-configured cache path
    candidates.append(Path("transformers"))  # relative cache dir (Colab)

    cwd = Path.cwd().resolve()
    protected = {cwd, *cwd.parents, Path.home().resolve()}
    seen = set()

    for candidate in candidates:
        expanded_path = candidate.expanduser()
        resolved = expanded_path.resolve()
        # Skip duplicates and anything that would take the app down with it.
        if resolved in seen or resolved in protected:
            continue
        seen.add(resolved)
        if expanded_path.is_dir():
            print(f"清理缓存目录: {expanded_path}")
            shutil.rmtree(expanded_path, ignore_errors=True)
# ---- Model initialisation ----
def init_models():
    """Clear the Hugging Face cache, then build the app's three pipelines.

    Returns:
        tuple: ``(classifier, text_generator, tts)`` -- an image-classification
        pipeline, a text-generation pipeline and a text-to-speech pipeline,
        in that order.
    """
    clear_hf_cache()  # start from a clean cache

    # GPU 0 when CUDA is available, otherwise -1 (CPU).
    device = 0 if torch.cuda.is_available() else -1

    # 1. Bird species classifier.
    classifier = pipeline(
        task="image-classification",
        model="chriamue/bird-species-classifier",
        device=device,
    )

    # 2. Text generator (Qwen/Qwen-7B-Chat). `revision` is a top-level
    # pipeline() argument: pipeline() forwards its own `revision` to
    # from_pretrained() together with `model_kwargs`, so repeating the key
    # inside `model_kwargs` supplies it twice (duplicate keyword argument).
    text_generator = pipeline(
        task="text-generation",
        model="Qwen/Qwen-7B-Chat",
        revision="main",
        device_map="auto",
        torch_dtype=torch.bfloat16,
        trust_remote_code=True,
        model_kwargs={
            # Request a fresh download instead of reusing cached files.
            "force_download": True,
        },
    )

    # 3. Speech synthesis.
    tts = pipeline(
        task="text-to-speech",
        model="facebook/mms-tts-eng",
        device=device,
    )
    return classifier, text_generator, tts
# ---- Core processing logic ----
def generate_child_friendly_text(bird_name, generator=None):
    """Return a short, child-friendly description of ``bird_name``.

    Args:
        bird_name: Species label to describe; interpolated into the prompt.
        generator: Optional callable with the text-generation pipeline call
            signature ``generator(prompt, **generation_kwargs)`` returning
            ``[{"generated_text": str}]``. Defaults to the module-level
            ``text_generator``.

    Returns:
        str: The generated text with the echoed prompt, ``**`` emphasis
        markers and code-fence markers removed, and surrounding whitespace
        stripped.
    """
    PROMPT = f"""以6-12岁儿童能理解的方式描述{bird_name}：
    1. 使用比喻手法（如：羽毛像彩虹糖纸）
    2. 包含一个趣味冷知识（例如：每天吃相当于自身体重30%的食物）
    3. 语句长度不超过15个英文单词
    4. 避免使用专业术语"""
    generate = text_generator if generator is None else generator
    response = generate(
        PROMPT,
        max_new_tokens=150,
        temperature=0.7,
        top_p=0.9,
        do_sample=True
    )
    full_text = response[0]['generated_text']
    # Drop the whole echoed prompt. Splitting on the first prompt line alone
    # leaves the four numbered rules in the text that is shown and spoken.
    if full_text.startswith(PROMPT):
        full_text = full_text[len(PROMPT):]
    # Remove Markdown emphasis and code-fence markers from the output.
    for marker in ("**", "```"):
        full_text = full_text.replace(marker, "")
    return full_text.strip()
 def process_image(image):
+    """处理图片生成结果的完整流程"""
     try:
+        # 步骤1: 鸟类识别
         classification = classifier(image)
         bird_name = classification[0]['label']
+        # 步骤2: 生成描述
         description = generate_child_friendly_text(bird_name)
+        # 步骤3: 语音合成
+        speech = tts(description, forward_params={"speaker_id": 6})  # 使用儿童音色
         return {
             "bird_name": bird_name,
     except Exception as e:
         return f"处理错误: {str(e)}"
# ---- Start-up and UI ----
if __name__ == "__main__":
    # Load the pipelines; the processing functions read them as globals.
    classifier, text_generator, tts = init_models()

    # Static UI settings.
    page_css = ".gradio-container {max-width: 800px}"
    sample_images = ["eagle.jpg", "penguin.jpg", "peacock.jpg"]

    # Gradio layout.
    with gr.Blocks(theme=gr.themes.Soft(), css=page_css) as demo:
        gr.Markdown("# 🐦 鸟类知识小课堂（兼容版）")

        # Row: uploaded picture next to the spoken explanation.
        with gr.Row():
            image_input = gr.Image(type="pil", label="上传鸟类图片", height=300)
            audio_output = gr.Audio(label="语音讲解", autoplay=True)

        # Column: recognised species and the generated fun fact.
        with gr.Column():
            name_output = gr.Textbox(label="识别到的鸟类")
            text_output = gr.Textbox(label="趣味知识", lines=4)

        examples = gr.Examples(
            examples=sample_images,
            inputs=image_input,
            label="示例图片",
        )

        # Re-run the whole pipeline whenever the image changes.
        result_components = [name_output, text_output, audio_output]
        image_input.change(
            process_image,
            inputs=image_input,
            outputs=result_components,
        )

    # Start the server on all interfaces, port 7860, with a share link.
    launch_options = {
        "server_name": "0.0.0.0",
        "server_port": 7860,
        "share": True,
    }
    demo.launch(**launch_options)