Spaces:

sshenai
/

FinalProject

Build error

App Files Community

sshenai committed on May 20, 2025

Commit

50d090f

verified ·

1 Parent(s): 0bd9eee

Update app.py

Browse files

Files changed (1) hide show

app.py +57 -47

app.py CHANGED Viewed

@@ -1,27 +1,36 @@
 import gradio as gr
-from transformers import pipeline
 from PIL import Image
 import torch
-# 初始化模型（缓存加载）
 def init_models():
-    # 鸟类分类模型
     classifier = pipeline(
         "image-classification",
         model="chriamue/bird-species-classifier",
         device=0 if torch.cuda.is_available() else -1
     )
-    # 文本生成模型（设置量化降低显存占用）
     text_generator = pipeline(
         "text-generation",
-        model="Qwen/Qwen3-235B-A22B",
         torch_dtype=torch.bfloat16,
         device_map="auto",
-        model_kwargs={"load_in_4bit": True}
     )
-    # 语音合成模型
     tts = pipeline(
         "text-to-speech",
         model="facebook/mms-tts-eng",
@@ -30,64 +39,65 @@ def init_models():
     return classifier, text_generator, tts
-# 生成儿童友好的鸟类描述
 def generate_child_friendly_text(bird_name):
-    PROMPT = f"""请用简单易懂的语言，向6-12岁儿童介绍{bird_name}：
-1. 用比喻手法描述外形特征
-2. 解释生活习性时使用拟人化
-3. 包含一个有趣的小知识
-4. 语句长度不超过15个英文单词
-5. 避免使用专业术语"""
     response = text_generator(
         PROMPT,
-        max_new_tokens=200,
-        temperature=0.7,
         do_sample=True
     )
-    return response[0]['generated_text'].split('\n')[2:]  # 提取核心内容
-# 主处理流程
 def process_image(image):
     try:
-        # Step 1: 鸟类识别
         classification = classifier(image)
         bird_name = classification[0]['label']
-        # Step 2: 生成描述
         description = generate_child_friendly_text(bird_name)
-        # Step 3: 语音合成
-        speech = tts(description, forward_params={"speaker_id": 6})  # 使用儿童语音
         return {
             "bird_name": bird_name,
-            "description": "\n".join(description),
             "audio": speech["audio"]
         }
     except Exception as e:
         return f"处理错误: {str(e)}"
-# 初始化模型
 classifier, text_generator, tts = init_models()
-# 创建Gradio界面
-with gr.Blocks(theme=gr.themes.Soft()) as demo:
-    gr.Markdown("# 🐦 鸟类知识小课堂")
     with gr.Row():
-        image_input = gr.Image(type="pil", label="上传鸟类图片")
-        audio_output = gr.Audio(label="语音讲解", autoplay=True)
-    with gr.Column():
-        name_output = gr.Textbox(label="识别到的鸟类")
-        text_output = gr.Textbox(label="趣味知识", lines=4)
-    examples = gr.Examples(
-        examples=["eagle.jpg", "penguin.jpg", "peacock.jpg"],
-        inputs=image_input
-    )
     image_input.change(
         process_image,
@@ -95,9 +105,9 @@ with gr.Blocks(theme=gr.themes.Soft()) as demo:
         outputs=[name_output, text_output, audio_output]
     )
-# 部署配置
-demo.launch(
-    server_name="0.0.0.0",
-    server_port=7860,
-    share=True
-)

+# -*- coding: utf-8 -*-
+"""
+鸟类知识科普系统（修正版） by [你的名字]
+ISOM5240 Group Project
+"""
 import gradio as gr
+from transformers import pipeline, AutoModelForCausalLM, AutoTokenizer
 from PIL import Image
 import torch
+# 初始化模型（兼容性优化）
 def init_models():
+    # 鸟类分类模型（保持不变）
     classifier = pipeline(
         "image-classification",
         model="chriamue/bird-species-classifier",
         device=0 if torch.cuda.is_available() else -1
     )
+    # 替换为DeepSeek-R1模型（兼容性配置）
     text_generator = pipeline(
         "text-generation",
+        model="deepseek-ai/DeepSeek-R1",
         torch_dtype=torch.bfloat16,
         device_map="auto",
+        model_kwargs={
+            "load_in_4bit": True,
+            "trust_remote_code": True  # 必须开启远程代码执行
+        }
     )
+    # 语音合成模型（保持不变）
     tts = pipeline(
         "text-to-speech",
         model="facebook/mms-tts-eng",
     return classifier, text_generator, tts
+# 生成儿童友好的鸟类描述（优化Prompt）
 def generate_child_friendly_text(bird_name):
+    PROMPT = f"""以6-12岁儿童能理解的语言介绍{bird_name}：
+1. 用动物拟人化的方式描述特征（例如：穿彩色外套的鸟）
+2. 解释生活习性时结合日常场景（如：像小朋友一样喜欢玩耍）
+3. 包含一个趣味冷知识（例如：飞行距离相当于绕操场XX圈）
+4. 语句长度控制在10-15个英文单词
+5. 使用比喻手法代替专业术语"""
     response = text_generator(
         PROMPT,
+        max_new_tokens=150,
+        temperature=0.8,
+        top_k=40,
         do_sample=True
     )
+    # 后处理优化
+    cleaned_text = response[0]['generated_text'].split('\n')[2]
+    return cleaned_text.replace("**", "")  # 去除多余符号
+# 主处理流程（增加异常处理）
 def process_image(image):
     try:
         classification = classifier(image)
         bird_name = classification[0]['label']
         description = generate_child_friendly_text(bird_name)
+        speech = tts(description, forward_params={"speaker_id": 6})
         return {
             "bird_name": bird_name,
+            "description": description,
             "audio": speech["audio"]
         }
     except Exception as e:
         return f"处理错误: {str(e)}"
+# 初始化模型（增加缓存清理）
+from transformers.utils import cached_file
+cached_file.cache_clear()
 classifier, text_generator, tts = init_models()
+# 创建Gradio界面（布局优化）
+with gr.Blocks(theme=gr.themes.Soft(), css=".gradio-container {max-width: 800px !important}") as demo:
+    gr.Markdown("# 🐦 鸟类知识小课堂（稳定版）")
     with gr.Row():
+        with gr.Column(scale=2):
+            image_input = gr.Image(type="pil", label="上传鸟类图片", height=300)
+            examples = gr.Examples(
+                examples=["eagle.jpg", "penguin.jpg", "peacock.jpg"],
+                inputs=image_input,
+                label="示例图片"
+            )
+        with gr.Column(scale=3):
+            name_output = gr.Textbox(label="识别到的鸟类", interactive=False)
+            text_output = gr.Textbox(label="趣味知识", lines=4, max_lines=6)
+            audio_output = gr.Audio(label="语音讲解", autoplay=True, visible=True)
     image_input.change(
         process_image,
         outputs=[name_output, text_output, audio_output]
     )
+# 部署配置（增加硬件检测）
+if torch.cuda.is_available():
+    demo.launch(server_name="0.0.0.0", server_port=7860, share=True)
+else:
+    print("警告：未检测到GPU，建议在Colab或A10G实例运行")
+    demo.launch(server_name="0.0.0.0", server_port=7860)