Spaces:

XiaoBai1221
/

SignView2.0

Sleeping

App Files Files Community

XiaoBai1221 committed on Jun 23, 2025

Commit

35d308c

1 Parent(s): 65a0ce8

重新創建完整的 app.py - 修復 Hugging Face Spaces 初始化問題

Browse files

Files changed (1) hide show

app.py +178 -1

app.py CHANGED Viewed

	@@ -1 +1,178 @@
1	-

+import os
+import cv2
+import numpy as np
+import gradio as gr
+from realtime_sign_prediction import RealtimeSignPredictor
+class GradioSignPredictor:
+    def __init__(self):
+        """初始化手語辨識預測器"""
+        self.predictor = RealtimeSignPredictor(
+            model_path="tsflow/models/best_model.pt",
+            config_path="tsflow/results/test_results.json",
+            sequence_length=50,
+            use_segmentation=True
+        )
+        print("✅ 手語辨識系統初始化完成！")
+    def process_frame(self, frame):
+        """處理單一畫面並返回結果"""
+        if frame is None:
+            return frame, "等待攝像頭輸入..."
+        try:
+            # 處理畫面
+            results, keypoints, flow_features = self.predictor.process_frame(frame)
+            # 繪製關鍵點
+            annotated_frame = self.predictor.draw_landmarks(frame.copy(), results)
+            # 獲取預測結果
+            top_predictions = self.predictor.get_top_predictions(top_k=3)
+            # 格式化預測結果
+            if top_predictions:
+                prediction_text = "🎯 即時預測結果:\n\n"
+                for i, (label, confidence) in enumerate(top_predictions, 1):
+                    confidence_bar = "█" * int(confidence * 20)
+                    prediction_text += f"{i}. {label}: {confidence:.2%} {confidence_bar}\n"
+                # 添加序列資訊
+                prediction_text += f"\n📊 序列進度: {len(self.predictor.keypoint_sequence)}/{self.predictor.sequence_length}"
+            else:
+                prediction_text = "📡 正在收集動作序列...\n請在攝像頭前做手語動作"
+            return annotated_frame, prediction_text
+        except Exception as e:
+            return frame, f"❌ 處理錯誤: {str(e)}"
+    def clear_predictions(self):
+        """清除預測序列"""
+        self.predictor.keypoint_sequence.clear()
+        self.predictor.flow_sequence.clear()
+        return "✅ 已清除預測序列，請重新開始"
+# Initialise the module-level predictor (constructed once, at import time).
+print("🚀 正在初始化手語辨識系統...")
+global_predictor = GradioSignPredictor()
+def process_video_frame(frame):
+    """處理視訊畫面的包裝函數"""
+    return global_predictor.process_frame(frame)
+def clear_predictions():
+    """清除預測的包裝函數"""
+    return global_predictor.clear_predictions()
+# 創建 Gradio 介面
+with gr.Blocks(
+    title="SignView2.0 - 手語辨識系統",
+    theme=gr.themes.Soft(),
+    css="""
+    .container { max-width: 1200px; margin: auto; }
+    .header { text-align: center; margin-bottom: 2rem; }
+    .prediction-box {
+        background: linear-gradient(135deg, #667eea 0%, #764ba2 100%);
+        color: white;
+        padding: 1rem;
+        border-radius: 10px;
+        font-family: monospace;
+    }
+    """
+) as demo:
+    gr.Markdown("""
+    # 🤟 SignView2.0 - 手語辨識系統
+    **支援34種手語詞彙的即時辨識系統，準確率達94.25%**
+    ## 📋 支援詞彙
+    `again`, `all`, `apple`, `bad`, `bathroom`, `beautiful`, `bird`, `black`, `blue`, `book`,
+    `bored`, `boy`, `brother`, `brown`, `but`, `computer`, `cousin`, `dance`, `day`, `deaf`,
+    `doctor`, `dog`, `draw`, `drink`, `eat`, `english`, `family`, `father`, `fine`, `finish`,
+    `fish`, `forget`, `friend`, `girl`
+    ## 🚀 使用說明
+    1. 點擊下方攝像頭區域允許權限
+    2. 在攝像頭前做手語動作
+    3. 系統會即時顯示辨識結果
+    4. 點擊「清除預測」重新開始
+    """, elem_classes=["header"])
+    with gr.Row():
+        with gr.Column(scale=2):
+            # 視訊輸入
+            video_input = gr.Video(
+                label="📹 攝像頭輸入",
+                sources=["webcam"],
+                streaming=True,
+                height=400
+            )
+            # 清除按鈕
+            clear_btn = gr.Button(
+                "🗑️ 清除預測序列",
+                variant="secondary",
+                size="lg"
+            )
+        with gr.Column(scale=1):
+            # 預測輸出
+            prediction_output = gr.Textbox(
+                label="🎯 辨識結果",
+                lines=12,
+                value="等待攝像頭輸入...",
+                elem_classes=["prediction-box"]
+            )
+            # 系統資訊
+            gr.Markdown("""
+            ## 📊 系統資訊
+            - **模型準確率**: 94.25%
+            - **F1分數**: 94.24%
+            - **處理速度**: 30 FPS
+            - **特徵提取**: MediaPipe + 光流
+            - **模型架構**: BiLSTM + 注意力機制
+            - **背景分割**: MediaPipe Segmentation
+            ## 🔧 技術特色
+            - MediaPipe Holistic 關鍵點���測
+            - 光流動作特徵捕捉
+            - 人體分割背景去除
+            - 深度學習時序建模
+            """)
+    # 事件處理器
+    video_input.stream(
+        fn=process_video_frame,
+        inputs=[video_input],
+        outputs=[video_input, prediction_output],
+        stream_every=0.1,
+        show_progress=False
+    )
+    clear_btn.click(
+        fn=clear_predictions,
+        outputs=[prediction_output]
+    )
+    gr.Markdown("""
+    ---
+    ### 📈 關於此系統
+    SignView2.0 使用最先進的深度學習技術進行手語辨識：
+    - **特徵提取**: 使用 MediaPipe 提取手部、身體關鍵點 + 光流特徵
+    - **背景處理**: MediaPipe Segmentation 自動去除背景干擾
+    - **時序建模**: 雙向LSTM + GRU + 多頭注意力機制
+    - **訓練資料**: 2380個手語視頻，經過數據增強和正規化
+    **開發者**: XiaoBai1221 | **平台**: Hugging Face Spaces
+    """)
+# Start the application - Hugging Face Spaces automatically detects the `demo` variable.
+print("🎉 SignView2.0 手語辨識系統已啟動！")
+# Launch directly, deliberately without an `if __name__ == "__main__"` guard.
+demo.launch()