Spaces:

mrdbourke
/

WeDetect-demo

Paused

App Files Community

mrdbourke committed on Jan 26

Commit

98545e4

verified ·

1 Parent(s): ccca3cf

Upload 3 files

Browse files

Files changed (3) hide show

README.md +9 -1
app.py +46 -30
requirements.txt +12 -3

README.md CHANGED Viewed

@@ -4,7 +4,7 @@ emoji: 🔍
 colorFrom: blue
 colorTo: green
 sdk: gradio
-sdk_version: "4.44.0"
 app_file: app.py
 pinned: false
 license: gpl-3.0
@@ -72,6 +72,14 @@ tags:
 - **Unknown Words**: If a word isn't in the dictionary, it will be passed through unchanged. Check the Chinese preview to verify translations.
 - **GPU Required**: This demo requires GPU acceleration. If you encounter memory errors, try using a smaller model.
 ## 📖 Citation
 If you use WeDetect in your research, please cite:

 colorFrom: blue
 colorTo: green
 sdk: gradio
+sdk_version: 5.50.0
 app_file: app.py
 pinned: false
 license: gpl-3.0
 - **Unknown Words**: If a word isn't in the dictionary, it will be passed through unchanged. Check the Chinese preview to verify translations.
 - **GPU Required**: This demo requires GPU acceleration. If you encounter memory errors, try using a smaller model.
+## 🔧 Technical Details
+This Space uses:
+- **Gradio 5.50.0+** - Compatible with huggingface_hub 1.x
+- **huggingface_hub 1.x** - Latest HF Hub API
+- **MMDetection 3.3.0** - Object detection framework
+- **@spaces.GPU** decorator for GPU acceleration
 ## 📖 Citation
 If you use WeDetect in your research, please cite:

app.py CHANGED Viewed

@@ -11,12 +11,17 @@ Features:
 - Automatic English→Chinese translation with editable preview
 - Adjustable confidence threshold
 - Visual results with bounding boxes
 """
 import os
 import sys
 import tempfile
 import colorsys
 from typing import List, Tuple, Optional
 import gradio as gr
@@ -134,6 +139,7 @@ ENGLISH_TO_CHINESE = {
     "kite": "风筝", "balloon": "气球", "flag": "旗帜",
 }
 # ============================================================================
 # TRANSLATION FUNCTIONS
 # ============================================================================
@@ -175,10 +181,10 @@ def translate_class_list(classes_text: str, input_mode: str) -> str:
     if input_mode == "English":
         translated = [translate_to_chinese(c) for c in classes]
-        return ','.join(translated)
     else:
         # Already Chinese, return as-is
-        return ','.join(classes)
 # ============================================================================
@@ -188,6 +194,7 @@ def translate_class_list(classes_text: str, input_mode: str) -> str:
 _model_cache = {}
 _repo_path = None
 def setup_repo():
     """Clone the WeDetect repository if not already present."""
     global _repo_path
@@ -195,18 +202,21 @@ def setup_repo():
     if _repo_path is not None and os.path.exists(_repo_path):
         return _repo_path
-    import subprocess
     repo_dir = "/tmp/WeDetect"
     if not os.path.exists(repo_dir):
         print("📥 Cloning WeDetect repository...")
-        subprocess.run(
-            ["git", "clone", "--depth", "1", "https://github.com/WeChatCV/WeDetect.git", repo_dir],
-            check=True,
-            capture_output=True
-        )
-        print("✅ Repository cloned!")
     # Add to Python path for imports
     if repo_dir not in sys.path:
@@ -279,7 +289,7 @@ def draw_detections(
     labels: np.ndarray,
     class_names: List[str],
     threshold: float
-) -> Image.Image:
     """Draw bounding boxes and labels on an image."""
     img_draw = image.copy()
@@ -291,8 +301,8 @@ def draw_detections(
         "/usr/share/fonts/truetype/wqy/wqy-zenhei.ttc",
         "/usr/share/fonts/truetype/wqy/wqy-microhei.ttc",
         "/usr/share/fonts/opentype/noto/NotoSansCJK-Regular.ttc",
-        "simsun.ttc",
         "/usr/share/fonts/truetype/dejavu/DejaVuSans.ttf",
     ]
     for font_path in font_paths:
@@ -303,7 +313,11 @@ def draw_detections(
             continue
     if font is None:
-        font = ImageFont.load_default()
     colors = generate_colors(len(class_names))
     detection_count = 0
@@ -409,9 +423,13 @@ def detect_objects(
         finally:
             # Cleanup
-            os.unlink(temp_path)
     except Exception as e:
         return image, f"❌ Error: {str(e)}"
@@ -470,22 +488,20 @@ def create_demo():
                     lines=2
                 )
-                with gr.Row():
-                    threshold_slider = gr.Slider(
-                        minimum=0.0,
-                        maximum=1.0,
-                        value=0.3,
-                        step=0.05,
-                        label="📊 Confidence Threshold"
-                    )
-                with gr.Row():
-                    model_dropdown = gr.Dropdown(
-                        choices=["large", "base", "tiny"],
-                        value=DEFAULT_MODEL,
-                        label="🧠 Model Size",
-                        info="Large=best quality, Tiny=fastest"
-                    )
                 detect_btn = gr.Button(
                     "🔍 Detect Objects",
@@ -507,7 +523,7 @@ def create_demo():
                     lines=2
                 )
-        # Examples
         gr.Markdown("### 📸 Examples")
         gr.Examples(
             examples=[

 - Automatic English→Chinese translation with editable preview
 - Adjustable confidence threshold
 - Visual results with bounding boxes
+Compatible with:
+- Gradio 5.50.0+ / 6.x
+- huggingface_hub 1.x
 """
 import os
 import sys
 import tempfile
 import colorsys
+import subprocess
 from typing import List, Tuple, Optional
 import gradio as gr
     "kite": "风筝", "balloon": "气球", "flag": "旗帜",
 }
 # ============================================================================
 # TRANSLATION FUNCTIONS
 # ============================================================================
     if input_mode == "English":
         translated = [translate_to_chinese(c) for c in classes]
+        return ', '.join(translated)
     else:
         # Already Chinese, return as-is
+        return ', '.join(classes)
 # ============================================================================
 _model_cache = {}
 _repo_path = None
 def setup_repo():
     """Clone the WeDetect repository if not already present."""
     global _repo_path
     if _repo_path is not None and os.path.exists(_repo_path):
         return _repo_path
     repo_dir = "/tmp/WeDetect"
     if not os.path.exists(repo_dir):
         print("📥 Cloning WeDetect repository...")
+        try:
+            subprocess.run(
+                ["git", "clone", "--depth", "1", "https://github.com/WeChatCV/WeDetect.git", repo_dir],
+                check=True,
+                capture_output=True,
+                text=True
+            )
+            print("✅ Repository cloned!")
+        except subprocess.CalledProcessError as e:
+            print(f"❌ Failed to clone repository: {e.stderr}")
+            raise
     # Add to Python path for imports
     if repo_dir not in sys.path:
     labels: np.ndarray,
     class_names: List[str],
     threshold: float
+) -> Tuple[Image.Image, int]:
     """Draw bounding boxes and labels on an image."""
     img_draw = image.copy()
         "/usr/share/fonts/truetype/wqy/wqy-zenhei.ttc",
         "/usr/share/fonts/truetype/wqy/wqy-microhei.ttc",
         "/usr/share/fonts/opentype/noto/NotoSansCJK-Regular.ttc",
         "/usr/share/fonts/truetype/dejavu/DejaVuSans.ttf",
+        "simsun.ttc",
     ]
     for font_path in font_paths:
             continue
     if font is None:
+        try:
+            font = ImageFont.load_default(size=16)
+        except TypeError:
+            # Older Pillow versions don't support size argument
+            font = ImageFont.load_default()
     colors = generate_colors(len(class_names))
     detection_count = 0
         finally:
             # Cleanup
+            if os.path.exists(temp_path):
+                os.unlink(temp_path)
     except Exception as e:
+        import traceback
+        error_msg = f"❌ Error: {str(e)}\n{traceback.format_exc()}"
+        print(error_msg)
         return image, f"❌ Error: {str(e)}"
                     lines=2
                 )
+                threshold_slider = gr.Slider(
+                    minimum=0.0,
+                    maximum=1.0,
+                    value=0.3,
+                    step=0.05,
+                    label="📊 Confidence Threshold"
+                )
+                model_dropdown = gr.Dropdown(
+                    choices=["large", "base", "tiny"],
+                    value=DEFAULT_MODEL,
+                    label="🧠 Model Size",
+                    info="Large=best quality, Tiny=fastest"
+                )
                 detect_btn = gr.Button(
                     "🔍 Detect Objects",
                     lines=2
                 )
+        # Examples section
         gr.Markdown("### 📸 Examples")
         gr.Examples(
             examples=[

requirements.txt CHANGED Viewed

@@ -1,11 +1,20 @@
 # Core ML frameworks
 torch>=2.0.0
 torchvision>=0.15.0
 # Gradio and HF integration
-gradio>=4.0.0
 spaces
-huggingface_hub
 # Image processing
 Pillow>=9.0.0
@@ -26,4 +35,4 @@ terminaltables
 jsonlines
 tabulate
-# Note: git is required for cloning the config files (pre-installed in HF Spaces)

+# =============================================================================
+# WeDetect HuggingFace Spaces - Requirements
+# =============================================================================
+# Compatible with Gradio 5.50.0+ and huggingface_hub 1.x
+# The HfFolder class was removed in huggingface_hub 1.0, and Gradio 5.50.0+
+# was updated to use get_token() instead.
+# =============================================================================
 # Core ML frameworks
 torch>=2.0.0
 torchvision>=0.15.0
 # Gradio and HF integration
+# Gradio 5.50.0+ is compatible with huggingface_hub 1.x (uses get_token() not HfFolder)
+gradio>=5.50.0
+huggingface_hub>=1.0.0
 spaces
 # Image processing
 Pillow>=9.0.0
 jsonlines
 tabulate
+# Note: git is pre-installed in HF Spaces (required for cloning config files)