EtanHey committed on
Commit
777c63c
·
1 Parent(s): 10b39cb

Deploy hand detection API with Gradio interface and FastAPI endpoints

Browse files
Files changed (2) hide show
  1. app.py +291 -0
  2. requirements.txt +9 -0
app.py ADDED
@@ -0,0 +1,291 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ """
2
+ HuggingFace Spaces App for Hand/Arm Detection
3
+ Provides both Gradio UI and API endpoints
4
+ Model: https://huggingface.co/EtanHey/hand-sign-detection
5
+ """
6
+
7
+ import gradio as gr
8
+ from ultralytics import YOLO
9
+ import numpy as np
10
+ from PIL import Image
11
+ import json
12
+ import base64
13
+ from io import BytesIO
14
+ from typing import Dict, Tuple, Any
15
+ import logging
16
+ from fastapi import FastAPI, File, UploadFile, HTTPException
17
+ from fastapi.responses import JSONResponse
18
+ import uvicorn
19
+ from threading import Thread
20
+
21
# Configure root logging once at import time so library and app messages
# are visible in the Spaces container logs.
logging.basicConfig(level=logging.INFO)
logger = logging.getLogger(__name__)

# Initialize FastAPI app for API endpoints
app = FastAPI(title="Hand Detection API")

# Load the model
# MODEL_PATH is a remote HuggingFace Hub URL; YOLO() downloads the weights
# on first use, so startup requires network access.
MODEL_PATH = "https://huggingface.co/EtanHey/hand-sign-detection/resolve/main/model.pt"
# Populated by load_model(); stays None if the download/initialization fails,
# and process_image() checks for that before inference.
model = None
30
+
31
def load_model():
    """Download and initialize the YOLO model from HuggingFace.

    Sets the module-level ``model`` global and returns True on success,
    False if anything goes wrong (the app then serves structured errors
    instead of crashing at import time).
    """
    global model
    logger.info(f"Loading model from {MODEL_PATH}")
    try:
        model = YOLO(MODEL_PATH)
    except Exception as e:
        # Keep the app importable even when the weights can't be fetched;
        # callers detect the failure via the None model / False return.
        logger.error(f"❌ Failed to load model: {e}")
        return False
    logger.info("✅ Model loaded successfully!")
    return True
42
+
43
+ # Load model on startup
44
# Load model on startup (import time) so the first request doesn't pay the
# download/initialization cost; failure leaves `model` as None.
load_model()

# Class names (alphabetical order as YOLO expects)
CLASS_NAMES = ['arm', 'hand', 'not_hand']
# Human-readable labels shown in the UI, keyed by class name.
CLASS_LABELS = {
    'arm': '💪 Arm',
    'hand': '✋ Hand',
    'not_hand': '❌ Not Hand/Arm'
}
53
+
54
def process_image(image: Image.Image) -> Dict[str, Any]:
    """Run classification on a PIL image and return a JSON-serializable result.

    Returns a dict with keys:
        class:          top predicted class name ('arm' | 'hand' | 'not_hand')
        confidence:     top-1 probability as a float
        probabilities:  per-class probabilities keyed by class name
        label:          human-readable label (present only on success)
        error:          present only when something went wrong
    """
    if model is None:
        # Model failed to load at startup; return a structured error instead
        # of raising so API callers always receive a JSON body.
        return {
            "error": "Model not loaded",
            "class": "unknown",
            "confidence": 0.0,
            "probabilities": {"hand": 0, "arm": 0, "not_hand": 0}
        }

    try:
        # YOLO expects 3-channel RGB input (uploads may be RGBA/grayscale).
        if image.mode != 'RGB':
            image = image.convert('RGB')

        # Run inference
        results = model.predict(image, verbose=False)

        # BUGFIX: use an explicit `is None` check. `probs` wraps a
        # multi-element tensor, and truth-testing such a tensor raises
        # "Boolean value of Tensor with more than one element is ambiguous",
        # which previously sent every successful prediction into the
        # exception handler below.
        if not results or results[0].probs is None:
            return {
                "class": "not_hand",
                "confidence": 0.0,
                "probabilities": {"hand": 0, "arm": 0, "not_hand": 1.0}
            }

        # Extract probabilities
        probs = results[0].probs
        top_class_idx = int(probs.top1)
        top_confidence = float(probs.top1conf)

        # Build the probability dict from CLASS_NAMES so the index->name
        # mapping lives in one place (YOLO orders classes alphabetically,
        # matching CLASS_NAMES).
        probabilities = {
            name: float(probs.data[i]) for i, name in enumerate(CLASS_NAMES)
        }

        return {
            "class": CLASS_NAMES[top_class_idx],
            "confidence": top_confidence,
            "probabilities": probabilities,
            "label": CLASS_LABELS[CLASS_NAMES[top_class_idx]]
        }

    except Exception as e:
        # Broad catch at the service boundary: always return JSON to callers.
        logger.error(f"Error processing image: {e}")
        return {
            "error": str(e),
            "class": "error",
            "confidence": 0.0,
            "probabilities": {"hand": 0, "arm": 0, "not_hand": 0}
        }
106
+
107
def gradio_predict(image: Image.Image) -> Tuple[str, Dict, str]:
    """Prediction callback for the Gradio UI.

    Returns a markdown summary, a label->probability mapping for the
    confidence-bar component, and the raw JSON payload for developers.
    """
    if image is None:
        return "Please upload an image", {}, ""

    # Delegate to the shared inference helper used by the API endpoints.
    result = process_image(image)

    if "error" in result:
        return f"Error: {result['error']}", {}, ""

    probs = result["probabilities"]

    # Scores feeding the gr.Label confidence bars.
    confidence_scores = {
        "✋ Hand": probs["hand"],
        "💪 Arm": probs["arm"],
        "❌ Neither": probs["not_hand"]
    }

    main_label = result["label"]
    confidence = result["confidence"]

    output_text = f"""
## Detection Result

**Detected:** {main_label}
**Confidence:** {confidence:.1%}

### Detailed Probabilities:
- Hand: {probs['hand']:.1%}
- Arm: {probs['arm']:.1%}
- Not Hand/Arm: {probs['not_hand']:.1%}

### Understanding the Classes:
- **Hand**: Close-up view with fingers visible
- **Arm**: Forearm or elbow area without fingers
- **Not Hand/Arm**: Neither hand nor arm detected
"""

    # Raw JSON for developers inspecting the API contract.
    return output_text, confidence_scores, json.dumps(result, indent=2)
151
+
152
+ # FastAPI endpoints for API access
153
+ @app.get("/")
154
+ async def root():
155
+ """Health check endpoint"""
156
+ return {
157
+ "status": "online",
158
+ "model": "hand-sign-detection",
159
+ "classes": CLASS_NAMES,
160
+ "api_endpoints": {
161
+ "health": "/",
162
+ "predict": "/api/predict",
163
+ "predict_base64": "/api/predict/base64"
164
+ }
165
+ }
166
+
167
+ @app.post("/api/predict")
168
+ async def predict_api(file: UploadFile = File(...)):
169
+ """API endpoint for file upload prediction"""
170
+ try:
171
+ # Read image
172
+ contents = await file.read()
173
+ image = Image.open(BytesIO(contents))
174
+
175
+ # Process
176
+ result = process_image(image)
177
+
178
+ return JSONResponse(content=result)
179
+
180
+ except Exception as e:
181
+ raise HTTPException(status_code=400, detail=str(e))
182
+
183
+ @app.post("/api/predict/base64")
184
+ async def predict_base64_api(data: Dict[str, str]):
185
+ """API endpoint for base64 image prediction"""
186
+ try:
187
+ # Decode base64 image
188
+ image_data = base64.b64decode(data["image"])
189
+ image = Image.open(BytesIO(image_data))
190
+
191
+ # Process
192
+ result = process_image(image)
193
+
194
+ return JSONResponse(content=result)
195
+
196
+ except Exception as e:
197
+ raise HTTPException(status_code=400, detail=str(e))
198
+
199
+ # Gradio Interface
200
def create_gradio_interface():
    """Create and return the Gradio interface for the detection model."""
    # Local import: only needed here, keeps the top-of-file imports unchanged.
    import os

    # Custom CSS for better styling
    custom_css = """
    .gradio-container {
        font-family: 'Inter', sans-serif;
    }
    .output-class {
        font-size: 24px;
        font-weight: bold;
    }
    """

    # BUGFIX: only offer example images that actually exist on disk. This
    # commit ships no examples/ directory, so passing the hard-coded paths
    # with cache_examples=True would crash at startup while Gradio tries to
    # pre-compute outputs for missing files. (The old `examples if examples
    # else None` was also always truthy for a non-empty literal list.)
    candidate_examples = [
        "examples/hand_example.jpg",
        "examples/arm_example.jpg",
        "examples/face_example.jpg"
    ]
    examples = [[p] for p in candidate_examples if os.path.exists(p)]

    # Create interface
    interface = gr.Interface(
        fn=gradio_predict,
        inputs=[
            gr.Image(
                type="pil",
                label="Upload Image",
                sources=["upload", "webcam", "clipboard"]
            )
        ],
        outputs=[
            gr.Markdown(label="Detection Result"),
            gr.Label(label="Confidence Scores", num_top_classes=3),
            gr.JSON(label="API Response (for developers)")
        ],
        title="🤚 Hand/Arm Detection AI",
        description="""
    Upload an image or use your webcam to detect hands and arms.

    **Model:** YOLOv8 trained on 1,740 images | **Accuracy:** 96.3%

    **API Access:** Use the `/api/predict` endpoint for programmatic access.
    """,
        article="""
    ### About
    This model distinguishes between:
    - **Hands**: Close-up views with visible fingers
    - **Arms**: Forearm/elbow areas without fingers
    - **Neither**: Images without hands or arms

    ### API Usage
    ```python
    import requests

    # Upload file
    response = requests.post(
        "https://huggingface.co/spaces/EtanHey/hand-detection/api/predict",
        files={"file": open("image.jpg", "rb")}
    )
    print(response.json())
    ```

    ### Model Card
    View the full model details at [HuggingFace Model Hub](https://huggingface.co/EtanHey/hand-sign-detection)
    """,
        examples=examples or None,
        # Only pre-compute cached outputs when there are real example files.
        cache_examples=bool(examples),
        css=custom_css,
        theme=gr.themes.Soft()
    )

    return interface
273
+
274
+ # Run FastAPI in background thread
275
def run_api():
    """Run the FastAPI server in a background thread on an internal port.

    NOTE(review): HF Spaces exposes only port 7860 externally. The original
    code bound FastAPI to 7860 and the Gradio UI to 7861, which left the UI
    unreachable on Spaces. FastAPI now runs on an internal port (8000) while
    Gradio owns the exposed 7860 — confirm the Space's expected port config.
    """
    uvicorn.run(app, host="0.0.0.0", port=8000)

# Start the API server in the background as a daemon thread so it exits
# with the main process instead of blocking interpreter shutdown.
api_thread = Thread(target=run_api, daemon=True)
api_thread.start()

# Create and launch the Gradio interface on the externally exposed port.
if __name__ == "__main__":
    interface = create_gradio_interface()
    interface.launch(
        server_name="0.0.0.0",  # listen on all interfaces inside the container
        server_port=7860,       # the only port HF Spaces exposes
        share=False,
        debug=True
    )
requirements.txt ADDED
@@ -0,0 +1,9 @@
 
 
 
 
 
 
 
 
 
 
1
+ gradio>=4.44.0
2
+ ultralytics>=8.3.0
3
+ Pillow>=10.0.0
4
+ numpy>=1.24.0
5
+ torch>=2.0.0
6
+ fastapi>=0.104.0
7
+ uvicorn>=0.24.0
8
+ python-multipart>=0.0.6
9
+ opencv-python-headless>=4.8.0