danielquillanroxas commited on
Commit
83aae9f
·
1 Parent(s): 60d1e42
Files changed (3) hide show
  1. app.py +250 -0
  2. models/unified_detector(1).pt +3 -0
  3. utils/processing.py +290 -0
app.py ADDED
@@ -0,0 +1,250 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ import gradio as gr
2
+ import os
3
+ import cv2
4
+ import numpy as np
5
+ import torch
6
+ from PIL import Image
7
+ from ultralytics import YOLO
8
+ from utils.processing import detect_and_blur, process_video
9
+ import tempfile
10
+ import time
11
+
12
# Style and theme configuration.
# NOTE(review): PRIMARY_COLOR / SECONDARY_COLOR are not referenced by the UI
# below (the Gradio theme uses primary_hue/secondary_hue instead) — confirm
# whether they can be removed.
PRIMARY_COLOR = "#4F46E5"  # Indigo
SECONDARY_COLOR = "#6366F1"  # Lighter indigo

# Setup paths and model.
MODEL_DIR = os.path.join(os.path.dirname(__file__), "models")
# NOTE(review): the weight file committed alongside this code is named
# "unified_detector(1).pt"; confirm it is renamed to "unified_detector.pt",
# otherwise load_model() will fail and the UI will show the error banner.
MODEL_PATH = os.path.join(MODEL_DIR, "unified_detector.pt")
# Directory for processed outputs; created eagerly at import time.
RESULTS_DIR = os.path.join(os.path.dirname(__file__), "results")
os.makedirs(RESULTS_DIR, exist_ok=True)
21
+
22
# Load model (with error handling and GPU support)
def load_model():
    """Load the unified YOLO detector from MODEL_PATH.

    Picks CUDA when available, otherwise CPU. Any failure (missing file,
    bad weights, etc.) is logged and swallowed so the app can still start.

    Returns:
        The loaded YOLO model, or None when loading failed.
    """
    try:
        cuda_ok = torch.cuda.is_available()
        print(f"CUDA Available: {cuda_ok}")
        device = "cuda" if cuda_ok else "cpu"
        print(f"Loading model from {MODEL_PATH} on {device}...")
        detector = YOLO(MODEL_PATH)
        detector.to(device)
        print(f"Model loaded successfully")
        return detector
    except Exception as e:
        # Startup must not crash on a missing/corrupt model; the UI reports it.
        print(f"Error loading model: {e}")
        return None
35
+
36
# Load model once at import/startup time; stays None when loading failed,
# which the interface code below checks to render a status banner.
model = load_model()
38
+
39
# Image processing function
def process_image_interface(input_image, blur_strength=0.7):
    """Blur sensitive regions (faces, plates/text) in an uploaded image.

    Args:
        input_image: PIL image from the Gradio widget (or a numpy array),
            or None when nothing was uploaded.
        blur_strength: Accepted for UI compatibility; currently NOT forwarded
            to the processing pipeline — detect_and_blur chooses its own
            per-detection kernel size. (The original code computed a scaled
            value into a dead local variable and never used it.)

    Returns:
        (result_image_or_None, status_message)
    """
    if input_image is None:
        return None, "Please upload an image to process"

    start_time = time.time()

    try:
        # Convert from Gradio's PIL format to numpy
        if isinstance(input_image, Image.Image):
            img_array = np.array(input_image.convert('RGB'))
        else:
            img_array = input_image

        # Process the image
        result_rgb, detections, _ = detect_and_blur(img_array, model)

        # Create result message
        elapsed_time = time.time() - start_time
        message = (
            f"✅ Processing complete in {elapsed_time:.2f}s\n"
            f"👤 Detected and blurred {detections['faces']} faces\n"
            f"🔢 Detected and blurred {detections['plates']} plates/text regions"
        )

        return result_rgb, message
    except Exception as e:
        return None, f"❌ Error processing image: {str(e)}"
70
+
71
# Video processing function
def process_video_interface(input_video, frame_skip=3, blur_strength=0.7):
    """Blur sensitive regions in an uploaded video.

    Args:
        input_video: Filesystem path from the gr.Video widget, or None.
        frame_skip: Process 1 in every N frames (forwarded to process_video).
        blur_strength: Accepted for UI compatibility; currently NOT forwarded
            to the processing pipeline.

    Returns:
        (output_path_or_None, status_message)
    """
    if input_video is None:
        return None, "Please upload a video to process"

    temp_path = None
    try:
        # Create a temporary file for the processed output
        with tempfile.NamedTemporaryFile(delete=False, suffix='.mp4') as temp_output:
            temp_path = temp_output.name

        output_path = process_video(
            input_path=input_video,
            output_path=temp_path,
            model=model,
            frame_skip=int(frame_skip)
        )

        if output_path and os.path.exists(output_path):
            # Message fixed: 1 in every N frames is *processed*, not skipped.
            return output_path, f"✅ Video processed successfully. Processed 1 in every {frame_skip} frames for efficiency."

        # Processing failed — remove the (empty) temp file instead of leaking it.
        if temp_path and os.path.exists(temp_path):
            os.remove(temp_path)
        return None, "❌ Error processing video"
    except Exception as e:
        if temp_path and os.path.exists(temp_path):
            os.remove(temp_path)
        return None, f"❌ Error processing video: {str(e)}"
95
+
96
# Welcome message rendered at the top of the Gradio page (Markdown).
welcome_md = """
# 🔒 Privacy Protector: AI-Powered Content Blurring

This application automatically detects and blurs sensitive content in your images and videos, including:

- 👤 **Faces**: Protects identity by blurring all human faces
- 🚗 **License Plates**: Ensures vehicle privacy
- 📝 **Text**: Blurs potentially sensitive text in images

## How to Use

1. Upload an image or video using the appropriate tab
2. Adjust blurring settings if needed
3. Click the "Process" button
4. Download your privacy-protected result

*Powered by YOLOv8 deep learning technology*
"""
115
+
116
# Create Gradio interface. Layout: header, model-status banner, three tabs
# (image, video, about), footer. Event handlers are wired at the bottom.
with gr.Blocks(theme=gr.themes.Default(primary_hue="indigo", secondary_hue="indigo")) as demo:
    gr.Markdown(welcome_md)

    # Model status indicator — reflects whether load_model() succeeded at startup.
    with gr.Row():
        if model is not None:
            gr.Markdown(
                f"<div style='background-color: #dcfce7; padding: 10px; border-radius: 4px; margin-bottom: 15px'>"
                f"✅ <b>Model Status:</b> Loaded and Ready"
                f"</div>"
            )
        else:
            gr.Markdown(
                f"<div style='background-color: #fee2e2; padding: 10px; border-radius: 4px; margin-bottom: 15px'>"
                f"❌ <b>Model Status:</b> Error Loading Model"
                f"</div>"
            )

    # Tabs for different functions
    with gr.Tabs():
        # Image Processing Tab
        with gr.TabItem("Image Processing"):
            with gr.Row():
                with gr.Column():
                    image_input = gr.Image(label="Upload Image", type="pil")
                    with gr.Row():
                        # NOTE(review): this slider is passed to
                        # process_image_interface, which does not currently
                        # forward blur strength to the pipeline — confirm.
                        image_blur_strength = gr.Slider(
                            label="Blur Strength",
                            minimum=0,
                            maximum=1,
                            value=0.7,
                            step=0.1
                        )
                    image_process_btn = gr.Button("Process Image", variant="primary")

                with gr.Column():
                    image_output = gr.Image(label="Result with Blurring")
                    image_output_text = gr.Textbox(label="Processing Results", lines=3)

            # Set up examples for image processing.
            # NOTE(review): cache_examples=True runs the fn on these paths at
            # startup; the example images must exist or startup will fail —
            # confirm examples/ is populated in the deployed Space.
            gr.Examples(
                examples=[
                    os.path.join(os.path.dirname(__file__), "examples", "example1.jpg"),
                    os.path.join(os.path.dirname(__file__), "examples", "example2.jpg"),
                ],
                inputs=image_input,
                outputs=[image_output, image_output_text],
                fn=process_image_interface,
                cache_examples=True,
            )

        # Video Processing Tab
        with gr.TabItem("Video Processing"):
            with gr.Row():
                with gr.Column():
                    video_input = gr.Video(label="Upload Video")
                    with gr.Row():
                        video_frame_skip = gr.Slider(
                            label="Frame Skip Rate (higher = faster but less smooth)",
                            minimum=1,
                            maximum=10,
                            value=3,
                            step=1
                        )
                        # NOTE(review): like the image slider, this value is
                        # accepted by the handler but not currently used.
                        video_blur_strength = gr.Slider(
                            label="Blur Strength",
                            minimum=0,
                            maximum=1,
                            value=0.7,
                            step=0.1
                        )
                    video_process_btn = gr.Button("Process Video", variant="primary")

                with gr.Column():
                    video_output = gr.Video(label="Processed Video")
                    video_output_text = gr.Textbox(label="Processing Results", lines=3)

        # About Tab — static help text only, no components to wire.
        with gr.TabItem("About & Help"):
            gr.Markdown("""
            ## About Privacy Protector

            This application uses a custom-trained YOLOv8 model to detect and blur sensitive content in images and videos.

            ### Technical Details

            - **Model Architecture**: YOLOv8 Medium
            - **Training Dataset**: Custom dataset of faces, license plates, and text samples
            - **Performance**: Fast inference suitable for real-time applications

            ### Privacy Information

            - All processing is done on the server - no data is stored
            - Uploaded images and videos are automatically deleted after processing
            - The application does not collect any personal information

            ### Limitations

            - May not detect all faces or text in low-quality images
            - Very small text may be missed
            - Processing large videos may take some time

            ### Need Help?

            If you're experiencing issues or have questions, please visit the repository or contact the developer.
            """)

    # Set up event handlers: buttons map directly onto the two interface
    # functions defined above.
    image_process_btn.click(
        fn=process_image_interface,
        inputs=[image_input, image_blur_strength],
        outputs=[image_output, image_output_text]
    )

    video_process_btn.click(
        fn=process_video_interface,
        inputs=[video_input, video_frame_skip, video_blur_strength],
        outputs=[video_output, video_output_text]
    )

    # Footer
    gr.Markdown("""
    <div style="text-align: center; margin-top: 30px; padding-top: 10px; border-top: 1px solid #eee">
    <p>Developed with ❤️ using YOLOv8 and Gradio | © 2025 Privacy Protector</p>
    </div>
    """)
243
+
244
# Launch the app when run as a script.
if __name__ == "__main__":
    # Ensure the examples directory exists before Gradio resolves example paths.
    examples_dir = os.path.join(os.path.dirname(__file__), "examples")
    os.makedirs(examples_dir, exist_ok=True)

    # Start the Gradio server.
    demo.launch()
models/unified_detector(1).pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:aff7271ad02c42539099973d8de79ea553b5cbb539c037840a5c777a702c7e10
3
+ size 52048876
utils/processing.py ADDED
@@ -0,0 +1,290 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ import cv2
2
+ import numpy as np
3
+ import time
4
+ import os
5
+ from ultralytics import YOLO
6
+ from PIL import Image
7
+ import matplotlib.pyplot as plt
8
+
9
def detect_and_blur(input_source, model=None, frame_skip=3):
    """Detect and blur sensitive elements in an image or a single video frame.

    Args:
        input_source: Path to an image file, or a 3-channel numpy array.
            NOTE(review): arrays are always treated as BGR (OpenCV order)
            here and the output is channel-swapped; callers that pass RGB
            arrays (e.g. from PIL) receive BGR output — confirm intended.
        model: YOLO model instance; detection is skipped entirely when None.
        frame_skip: Unused by this function; kept for backward compatibility
            with existing callers.

    Returns:
        result_rgb: Processed image with blurred regions (channels swapped
            relative to the input array / loaded file).
        detections: Dict with counts of detected objects ({'faces', 'plates'}).
        boxes: Dict with bounding boxes of detected objects, keyed like
            `detections`, each a list of (x1, y1, x2, y2) tuples.
    """
    if isinstance(input_source, str):  # Image path
        frame = cv2.imread(input_source)
        if frame is None:
            raise ValueError(f"Could not read image from {input_source}")
    else:  # Video frame or numpy array
        frame = input_source.copy()

    # Validate shape and convert for inference.
    # Fixed: the original guard `isinstance(input_source, str) or
    # input_source is not None` is always True at this point (a None input
    # would already have raised on .copy()), so the "assume RGB" else-branch
    # was unreachable dead code. The conversion is now unconditional, which
    # is exactly what the original code did in practice.
    if len(frame.shape) == 3 and frame.shape[2] == 3:
        frame_rgb = cv2.cvtColor(frame, cv2.COLOR_BGR2RGB)
    else:
        raise ValueError("Input must be a color image with 3 channels")

    result_img = frame.copy()
    detections = {'faces': 0, 'plates': 0}
    boxes = {'faces': [], 'plates': []}

    if model:
        try:
            # Run YOLOv8 inference
            results = model.predict(frame_rgb, conf=0.5)
            for r in results:
                for box in r.boxes:
                    x1, y1, x2, y2 = map(int, box.xyxy[0].tolist())
                    cls_id = int(box.cls[0])

                    # Clamp coordinates to image bounds
                    x1, y1 = max(0, x1), max(0, y1)
                    x2, y2 = min(frame.shape[1], x2), min(frame.shape[0], y2)

                    # Skip degenerate boxes
                    if x2 <= x1 or y2 <= y1:
                        continue

                    # Apply Gaussian blur to the detected region.
                    region = result_img[y1:y2, x1:x2]
                    # Kernel size depends on the class, is clamped to the
                    # region size, and forced odd as GaussianBlur requires.
                    kernel_size = 55 if cls_id == 1 else 71  # Different blur for faces vs plates/text
                    kernel_size = max(25, min(kernel_size, (x2-x1)//2*2+1, (y2-y1)//2*2+1))
                    kernel_size = kernel_size + 1 if kernel_size % 2 == 0 else kernel_size

                    # Apply blur only if kernel size is valid
                    if kernel_size >= 3:
                        blurred = cv2.GaussianBlur(region, (kernel_size, kernel_size), 15)
                        result_img[y1:y2, x1:x2] = blurred

                    # Update detection counts and boxes
                    if cls_id == 0:  # Assuming 0 is plate/text
                        detections['plates'] += 1
                        boxes['plates'].append((x1, y1, x2, y2))
                    else:  # Assuming 1 is face
                        detections['faces'] += 1
                        boxes['faces'].append((x1, y1, x2, y2))
        except Exception as e:
            # Best-effort: a detection failure returns the unblurred image.
            print(f"Detection error: {e}")

    # Same fix as above: the output conversion guard was also always True,
    # so the conversion back is unconditional (BGR working copy -> RGB out).
    result_rgb = cv2.cvtColor(result_img, cv2.COLOR_BGR2RGB)

    return result_rgb, detections, boxes
89
+
90
def process_video(input_path, output_path=None, model=None, frame_skip=3, output_fps=30):
    """Process video with optimized frame skipping.

    Args:
        input_path: Path to input video
        output_path: Path to save processed video (if None, auto-generated
            under ../results next to this module)
        model: YOLO model instance
        frame_skip: Process 1 in every N frames
        output_fps: Fallback frame rate when the source FPS is unreadable

    Returns:
        output_path: Path to processed video file, or None on failure
    """
    cap = None
    out = None
    try:
        # Open video file
        cap = cv2.VideoCapture(input_path)
        if not cap.isOpened():
            raise ValueError(f"Could not open video file {input_path}")

        # Get video properties
        frame_width = int(cap.get(cv2.CAP_PROP_FRAME_WIDTH))
        frame_height = int(cap.get(cv2.CAP_PROP_FRAME_HEIGHT))
        original_fps = cap.get(cv2.CAP_PROP_FPS)
        total_frames = int(cap.get(cv2.CAP_PROP_FRAME_COUNT))

        # Set output parameters
        fps = original_fps if original_fps > 0 else output_fps
        # Fixed: `fps // frame_skip` is 0 when frame_skip > fps, which would
        # create a VideoWriter with an invalid 0 fps; clamp to at least 1.
        out_fps = max(fps // frame_skip, 1)
        if output_path is None:
            # Create results directory if it doesn't exist
            results_dir = os.path.join(os.path.dirname(os.path.abspath(__file__)), "..", "results")
            os.makedirs(results_dir, exist_ok=True)
            output_path = os.path.join(results_dir, f"processed_{os.path.basename(input_path)}")

        # Create video writer
        fourcc = cv2.VideoWriter_fourcc(*'mp4v')
        out = cv2.VideoWriter(output_path, fourcc, out_fps, (frame_width, frame_height))

        # Display processing information
        print(f"Processing video: {os.path.basename(input_path)}")
        print(f"Original: {frame_width}x{frame_height} @ {original_fps:.1f}fps")
        print(f"Processing: 1 every {frame_skip} frames")
        print(f"Output: {out_fps:.1f}fps | Estimated time: {total_frames/(fps*frame_skip):.1f}s")

        # Process video frames
        frame_count = 0
        processed_frames = 0
        start_time = time.time()

        while True:
            ret, frame = cap.read()
            if not ret:
                break

            # Skip frames according to frame_skip
            if frame_count % frame_skip != 0:
                frame_count += 1
                continue

            try:
                # Process frame: OpenCV frames are BGR; detect_and_blur
                # channel-swaps its output, so swap back before writing.
                result_rgb, _, _ = detect_and_blur(frame, model)
                result_bgr = cv2.cvtColor(result_rgb, cv2.COLOR_RGB2BGR)
                out.write(result_bgr)
                processed_frames += 1

                # Print progress roughly every 5 seconds. The counter window
                # resets, so the reported FPS covers the recent interval only.
                # (Renamed from `fps` to avoid shadowing the output fps.)
                if time.time() - start_time >= 5:
                    elapsed = time.time() - start_time
                    interval_fps = processed_frames / elapsed
                    print(f"Progress: {frame_count}/{total_frames} | "
                          f"Processed: {processed_frames} | "
                          f"Current FPS: {interval_fps:.1f}")
                    start_time = time.time()
                    processed_frames = 0

            except Exception as e:
                # Keep going on a bad frame rather than aborting the video.
                print(f"Error processing frame {frame_count}: {e}")

            frame_count += 1

        print(f"\nVideo processing complete! Saved to {output_path}")
        return output_path

    except Exception as e:
        print(f"Video processing failed: {e}")
        return None
    finally:
        # Fixed: release capture and writer even when an exception aborts
        # processing (the original leaked both on any mid-stream failure).
        if cap is not None:
            cap.release()
        if out is not None:
            out.release()
179
+
180
def process_image(image_path, output_path=None, model=None, visualize=False):
    """Process single image with optional visualization.

    Args:
        image_path: Path to input image, or a numpy array (a frame).
        output_path: Path to save processed image (if None, auto-generated
            under ../results for path inputs; array inputs without an
            output_path are returned directly without saving).
        model: YOLO model instance
        visualize: Whether to show a matplotlib figure with original,
            detections, and result (blocks in non-interactive servers —
            intended for local debugging only).

    Returns:
        Path to the processed image file for path inputs, the processed
        numpy array for array inputs, or None on error.
    """
    try:
        # Run detection + blurring; also returns boxes for the overlay below.
        result_rgb, detections, boxes = detect_and_blur(image_path, model)

        # Handle input as numpy array: with no output_path requested, the
        # caller just wants the processed array back (early return).
        if not isinstance(image_path, str):
            if output_path is None:
                return result_rgb
            image_filename = "processed_image.jpg"
        else:
            image_filename = os.path.basename(image_path)

        # Create visualization if requested
        if visualize:
            # Load original image for side-by-side comparison.
            if isinstance(image_path, str):
                original = cv2.cvtColor(cv2.imread(image_path), cv2.COLOR_BGR2RGB)
            else:
                # NOTE(review): array inputs are used as-is here; channel
                # order of the "Original" panel depends on the caller.
                original = image_path

            # Create image with detection boxes drawn on a copy.
            detection_img = original.copy()

            # Draw face boxes (red in RGB display)
            for box in boxes['faces']:
                x1, y1, x2, y2 = box
                cv2.rectangle(detection_img, (x1, y1), (x2, y2), (255, 0, 0), 2)
                cv2.putText(detection_img, "Face", (x1, y1-10),
                            cv2.FONT_HERSHEY_SIMPLEX, 0.5, (255, 0, 0), 2)

            # Draw plate/text boxes (blue in RGB display)
            for box in boxes['plates']:
                x1, y1, x2, y2 = box
                cv2.rectangle(detection_img, (x1, y1), (x2, y2), (0, 0, 255), 2)
                cv2.putText(detection_img, "Plate/Text", (x1, y1-10),
                            cv2.FONT_HERSHEY_SIMPLEX, 0.5, (0, 0, 255), 2)

            # Create comparison visualization (only for local debugging)
            fig, axes = plt.subplots(1, 3, figsize=(20, 7))
            titles = ["Original", "Detections", "Blurred Result"]
            images = [original, detection_img, result_rgb]

            for ax, title, img in zip(axes, titles, images):
                ax.imshow(img)
                ax.set_title(title)
                ax.axis("off")

            plt.tight_layout()
            plt.show()

        # Save result if output path provided
        if output_path is not None:
            # imwrite expects BGR, so convert back before saving.
            cv2.imwrite(output_path, cv2.cvtColor(result_rgb, cv2.COLOR_RGB2BGR))
            print(f"Saved result to {output_path}")
        else:
            # Auto-generate output path if not provided (path inputs only —
            # array inputs without output_path returned earlier).
            results_dir = os.path.join(os.path.dirname(os.path.abspath(__file__)), "..", "results")
            os.makedirs(results_dir, exist_ok=True)
            result_path = os.path.join(results_dir, f"processed_{image_filename}")
            cv2.imwrite(result_path, cv2.cvtColor(result_rgb, cv2.COLOR_RGB2BGR))
            print(f"Saved result to {result_path}")
            output_path = result_path

        print(f"Detections: {detections['faces']} faces, {detections['plates']} plates/text regions")
        # Path in -> path out; array in (with output_path) -> array out.
        return output_path if isinstance(image_path, str) else result_rgb

    except Exception as e:
        print(f"Image processing error: {e}")
        return None
264
+
265
def process_pil_image(pil_image, model=None):
    """Process a PIL Image for the Gradio interface.

    Args:
        pil_image: PIL Image to process.
        model: YOLO model instance.

    Returns:
        A (processed PIL Image, detection-count dict) tuple. On any error
        the original image is returned with zeroed counts.
    """
    try:
        # PIL -> numpy, run the pipeline, numpy -> PIL.
        as_array = np.array(pil_image)
        blurred_rgb, counts, _ = detect_and_blur(as_array, model)
        return Image.fromarray(blurred_rgb), counts
    except Exception as e:
        # Fail soft: hand the untouched image back to the UI.
        print(f"PIL image processing error: {e}")
        return pil_image, {'faces': 0, 'plates': 0}