Spaces:

MogensR
/

VideoBackgroundReplacer2

Paused

App Files Files Community

MogensR commited on Sep 12, 2025

Commit

8f6e77a

1 Parent(s): 10e40ec

fix 2

Browse files

Files changed (1) hide show

app.py +291 -784

app.py CHANGED Viewed

@@ -1,7 +1,7 @@
 #!/usr/bin/env python3
 """
-🎬 BackgroundFX Pro - Complete Fixed Version
-Professional video background replacement with SAM2 segmentation
 """
 import os
@@ -15,6 +15,7 @@
 import requests
 import tempfile
 import subprocess
 import numpy as np
 import io
 from PIL import Image
@@ -24,7 +25,12 @@
 import gradio as gr
-# Configure logging first
 logging.basicConfig(
     level=logging.INFO,
     format='%(asctime)s - %(levelname)s - %(message)s'
@@ -36,495 +42,212 @@
     SKLEARN_AVAILABLE = True
 except ImportError:
     SKLEARN_AVAILABLE = False
-    logger.warning("⚠️ sklearn not available, using fallback color detection")
-# ===============================================================================
-# SYSTEM CONFIGURATION
-# ===============================================================================
-def setup_environment():
-    """Configure environment and check system capabilities"""
-    logger.info("Starting BackgroundFX Pro with SAM2...")
-    # GPU detection
-    if torch.cuda.is_available():
-        device = torch.device("cuda")
-        gpu_name = torch.cuda.get_device_name(0)
-        gpu_memory = torch.cuda.get_device_properties(0).total_memory / (1024**3)
-        logger.info(f"Device: cuda")
-        logger.info(f"GPU: {gpu_name} ({gpu_memory:.1f}GB)")
-        # GPU type detection for model selection
-        gpu_type = "T4" if "T4" in gpu_name else "other"
-        model_size = "small" if gpu_type == "T4" else "base_plus"
-    else:
-        device = torch.device("cpu")
-        logger.info("Device: cpu")
-        gpu_name = "CPU"
-        gpu_memory = 0
-        model_size = "small"
-    return device, gpu_name, gpu_memory, model_size
-# Initialize system
-DEVICE, GPU_NAME, GPU_MEMORY, MODEL_SIZE = setup_environment()
-# ===============================================================================
-# SAM2 INTEGRATION
-# ===============================================================================
-def check_sam2_availability():
-    """Check if SAM2 is available"""
-    try:
-        import sam2
-        logger.info("✅ SAM2 is available")
-        return True
-    except ImportError:
-        logger.warning("❌ SAM2 not available - using fallback methods")
-        return False
-def check_matanyone_availability():
-    """Check if MatAnyone is available"""
-    try:
-        from matanyone import InferenceCore
-        logger.info("✅ MatAnyone is available")
-        return True
-    except ImportError:
-        logger.warning("❌ MatAnyone not available - using fallback methods")
-        return False
-SAM2_AVAILABLE = check_sam2_availability()
-MATANYONE_AVAILABLE = check_matanyone_availability()
-# Global model instances
-matanyone_processor = None
-class SAM2Segmenter:
-    """SAM2 + MatAnyone professional video segmentation"""
-    def __init__(self):
-        self.sam2_model = None
-        self.sam2_predictor = None
-        self.matanyone_processor = None
-    def load_models(self):
-        """Load both SAM2 and MatAnyone models"""
-        sam2_loaded = self.load_sam2_model()
-        matanyone_loaded = self.load_matanyone_model()
-        if sam2_loaded and matanyone_loaded:
-            logger.info("✅ SAM2 + MatAnyone professional pipeline ready")
-            return True
-        elif sam2_loaded:
-            logger.info("✅ SAM2 loaded, MatAnyone unavailable - using SAM2 + OpenCV")
-            return True
-        else:
-            logger.warning("⚠️ Both SAM2 and MatAnyone unavailable - using fallback")
-            return False
-    def load_sam2_model(self):
-        """Load SAM2 model with auto-download"""
-        if not SAM2_AVAILABLE:
-            return False
-        try:
-            # Ensure checkpoints directory exists
-            os.makedirs("checkpoints", exist_ok=True)
-            if MODEL_SIZE == "small":
-                from sam2.build_sam import build_sam2_video_predictor
-                checkpoint_file = "checkpoints/sam2_hiera_small.pt"
-                config = "sam2_hiera_s.yaml"
-                checkpoint_url = "https://dl.fbaipublicfiles.com/segment_anything_2/072824/sam2_hiera_small.pt"
-            else:
-                from sam2.build_sam import build_sam2_video_predictor
-                checkpoint_file = "checkpoints/sam2_hiera_base_plus.pt"
-                config = "sam2_hiera_b+.yaml"
-                checkpoint_url = "https://dl.fbaipublicfiles.com/segment_anything_2/072824/sam2_hiera_base_plus.pt"
-            # Download checkpoint if it doesn't exist
-            if not os.path.exists(checkpoint_file):
-                logger.info(f"📥 Downloading SAM2 checkpoint: {MODEL_SIZE}")
-                self.download_checkpoint(checkpoint_url, checkpoint_file)
-            # Also need config file
-            config_file = f"checkpoints/{config}"
-            if not os.path.exists(config_file):
-                logger.info(f"📥 Downloading SAM2 config: {config}")
-                config_url = f"https://raw.githubusercontent.com/facebookresearch/segment-anything-2/main/sam2/configs/{config}"
-                self.download_checkpoint(config_url, config_file)
-            self.sam2_predictor = build_sam2_video_predictor(config_file, checkpoint_file, device=DEVICE)
-            logger.info(f"✅ SAM2 model loaded: {MODEL_SIZE}")
-            return True
-        except Exception as e:
-            logger.error(f"❌ Failed to load SAM2 model: {e}")
-            return False
-    def load_matanyone_model(self):
-        """Load MatAnyone model"""
-        if not MATANYONE_AVAILABLE:
-            return False
-        try:
-            from matanyone import InferenceCore
-            self.matanyone_processor = InferenceCore("PeiqingYang/MatAnyone")
-            logger.info("✅ MatAnyone processor loaded")
-            return True
-        except Exception as e:
-            logger.error(f"❌ Failed to load MatAnyone: {e}")
-            return False
-    def download_checkpoint(self, url: str, filepath: str):
-        """Download SAM2 checkpoint with progress"""
-        try:
-            response = requests.get(url, stream=True)
-            response.raise_for_status()
-            total_size = int(response.headers.get('content-length', 0))
-            block_size = 8192
-            downloaded = 0
-            with open(filepath, 'wb') as f:
-                for chunk in response.iter_content(chunk_size=block_size):
-                    if chunk:
-                        f.write(chunk)
-                        downloaded += len(chunk)
-                        if total_size > 0:
-                            progress = (downloaded / total_size) * 100
-                            if downloaded % (block_size * 100) == 0:  # Log every ~800KB
-                                logger.info(f"📥 Download progress: {progress:.1f}%")
-            logger.info(f"✅ Downloaded: {filepath}")
-        except Exception as e:
-            logger.error(f"❌ Download failed: {e}")
-            raise
-    def segment_video(self, video_path: str, output_path: str) -> Tuple[bool, str]:
-        """Professional SAM2 + MatAnyone video segmentation"""
-        try:
-            if not self.sam2_predictor and not self.load_models():
-                logger.warning("⚠️ Professional models unavailable, using fallback")
-                return self.fallback_segmentation(video_path, output_path)
-            if self.sam2_predictor and self.matanyone_processor:
-                # Full professional pipeline: SAM2 mask + MatAnyone processing
-                return self.professional_sam2_matanyone_pipeline(video_path, output_path)
-            elif self.sam2_predictor:
-                # SAM2 mask + OpenCV replacement
-                return self.sam2_opencv_pipeline(video_path, output_path)
-            else:
-                # Fallback
-                return self.fallback_segmentation(video_path, output_path)
-        except Exception as e:
-            logger.error(f"❌ Error in video segmentation: {e}")
-            # Try fallback method
-            logger.warning("⚠️ Trying fallback segmentation method...")
-            return self.fallback_segmentation(video_path, output_path)
-    def professional_sam2_matanyone_pipeline(self, video_path: str, output_path: str) -> Tuple[bool, str]:
-        """Professional SAM2 + MatAnyone pipeline"""
-        try:
-            logger.info("🎬 Using PROFESSIONAL SAM2 + MatAnyone pipeline")
-            # Step 1: Extract first frame for SAM2 analysis
-            first_frame_path = self.extract_first_frame(video_path)
-            if not first_frame_path:
-                raise Exception("Failed to extract first frame")
-            # Step 2: Generate high-quality mask with SAM2
-            mask_path = self.generate_sam2_mask(first_frame_path)
-            if not mask_path:
-                raise Exception("Failed to generate SAM2 mask")
-            # Step 3: Process with MatAnyone
-            logger.info("⚡ Processing video with MatAnyone professional matting...")
-            # Create temp directory for MatAnyone output
-            temp_dir = tempfile.mkdtemp()
-            try:
-                # Use MatAnyone for professional video matting
-                foreground_path, alpha_path = self.matanyone_processor.process_video(
-                    input_path=video_path,
-                    mask_path=mask_path,
-                    output_path=temp_dir
-                )
-                # For now, copy foreground to output (can add background compositing later)
-                shutil.copy2(foreground_path, output_path)
-                logger.info("✅ Professional SAM2 + MatAnyone processing completed")
-                return True, "Professional SAM2 + MatAnyone segmentation completed successfully"
-            finally:
-                # Cleanup temp files
-                try:
-                    shutil.rmtree(temp_dir)
-                    os.unlink(first_frame_path)
-                    os.unlink(mask_path)
-                except:
-                    pass
-        except Exception as e:
-            logger.error(f"❌ Professional pipeline failed: {e}")
-            return False, f"Professional pipeline error: {str(e)}"
-    def sam2_opencv_pipeline(self, video_path: str, output_path: str) -> Tuple[bool, str]:
-        """SAM2 mask + OpenCV replacement pipeline"""
         try:
-            logger.info("🎯 Using SAM2 + OpenCV pipeline")
-            # Extract first frame
-            first_frame_path = self.extract_first_frame(video_path)
-            if not first_frame_path:
-                raise Exception("Failed to extract first frame")
-            # Generate SAM2 mask
-            mask_path = self.generate_sam2_mask(first_frame_path)
-            if not mask_path:
-                raise Exception("Failed to generate SAM2 mask")
-            # Apply mask to video using OpenCV
-            return self.apply_sam2_mask_to_video(video_path, mask_path, output_path)
         except Exception as e:
-            logger.error(f"❌ SAM2 + OpenCV pipeline failed: {e}")
-            return False, f"SAM2 + OpenCV error: {str(e)}"
-    def extract_first_frame(self, video_path: str) -> Optional[str]:
-        """Extract first frame for SAM2 processing"""
         try:
-            cap = cv2.VideoCapture(video_path)
-            ret, frame = cap.read()
-            cap.release()
-            if not ret:
-                return None
-            # Save first frame
-            with tempfile.NamedTemporaryFile(suffix='.jpg', delete=False) as tmp:
-                cv2.imwrite(tmp.name, frame)
-                return tmp.name
-        except Exception as e:
-            logger.error(f"Error extracting first frame: {e}")
-            return None
-    def generate_sam2_mask(self, frame_path: str) -> Optional[str]:
-        """Generate person mask using SAM2"""
-        try:
-            if not self.sam2_predictor:
-                return None
-            # Load image
-            image = cv2.imread(frame_path)
-            image_rgb = cv2.cvtColor(image, cv2.COLOR_BGR2RGB)
-            # Set image for SAM2
-            self.sam2_predictor.set_image(image_rgb)
-            # Auto-detect person in center
-            height, width = image_rgb.shape[:2]
-            center_point = np.array([[width//2, height//2]])
-            point_labels = np.array([1])  # 1 = foreground
-            # Generate mask
-            masks, scores, logits = self.sam2_predictor.predict(
-                point_coords=center_point,
-                point_labels=point_labels,
-                multimask_output=False
             )
-            # Save mask
-            mask = masks[0].astype(np.uint8) * 255
-            with tempfile.NamedTemporaryFile(suffix='.png', delete=False) as tmp:
-                cv2.imwrite(tmp.name, mask)
-                return tmp.name
         except Exception as e:
-            logger.error(f"Error generating SAM2 mask: {e}")
-            return None
-    def apply_sam2_mask_to_video(self, video_path: str, mask_path: str, output_path: str) -> Tuple[bool, str]:
-        """Apply SAM2 mask to video using OpenCV"""
-        try:
-            # Load mask
-            mask = cv2.imread(mask_path, cv2.IMREAD_GRAYSCALE)
-            if mask is None:
-                raise Exception("Could not load mask")
-            # Process video
-            cap = cv2.VideoCapture(video_path)
-            if not cap.isOpened():
-                raise Exception("Could not open video")
-            # Get video properties
-            fps = int(cap.get(cv2.CAP_PROP_FPS))
-            width = int(cap.get(cv2.CAP_PROP_FRAME_WIDTH))
-            height = int(cap.get(cv2.CAP_PROP_FRAME_HEIGHT))
-            total_frames = int(cap.get(cv2.CAP_PROP_FRAME_COUNT))
-            # Resize mask to match video
-            mask_resized = cv2.resize(mask, (width, height))
-            # Setup video writer
-            fourcc = cv2.VideoWriter_fourcc(*'mp4v')
-            out = cv2.VideoWriter(output_path, fourcc, fps, (width, height))
-            frame_count = 0
-            while True:
-                ret, frame = cap.read()
-                if not ret:
-                    break
-                # Apply green screen using SAM2 mask
-                green_bg = np.zeros_like(frame)
-                green_bg[:, :] = [0, 255, 0]
-                mask_3d = cv2.cvtColor(mask_resized, cv2.COLOR_GRAY2BGR).astype(np.float32) / 255.0
-                result_frame = frame.astype(np.float32) * mask_3d + green_bg.astype(np.float32) * (1 - mask_3d)
-                out.write(result_frame.astype(np.uint8))
-                frame_count += 1
-                if frame_count % 30 == 0:
-                    progress = (frame_count / total_frames) * 100
-                    logger.info(f"SAM2 processing: {progress:.1f}% ({frame_count}/{total_frames})")
             cap.release()
-            out.release()
-            return True, "SAM2 + OpenCV segmentation completed successfully"
-        except Exception as e:
-            logger.error(f"Error applying SAM2 mask: {e}")
-            return False, f"SAM2 mask application error: {str(e)}"
-    def fallback_segmentation(self, video_path: str, output_path: str) -> Tuple[bool, str]:
-        """Simple but effective segmentation that works with ANY background"""
-        try:
-            logger.info("🎯 Using robust universal segmentation...")
-            cap = cv2.VideoCapture(video_path)
-            if not cap.isOpened():
-                return False, "Could not open video file"
-            # Get video properties
-            fps = int(cap.get(cv2.CAP_PROP_FPS))
-            width = int(cap.get(cv2.CAP_PROP_FRAME_WIDTH))
-            height = int(cap.get(cv2.CAP_PROP_FRAME_HEIGHT))
-            total_frames = int(cap.get(cv2.CAP_PROP_FRAME_COUNT))
-            # Setup video writer
-            fourcc = cv2.VideoWriter_fourcc(*'mp4v')
-            out = cv2.VideoWriter(output_path, fourcc, fps, (width, height))
-            logger.info(f"📊 Video: {width}x{height}, {fps}fps, {total_frames} frames")
-            frame_count = 0
-            while True:
-                ret, frame = cap.read()
-                if not ret:
-                    break
-                # Create person mask using multiple methods combined
-                mask = self.create_universal_person_mask(frame, width, height)
-                # Apply green screen
-                result_frame = self.apply_green_screen_robust(frame, mask)
-                out.write(result_frame)
-                frame_count += 1
-                if frame_count % 30 == 0:
-                    progress = (frame_count / total_frames) * 100
-                    logger.info(f"Universal processing: {progress:.1f}% ({frame_count}/{total_frames})")
-            cap.release()
-            out.release()
-            logger.info(f"✅ Universal segmentation completed: {output_path}")
-            return True, "Universal segmentation completed successfully"
-        except Exception as e:
-            logger.error(f"❌ Error in universal segmentation: {e}")
-            return False, f"Universal segmentation error: {str(e)}"
-    def create_universal_person_mask(self, frame, width, height) -> np.ndarray:
-        """Create person mask using fast optimized method"""
-        # Use ONLY the fastest method that still works well
-        mask = self.fast_grabcut_segmentation(frame, width, height)
-        # Quick cleanup only
-        kernel = cv2.getStructuringElement(cv2.MORPH_ELLIPSE, (5, 5))
-        mask = cv2.morphologyEx(mask, cv2.MORPH_CLOSE, kernel)
-        # Light smoothing
-        mask = cv2.GaussianBlur(mask, (7, 7), 0)
-        return mask
-    def fast_grabcut_segmentation(self, frame, width, height) -> np.ndarray:
-        """Fast GrabCut with minimal iterations"""
-        try:
-            # Create rectangle around likely person area (center 60% of frame)
-            margin_x = int(width * 0.2)
-            margin_y = int(height * 0.1)
-            rect = (margin_x, margin_y, width - 2*margin_x, height - 2*margin_y)
-            # Initialize mask
-            mask = np.zeros((height, width), np.uint8)
-            bgd_model = np.zeros((1, 65), np.float64)
-            fgd_model = np.zeros((1, 65), np.float64)
-            # Apply GrabCut with ONLY 2 iterations (much faster)
-            cv2.grabCut(frame, mask, rect, bgd_model, fgd_model, 2, cv2.GC_INIT_WITH_RECT)
-            # Create binary mask
-            mask2 = np.where((mask == 2) | (mask == 0), 0, 255).astype('uint8')
-            return mask2
-        except Exception as e:
-            logger.warning(f"Fast GrabCut failed: {e}, using simple fallback")
-            # Ultra-simple fallback
-            mask = np.zeros((height, width), dtype=np.uint8)
-            margin_x = int(width * 0.25)
-            margin_y = int(height * 0.15)
-            mask[margin_y:height-margin_y, margin_x:width-margin_x] = 255
-            return mask
-    def apply_green_screen_robust(self, frame, mask) -> np.ndarray:
-        """Apply green screen with robust blending"""
-        # Create green background
-        green_bg = np.zeros_like(frame)
-        green_bg[:, :] = [0, 255, 0]  # Green background (BGR format)
-        # Ensure mask is 3-channel
-        if len(mask.shape) == 2:
-            mask_3d = cv2.cvtColor(mask, cv2.COLOR_GRAY2BGR).astype(np.float32) / 255.0
-        else:
-            mask_3d = mask.astype(np.float32) / 255.0
-        # Robust blending with smooth transitions
-        # Person (mask=1) keeps original color, background (mask=0) becomes green
-        result_frame = frame.astype(np.float32) * mask_3d + green_bg.astype(np.float32) * (1 - mask_3d)
-        return result_frame.astype(np.uint8)
-# Initialize SAM2 segmenter
-sam2_segmenter = SAM2Segmenter()
-# ===============================================================================
-# MYAVATAR API INTEGRATION
-# ===============================================================================
 class MyAvatarAPI:
-    """MyAvatar API integration for video management"""
     def __init__(self):
         self.api_base = "https://app.myavatar.dk/api"
@@ -534,7 +257,6 @@ def __init__(self):
     def fetch_videos(self) -> List[Dict[str, Any]]:
         """Fetch videos from MyAvatar API"""
         try:
-            # Cache for 5 minutes
             if time.time() - self.last_refresh < 300 and self.videos_cache:
                 return self.videos_cache
@@ -543,14 +265,14 @@ def fetch_videos(self) -> List[Dict[str, Any]]:
                 data = response.json()
                 self.videos_cache = data.get('videos', [])
                 self.last_refresh = time.time()
-                logger.info(f"✅ Fetched {len(self.videos_cache)} videos from MyAvatar")
                 return self.videos_cache
             else:
-                logger.error(f"❌ API error: {response.status_code}")
                 return []
         except Exception as e:
-            logger.error(f"❌ Error fetching videos: {e}")
             return []
     def get_video_choices(self) -> List[str]:
@@ -574,11 +296,9 @@ def get_video_url(self, selection: str) -> Optional[str]:
             return None
         try:
-            # Extract ID from selection
             if "(ID: " in selection:
                 video_id = selection.split("(ID: ")[1].split(")")[0]
-                # Find video in cache
                 for video in self.videos_cache:
                     if str(video.get('id')) == video_id:
                         return video.get('video_url')
@@ -586,16 +306,12 @@ def get_video_url(self, selection: str) -> Optional[str]:
             return None
         except Exception as e:
-            logger.error(f"❌ Error extracting video URL: {e}")
             return None
-# Initialize MyAvatar API
 myavatar_api = MyAvatarAPI()
-# ===============================================================================
-# BACKGROUND PROCESSING
-# ===============================================================================
 def create_gradient_background(gradient_type: str, width: int, height: int) -> Image.Image:
     """Create gradient backgrounds"""
     try:
@@ -634,7 +350,6 @@ def create_gradient_background(gradient_type: str, width: int, height: int) -> I
     except Exception as e:
         logger.error(f"Error creating gradient: {e}")
-        # Return solid blue as fallback
         img = np.full((height, width, 3), [70, 130, 180], dtype=np.uint8)
         return Image.fromarray(img)
@@ -655,178 +370,33 @@ def create_solid_color(color: str, width: int, height: int) -> Image.Image:
     img = np.full((height, width, 3), rgb, dtype=np.uint8)
     return Image.fromarray(img)
-def replace_green_screen(video_path: str, background_image: Image.Image, output_path: str) -> Tuple[bool, str]:
-    """Replace green screen in video with new background using OpenCV only"""
-    try:
-        # Open video capture
-        cap = cv2.VideoCapture(video_path)
-        if not cap.isOpened():
-            return False, "Could not open video file"
-        # Get video properties
-        fps = int(cap.get(cv2.CAP_PROP_FPS))
-        width = int(cap.get(cv2.CAP_PROP_FRAME_WIDTH))
-        height = int(cap.get(cv2.CAP_PROP_FRAME_HEIGHT))
-        total_frames = int(cap.get(cv2.CAP_PROP_FRAME_COUNT))
-        # Resize background to match video dimensions
-        background_resized = background_image.resize((width, height), Image.Resampling.LANCZOS)
-        bg_array = np.array(background_resized)
-        # Create temporary video without audio first
-        temp_video_path = output_path.replace('.mp4', '_no_audio.mp4')
-        # Setup video writer
-        fourcc = cv2.VideoWriter_fourcc(*'mp4v')
-        out = cv2.VideoWriter(temp_video_path, fourcc, fps, (width, height))
-        frame_count = 0
-        while True:
-            ret, frame = cap.read()
-            if not ret:
-                break
-            # Convert BGR to RGB for consistency
-            frame_rgb = cv2.cvtColor(frame, cv2.COLOR_BGR2RGB)
-            # Convert to HSV for better green detection
-            hsv = cv2.cvtColor(frame_rgb, cv2.COLOR_RGB2HSV)
-            # Define green range (adjusted for green screen)
-            lower_green = np.array([40, 50, 50])
-            upper_green = np.array([80, 255, 255])
-            # Create mask
-            mask = cv2.inRange(hsv, lower_green, upper_green)
-            # Improve mask with morphological operations
-            kernel = np.ones((3, 3), np.uint8)
-            mask = cv2.morphologyEx(mask, cv2.MORPH_OPEN, kernel)
-            mask = cv2.morphologyEx(mask, cv2.MORPH_CLOSE, kernel)
-            # Apply Gaussian blur for smoother edges
-            mask = cv2.GaussianBlur(mask, (5, 5), 0)
-            mask = mask.astype(np.float32) / 255.0  # Normalize to 0-1
-            # Create 3-channel mask
-            mask_3d = np.stack([mask, mask, mask], axis=2)
-            # Blend frame with background
-            result = frame_rgb * (1 - mask_3d) + bg_array * mask_3d
-            result = result.astype(np.uint8)
-            # Convert back to BGR for video writer
-            result_bgr = cv2.cvtColor(result, cv2.COLOR_RGB2BGR)
-            out.write(result_bgr)
-            frame_count += 1
-            if frame_count % 30 == 0:  # Log progress every 30 frames
-                progress = (frame_count / total_frames) * 100
-                logger.info(f"Processing: {progress:.1f}% ({frame_count}/{total_frames})")
-        # Cleanup
-        cap.release()
-        out.release()
-        # Step 4: Add audio back using ffmpeg
-        logger.info("🔊 Adding audio back to final video...")
-        success = add_audio_to_video(video_path, temp_video_path, output_path)
-        # Cleanup temporary file
-        try:
-            os.unlink(temp_video_path)
-        except:
-            pass
-        if success:
-            logger.info(f"✅ Green screen replacement with audio completed: {output_path}")
-            return True, "Background replacement with audio completed successfully"
-        else:
-            logger.warning("⚠️ Audio addition failed, but video processing completed")
-            # Move temp file to final output as fallback
-            try:
-                os.rename(temp_video_path, output_path)
-            except:
-                pass
-            return True, "Background replacement completed (audio may be missing)"
-    except Exception as e:
-        logger.error(f"❌ Error in green screen replacement: {e}")
-        return False, f"Background replacement error: {str(e)}"
-def add_audio_to_video(source_video: str, video_no_audio: str, output_path: str) -> bool:
-    """Add audio from source video to processed video using ffmpeg"""
-    try:
-        # Check if ffmpeg is available
-        try:
-            subprocess.run(['ffmpeg', '-version'], capture_output=True, check=True)
-        except (subprocess.CalledProcessError, FileNotFoundError):
-            logger.warning("⚠️ ffmpeg not available, skipping audio")
-            return False
-        # FFmpeg command to combine video (no audio) with audio from original
-        cmd = [
-            'ffmpeg', '-y',  # -y to overwrite output file
-            '-i', video_no_audio,  # Video input (no audio)
-            '-i', source_video,    # Audio source
-            '-c:v', 'copy',        # Copy video codec
-            '-c:a', 'aac',         # Audio codec
-            '-map', '0:v:0',       # Use video from first input
-            '-map', '1:a:0',       # Use audio from second input
-            '-shortest',           # End when shortest stream ends
-            output_path
-        ]
-        # Run ffmpeg
-        result = subprocess.run(cmd, capture_output=True, text=True)
-        if result.returncode == 0:
-            logger.info("✅ Audio successfully added to video")
-            return True
-        else:
-            logger.error(f"❌ ffmpeg error: {result.stderr}")
-            return False
-    except Exception as e:
-        logger.error(f"❌ Error adding audio: {e}")
-        return False
-# ===============================================================================
-# AI BACKGROUND GENERATION
-# ===============================================================================
 def generate_ai_background(prompt: str) -> Tuple[Optional[Image.Image], str]:
     """Generate AI background using Hugging Face Inference API"""
     try:
         if not prompt.strip():
             return None, "Please enter a prompt"
-        # Try multiple AI models for image generation
         models = [
-            "black-forest-labs/FLUX.1-schnell",  # Fast FLUX model
-            "stabilityai/stable-diffusion-xl-base-1.0",  # SDXL
-            "runwayml/stable-diffusion-v1-5"  # SD 1.5 fallback
         ]
-        # Enhanced prompt for backgrounds
         enhanced_prompt = f"professional video background, {prompt}, high quality, 16:9 aspect ratio, cinematic lighting, detailed"
         for model in models:
             try:
-                logger.info(f"🎨 Trying AI generation with {model}...")
-                # Hugging Face Inference API
                 api_url = f"https://api-inference.huggingface.co/models/{model}"
                 headers = {
                     "Authorization": f"Bearer {os.getenv('HUGGINGFACE_TOKEN', 'hf_placeholder')}"
                 }
                 payload = {
                     "inputs": enhanced_prompt,
                     "parameters": {
                         "width": 1024,
-                        "height": 576,  # 16:9 aspect ratio
                         "num_inference_steps": 20,
                         "guidance_scale": 7.5
                     }
@@ -835,27 +405,22 @@ def generate_ai_background(prompt: str) -> Tuple[Optional[Image.Image], str]:
                 response = requests.post(api_url, headers=headers, json=payload, timeout=30)
                 if response.status_code == 200:
-                    # Success! Convert response to image
                     image = Image.open(io.BytesIO(response.content))
-                    logger.info(f"✅ AI background generated successfully with {model}")
-                    return image, f"✅ AI background generated: {prompt}"
                 elif response.status_code == 503:
-                    # Model loading, try next
-                    logger.warning(f"⏳ Model {model} is loading, trying next...")
                     continue
                 else:
-                    logger.warning(f"⚠️ Error with {model}: {response.status_code}")
                     continue
             except Exception as e:
-                logger.warning(f"⚠️ Error with {model}: {e}")
                 continue
-        # If all AI models fail, create an intelligent gradient fallback
-        logger.info("🔄 AI generation failed, creating intelligent gradient fallback...")
-        return create_intelligent_gradient(prompt), f"✅ Created gradient background inspired by: {prompt}"
     except Exception as e:
         logger.error(f"Error in AI background generation: {e}")
@@ -865,47 +430,16 @@ def create_intelligent_gradient(prompt: str) -> Image.Image:
     """Create intelligent gradient based on prompt analysis"""
     prompt_lower = prompt.lower()
-    # Analyze prompt for colors and themes
     if any(word in prompt_lower for word in ["sunset", "orange", "warm", "fire", "autumn"]):
         return create_gradient_background("sunset", 1920, 1080)
     elif any(word in prompt_lower for word in ["ocean", "sea", "blue", "water", "sky", "calm"]):
         return create_gradient_background("ocean", 1920, 1080)
     elif any(word in prompt_lower for word in ["forest", "green", "nature", "trees", "jungle"]):
         return create_gradient_background("forest", 1920, 1080)
-    elif any(word in prompt_lower for word in ["night", "dark", "purple", "space", "cosmic"]):
-        return create_cosmic_gradient(1920, 1080)
-    elif any(word in prompt_lower for word in ["professional", "business", "corporate", "office"]):
-        return create_professional_gradient(1920, 1080)
     else:
         return create_gradient_background("default", 1920, 1080)
-def create_cosmic_gradient(width: int, height: int) -> Image.Image:
-    """Create a cosmic/space gradient"""
-    img = np.zeros((height, width, 3), dtype=np.uint8)
-    for i in range(height):
-        ratio = i / height
-        r = int(25 * (1 - ratio) + 75 * ratio)
-        g = int(25 * (1 - ratio) + 0 * ratio)
-        b = int(112 * (1 - ratio) + 130 * ratio)
-        img[i, :] = [r, g, b]
-    return Image.fromarray(img)
-def create_professional_gradient(width: int, height: int) -> Image.Image:
-    """Create a professional business gradient"""
-    img = np.zeros((height, width, 3), dtype=np.uint8)
-    for i in range(height):
-        ratio = i / height
-        r = int(240 * (1 - ratio) + 200 * ratio)
-        g = int(240 * (1 - ratio) + 200 * ratio)
-        b = int(240 * (1 - ratio) + 200 * ratio)
-        img[i, :] = [r, g, b]
-    return Image.fromarray(img)
-# ===============================================================================
-# MAIN PROCESSING FUNCTIONS
-# ===============================================================================
-def process_video_with_background(
     input_video: Optional[str],
     myavatar_selection: str,
     background_type: str,
@@ -913,10 +447,16 @@ def process_video_with_background(
     solid_color: str,
     custom_background: Optional[str],
     ai_prompt: str
-) -> Tuple[Optional[str], str]:
-    """Main video processing function"""
     try:
-        # Determine input video source
         video_path = None
         if input_video:
             video_path = input_video
@@ -924,7 +464,6 @@ def process_video_with_background(
         elif myavatar_selection and myavatar_selection != "No videos available":
             video_url = myavatar_api.get_video_url(myavatar_selection)
             if video_url:
-                # Download video temporarily
                 response = requests.get(video_url)
                 if response.status_code == 200:
                     temp_video = tempfile.NamedTemporaryFile(suffix='.mp4', delete=False)
@@ -932,28 +471,15 @@ def process_video_with_background(
                     temp_video.close()
                     video_path = temp_video.name
                     logger.info("Using MyAvatar video")
-                else:
-                    return None, "❌ Failed to download MyAvatar video"
-            else:
-                return None, "❌ Could not get video URL from MyAvatar"
         if not video_path:
-            return None, "❌ No video provided"
-        # Step 1: Create green screen version using SAM2
-        with tempfile.NamedTemporaryFile(suffix='_greenscreen.mp4', delete=False) as tmp_green:
-            green_video_path = tmp_green.name
-        logger.info("🎬 Step 1: Creating green screen version with SAM2...")
-        success, message = sam2_segmenter.segment_video(video_path, green_video_path)
-        if not success:
-            return None, f"❌ SAM2 segmentation failed: {message}"
-        # Step 2: Generate background
-        logger.info("🎨 Step 2: Generating background...")
         background_image = None
         if background_type == "gradient":
             background_image = create_gradient_background(gradient_type, 1920, 1080)
         elif background_type == "solid":
@@ -962,81 +488,75 @@ def process_video_with_background(
             background_image = Image.open(custom_background)
         elif background_type == "ai" and ai_prompt:
             bg_img, ai_msg = generate_ai_background(ai_prompt)
-            if bg_img:
-                background_image = bg_img
-            else:
-                return None, f"❌ AI background generation failed: {ai_msg}"
         if not background_image:
-            return None, "❌ No background generated"
-        # Step 3: Replace green screen with background
-        logger.info("🔄 Step 3: Replacing green screen with background...")
-        with tempfile.NamedTemporaryFile(suffix='_final.mp4', delete=False) as tmp_final:
             final_video_path = tmp_final.name
-        success, message = replace_green_screen(green_video_path, background_image, final_video_path)
-        # Cleanup temporary files
         try:
-            os.unlink(green_video_path)
-            if video_path != input_video:  # Don't delete uploaded file
                 os.unlink(video_path)
         except:
             pass
-        if success:
-            logger.info("✅ Video processing completed successfully!")
-            return final_video_path, "✅ Video processing completed successfully!"
         else:
-            return None, f"❌ Background replacement failed: {message}"
     except Exception as e:
-        logger.error(f"❌ Error in video processing: {e}")
-        return None, f"❌ Processing error: {str(e)}"
-# ===============================================================================
-# GRADIO INTERFACE
-# ===============================================================================
 def create_interface():
     """Create the Gradio interface"""
     logger.info("Creating Gradio interface...")
-    logger.info(f"Device: {DEVICE} | GPU: {GPU_NAME} | Memory: {GPU_MEMORY:.1f}GB | Type: {MODEL_SIZE}")
-    # Custom CSS
     css = """
     .main-container { max-width: 1200px; margin: 0 auto; }
     .status-box { border: 2px solid #4CAF50; border-radius: 10px; padding: 15px; }
     .gradient-preview { border: 2px solid #ddd; border-radius: 10px; }
     """
-    with gr.Blocks(css=css, title="🎬 BackgroundFX Pro") as app:
-        # Header
         gr.Markdown("""
-        # 🎬 BackgroundFX Pro
-        ### Professional Video Background Replacement with SAM2 Segmentation
         """)
-        # System Status
         with gr.Row():
             gr.Markdown(f"""
-            **System Status:** 🟢 Online | **GPU:** {GPU_NAME} | **SAM2:** {'✅ Ready' if SAM2_AVAILABLE else '❌ Not Available'}
             """)
-        # Main Interface
         with gr.Row():
-            # Left Column - Input
             with gr.Column(scale=1):
-                gr.Markdown("## 📹 Video Input")
                 with gr.Tabs():
-                    with gr.Tab("📁 Upload Video"):
                         video_upload = gr.Video(label="Upload Video File", height=300)
-                    with gr.Tab("📱 MyAvatar Videos"):
-                        refresh_btn = gr.Button("🔄 Refresh Videos", size="sm")
                         myavatar_dropdown = gr.Dropdown(
                             label="Select MyAvatar Video",
                             choices=["Click refresh to load videos"],
@@ -1044,7 +564,7 @@ def create_interface():
                         )
                         video_preview = gr.Video(label="Preview", height=200)
-                gr.Markdown("## 🎨 Background Options")
                 background_type = gr.Radio(
                     choices=["gradient", "solid", "custom", "ai"],
@@ -1053,7 +573,6 @@ def create_interface():
                 )
                 with gr.Group():
-                    # Gradient options
                     gradient_type = gr.Dropdown(
                         choices=["sunset", "ocean", "forest", "default"],
                         value="sunset",
@@ -1062,7 +581,6 @@ def create_interface():
                     )
                     gradient_preview = gr.Image(label="Gradient Preview", height=150)
-                    # Solid color options
                     solid_color = gr.Dropdown(
                         choices=["white", "black", "blue", "green", "red", "purple", "orange", "yellow"],
                         value="blue",
@@ -1071,28 +589,26 @@ def create_interface():
                     )
                     color_preview = gr.Image(label="Color Preview", height=150, visible=False)
-                    # Custom background upload
                     custom_bg_upload = gr.Image(
                         label="Upload Custom Background",
                         type="filepath",
                         visible=False
                     )
-                    # AI generation
                     ai_prompt = gr.Textbox(
                         label="AI Background Prompt",
                         placeholder="Describe the background you want...",
                         visible=False
                     )
-                    ai_generate_btn = gr.Button("🤖 Generate AI Background", visible=False)
                     ai_preview = gr.Image(label="AI Generated Background", height=150, visible=False)
-                # Process button
-                process_btn = gr.Button("🎬 Process Video", variant="primary", size="lg")
-            # Right Column - Output
             with gr.Column(scale=1):
-                gr.Markdown("## 🎯 Results")
                 result_video = gr.Video(label="Processed Video", height=400)
@@ -1103,21 +619,18 @@ def create_interface():
                     elem_classes=["status-box"]
                 )
-                # Processing info
                 gr.Markdown("""
-                ### 🔧 Processing Steps:
-                1. **SAM2 Segmentation** - Extract person from video
-                2. **Green Screen Creation** - Replace background with green
-                3. **Background Replacement** - Apply your chosen background
-                4. **Final Rendering** - Output processed video
-                **Estimated Time:** 2-5 minutes depending on video length
                 """)
-        # ===== EVENT HANDLERS (All defined after components) =====
         def update_background_options(bg_type):
-            """Update visible background options based on type"""
             return {
                 gradient_type: gr.update(visible=(bg_type == "gradient")),
                 gradient_preview: gr.update(visible=(bg_type == "gradient")),
@@ -1130,23 +643,18 @@ def update_background_options(bg_type):
             }
         def update_gradient_preview(grad_type):
-            """Update gradient preview"""
             try:
-                img = create_gradient_background(grad_type, 400, 200)
-                return img
             except:
                 return None
         def update_color_preview(color):
-            """Update solid color preview"""
             try:
-                img = create_solid_color(color, 400, 200)
-                return img
             except:
                 return None
         def refresh_myavatar_videos():
-            """Refresh MyAvatar video list"""
             try:
                 choices = myavatar_api.get_video_choices()
                 return gr.update(choices=choices, value=None)
@@ -1155,7 +663,6 @@ def refresh_myavatar_videos():
                 return gr.update(choices=["Error loading videos"])
         def load_video_preview(selection):
-            """Load video preview from MyAvatar selection"""
             try:
                 if not selection or selection == "No videos available":
                     return None
@@ -1167,7 +674,6 @@ def load_video_preview(selection):
                 return None
         def generate_ai_bg(prompt):
-            """Generate AI background"""
             bg_img, message = generate_ai_background(prompt)
             return bg_img
@@ -1209,7 +715,7 @@ def generate_ai_bg(prompt):
         )
         process_btn.click(
-            fn=process_video_with_background,
             inputs=[
                 video_upload,
                 myavatar_dropdown,
@@ -1219,10 +725,14 @@ def generate_ai_bg(prompt):
                 custom_bg_upload,
                 ai_prompt
             ],
-            outputs=[result_video, status_output]
         )
-        # Initialize gradient preview
         app.load(
             fn=lambda: create_gradient_background("sunset", 400, 200),
             outputs=[gradient_preview]
@@ -1230,19 +740,16 @@ def generate_ai_bg(prompt):
     return app
-# ===============================================================================
-# MAIN APPLICATION
-# ===============================================================================
 def main():
     """Main application entry point"""
     try:
-        # Pre-load AI models
-        if SAM2_AVAILABLE or MATANYONE_AVAILABLE:
-            logger.info("Pre-loading AI models...")
-            sam2_segmenter.load_models()
-        # Create and launch interface
         app = create_interface()
         app.launch(
@@ -1254,7 +761,7 @@ def main():
         )
     except Exception as e:
-        logger.error(f"❌ Failed to start application: {e}")
         sys.exit(1)
 if __name__ == "__main__":

 #!/usr/bin/env python3
 """
+BackgroundFX Pro - GPU Optimized Version
+Professional video background replacement with SAM2 + MatAnyone
 """
 import os
 import requests
 import tempfile
 import subprocess
+import threading
 import numpy as np
 import io
 from PIL import Image
 import gradio as gr
+# Import optimized modules
+from utils.accelerator import pick_device, torch_global_tuning, memory_checkpoint, cleanup
+from models.sam2_loader import SAM2Predictor
+from models.matanyone_loader import MatAnyoneSession
+# Configure logging
 logging.basicConfig(
     level=logging.INFO,
     format='%(asctime)s - %(levelname)s - %(message)s'
     SKLEARN_AVAILABLE = True
 except ImportError:
     SKLEARN_AVAILABLE = False
+    logger.warning("sklearn not available, using fallback color detection")
+# Global processing control
+processing_active = False
+processing_thread = None
+# Initialize optimized system
+device = pick_device()
+torch_global_tuning()
+GPU_NAME = torch.cuda.get_device_name(0) if torch.cuda.is_available() else "CPU"
+GPU_MEMORY = torch.cuda.get_device_properties(0).total_memory / (1024**3) if torch.cuda.is_available() else 0
+MODEL_SIZE = "large" if "T4" in GPU_NAME else "base"
+logger.info(f"System initialized - Device: {device} | GPU: {GPU_NAME} | Memory: {GPU_MEMORY:.1f}GB")
+# Environment variables for model control
+SAM2_ENABLED = os.environ.get("ENABLE_SAM2", "1") == "1"
+MATANY_ENABLED = os.environ.get("ENABLE_MATANY", "1") == "1"
+MAX_SIDE = int(os.environ.get("MAX_SIDE", "1280"))
+FRAME_CHUNK = int(os.environ.get("FRAME_CHUNK", "64"))
+# Global optimized model instances
+sam2_predictor = None
+matanyone_session = None
+def get_sam2():
+    """Get SAM2 predictor with lazy loading"""
+    global sam2_predictor
+    if sam2_predictor is None and SAM2_ENABLED:
         try:
+            sam2_predictor = SAM2Predictor(device).load()
+            logger.info("SAM2 loaded with optimized pipeline")
         except Exception as e:
+            logger.error(f"SAM2 loading failed: {e}")
+            sam2_predictor = None
+    return sam2_predictor
+def get_matanyone():
+    """Get MatAnyone session with lazy loading"""
+    global matanyone_session
+    if matanyone_session is None and MATANY_ENABLED:
         try:
+            repo_id = os.environ.get("MATANY_REPO_ID", "PeiqingYang/MatAnyone")
+            filename = os.environ.get("MATANY_FILENAME", "matanyone_v1.0.pth")
+            matanyone_session = MatAnyoneSession(device).load(
+                repo_id=repo_id,
+                filename=filename
             )
+            logger.info("MatAnyone loaded with optimized pipeline")
         except Exception as e:
+            logger.error(f"MatAnyone loading failed: {e}")
+            matanyone_session = None
+    return matanyone_session
+def iter_video_frames(path, target_max_side=MAX_SIDE, chunk=FRAME_CHUNK):
+    """Memory-mapped video frame generator"""
+    import cv2
+    cap = cv2.VideoCapture(path)
+    if not cap.isOpened():
+        raise RuntimeError("Cannot open video")
+    # Get video properties
+    w = int(cap.get(cv2.CAP_PROP_FRAME_WIDTH))
+    h = int(cap.get(cv2.CAP_PROP_FRAME_HEIGHT))
+    fps = cap.get(cv2.CAP_PROP_FPS) or 25.0
+    # Scale to fit GPU memory constraints
+    scale = min(1.0, float(target_max_side) / float(max(w, h)))
+    new_w, new_h = (w, h) if scale >= 0.999 else (int(w*scale)//2*2, int(h*scale)//2*2)
+    batch = []
+    while True:
+        if not processing_active:
             cap.release()
+            return
+        ok, f = cap.read()
+        if not ok:
+            if batch:
+                yield batch, fps, (w, h), (new_w, new_h)
+            break
+        if new_w != w or new_h != h:
+            f = cv2.resize(f, (new_w, new_h), interpolation=cv2.INTER_AREA)
+        f = cv2.cvtColor(f, cv2.COLOR_BGR2RGB)
+        batch.append(f)
+        if len(batch) >= chunk:
+            yield batch, fps, (w, h), (new_w, new_h)
+            batch = []
+    cap.release()
+def composite_frame(frame_rgb, bg_rgb, alpha01):
+    """GPU-optimized frame compositing"""
+    if bg_rgb is None:
+        bg = np.full_like(frame_rgb, 200, dtype=np.uint8)
+    else:
+        bg = bg_rgb
+        if bg.shape[:2] != frame_rgb.shape[:2]:
+            bg = cv2.resize(bg, (frame_rgb.shape[1], frame_rgb.shape[0]), interpolation=cv2.INTER_AREA)
+    a = np.clip(alpha01[..., None], 0.0, 1.0)
+    out = (frame_rgb.astype("float32") * a + bg.astype("float32") * (1.0 - a)).astype("uint8")
+    return out
+def cheap_fallback_alpha(fr, seed_mask=None):
+    """Fast CPU fallback alpha generation"""
+    if seed_mask is not None:
+        return seed_mask
+    # Center-focused soft alpha
+    H, W = fr.shape[:2]
+    yy, xx = np.mgrid[0:H, 0:W].astype("float32")
+    cx, cy = W/2.0, H/2.0
+    r = np.sqrt((xx-cx)**2 + (yy-cy)**2) / max(W, H)
+    a = 1.0 - np.clip((r-0.2)/0.4, 0.0, 1.0)
+    return a.astype("float32")
+def process_video_gpu_optimized(input_path, bg_image_rgb=None, out_path="output.mp4"):
+    """GPU-optimized video processing pipeline"""
+    global processing_active
+    writer = None
+    seed_mask = None
+    total = 0
+    try:
+        for frames, fps, orig_hw, new_hw in iter_video_frames(input_path, MAX_SIDE, FRAME_CHUNK):
+            if not processing_active:
+                logger.info("Processing stopped by user")
+                break
+            H, W = frames[0].shape[:2]
+            if writer is None:
+                writer = cv2.VideoWriter(
+                    out_path, cv2.VideoWriter_fourcc(*"mp4v"), fps, (W, H)
+                )
+            # First frame: try SAM2 for seed mask
+            if seed_mask is None:
+                try:
+                    sam2 = get_sam2()
+                    if sam2:
+                        seed_mask = sam2.first_frame_mask(frames[0].astype("float32") / 255.0)
+                        seed_mask = (cv2.GaussianBlur(seed_mask, (0, 0), 1.0) > 0.5).astype("float32")
+                        logger.info("SAM2 seed mask generated")
+                except Exception as e:
+                    logger.warning(f"SAM2 failed, continuing without: {e}")
+                    seed_mask = None
+            # Professional matting pipeline
+            matany = get_matanyone()
+            if matany and MATANY_ENABLED:
+                try:
+                    with torch.autocast(device_type=str(device).split(":")[0], dtype=torch.float16, enabled=(device.type=="cuda")):
+                        for i, fr in enumerate(frames):
+                            if not processing_active:
+                                break
+                            alpha = matany.step(fr, seed_mask if total == 0 and i == 0 else None)
+                            comp = composite_frame(fr, bg_image_rgb, alpha)
+                            writer.write(cv2.cvtColor(comp, cv2.COLOR_RGB2BGR))
+                            total += 1
+                            if total % 64 == 0:
+                                cleanup()
+                                memory_checkpoint(f"frames={total}")
+                except Exception as e:
+                    logger.warning(f"MatAnyone failed: {e}")
+                    matany = None
+            # Fallback if MatAnyone unavailable
+            if not matany:
+                for fr in frames:
+                    if not processing_active:
+                        break
+                    alpha = cheap_fallback_alpha(fr, seed_mask)
+                    comp = composite_frame(fr, bg_image_rgb, alpha)
+                    writer.write(cv2.cvtColor(comp, cv2.COLOR_RGB2BGR))
+                    total += 1
+                    if total % 64 == 0:
+                        cleanup()
+            memory_checkpoint(f"processed={total}")
+    except Exception as e:
+        logger.error(f"Processing error: {e}")
+    finally:
+        if writer:
+            writer.release()
+        cleanup()
+    return out_path if processing_active else None
+def stop_processing():
+    """Stop video processing"""
+    global processing_active
+    processing_active = False
+    return gr.update(visible=False), "Processing stopped by user"
 class MyAvatarAPI:
+    """MyAvatar API integration"""
     def __init__(self):
         self.api_base = "https://app.myavatar.dk/api"
     def fetch_videos(self) -> List[Dict[str, Any]]:
         """Fetch videos from MyAvatar API"""
         try:
             if time.time() - self.last_refresh < 300 and self.videos_cache:
                 return self.videos_cache
                 data = response.json()
                 self.videos_cache = data.get('videos', [])
                 self.last_refresh = time.time()
+                logger.info(f"Fetched {len(self.videos_cache)} videos from MyAvatar")
                 return self.videos_cache
             else:
+                logger.error(f"API error: {response.status_code}")
                 return []
         except Exception as e:
+            logger.error(f"Error fetching videos: {e}")
             return []
     def get_video_choices(self) -> List[str]:
             return None
         try:
             if "(ID: " in selection:
                 video_id = selection.split("(ID: ")[1].split(")")[0]
                 for video in self.videos_cache:
                     if str(video.get('id')) == video_id:
                         return video.get('video_url')
             return None
         except Exception as e:
+            logger.error(f"Error extracting video URL: {e}")
             return None
+# Initialize API
 myavatar_api = MyAvatarAPI()
 def create_gradient_background(gradient_type: str, width: int, height: int) -> Image.Image:
     """Create gradient backgrounds"""
     try:
     except Exception as e:
         logger.error(f"Error creating gradient: {e}")
         img = np.full((height, width, 3), [70, 130, 180], dtype=np.uint8)
         return Image.fromarray(img)
     img = np.full((height, width, 3), rgb, dtype=np.uint8)
     return Image.fromarray(img)
 def generate_ai_background(prompt: str) -> Tuple[Optional[Image.Image], str]:
     """Generate AI background using Hugging Face Inference API"""
     try:
         if not prompt.strip():
             return None, "Please enter a prompt"
         models = [
+            "black-forest-labs/FLUX.1-schnell",
+            "stabilityai/stable-diffusion-xl-base-1.0",
+            "runwayml/stable-diffusion-v1-5"
         ]
         enhanced_prompt = f"professional video background, {prompt}, high quality, 16:9 aspect ratio, cinematic lighting, detailed"
         for model in models:
             try:
+                logger.info(f"Trying AI generation with {model}...")
                 api_url = f"https://api-inference.huggingface.co/models/{model}"
                 headers = {
                     "Authorization": f"Bearer {os.getenv('HUGGINGFACE_TOKEN', 'hf_placeholder')}"
                 }
                 payload = {
                     "inputs": enhanced_prompt,
                     "parameters": {
                         "width": 1024,
+                        "height": 576,
                         "num_inference_steps": 20,
                         "guidance_scale": 7.5
                     }
                 response = requests.post(api_url, headers=headers, json=payload, timeout=30)
                 if response.status_code == 200:
                     image = Image.open(io.BytesIO(response.content))
+                    logger.info(f"AI background generated successfully with {model}")
+                    return image, f"AI background generated: {prompt}"
                 elif response.status_code == 503:
+                    logger.warning(f"Model {model} is loading, trying next...")
                     continue
                 else:
+                    logger.warning(f"Error with {model}: {response.status_code}")
                     continue
             except Exception as e:
+                logger.warning(f"Error with {model}: {e}")
                 continue
+        logger.info("AI generation failed, creating intelligent gradient fallback...")
+        return create_intelligent_gradient(prompt), f"Created gradient background inspired by: {prompt}"
     except Exception as e:
         logger.error(f"Error in AI background generation: {e}")
     """Create intelligent gradient based on prompt analysis"""
     prompt_lower = prompt.lower()
     if any(word in prompt_lower for word in ["sunset", "orange", "warm", "fire", "autumn"]):
         return create_gradient_background("sunset", 1920, 1080)
     elif any(word in prompt_lower for word in ["ocean", "sea", "blue", "water", "sky", "calm"]):
         return create_gradient_background("ocean", 1920, 1080)
     elif any(word in prompt_lower for word in ["forest", "green", "nature", "trees", "jungle"]):
         return create_gradient_background("forest", 1920, 1080)
     else:
         return create_gradient_background("default", 1920, 1080)
+def process_video_with_background_stoppable(
     input_video: Optional[str],
     myavatar_selection: str,
     background_type: str,
     solid_color: str,
     custom_background: Optional[str],
     ai_prompt: str
+):
+    """Main processing function with stop capability"""
+    global processing_active
+    processing_active = True
     try:
+        # Show stop button, hide process button
+        yield gr.update(visible=False), gr.update(visible=True), None, "Starting processing..."
+        # Determine video source
         video_path = None
         if input_video:
             video_path = input_video
         elif myavatar_selection and myavatar_selection != "No videos available":
             video_url = myavatar_api.get_video_url(myavatar_selection)
             if video_url:
                 response = requests.get(video_url)
                 if response.status_code == 200:
                     temp_video = tempfile.NamedTemporaryFile(suffix='.mp4', delete=False)
                     temp_video.close()
                     video_path = temp_video.name
                     logger.info("Using MyAvatar video")
         if not video_path:
+            yield gr.update(visible=True), gr.update(visible=False), None, "No video provided"
+            return
+        # Generate background
+        yield gr.update(visible=False), gr.update(visible=True), None, "Generating background..."
         background_image = None
         if background_type == "gradient":
             background_image = create_gradient_background(gradient_type, 1920, 1080)
         elif background_type == "solid":
             background_image = Image.open(custom_background)
         elif background_type == "ai" and ai_prompt:
             bg_img, ai_msg = generate_ai_background(ai_prompt)
+            background_image = bg_img
         if not background_image:
+            yield gr.update(visible=True), gr.update(visible=False), None, "No background generated"
+            return
+        # Process video
+        yield gr.update(visible=False), gr.update(visible=True), None, "Processing video with GPU optimization..."
+        bg_array = np.array(background_image.resize((1280, 720), Image.Resampling.LANCZOS))
+        with tempfile.NamedTemporaryFile(suffix='_processed.mp4', delete=False) as tmp_final:
             final_video_path = tmp_final.name
+        result_path = process_video_gpu_optimized(video_path, bg_array, final_video_path)
+        # Cleanup
         try:
+            if video_path != input_video:
                 os.unlink(video_path)
         except:
             pass
+        if result_path and processing_active:
+            yield gr.update(visible=True), gr.update(visible=False), result_path, "Video processing completed successfully!"
         else:
+            yield gr.update(visible=True), gr.update(visible=False), None, "Processing was stopped or failed"
     except Exception as e:
+        logger.error(f"Error in video processing: {e}")
+        yield gr.update(visible=True), gr.update(visible=False), None, f"Processing error: {str(e)}"
+    finally:
+        processing_active = False
 def create_interface():
     """Create the Gradio interface"""
     logger.info("Creating Gradio interface...")
+    logger.info(f"Device: {device} | GPU: {GPU_NAME} | Memory: {GPU_MEMORY:.1f}GB")
     css = """
     .main-container { max-width: 1200px; margin: 0 auto; }
     .status-box { border: 2px solid #4CAF50; border-radius: 10px; padding: 15px; }
     .gradient-preview { border: 2px solid #ddd; border-radius: 10px; }
     """
+    with gr.Blocks(css=css, title="BackgroundFX Pro - GPU Optimized") as app:
         gr.Markdown("""
+        # BackgroundFX Pro - GPU Optimized
+        ### Professional Video Background Replacement with SAM2 + MatAnyone
         """)
         with gr.Row():
+            sam2_status = "Ready" if SAM2_ENABLED else "Disabled"
+            matany_status = "Ready" if MATANY_ENABLED else "Disabled"
             gr.Markdown(f"""
+            **System Status:** Online | **GPU:** {GPU_NAME} | **SAM2:** {sam2_status} | **MatAnyone:** {matany_status}
             """)
         with gr.Row():
             with gr.Column(scale=1):
+                gr.Markdown("## Video Input")
                 with gr.Tabs():
+                    with gr.Tab("Upload Video"):
                         video_upload = gr.Video(label="Upload Video File", height=300)
+                    with gr.Tab("MyAvatar Videos"):
+                        refresh_btn = gr.Button("Refresh Videos", size="sm")
                         myavatar_dropdown = gr.Dropdown(
                             label="Select MyAvatar Video",
                             choices=["Click refresh to load videos"],
                         )
                         video_preview = gr.Video(label="Preview", height=200)
+                gr.Markdown("## Background Options")
                 background_type = gr.Radio(
                     choices=["gradient", "solid", "custom", "ai"],
                 )
                 with gr.Group():
                     gradient_type = gr.Dropdown(
                         choices=["sunset", "ocean", "forest", "default"],
                         value="sunset",
                     )
                     gradient_preview = gr.Image(label="Gradient Preview", height=150)
                     solid_color = gr.Dropdown(
                         choices=["white", "black", "blue", "green", "red", "purple", "orange", "yellow"],
                         value="blue",
                     )
                     color_preview = gr.Image(label="Color Preview", height=150, visible=False)
                     custom_bg_upload = gr.Image(
                         label="Upload Custom Background",
                         type="filepath",
                         visible=False
                     )
                     ai_prompt = gr.Textbox(
                         label="AI Background Prompt",
                         placeholder="Describe the background you want...",
                         visible=False
                     )
+                    ai_generate_btn = gr.Button("Generate AI Background", visible=False)
                     ai_preview = gr.Image(label="AI Generated Background", height=150, visible=False)
+                with gr.Row():
+                    process_btn = gr.Button("Process Video", variant="primary", size="lg")
+                    stop_btn = gr.Button("Stop Processing", variant="stop", size="lg", visible=False)
             with gr.Column(scale=1):
+                gr.Markdown("## Results")
                 result_video = gr.Video(label="Processed Video", height=400)
                     elem_classes=["status-box"]
                 )
                 gr.Markdown("""
+                ### Processing Pipeline:
+                1. **SAM2 Segmentation** - GPU-accelerated person detection
+                2. **MatAnyone Matting** - Professional temporal consistency
+                3. **GPU Compositing** - Real-time background replacement
+                4. **Memory Optimization** - Chunked processing for efficiency
+                **Performance:** ~3-5 minutes per 1000 frames on T4 GPU
                 """)
+        # Event handlers
         def update_background_options(bg_type):
             return {
                 gradient_type: gr.update(visible=(bg_type == "gradient")),
                 gradient_preview: gr.update(visible=(bg_type == "gradient")),
             }
         def update_gradient_preview(grad_type):
             try:
+                return create_gradient_background(grad_type, 400, 200)
             except:
                 return None
         def update_color_preview(color):
             try:
+                return create_solid_color(color, 400, 200)
             except:
                 return None
         def refresh_myavatar_videos():
             try:
                 choices = myavatar_api.get_video_choices()
                 return gr.update(choices=choices, value=None)
                 return gr.update(choices=["Error loading videos"])
         def load_video_preview(selection):
             try:
                 if not selection or selection == "No videos available":
                     return None
                 return None
         def generate_ai_bg(prompt):
             bg_img, message = generate_ai_background(prompt)
             return bg_img
         )
         process_btn.click(
+            fn=process_video_with_background_stoppable,
             inputs=[
                 video_upload,
                 myavatar_dropdown,
                 custom_bg_upload,
                 ai_prompt
             ],
+            outputs=[process_btn, stop_btn, result_video, status_output]
+        )
+        stop_btn.click(
+            fn=stop_processing,
+            outputs=[stop_btn, status_output]
         )
         app.load(
             fn=lambda: create_gradient_background("sunset", 400, 200),
             outputs=[gradient_preview]
     return app
 def main():
     """Main application entry point"""
     try:
+        # Pre-warm models
+        logger.info("Pre-warming GPU models...")
+        if SAM2_ENABLED:
+            get_sam2()
+        if MATANY_ENABLED:
+            get_matanyone()
         app = create_interface()
         app.launch(
         )
     except Exception as e:
+        logger.error(f"Failed to start application: {e}")
         sys.exit(1)
 if __name__ == "__main__":