MogensR committed on
Commit
87680ff
Β·
1 Parent(s): 6fd9fe7

Update to Streamlit UI with new features and logo

Browse files
Dockerfile CHANGED
@@ -1,6 +1,6 @@
1
  # ===============================
2
  # Hugging Face Space β€” Stable Dockerfile
3
- # CUDA 12.1.1 + PyTorch 2.5.1 (cu121) + Gradio 4.41.3
4
  # SAM2 installed from source; MatAnyone via pip (repo)
5
  # ===============================
6
 
@@ -20,7 +20,9 @@ ENV DEBIAN_FRONTEND=noninteractive \
20
  NUMEXPR_NUM_THREADS=1 \
21
  HF_HOME=/home/user/app/.hf \
22
  TORCH_HOME=/home/user/app/.torch \
23
- GRADIO_SERVER_PORT=7860
 
 
24
 
25
  # ---- Non-root user ----
26
  RUN useradd -m -u 1000 user
@@ -34,7 +36,7 @@ RUN apt-get update && apt-get install -y --no-install-recommends \
34
  build-essential gcc g++ pkg-config \
35
  libffi-dev libssl-dev libc6-dev \
36
  libgl1-mesa-glx libglib2.0-0 libsm6 libxext6 libxrender1 libgomp1 \
37
- && rm -rf /var/lib/apt/lists/*
38
 
39
  # ---- Python bootstrap ----
40
  RUN python3 -m pip install --upgrade pip setuptools wheel
@@ -42,17 +44,11 @@ RUN python3 -m pip install --upgrade pip setuptools wheel
42
  # ---- Install PyTorch (CUDA 12.1 wheels) ----
43
  RUN python3 -m pip install --no-cache-dir --index-url https://download.pytorch.org/whl/cu121 \
44
  torch==2.5.1 torchvision==0.20.1 torchaudio==2.5.1 \
45
- && python3 - <<'PY'
46
  import torch
47
  print("PyTorch:", torch.__version__)
48
  print("CUDA available:", torch.cuda.is_available())
49
  print("torch.version.cuda:", getattr(torch.version, "cuda", None))
50
- try:
51
- import torchaudio, torchvision
52
- print("torchaudio:", torchaudio.__version__)
53
- import torchvision as tv; print("torchvision:", tv.__version__)
54
- except Exception as e:
55
- print("aux libs check:", e)
56
  PY
57
 
58
  # ---- Copy deps first (better caching) ----
@@ -92,19 +88,20 @@ RUN mkdir -p /home/user/app/checkpoints /home/user/app/.hf /home/user/app/.torch
92
  chmod -R 755 /home/user/app && \
93
  find /home/user/app -type d -exec chmod 755 {} \; && \
94
  find /home/user/app -type f -exec chmod 644 {} \; && \
95
- chmod +x /home/user/app/ui.py || true
96
 
97
- # ---- Healthcheck (use exec-form, no heredoc) ----
98
  HEALTHCHECK --interval=30s --timeout=5s --retries=3 CMD \
99
  ["python3","-c","import torch; print('torch', torch.__version__, '| cuda', getattr(torch.version,'cuda',None), '| ok=', torch.cuda.is_available())"]
100
 
101
  # ---- Runtime ----
102
  USER user
103
- EXPOSE 7860
104
 
 
105
  CMD ["sh", "-c", "\
106
  echo '===========================================' && \
107
- echo '=== BACKGROUNDFX PRO CONTAINER STARTUP ===' && \
108
  echo '===========================================' && \
109
  echo 'Timestamp:' $(date) && \
110
  echo 'Current directory:' $(pwd) && \
@@ -115,23 +112,22 @@ CMD ["sh", "-c", "\
115
  echo 'Files in app directory:' && \
116
  ls -la && \
117
  echo '' && \
118
- echo '=== UI.PY VERIFICATION ===' && \
119
- if [ -f ui.py ]; then \
120
- echo 'βœ… ui.py found' && \
121
- echo 'File size:' $(wc -c < ui.py) 'bytes' && \
122
- echo 'File permissions:' $(ls -l ui.py) && \
123
  echo 'Testing Python imports...' && \
124
- python3 -B -c 'import gradio; print(\"βœ… Gradio:\", gradio.__version__)' && \
125
  python3 -B -c 'import torch; print(\"βœ… Torch:\", torch.__version__)' && \
126
- echo 'Testing ui.py import...' && \
127
- python3 -B -c 'import sys; sys.path.insert(0, \".\"); import ui; print(\"βœ… ui.py imports successfully\")' && \
128
  echo 'βœ… All checks passed!'; \
129
  else \
130
- echo '❌ ERROR: ui.py not found!' && \
131
  exit 1; \
132
  fi && \
133
  echo '' && \
134
- echo '=== STARTING APPLICATION ===' && \
135
- echo 'Launching ui.py with bytecode disabled...' && \
136
- python3 -B -u ui.py \
137
- "]
 
1
  # ===============================
2
  # Hugging Face Space β€” Stable Dockerfile
3
+ # CUDA 12.1.1 + PyTorch 2.5.1 (cu121) + Streamlit 1.32.0
4
  # SAM2 installed from source; MatAnyone via pip (repo)
5
  # ===============================
6
 
 
20
  NUMEXPR_NUM_THREADS=1 \
21
  HF_HOME=/home/user/app/.hf \
22
  TORCH_HOME=/home/user/app/.torch \
23
+ STREAMLIT_SERVER_PORT=8501 \
24
+ STREAMLIT_SERVER_HEADLESS=true \
25
+ STREAMLIT_BROWSER_GATHER_USAGE_STATS=false
26
 
27
  # ---- Non-root user ----
28
  RUN useradd -m -u 1000 user
 
36
  build-essential gcc g++ pkg-config \
37
  libffi-dev libssl-dev libc6-dev \
38
  libgl1-mesa-glx libglib2.0-0 libsm6 libxext6 libxrender1 libgomp1 \
39
+ && rm -rf /var/lib/apt/lists/*
40
 
41
  # ---- Python bootstrap ----
42
  RUN python3 -m pip install --upgrade pip setuptools wheel
 
44
  # ---- Install PyTorch (CUDA 12.1 wheels) ----
45
  RUN python3 -m pip install --no-cache-dir --index-url https://download.pytorch.org/whl/cu121 \
46
  torch==2.5.1 torchvision==0.20.1 torchaudio==2.5.1 \
47
+ && python3 - <<'PY'
48
  import torch
49
  print("PyTorch:", torch.__version__)
50
  print("CUDA available:", torch.cuda.is_available())
51
  print("torch.version.cuda:", getattr(torch.version, "cuda", None))
 
 
 
 
 
 
52
  PY
53
 
54
  # ---- Copy deps first (better caching) ----
 
88
  chmod -R 755 /home/user/app && \
89
  find /home/user/app -type d -exec chmod 755 {} \; && \
90
  find /home/user/app -type f -exec chmod 644 {} \; && \
91
+ chmod +x /home/user/app/app.py || true
92
 
93
+ # ---- Healthcheck ----
94
  HEALTHCHECK --interval=30s --timeout=5s --retries=3 CMD \
95
  ["python3","-c","import torch; print('torch', torch.__version__, '| cuda', getattr(torch.version,'cuda',None), '| ok=', torch.cuda.is_available())"]
96
 
97
  # ---- Runtime ----
98
  USER user
99
+ EXPOSE 8501
100
 
101
+ # Streamlit server command
102
  CMD ["sh", "-c", "\
103
  echo '===========================================' && \
104
+ echo '=== MYAVATAR STREAMLIT CONTAINER STARTUP ===' && \
105
  echo '===========================================' && \
106
  echo 'Timestamp:' $(date) && \
107
  echo 'Current directory:' $(pwd) && \
 
112
  echo 'Files in app directory:' && \
113
  ls -la && \
114
  echo '' && \
115
+ echo '=== APP.PY VERIFICATION ===' && \
116
+ if [ -f app.py ]; then \
117
+ echo 'βœ… app.py found' && \
118
+ echo 'File size:' $(wc -c < app.py) 'bytes' && \
119
+ echo 'File permissions:' $(ls -l app.py) && \
120
  echo 'Testing Python imports...' && \
121
+ python3 -B -c 'import streamlit; print(\"βœ… Streamlit:\", streamlit.__version__)' && \
122
  python3 -B -c 'import torch; print(\"βœ… Torch:\", torch.__version__)' && \
123
+ echo 'Testing app.py import...' && \
124
+ python3 -B -c 'import sys; sys.path.insert(0, \".\"); import app; print(\"βœ… app.py imports successfully\")' && \
125
  echo 'βœ… All checks passed!'; \
126
  else \
127
+ echo '❌ ERROR: app.py not found!' && \
128
  exit 1; \
129
  fi && \
130
  echo '' && \
131
+ echo '=== STARTING STREAMLIT SERVER ===' && \
132
+ streamlit run --server.port=8501 --server.address=0.0.0.0 app.py \
133
+ "]
 
VideoBackgroundReplacer2/.dockerignore ADDED
@@ -0,0 +1,78 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ # ===========================
2
+ # .dockerignore for HF Spaces
3
+ # ===========================
4
+
5
+ # VCS
6
+ .git
7
+ .gitignore
8
+ .gitattributes
9
+
10
+ # Python cache / build
11
+ __pycache__/
12
+ *.py[cod]
13
+ *.pyo
14
+ *.pyd
15
+ *.pdb
16
+ *.egg-info/
17
+ dist/
18
+ build/
19
+ .pytest_cache/
20
+ .python-version
21
+
22
+ # Virtual environments
23
+ .env
24
+ .venv/
25
+ env/
26
+ venv/
27
+
28
+ # External repos (cloned in Docker, not copied from local)
29
+ third_party/
30
+
31
+ # Hugging Face / Torch caches
32
+ .cache/
33
+ huggingface/
34
+ torch/
35
+ data/
36
+
37
+ # HF Space metadata/state
38
+ .hf_space/
39
+ space.log
40
+ gradio_cached_examples/
41
+ gradio_static/
42
+ __outputs__/
43
+
44
+ # Logs & temp files
45
+ *.log
46
+ logs/
47
+ tmp/
48
+ temp/
49
+ *.swp
50
+ .coverage
51
+ coverage.xml
52
+
53
+ # Media test assets
54
+ *.mp4
55
+ *.avi
56
+ *.mov
57
+ *.mkv
58
+ *.png
59
+ *.jpg
60
+ *.jpeg
61
+ *.gif
62
+
63
+ # OS / IDE cruft
64
+ .DS_Store
65
+ Thumbs.db
66
+ .vscode/
67
+ .idea/
68
+ *.sublime-project
69
+ *.sublime-workspace
70
+
71
+ # Node / frontend (if present)
72
+ node_modules/
73
+ npm-debug.log
74
+ yarn-debug.log
75
+ yarn-error.log
76
+
77
+ # ---- Optional: allow specific checkpoints if needed ----
78
+ !checkpoints/
VideoBackgroundReplacer2/5.0.0 ADDED
@@ -0,0 +1,60 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ Defaulting to user installation because normal site-packages is not writeable
2
+ Requirement already satisfied: gradio in c:\users\mogen\appdata\roaming\python\python313\site-packages (4.44.0)
3
+ Requirement already satisfied: aiofiles<24.0,>=22.0 in c:\users\mogen\appdata\roaming\python\python313\site-packages (from gradio) (23.2.1)
4
+ Requirement already satisfied: anyio<5.0,>=3.0 in c:\users\mogen\appdata\roaming\python\python313\site-packages (from gradio) (4.9.0)
5
+ Requirement already satisfied: fastapi<1.0 in c:\users\mogen\appdata\roaming\python\python313\site-packages (from gradio) (0.115.12)
6
+ Requirement already satisfied: ffmpy in c:\users\mogen\appdata\roaming\python\python313\site-packages (from gradio) (0.6.1)
7
+ Requirement already satisfied: gradio-client==1.3.0 in c:\users\mogen\appdata\roaming\python\python313\site-packages (from gradio) (1.3.0)
8
+ Requirement already satisfied: httpx>=0.24.1 in c:\users\mogen\appdata\roaming\python\python313\site-packages (from gradio) (0.27.2)
9
+ Requirement already satisfied: huggingface-hub>=0.19.3 in c:\users\mogen\appdata\roaming\python\python313\site-packages (from gradio) (0.34.4)
10
+ Requirement already satisfied: importlib-resources<7.0,>=1.3 in c:\users\mogen\appdata\roaming\python\python313\site-packages (from gradio) (6.5.2)
11
+ Requirement already satisfied: jinja2<4.0 in c:\users\mogen\appdata\roaming\python\python313\site-packages (from gradio) (3.1.6)
12
+ Requirement already satisfied: markupsafe~=2.0 in c:\users\mogen\appdata\roaming\python\python313\site-packages (from gradio) (2.1.5)
13
+ Requirement already satisfied: matplotlib~=3.0 in c:\users\mogen\appdata\roaming\python\python313\site-packages (from gradio) (3.10.5)
14
+ Requirement already satisfied: numpy<3.0,>=1.0 in c:\users\mogen\appdata\roaming\python\python313\site-packages (from gradio) (1.26.4)
15
+ Requirement already satisfied: orjson~=3.0 in c:\users\mogen\appdata\roaming\python\python313\site-packages (from gradio) (3.11.2)
16
+ Requirement already satisfied: packaging in c:\users\mogen\appdata\roaming\python\python313\site-packages (from gradio) (24.2)
17
+ Requirement already satisfied: pandas<3.0,>=1.0 in c:\users\mogen\appdata\roaming\python\python313\site-packages (from gradio) (2.2.3)
18
+ Requirement already satisfied: pillow<11.0,>=8.0 in c:\users\mogen\appdata\roaming\python\python313\site-packages (from gradio) (10.4.0)
19
+ Requirement already satisfied: pydantic>=2.0 in c:\users\mogen\appdata\roaming\python\python313\site-packages (from gradio) (2.11.5)
20
+ Requirement already satisfied: pydub in c:\users\mogen\appdata\roaming\python\python313\site-packages (from gradio) (0.25.1)
21
+ Requirement already satisfied: python-multipart>=0.0.9 in c:\users\mogen\appdata\roaming\python\python313\site-packages (from gradio) (0.0.20)
22
+ Requirement already satisfied: pyyaml<7.0,>=5.0 in c:\users\mogen\appdata\roaming\python\python313\site-packages (from gradio) (6.0.2)
23
+ Requirement already satisfied: ruff>=0.2.2 in c:\users\mogen\appdata\roaming\python\python313\site-packages (from gradio) (0.12.9)
24
+ Requirement already satisfied: semantic-version~=2.0 in c:\users\mogen\appdata\roaming\python\python313\site-packages (from gradio) (2.10.0)
25
+ Requirement already satisfied: tomlkit==0.12.0 in c:\users\mogen\appdata\roaming\python\python313\site-packages (from gradio) (0.12.0)
26
+ Requirement already satisfied: typer<1.0,>=0.12 in c:\users\mogen\appdata\roaming\python\python313\site-packages (from gradio) (0.16.0)
27
+ Requirement already satisfied: typing-extensions~=4.0 in c:\users\mogen\appdata\roaming\python\python313\site-packages (from gradio) (4.14.1)
28
+ Requirement already satisfied: urllib3~=2.0 in c:\users\mogen\appdata\roaming\python\python313\site-packages (from gradio) (2.5.0)
29
+ Requirement already satisfied: uvicorn>=0.14.0 in c:\users\mogen\appdata\roaming\python\python313\site-packages (from gradio) (0.34.3)
30
+ Requirement already satisfied: fsspec in c:\users\mogen\appdata\roaming\python\python313\site-packages (from gradio-client==1.3.0->gradio) (2025.5.1)
31
+ Requirement already satisfied: websockets<13.0,>=10.0 in c:\users\mogen\appdata\roaming\python\python313\site-packages (from gradio-client==1.3.0->gradio) (10.4)
32
+ Requirement already satisfied: idna>=2.8 in c:\users\mogen\appdata\roaming\python\python313\site-packages (from anyio<5.0,>=3.0->gradio) (3.10)
33
+ Requirement already satisfied: sniffio>=1.1 in c:\users\mogen\appdata\roaming\python\python313\site-packages (from anyio<5.0,>=3.0->gradio) (1.3.1)
34
+ Requirement already satisfied: starlette<0.47.0,>=0.40.0 in c:\users\mogen\appdata\roaming\python\python313\site-packages (from fastapi<1.0->gradio) (0.46.2)
35
+ Requirement already satisfied: certifi in c:\users\mogen\appdata\roaming\python\python313\site-packages (from httpx>=0.24.1->gradio) (2025.7.9)
36
+ Requirement already satisfied: httpcore==1.* in c:\users\mogen\appdata\roaming\python\python313\site-packages (from httpx>=0.24.1->gradio) (1.0.9)
37
+ Requirement already satisfied: h11>=0.16 in c:\users\mogen\appdata\roaming\python\python313\site-packages (from httpcore==1.*->httpx>=0.24.1->gradio) (0.16.0)
38
+ Requirement already satisfied: filelock in c:\users\mogen\appdata\roaming\python\python313\site-packages (from huggingface-hub>=0.19.3->gradio) (3.18.0)
39
+ Requirement already satisfied: requests in c:\users\mogen\appdata\roaming\python\python313\site-packages (from huggingface-hub>=0.19.3->gradio) (2.32.3)
40
+ Requirement already satisfied: tqdm>=4.42.1 in c:\users\mogen\appdata\roaming\python\python313\site-packages (from huggingface-hub>=0.19.3->gradio) (4.67.1)
41
+ Requirement already satisfied: contourpy>=1.0.1 in c:\users\mogen\appdata\roaming\python\python313\site-packages (from matplotlib~=3.0->gradio) (1.3.3)
42
+ Requirement already satisfied: cycler>=0.10 in c:\users\mogen\appdata\roaming\python\python313\site-packages (from matplotlib~=3.0->gradio) (0.12.1)
43
+ Requirement already satisfied: fonttools>=4.22.0 in c:\users\mogen\appdata\roaming\python\python313\site-packages (from matplotlib~=3.0->gradio) (4.59.1)
44
+ Requirement already satisfied: kiwisolver>=1.3.1 in c:\users\mogen\appdata\roaming\python\python313\site-packages (from matplotlib~=3.0->gradio) (1.4.9)
45
+ Requirement already satisfied: pyparsing>=2.3.1 in c:\users\mogen\appdata\roaming\python\python313\site-packages (from matplotlib~=3.0->gradio) (3.2.3)
46
+ Requirement already satisfied: python-dateutil>=2.7 in c:\users\mogen\appdata\roaming\python\python313\site-packages (from matplotlib~=3.0->gradio) (2.8.2)
47
+ Requirement already satisfied: pytz>=2020.1 in c:\users\mogen\appdata\roaming\python\python313\site-packages (from pandas<3.0,>=1.0->gradio) (2025.2)
48
+ Requirement already satisfied: tzdata>=2022.7 in c:\users\mogen\appdata\roaming\python\python313\site-packages (from pandas<3.0,>=1.0->gradio) (2025.2)
49
+ Requirement already satisfied: annotated-types>=0.6.0 in c:\users\mogen\appdata\roaming\python\python313\site-packages (from pydantic>=2.0->gradio) (0.7.0)
50
+ Requirement already satisfied: pydantic-core==2.33.2 in c:\users\mogen\appdata\roaming\python\python313\site-packages (from pydantic>=2.0->gradio) (2.33.2)
51
+ Requirement already satisfied: typing-inspection>=0.4.0 in c:\users\mogen\appdata\roaming\python\python313\site-packages (from pydantic>=2.0->gradio) (0.4.1)
52
+ Requirement already satisfied: click>=8.0.0 in c:\users\mogen\appdata\roaming\python\python313\site-packages (from typer<1.0,>=0.12->gradio) (8.2.1)
53
+ Requirement already satisfied: shellingham>=1.3.0 in c:\users\mogen\appdata\roaming\python\python313\site-packages (from typer<1.0,>=0.12->gradio) (1.5.4)
54
+ Requirement already satisfied: rich>=10.11.0 in c:\users\mogen\appdata\roaming\python\python313\site-packages (from typer<1.0,>=0.12->gradio) (14.0.0)
55
+ Requirement already satisfied: colorama in c:\users\mogen\appdata\roaming\python\python313\site-packages (from click>=8.0.0->typer<1.0,>=0.12->gradio) (0.4.6)
56
+ Requirement already satisfied: six>=1.5 in c:\users\mogen\appdata\roaming\python\python313\site-packages (from python-dateutil>=2.7->matplotlib~=3.0->gradio) (1.17.0)
57
+ Requirement already satisfied: markdown-it-py>=2.2.0 in c:\users\mogen\appdata\roaming\python\python313\site-packages (from rich>=10.11.0->typer<1.0,>=0.12->gradio) (3.0.0)
58
+ Requirement already satisfied: pygments<3.0.0,>=2.13.0 in c:\users\mogen\appdata\roaming\python\python313\site-packages (from rich>=10.11.0->typer<1.0,>=0.12->gradio) (2.19.1)
59
+ Requirement already satisfied: charset-normalizer<4,>=2 in c:\users\mogen\appdata\roaming\python\python313\site-packages (from requests->huggingface-hub>=0.19.3->gradio) (3.4.2)
60
+ Requirement already satisfied: mdurl~=0.1 in c:\users\mogen\appdata\roaming\python\python313\site-packages (from markdown-it-py>=2.2.0->rich>=10.11.0->typer<1.0,>=0.12->gradio) (0.1.2)
VideoBackgroundReplacer2/DEPLOYMENT.md ADDED
@@ -0,0 +1,90 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ # VideoBackgroundReplacer2 Deployment Guide
2
+
3
+ This guide provides instructions for deploying the VideoBackgroundReplacer2 application to Hugging Face Spaces with GPU acceleration.
4
+
5
+ ## Prerequisites
6
+
7
+ - Docker
8
+ - Git
9
+ - Python 3.9+ (PyTorch 2.5.1 wheels require Python 3.9–3.12)
10
+ - NVIDIA Container Toolkit (for local GPU testing)
11
+ - Hugging Face account with access to GPU Spaces
12
+
13
+ ## Local Development
14
+
15
+ ### 1. Clone the repository
16
+ ```bash
17
+ git clone <repository-url>
18
+ cd VideoBackgroundReplacer2
19
+ ```
20
+
21
+ ### 2. Build the Docker image
22
+ ```bash
23
+ # Make the build script executable
24
+ chmod +x build_and_deploy.sh
25
+
26
+ # Build the image
27
+ ./build_and_deploy.sh
28
+ ```
29
+
30
+ ### 3. Run the container locally
31
+ ```bash
32
+ docker run --gpus all -p 7860:7860 -v $(pwd)/checkpoints:/home/user/app/checkpoints videobackgroundreplacer2:latest
33
+ ```
34
+
35
+ ## Hugging Face Spaces Deployment
36
+
37
+ ### 1. Create a new Space
38
+ - Go to [Hugging Face Spaces](https://huggingface.co/spaces)
39
+ - Click "Create new Space"
40
+ - Select "Docker" as the SDK
41
+ - Choose a name and set the space to private if needed
42
+ - Select GPU as the hardware
43
+
44
+ ### 2. Configure the Space
45
+ Add the following environment variables to your Space settings:
46
+ - `SAM2_DEVICE`: `cuda`
47
+ - `MATANY_DEVICE`: `cuda`
48
+ - `PYTORCH_CUDA_ALLOC_CONF`: `max_split_size_mb:256,garbage_collection_threshold:0.8`
49
+ - `TORCH_CUDA_ARCH_LIST`: `7.5 8.0 8.6+PTX`
50
+
51
+ ### 3. Deploy to Hugging Face
52
+ ```bash
53
+ # Set your Hugging Face token
54
+ export HF_TOKEN=your_hf_token
55
+ export HF_USERNAME=your_username
56
+
57
+ # Build and deploy
58
+ ./build_and_deploy.sh
59
+ ```
60
+
61
+ ## Health Check
62
+
63
+ You can verify the installation by running:
64
+ ```bash
65
+ docker run --rm videobackgroundreplacer2:latest python3 health_check.py
66
+ ```
67
+
68
+ ## Troubleshooting
69
+
70
+ ### Build Failures
71
+ - Ensure you have enough disk space (at least 10GB free)
72
+ - Check Docker logs for specific error messages
73
+ - Verify your internet connection is stable
74
+
75
+ ### Runtime Issues
76
+ - Check container logs: `docker logs <container_id>`
77
+ - Verify GPU is detected: `nvidia-smi` inside the container
78
+ - Check disk space: `df -h`
79
+
80
+ ## Performance Optimization
81
+
82
+ - For faster inference, use the `sam2_hiera_tiny` model
83
+ - Adjust batch size based on available GPU memory
84
+ - Enable gradient checkpointing for large models
85
+
86
+ ## Monitoring
87
+
88
+ - Use `nvidia-smi` to monitor GPU usage
89
+ - Check container logs for any warnings or errors
90
+ - Monitor memory usage with `htop` or similar tools
VideoBackgroundReplacer2/Dockerfile ADDED
@@ -0,0 +1,137 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ # ===============================
2
+ # Hugging Face Space β€” Stable Dockerfile
3
+ # CUDA 12.1.1 + PyTorch 2.5.1 (cu121) + Gradio 4.41.3
4
+ # SAM2 installed from source; MatAnyone via pip (repo)
5
+ # ===============================
6
+
7
+ FROM nvidia/cuda:12.1.1-cudnn8-runtime-ubuntu22.04
8
+
9
+ # ---- Environment (runtime hygiene) ----
10
+ ENV DEBIAN_FRONTEND=noninteractive \
11
+ PYTHONUNBUFFERED=1 \
12
+ PYTHONDONTWRITEBYTECODE=1 \
13
+ PIP_NO_CACHE_DIR=1 \
14
+ PIP_DISABLE_PIP_VERSION_CHECK=1 \
15
+ TORCH_CUDA_ARCH_LIST="7.5 8.0 8.6+PTX" \
16
+ CUDA_VISIBLE_DEVICES="0" \
17
+ OMP_NUM_THREADS=4 \
18
+ OPENBLAS_NUM_THREADS=1 \
19
+ MKL_NUM_THREADS=1 \
20
+ NUMEXPR_NUM_THREADS=1 \
21
+ HF_HOME=/home/user/app/.hf \
22
+ TORCH_HOME=/home/user/app/.torch \
23
+ GRADIO_SERVER_PORT=7860
24
+
25
+ # ---- Non-root user ----
26
+ RUN useradd -m -u 1000 user
27
+ ENV HOME=/home/user
28
+ WORKDIR $HOME/app
29
+
30
+ # ---- System deps ----
31
+ RUN apt-get update && apt-get install -y --no-install-recommends \
32
+ git ffmpeg wget curl \
33
+ python3 python3-pip python3-venv python3-dev \
34
+ build-essential gcc g++ pkg-config \
35
+ libffi-dev libssl-dev libc6-dev \
36
+ libgl1-mesa-glx libglib2.0-0 libsm6 libxext6 libxrender1 libgomp1 \
37
+ && rm -rf /var/lib/apt/lists/*
38
+
39
+ # ---- Python bootstrap ----
40
+ RUN python3 -m pip install --upgrade pip setuptools wheel
41
+
42
+ # ---- Install PyTorch (CUDA 12.1 wheels) ----
43
+ RUN python3 -m pip install --no-cache-dir --index-url https://download.pytorch.org/whl/cu121 \
44
+ torch==2.5.1 torchvision==0.20.1 torchaudio==2.5.1 \
45
+ && python3 - <<'PY'
46
+ import torch
47
+ print("PyTorch:", torch.__version__)
48
+ print("CUDA available:", torch.cuda.is_available())
49
+ print("torch.version.cuda:", getattr(torch.version, "cuda", None))
50
+ try:
51
+ import torchaudio, torchvision
52
+ print("torchaudio:", torchaudio.__version__)
53
+ import torchvision as tv; print("torchvision:", tv.__version__)
54
+ except Exception as e:
55
+ print("aux libs check:", e)
56
+ PY
57
+
58
+ # ---- Copy deps first (better caching) ----
59
+ COPY --chown=user:user requirements.txt ./
60
+
61
+ # ---- Install remaining Python deps ----
62
+ RUN python3 -m pip install --no-cache-dir -r requirements.txt
63
+
64
+ # ---- MatAnyone (pip install from repo with retry) ----
65
+ RUN echo "Installing MatAnyone..." && \
66
+ (python3 -m pip install --no-cache-dir -v git+https://github.com/pq-yang/MatAnyone@main#egg=matanyone || \
67
+ (echo "Retrying MatAnyone..." && \
68
+ python3 -m pip install --no-cache-dir -v git+https://github.com/pq-yang/MatAnyone@main#egg=matanyone)) && \
69
+ python3 -c "import matanyone; print('MatAnyone import OK')"
70
+
71
+ # ---- App code ----
72
+ COPY --chown=user:user . .
73
+
74
+ # ---- SAM2 from source (editable) ----
75
+ RUN echo "Installing SAM2 (editable)..." && \
76
+ git clone --depth=1 https://github.com/facebookresearch/segment-anything-2.git third_party/sam2 && \
77
+ cd third_party/sam2 && python3 -m pip install --no-cache-dir -e .
78
+
79
+ # ---- App env ----
80
+ ENV PYTHONPATH=/home/user/app:/home/user/app/third_party:/home/user/app/third_party/sam2 \
81
+ FFMPEG_BIN=ffmpeg \
82
+ THIRD_PARTY_SAM2_DIR=/home/user/app/third_party/sam2 \
83
+ ENABLE_MATANY=1 \
84
+ SAM2_DEVICE=cuda \
85
+ MATANY_DEVICE=cuda \
86
+ TF_CPP_MIN_LOG_LEVEL=2 \
87
+ SAM2_CHECKPOINT=/home/user/app/checkpoints/sam2_hiera_large.pt
88
+
89
+ # ---- Create writable dirs (caches + checkpoints) ----
90
+ RUN mkdir -p /home/user/app/checkpoints /home/user/app/.hf /home/user/app/.torch && \
91
+ chown -R user:user /home/user/app && \
92
+ chmod -R 755 /home/user/app && \
93
+ find /home/user/app -type d -exec chmod 755 {} \; && \
94
+ find /home/user/app -type f -exec chmod 644 {} \; && \
95
+ chmod +x /home/user/app/ui.py || true
96
+
97
+ # ---- Healthcheck (use exec-form, no heredoc) ----
98
+ HEALTHCHECK --interval=30s --timeout=5s --retries=3 CMD \
99
+ ["python3","-c","import torch; print('torch', torch.__version__, '| cuda', getattr(torch.version,'cuda',None), '| ok=', torch.cuda.is_available())"]
100
+
101
+ # ---- Runtime ----
102
+ USER user
103
+ EXPOSE 7860
104
+
105
+ CMD ["sh", "-c", "\
106
+ echo '===========================================' && \
107
+ echo '=== BACKGROUNDFX PRO CONTAINER STARTUP ===' && \
108
+ echo '===========================================' && \
109
+ echo 'Timestamp:' $(date) && \
110
+ echo 'Current directory:' $(pwd) && \
111
+ echo 'Current user:' $(whoami) && \
112
+ echo 'User ID:' $(id) && \
113
+ echo '' && \
114
+ echo '=== FILE SYSTEM CHECK ===' && \
115
+ echo 'Files in app directory:' && \
116
+ ls -la && \
117
+ echo '' && \
118
+ echo '=== UI.PY VERIFICATION ===' && \
119
+ if [ -f ui.py ]; then \
120
+ echo 'βœ… ui.py found' && \
121
+ echo 'File size:' $(wc -c < ui.py) 'bytes' && \
122
+ echo 'File permissions:' $(ls -l ui.py) && \
123
+ echo 'Testing Python imports...' && \
124
+ python3 -B -c 'import gradio; print(\"βœ… Gradio:\", gradio.__version__)' && \
125
+ python3 -B -c 'import torch; print(\"βœ… Torch:\", torch.__version__)' && \
126
+ echo 'Testing ui.py import...' && \
127
+ python3 -B -c 'import sys; sys.path.insert(0, \".\"); import ui; print(\"βœ… ui.py imports successfully\")' && \
128
+ echo 'βœ… All checks passed!'; \
129
+ else \
130
+ echo '❌ ERROR: ui.py not found!' && \
131
+ exit 1; \
132
+ fi && \
133
+ echo '' && \
134
+ echo '=== STARTING APPLICATION ===' && \
135
+ echo 'Launching ui.py with bytecode disabled...' && \
136
+ python3 -B -u ui.py \
137
+ "]
VideoBackgroundReplacer2/README.md ADDED
@@ -0,0 +1,94 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ ---
2
+ title: 🎬 BackgroundFX Pro - SAM2 + MatAnyone
3
+ emoji: πŸŽ₯
4
+ colorFrom: indigo
5
+ colorTo: purple
6
+ sdk: docker
7
+ app_port: 7860
8
+ license: mit
9
+ tags:
10
+ - video
11
+ - background-removal
12
+ - segmentation
13
+ - matting
14
+ - SAM2
15
+ - MatAnyone
16
+ ---
17
+
18
+ # 🎬 BackgroundFX Pro β€” Professional Video Background Replacement
19
+
20
+ BackgroundFX Pro is a GPU-accelerated app for Hugging Face Spaces (Docker) that replaces video backgrounds using:
21
+ - **SAM2** β€” high-quality object segmentation
22
+ - **MatAnyone** β€” temporal video matting for stable alpha over time
23
+
24
+ Built on: **CUDA 12.1.1**, **PyTorch 2.5.1 (cu121)**, **torchvision 0.20.1**, **Gradio 4.41.3**.
25
+
26
+ ---
27
+
28
+ ## ✨ Features
29
+
30
+ - Replace backgrounds with: **solid color**, **AI-generated** image (procedural), **custom uploaded image**, or **Unsplash** search
31
+ - Optimized for **T4 GPUs** on Hugging Face
32
+ - Caching & logs stored in the repo volume:
33
+ - HF cache β†’ `./.hf`
34
+ - Torch cache β†’ `./.torch`
35
+ - App data & logs β†’ `./data` (see `data/run.log`)
36
+
37
+ ---
38
+
39
+ ## πŸš€ Try It
40
+
41
+ Open the Space in your browser (GPU required):
42
+ https://huggingface.co/spaces/MogensR/VideoBackgroundReplacer2
43
+
44
+ ---
45
+
46
+ ## πŸ–±οΈ How to Use
47
+
48
+ 1. **Upload a video** (`.mp4`, `.avi`, `.mov`, `.mkv`).
49
+ 2. Choose a **Background Type**: Upload Image, AI Generate, Gradient, Solid, or Unsplash.
50
+ 3. If not uploading, enter a prompt and click **Generate Background**.
51
+ 4. Click **Process Video**.
52
+ 5. Preview and **Download Result**.
53
+
54
+ > Tip: Start with 720p/1080p on T4; 4K can exceed memory.
55
+
56
+ ---
57
+
58
+ ## πŸ—‚οΈ Project Structure (key files)
59
+
60
+ - `Dockerfile`
61
+ - `requirements.txt`
62
+ - `ui.py`
63
+ - `ui_core_interface.py`
64
+ - `ui_core_functionality.py`
65
+ - `two_stage_pipeline.py`
66
+ - `models/sam2_loader.py`
67
+ - `models/matanyone_loader.py`
68
+ - `utils/__init__.py`
69
+ - `data/` (created at runtime for logs/outputs)
70
+ - `tmp/` (created at runtime for jobs/temp files)
71
+
72
+ ---
73
+
74
+ ## βš™οΈ Runtime Notes
75
+
76
+ - Binds to `PORT` / `GRADIO_SERVER_PORT` (defaults to **7860**).
77
+ - Heartbeat logs every ~2s with memory & disk stats.
78
+ - If there’s no final β€œPROCESS EXITING” line, it was likely an **OOM** or hard kill.
79
+
80
+ ---
81
+
82
+ ## πŸ§ͺ Local Development (Docker)
83
+
84
+ Requires an NVIDIA GPU with CUDA drivers.
85
+
86
+ ```bash
87
+ git clone https://huggingface.co/spaces/MogensR/VideoBackgroundReplacer2
88
+ cd VideoBackgroundReplacer2
89
+
90
+ # Build (Ubuntu 22.04, CUDA 12.1.1; installs Torch 2.5.1+cu121)
91
+ docker build -t backgroundfx-pro .
92
+
93
+ # Run
94
+ docker run --gpus all -p 7860:7860 backgroundfx-pro
+ ```
VideoBackgroundReplacer2/app.py ADDED
@@ -0,0 +1,300 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ #!/usr/bin/env python3
2
+ """
3
+ VideoBackgroundReplacer2 - SAM2 + MatAnyone Integration
4
+ =======================================================
5
+ - Sets up Gradio UI and launches pipeline
6
+ - Aligned with torch/cu121 stack; runs on HF Spaces (Docker)
7
+
8
+ Changes (2025-09-18):
9
+ - Added precise web-stack probes (FastAPI/Starlette/Pydantic/etc. versions + file paths)
10
+ - Added toggleable "mount mode": run Gradio inside our own FastAPI app
11
+ and provide a safe /config route shim (uses demo.get_config_file()).
12
+ - Kept your startup diagnostics, GPU logging, and heartbeats
13
+ """
14
+
15
+ print("=== APP STARTUP: Initializing VideoBackgroundReplacer2 ===")
16
+
17
+ # ---------------------------------------------------------------------
18
+ # Imports & basic setup
19
+ # ---------------------------------------------------------------------
20
+ import sys
21
+ import os
22
+ import gc
23
+ import json
24
+ import logging
25
+ import threading
26
+ import time
27
+ import warnings
28
+ import traceback
29
+ import subprocess
30
+ from pathlib import Path
31
+ from loguru import logger
32
+
33
+ # Logging (loguru to stderr)
34
+ logger.remove()
35
+ logger.add(
36
+ sys.stderr,
37
+ format="<green>{time:YYYY-MM-DD HH:mm:ss}</green> | <level>{level: <8}</level> "
38
+ "| <cyan>{name}</cyan>:<cyan>{function}</cyan>:<cyan>{line}</cyan> - <level>{message}</level>"
39
+ )
40
+
41
+ # Warnings
42
+ warnings.filterwarnings("ignore", category=UserWarning)
43
+ warnings.filterwarnings("ignore", category=FutureWarning)
44
+ warnings.filterwarnings("ignore", module="torchvision.io._video_deprecation_warning")
45
+
46
+ # Environment (lightweight & safe in Spaces)
47
+ os.environ.setdefault("OMP_NUM_THREADS", "1")
48
+ os.environ.setdefault("TOKENIZERS_PARALLELISM", "false")
49
+
50
+ # Paths
51
+ BASE_DIR = Path(__file__).parent.absolute()
52
+ THIRD_PARTY_DIR = BASE_DIR / "third_party"
53
+ SAM2_DIR = THIRD_PARTY_DIR / "sam2"
54
+ CHECKPOINTS_DIR = BASE_DIR / "checkpoints"
55
+
56
+ # Python path extends
57
+ for p in (str(THIRD_PARTY_DIR), str(SAM2_DIR)):
58
+ if p not in sys.path:
59
+ sys.path.insert(0, p)
60
+
61
+ logger.info(f"Base directory: {BASE_DIR}")
62
+ logger.info(f"Python path[0:5]: {sys.path[:5]}")
63
+
64
+ # ---------------------------------------------------------------------
65
+ # GPU / Torch diagnostics (non-blocking)
66
+ # ---------------------------------------------------------------------
67
# ---------------------------------------------------------------------
# GPU / Torch diagnostics (non-blocking)
# ---------------------------------------------------------------------
# Torch is optional at startup: the app can still boot (CPU mode, diagnostics
# only) when the import fails, so failures are logged rather than fatal.
try:
    import torch
except Exception as e:
    # FIX: loguru formats with {}-style placeholders; the original "%s" was
    # never substituted, so the exception text was silently dropped.
    logger.warning("Torch import failed at startup: {}", e)
    torch = None

DEVICE = "cuda" if (torch and torch.cuda.is_available()) else "cpu"
if DEVICE == "cuda":
    # Propagate the device choice to the model loaders via environment.
    os.environ["SAM2_DEVICE"] = "cuda"
    os.environ["MATANY_DEVICE"] = "cuda"
    os.environ.setdefault("CUDA_LAUNCH_BLOCKING", "0")
    try:
        logger.info(f"CUDA available: {torch.cuda.get_device_name(0)}")
    except Exception:
        logger.info("CUDA device name not available at startup.")
else:
    os.environ["SAM2_DEVICE"] = "cpu"
    os.environ["MATANY_DEVICE"] = "cpu"
    logger.warning("CUDA not available, falling back to CPU")
86
+
87
def verify_models():
    """Verify critical model files exist and are loadable (cheap checks).

    Returns:
        dict: ``{"status": "success"|"error", "details": {"sam2": {...}}}``
        where the per-model entry carries either path/size info or the
        error string and traceback. Never raises.
    """
    results = {"status": "success", "details": {}}
    try:
        sam2_model_path = os.getenv("SAM2_MODEL_PATH", str(CHECKPOINTS_DIR / "sam2_hiera_large.pt"))
        if not os.path.exists(sam2_model_path):
            raise FileNotFoundError(f"SAM2 model not found at {sam2_model_path}")
        # Cheap load test (map to CPU to avoid VRAM use during boot).
        if torch:
            # FIX: weights_only=True — the checkpoint is a plain tensor dict,
            # and this avoids executing arbitrary pickled code from the file
            # (and the torch>=2.4 FutureWarning about the old default).
            sd = torch.load(sam2_model_path, map_location="cpu", weights_only=True)
            if not isinstance(sd, dict):
                raise ValueError("Invalid SAM2 checkpoint format")
            # Release the state dict immediately; only the format check mattered.
            del sd
        results["details"]["sam2"] = {
            "status": "success",
            "path": sam2_model_path,
            "size_mb": round(os.path.getsize(sam2_model_path) / (1024 * 1024), 2),
        }
    except Exception as e:
        results["status"] = "error"
        results["details"]["sam2"] = {
            "status": "error",
            "error": str(e),
            "traceback": traceback.format_exc(),
        }
    return results
112
+
113
def run_startup_diagnostics():
    """Collect a one-shot startup snapshot.

    Gathers interpreter/torch/CUDA details, key filesystem paths, a small
    whitelisted subset of the environment, and the model-file verification
    result from ``verify_models()``.
    """
    cuda_ok = bool(torch and torch.cuda.is_available())
    watched_env = ("HOST", "PORT", "SPACE_ID", "SPACE_AUTHOR_NAME")
    report = {
        "system": {
            "python": sys.version,
            "pytorch": getattr(torch, "__version__", None) if torch else None,
            "cuda_available": cuda_ok,
            "device_count": torch.cuda.device_count() if cuda_ok else 0,
            "cuda_version": getattr(getattr(torch, "version", None), "cuda", None) if torch else None,
        },
        "paths": {
            "base_dir": str(BASE_DIR),
            "checkpoints_dir": str(CHECKPOINTS_DIR),
            "sam2_dir": str(SAM2_DIR),
        },
        # Only a whitelisted subset — never dump the full environment to logs.
        "env_subset": {name: os.environ[name] for name in watched_env if name in os.environ},
    }
    report["model_verification"] = verify_models()
    return report
131
+
132
+ startup_diag = run_startup_diagnostics()
133
+ logger.info("Startup diagnostics completed")
134
+
135
+ # Noisy heartbeat so logs show life during import time
136
def _heartbeat():
    """Print a liveness line every 5 s so Space logs show progress during slow imports.

    Runs forever; intended to be launched on a daemon thread.
    """
    tick = 0
    while True:
        tick += 1
        print(f"[startup-heartbeat] {tick*5}s…", flush=True)
        time.sleep(5)
142
+
143
+ threading.Thread(target=_heartbeat, daemon=True).start()
144
+
145
+ # Optional perf tuning import (non-fatal)
146
+ try:
147
+ import perf_tuning # noqa: F401
148
+ logger.info("perf_tuning imported successfully.")
149
+ except Exception as e:
150
+ logger.info("perf_tuning not available: %s", e)
151
+
152
+ # MatAnyone non-instantiating probe
153
+ try:
154
+ import inspect
155
+ from matanyone.inference import inference_core as ic # type: ignore
156
+ sigs = {}
157
+ for name in ("InferenceCore",):
158
+ obj = getattr(ic, name, None)
159
+ if obj:
160
+ sigs[name] = "callable" if callable(obj) else "present"
161
+ logger.info(f"[MATANY] probe (non-instantiating): {sigs}")
162
+ except Exception as e:
163
+ logger.info(f"[MATANY] probe skipped: {e}")
164
+
165
+ # ---------------------------------------------------------------------
166
+ # Gradio import and web-stack probes
167
+ # ---------------------------------------------------------------------
168
+ import gradio as gr
169
+
170
+ # Standard logger for some libs that use stdlib logging
171
+ py_logger = logging.getLogger("backgroundfx_pro")
172
+ if not py_logger.handlers:
173
+ h = logging.StreamHandler()
174
+ h.setFormatter(logging.Formatter("[%(asctime)s] %(levelname)s: %(message)s"))
175
+ py_logger.addHandler(h)
176
+ py_logger.setLevel(logging.INFO)
177
+
178
def _log_web_stack_versions_and_paths():
    """Log versions and on-disk locations of the HTTP stack.

    Covers FastAPI/Starlette/Pydantic/httpx/anyio versions plus the file
    paths of the gradio and starlette modules, making dependency mismatches
    diagnosable from the Space logs. All probes are best-effort: any failure
    is logged as a warning and never prevents startup.
    """
    import inspect
    try:
        import fastapi, starlette, pydantic, httpx, anyio
        try:
            import pydantic_core
            pc_ver = pydantic_core.__version__
        except Exception:
            pc_ver = "unknown"
        # FIX: loguru uses {}-style placeholders; with the original "%s" style
        # the literal "%s" was logged and every version argument was dropped.
        logger.info(
            "[WEB-STACK] fastapi={} | starlette={} | pydantic={} | pydantic-core={} | httpx={} | anyio={}",
            getattr(fastapi, "__version__", "?"),
            getattr(starlette, "__version__", "?"),
            getattr(pydantic, "__version__", "?"),
            pc_ver,
            getattr(httpx, "__version__", "?"),
            getattr(anyio, "__version__", "?"),
        )
    except Exception as e:
        logger.warning("[WEB-STACK] version probe failed: {}", e)

    try:
        import gradio
        import gradio.routes as gr_routes
        import gradio.queueing as gr_queueing
        logger.info("[PATH] gradio.__file__ = {}", getattr(gradio, "__file__", "?"))
        logger.info("[PATH] gradio.routes = {}", inspect.getfile(gr_routes))
        logger.info("[PATH] gradio.queueing = {}", inspect.getfile(gr_queueing))
        import starlette.exceptions as st_exc
        logger.info("[PATH] starlette.exceptions= {}", inspect.getfile(st_exc))
    except Exception as e:
        logger.warning("[PATH] probe failed: {}", e)
210
+
211
def _post_launch_diag():
    """Log CUDA availability and device details after launch.

    Best-effort only: intended to run on a background thread, never raises.
    Does nothing when torch failed to import at startup.
    """
    try:
        if not torch:
            return
        avail = torch.cuda.is_available()
        # FIX: loguru formats with {} placeholders, not printf-style "%s";
        # the original calls logged literal "%s"/"%d" and dropped the values.
        logger.info("CUDA available (post-launch): {}", avail)
        if avail:
            idx = torch.cuda.current_device()
            name = torch.cuda.get_device_name(idx)
            cap = torch.cuda.get_device_capability(idx)
            logger.info("CUDA device {}: {} (cc {}.{})", idx, name, cap[0], cap[1])
    except Exception as e:
        logger.warning("Post-launch CUDA diag failed: {}", e)
224
+
225
+ # ---------------------------------------------------------------------
226
+ # UI factory (uses your existing builder)
227
+ # ---------------------------------------------------------------------
228
def build_ui() -> gr.Blocks:
    """Construct and return the Gradio Blocks UI.

    Delegates to the project's interface factory; imported lazily so the UI
    modules are only loaded when the app actually starts.
    """
    from ui_core_interface import create_interface  # FIX: correct source module (not ui)
    ui = create_interface()
    return ui
232
+
233
+ # ---------------------------------------------------------------------
234
+ # Optional: custom FastAPI mount mode
235
+ # ---------------------------------------------------------------------
236
def build_fastapi_with_gradio(demo: gr.Blocks):
    """Wrap *demo* in a FastAPI application mounted at root.

    Adds two parent-level routes before mounting Gradio:
      * ``/healthz`` — JSON liveness probe with a timestamp.
      * ``/config`` — shim serving the Blocks config via
        ``demo.get_config_file()``; failures come back as HTTP 500 JSON.
    """
    from fastapi import FastAPI
    from fastapi.responses import JSONResponse

    api = FastAPI(title="VideoBackgroundReplacer2")

    @api.get("/healthz")
    def _healthz():
        return {"ok": True, "ts": time.time()}

    @api.get("/config")
    def _config():
        try:
            return JSONResponse(content=demo.get_config_file())
        except Exception as e:
            payload = {"error": "config_generation_failed", "detail": str(e)}
            return JSONResponse(status_code=500, content=payload)

    # Mount the Gradio UI last so the routes above stay at the parent level.
    return gr.mount_gradio_app(api, demo, path="/")
264
+
265
+ # ---------------------------------------------------------------------
266
+ # Entrypoint
267
+ # ---------------------------------------------------------------------
268
if __name__ == "__main__":
    # Bind address/port come from the Space environment (7860 is the HF default).
    host = os.environ.get("HOST", "0.0.0.0")
    port = int(os.environ.get("PORT", "7860"))
    # GRADIO_MOUNT_MODE=1 runs Gradio inside our own FastAPI app (adds /config shim).
    mount_mode = os.environ.get("GRADIO_MOUNT_MODE", "0") == "1"

    # FIX: loguru formats with {} placeholders; the original "%s:%s" logged
    # literally and the host/port values were dropped.
    logger.info("Launching on {}:{} (mount_mode={})…", host, port, mount_mode)
    _log_web_stack_versions_and_paths()

    demo = build_ui()
    demo.queue(max_size=16, api_open=False)

    # Post-launch CUDA diagnostics run in the background so they never block serving.
    threading.Thread(target=_post_launch_diag, daemon=True).start()

    if mount_mode:
        try:
            from uvicorn import run as uvicorn_run
        except Exception:
            logger.error("uvicorn is not installed; mount mode cannot start.")
            raise

        app = build_fastapi_with_gradio(demo)
        uvicorn_run(app=app, host=host, port=port, log_level="info")
    else:
        demo.launch(
            server_name=host,
            server_port=port,
            share=False,
            show_api=False,
            show_error=True,
            quiet=False,
            debug=True,
            max_threads=1,
        )
VideoBackgroundReplacer2/integrated_pipeline.py ADDED
@@ -0,0 +1,421 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ #!/usr/bin/env python3
2
+ """
3
+ integrated_pipeline.py - Two-stage pipeline with fallback compatibility
4
+ - Stage 1: SAM2 -> lossless mask stream + metadata, then unload SAM2
5
+ - Stage 2: Read masks -> MatAnyone -> composite -> final output
6
+ - Maintains compatibility with existing UI calls
7
+ """
8
+
9
+ import os
10
+ import sys
11
+ import gc
12
+ import json
13
+ import subprocess
14
+ import tempfile
15
+ from pathlib import Path
16
+ from typing import Dict, Any, Optional, Tuple
17
+ import numpy as np
18
+ import cv2
19
+
20
+ # Add the parent directory to Python path for imports
21
+ current_dir = Path(__file__).parent
22
+ parent_dir = current_dir.parent
23
+ sys.path.append(str(parent_dir))
24
+
25
class TwoStageProcessor:
    """Two-stage video background replacement.

    Stage 1: SAM2 segments the subject from click prompts and streams one
    binary mask per frame into a lossless FFV1 MKV, after which SAM2 is fully
    unloaded (model, CUDA cache, sys.modules) to free GPU memory.
    Stage 2: the masks are read back, optionally refined with MatAnyone, and
    composited over the background video.

    Public interface (``process_video``/``cleanup``) is unchanged from the
    original single-pass pipeline, so existing UI callers keep working.
    """

    def __init__(self, temp_dir: Optional[str] = None):
        """Create the scratch directory and derive stage-1 output paths.

        Args:
            temp_dir: Optional existing directory for intermediates; a fresh
                ``tempfile.mkdtemp()`` directory is created when omitted.
        """
        self.temp_dir = Path(temp_dir) if temp_dir else Path(tempfile.mkdtemp())
        self.temp_dir.mkdir(parents=True, exist_ok=True)

        # Stage-1 artifacts consumed by stage 2.
        self.masks_path = self.temp_dir / "masks.mkv"      # lossless FFV1 mask stream
        self.metadata_path = self.temp_dir / "meta.json"   # fps/size/frame-count/prompts

    def process_video(self, input_video: str, background_video: str,
                      click_points: list, output_path: str,
                      use_matanyone: bool = True, progress_callback=None) -> bool:
        """Run both stages and return True on success.

        Maintains compatibility with the existing UI entry point (same
        signature/semantics). ``progress_callback`` is called with a message
        and, during frame loops, an optional percentage.
        """
        try:
            if progress_callback:
                progress_callback("Stage 1: Generating masks with SAM2...")
            if not self._stage1_generate_masks(input_video, click_points, progress_callback):
                return False

            if progress_callback:
                progress_callback("Stage 2: Processing and compositing...")
            return self._stage2_composite(input_video, background_video,
                                          output_path, use_matanyone, progress_callback)
        except Exception as e:
            print(f"Two-stage processing failed: {e}")
            return False

    def _stage1_generate_masks(self, input_video: str, click_points: list,
                               progress_callback=None) -> bool:
        """Stage 1: SAM2 mask generation with complete memory cleanup.

        Streams an 8-bit grayscale mask per frame into an FFV1-encoded MKV
        (lossless), then tears SAM2 down completely so stage 2 starts with a
        clean GPU.
        """
        try:
            # Import SAM2 only when needed so stage 2 never pays for it.
            print("Loading SAM2...")
            import torch
            from sam2.build_sam import build_sam2_video_predictor

            checkpoint = "checkpoints/sam2.1_hiera_large.pt"
            model_cfg = "configs/sam2.1/sam2.1_hiera_l.yaml"
            if not os.path.exists(checkpoint):
                print(f"SAM2 checkpoint not found: {checkpoint}")
                return False

            predictor = build_sam2_video_predictor(model_cfg, checkpoint)

            # Probe source geometry/timing for metadata and the FFmpeg rawvideo pipe.
            cap = cv2.VideoCapture(input_video)
            fps = cap.get(cv2.CAP_PROP_FPS)
            frame_count = int(cap.get(cv2.CAP_PROP_FRAME_COUNT))
            width = int(cap.get(cv2.CAP_PROP_FRAME_WIDTH))
            height = int(cap.get(cv2.CAP_PROP_FRAME_HEIGHT))
            cap.release()

            metadata = {
                "fps": fps,
                "frame_count": frame_count,
                "width": width,
                "height": height,
                "click_points": click_points,
            }
            with open(self.metadata_path, 'w') as f:
                json.dump(metadata, f, indent=2)

            inference_state = predictor.init_state(video_path=input_video)

            # One tracked object per click, all prompted as foreground on frame 0.
            for i, (x, y) in enumerate(click_points):
                predictor.add_new_points_or_box(
                    inference_state=inference_state,
                    frame_idx=0,
                    obj_id=i,
                    points=np.array([[x, y]], dtype=np.float32),
                    labels=np.array([1], np.int32),
                )

            # Lossless grayscale mask encoder. FIX: stderr goes to a log file —
            # with stderr=PIPE and no reader, a chatty FFmpeg fills the pipe
            # buffer and deadlocks the whole stage.
            encode_log = self.temp_dir / "masks_encode.log"
            ffmpeg_cmd = [
                'ffmpeg', '-y', '-f', 'rawvideo',
                '-pix_fmt', 'gray', '-s', f'{width}x{height}',
                '-r', str(fps), '-i', '-',
                '-c:v', 'ffv1', '-level', '3', '-pix_fmt', 'gray',
                str(self.masks_path)
            ]
            with open(encode_log, 'wb') as log_f:
                ffmpeg_process = subprocess.Popen(
                    ffmpeg_cmd, stdin=subprocess.PIPE,
                    stdout=subprocess.DEVNULL, stderr=log_f,
                )

            print(f"Processing {frame_count} frames...")
            for out_frame_idx, out_obj_ids, out_mask_logits in predictor.propagate_in_video(inference_state):
                if progress_callback:
                    progress = (out_frame_idx + 1) / frame_count * 50  # stage 1 = first 50%
                    progress_callback(f"Generating masks... Frame {out_frame_idx + 1}/{frame_count}", progress)

                # Union of all objects' masks. FIX: logits are indexed by
                # POSITION within out_obj_ids (not by obj id value), and must
                # be moved to CPU before numpy can consume them — the original
                # fed CUDA tensors straight into np.logical_or, which crashes
                # on GPU.
                combined_mask = np.zeros((height, width), dtype=bool)
                for pos in range(len(out_obj_ids)):
                    obj_mask = (out_mask_logits[pos] > 0.0).squeeze().cpu().numpy()
                    combined_mask |= obj_mask.astype(bool)

                ffmpeg_process.stdin.write((combined_mask.astype(np.uint8) * 255).tobytes())

            ffmpeg_process.stdin.close()
            ffmpeg_process.wait()
            if ffmpeg_process.returncode != 0:
                print(f"FFmpeg error: {encode_log.read_text(errors='replace')}")
                return False

            print("Stage 1 complete: Masks saved")

            # CRITICAL: fully release SAM2 before stage 2. (The original's
            # "if 'torch' in locals()" guard was dead code — torch is imported
            # unconditionally above.)
            del predictor
            del inference_state
            if torch.cuda.is_available():
                torch.cuda.empty_cache()
                torch.cuda.synchronize()
            gc.collect()

            # Drop SAM2's modules so any module-level state stops pinning memory.
            for mod in [m for m in sys.modules if 'sam2' in m.lower()]:
                del sys.modules[mod]

            print("SAM2 completely unloaded from memory")
            return True

        except Exception as e:
            print(f"Stage 1 failed: {e}")
            return False

    def _stage2_composite(self, input_video: str, background_video: str,
                          output_path: str, use_matanyone: bool, progress_callback=None) -> bool:
        """Stage 2: read masks back, optionally refine with MatAnyone, composite."""
        try:
            with open(self.metadata_path, 'r') as f:
                metadata = json.load(f)

            masks = self._read_mask_stream()
            if masks is None:
                return False

            # Optional MatAnyone refinement (falls back to raw masks on failure).
            if use_matanyone:
                if progress_callback:
                    progress_callback("Refining masks with MatAnyone...")
                masks = self._refine_with_matanyone(input_video, masks, progress_callback)
                if masks is None:
                    return False

            if progress_callback:
                progress_callback("Compositing final video...")
            return self._composite_final_video(input_video, background_video,
                                               masks, output_path, metadata, progress_callback)

        except Exception as e:
            print(f"Stage 2 failed: {e}")
            return False

    @staticmethod
    def _read_exact(stream, num_bytes: int) -> bytes:
        """Read exactly *num_bytes* from a pipe, looping over short reads.

        Returns fewer bytes only at EOF. Pipe ``read(n)`` may legally return
        less than ``n``; a single read would silently truncate frames.
        """
        chunks = []
        remaining = num_bytes
        while remaining > 0:
            chunk = stream.read(remaining)
            if not chunk:
                break
            chunks.append(chunk)
            remaining -= len(chunk)
        return b"".join(chunks)

    def _read_mask_stream(self) -> Optional[list]:
        """Decode the FFV1 mask stream into a list of (H, W) uint8 arrays.

        Returns None on decode failure.
        """
        try:
            with open(self.metadata_path, 'r') as f:
                metadata = json.load(f)
            width = metadata["width"]
            height = metadata["height"]
            frame_count = metadata["frame_count"]

            ffmpeg_cmd = [
                'ffmpeg', '-i', str(self.masks_path),
                '-f', 'rawvideo', '-pix_fmt', 'gray', '-'
            ]
            # FIX: stderr to a log file — an unread stderr PIPE can fill up and
            # deadlock FFmpeg mid-stream.
            decode_log = self.temp_dir / "masks_decode.log"
            with open(decode_log, 'wb') as log_f:
                process = subprocess.Popen(ffmpeg_cmd, stdout=subprocess.PIPE, stderr=log_f)

                masks = []
                frame_size = width * height
                for frame_idx in range(frame_count):
                    # FIX: loop over short pipe reads instead of one read() call.
                    frame_data = self._read_exact(process.stdout, frame_size)
                    if len(frame_data) != frame_size:
                        print(f"Unexpected frame size at frame {frame_idx}")
                        break
                    masks.append(np.frombuffer(frame_data, dtype=np.uint8).reshape((height, width)))

                process.stdout.close()
                process.wait()

            if process.returncode != 0:
                print(f"FFmpeg decode error: {decode_log.read_text(errors='replace')}")
                return None

            print(f"Successfully read {len(masks)} masks from stream")
            return masks

        except Exception as e:
            print(f"Failed to read mask stream: {e}")
            return None

    def _refine_with_matanyone(self, input_video: str, masks: list, progress_callback=None) -> Optional[list]:
        """Apply MatAnyone refinement to *masks*.

        Best-effort: on any failure the original masks are returned unchanged,
        and per-frame fallbacks fill in any refined frame MatAnyone did not emit.
        """
        try:
            # Import MatAnyone only when needed.
            from matanyone.mat_anywhere import matting_inference_video

            matanyone_temp = self.temp_dir / "matanyone"
            matanyone_temp.mkdir(exist_ok=True)

            # MatAnyone consumes masks as individual PNG frames.
            mask_dir = matanyone_temp / "masks"
            mask_dir.mkdir(exist_ok=True)
            for i, mask in enumerate(masks):
                cv2.imwrite(str(mask_dir / f"mask_{i:06d}.png"), mask)

            refined_masks_dir = matanyone_temp / "refined"
            refined_masks_dir.mkdir(exist_ok=True)

            success = matting_inference_video(
                video_path=input_video,
                mask_dir=str(mask_dir),
                output_dir=str(refined_masks_dir),
                progress_callback=progress_callback
            )
            if not success:
                print("MatAnyone refinement failed, using original masks")
                return masks

            refined_masks = []
            for i in range(len(masks)):
                refined_path = refined_masks_dir / f"refined_{i:06d}.png"
                if refined_path.exists():
                    refined_masks.append(cv2.imread(str(refined_path), cv2.IMREAD_GRAYSCALE))
                else:
                    refined_masks.append(masks[i])  # fallback to the SAM2 mask
            return refined_masks

        except Exception as e:
            print(f"MatAnyone refinement failed: {e}, using original masks")
            return masks

    def _composite_final_video(self, input_video: str, background_video: str,
                               masks: list, output_path: str, metadata: Dict[str, Any],
                               progress_callback=None) -> bool:
        """Blend foreground over background per-frame using the alpha masks.

        The background is resized to the foreground geometry and looped when
        shorter than the foreground clip.
        """
        try:
            fg_cap = cv2.VideoCapture(input_video)
            bg_cap = cv2.VideoCapture(background_video)

            fps = metadata["fps"]
            width = metadata["width"]
            height = metadata["height"]

            fourcc = cv2.VideoWriter_fourcc(*'mp4v')
            out = cv2.VideoWriter(output_path, fourcc, fps, (width, height))

            frame_idx = 0
            total_frames = len(masks)

            while frame_idx < total_frames:
                ret_fg, fg_frame = fg_cap.read()
                ret_bg, bg_frame = bg_cap.read()

                if not ret_fg:
                    break

                if not ret_bg:
                    # Loop the background when it is shorter than the foreground.
                    bg_cap.set(cv2.CAP_PROP_POS_FRAMES, 0)
                    ret_bg, bg_frame = bg_cap.read()
                    if not ret_bg:
                        print("No background frame available")
                        break

                bg_frame = cv2.resize(bg_frame, (width, height))

                # Normalize mask to [0,1] and broadcast to 3 channels for blending.
                mask_norm = masks[frame_idx].astype(np.float32) / 255.0
                mask_3ch = np.stack([mask_norm, mask_norm, mask_norm], axis=-1)

                composite = (fg_frame * mask_3ch + bg_frame * (1 - mask_3ch)).astype(np.uint8)
                out.write(composite)

                frame_idx += 1
                if progress_callback and frame_idx % 10 == 0:
                    progress = 50 + (frame_idx / total_frames) * 50  # stage 2 = 50-100%
                    progress_callback(f"Compositing... Frame {frame_idx}/{total_frames}", progress)

            fg_cap.release()
            bg_cap.release()
            out.release()

            print(f"Final video saved to: {output_path}")
            return True

        except Exception as e:
            print(f"Final composition failed: {e}")
            return False

    def cleanup(self):
        """Remove the scratch directory and every intermediate artifact in it."""
        try:
            if self.temp_dir.exists():
                import shutil
                shutil.rmtree(self.temp_dir)
        except Exception as e:
            print(f"Cleanup failed: {e}")
382
+
383
+ # Compatibility wrapper for existing UI
384
def process_video_two_stage(input_video: str, background_video: str,
                            click_points: list, output_path: str,
                            use_matanyone: bool = True, progress_callback=None) -> bool:
    """Drop-in replacement for the legacy ``process_video`` function.

    Instantiates a throwaway TwoStageProcessor, runs the pipeline, and
    guarantees the scratch directory is removed even on failure.
    """
    processor = TwoStageProcessor()
    try:
        return processor.process_video(
            input_video, background_video, click_points,
            output_path, use_matanyone, progress_callback,
        )
    finally:
        processor.cleanup()
399
+
400
if __name__ == "__main__":
    # Minimal CLI harness for exercising the pipeline outside the UI.
    import argparse

    cli = argparse.ArgumentParser()
    cli.add_argument("--input", required=True)
    cli.add_argument("--background", required=True)
    cli.add_argument("--output", required=True)
    cli.add_argument("--clicks", required=True, help="JSON string of click points")
    cli.add_argument("--no-matanyone", action="store_true")
    args = cli.parse_args()

    def _report(msg, prog=None):
        # Mirror the UI progress callback: message plus optional percentage.
        print(f"Progress: {msg} ({prog}%)" if prog else msg)

    success = process_video_two_stage(
        args.input, args.background, json.loads(args.clicks),
        args.output, not args.no_matanyone, _report,
    )
    print("Processing completed!" if success else "Processing failed!")
VideoBackgroundReplacer2/models/__init__.py ADDED
@@ -0,0 +1,868 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ #!/usr/bin/env python3
2
+ """
3
+ BackgroundFX Pro - Model Loading & Utilities (Hardened)
4
+ ======================================================
5
+ - Avoids heavy CUDA/Hydra work at import time
6
+ - Adds timeouts to subprocess probes
7
+ - Safer sys.path wiring for third_party repos
8
+ - MatAnyone loader is probe-only here; actual run happens in matanyone_loader.MatAnyoneSession
9
+
10
+ Changes (2025-09-16):
11
+ - Aligned with torch==2.3.1+cu121 and MatAnyone v1.0.0
12
+ - Updated load_matany to apply T=1 squeeze patch before InferenceCore import
13
+ - Added patch status logging and MatAnyone version
14
+ - Added InferenceCore attributes logging for debugging
15
+ - Fixed InferenceCore import path to matanyone.inference.inference_core
16
+ """
17
+
18
+ from __future__ import annotations
19
+
20
+ import os
21
+ import sys
22
+ import cv2
23
+ import subprocess
24
+ import inspect
25
+ import logging
26
+ import importlib.metadata
27
+ from pathlib import Path
28
+ from typing import Optional, Tuple, Dict, Any, Union, Callable
29
+
30
+ import numpy as np
31
+ import yaml
32
+
33
+ # Import torch for GPU memory monitoring
34
+ try:
35
+ import torch
36
+ except ImportError:
37
+ torch = None
38
+
39
+ # --------------------------------------------------------------------------------------
40
+ # Logging (ensure a handler exists very early)
41
+ # --------------------------------------------------------------------------------------
42
+ logger = logging.getLogger("backgroundfx_pro")
43
+ if not logger.handlers:
44
+ _h = logging.StreamHandler()
45
+ _h.setFormatter(logging.Formatter("[%(asctime)s] %(levelname)s: %(message)s"))
46
+ logger.addHandler(_h)
47
+ logger.setLevel(logging.INFO)
48
+
49
+ # Pin OpenCV threads (helps libgomp stability in Spaces)
50
+ try:
51
+ cv_threads = int(os.environ.get("CV_THREADS", "1"))
52
+ if hasattr(cv2, "setNumThreads"):
53
+ cv2.setNumThreads(cv_threads)
54
+ except Exception:
55
+ pass
56
+
57
+ # --------------------------------------------------------------------------------------
58
+ # Optional dependencies
59
+ # --------------------------------------------------------------------------------------
60
+ try:
61
+ import mediapipe as mp # type: ignore
62
+ _HAS_MEDIAPIPE = True
63
+ except Exception:
64
+ _HAS_MEDIAPIPE = False
65
+
66
+ # --------------------------------------------------------------------------------------
67
+ # Path setup for third_party repos
68
+ # --------------------------------------------------------------------------------------
69
+ ROOT = Path(__file__).resolve().parent.parent # project root
70
+ TP_SAM2 = Path(os.environ.get("THIRD_PARTY_SAM2_DIR", ROOT / "third_party" / "sam2")).resolve()
71
+ TP_MATANY = Path(os.environ.get("THIRD_PARTY_MATANY_DIR", ROOT / "third_party" / "matanyone")).resolve()
72
+
73
def _add_sys_path(p: Path) -> None:
    """Prepend *p* to ``sys.path`` if it exists; warn (once) when it does not."""
    if not p.exists():
        logger.warning(f"third_party path not found: {p}")
        return
    entry = str(p)
    if entry not in sys.path:
        # Front of the path so vendored repos shadow any pip-installed copies.
        sys.path.insert(0, entry)
80
+
81
+ _add_sys_path(TP_SAM2)
82
+ _add_sys_path(TP_MATANY)
83
+
84
+ # --------------------------------------------------------------------------------------
85
+ # Safe Torch accessors (no top-level import)
86
+ # --------------------------------------------------------------------------------------
87
+ def _torch():
88
+ try:
89
+ import torch # local import avoids early CUDA init during module import
90
+ return torch
91
+ except Exception as e:
92
+ logger.warning(f"[models.safe-torch] import failed: {e}")
93
+ return None
94
+
95
def _has_cuda() -> bool:
    """Report whether a usable CUDA runtime is present (False on any failure)."""
    mod = _torch()
    if mod is None:
        return False
    try:
        available = mod.cuda.is_available()
    except Exception as e:
        logger.warning(f"[models.safe-torch] cuda.is_available() failed: {e}")
        return False
    return bool(available)
104
+
105
def _pick_device(env_key: str) -> str:
    """Resolve the compute device ("cuda"/"cpu") for the component named by *env_key*.

    Selection order: CUDA is used whenever available unless the environment
    explicitly requests "cpu"; an explicit "cuda" request is honored even if
    probing failed; otherwise auto-select based on availability. All
    CUDA-related environment knobs are logged up front for debuggability.
    """
    requested = os.environ.get(env_key, "").strip().lower()
    has_cuda = _has_cuda()

    # Snapshot every CUDA-related knob so a bad device pick is diagnosable.
    watched = (
        'FORCE_CUDA_DEVICE', 'CUDA_MEMORY_FRACTION', 'PYTORCH_CUDA_ALLOC_CONF',
        'REQUIRE_CUDA', 'SAM2_DEVICE', 'MATANY_DEVICE',
    )
    cuda_env_vars = {name: os.environ.get(name, '') for name in watched}
    logger.info(f"CUDA environment variables: {cuda_env_vars}")

    logger.info(f"_pick_device({env_key}): requested='{requested}', has_cuda={has_cuda}")

    if has_cuda and requested != "cpu":
        # GPU present and the caller did not explicitly opt out.
        logger.info(f"FORCING CUDA device (GPU available, requested='{requested}')")
        return "cuda"
    if requested in ("cuda", "cpu"):
        # Honor an explicit request even when the CUDA probe said no.
        logger.info(f"Using explicitly requested device: {requested}")
        return requested

    result = "cuda" if has_cuda else "cpu"
    logger.info(f"Auto-selected device: {result}")
    return result
133
+
134
+ # --------------------------------------------------------------------------------------
135
+ # Basic Utilities
136
+ # --------------------------------------------------------------------------------------
137
+ def _ffmpeg_bin() -> str:
138
+ return os.environ.get("FFMPEG_BIN", "ffmpeg")
139
+
140
+ def _probe_ffmpeg(timeout: int = 2) -> bool:
141
+ try:
142
+ subprocess.run([_ffmpeg_bin(), "-version"], stdout=subprocess.DEVNULL, stderr=subprocess.DEVNULL, check=True, timeout=timeout)
143
+ return True
144
+ except Exception:
145
+ return False
146
+
147
+ def _ensure_dir(p: Path) -> None:
148
+ p.mkdir(parents=True, exist_ok=True)
149
+
150
def _cv_read_first_frame(video_path: Union[str, Path]) -> Tuple[Optional[np.ndarray], int, Tuple[int, int]]:
    """Read frame 0 of *video_path*.

    Returns ``(frame_or_None, fps, (width, height))``; an unopenable file
    yields ``(None, 0, (0, 0))`` and an unreadable first frame yields
    ``(None, fps, (w, h))``.
    """
    cap = cv2.VideoCapture(str(video_path))
    if not cap.isOpened():
        return None, 0, (0, 0)
    fps = int(round(cap.get(cv2.CAP_PROP_FPS) or 25))  # 25 fps fallback when unknown
    ok, frame = cap.read()
    width = int(cap.get(cv2.CAP_PROP_FRAME_WIDTH) or 0)
    height = int(cap.get(cv2.CAP_PROP_FRAME_HEIGHT) or 0)
    cap.release()
    if ok:
        return frame, fps, (width, height)
    return None, fps, (width, height)
162
+
163
def _save_mask_png(mask: np.ndarray, path: Union[str, Path]) -> str:
    """Write *mask* to *path* as an 8-bit image; returns the path as str."""
    if mask.dtype == bool:
        out = mask.astype(np.uint8) * 255
    elif mask.dtype != np.uint8:
        out = np.clip(mask, 0, 255).astype(np.uint8)
    else:
        out = mask
    cv2.imwrite(str(path), out)
    return str(path)
170
+
171
def _resize_keep_ar(image: np.ndarray, target_wh: Tuple[int, int]) -> np.ndarray:
    """Resize *image* to fit inside *target_wh* (w, h), preserving aspect ratio.

    The scaled image is centred (letterboxed) on a zero-filled canvas of
    exactly the target size. Degenerate dimensions return the input unchanged.

    Fix: the canvas previously hard-coded 3 channels, which raised a shape
    mismatch for grayscale or 4-channel input; it now mirrors the input's
    channel layout.
    """
    tw, th = target_wh
    h, w = image.shape[:2]
    if h == 0 or w == 0 or tw == 0 or th == 0:
        return image
    scale = min(tw / w, th / h)
    nw, nh = max(1, int(round(w * scale))), max(1, int(round(h * scale)))
    resized = cv2.resize(image, (nw, nh), interpolation=cv2.INTER_CUBIC)
    canvas_shape = (th, tw) if image.ndim == 2 else (th, tw, image.shape[2])
    canvas = np.zeros(canvas_shape, dtype=resized.dtype)
    x0 = (tw - nw) // 2
    y0 = (th - nh) // 2
    canvas[y0:y0 + nh, x0:x0 + nw] = resized
    return canvas
184
+
185
def _video_writer(out_path: Path, fps: int, size: Tuple[int, int]) -> cv2.VideoWriter:
    """Open an MP4 (mp4v) writer at *size*; fps is clamped to at least 1."""
    codec = cv2.VideoWriter_fourcc(*"mp4v")
    return cv2.VideoWriter(str(out_path), codec, max(1, fps), size)
188
+
189
def _mux_audio(src_video: Union[str, Path], silent_video: Union[str, Path], out_path: Union[str, Path]) -> bool:
    """Copy video from silent_video + audio from src_video into out_path (AAC).

    Returns False (caller keeps the silent video) when ffmpeg fails.
    """
    cmd = [
        _ffmpeg_bin(), "-y",
        "-i", str(silent_video),
        "-i", str(src_video),
        "-map", "0:v:0",   # video track: the processed (silent) render
        "-map", "1:a:0?",  # audio track: original clip; '?' tolerates its absence
        "-c:v", "copy",
        "-c:a", "aac", "-b:a", "192k",
        "-shortest",
        str(out_path),
    ]
    try:
        subprocess.run(cmd, check=True, stdout=subprocess.PIPE, stderr=subprocess.PIPE)
    except Exception as e:
        logger.warning(f"Audio mux failed; returning silent video. Reason: {e}")
        return False
    return True
208
+
209
+ # --------------------------------------------------------------------------------------
210
+ # Compositing & Image Processing
211
+ # --------------------------------------------------------------------------------------
212
def _refine_alpha(alpha: np.ndarray, erode_px: int = 1, dilate_px: int = 2, blur_px: float = 1.5) -> np.ndarray:
    """Clean a matte: normalise to float32 [0,1], erode/dilate, then feather.

    Fix: the original only rescaled 0-255 data when the dtype was not float32,
    so a float32 matte holding 0-255 values was silently clipped to 1.0.
    Normalisation now depends on the value range, not the dtype.

    Returns a float32 array in [0, 1].
    """
    a = alpha.astype(np.float32, copy=True)
    if a.max() > 1.0:  # values look like a 0-255 matte, whatever the dtype
        a = a / 255.0

    # Morphology runs on uint8 for speed and exact kernel semantics.
    a_u8 = np.clip(np.round(a * 255.0), 0, 255).astype(np.uint8)
    if erode_px > 0:
        k = max(1, int(erode_px))
        a_u8 = cv2.erode(a_u8, cv2.getStructuringElement(cv2.MORPH_ELLIPSE, (k, k)), iterations=1)
    if dilate_px > 0:
        k = max(1, int(dilate_px))
        a_u8 = cv2.dilate(a_u8, cv2.getStructuringElement(cv2.MORPH_ELLIPSE, (k, k)), iterations=1)
    a = a_u8.astype(np.float32) / 255.0

    if blur_px and blur_px > 0:
        rad = max(1, int(round(blur_px)))
        # Gaussian kernel size must be odd; `| 1` guarantees that.
        a = cv2.GaussianBlur(a, (rad | 1, rad | 1), 0)

    return np.clip(a, 0.0, 1.0)
234
+
235
+ def _to_linear(rgb: np.ndarray, gamma: float = 2.2) -> np.ndarray:
236
+ x = np.clip(rgb.astype(np.float32) / 255.0, 0.0, 1.0)
237
+ return np.power(x, gamma)
238
+
239
+ def _to_srgb(lin: np.ndarray, gamma: float = 2.2) -> np.ndarray:
240
+ x = np.clip(lin, 0.0, 1.0)
241
+ return np.clip(np.power(x, 1.0 / gamma) * 255.0, 0, 255).astype(np.uint8)
242
+
243
def _light_wrap(bg_rgb: np.ndarray, alpha01: np.ndarray, radius: int = 5, amount: float = 0.18) -> np.ndarray:
    """Additive 'light wrap' term: blurred background bleed along the matte edge."""
    r = max(1, int(radius))
    inv_blur = cv2.GaussianBlur(1.0 - alpha01, (r | 1, r | 1), 0)
    return bg_rgb.astype(np.float32) * inv_blur[..., None] * float(amount)
249
+
250
def _despill_edges(fg_rgb: np.ndarray, alpha01: np.ndarray, amount: float = 0.35) -> np.ndarray:
    """Desaturate foreground pixels near the matte edge to suppress colour spill."""
    # Edge weight peaks at alpha == 0.5 and falls to zero at fully FG/BG pixels.
    edge_w = np.clip(1.0 - 2.0 * np.abs(alpha01 - 0.5), 0.0, 1.0)
    hsv = cv2.cvtColor(fg_rgb.astype(np.uint8), cv2.COLOR_RGB2HSV).astype(np.float32)
    hue, sat, val = cv2.split(hsv)
    sat = sat * (1.0 - amount * edge_w)
    merged = cv2.merge([hue, np.clip(sat, 0, 255), val])
    return cv2.cvtColor(merged.astype(np.uint8), cv2.COLOR_HSV2RGB)
259
+
260
def _composite_frame_pro(
    fg_rgb: np.ndarray, alpha: np.ndarray, bg_rgb: np.ndarray,
    erode_px: Optional[int] = None, dilate_px: Optional[int] = None, blur_px: Optional[float] = None,
    lw_radius: Optional[int] = None, lw_amount: Optional[float] = None, despill_amount: Optional[float] = None
) -> np.ndarray:
    """Composite one RGB frame over a background with edge refinement.

    Pipeline: refine the alpha (erode/dilate/feather), despill the foreground
    edge, blend foreground and background in linear light, then add a
    light-wrap term from the background. Any parameter left as ``None`` falls
    back to its EDGE_* / LIGHTWRAP_* / DESPILL_AMOUNT environment variable
    (defaults shown in the lookups below). Returns a uint8 RGB frame.
    """
    # Env fallbacks keep edge tuning possible without code changes.
    erode_px = erode_px if erode_px is not None else int(os.environ.get("EDGE_ERODE", "1"))
    dilate_px = dilate_px if dilate_px is not None else int(os.environ.get("EDGE_DILATE", "2"))
    blur_px = blur_px if blur_px is not None else float(os.environ.get("EDGE_BLUR", "1.5"))
    lw_radius = lw_radius if lw_radius is not None else int(os.environ.get("LIGHTWRAP_RADIUS", "5"))
    lw_amount = lw_amount if lw_amount is not None else float(os.environ.get("LIGHTWRAP_AMOUNT", "0.18"))
    despill_amount = despill_amount if despill_amount is not None else float(os.environ.get("DESPILL_AMOUNT", "0.35"))

    a = _refine_alpha(alpha, erode_px=erode_px, dilate_px=dilate_px, blur_px=blur_px)
    fg_rgb = _despill_edges(fg_rgb, a, amount=despill_amount)

    # Blend in linear light so the over operation is physically plausible.
    fg_lin = _to_linear(fg_rgb)
    bg_lin = _to_linear(bg_rgb)
    lw = _light_wrap(bg_rgb, a, radius=lw_radius, amount=lw_amount)
    lw_lin = _to_linear(np.clip(lw, 0, 255).astype(np.uint8))

    # Standard "over" plus the additive light-wrap contribution.
    comp_lin = fg_lin * a[..., None] + bg_lin * (1.0 - a[..., None]) + lw_lin
    comp = _to_srgb(comp_lin)
    return comp
283
+
284
+ # --------------------------------------------------------------------------------------
285
+ # SAM2 Integration
286
+ # --------------------------------------------------------------------------------------
287
def _resolve_sam2_cfg(cfg_str: str) -> str:
    """Resolve SAM2 config path - return relative path for Hydra compatibility.

    SAM2 loads configs through Hydra, which resolves them relative to the
    sam2 package rather than as filesystem paths, so once a config file is
    confirmed to exist this returns the package-relative form (``configs/…``).
    Falls back to the original string if nothing can be located.
    """
    logger.info(f"_resolve_sam2_cfg called with cfg_str={cfg_str}")

    # Get the third-party SAM2 directory (default matches the container layout).
    tp_sam2 = os.environ.get("THIRD_PARTY_SAM2_DIR", "/home/user/app/third_party/sam2")
    logger.info(f"TP_SAM2 = {tp_sam2}")

    # Check if the full path exists on disk before trusting the name.
    candidate = os.path.join(tp_sam2, cfg_str)
    logger.info(f"Candidate path: {candidate}")
    logger.info(f"Candidate exists: {os.path.exists(candidate)}")

    if os.path.exists(candidate):
        # For Hydra compatibility, return just the relative path within sam2 package.
        if cfg_str.startswith("sam2/configs/"):
            relative_path = cfg_str.replace("sam2/configs/", "configs/")
        else:
            relative_path = cfg_str
        logger.info(f"Returning Hydra-compatible relative path: {relative_path}")
        return relative_path

    # If not found, try some fallback locations used by different SAM2 checkouts.
    fallbacks = [
        os.path.join(tp_sam2, "sam2", cfg_str),
        os.path.join(tp_sam2, "configs", cfg_str),
    ]

    for fallback in fallbacks:
        logger.info(f"Trying fallback: {fallback}")
        if os.path.exists(fallback):
            # Extract the package-relative portion for Hydra.
            if "configs/" in fallback:
                relative_path = "configs/" + fallback.split("configs/")[-1]
                logger.info(f"Returning fallback relative path: {relative_path}")
                return relative_path

    # Nothing matched: hand the original back and let the loader surface the error.
    logger.warning(f"Config not found, returning original: {cfg_str}")
    return cfg_str
326
+
327
def _find_hiera_config_if_hieradet(cfg_path: str) -> Optional[str]:
    """If config references 'hieradet', try to find a 'hiera' config.

    Reads the YAML at *cfg_path*; when its image-encoder trunk target mentions
    ``hieradet`` (a trunk class some SAM2 builds do not ship), scans every
    YAML under TP_SAM2 for one whose trunk target lives in a ``.hiera.``
    module and returns its path. Returns ``None`` when no substitution is
    needed or nothing suitable is found. Entirely best-effort: all failures
    are swallowed.
    """
    try:
        with open(cfg_path, "r") as f:
            data = yaml.safe_load(f)
        # Walk model -> image_encoder -> trunk defensively; any level may be absent.
        model = data.get("model", {}) or {}
        enc = model.get("image_encoder") or {}
        trunk = enc.get("trunk") or {}
        target = trunk.get("_target_") or trunk.get("target")
        if isinstance(target, str) and "hieradet" in target:
            for y in TP_SAM2.rglob("*.yaml"):
                try:
                    with open(y, "r") as f2:
                        d2 = yaml.safe_load(f2) or {}
                    e2 = (d2.get("model", {}) or {}).get("image_encoder") or {}
                    t2 = (e2.get("trunk") or {})
                    tgt2 = t2.get("_target_") or t2.get("target")
                    if isinstance(tgt2, str) and ".hiera." in tgt2:
                        logger.info(f"SAM2: switching config from 'hieradet' → 'hiera': {y}")
                        return str(y)
                except Exception:
                    # Unparseable candidate config: skip it and keep scanning.
                    continue
    except Exception:
        # Best-effort only; any failure simply means "no substitution".
        pass
    return None
352
+
353
def load_sam2() -> Tuple[Optional[object], bool, Dict[str, Any]]:
    """Robust SAM2 loader with config resolution and error handling.

    Returns ``(predictor_or_None, ok, meta)`` where ``meta`` records how far
    loading progressed (import vs. init) and which device was selected, so
    callers can report a precise diagnostic instead of a generic failure.
    """
    meta = {"sam2_import_ok": False, "sam2_init_ok": False}
    try:
        from sam2.build_sam import build_sam2  # type: ignore
        from sam2.sam2_image_predictor import SAM2ImagePredictor  # type: ignore
        meta["sam2_import_ok"] = True
    except Exception as e:
        logger.warning(f"SAM2 import failed: {e}")
        return None, False, meta

    # Check GPU memory before loading.
    # Fix: use the lazy _torch() accessor — this module deliberately has no
    # top-level `torch` import, so the previous bare `torch` reference could
    # raise NameError here.
    t = _torch()
    if t is not None and t.cuda.is_available():
        mem_before = t.cuda.memory_allocated() / 1024**3
        logger.info(f"🔍 GPU memory before SAM2 load: {mem_before:.2f}GB")

    device = _pick_device("SAM2_DEVICE")
    cfg_env = os.environ.get("SAM2_MODEL_CFG", "sam2/configs/sam2/sam2_hiera_l.yaml")
    cfg = _resolve_sam2_cfg(cfg_env)
    ckpt = os.environ.get("SAM2_CHECKPOINT", "")

    def _try_build(cfg_path: str):
        """Call build_sam2 adapting to whichever signature this SAM2 version exposes."""
        logger.info(f"_try_build called with cfg_path: {cfg_path}")
        params = set(inspect.signature(build_sam2).parameters.keys())
        logger.info(f"build_sam2 parameters: {list(params)}")
        kwargs = {}
        # Config argument has been renamed across SAM2 releases.
        if "config_file" in params:
            kwargs["config_file"] = cfg_path
            logger.info(f"Using config_file parameter: {cfg_path}")
        elif "model_cfg" in params:
            kwargs["model_cfg"] = cfg_path
            logger.info(f"Using model_cfg parameter: {cfg_path}")
        # Same story for the checkpoint argument.
        if ckpt:
            if "checkpoint" in params:
                kwargs["checkpoint"] = ckpt
            elif "ckpt_path" in params:
                kwargs["ckpt_path"] = ckpt
            elif "weights" in params:
                kwargs["weights"] = ckpt
        if "device" in params:
            kwargs["device"] = device
        try:
            logger.info(f"Calling build_sam2 with kwargs: {kwargs}")
            result = build_sam2(**kwargs)
            logger.info(f"build_sam2 succeeded with kwargs")
            # Log the actual device of the model when it is discoverable.
            if hasattr(result, 'device'):
                logger.info(f"SAM2 model device: {result.device}")
            elif hasattr(result, 'image_encoder') and hasattr(result.image_encoder, 'device'):
                logger.info(f"SAM2 model device: {result.image_encoder.device}")
            return result
        except TypeError as e:
            # Signature mismatch: retry positionally (cfg, [ckpt], [device]).
            logger.info(f"build_sam2 kwargs failed: {e}, trying positional args")
            pos = [cfg_path]
            if ckpt:
                pos.append(ckpt)
            if "device" not in kwargs:
                pos.append(device)
            logger.info(f"Calling build_sam2 with positional args: {pos}")
            result = build_sam2(*pos)
            logger.info(f"build_sam2 succeeded with positional args")
            return result

    try:
        try:
            sam = _try_build(cfg)
        except Exception:
            # Some SAM2 builds lack the 'hieradet' trunk; retry with a 'hiera' config.
            alt_cfg = _find_hiera_config_if_hieradet(cfg)
            if alt_cfg:
                sam = _try_build(alt_cfg)
            else:
                raise

        if sam is not None:
            predictor = SAM2ImagePredictor(sam)
            meta["sam2_init_ok"] = True
            meta["sam2_device"] = device
            return predictor, True, meta
        else:
            return None, False, meta

    except Exception as e:
        logger.error(f"SAM2 loading failed: {e}")
        return None, False, meta
437
+
438
def run_sam2_mask(predictor: object,
                  first_frame_bgr: np.ndarray,
                  point: Optional[Tuple[int, int]] = None,
                  auto: bool = False) -> Tuple[Optional[np.ndarray], bool]:
    """Return (mask_uint8_0_255, ok).

    Prompts SAM2 with either a foreground click (*point*), a wide 90% box
    (*auto*), or a default 80% centre box, and returns the first mask.
    """
    if predictor is None:
        return None, False
    try:
        rgb = cv2.cvtColor(first_frame_bgr, cv2.COLOR_BGR2RGB)
        predictor.set_image(rgb)
        h, w = rgb.shape[:2]

        if auto:
            prompt_box = np.array([int(0.05*w), int(0.05*h), int(0.95*w), int(0.95*h)])
            masks, _, _ = predictor.predict(box=prompt_box)
        elif point is not None:
            coords = np.array([[int(point[0]), int(point[1])]], dtype=np.int32)
            labels = np.array([1], dtype=np.int32)  # 1 = positive (foreground) click
            masks, _, _ = predictor.predict(point_coords=coords, point_labels=labels)
        else:
            prompt_box = np.array([int(0.1*w), int(0.1*h), int(0.9*w), int(0.9*h)])
            masks, _, _ = predictor.predict(box=prompt_box)

        if masks is None or len(masks) == 0:
            return None, False
        return masks[0].astype(np.uint8) * 255, True
    except Exception as e:
        logger.warning(f"SAM2 mask failed: {e}")
        return None, False
471
+
472
def _refine_mask_grabcut(image_bgr: np.ndarray,
                         mask_u8: np.ndarray,
                         iters: Optional[int] = None,
                         trimap_erode: Optional[int] = None,
                         trimap_dilate: Optional[int] = None) -> np.ndarray:
    """Use SAM2 seed as initialization for GrabCut refinement.

    Builds a trimap from the binary seed (eroded mask -> sure foreground,
    eroded inverse -> sure background, everything else probable background)
    and runs mask-initialised GrabCut. ``None`` parameters fall back to the
    REFINE_* environment variables. Returns a 0/255 uint8 mask; on GrabCut
    failure the thresholded seed is returned unchanged.
    """
    iters = int(os.environ.get("REFINE_GRABCUT_ITERS", "2")) if iters is None else int(iters)
    e = int(os.environ.get("REFINE_TRIMAP_ERODE", "3")) if trimap_erode is None else int(trimap_erode)
    d = int(os.environ.get("REFINE_TRIMAP_DILATE", "6")) if trimap_dilate is None else int(trimap_dilate)

    h, w = mask_u8.shape[:2]
    m = (mask_u8 > 127).astype(np.uint8) * 255  # binarise the incoming seed

    # Shrinking the mask leaves confidently-foreground pixels; shrinking the
    # inverse leaves confidently-background pixels.
    sure_fg = cv2.erode(m, cv2.getStructuringElement(cv2.MORPH_ELLIPSE, (max(1, e), max(1, e))), iterations=1)
    sure_bg = cv2.erode(255 - m, cv2.getStructuringElement(cv2.MORPH_ELLIPSE, (max(1, d), max(1, d))), iterations=1)

    gc_mask = np.full((h, w), cv2.GC_PR_BGD, dtype=np.uint8)
    gc_mask[sure_bg > 0] = cv2.GC_BGD
    gc_mask[sure_fg > 0] = cv2.GC_FGD

    # Scratch model buffers required by cv2.grabCut's API.
    bgdModel = np.zeros((1, 65), np.float64)
    fgdModel = np.zeros((1, 65), np.float64)
    try:
        cv2.grabCut(image_bgr, gc_mask, None, bgdModel, fgdModel, iters, cv2.GC_INIT_WITH_MASK)
        out = np.where((gc_mask == cv2.GC_FGD) | (gc_mask == cv2.GC_PR_FGD), 255, 0).astype(np.uint8)
        out = cv2.medianBlur(out, 5)  # remove speckle left by per-pixel labelling
        return out
    except Exception as e:
        logger.warning(f"GrabCut refinement failed; using original mask. Reason: {e}")
        return m
502
+
503
+ # --------------------------------------------------------------------------------------
504
+ # MatAnyone Integration
505
+ # --------------------------------------------------------------------------------------
506
def load_matany() -> Tuple[Optional[object], bool, Dict[str, Any]]:
    """
    Probe MatAnyone availability with T=1 squeeze patch for conv2d compatibility.
    Returns (None, available, meta); actual instantiation happens in MatAnyoneSession.
    """
    meta = {"matany_import_ok": False, "matany_init_ok": False}
    # Operators can switch MatAnyone off entirely via ENABLE_MATANY.
    enable_env = os.environ.get("ENABLE_MATANY", "1").strip().lower()
    if enable_env in {"0", "false", "off", "no"}:
        logger.info("MatAnyone disabled by ENABLE_MATANY=0.")
        meta["disabled"] = True
        return None, False, meta

    # Apply T=1 squeeze patch before importing InferenceCore — the patch must
    # be in place before MatAnyone's modules bind their references.
    try:
        from .matany_compat_patch import apply_matany_t1_squeeze_guard
        if apply_matany_t1_squeeze_guard():
            logger.info("[MatAnyCompat] T=1 squeeze guard applied")
            meta["patch_applied"] = True
        else:
            logger.warning("[MatAnyCompat] T=1 squeeze patch failed; conv2d errors may occur")
            meta["patch_applied"] = False
    except Exception as e:
        logger.warning(f"[MatAnyCompat] Patch import failed: {e}")
        meta["patch_applied"] = False

    try:
        from matanyone.inference.inference_core import InferenceCore  # type: ignore
        meta["matany_import_ok"] = True
        # Log MatAnyone version and InferenceCore attributes for diagnostics.
        try:
            version = importlib.metadata.version("matanyone")
            logger.info(f"[MATANY] MatAnyone version: {version}")
        except Exception:
            logger.info("[MATANY] MatAnyone version unknown")
        logger.debug(f"[MATANY] InferenceCore attributes: {dir(InferenceCore)}")
        device = _pick_device("MATANY_DEVICE")
        repo_id = os.environ.get("MATANY_REPO_ID", "PeiqingYang/MatAnyone")
        meta["matany_repo_id"] = repo_id
        meta["matany_device"] = device
        # NOTE: returns None for the handle by design — construction is deferred
        # to MatAnyoneSession; "available" (True) only means imports succeeded.
        return None, True, meta
    except Exception as e:
        logger.warning(f"MatAnyone import failed: {e}")
        return None, False, meta
549
+
550
+ # --------------------------------------------------------------------------------------
551
+ # Fallback Functions
552
+ # --------------------------------------------------------------------------------------
553
def fallback_mask(first_frame_bgr: np.ndarray) -> np.ndarray:
    """Prefer MediaPipe; fallback to GrabCut. Returns uint8 mask 0/255.

    Used when SAM2 is unavailable or failed. GrabCut is seeded with a
    rectangle covering the central 80% of the frame; on total failure an
    all-zero (all-background) mask is returned.
    """
    h, w = first_frame_bgr.shape[:2]
    if _HAS_MEDIAPIPE:
        try:
            mp_selfie = mp.solutions.selfie_segmentation
            with mp_selfie.SelfieSegmentation(model_selection=1) as segmenter:
                rgb = cv2.cvtColor(first_frame_bgr, cv2.COLOR_BGR2RGB)
                res = segmenter.process(rgb)
                # Threshold the soft segmentation at 0.5 to get a hard matte.
                m = (np.clip(res.segmentation_mask, 0, 1) > 0.5).astype(np.uint8) * 255
                m = cv2.medianBlur(m, 5)  # smooth ragged edges
                return m
        except Exception as e:
            logger.warning(f"MediaPipe fallback failed: {e}")

    # Ultimate fallback: GrabCut
    mask = np.zeros((h, w), np.uint8)
    rect = (int(0.1*w), int(0.1*h), int(0.8*w), int(0.8*h))  # (x, y, width, height)
    # Scratch model buffers required by cv2.grabCut's API.
    bgdModel = np.zeros((1, 65), np.float64)
    fgdModel = np.zeros((1, 65), np.float64)
    try:
        cv2.grabCut(first_frame_bgr, mask, rect, bgdModel, fgdModel, 5, cv2.GC_INIT_WITH_RECT)
        mask_bin = np.where((mask == cv2.GC_FGD) | (mask == cv2.GC_PR_FGD), 255, 0).astype(np.uint8)
        return mask_bin
    except Exception as e:
        logger.warning(f"GrabCut failed: {e}")
        return np.zeros((h, w), dtype=np.uint8)
580
+
581
def composite_video(fg_path: Union[str, Path],
                    alpha_path: Union[str, Path],
                    bg_image_path: Union[str, Path],
                    out_path: Union[str, Path],
                    fps: int,
                    size: Tuple[int, int]) -> bool:
    """Blend MatAnyone FG+ALPHA over background using pro compositor.

    Reads the foreground and alpha videos in lockstep, composites each frame
    over the letterboxed background image, and writes the result. When ffmpeg
    is available the frames go to a temporary mp4v file that is then
    re-encoded to H.264; otherwise the mp4v output is kept directly.
    Returns True if at least one frame was written.
    """
    fg_cap = cv2.VideoCapture(str(fg_path))
    al_cap = cv2.VideoCapture(str(alpha_path))
    if not fg_cap.isOpened() or not al_cap.isOpened():
        return False

    w, h = size
    bg = cv2.imread(str(bg_image_path), cv2.IMREAD_COLOR)
    if bg is None:
        # Missing/unreadable background: fall back to flat mid-grey.
        bg = np.full((h, w, 3), 127, dtype=np.uint8)
    bg_f = _resize_keep_ar(bg, (w, h))

    if _probe_ffmpeg():
        # Write mp4v to a temp file first, then finalize to H.264 below.
        tmp_out = Path(str(out_path) + ".tmp.mp4")
        writer = _video_writer(tmp_out, fps, (w, h))
        post_h264 = True
    else:
        writer = _video_writer(Path(out_path), fps, (w, h))
        post_h264 = False

    ok_any = False
    try:
        while True:
            ok_fg, fg = fg_cap.read()
            ok_al, al = al_cap.read()
            if not ok_fg or not ok_al:
                break  # stop at the shorter of the two streams
            fg = cv2.resize(fg, (w, h), interpolation=cv2.INTER_CUBIC)
            al_gray = cv2.cvtColor(cv2.resize(al, (w, h)), cv2.COLOR_BGR2GRAY)

            # Compositor works in RGB; OpenCV I/O is BGR, hence the conversions.
            comp = _composite_frame_pro(
                cv2.cvtColor(fg, cv2.COLOR_BGR2RGB),
                al_gray,
                cv2.cvtColor(bg_f, cv2.COLOR_BGR2RGB)
            )
            writer.write(cv2.cvtColor(comp, cv2.COLOR_RGB2BGR))
            ok_any = True
    finally:
        fg_cap.release()
        al_cap.release()
        writer.release()

    if post_h264 and ok_any:
        try:
            # Re-encode to H.264 + faststart for broad browser playback.
            cmd = [
                _ffmpeg_bin(), "-y",
                "-i", str(tmp_out),
                "-c:v", "libx264", "-pix_fmt", "yuv420p", "-movflags", "+faststart",
                str(out_path)
            ]
            subprocess.run(cmd, check=True, stdout=subprocess.PIPE, stderr=subprocess.PIPE)
            tmp_out.unlink(missing_ok=True)
        except Exception as e:
            logger.warning(f"ffmpeg finalize failed: {e}")
            # Keep the mp4v temp render as the final output rather than failing.
            Path(out_path).unlink(missing_ok=True)
            tmp_out.replace(out_path)

    return ok_any
645
+
646
def fallback_composite(video_path: Union[str, Path],
                       mask_path: Union[str, Path],
                       bg_image_path: Union[str, Path],
                       out_path: Union[str, Path]) -> bool:
    """Static-mask compositing using pro compositor.

    Like :func:`composite_video`, but applies a single still mask to every
    frame of the source video (used when per-frame matting is unavailable).
    Returns True if at least one frame was written.
    """
    mask = cv2.imread(str(mask_path), cv2.IMREAD_GRAYSCALE)
    cap = cv2.VideoCapture(str(video_path))
    if mask is None or not cap.isOpened():
        return False

    # Output keeps the source video's geometry and frame rate.
    w = int(cap.get(cv2.CAP_PROP_FRAME_WIDTH) or 0)
    h = int(cap.get(cv2.CAP_PROP_FRAME_HEIGHT) or 0)
    fps = int(round(cap.get(cv2.CAP_PROP_FPS) or 25))

    bg = cv2.imread(str(bg_image_path), cv2.IMREAD_COLOR)
    if bg is None:
        # Missing/unreadable background: fall back to flat mid-grey.
        bg = np.full((h, w, 3), 127, dtype=np.uint8)

    # NEAREST keeps the mask hard-edged; _composite_frame_pro feathers it later.
    mask_resized = cv2.resize(mask, (w, h), interpolation=cv2.INTER_NEAREST)
    bg_f = _resize_keep_ar(bg, (w, h))

    if _probe_ffmpeg():
        # Write mp4v to a temp file first, then finalize to H.264 below.
        tmp_out = Path(str(out_path) + ".tmp.mp4")
        writer = _video_writer(tmp_out, fps, (w, h))
        use_post_ffmpeg = True
    else:
        writer = _video_writer(Path(out_path), fps, (w, h))
        use_post_ffmpeg = False

    ok_any = False
    try:
        while True:
            ok, frame = cap.read()
            if not ok:
                break
            # Compositor works in RGB; OpenCV I/O is BGR, hence the conversions.
            comp = _composite_frame_pro(
                cv2.cvtColor(frame, cv2.COLOR_BGR2RGB),
                mask_resized,
                cv2.cvtColor(bg_f, cv2.COLOR_BGR2RGB)
            )
            writer.write(cv2.cvtColor(comp, cv2.COLOR_RGB2BGR))
            ok_any = True
    finally:
        cap.release()
        writer.release()

    if use_post_ffmpeg and ok_any:
        try:
            # Re-encode to H.264 + faststart for broad browser playback.
            cmd = [
                _ffmpeg_bin(), "-y",
                "-i", str(tmp_out),
                "-c:v", "libx264", "-pix_fmt", "yuv420p", "-movflags", "+faststart",
                str(out_path)
            ]
            subprocess.run(cmd, check=True, stdout=subprocess.PIPE, stderr=subprocess.PIPE)
            tmp_out.unlink(missing_ok=True)
        except Exception as e:
            logger.warning(f"ffmpeg H.264 finalize failed: {e}")
            # Keep the mp4v temp render as the final output rather than failing.
            Path(out_path).unlink(missing_ok=True)
            tmp_out.replace(out_path)

    return ok_any
708
+
709
+ # --------------------------------------------------------------------------------------
710
+ # Stage-A (Transparent Export) Functions
711
+ # --------------------------------------------------------------------------------------
712
+ def _checkerboard_bg(w: int, h: int, tile: int = 32) -> np.ndarray:
713
+ y, x = np.mgrid[0:h, 0:w]
714
+ c = ((x // tile) + (y // tile)) % 2
715
+ a = np.where(c == 0, 200, 150).astype(np.uint8)
716
+ return np.stack([a, a, a], axis=-1)
717
+
718
def _build_stage_a_rgba_vp9_from_fg_alpha(
    fg_path: Union[str, Path],
    alpha_path: Union[str, Path],
    out_webm: Union[str, Path],
    fps: int,
    size: Tuple[int, int],
    src_audio: Optional[Union[str, Path]] = None,
) -> bool:
    """Merge FG + alpha videos into a transparent VP9 WebM (optionally with audio)."""
    if not _probe_ffmpeg():
        return False
    w, h = size
    try:
        cmd = [_ffmpeg_bin(), "-y", "-i", str(fg_path), "-i", str(alpha_path)]
        if src_audio:
            cmd += ["-i", str(src_audio)]
        # alphamerge fuses the grayscale alpha stream into the FG as its A channel.
        graph = (
            f"[1:v]format=gray,scale={w}:{h},fps={fps}[al];"
            f"[0:v]scale={w}:{h},fps={fps}[fg];"
            f"[fg][al]alphamerge[outv]"
        )
        cmd += ["-filter_complex", graph, "-map", "[outv]"]
        if src_audio:
            cmd += ["-map", "2:a:0?", "-c:a", "libopus", "-b:a", "128k"]
        cmd += [
            "-c:v", "libvpx-vp9", "-pix_fmt", "yuva420p",
            "-crf", os.environ.get("STAGEA_VP9_CRF", "28"),
            "-b:v", "0", "-row-mt", "1", "-shortest", str(out_webm),
        ]
        subprocess.run(cmd, check=True, stdout=subprocess.PIPE, stderr=subprocess.PIPE)
        return True
    except Exception as e:
        logger.warning(f"Stage-A VP9(alpha) build failed: {e}")
        return False
749
+
750
def _build_stage_a_rgba_vp9_from_mask(
    video_path: Union[str, Path],
    mask_png: Union[str, Path],
    out_webm: Union[str, Path],
    fps: int,
    size: Tuple[int, int],
) -> bool:
    """Build a transparent VP9 WebM by applying one still mask to every frame."""
    if not _probe_ffmpeg():
        return False
    w, h = size
    try:
        cmd = [
            _ffmpeg_bin(), "-y",
            "-i", str(video_path),
            # Loop the still PNG so it covers the whole video duration.
            "-loop", "1", "-i", str(mask_png),
            "-filter_complex",
            f"[1:v]format=gray,scale={w}:{h},fps={fps}[al];"
            f"[0:v]scale={w}:{h},fps={fps}[fg];"
            f"[fg][al]alphamerge[outv]",
            "-map", "[outv]",
            "-c:v", "libvpx-vp9", "-pix_fmt", "yuva420p",
            "-crf", os.environ.get("STAGEA_VP9_CRF", "28"),
            "-b:v", "0", "-row-mt", "1", "-shortest", str(out_webm),
        ]
        subprocess.run(cmd, check=True, stdout=subprocess.PIPE, stderr=subprocess.PIPE)
    except Exception as e:
        logger.warning(f"Stage-A VP9(alpha) (mask) build failed: {e}")
        return False
    return True
779
+
780
def _build_stage_a_checkerboard_from_fg_alpha(
    fg_path: Union[str, Path],
    alpha_path: Union[str, Path],
    out_mp4: Union[str, Path],
    fps: int,
    size: Tuple[int, int],
) -> bool:
    """Preview render: FG+alpha composited over a checkerboard, written as MP4."""
    fg_cap = cv2.VideoCapture(str(fg_path))
    al_cap = cv2.VideoCapture(str(alpha_path))
    if not fg_cap.isOpened() or not al_cap.isOpened():
        return False
    w, h = size
    writer = _video_writer(Path(out_mp4), fps, (w, h))
    board = _checkerboard_bg(w, h)
    wrote_any = False
    try:
        while True:
            got_fg, fg = fg_cap.read()
            got_al, al = al_cap.read()
            if not (got_fg and got_al):
                break  # stop at the shorter stream
            fg = cv2.resize(fg, (w, h))
            alpha_gray = cv2.cvtColor(cv2.resize(al, (w, h)), cv2.COLOR_BGR2GRAY)
            comp = _composite_frame_pro(cv2.cvtColor(fg, cv2.COLOR_BGR2RGB), alpha_gray, board)
            writer.write(cv2.cvtColor(comp, cv2.COLOR_RGB2BGR))
            wrote_any = True
    finally:
        fg_cap.release()
        al_cap.release()
        writer.release()
    return wrote_any
811
+
812
def _build_stage_a_checkerboard_from_mask(
    video_path: Union[str, Path],
    mask_png: Union[str, Path],
    out_mp4: Union[str, Path],
    fps: int,
    size: Tuple[int, int],
) -> bool:
    """Preview render: every frame masked by one still PNG over a checkerboard."""
    cap = cv2.VideoCapture(str(video_path))
    if not cap.isOpened():
        return False
    w, h = size
    mask = cv2.imread(str(mask_png), cv2.IMREAD_GRAYSCALE)
    if mask is None:
        return False
    # NEAREST keeps the mask hard-edged; the compositor feathers it later.
    mask = cv2.resize(mask, (w, h), interpolation=cv2.INTER_NEAREST)
    writer = _video_writer(Path(out_mp4), fps, (w, h))
    board = _checkerboard_bg(w, h)
    wrote_any = False
    try:
        while True:
            got, frame = cap.read()
            if not got:
                break
            frame = cv2.resize(frame, (w, h))
            comp = _composite_frame_pro(cv2.cvtColor(frame, cv2.COLOR_BGR2RGB), mask, board)
            writer.write(cv2.cvtColor(comp, cv2.COLOR_RGB2BGR))
            wrote_any = True
    finally:
        cap.release()
        writer.release()
    return wrote_any
843
+
844
+ # --------------------------------------------------------------------------------------
845
+ # MatAnyone Integration
846
+ # --------------------------------------------------------------------------------------
847
def run_matany(
    video_path: Union[str, Path],
    mask_path: Optional[Union[str, Path]],
    out_dir: Union[str, Path],
    device: Optional[str] = None,
    progress_callback: Optional[Callable[[float, str], None]] = None,
) -> Tuple[Path, Path]:
    """
    Run MatAnyone streaming matting via our shape-guarded adapter.
    Returns (alpha_mp4_path, fg_mp4_path).
    Raises MatAnyError on failure.
    """
    # Imported lazily so this module stays importable when MatAnyone is absent.
    from .matanyone_loader import MatAnyoneSession, MatAnyError

    # precision="auto" lets the session pick dtype; device=None defers to its default.
    session = MatAnyoneSession(device=device, precision="auto")
    alpha_p, fg_p = session.process_stream(
        video_path=Path(video_path),
        seed_mask_path=Path(mask_path) if mask_path else None,
        out_dir=Path(out_dir),
        progress_cb=progress_callback,
    )
    return alpha_p, fg_p
VideoBackgroundReplacer2/models/matanyone_loader.py ADDED
@@ -0,0 +1,290 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ #!/usr/bin/env python3
2
+ # -*- coding: utf-8 -*-
3
+ """
4
+ MatAnyone adapter β€” Using Official API (File-Based)
5
+
6
+ Fixed to use MatAnyone's official process_video() API instead of
7
+ bypassing it with internal tensor manipulation. This eliminates
8
+ all 5D tensor dimension issues.
9
+
10
+ Changes (2025-09-17):
11
+ - Replaced custom tensor processing with official MatAnyone API
12
+ - Uses file-based input/output as designed by MatAnyone authors
13
+ - Eliminates all tensor dimension compatibility issues
14
+ - Simplified error handling and logging
15
+ """
16
+
17
+ from __future__ import annotations
18
+ import os
19
+ import time
20
+ import logging
21
+ import tempfile
22
+ import importlib.metadata
23
+ from pathlib import Path
24
+ from typing import Optional, Callable, Tuple
25
+
26
+ log = logging.getLogger(__name__)
27
+
28
+ # ---------- Progress helper ----------
29
+ def _env_flag(name: str, default: str = "0") -> bool:
30
+ return os.getenv(name, default).strip().lower() in {"1", "true", "yes", "on"}
31
+
32
# Master switch for progress callbacks (MATANY_PROGRESS env var, default on).
_PROGRESS_CB_ENABLED = _env_flag("MATANY_PROGRESS", "1")
# Minimum seconds between repeated emissions of the same message.
_PROGRESS_MIN_INTERVAL = float(os.getenv("MATANY_PROGRESS_MIN_SEC", "0.25"))
# Throttling state shared across _emit_progress() calls (module-level, not thread-safe).
_progress_last = 0.0
_progress_last_msg = None
# Latched to True after a callback raises; see _emit_progress().
_progress_disabled = False
37
+
38
def _emit_progress(cb, pct: float, msg: str):
    """
    Invoke the progress callback *cb* with (pct, msg), falling back to the
    legacy single-argument form. Repeats of the same message are throttled
    to _PROGRESS_MIN_INTERVAL seconds; a raising callback permanently
    disables further emissions.
    """
    global _progress_last, _progress_last_msg, _progress_disabled
    if not cb or not _PROGRESS_CB_ENABLED or _progress_disabled:
        return
    now = time.time()
    within_interval = (now - _progress_last) < _PROGRESS_MIN_INTERVAL
    if within_interval and msg == _progress_last_msg:
        return  # throttle duplicate messages
    try:
        try:
            cb(pct, msg)  # preferred (pct, msg)
        except TypeError:
            cb(msg)  # legacy (msg)
    except Exception as exc:
        # Never let a broken UI callback take down processing.
        _progress_disabled = True
        log.warning("[progress-cb] disabled due to exception: %s", exc)
    else:
        _progress_last = now
        _progress_last_msg = msg
55
+
56
# ---------- Errors ----------
class MatAnyError(RuntimeError):
    """Raised when MatAnyone initialization or processing fails."""
    pass
59
+
60
+ # ---------- CUDA helpers ----------
61
+ def _cuda_snapshot(device: Optional[str]) -> str:
62
+ try:
63
+ import torch
64
+ if not torch.cuda.is_available():
65
+ return "CUDA: N/A"
66
+ idx = 0
67
+ if device and device.startswith("cuda:"):
68
+ try:
69
+ idx = int(device.split(":")[1])
70
+ except (ValueError, IndexError):
71
+ idx = 0
72
+ name = torch.cuda.get_device_name(idx)
73
+ alloc = torch.cuda.memory_allocated(idx) / (1024**3)
74
+ resv = torch.cuda.memory_reserved(idx) / (1024**3)
75
+ return f"device={idx}, name={name}, alloc={alloc:.2f}GB, reserved={resv:.2f}GB"
76
+ except Exception as e:
77
+ return f"CUDA snapshot error: {e!r}"
78
+
79
def _safe_empty_cache():
    """Best-effort torch.cuda.empty_cache() with before/after memory logging; never raises."""
    try:
        import torch
        if not torch.cuda.is_available():
            return
        log.info(f"[MATANY] CUDA memory before empty_cache: {_cuda_snapshot('cuda:0')}")
        torch.cuda.empty_cache()
        log.info(f"[MATANY] CUDA memory after empty_cache: {_cuda_snapshot('cuda:0')}")
    except Exception:
        pass
88
+
89
# ============================================================================

class MatAnyoneSession:
    """
    Simple wrapper around MatAnyone's official API.
    Uses file-based input/output as designed by the MatAnyone authors.
    """
    def __init__(self, device: Optional[str] = None, precision: str = "auto"):
        """
        Args:
            device: Torch device string ("cuda", "cuda:0", "cpu"); auto-detected when None.
            precision: Requested precision mode (stored; currently informational).

        Raises:
            MatAnyError: if MatAnyone's InferenceCore cannot be initialized.
        """
        self.device = device or ("cuda" if self._cuda_available() else "cpu")
        self.precision = precision.lower()

        # Log MatAnyone version (informational only; failure is non-fatal).
        try:
            version = importlib.metadata.version("matanyone")
            log.info("[MATANY] MatAnyone version: %s", version)
        except Exception:
            log.info("[MATANY] MatAnyone version unknown")

        # Initialize MatAnyone's official API.
        try:
            from matanyone import InferenceCore
            self.processor = InferenceCore("PeiqingYang/MatAnyone")
            log.info("[MATANY] MatAnyone InferenceCore initialized successfully")
        except Exception as e:
            # Chain the original exception so the root cause stays visible.
            raise MatAnyError(f"Failed to initialize MatAnyone: {e}") from e

    def _cuda_available(self) -> bool:
        """Return True if torch reports an available CUDA device (False on any error)."""
        try:
            import torch
            return torch.cuda.is_available()
        except Exception:
            return False

    def process_stream(
        self,
        video_path: Path,
        seed_mask_path: Optional[Path] = None,
        out_dir: Optional[Path] = None,
        progress_cb: Optional[Callable] = None,
    ) -> Tuple[Path, Path]:
        """
        Process video using MatAnyone's official API.

        Args:
            video_path: Path to input video file
            seed_mask_path: Path to first-frame mask PNG (white=foreground, black=background)
            out_dir: Output directory for results (defaults to <video dir>/matanyone_output)
            progress_cb: Progress callback function

        Returns:
            Tuple of (alpha_path, foreground_path)

        Raises:
            MatAnyError: on missing inputs, processing failure, or missing outputs.
        """
        video_path = Path(video_path)
        if not video_path.exists():
            raise MatAnyError(f"Video file not found: {video_path}")

        if seed_mask_path and not Path(seed_mask_path).exists():
            raise MatAnyError(f"Seed mask not found: {seed_mask_path}")

        out_dir = Path(out_dir) if out_dir else video_path.parent / "matanyone_output"
        out_dir.mkdir(parents=True, exist_ok=True)

        log.info("[MATANY] Processing video: %s", video_path)
        log.info("[MATANY] Using mask: %s", seed_mask_path)
        log.info("[MATANY] Output directory: %s", out_dir)

        _emit_progress(progress_cb, 0.0, "Initializing MatAnyone processing...")

        try:
            start_time = time.time()

            _emit_progress(progress_cb, 0.1, "Running MatAnyone video matting...")

            # Official file-based API; returns (foreground_path, alpha_path).
            foreground_path, alpha_path = self.processor.process_video(
                input_path=str(video_path),
                mask_path=str(seed_mask_path) if seed_mask_path else None,
                output_path=str(out_dir),
            )

            processing_time = time.time() - start_time
            log.info("[MATANY] Processing completed in %.1fs", processing_time)
            log.info("[MATANY] Foreground output: %s", foreground_path)
            log.info("[MATANY] Alpha output: %s", alpha_path)

            # Convert to Path objects (the API may return None on silent failure).
            fg_path = Path(foreground_path) if foreground_path else None
            al_path = Path(alpha_path) if alpha_path else None

            # Verify outputs exist before declaring success.
            if not fg_path or not fg_path.exists():
                raise MatAnyError(f"Foreground output not created: {fg_path}")
            if not al_path or not al_path.exists():
                raise MatAnyError(f"Alpha output not created: {al_path}")

            _emit_progress(progress_cb, 1.0, "MatAnyone processing complete")

            return al_path, fg_path  # Return (alpha, foreground) to match expected order

        except MatAnyError:
            # BUG FIX: previously our own MatAnyError (e.g. "output not created")
            # was swallowed by the generic handler and re-wrapped, garbling the
            # message. Re-raise it untouched.
            raise
        except Exception as e:
            log.error("[MATANY] Processing failed: %s", e)
            raise MatAnyError(f"MatAnyone processing failed: {e}") from e

        finally:
            _safe_empty_cache()
195
+
196
# ============================================================================
# MatAnyoneModel Wrapper Class for app_hf.py compatibility
# ============================================================================

class MatAnyoneModel:
    """Wrapper class for MatAnyone to match app_hf.py interface"""

    def __init__(self, device="cuda"):
        """Create the wrapper and eagerly load a MatAnyoneSession.

        Args:
            device: Device string passed through to MatAnyoneSession.
        """
        self.device = device
        self.session = None   # MatAnyoneSession once loaded
        self.loaded = False   # True only after a successful _load_model()
        log.info("Initializing MatAnyoneModel on device: %s", device)

        # Initialize the session
        self._load_model()

    def _load_model(self):
        """Load the MatAnyone session; failures are logged and leave loaded=False."""
        try:
            self.session = MatAnyoneSession(device=self.device, precision="auto")
            self.loaded = True
            log.info("MatAnyoneModel loaded successfully")
        except Exception as e:
            log.error("Error loading MatAnyoneModel: %s", e)
            self.loaded = False

    def replace_background(self, video_path, masks, background_path):
        """Replace background in video using MatAnyone.

        Args:
            video_path: Path to the input video.
            masks: Path (str or Path) to the first-frame mask PNG.
            background_path: Background asset; currently unused (compositing TODO).

        Returns:
            str path to the foreground video produced by MatAnyone.

        Raises:
            MatAnyError: if the model is not loaded or processing fails.
        """
        if not self.loaded:
            raise MatAnyError("MatAnyoneModel not loaded")

        try:
            video_path = Path(video_path)

            # We expect masks to be a path to the first-frame mask.
            mask_path = Path(masks) if isinstance(masks, (str, Path)) else None

            # BUG FIX: the previous implementation used
            # tempfile.TemporaryDirectory() as a context manager, which deleted
            # the outputs when the block exited — the returned path was always
            # dangling. Use a persistent directory instead; the caller owns
            # cleanup of the returned file.
            output_dir = Path(tempfile.mkdtemp(prefix="matanyone_"))

            # Process the video stream
            alpha_path, fg_path = self.session.process_stream(
                video_path=video_path,
                seed_mask_path=mask_path,
                out_dir=output_dir,
                progress_cb=None,
            )

            # Return the foreground video path.
            # In a full implementation, you'd composite with the background_path.
            return str(fg_path)

        except MatAnyError:
            raise  # already our error type; don't double-wrap
        except Exception as e:
            log.error("Error in replace_background: %s", e)
            raise MatAnyError(f"Background replacement failed: {e}") from e
256
+
257
# ============================================================================
# Helper function for pipeline integration
# ============================================================================

def create_matanyone_session(device=None):
    """Create a MatAnyone session for use in pipeline"""
    session = MatAnyoneSession(device=device)
    return session
264
+
265
def run_matanyone_on_files(video_path, mask_path, output_dir, device="cuda", progress_callback=None):
    """
    Run MatAnyone on video and mask files.

    Args:
        video_path: Path to input video
        mask_path: Path to first-frame mask PNG (may be None/empty for no seed)
        output_dir: Directory for outputs
        device: Device to use (cuda/cpu)
        progress_callback: Progress callback function

    Returns:
        Tuple of (alpha_path, foreground_path) as strings, or (None, None) on failure
    """
    try:
        seed_mask = Path(mask_path) if mask_path else None
        session = MatAnyoneSession(device=device)
        alpha_out, fg_out = session.process_stream(
            video_path=Path(video_path),
            seed_mask_path=seed_mask,
            out_dir=Path(output_dir),
            progress_cb=progress_callback,
        )
        return str(alpha_out), str(fg_out)
    except Exception as e:
        log.error(f"MatAnyone processing failed: {e}")
        return None, None
VideoBackgroundReplacer2/models/sam2_loader.py ADDED
@@ -0,0 +1,262 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ #!/usr/bin/env python3
2
+ """
3
+ SAM2 Loader with T4-optimized predictor wrapper
4
+ Provides SAM2Predictor class with memory management and optimization features
5
+ """
6
+
7
+ import os
8
+ import gc
9
+ import torch
10
+ import logging
11
+ import numpy as np
12
+ from pathlib import Path
13
+ from typing import Optional, Any, Dict, List, Tuple
14
+
15
+ logger = logging.getLogger(__name__)
16
+
17
class SAM2Predictor:
    """
    T4-optimized SAM2 video predictor wrapper with memory management
    """

    def __init__(self, device: torch.device, model_size: str = "small"):
        # device: torch device inference runs on.
        # model_size: "small" | "base" | "large" (see _download_checkpoint urls).
        self.device = device
        self.model_size = model_size
        self.predictor = None  # set by _load_predictor()
        self.model = None      # underlying module, cached by _optimize_for_t4()
        self._load_predictor()

    def _load_predictor(self):
        """Load SAM2 predictor with optimizations"""
        try:
            from sam2.build_sam import build_sam2_video_predictor

            # Download checkpoint if needed
            checkpoint_path = f"./checkpoints/sam2_hiera_{self.model_size}.pt"
            if not self._ensure_checkpoint(checkpoint_path):
                raise RuntimeError(f"Failed to get SAM2 {self.model_size} checkpoint")

            # Build predictor
            # NOTE(review): for model_size "base" this yields "sam2_hiera_b.yaml",
            # but the checkpoint downloaded below is base_plus, whose official
            # config is "sam2_hiera_b+.yaml" — TODO confirm against the SAM2 repo.
            model_cfg = f"sam2_hiera_{self.model_size[0]}.yaml"  # small -> s, base -> b, large -> l
            self.predictor = build_sam2_video_predictor(model_cfg, checkpoint_path, device=self.device)

            # Apply T4 optimizations
            self._optimize_for_t4()

            logger.info(f"SAM2 {self.model_size} predictor loaded successfully")

        except ImportError as e:
            logger.error(f"SAM2 import failed: {e}")
            raise RuntimeError("SAM2 not available - check third_party/sam2 installation")
        except Exception as e:
            logger.error(f"SAM2 loading failed: {e}")
            raise

    def _ensure_checkpoint(self, checkpoint_path: str) -> bool:
        """Ensure checkpoint exists, download if needed.

        A file under 50MB is treated as a truncated download and replaced.
        Returns True when a plausible checkpoint is present.
        """
        checkpoint_file = Path(checkpoint_path)

        if checkpoint_file.exists():
            file_size = checkpoint_file.stat().st_size / (1024**2)
            if file_size > 50:  # At least 50MB
                logger.info(f"SAM2 checkpoint exists: {file_size:.1f}MB")
                return True
            else:
                logger.warning(f"Checkpoint too small ({file_size:.1f}MB), re-downloading")
                checkpoint_file.unlink()

        return self._download_checkpoint(checkpoint_path)

    def _download_checkpoint(self, checkpoint_path: str, timeout_seconds: int = 600) -> bool:
        """Download SAM2 checkpoint.

        Streams to a ".download" temp file, renames on success, and returns
        False (after removing partial files) on any failure.
        """
        try:
            logger.info(f"Downloading SAM2 {self.model_size} checkpoint...")

            checkpoint_file = Path(checkpoint_path)
            checkpoint_file.parent.mkdir(parents=True, exist_ok=True)

            import requests

            # Checkpoint URLs
            urls = {
                "small": "https://dl.fbaipublicfiles.com/segment_anything_2/072824/sam2_hiera_small.pt",
                "base": "https://dl.fbaipublicfiles.com/segment_anything_2/072824/sam2_hiera_base_plus.pt",
                "large": "https://dl.fbaipublicfiles.com/segment_anything_2/072824/sam2_hiera_large.pt"
            }

            if self.model_size not in urls:
                raise ValueError(f"Unknown model size: {self.model_size}")

            checkpoint_url = urls[self.model_size]

            import time
            start_time = time.time()
            response = requests.get(checkpoint_url, stream=True, timeout=30)
            response.raise_for_status()

            total_size = int(response.headers.get('content-length', 0))

            # Write to a temp name so an interrupted download never looks valid.
            temp_path = checkpoint_file.with_suffix('.download')
            downloaded = 0
            last_log = start_time

            with open(temp_path, 'wb') as f:
                for chunk in response.iter_content(chunk_size=1024*1024):
                    if chunk:
                        f.write(chunk)
                        downloaded += len(chunk)

                        current_time = time.time()
                        # Overall wall-clock timeout for the whole transfer.
                        if current_time - start_time > timeout_seconds:
                            raise TimeoutError(f"Download timeout after {timeout_seconds}s")

                        # Progress logging every 15 seconds
                        if current_time - last_log > 15:
                            progress = (downloaded / total_size * 100) if total_size > 0 else 0
                            speed = downloaded / (current_time - start_time) / (1024**2)
                            logger.info(f"Download: {progress:.1f}% ({speed:.1f}MB/s)")
                            last_log = current_time

            temp_path.rename(checkpoint_file)

            download_time = time.time() - start_time
            speed = downloaded / download_time / (1024**2)
            logger.info(f"Download complete: {downloaded/(1024**2):.1f}MB in {download_time:.1f}s ({speed:.1f}MB/s)")

            return True

        except Exception as e:
            logger.error(f"Checkpoint download failed: {e}")
            # Remove whatever partial file may exist at the final path.
            if Path(checkpoint_path).exists():
                Path(checkpoint_path).unlink()
            return False

    def _optimize_for_t4(self):
        """Apply T4-specific optimizations.

        NOTE(review): .half() is applied regardless of self.device — fp16 on a
        CPU device can fail or be very slow; confirm callers always pass CUDA.
        Failures are logged and swallowed (optimization is best-effort).
        """
        try:
            if hasattr(self.predictor, "model") and self.predictor.model is not None:
                self.model = self.predictor.model

                # Apply fp16 and channels_last for T4 efficiency
                self.model = self.model.half().to(self.device)
                self.model = self.model.to(memory_format=torch.channels_last)

                logger.info("SAM2: fp16 + channels_last applied for T4 optimization")

        except Exception as e:
            logger.warning(f"SAM2 T4 optimization warning: {e}")

    def init_state(self, video_path: str):
        """Initialize video processing state.

        Delegates to the underlying predictor's init_state; re-raises failures
        after logging. Raises RuntimeError if the predictor never loaded.
        """
        if self.predictor is None:
            raise RuntimeError("Predictor not loaded")

        try:
            return self.predictor.init_state(video_path=video_path)
        except Exception as e:
            logger.error(f"Failed to initialize video state: {e}")
            raise

    def add_new_points(self, inference_state, frame_idx: int, obj_id: int,
                       points: np.ndarray, labels: np.ndarray):
        """Add new points for tracking.

        Thin pass-through to the predictor's add_new_points; logs and
        re-raises any failure.
        """
        if self.predictor is None:
            raise RuntimeError("Predictor not loaded")

        try:
            return self.predictor.add_new_points(
                inference_state=inference_state,
                frame_idx=frame_idx,
                obj_id=obj_id,
                points=points,
                labels=labels
            )
        except Exception as e:
            logger.error(f"Failed to add new points: {e}")
            raise

    def propagate_in_video(self, inference_state, scale: float = 1.0, **kwargs):
        """Propagate through video with optional scaling.

        NOTE(review): the `scale` parameter is currently unused — it is not
        forwarded to the predictor. Kept for interface compatibility; confirm
        whether downscaled propagation was intended here.
        """
        if self.predictor is None:
            raise RuntimeError("Predictor not loaded")

        try:
            # Use the predictor's propagate_in_video method
            return self.predictor.propagate_in_video(inference_state, **kwargs)
        except Exception as e:
            logger.error(f"Failed to propagate in video: {e}")
            raise

    def prune_state(self, inference_state, keep: int):
        """Prune SAM2 state to keep only recent frames in memory.

        Best-effort heuristic over undocumented SAM2 internals; every step is
        guarded and failures are only logged at debug level.
        """
        try:
            # Try to access and prune internal caches
            # This is model-specific and may need adjustment based on SAM2 internals
            if hasattr(inference_state, 'cached_features'):
                # Keep only the most recent 'keep' frames
                # (assumes dict insertion order reflects frame recency — TODO confirm)
                cached_keys = list(inference_state.cached_features.keys())
                if len(cached_keys) > keep:
                    keys_to_remove = cached_keys[:-keep]
                    for key in keys_to_remove:
                        if key in inference_state.cached_features:
                            del inference_state.cached_features[key]
                    logger.debug(f"Pruned {len(keys_to_remove)} old cached features")

            # Clear other potential caches
            if hasattr(inference_state, 'point_inputs_per_obj'):
                # Keep recent point inputs only
                for obj_id in list(inference_state.point_inputs_per_obj.keys()):
                    obj_inputs = inference_state.point_inputs_per_obj[obj_id]
                    if len(obj_inputs) > keep:
                        # Keep only recent entries
                        recent_keys = sorted(obj_inputs.keys())[-keep:]
                        new_inputs = {k: obj_inputs[k] for k in recent_keys}
                        inference_state.point_inputs_per_obj[obj_id] = new_inputs

            # Force garbage collection
            torch.cuda.empty_cache() if self.device.type == 'cuda' else None

        except Exception as e:
            logger.debug(f"State pruning warning: {e}")

    def clear_memory(self):
        """Clear GPU memory aggressively (empty_cache + sync + ipc_collect + gc)."""
        try:
            if self.device.type == 'cuda':
                torch.cuda.empty_cache()
                torch.cuda.synchronize()
                torch.cuda.ipc_collect()
            gc.collect()
        except Exception as e:
            logger.warning(f"Memory clearing warning: {e}")

    def get_memory_usage(self) -> Dict[str, float]:
        """Get current memory usage statistics.

        Returns allocated/reserved/free (and total, when available) in GiB;
        zeros on CPU or on any CUDA query failure.
        """
        if self.device.type != 'cuda':
            return {"allocated_gb": 0.0, "reserved_gb": 0.0, "free_gb": 0.0}

        try:
            allocated = torch.cuda.memory_allocated(self.device) / (1024**3)
            reserved = torch.cuda.memory_reserved(self.device) / (1024**3)
            free, total = torch.cuda.mem_get_info(self.device)
            free_gb = free / (1024**3)

            return {
                "allocated_gb": allocated,
                "reserved_gb": reserved,
                "free_gb": free_gb,
                "total_gb": total / (1024**3)
            }
        except Exception:
            return {"allocated_gb": 0.0, "reserved_gb": 0.0, "free_gb": 0.0}

    def __del__(self):
        """Cleanup on deletion.

        Deliberately swallows all exceptions — interpreter shutdown may have
        already torn down torch/logging when this runs.
        """
        try:
            if hasattr(self, 'predictor') and self.predictor is not None:
                del self.predictor
            if hasattr(self, 'model') and self.model is not None:
                del self.model
            self.clear_memory()
        except Exception:
            pass
VideoBackgroundReplacer2/pipeline.py ADDED
@@ -0,0 +1,477 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ #!/usr/bin/env python3
2
+ """
3
+ pipeline.py β€” Production SAM2 + MatAnyone (T4-optimized, single-pass streaming)
4
+
5
+ Key features
6
+ ------------
7
+ - One SAM2 inference state for the entire video (no per-chunk reinit).
8
+ - In-stream pipeline: Read β†’ SAM2 β†’ MatAnyone β†’ Compose β†’ Write (no big RAM dicts).
9
+ - Bounded memory everywhere (deque/window); optional CPU spill.
10
+ - fp16 + channels_last on SAM2; mixed precision blocks.
11
+ - VRAM-aware controller adjusts memory window/scale.
12
+ - Heartbeat logger to prevent HF watchdog restarts.
13
+ - Safer FFmpeg audio re-mux.
14
+
15
+ Compatible with Tesla T4 (β‰ˆ15–16 GB) and PyTorch 2.5.x + CUDA 12.4 wheels.
16
+ """
17
+
18
+ import os
19
+ import gc
20
+ import cv2
21
+ import time
22
+ import uuid
23
+ import torch
24
+ import queue
25
+ import shutil
26
+ import logging
27
+ import tempfile
28
+ import subprocess
29
+ import threading
30
+ import numpy as np
31
+ from PIL import Image
32
+ from pathlib import Path
33
+ from typing import Optional, Tuple, Dict, Any, Callable
34
+ from collections import deque
35
+
36
# ----------------------------------------------------------------------------------------------------------------------
# Logging
# ----------------------------------------------------------------------------------------------------------------------
logger = logging.getLogger("backgroundfx_pro")
if not logger.handlers:
    # Attach a single stream handler only once, even across re-imports.
    _stream_handler = logging.StreamHandler()
    _stream_handler.setFormatter(logging.Formatter("[%(asctime)s] %(levelname)s:%(name)s: %(message)s"))
    logger.addHandler(_stream_handler)
    logger.setLevel(logging.INFO)
45
+
46
# ----------------------------------------------------------------------------------------------------------------------
# Environment & Torch tuning for T4
# ----------------------------------------------------------------------------------------------------------------------
def setup_t4_environment():
    """Configure allocator env vars and torch backend flags for T4 inference."""
    env_defaults = {
        "PYTORCH_CUDA_ALLOC_CONF":
            "expandable_segments:True,max_split_size_mb:256,garbage_collection_threshold:0.7",
        "OMP_NUM_THREADS": "1",
        "OPENBLAS_NUM_THREADS": "1",
        "MKL_NUM_THREADS": "1",
        "OPENCV_OPENCL_RUNTIME": "disabled",
        "OPENCV_IO_ENABLE_OPENEXR": "0",
    }
    for key, value in env_defaults.items():
        os.environ.setdefault(key, value)

    # Inference only — no autograd anywhere in the pipeline.
    torch.set_grad_enabled(False)
    try:
        torch.backends.cudnn.benchmark = True
        torch.backends.cuda.matmul.allow_tf32 = True
        torch.backends.cudnn.allow_tf32 = True
        torch.set_float32_matmul_precision("high")
    except Exception:
        pass  # older torch builds may lack some of these knobs

    if torch.cuda.is_available():
        try:
            frac = float(os.getenv("CUDA_MEMORY_FRACTION", "0.88"))
            torch.cuda.set_per_process_memory_fraction(frac)
            logger.info(f"CUDA per-process memory fraction = {frac:.2f}")
        except Exception as e:
            logger.warning(f"Could not set CUDA memory fraction: {e}")
74
+
75
def vram_gb() -> Tuple[float, float]:
    """Return (free_gb, total_gb) of CUDA memory; (0.0, 0.0) without CUDA."""
    if not torch.cuda.is_available():
        return 0.0, 0.0
    free_bytes, total_bytes = torch.cuda.mem_get_info()
    gib = 1024 ** 3
    return free_bytes / gib, total_bytes / gib
80
+
81
# ----------------------------------------------------------------------------------------------------------------------
# Heartbeat (prevents Spaces watchdog killing the job)
# ----------------------------------------------------------------------------------------------------------------------
def heartbeat_monitor(running_flag: Dict[str, bool], interval: float = 8.0):
    """Print a heartbeat line every *interval* seconds while running_flag['running'] is True."""
    while True:
        if not running_flag.get("running", False):
            break
        print(f"[HB] t={int(time.time())}", flush=True)
        time.sleep(interval)
88
+
89
# ----------------------------------------------------------------------------------------------------------------------
# Streaming video I/O
# ----------------------------------------------------------------------------------------------------------------------
class StreamingVideoIO:
    """Context manager pairing a cv2 video reader with a same-size mp4 writer."""

    def __init__(self, video_path: str, out_path: str, fps: float):
        self.video_path = video_path
        self.out_path = out_path
        self.fps = fps
        self.cap = None      # cv2.VideoCapture, opened in __enter__
        self.writer = None   # cv2.VideoWriter, opened in __enter__
        self.size = None     # (width, height) of the source

    def __enter__(self):
        capture = cv2.VideoCapture(self.video_path)
        if not capture.isOpened():
            raise RuntimeError(f"Cannot open video: {self.video_path}")
        width = int(capture.get(cv2.CAP_PROP_FRAME_WIDTH))
        height = int(capture.get(cv2.CAP_PROP_FRAME_HEIGHT))
        self.cap = capture
        self.size = (width, height)
        codec = cv2.VideoWriter_fourcc(*'mp4v')
        self.writer = cv2.VideoWriter(self.out_path, codec, self.fps, (width, height))
        return self

    def __exit__(self, exc_type, exc_val, exc_tb):
        # Release both handles regardless of how the block exited.
        if self.cap:
            self.cap.release()
        if self.writer:
            self.writer.release()

    def read_frame(self):
        """Return (ok, frame_bgr); (False, None) when the capture is not open."""
        if not self.cap:
            return False, None
        return self.cap.read()

    def write_frame(self, frame_bgr: np.ndarray):
        """Write one BGR frame; silently no-op when the writer is not open."""
        if not self.writer:
            return
        self.writer.write(frame_bgr)
127
+
128
# ----------------------------------------------------------------------------------------------------------------------
# Models: loaders and safe optimizations
# ----------------------------------------------------------------------------------------------------------------------
def load_sam2_predictor(device: torch.device):
    """
    Prefer your local wrapper to keep interfaces stable.
    """
    try:
        from models.sam2_loader import SAM2Predictor  # your wrapper
        predictor = SAM2Predictor(device=device)
        # Optional: try to access underlying model to set fp16 + channels_last
        try:
            inner_model = getattr(predictor, "model", None)
            if inner_model is not None:
                inner_model = inner_model.half().to(device)
                predictor.model = inner_model.to(memory_format=torch.channels_last)
                logger.info("SAM2: fp16 + channels_last applied (wrapper model).")
        except Exception as e:
            logger.warning(f"SAM2 fp16 optimization warning: {e}")
        return predictor
    except Exception as e:
        logger.error(f"Failed to import SAM2Predictor: {e}")
        raise
150
+
151
def load_matany_session(device: torch.device):
    """
    Supports either MatAnyoneSession or MatAnyoneLoader (your code has varied).
    """
    try:
        try:
            from models.matanyone_loader import MatAnyoneSession as _MatAny
        except Exception:
            from models.matanyone_loader import MatAnyoneLoader as _MatAny
        session = _MatAny(device=device)
        # Try fp16 eval where safe
        if getattr(session, "model", None) is not None:
            session.model.eval()
            try:
                session.model = session.model.half().to(device)
                logger.info("MatAnyone: fp16 + eval applied.")
            except Exception:
                logger.info("MatAnyone: using fp32 (fp16 not supported for some layers).")
        return session
    except Exception as e:
        logger.warning(f"MatAnyone not available ({e}). Proceeding without refinement.")
        return None
173
+
174
# ----------------------------------------------------------------------------------------------------------------------
# SAM2 state pruning (adapter): we call predictor.prune_state if present, else best-effort
# ----------------------------------------------------------------------------------------------------------------------
def prune_sam2_state(predictor, state: Any, keep: int):
    """
    Try to prune SAM2 temporal caches to a fixed window length.
    Your SAM2Predictor should implement prune_state(state, keep=N). If not, we do nothing.
    """
    try:
        if hasattr(predictor, "prune_state"):
            predictor.prune_state(state, keep=keep)
        elif hasattr(state, "prune") and callable(getattr(state, "prune")):
            state.prune(keep=keep)
        # Otherwise: no-op; rely on model internals and GC.
    except Exception as exc:
        logger.debug(f"SAM2 prune_state warning: {exc}")
192
+
193
# ----------------------------------------------------------------------------------------------------------------------
# VRAM-aware controller
# ----------------------------------------------------------------------------------------------------------------------
class VRAMAdaptiveController:
    """Tunes SAM2 state window, propagation scale and cleanup cadence to free VRAM."""

    def __init__(self):
        # frames to keep in model state
        self.memory_window = int(os.getenv("SAM2_WINDOW", "96"))
        # e.g., downscale factor for propagation
        self.propagation_scale = float(os.getenv("SAM2_PROP_SCALE", "0.90"))
        self.cleanup_every = 20  # frames

    def adapt(self):
        """Tighten limits when free VRAM dips under ~1.6 GB; relax above 3 GB."""
        free, total = vram_gb()
        if free == 0.0:
            return  # CPU-only (or query failed): nothing to adapt
        if free < 1.6:
            # Tighten: smaller window/scale, clean up more often.
            self.memory_window = max(48, self.memory_window - 8)
            self.propagation_scale = max(0.75, self.propagation_scale - 0.03)
            self.cleanup_every = max(12, self.cleanup_every - 2)
            logger.warning(f"Low VRAM ({free:.2f} GB free) β†’ window={self.memory_window}, scale={self.propagation_scale:.2f}")
        elif free > 3.0:
            # Relax: allow a larger window and less frequent cleanup.
            self.memory_window = min(128, self.memory_window + 4)
            self.propagation_scale = min(1.0, self.propagation_scale + 0.01)
            self.cleanup_every = min(40, self.cleanup_every + 2)
217
+
218
# ----------------------------------------------------------------------------------------------------------------------
# Audio mux helper (safer stream mapping)
# ----------------------------------------------------------------------------------------------------------------------
def mux_audio(video_path_no_audio: str, source_with_audio: str, out_path: str) -> bool:
    """Copy the video stream from one file and the audio from another into out_path; True on success."""
    cmd = [
        "ffmpeg", "-y", "-hide_banner", "-loglevel", "error",
        "-i", video_path_no_audio,
        "-i", source_with_audio,
        # Explicit stream mapping: video from input 0, audio from input 1.
        "-map", "0:v:0", "-map", "1:a:0",
        "-c:v", "copy", "-c:a", "aac", "-shortest",
        out_path,
    ]
    try:
        result = subprocess.run(cmd, capture_output=True, text=True, timeout=180)
    except Exception as e:
        logger.warning(f"FFmpeg mux error: {e}")
        return False
    if result.returncode != 0:
        logger.warning(f"FFmpeg mux failed: {result.stderr.strip()}")
        return False
    return True
239
+
240
+ # ----------------------------------------------------------------------------------------------------------------------
241
+ # Main processing
242
+ # ----------------------------------------------------------------------------------------------------------------------
243
def process(
    video_path: str,
    background_image: Optional[Image.Image] = None,
    background_type: str = "custom",
    background_prompt: str = "",
    job_directory: Optional[Path] = None,
    progress_callback: Optional[Callable[[str, float], None]] = None
) -> str:
    """
    Production SAM2 + MatAnyone pipeline for T4.
    - Single-pass streaming (no large mask dicts)
    - Bounded memory windows

    Args:
        video_path: path to the input video file.
        background_image: replacement background (required; resized to video size).
        background_type / background_prompt: accepted but not used in this body.
        job_directory: working dir for outputs; auto-created under ./tmp if None.
        progress_callback: optional (step, fraction) reporter; errors are swallowed.

    Returns:
        Path to the final video (with audio if muxing succeeded, else raw composite).

    Raises:
        FileNotFoundError: input video missing.
        RuntimeError: OpenCV cannot open the video.
        ValueError: no background image supplied.
    """
    setup_t4_environment()
    device = torch.device("cuda" if torch.cuda.is_available() else "cpu")

    # Heartbeat: daemon thread logs liveness every 8s while hb_flag["running"].
    # NOTE(review): hb_flag is only cleared on the happy path and early
    # validation failures — an exception mid-pipeline leaves the (daemon)
    # heartbeat running until process exit.
    hb_flag = {"running": True}
    hb_thread = threading.Thread(target=heartbeat_monitor, args=(hb_flag, 8.0), daemon=True)
    hb_thread.start()

    def report(step: str, p: Optional[float] = None):
        # Log locally, then forward to the caller's callback (best-effort).
        if p is None:
            logger.info(step)
        else:
            logger.info(f"{step} [{p:.1%}]")
        if progress_callback:
            try:
                progress_callback(step, p)
            except Exception as e:
                logger.debug(f"progress_callback error: {e}")

    # Validate I/O
    src = Path(video_path)
    if not src.exists():
        hb_flag["running"] = False
        raise FileNotFoundError(f"Video not found: {video_path}")

    if job_directory is None:
        job_directory = Path.cwd() / "tmp" / f"job_{uuid.uuid4().hex[:8]}"
    job_directory.mkdir(parents=True, exist_ok=True)

    # Probe video geometry/frame-rate once, then release the capture.
    cap_probe = cv2.VideoCapture(str(src))
    if not cap_probe.isOpened():
        hb_flag["running"] = False
        raise RuntimeError(f"Cannot open video: {video_path}")
    fps = cap_probe.get(cv2.CAP_PROP_FPS) or 25.0  # containers may report 0
    width = int(cap_probe.get(cv2.CAP_PROP_FRAME_WIDTH))
    height = int(cap_probe.get(cv2.CAP_PROP_FRAME_HEIGHT))
    frame_count = int(cap_probe.get(cv2.CAP_PROP_FRAME_COUNT))
    duration = frame_count / fps if fps > 0 else 0.0
    cap_probe.release()
    logger.info(f"Video: {width}x{height} @ {fps:.2f} fps | {frame_count} frames ({duration:.1f}s)")

    # Prepare background: resize once to frame size, keep as float32 RGB.
    if background_image is None:
        hb_flag["running"] = False
        raise ValueError("background_image is required")
    bg = background_image.resize((width, height), Image.LANCZOS)
    bg_np = np.array(bg).astype(np.float32)

    # Load models
    report("Loading SAM2 + MatAnyone", 0.05)
    predictor = load_sam2_predictor(device)
    matany = load_matany_session(device)

    # Init SAM2 state (single)
    report("Initializing SAM2 video state", 0.08)
    state = predictor.init_state(video_path=str(src))

    # Minimal prompt: single positive point at center (replace with your prompt UI if needed)
    center_pt = np.array([[width // 2, height // 2]], dtype=np.float32)
    labels = np.array([1], dtype=np.int32)
    ann_obj_id = 1
    with torch.inference_mode():
        _ = predictor.add_new_points(
            inference_state=state,
            frame_idx=0,
            obj_id=ann_obj_id,
            points=center_pt,
            labels=labels,
        )

    # Controller
    ctrl = VRAMAdaptiveController()

    # Output paths
    out_raw = str(job_directory / f"composite_{int(time.time())}.mp4")
    out_final = str(job_directory / f"final_{int(time.time())}.mp4")

    # Windows/buffers (bounded)
    # For completeness we keep a tiny deque for any auxiliary temporal ops (e.g., matting history)
    aux_window = deque(maxlen=max(32, min(96, ctrl.memory_window // 2)))

    # Stream processing
    start = time.time()
    frames_done = 0
    next_cleanup_at = ctrl.cleanup_every

    report("Streaming: SAM2 → MatAnyone → Compose → Write", 0.12)
    with StreamingVideoIO(str(src), out_raw, fps) as vio:
        # iterate SAM2 propagation alongside reading frames
        # NOTE(review): torch.autocast(device_type="cuda") is entered even on
        # CPU-only hosts (dtype=None) — confirm this is a no-op in the target
        # torch build rather than an error.
        with torch.inference_mode(), torch.autocast(device_type="cuda", dtype=torch.float16 if device.type == "cuda" else None):
            # NOTE(review): `scale=` is not a kwarg of stock SAM2
            # propagate_in_video — confirm the project wrapper accepts it.
            for out_frame_idx, out_obj_ids, out_mask_logits in predictor.propagate_in_video(state, scale=ctrl.propagation_scale):
                # Read the matching frame
                ret, frame_bgr = vio.read_frame()
                if not ret:
                    break

                # Get mask for ann_obj_id; keep on GPU as long as possible
                mask_t = None
                try:
                    if isinstance(out_obj_ids, torch.Tensor):
                        # find index where id == ann_obj_id
                        idxs = (out_obj_ids == ann_obj_id).nonzero(as_tuple=False)
                        if idxs.numel() > 0:
                            i = idxs[0].item()
                            logits = out_mask_logits[i]
                        else:
                            logits = None
                    else:
                        # list/array fallback
                        ids_list = list(out_obj_ids)
                        i = ids_list.index(ann_obj_id) if ann_obj_id in ids_list else -1
                        logits = out_mask_logits[i] if i >= 0 else None

                    if logits is not None:
                        # logits → prob → binary mask (threshold 0)
                        mask_t = (logits > 0).float()  # HxW on CUDA fp16 → fp32 float
                except Exception as e:
                    logger.debug(f"Mask extraction warning @frame {out_frame_idx}: {e}")
                    mask_t = None

                # Optional: MatAnyone refinement
                if mask_t is not None and matany is not None:
                    try:
                        # MatAnyone APIs vary — try common forms
                        # Convert RGB because many mattors expect RGB
                        frame_rgb = cv2.cvtColor(frame_bgr, cv2.COLOR_BGR2RGB)
                        # Move frame to GPU only if your matting backend supports it
                        refined = None
                        if hasattr(matany, "refine_mask"):
                            refined = matany.refine_mask(frame_rgb, mask_t)  # allow handler to decide device
                        elif hasattr(matany, "process_frame"):
                            refined = matany.process_frame(frame_rgb, mask_t)
                        if refined is not None:
                            # ensure float mask 0..1 on CUDA or CPU
                            if isinstance(refined, torch.Tensor):
                                mask_t = refined.float()
                            else:
                                # numpy → torch
                                mask_t = torch.from_numpy(refined.astype(np.float32))
                                if device.type == "cuda":
                                    mask_t = mask_t.to(device)
                    except Exception as e:
                        logger.debug(f"MatAnyone refinement failed (frame {out_frame_idx}): {e}")

                # Compose and write (convert once, keep math sane)
                if mask_t is not None:
                    # bring mask to CPU for np composition; keep as float [0,1]
                    # NOTE(review): composition assumes the mask resolution
                    # matches the frame — confirm when propagation_scale < 1.0.
                    mask_np = mask_t.detach().clamp(0, 1).to("cpu", non_blocking=True).float().numpy()
                    m3 = mask_np[..., None]  # HxWx1
                    frame_rgb = cv2.cvtColor(frame_bgr, cv2.COLOR_BGR2RGB).astype(np.float32)
                    comp = frame_rgb * m3 + bg_np * (1.0 - m3)
                    comp_bgr = cv2.cvtColor(comp.astype(np.uint8), cv2.COLOR_RGB2BGR)
                    vio.write_frame(comp_bgr)
                else:
                    # No mask — write original frame
                    vio.write_frame(frame_bgr)

                # Periodic maintenance
                frames_done += 1
                if frames_done >= next_cleanup_at:
                    ctrl.adapt()
                    prune_sam2_state(predictor, state, keep=ctrl.memory_window)
                    # Clear small aux buffers
                    aux_window.clear()
                    if device.type == "cuda":
                        torch.cuda.ipc_collect()
                        torch.cuda.empty_cache()
                    next_cleanup_at = frames_done + ctrl.cleanup_every

                # Progress
                if frames_done % 25 == 0 and frame_count > 0:
                    p = 0.12 + 0.75 * (frames_done / frame_count)
                    report(f"Processing frame {frames_done}/{frame_count} | win={ctrl.memory_window} scale={ctrl.propagation_scale:.2f}", p)

    # Audio mux
    report("Restoring audio", 0.93)
    ok = mux_audio(out_raw, str(src), out_final)
    final_path = out_final if ok else out_raw

    # Cleanup models/state promptly
    try:
        del predictor
        del state
        if matany is not None:
            del matany
    except Exception:
        pass

    if device.type == "cuda":
        torch.cuda.ipc_collect()
        torch.cuda.empty_cache()
    gc.collect()

    hb_flag["running"] = False
    elapsed = time.time() - start
    try:
        peak = torch.cuda.max_memory_allocated() / (1024 ** 3) if device.type == "cuda" else 0.0
        logger.info(f"Peak GPU memory: {peak:.2f} GB")
    except Exception:
        pass
    report(f"Done in {elapsed:.1f}s", 1.0)
    logger.info(f"Output: {final_path}")
    logger.info(f"Artifacts: {job_directory}")
    return final_path
461
+
462
+
463
+ # -------------------------------------------------------------------------------------------------
464
+ # CLI entry (optional)
465
+ # -------------------------------------------------------------------------------------------------
466
if __name__ == "__main__":
    import argparse

    # Minimal command-line front end around process().
    cli = argparse.ArgumentParser(description="BackgroundFX Pro pipeline")
    cli.add_argument("--video", required=True, help="Path to input video")
    cli.add_argument("--background", required=True, help="Path to background image")
    cli.add_argument("--outdir", default=None, help="Job directory (optional)")
    ns = cli.parse_args()

    background = Image.open(ns.background).convert("RGB")
    job_dir = Path(ns.outdir) if ns.outdir else None
    print(process(ns.video, background_image=background, job_directory=job_dir))
VideoBackgroundReplacer2/requirements.txt ADDED
@@ -0,0 +1,72 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ # ===== Core Dependencies =====
2
+ # PyTorch is installed in Dockerfile with CUDA 12.1 β€” REQUIRED for SAM2
3
+ # torch==2.5.1
4
+ # torchvision==0.20.1
5
+ # torchaudio==2.5.1
6
+
7
+ # ===== Base Dependencies =====
8
+ numpy>=1.24.0,<2.1.0
9
+ Pillow>=10.0.0,<12.0.0
10
+ protobuf>=4.25.0,<6.0.0
11
+
12
+ # ===== Image/Video Processing =====
13
+ opencv-python-headless>=4.8.0,<4.11.0
14
+ imageio>=2.25.0,<3.0.0
15
+ imageio-ffmpeg>=0.4.7,<0.6.0
16
+ moviepy>=1.0.3,<2.0.0
17
+ decord>=0.6.0,<0.7.0
18
+ scikit-image>=0.19.3,<0.22.0
19
+
20
+ # ===== MediaPipe =====
21
+ mediapipe>=0.10.0,<0.11.0
22
+
23
+ # ===== SAM2 Dependencies =====
24
+ # SAM2 is installed via git clone in Dockerfile
25
+ hydra-core>=1.3.2,<2.0.0
26
+ omegaconf>=2.3.0,<3.0.0
27
+ einops>=0.6.0,<0.9.0
28
+ timm>=0.9.0,<1.1.0
29
+ pyyaml>=6.0.0,<7.0.0
30
+ matplotlib>=3.5.0,<4.0.0
31
+ iopath>=0.1.10,<0.2.0
32
+
33
+ # ===== MatAnyone Dependencies =====
34
+ # MatAnyone is installed separately in Dockerfile
35
+ kornia>=0.7.0,<0.8.0
36
+ tqdm>=4.60.0,<5.0.0
37
+
38
+ # ===== UI and API =====
39
+ # Bump to avoid gradio_client 1.3.0 bug ("bool is not iterable")
40
+ gradio==4.42.0
41
+
42
+ # ===== Web stack pins for Gradio 4.42.0 =====
43
+ fastapi==0.109.2
44
+ starlette==0.36.3
45
+ uvicorn==0.29.0
46
+ httpx==0.27.2
47
+ anyio==4.4.0
48
+ orjson>=3.10.0
49
+
50
+ # ===== Pydantic family (avoid breaking core 2.23.x) =====
51
+ pydantic==2.8.2
52
+ pydantic-core==2.20.1
53
+ annotated-types==0.6.0
54
+ typing-extensions==4.12.2
55
+
56
+ # ===== Helpers and Utilities =====
57
+ huggingface-hub>=0.20.0,<1.0.0
58
+ ffmpeg-python>=0.2.0,<1.0.0
59
+ psutil>=5.8.0,<7.0.0
60
+ requests>=2.25.0,<3.0.0
61
+ scikit-learn>=1.3.0,<2.0.0
62
+
63
+ # ===== Additional Dependencies =====
64
+ # Performance and monitoring
65
+ gputil>=1.4.0,<2.0.0
66
+ nvidia-ml-py3>=7.352.0,<12.0.0
67
+
68
+ # Error handling and logging
69
+ loguru>=0.6.0,<1.0.0
70
+
71
+ # File handling
72
+ python-multipart>=0.0.5,<1.0.0
VideoBackgroundReplacer2/two_stage_pipeline.py ADDED
@@ -0,0 +1,388 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ #!/usr/bin/env python3
2
+ """
3
+ two_stage_pipeline.py β€” Ephemeral SAM2 stage + MatAnyone stage
4
+ - Stage 1: SAM2 -> lossless mask stream (FFV1 .mkv) + meta.json, then unload SAM2
5
+ - Stage 2: read mask stream -> (optional) MatAnyone refine -> composite -> mux audio
6
+ """
7
+
8
+ import os, sys, gc, json, cv2, time, uuid, torch, shutil, logging, subprocess, threading
9
+ import numpy as np
10
+ from pathlib import Path
11
+ from typing import Optional, Callable, Tuple, Dict, Any
12
+ from PIL import Image
13
+
14
+ logger = logging.getLogger("backgroundfx_pro.two_stage")
15
+ if not logger.handlers:
16
+ h = logging.StreamHandler()
17
+ h.setFormatter(logging.Formatter("[%(asctime)s] %(levelname)s:%(name)s: %(message)s"))
18
+ logger.addHandler(h)
19
+ logger.setLevel(logging.INFO)
20
+
21
+ # ---------------------------
22
+ # Env & CUDA helpers
23
+ # ---------------------------
24
def setup_env():
    """One-time runtime hygiene: CUDA allocator hints, single-threaded BLAS,
    inference-only PyTorch with TF32 enabled, and a capped CUDA memory fraction.
    """
    env_defaults = {
        "PYTORCH_CUDA_ALLOC_CONF": "expandable_segments:True,max_split_size_mb:256,garbage_collection_threshold:0.7",
        "OMP_NUM_THREADS": "1",
        "OPENBLAS_NUM_THREADS": "1",
        "MKL_NUM_THREADS": "1",
    }
    for key, value in env_defaults.items():
        os.environ.setdefault(key, value)  # operator-provided values win
    torch.set_grad_enabled(False)  # this module never trains
    try:
        torch.backends.cudnn.benchmark = True
        torch.backends.cuda.matmul.allow_tf32 = True
        torch.backends.cudnn.allow_tf32 = True
        torch.set_float32_matmul_precision("high")
    except Exception:
        pass  # older torch builds may lack some of these switches
    if torch.cuda.is_available():
        try:
            torch.cuda.set_per_process_memory_fraction(float(os.getenv("CUDA_MEMORY_FRACTION", "0.88")))
        except Exception:
            pass
42
+
43
def free_cuda():
    """Release cached CUDA allocations; no-op on CPU-only hosts."""
    if not torch.cuda.is_available():
        return
    torch.cuda.ipc_collect()
    torch.cuda.empty_cache()
47
+
48
def unload_sam2_modules():
    """Aggressively drop every imported `sam2*` module to reduce RSS.

    Safe to call even if SAM2 was never imported; failures are logged,
    never raised.
    """
    try:
        import importlib
        stale = [name for name in list(sys.modules) if name.startswith("sam2")]
        for name in stale:
            sys.modules.pop(name, None)
        importlib.invalidate_caches()
        gc.collect()
        free_cuda()
        logger.info("SAM2 modules unloaded.")
    except Exception as e:
        logger.warning(f"Unloading SAM2 modules: {e}")
61
+
62
+ # ---------------------------
63
+ # Video probing
64
+ # ---------------------------
65
def probe_video(path: str) -> Tuple[int, int, float, int]:
    """Return (width, height, fps, frame_count) for a video file.

    Raises RuntimeError if OpenCV cannot open the file; fps falls back to
    25.0 when the container reports 0/unknown.
    """
    capture = cv2.VideoCapture(path)
    if not capture.isOpened():
        raise RuntimeError(f"Cannot open video: {path}")
    frame_rate = capture.get(cv2.CAP_PROP_FPS) or 25.0
    width = int(capture.get(cv2.CAP_PROP_FRAME_WIDTH))
    height = int(capture.get(cv2.CAP_PROP_FRAME_HEIGHT))
    count = int(capture.get(cv2.CAP_PROP_FRAME_COUNT))
    capture.release()
    return width, height, float(frame_rate), count
75
+
76
+ # ---------------------------
77
+ # FFmpeg mask writers/readers
78
+ # ---------------------------
79
class MaskFFV1Writer:
    """Stream uint8 grayscale masks into a lossless FFV1 .mkv via an ffmpeg pipe.

    Usage:
        with MaskFFV1Writer(path, w, h, fps) as wr:
            wr.write(mask_u8)   # HxW uint8, 0/255

    The ffmpeg child consumes raw `gray` frames on stdin; `-g 1` makes every
    frame an intra frame so the stream stays per-frame seekable.
    """
    def __init__(self, path:str, w:int, h:int, fps:float):
        self.path = path
        self.w, self.h, self.fps = w,h,fps
        self.proc = None  # ffmpeg Popen handle, created in __enter__

    def __enter__(self):
        cmd = [
            "ffmpeg","-y","-hide_banner","-loglevel","error",
            "-f","rawvideo","-pix_fmt","gray","-s",f"{self.w}x{self.h}","-r",f"{self.fps}",
            "-i","-",
            "-c:v","ffv1","-level","3","-g","1", self.path
        ]
        self.proc = subprocess.Popen(cmd, stdin=subprocess.PIPE)
        return self

    def write(self, mask_u8: np.ndarray):
        """Write one HxW mask frame (values 0/255 expected).

        Fix: the previous code only converted dtype; ascontiguousarray
        normalizes dtype AND memory layout (e.g. sliced/transposed views)
        in one call, copying only when necessary.
        """
        mask_u8 = np.ascontiguousarray(mask_u8, dtype=np.uint8)
        self.proc.stdin.write(mask_u8.tobytes())

    def __exit__(self, exc_type, exc, tb):
        if self.proc:
            try:
                # Close stdin so ffmpeg sees EOF, then wait for encoding to finish.
                self.proc.stdin.flush()
                self.proc.stdin.close()
                self.proc.wait(timeout=120)
            except Exception:
                self.proc.kill()
110
+
111
class MaskFFV1Reader:
    """Decode an FFV1 mask stream back into raw HxW uint8 frames via ffmpeg."""
    def __init__(self, path:str, w:int, h:int):
        self.path = path
        self.w, self.h = w, h
        self.proc = None
        self.frame_bytes = w * h  # one gray8 frame

    def __enter__(self):
        cmd = [
            "ffmpeg","-hide_banner","-loglevel","error","-i", self.path,
            "-f","rawvideo","-pix_fmt","gray","-"
        ]
        self.proc = subprocess.Popen(cmd, stdout=subprocess.PIPE)
        return self

    def read(self) -> Optional[np.ndarray]:
        """Return the next mask frame, or None at end-of-stream / short read."""
        raw = self.proc.stdout.read(self.frame_bytes)
        if not raw or len(raw) < self.frame_bytes:
            return None
        return np.frombuffer(raw, dtype=np.uint8).reshape(self.h, self.w)

    def __exit__(self, exc_type, exc, tb):
        if self.proc:
            try:
                self.proc.stdout.close()
                self.proc.wait(timeout=30)
            except Exception:
                self.proc.kill()
140
+
141
+ # Fallback: PNG sequence (disk heavy but simple & robust)
142
class MaskPNGWriter:
    """Fallback mask sink: one zero-padded PNG per frame (disk heavy, robust)."""
    def __init__(self, dirpath: Path):
        self.dir = dirpath
        self.dir.mkdir(parents=True, exist_ok=True)
        self.idx = 0  # next frame index

    def write(self, mask_u8: np.ndarray):
        cv2.imwrite(str(self.dir / f"{self.idx:06d}.png"), mask_u8)
        self.idx += 1
148
+
149
class MaskPNGReader:
    """Reads back the PNG sequence written by MaskPNGWriter, in order."""
    def __init__(self, dirpath: Path):
        self.dir = dirpath
        self.idx = 0

    def read(self) -> Optional[np.ndarray]:
        """Return the next grayscale mask, or None once the sequence ends."""
        frame_path = self.dir / f"{self.idx:06d}.png"
        if not frame_path.exists():
            return None
        image = cv2.imread(str(frame_path), cv2.IMREAD_GRAYSCALE)
        self.idx += 1
        return image
158
+
159
+ # ---------------------------
160
+ # Stage 1 β€” SAM2 β†’ mask dump
161
+ # ---------------------------
162
def stage1_dump_masks(video_path:str, out_dir:Path, obj_point:Tuple[int,int]=None) -> Dict[str,Any]:
    """
    Run only SAM2, save masks as FFV1 (preferred) or PNG sequence + meta.json.
    Returns meta dict.

    Args:
        video_path: input video file.
        out_dir: directory receiving mask.mkv (or masks_png/) and meta.json.
        obj_point: (x, y) positive prompt; defaults to the frame center.

    Returns:
        meta dict with keys: video, width, height, fps, frames, storage
        ("ffv1" or "png") and mask_path.

    Side effects: SAM2 is loaded for this call and fully unloaded afterwards
    (free_cuda + unload_sam2_modules) so Stage 2 starts with a clean GPU.
    """
    setup_env()
    device = torch.device("cuda" if torch.cuda.is_available() else "cpu")
    w,h,fps,n = probe_video(video_path)
    out_dir.mkdir(parents=True, exist_ok=True)
    meta = {"video":video_path, "width":w,"height":h,"fps":fps,"frames":n, "storage":None}
    logger.info(f"[Stage1] {w}x{h}@{fps:.2f} | frames={n}")

    # Load SAM2 (your wrapper)
    from models.sam2_loader import SAM2Predictor
    predictor = SAM2Predictor(device=device)
    state = predictor.init_state(video_path=video_path)

    # Prompt: center positive if not provided
    if obj_point is None:
        obj_point = (w//2, h//2)
    pts = np.array([[obj_point[0], obj_point[1]]], dtype=np.float32)
    labels = np.array([1], dtype=np.int32)
    ann_obj_id = 1
    with torch.inference_mode():
        predictor.add_new_points(state, 0, ann_obj_id, pts, labels)

    # Preferred: FFV1 mask stream
    # NOTE(review): torch.autocast("cuda") is entered even on CPU-only hosts
    # (dtype=None) — confirm this is a no-op in the target torch build.
    mask_mkv = out_dir / "mask.mkv"
    use_png = False  # NOTE(review): dead variable — the PNG fallback is driven by the except branch below
    try:
        with MaskFFV1Writer(str(mask_mkv), w, h, fps) as writer, \
             torch.inference_mode(), torch.autocast("cuda", dtype=torch.float16 if device.type=="cuda" else None):
            for _, out_ids, out_logits in predictor.propagate_in_video(state):
                # pick ann_obj_id
                i = None
                if isinstance(out_ids, torch.Tensor):
                    nz = (out_ids == ann_obj_id).nonzero(as_tuple=False)
                    if nz.numel() > 0: i = nz[0].item()
                else:
                    ids = list(out_ids); i = ids.index(ann_obj_id) if ann_obj_id in ids else None
                if i is None:
                    # write empty
                    writer.write(np.zeros((h,w), np.uint8))
                    continue
                mask = (out_logits[i] > 0).detach()
                mask_u8 = (mask.float().mul_(255).to("cpu", non_blocking=True).numpy()).astype(np.uint8)
                writer.write(mask_u8)
        meta["storage"] = "ffv1"
        meta["mask_path"] = str(mask_mkv)
        logger.info("[Stage1] Masks saved as FFV1 .mkv")
    except Exception as e:
        # Disk-heavy but dependency-free fallback when the ffmpeg pipe fails.
        logger.warning(f"FFV1 writer failed ({e}), falling back to PNG sequence.")
        png_dir = out_dir / "masks_png"
        wr = MaskPNGWriter(png_dir)
        with torch.inference_mode(), torch.autocast("cuda", dtype=torch.float16 if device.type=="cuda" else None):
            for _, out_ids, out_logits in predictor.propagate_in_video(state):
                i = None
                if isinstance(out_ids, torch.Tensor):
                    nz = (out_ids == ann_obj_id).nonzero(as_tuple=False)
                    if nz.numel() > 0: i = nz[0].item()
                else:
                    ids = list(out_ids); i = ids.index(ann_obj_id) if ann_obj_id in ids else None
                if i is None:
                    wr.write(np.zeros((h,w), np.uint8)); continue
                mask = (out_logits[i] > 0).detach()
                wr.write((mask.float().mul_(255).to("cpu").numpy()).astype(np.uint8))
        meta["storage"] = "png"
        meta["mask_path"] = str(png_dir)

    # Persist meta
    with open(out_dir / "meta.json","w") as f:
        json.dump(meta, f)
    # Unload SAM2 completely
    del predictor, state
    free_cuda(); unload_sam2_modules()
    return meta
238
+
239
+ # ---------------------------
240
+ # Stage 2 β€” refine + compose
241
+ # ---------------------------
242
def stage2_refine_and_compose(video_path:str, mask_dir:Path, background_image:Image.Image,
                              out_path:str, use_matany:bool=True) -> str:
    """Read the Stage-1 mask stream, optionally refine each mask with
    MatAnyone, composite the background, and mux the original audio back in.

    Args:
        video_path: original input video (also the audio source).
        mask_dir: Stage-1 output dir containing meta.json + mask stream.
        background_image: replacement background; resized to video size.
        out_path: desired final video path.
        use_matany: attempt MatAnyone refinement when a loader is importable.

    Returns:
        Path to the final video (audio-less composite if muxing failed).
    """
    w,h,fps,n = probe_video(video_path)
    bg = background_image.resize((w,h), Image.LANCZOS)
    bg_np = np.array(bg).astype(np.float32)

    # Read meta
    with open(mask_dir / "meta.json","r") as f:
        meta = json.load(f)
    storage = meta["storage"]; mask_path = meta["mask_path"]

    # Optional MatAnyone — loader class name has varied across versions, so
    # try both; refinement is skipped entirely when neither imports.
    session = None
    if use_matany:
        try:
            from models.matanyone_loader import MatAnyoneSession as _M
        except Exception:
            try:
                from models.matanyone_loader import MatAnyoneLoader as _M
            except Exception:
                _M = None
        if _M:
            session = _M(device=torch.device("cuda" if torch.cuda.is_available() else "cpu"))
            if hasattr(session,"model") and session.model is not None:
                session.model.eval()

    # Open video + writer (write to a .noaudio temp, mux audio at the end)
    cap = cv2.VideoCapture(video_path)
    fourcc = cv2.VideoWriter_fourcc(*"mp4v")
    tmp_out = str(Path(out_path).with_suffix(".noaudio.mp4"))
    writer = cv2.VideoWriter(tmp_out, fourcc, fps, (w,h))

    # Open mask reader (FFV1 pipe preferred; PNG sequence fallback)
    if storage == "ffv1":
        mreader = MaskFFV1Reader(mask_path, w, h)
        mreader.__enter__()
        read_mask = lambda : mreader.read()
    else:
        mreader = MaskPNGReader(Path(mask_path))
        read_mask = lambda : mreader.read()

    i = 0
    try:
        while True:
            ok, frame_bgr = cap.read()
            if not ok: break
            mask_u8 = read_mask()
            if mask_u8 is None:
                # out of masks; write original
                writer.write(frame_bgr); i+=1; continue

            # Optional refine
            if session is not None:
                try:
                    frame_rgb = cv2.cvtColor(frame_bgr, cv2.COLOR_BGR2RGB)
                    # Provide a float mask 0..1 to session; adapt if your API differs
                    mask_f = (mask_u8.astype(np.float32) / 255.0)
                    if hasattr(session,"refine_mask"):
                        mask_refined = session.refine_mask(frame_rgb, mask_f)
                    elif hasattr(session,"process_frame"):
                        mask_refined = session.process_frame(frame_rgb, mask_f)
                    else:
                        mask_refined = mask_f
                    # Normalize whatever the backend returned back to uint8 0..255.
                    if isinstance(mask_refined, torch.Tensor):
                        mask_u8 = (mask_refined.detach().clamp(0,1).mul(255).to("cpu").numpy()).astype(np.uint8)
                    elif isinstance(mask_refined, np.ndarray):
                        mask_u8 = (np.clip(mask_refined,0,1)*255).astype(np.uint8)
                except Exception as e:
                    # Refinement is best-effort; fall back to the raw SAM2 mask.
                    logger.debug(f"MatAnyone refine failed @frame {i}: {e}")

            # Composite: alpha-blend frame over background in float RGB.
            # NOTE(review): assumes mask dimensions equal the frame's — holds
            # when Stage 1 wrote full-resolution masks; confirm otherwise.
            m = (mask_u8.astype(np.float32)/255.0)[...,None]  # HxWx1
            fr = cv2.cvtColor(frame_bgr, cv2.COLOR_BGR2RGB).astype(np.float32)
            comp = fr*m + bg_np*(1.0-m)
            comp_bgr = cv2.cvtColor(comp.astype(np.uint8), cv2.COLOR_RGB2BGR)
            writer.write(comp_bgr)

            if i % 50 == 0:
                logger.info(f"[Stage2] frame {i}/{n}")
            i += 1
    finally:
        # Release in this order: capture, writer, then the ffmpeg mask pipe.
        cap.release(); writer.release()
        if isinstance(mreader, MaskFFV1Reader):
            mreader.__exit__(None,None,None)

    # Mux audio; on any failure keep the audio-less composite as the result.
    final_out = str(Path(out_path))
    cmd = [
        "ffmpeg","-y","-hide_banner","-loglevel","error",
        "-i", tmp_out, "-i", video_path,
        "-map","0:v:0","-map","1:a:0","-c:v","copy","-c:a","aac","-shortest", final_out
    ]
    try:
        r = subprocess.run(cmd, capture_output=True, text=True, timeout=180)
        if r.returncode != 0:
            logger.warning(f"Audio mux failed: {r.stderr.strip()}")
            shutil.move(tmp_out, final_out)
        else:
            os.remove(tmp_out)
    except Exception:
        shutil.move(tmp_out, final_out)
    return final_out
344
+
345
+ # ---------------------------
346
+ # Orchestrator
347
+ # ---------------------------
348
def process_two_stage(
    video_path:str,
    background_image: Image.Image,
    workdir: Optional[Path]=None,
    progress: Optional[Callable[[str,float],None]] = None,
    use_matany: bool = True,
) -> str:
    """Orchestrate the two-stage pipeline.

    Stage 1 runs SAM2 alone and dumps a lossless mask stream (SAM2 is then
    fully unloaded); Stage 2 optionally refines with MatAnyone, composites
    the background, and restores the original audio.

    Returns the path to the final video.
    """
    setup_env()
    if workdir is None:
        workdir = Path.cwd()/ "tmp" / f"job_{uuid.uuid4().hex[:8]}"
    workdir.mkdir(parents=True, exist_ok=True)

    def tick(message: str, fraction: float):
        # Best-effort progress reporting; no-op when no callback given.
        if progress:
            progress(message, fraction)

    # Stage 1: SAM2-only mask pass.
    tick("Stage 1: SAM2 mask pass", 0.05)
    mask_dir = workdir / "sam2_masks"
    meta = stage1_dump_masks(video_path, mask_dir)
    tick("Stage 1 complete", 0.45)

    # Stage 2: refine + composite + audio.
    tick("Stage 2: refine + compose", 0.50)
    out_path = workdir / f"final_{int(time.time())}.mp4"
    final_video = stage2_refine_and_compose(video_path, mask_dir, background_image, str(out_path), use_matany=use_matany)
    tick("Done", 1.0)
    logger.info(f"Output: {final_video}")
    return final_video
373
+
374
+ # ---------------------------
375
+ # CLI
376
+ # ---------------------------
377
if __name__ == "__main__":
    import argparse

    # Thin CLI around process_two_stage().
    cli = argparse.ArgumentParser(description="Two-stage BackgroundFX Pro")
    cli.add_argument("--video", required=True)
    cli.add_argument("--background", required=True)
    cli.add_argument("--outdir", default=None)
    cli.add_argument("--no-matany", action="store_true")
    ns = cli.parse_args()

    background = Image.open(ns.background).convert("RGB")
    result = process_two_stage(
        ns.video,
        background,
        Path(ns.outdir) if ns.outdir else None,
        use_matany=not ns.no_matany,
    )
    print(result)
VideoBackgroundReplacer2/ui.py ADDED
@@ -0,0 +1,140 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ #!/usr/bin/env python3
2
+ """
3
+ BackgroundFX Pro β€” Main UI Application (Gradio 4.42.x)
4
+ Clean, focused main file that coordinates the application
5
+ """
6
+
7
+ # ============================================================
8
+ # Mount-mode handoff: delegate to app.py when enabled
9
+ # (So we can serve a safe /config JSON via our FastAPI shim)
10
+ # ============================================================
11
import os, runpy
# When mount mode is enabled, app.py owns the server (a FastAPI shim that
# serves a safe /config JSON); run it and exit before this module does
# anything else.
if os.getenv("GRADIO_MOUNT_MODE") == "1":
    runpy.run_module("app", run_name="__main__")
    raise SystemExit
15
+
16
+ # ==== Runtime hygiene & paths (very high in file) ====
17
+ import sys
18
+ import logging
19
+ from pathlib import Path
20
+
21
+ # --- Sanitize OMP/BLAS threads early (avoids "libgomp: Invalid value..." issues)
22
+ def _sanitize_omp_env():
23
+ import multiprocessing as _mp
24
+ cpu = max(1, _mp.cpu_count())
25
+ default_omp = max(1, cpu // 2)
26
+
27
+ raw = os.environ.get("OMP_NUM_THREADS", "").strip()
28
+ try:
29
+ n = int(raw)
30
+ if n <= 0 or n > cpu * 2:
31
+ raise ValueError
32
+ omp_val = n
33
+ except Exception:
34
+ omp_val = default_omp
35
+ os.environ["OMP_NUM_THREADS"] = str(omp_val)
36
+
37
+ os.environ.setdefault("OPENBLAS_NUM_THREADS", "1")
38
+ os.environ.setdefault("MKL_NUM_THREADS", "1")
39
+ os.environ.setdefault("NUMEXPR_NUM_THREADS", "1")
40
+
41
+ _sanitize_omp_env()
42
+
43
# Stable app dirs (avoid /tmp surprises on HF)
APP_ROOT = Path(__file__).resolve().parent  # repo root for this app
DATA_ROOT = APP_ROOT / "data"               # persistent data
TMP_ROOT = APP_ROOT / "tmp"                 # scratch space
JOB_ROOT = TMP_ROOT / "backgroundfx_jobs"   # per-job working dirs
for p in (DATA_ROOT, TMP_ROOT, JOB_ROOT):
    p.mkdir(parents=True, exist_ok=True)

# Keep model/caches local to repo volume
# (setdefault so an operator-provided HF_HOME/TORCH_HOME still wins)
os.environ.setdefault("HF_HOME", str(APP_ROOT / ".hf"))
os.environ.setdefault("TORCH_HOME", str(APP_ROOT / ".torch"))
Path(os.environ["HF_HOME"]).mkdir(parents=True, exist_ok=True)
Path(os.environ["TORCH_HOME"]).mkdir(parents=True, exist_ok=True)

# Make Gradio a bit quieter / safer in Spaces
os.environ.setdefault("GRADIO_ANALYTICS_ENABLED", "False")
59
+
60
+ # Standard imports (after env is sane)
61
+ import torch
62
+ import gradio as gr
63
+
64
+ # Import our modules
65
+ from ui_core_functionality import startup_probe, logger
66
+ from ui_core_interface import create_interface
67
+
68
+ # Optional: patch a Gradio client util to tolerate boolean JSON Schemas
69
# Optional: patch a Gradio client util to tolerate boolean JSON Schemas
def _patch_gradio_client_bool_schema():
    """Monkey-patch gradio_client so boolean JSON Schemas (bare true/false)
    don't crash type resolution (known gradio_client 1.3.x bug).

    Best-effort: logs a warning and continues if the internals have changed.
    """
    try:
        import gradio_client.utils as _gc_utils  # type: ignore

        def _tolerant(fn):
            # A bare boolean schema means "anything" (true) / "nothing" (false).
            def _safe(schema, *rest):
                if isinstance(schema, bool):
                    return "Any" if schema else "None"
                return fn(schema, *rest)
            return _safe

        _gc_utils.get_type = _tolerant(_gc_utils.get_type)  # type: ignore[attr-defined]
        if hasattr(_gc_utils, "_json_schema_to_python_type"):
            _gc_utils._json_schema_to_python_type = _tolerant(
                _gc_utils._json_schema_to_python_type  # type: ignore[attr-defined]
            )

        logger.info("🩹 Patched gradio_client.utils to handle boolean JSON Schemas.")
    except Exception as e:
        logger.warning("Could not patch gradio_client boolean schema handling: %s", e)

_patch_gradio_client_bool_schema()
94
+
95
+ # =======================================================================
96
+ # MAIN APPLICATION
97
+ # =======================================================================
98
+
99
def main():
    """Main application entry point.

    Probes the environment, builds the Gradio interface, and serves it on
    the port the host provides (HF Spaces sets PORT; falls back to 7860).
    Re-raises on startup failure so the process exits non-zero.
    """
    try:
        startup_probe()

        logger.info("🚀 Launching Gradio interface...")
        logger.info(
            "Gradio=%s | torch=%s | cu=%s | cuda_available=%s",
            getattr(gr, "__version__", "?"),
            torch.__version__,
            getattr(torch.version, "cuda", None),
            torch.cuda.is_available(),
        )

        demo = create_interface()

        # Gradio 4.x: keep queue small to avoid RAM spikes (no concurrency_count here)
        demo.queue(max_size=2)

        # Port from env (HF sets PORT)
        port = int(os.environ.get("PORT", os.environ.get("GRADIO_SERVER_PORT", "7860")))

        demo.launch(
            server_name="0.0.0.0",
            server_port=port,
            # Fix: was `False if in_space else False` — a tautology. Never use
            # share=True here: on Spaces it triggers an frpc download / 500s,
            # and locally the app is already reachable on the bound port.
            share=False,
            show_api=False,   # safer on public Spaces
            show_error=True,
            quiet=True,
            debug=False,
            max_threads=1     # worker threads; per-listener concurrency set in ui_core_interface.py
        )

    except Exception as e:
        logger.error("❌ Application startup failed: %s", e)
        raise
138
+
139
if __name__ == "__main__":
    main()  # run the Gradio app when executed directly (python ui.py)
VideoBackgroundReplacer2/ui_core_functionality.py ADDED
@@ -0,0 +1,662 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ #!/usr/bin/env python3
2
+ """
3
+ BackgroundFX Pro β€” Core Functionality
4
+ All processing logic, utilities, background generators, and handlers
5
+ Enhanced with file safety, robust logging, and runtime diagnostics.
6
+ """
7
+
8
+ import os
9
+ import sys
10
+ import io
11
+ import gc
12
+ import time
13
+ import json
14
+ import uuid
15
+ import shutil
16
+ import logging
17
+ import tempfile
18
+ import requests
19
+ import threading
20
+ import traceback
21
+ import subprocess
22
+ from datetime import datetime
23
+ from concurrent.futures import ThreadPoolExecutor
24
+ from typing import Optional, Tuple, List, Dict, Any, Union, Callable
25
+ from pathlib import Path
26
+
27
+ import torch
28
+ import numpy as np
29
+ from PIL import Image, ImageDraw, ImageFont
30
+ import cv2
31
+
32
+ # ==============================================================================
33
+ # PATHS & ENV
34
+ # ==============================================================================
35
+
36
# Repo root (…/app)
APP_ROOT = Path(__file__).resolve().parent
DATA_ROOT = APP_ROOT / "data"
TMP_ROOT = APP_ROOT / "tmp"
JOB_ROOT = TMP_ROOT / "backgroundfx_jobs"

# Create every directory the app writes to, up front (fail fast on perms).
for p in (
    DATA_ROOT,
    TMP_ROOT,
    JOB_ROOT,
    APP_ROOT / ".hf",
    APP_ROOT / ".torch",
    APP_ROOT / "checkpoints",
    APP_ROOT / "models",
    APP_ROOT / "utils",
):
    p.mkdir(parents=True, exist_ok=True)

# Cache dirs (stable on Spaces)
os.environ.setdefault("HF_HOME", str(APP_ROOT / ".hf"))
os.environ.setdefault("TORCH_HOME", str(APP_ROOT / ".torch"))

# Quiet BLAS/OpenMP spam (in case ui.py wasn't first).
# Force OMP_NUM_THREADS to a sane numeric value when unset or malformed;
# after this branch the variable is always a digit string, so the redundant
# setdefault that used to follow has been removed.
if not os.environ.get("OMP_NUM_THREADS", "").isdigit():
    os.environ["OMP_NUM_THREADS"] = "4"
os.environ.setdefault("OPENBLAS_NUM_THREADS", "1")
os.environ.setdefault("MKL_NUM_THREADS", "1")
os.environ.setdefault("NUMEXPR_NUM_THREADS", "1")
os.environ.setdefault("PYTHONFAULTHANDLER", "1")
66
+
67
# ==============================================================================
# LOGGING + DIAGNOSTICS (console + file + heartbeat)
# ==============================================================================

# Line-buffer logs so Space UI shows them promptly.
# reconfigure() exists on Python 3.7+ text streams; wrapped because some
# hosts replace stdout/stderr with objects that lack it.
try:
    sys.stdout.reconfigure(line_buffering=True)
    sys.stderr.reconfigure(line_buffering=True)
except Exception:
    pass

# Log to both the console and a persistent file under DATA_ROOT.
# force=True tears down any handlers installed by earlier imports so this
# configuration always wins.
LOG_FILE = DATA_ROOT / "run.log"
logging.basicConfig(
    level=logging.INFO,
    format="%(asctime)s | %(levelname)s | %(message)s",
    handlers=[logging.StreamHandler(sys.stdout),
              logging.FileHandler(LOG_FILE, encoding="utf-8")],
    force=True,
)
logger = logging.getLogger("bgfx")

# Faulthandler (native crashes -> stacks). SIGUSR1 registration lets an
# operator dump all-thread stacks on demand; guarded because the signal is
# absent on Windows.
try:
    import faulthandler, signal  # type: ignore
    faulthandler.enable(all_threads=True)
    if hasattr(signal, "SIGUSR1"):
        faulthandler.register(signal.SIGUSR1, file=sys.stderr, all_threads=True)
except Exception as e:
    logger.warning("faulthandler setup skipped: %s", e)
96
+
97
+ def _disk_stats(p: Path) -> str:
98
+ try:
99
+ total, used, free = shutil.disk_usage(str(p))
100
+ mb = lambda x: x // (1024 * 1024)
101
+ return f"disk(total={mb(total)}MB, used={mb(used)}MB, free={mb(free)}MB)"
102
+ except Exception:
103
+ return "disk(n/a)"
104
+
105
def _cgroup_limit_bytes():
    """Return the container memory limit in bytes, or None when unknown.

    Checks the cgroup v2 file first, then the v1 file; a value of "max"
    (v2's "unlimited") or an unreadable file yields None.
    """
    candidate_files = (
        "/sys/fs/cgroup/memory.max",                      # cgroup v2
        "/sys/fs/cgroup/memory/memory.limit_in_bytes",    # cgroup v1
    )
    for candidate in candidate_files:
        try:
            raw = Path(candidate).read_text().strip()
            if raw and raw != "max":
                return int(raw)
        except Exception:
            continue
    return None
113
+
114
def _rss_bytes():
    """Return this process's resident-set size in bytes (Linux), else None.

    Parses the VmRSS line of /proc/self/status, which reports kilobytes.
    """
    try:
        status_text = Path("/proc/self/status").read_text()
        for entry in status_text.splitlines():
            if entry.startswith("VmRSS:"):
                kilobytes = int(entry.split()[1])
                return kilobytes * 1024
    except Exception:
        return None
    return None
121
+
122
def _heartbeat():
    """Log RSS / memory-limit / disk stats every 2 seconds, forever.

    Runs as a daemon thread (started below) so a hard kill leaves a trail of
    the last known memory state — useful for diagnosing OOM kills on Spaces.
    The cgroup limit is read once; RSS and disk are re-sampled each tick.
    """
    lim = _cgroup_limit_bytes()
    while True:
        rss = _rss_bytes()
        logger.info(
            "HEARTBEAT | rss=%s MB | limit=%s MB | %s",
            # Render "n/a" when the probe returned None (non-Linux, etc.).
            f"{rss//2**20}" if rss else "n/a",
            f"{lim//2**20}" if lim else "n/a",
            _disk_stats(APP_ROOT),
        )
        time.sleep(2)
133
+
134
# Start heartbeat as a daemon thread (only once). Daemon=True means the
# thread never blocks interpreter shutdown.
try:
    threading.Thread(target=_heartbeat, name="heartbeat", daemon=True).start()
except Exception as e:
    logger.warning("heartbeat skipped: %s", e)

import atexit

@atexit.register
def _on_exit():
    # Marker log for clean interpreter shutdown; its absence in the logs
    # indicates the process was killed without running atexit hooks.
    logger.info("PROCESS EXITING (atexit) β€” if you don't see this, it was a hard kill (OOM/SIGKILL)")
144
+
145
+ # ==============================================================================
146
+ # STARTUP VALIDATION
147
+ # ==============================================================================
148
+
149
def startup_probe():
    """Comprehensive startup probe - validates system readiness.

    Performs, in order: a write/read round-trip under TMP_ROOT, a Torch/GPU
    capability report, creation of required directories, a job-isolation
    write test under JOB_ROOT, and an environment summary. Raises
    RuntimeError (chained to the original error) on any failure so callers
    abort before serving traffic.

    NOTE(review): the probes use `assert`, which is stripped under `python -O`;
    in that mode the read-back checks silently vanish.
    """
    try:
        logger.info("πŸš€ BACKGROUNDFX PRO STARTUP PROBE")
        logger.info("πŸ“ Working directory: %s", os.getcwd())
        logger.info("🐍 Python executable: %s", sys.executable)

        # Write probe (fail fast if not writable)
        probe_file = TMP_ROOT / "startup_probe.txt"
        probe_file.write_text("startup_test_ok", encoding="utf-8")
        assert probe_file.read_text(encoding="utf-8") == "startup_test_ok"
        logger.info("βœ… WRITE PROBE OK: %s | %s", probe_file, _disk_stats(APP_ROOT))
        probe_file.unlink(missing_ok=True)

        # GPU/Torch status — informational only; failures here do not abort.
        try:
            logger.info("πŸ”§ Torch=%s | cu=%s | cuda_available=%s",
                        torch.__version__, getattr(torch.version, "cuda", None), torch.cuda.is_available())
            if torch.cuda.is_available():
                gpu_count = torch.cuda.device_count()
                name = torch.cuda.get_device_name(0) if gpu_count else "Unknown"
                vram_gb = torch.cuda.get_device_properties(0).total_memory / (1024**3) if gpu_count else 0
                logger.info("πŸ”₯ GPU Available: %s (%d device(s)) β€” VRAM %.1f GB", name, gpu_count, vram_gb)
            else:
                logger.warning("⚠️ No GPU available β€” using CPU")
        except Exception as e:
            logger.warning("⚠️ Torch check failed: %s", e)

        # Directory verification (and creation if missing)
        for d in ("checkpoints", "models", "utils"):
            dp = APP_ROOT / d
            dp.mkdir(parents=True, exist_ok=True)
            logger.info("βœ… Directory %s: %s", d, dp)

        # Job dir isolation test: prove per-job directories can be created,
        # written, read back, and removed.
        test_job = JOB_ROOT / "startup_test_job"
        test_job.mkdir(parents=True, exist_ok=True)
        tfile = test_job / "test.tmp"
        tfile.write_text("job_isolation_test")
        assert tfile.read_text() == "job_isolation_test"
        logger.info("βœ… Job isolation directory ready: %s", JOB_ROOT)
        shutil.rmtree(test_job, ignore_errors=True)

        # Env summary
        logger.info("🌍 Env: OMP_NUM_THREADS=%s | HF_HOME=%s | TORCH_HOME=%s",
                    os.environ.get("OMP_NUM_THREADS", "unset"),
                    os.environ.get("HF_HOME", "default"),
                    os.environ.get("TORCH_HOME", "default"))

        logger.info("🎯 Startup probe completed β€” system ready!")

    except Exception as e:
        logger.error("❌ STARTUP PROBE FAILED: %s", e)
        logger.error("πŸ“Š %s", _disk_stats(APP_ROOT))
        raise RuntimeError(f"Startup probe failed β€” system not ready: {e}") from e
204
+
205
+ # ==============================================================================
206
+ # FILE SAFETY UTILITIES
207
+ # ==============================================================================
208
+
209
def new_tmp_path(suffix: str) -> Path:
    """Return a collision-free path under TMP_ROOT ending with *suffix*."""
    unique = uuid.uuid4().hex
    return TMP_ROOT / (unique + suffix)
212
+
213
def atomic_write_bytes(dst: Path, data: bytes):
    """Atomically replace *dst* with *data*.

    The temp file is created in dst's own directory so Path.replace() is a
    same-filesystem rename (atomic on POSIX). The previous version staged the
    temp file under TMP_ROOT, which breaks atomicity — and replace() itself —
    whenever *dst* lives on a different mount.

    Raises whatever the underlying write/replace raises; the partial file is
    removed (best effort) on failure.
    """
    tmp = dst.with_name(f".{dst.name}.{uuid.uuid4().hex}.part")
    try:
        with open(tmp, "wb") as f:
            f.write(data)
        tmp.replace(dst)  # atomic within one filesystem
        logger.debug("βœ… Atomic write: %s", dst)
    except Exception:
        tmp.unlink(missing_ok=True)  # best-effort cleanup of the partial file
        raise  # bare raise preserves the original traceback (was `raise e`)
225
+
226
def safe_name(name: str, default="file") -> str:
    """Sanitize a filename to prevent traversal/unicode issues.

    Runs of characters outside [A-Za-z0-9._-] collapse to a single
    underscore; the result is capped at 120 characters and falls back to
    *default* when the input is empty or sanitizes to nothing.
    """
    import re
    cleaned = re.sub(r"[^A-Za-z0-9._-]+", "_", name or default)
    return cleaned[:120] or default
231
+
232
def place_uploaded(in_path: str, sub="uploads") -> Path:
    """Copy an uploaded file into DATA_ROOT/<sub> under a sanitized name.

    Returns the destination path inside the app-controlled area.
    """
    dest_dir = DATA_ROOT / sub
    dest_dir.mkdir(exist_ok=True, parents=True)
    dest = dest_dir / safe_name(Path(in_path).name)
    shutil.copy2(in_path, dest)
    logger.info("πŸ“ Uploaded file placed: %s", dest)
    return dest
240
+
241
def tmp_video_path(ext=".mp4") -> Path:
    """Fresh temporary path for a video file (default .mp4)."""
    return new_tmp_path(ext)

def tmp_image_path(ext=".png") -> Path:
    """Fresh temporary path for an image file (default .png)."""
    return new_tmp_path(ext)
246
+
247
def run_safely(fn: Callable, *args, **kwargs):
    """Call *fn* and return its result; on failure, log rich diagnostics
    (traceback, working dirs, disk stats, env/torch versions) and re-raise.
    """
    try:
        return fn(*args, **kwargs)
    except Exception:
        # Full traceback first, then environment context for post-mortems.
        logger.error("PROCESSING FAILED\n%s", traceback.format_exc())
        logger.error("CWD=%s | DATA_ROOT=%s | TMP_ROOT=%s | %s",
                     os.getcwd(), DATA_ROOT, TMP_ROOT, _disk_stats(APP_ROOT))
        try:
            logger.error("Env: OMP_NUM_THREADS=%s | CUDA=%s | torch=%s | cu=%s",
                         os.environ.get("OMP_NUM_THREADS"),
                         os.environ.get("CUDA_VISIBLE_DEVICES", "default"),
                         torch.__version__,
                         getattr(torch.version, "cuda", None))
        except Exception:
            # Diagnostics must never mask the original failure.
            pass
        raise
264
+
265
+ # ==============================================================================
266
+ # SYSTEM UTILITIES
267
+ # ==============================================================================
268
+
269
def get_device():
    """Return torch.device('cuda') when a GPU is available, else CPU."""
    if torch.cuda.is_available():
        return torch.device("cuda")
    return torch.device("cpu")
272
+
273
def clear_gpu_memory():
    """Aggressive GPU memory cleanup.

    Empties the CUDA caching allocator and synchronizes when a GPU is
    present, then triggers a Python GC pass. Never raises — cleanup
    failures are only logged.

    NOTE(review): original indentation was lost in transit; this reading
    runs gc.collect() unconditionally (also on CPU-only hosts) — confirm
    against the canonical source.
    """
    try:
        if torch.cuda.is_available():
            torch.cuda.empty_cache()
            torch.cuda.synchronize()
        gc.collect()
        logger.info("🧹 GPU memory cleared")
    except Exception as e:
        logger.warning("GPU cleanup warning: %s", e)
283
+
284
def safe_file_operation(operation: Callable, *args, max_retries: int = 3, **kwargs):
    """Run a flaky file operation with linear back-off retries.

    Sleeps 0.1s, 0.2s, ... between attempts. After *max_retries* failures
    the last exception is re-raised.
    """
    last_error = None
    for attempt_no in range(1, max_retries + 1):
        try:
            return operation(*args, **kwargs)
        except Exception as exc:
            last_error = exc
            if attempt_no < max_retries:
                time.sleep(0.1 * attempt_no)
                logger.warning("File op retry %d: %s", attempt_no, exc)
            else:
                logger.error("File op failed after %d attempts: %s", max_retries, exc)
                raise last_error
298
+
299
+ # ==============================================================================
300
+ # BACKGROUND GENERATORS
301
+ # ==============================================================================
302
+
303
def generate_ai_background(prompt: str, width: int, height: int) -> Image.Image:
    """Generate AI-like background using prompt cues (procedural).

    Not a real generative model: keyword matching on *prompt* selects one of
    several vertical color ramps (city/beach/forest/space/desert), a default
    pastel shade otherwise. Uniform noise in [-15, 15) is added per channel
    for texture. Falls back to a sunset gradient on any error.
    """
    try:
        logger.info("Generating AI background: '%s' (%dx%d)", prompt, width, height)
        img = np.zeros((height, width, 3), dtype=np.uint8)
        prompt_lower = prompt.lower()

        # Each branch interpolates per-row from a top color toward a bottom
        # color; i/height < 1 for all rows, so the ramp endpoints stay in range.
        if any(w in prompt_lower for w in ('city', 'urban', 'futuristic', 'cyberpunk')):
            # Dark blue urban dusk: (20,30,60) -> toward (100,130,180)
            for i in range(height):
                r = int(20 + 80 * (i / height))
                g = int(30 + 100 * (i / height))
                b = int(60 + 120 * (i / height))
                img[i, :] = [r, g, b]
        elif any(w in prompt_lower for w in ('beach', 'tropical', 'ocean', 'sea')):
            # Sky-blue toward near-white sand tones.
            for i in range(height):
                r = int(135 + 120 * (i / height))
                g = int(206 + 49 * (i / height))
                b = int(235 + 20 * (i / height))
                img[i, :] = [r, g, b]
        elif any(w in prompt_lower for w in ('forest', 'jungle', 'nature', 'green')):
            # Forest green toward earthy brown; blue channel decreases, so
            # clamp at 0 via max().
            for i in range(height):
                r = int(34 + 105 * (i / height))
                g = int(139 + 30 * (i / height))
                b = int(34 - 15 * (i / height))
                img[i, :] = [max(0, r), max(0, g), max(0, b)]
        elif any(w in prompt_lower for w in ('space', 'galaxy', 'stars', 'cosmic')):
            # Near-black toward deep violet.
            for i in range(height):
                r = int(10 + 50 * (i / height))
                g = int(0 + 30 * (i / height))
                b = int(30 + 100 * (i / height))
                img[i, :] = [r, g, b]
        elif any(w in prompt_lower for w in ('desert', 'sand', 'canyon')):
            # Sandy tones brightening downward; clamp at 255 via min().
            for i in range(height):
                r = int(238 + 17 * (i / height))
                g = int(203 + 52 * (i / height))
                b = int(173 + 82 * (i / height))
                img[i, :] = [min(255, r), min(255, g), min(255, b)]
        else:
            # Default: pastel picked deterministically by prompt length,
            # darkened up to 30% toward the bottom.
            colors = [(255, 182, 193), (255, 218, 185), (176, 224, 230)]
            color = colors[len(prompt) % len(colors)]
            for i in range(height):
                t = 1 - (i / height) * 0.3
                img[i, :] = [int(color[0] * t), int(color[1] * t), int(color[2] * t)]

        # Add grain; widen to int16 before adding so the clip is correct.
        noise = np.random.randint(-15, 15, (height, width, 3))
        img = np.clip(img.astype(np.int16) + noise, 0, 255).astype(np.uint8)
        return Image.fromarray(img)

    except Exception as e:
        logger.warning("AI background generation failed: %s β€” using fallback", e)
        return create_gradient_background("sunset", width, height)
354
+
355
def create_gradient_background(gradient_type: str, width: int, height: int) -> Image.Image:
    """Vertical two-color gradient image; unknown types yield flat mid-gray."""
    canvas = np.zeros((height, width, 3), dtype=np.uint8)
    presets = {
        "sunset": [(255, 165, 0), (128, 64, 128)],
        "ocean": [(0, 100, 255), (30, 144, 255)],
        "forest": [(34, 139, 34), (139, 69, 19)],
        "sky": [(135, 206, 235), (206, 235, 255)],
    }
    preset = presets.get(gradient_type)
    if preset is None:
        canvas.fill(128)
        return Image.fromarray(canvas)
    top, bottom = preset
    for row in range(height):
        # Linear interpolation from the top color to the bottom color.
        t = row / height
        canvas[row, :] = [
            int(top[0] * (1 - t) + bottom[0] * t),
            int(top[1] * (1 - t) + bottom[1] * t),
            int(top[2] * (1 - t) + bottom[2] * t),
        ]
    return Image.fromarray(canvas)
373
+
374
def create_solid_background(color: str, width: int, height: int) -> Image.Image:
    """Solid-color RGB image; unrecognized color names fall back to gray."""
    palette = {
        "white": (255, 255, 255), "black": (0, 0, 0), "red": (255, 0, 0),
        "green": (0, 255, 0), "blue": (0, 0, 255), "yellow": (255, 255, 0),
        "purple": (128, 0, 128), "orange": (255, 165, 0), "pink": (255, 192, 203),
        "gray": (128, 128, 128)
    }
    fill = palette.get(color.lower(), (128, 128, 128))
    return Image.new("RGB", (width, height), fill)
383
+
384
def download_unsplash_image(query: str, width: int, height: int) -> Image.Image:
    """Fetch a random Unsplash photo for *query* at width x height.

    Resizes when the service returns a different size; any failure
    (network, decode) falls back to a solid gray background.
    """
    try:
        url = f"https://source.unsplash.com/{width}x{height}/?{query}"
        resp = requests.get(url, timeout=10)
        resp.raise_for_status()
        photo = Image.open(io.BytesIO(resp.content))
        if photo.size != (width, height):
            photo = photo.resize((width, height), Image.Resampling.LANCZOS)
        return photo.convert("RGB")
    except Exception as e:
        logger.warning("Unsplash download failed: %s", e)
        return create_solid_background("gray", width, height)
396
+
397
+ # ==============================================================================
398
+ # VIDEO UTILITIES
399
+ # ==============================================================================
400
+
401
def get_video_info(video_path: str) -> Dict[str, Any]:
    """Probe fps/frame-count/size/duration of a video via OpenCV.

    Returns a dict with keys fps, frame_count, width, height, duration.
    On any failure the error is logged and safe 1080p defaults are returned.
    The capture handle is now released in a finally block — the original
    leaked it when isOpened() failed or a property read raised.
    """
    cap = None
    try:
        cap = cv2.VideoCapture(video_path)
        if not cap.isOpened():
            raise ValueError("Cannot open video file")
        fps = cap.get(cv2.CAP_PROP_FPS)
        frames = int(cap.get(cv2.CAP_PROP_FRAME_COUNT))
        w = int(cap.get(cv2.CAP_PROP_FRAME_WIDTH))
        h = int(cap.get(cv2.CAP_PROP_FRAME_HEIGHT))
        return {"fps": fps, "frame_count": frames, "width": w, "height": h,
                "duration": (frames / fps if fps > 0 else 0)}
    except Exception as e:
        logger.error("get_video_info failed: %s", e)
        return {"fps": 30.0, "frame_count": 0, "width": 1920, "height": 1080, "duration": 0}
    finally:
        if cap is not None:
            cap.release()
416
+
417
def extract_frame(video_path: str, frame_number: int) -> Optional[np.ndarray]:
    """Return frame *frame_number* of the video as an RGB ndarray, or None.

    Adds an isOpened() guard (the original seeked into an unopened capture)
    and releases the handle in a finally block so it is not leaked when
    read/convert raises.
    """
    cap = None
    try:
        cap = cv2.VideoCapture(video_path)
        if not cap.isOpened():
            return None
        cap.set(cv2.CAP_PROP_POS_FRAMES, frame_number)
        ret, frame = cap.read()
        if ret:
            # OpenCV decodes BGR; callers expect RGB.
            return cv2.cvtColor(frame, cv2.COLOR_BGR2RGB)
        return None
    except Exception as e:
        logger.error("extract_frame failed: %s", e)
        return None
    finally:
        if cap is not None:
            cap.release()
429
+
430
def ffmpeg_safe_call(inp: Path, out: Path, extra=()):
    """Run ffmpeg on *inp* producing *out*, with optional extra args.

    Quiet output (-hide_banner, -loglevel error), overwrite allowed (-y).
    Raises CalledProcessError on a non-zero exit and TimeoutExpired after
    300 seconds.
    """
    cmd = ["ffmpeg", "-y", "-hide_banner", "-loglevel", "error", "-i", str(inp)]
    cmd.extend(extra)
    cmd.append(str(out))
    logger.info("FFMPEG %s", " ".join(cmd))
    subprocess.run(cmd, check=True, timeout=300)
434
+
435
+ # ==============================================================================
436
+ # PROGRESS TRACKING
437
+ # ==============================================================================
438
+
439
class ProgressTracker:
    """Thread-safe progress tracking for video processing.

    All mutators and readers take an internal lock, so one instance may be
    shared between the processing thread and UI callbacks. Fixed the
    annotations that claimed ``float``/``int`` but defaulted to ``None``
    (now ``Optional[...]``).
    """

    def __init__(self):
        self.current_step = ""          # human-readable label of the current phase
        self.progress = 0.0             # fraction complete, clamped to [0, 1]
        self.total_frames = 0
        self.processed_frames = 0
        self.start_time = time.time()   # basis for elapsed/ETA
        self.lock = threading.Lock()

    def update(self, step: str, progress: Optional[float] = None):
        """Set the current step label and, when given, the clamped progress."""
        with self.lock:
            self.current_step = step
            if progress is not None:
                self.progress = max(0.0, min(1.0, progress))

    def update_frames(self, processed: int, total: Optional[int] = None):
        """Record frame counts; recompute progress when the total is known."""
        with self.lock:
            self.processed_frames = processed
            if total is not None:
                self.total_frames = total
            if self.total_frames > 0:
                self.progress = self.processed_frames / self.total_frames

    def get_status(self) -> Dict[str, Any]:
        """Return a consistent snapshot: step, progress, frames, elapsed, ETA."""
        with self.lock:
            elapsed = time.time() - self.start_time
            eta = 0
            # Guard against wild ETAs while progress is effectively zero.
            if self.progress > 0.01:
                eta = elapsed * (1.0 - self.progress) / self.progress
            return {
                "step": self.current_step, "progress": self.progress,
                "processed_frames": self.processed_frames, "total_frames": self.total_frames,
                "elapsed": elapsed, "eta": eta
            }

# Global tracker
progress_tracker = ProgressTracker()
477
+
478
+ # ==============================================================================
479
+ # SAFE FILE OPS
480
+ # ==============================================================================
481
+
482
def create_job_directory() -> Path:
    """Create and return an isolated per-job working directory.

    Name combines a short random id with the current unix time so
    concurrent jobs never collide.
    """
    short_id = str(uuid.uuid4())[:8]
    job_dir = JOB_ROOT / f"job_{short_id}_{int(time.time())}"
    job_dir.mkdir(parents=True, exist_ok=True)
    logger.info("πŸ“ Created job directory: %s", job_dir)
    return job_dir
488
+
489
def atomic_file_write(filepath: Path, content: bytes):
    """Atomically write *content* to *filepath* via a same-directory temp file.

    Uses Path.replace() instead of rename(): replace() atomically overwrites
    an existing target on every platform, whereas rename() raises
    FileExistsError on Windows — and it matches the sibling
    atomic_write_bytes() helper. The partial file is removed on failure.
    """
    # with_name appends ".tmp" without breaking pathlib suffix rules.
    temp_path = filepath.with_name(f"{filepath.name}.tmp")
    try:
        with open(temp_path, 'wb') as f:
            f.write(content)
        temp_path.replace(filepath)
        logger.debug("βœ… Atomic write: %s", filepath)
    except Exception:
        temp_path.unlink(missing_ok=True)  # best-effort cleanup
        raise  # bare raise preserves the original traceback (was `raise e`)
501
+
502
def safe_download(url: str, filepath: Path, max_size: int = 500 * 1024 * 1024):
    """Stream *url* into *filepath* with a hard size cap (default 500 MB).

    Downloads to a sibling ".download" temp file, validates it is non-empty,
    then atomically moves it into place with Path.replace() (rename() would
    fail on Windows if the target exists). The HTTP response is closed
    deterministically via a context manager — the original leaked the
    connection. Raises ValueError for oversized/empty downloads and
    re-raises network errors; the temp file is removed on any failure.
    """
    # with_name appends ".download" safely (e.g. "video.mp4.download").
    temp_path = filepath.with_name(f"{filepath.name}.download")

    try:
        with requests.get(url, stream=True, timeout=30) as r:
            r.raise_for_status()
            # Reject early when the server declares an oversized body.
            cl = r.headers.get('content-length')
            if cl and int(cl) > max_size:
                raise ValueError(f"File too large: {cl} bytes")

            downloaded = 0
            with open(temp_path, 'wb') as f:
                for chunk in r.iter_content(chunk_size=8192):
                    if chunk:
                        downloaded += len(chunk)
                        # Enforce the cap even when content-length lied/was absent.
                        if downloaded > max_size:
                            raise ValueError(f"Download exceeded size limit: {downloaded} bytes")
                        f.write(chunk)

        if not temp_path.exists() or temp_path.stat().st_size == 0:
            raise ValueError("Download resulted in empty file")

        temp_path.replace(filepath)
        logger.info("βœ… Downloaded: %s (%d bytes)", filepath, downloaded)

    except Exception as e:
        temp_path.unlink(missing_ok=True)
        logger.error("❌ Download failed: %s", e)
        raise
533
+
534
+ # ==============================================================================
535
+ # ENHANCED PIPELINE INTEGRATION
536
+ # ==============================================================================
537
+
538
def process_video_pipeline(
    video_path: str,
    background_image: Optional[Image.Image],
    background_type: str,
    background_prompt: str,
    job_dir: Path,
    progress_callback: Optional[Callable] = None
) -> str:
    """Process video using the two-stage pipeline with enhanced safety and monitoring.

    Copies the input into the app-controlled upload area, runs the imported
    ``two_stage_pipeline.process_two_stage`` (SAM2 segmentation, then
    composition), validates the output file, and returns its path. All work
    happens inside ``run_safely`` for rich failure logging; on error the GPU
    cache is cleared and the job-dir contents are logged before re-raising.

    NOTE(review): ``background_type`` and ``background_prompt`` are accepted
    but never used here — only logged indirectly; kept for interface
    compatibility with callers.

    Raises FileNotFoundError / ValueError on bad inputs, ImportError when
    the pipeline module is missing, RuntimeError on empty/missing output.
    """

    def _inner_process():
        logger.info("=" * 60)
        logger.info("=== ENHANCED TWO-STAGE PIPELINE (WITH SAFETY) ===")
        logger.info("=" * 60)

        # Input diagnostics up front so failures are easy to triage from logs.
        logger.info("DEBUG video_path=%s exists=%s size=%s bytes",
                    video_path, Path(video_path).exists(),
                    (Path(video_path).stat().st_size if Path(video_path).exists() else "N/A"))
        logger.info("DEBUG job_dir=%s writable=%s", job_dir, os.access(job_dir, os.W_OK))
        logger.info("DEBUG bg_image=%s bg_type=%s | %s",
                    (background_image.size if background_image else None),
                    background_type, _disk_stats(APP_ROOT))

        if not Path(video_path).exists():
            raise FileNotFoundError(f"Video file not found: {video_path}")

        # Copy into controlled area (sanitized name under DATA_ROOT/videos).
        safe_video_path = place_uploaded(video_path, "videos")
        logger.info("DEBUG safe_video_path=%s", safe_video_path)

        # Import lazily so the module loads even when the heavy pipeline
        # dependencies are absent; failure here is fatal for processing.
        logger.info("DEBUG importing two-stage pipeline…")
        try:
            from two_stage_pipeline import process_two_stage as pipeline_process
            logger.info("βœ“ two-stage pipeline import OK")
        except ImportError as e:
            logger.error("Import two_stage_pipeline failed: %s", e)
            raise

        progress_tracker.update("Initializing enhanced two-stage pipeline…")

        # Mutable closure state: which stage we are in and when it started,
        # used to time stage transitions from progress messages alone.
        current_stage = {"stage": "init", "start_time": time.time()}

        def safe_progress_callback(step: str, progress: Optional[float] = None):
            # Never let a progress/logging failure kill the pipeline itself.
            try:
                now = time.time()
                elapsed = now - current_stage["start_time"]

                # Stage transitions are detected by substring-matching the
                # step text emitted by the pipeline.
                if "Stage 1" in step and current_stage["stage"] != "stage1":
                    current_stage["stage"] = "stage1"
                    current_stage["start_time"] = now
                    logger.info("πŸ”„ Entering Stage 1 (SAM2) | %s", _disk_stats(APP_ROOT))
                elif "Stage 2" in step and current_stage["stage"] != "stage2":
                    d1 = now - current_stage["start_time"]
                    current_stage["stage"] = "stage2"
                    current_stage["start_time"] = now
                    logger.info("πŸ”„ Entering Stage 2 (Composition) β€” Stage 1 time %.1fs | %s", d1, _disk_stats(APP_ROOT))
                elif "Done" in step and current_stage["stage"] != "complete":
                    d2 = now - current_stage["start_time"]
                    current_stage["stage"] = "complete"
                    logger.info("πŸ”„ Pipeline complete β€” Stage 2 time %.1fs | %s", d2, _disk_stats(APP_ROOT))

                logger.info("PROGRESS [%s] (%.1fs): %s (%s)",
                            current_stage['stage'].upper(), elapsed, step, progress)
                progress_tracker.update(step, progress)

                # Forward a formatted string to the caller-supplied callback.
                if progress_callback:
                    progress_callback(f"Progress: {progress:.1%} - {step}" if progress is not None else step)

                # Stage 1 (SAM2) is the memory-heavy phase; warn if it drags on.
                if current_stage["stage"] == "stage1" and elapsed > 15:
                    logger.warning("⚠️ Stage 1 running for %.1fs β€” monitoring memory", elapsed)

            except Exception as e:
                logger.error("Progress callback error: %s", e)

        if background_image is None:
            raise ValueError("Background image is required")

        logger.info("DEBUG: calling two-stage pipeline…")
        result_path = pipeline_process(
            video_path=str(safe_video_path),
            background_image=background_image,
            workdir=job_dir,
            progress=safe_progress_callback,
            use_matany=True
        )

        logger.info("DEBUG: pipeline returned %s (%s)", result_path, type(result_path))

        # Output validation: existence, non-zero size, and (best-effort)
        # that OpenCV can open it and count frames.
        if result_path:
            result_file = Path(result_path)
            logger.info("DEBUG: result exists=%s", result_file.exists())
            if result_file.exists():
                size = result_file.stat().st_size
                logger.info("DEBUG: result size=%d bytes", size)
                if size == 0:
                    raise RuntimeError("Pipeline produced empty output file")

                # Quick validity check
                try:
                    cap = cv2.VideoCapture(str(result_file))
                    if cap.isOpened():
                        frames = int(cap.get(cv2.CAP_PROP_FRAME_COUNT))
                        logger.info("DEBUG: output frame_count=%d", frames)
                        cap.release()
                    else:
                        logger.warning("⚠️ Output may not be a valid video (cannot open)")
                except Exception as e:
                    logger.warning("⚠️ Could not verify output video: %s", e)

        if not result_path or not Path(result_path).exists():
            raise RuntimeError("Two-stage pipeline failed β€” no output produced")

        logger.info("=" * 60)
        logger.info("βœ… ENHANCED TWO-STAGE PIPELINE COMPLETED: %s", result_path)
        logger.info("=" * 60)
        return result_path

    try:
        return run_safely(_inner_process)
    except Exception as e:
        # Best-effort cleanup + state dump before propagating the failure.
        logger.error("🧹 Error cleanup…")
        clear_gpu_memory()
        logger.error("Job dir state: %s",
                     (list(job_dir.iterdir()) if job_dir.exists() else "does not exist"))
        raise
VideoBackgroundReplacer2/ui_core_interface.py ADDED
@@ -0,0 +1,430 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ #!/usr/bin/env python3
2
+ """
3
+ BackgroundFX Pro β€” Gradio Interface & Event Handlers
4
+ UI components, event handlers, and interface creation
5
+ """
6
+
7
+ import logging
8
+ import shutil
9
+ import traceback
10
+ from typing import Optional, Tuple
11
+ from pathlib import Path
12
+
13
+ import torch
14
+ import gradio as gr
15
+ from PIL import Image
16
+
17
+ # Import our functionality
18
+ from ui_core_functionality import (
19
+ get_device, clear_gpu_memory, get_video_info, extract_frame,
20
+ create_gradient_background, create_solid_background, download_unsplash_image,
21
+ generate_ai_background, create_job_directory, safe_file_operation, process_video_pipeline,
22
+ progress_tracker, JOB_ROOT, APP_ROOT, logger
23
+ )
24
+
25
+ # ===============================================================================
26
+ # GRADIO HANDLERS
27
+ # ===============================================================================
28
+
29
def handle_custom_background_upload(image: Optional[Image.Image]) -> Tuple[Optional[Image.Image], str]:
    """Normalize an uploaded background image to RGB and report status."""
    if image is None:
        return None, "No image uploaded"
    try:
        rgb_image = image if image.mode == "RGB" else image.convert("RGB")
        status = f"βœ… Custom background uploaded: {rgb_image.size[0]}x{rgb_image.size[1]}"
        logger.info(status)
        return rgb_image, status
    except Exception as e:
        error_msg = f"❌ Background upload failed: {str(e)}"
        logger.error(error_msg)
        return None, error_msg
43
+
44
def handle_background_type_change(bg_type: str):
    """Toggle UI controls for the selected background type.

    Returns three gr.update objects: (upload image, prompt textbox,
    generate button). "upload" shows only the image input; every other
    type shows the prompt box with a type-specific placeholder plus the
    generate button.
    """
    logger.info(f"🎨 Background type changed to: {bg_type}")
    if bg_type == "upload":
        return (
            gr.update(visible=True, label="Upload Custom Background Image"),
            gr.update(visible=False),
            gr.update(visible=False),
        )

    placeholders = {
        "ai_generate": "Describe the scene: 'futuristic city', 'tropical beach', 'mystical forest'...",
        "gradient": "Choose style: 'sunset', 'ocean', 'forest', 'sky'",
        "solid": "Choose color: 'red', 'blue', 'green', 'white', 'black'...",
        "unsplash": "Search query: 'mountain landscape', 'city skyline', 'nature'..."
    }
    return (
        gr.update(visible=False),
        gr.update(visible=True, placeholder=placeholders.get(bg_type, "Enter your prompt...")),
        gr.update(visible=True, value=f"Generate {bg_type.replace('_', ' ').title()} Background"),
    )
65
+
66
def handle_video_upload(video_file) -> Tuple[Optional[str], str]:
    """Copy an uploaded video into a fresh job directory and report its stats.

    Returns (path-in-job-dir, status message); (None, error message) on failure.
    """
    if video_file is None:
        return None, "No video file provided"
    try:
        job_dir = create_job_directory()
        source = Path(video_file)
        # Preserve original extension if possible
        suffix = source.suffix if source.suffix else ".mp4"
        dest = job_dir / f"input_video{suffix}"
        safe_file_operation(lambda src, dst: shutil.copy2(src, dst), str(source), str(dest))

        info = get_video_info(str(dest))
        duration_text = f"{info['duration']:.1f}s"
        status = f"βœ… Video uploaded: {info['width']}x{info['height']}, {info['fps']:.1f}fps, {duration_text}"
        logger.info(status)
        return str(dest), status
    except Exception as e:
        error_msg = f"❌ Video upload failed: {str(e)}"
        logger.error(error_msg)
        return None, error_msg
87
+
88
def handle_background_generation(bg_type: str, bg_prompt: str, video_path: str) -> Tuple[Optional[Image.Image], str]:
    """Generate a background matching the loaded video's dimensions.

    Dispatches on *bg_type* (ai_generate / gradient / solid / unsplash);
    the "upload" type is handled elsewhere. Returns (image, status) or
    (None, error message).
    """
    if not video_path:
        return None, "No video loaded"
    if bg_type == "upload":
        return None, "Use the upload field above for custom backgrounds"

    try:
        # Match the background to the source video's resolution.
        info = get_video_info(video_path)
        vid_w, vid_h = info['width'], info['height']

        if bg_type == "ai_generate":
            generated = generate_ai_background(bg_prompt, vid_w, vid_h)
            status = f"βœ… Generated AI background: '{bg_prompt}'"

        elif bg_type == "gradient":
            known_gradients = ["sunset", "ocean", "forest", "sky"]
            chosen = next((g for g in known_gradients if g in bg_prompt.lower()), known_gradients[0])
            generated = create_gradient_background(chosen, vid_w, vid_h)
            status = f"βœ… Generated {chosen} gradient background"

        elif bg_type == "solid":
            known_colors = ["white", "black", "red", "green", "blue", "yellow", "purple", "orange", "pink", "gray"]
            chosen_color = next((c for c in known_colors if c in bg_prompt.lower()), "white")
            generated = create_solid_background(chosen_color, vid_w, vid_h)
            status = f"βœ… Generated {chosen_color} solid background"

        elif bg_type == "unsplash":
            query = bg_prompt.strip() or "nature"
            generated = download_unsplash_image(query, vid_w, vid_h)
            status = f"βœ… Downloaded background from Unsplash: '{query}'"

        else:
            generated = create_solid_background("gray", vid_w, vid_h)
            status = "βœ… Generated default gray background"

        logger.info(status)
        return generated, status

    except Exception as e:
        error_msg = f"❌ Background generation failed: {str(e)}"
        logger.error(error_msg)
        return None, error_msg
131
+
132
def handle_video_processing(
    video_path: str,
    background_image: Optional[Image.Image],
    background_type: str,
    background_prompt: str,
    progress=gr.Progress()
) -> Tuple[Optional[str], str]:
    """Run the full background-replacement pipeline on the uploaded video.

    Args:
        video_path: Path to the previously uploaded input video.
        background_image: Replacement background (PIL image) or None.
        background_type: Background mode selected in the UI.
        background_prompt: Free-text prompt used by generated backgrounds.
        progress: Gradio progress handle (injected by Gradio; the call-time
            default is the documented Gradio idiom).

    Returns:
        (result_video_path, status_message); the path is None on failure.
    """
    if not video_path:
        return None, "❌ No video provided"
    # Explicit None check: image-like objects (e.g. numpy arrays) have
    # ambiguous or raising truthiness, so `not background_image` is fragile.
    if background_image is None:
        return None, "❌ No background provided"

    try:
        progress(0, "Starting video processing...")
        logger.info("🎬 Starting video processing")

        job_dir = create_job_directory()
        progress_tracker.update("Creating job directory...")

        def update_progress(message: str):
            # Forward pipeline progress into the Gradio progress bar; never
            # let a UI update failure abort the actual processing.
            try:
                status = progress_tracker.get_status()
                progress_val = status['progress']
                progress(progress_val, message)
                logger.info(f"Progress: {progress_val:.1%} - {message}")
            except Exception as e:
                logger.warning(f"Progress update failed: {e}")

        result_path = process_video_pipeline(
            video_path=video_path,
            background_image=background_image,
            background_type=background_type,
            background_prompt=background_prompt,
            job_dir=job_dir,
            progress_callback=update_progress
        )

        progress(1.0, "Processing complete!")
        clear_gpu_memory()

        status = "✅ Video processing completed successfully!"
        logger.info(status)
        return result_path, status

    except Exception as e:
        error_msg = f"❌ Processing failed: {str(e)}"
        logger.error(error_msg)
        logger.error("Traceback: %s", traceback.format_exc())
        clear_gpu_memory()  # free VRAM even on failure
        return None, error_msg
183
+
184
def handle_preview_generation(video_path: str, frame_number: int = 0) -> Tuple[Optional[Image.Image], str]:
    """Extract one frame of the loaded video for the preview pane.

    Returns (preview_image, status_message); the image is None on failure.
    """
    if not video_path:
        return None, "No video loaded"
    try:
        pixels = extract_frame(video_path, frame_number)
        if pixels is None:
            return None, "Failed to extract frame"
        return Image.fromarray(pixels), f"✅ Preview generated (frame {frame_number})"
    except Exception as e:
        error_msg = f"❌ Preview generation failed: {str(e)}"
        logger.error(error_msg)
        return None, error_msg
198
+
199
+ # ===============================================================================
200
+ # GRADIO INTERFACE
201
+ # ===============================================================================
202
+
203
def create_interface():
    """Create the main Gradio interface.

    Layout: left column = video input + background selection; right column =
    processing controls + results. Two gr.State values carry the uploaded
    video path and the chosen background image between event handlers.
    Returns the gr.Blocks app (caller queues and launches it).
    """

    custom_css = """
    .container { max-width: 1200px; margin: auto; }
    .header { text-align: center; margin-bottom: 30px; }
    .section { margin: 20px 0; padding: 20px; border-radius: 10px; }
    .status { font-family: monospace; font-size: 12px; }
    .progress-bar { margin: 10px 0; }
    """

    with gr.Blocks(
        title="BackgroundFX Pro",
        css=custom_css,
        theme=gr.themes.Soft(),
        analytics_enabled=False,  # keep things quiet/stable on 4.x
    ) as demo:

        gr.HTML("""
        <div class="header">
            <h1>🎬 BackgroundFX Pro</h1>
            <p>Professional AI-powered video background replacement using SAM2 and MatAnyone</p>
        </div>
        """)

        # Cross-event state: input video path and selected background image.
        video_path_state = gr.State(value=None)
        background_image_state = gr.State(value=None)

        with gr.Row():
            with gr.Column(scale=1):
                with gr.Group():
                    gr.HTML("<h3>📹 Video Input</h3>")
                    video_upload = gr.File(
                        label="Upload Video",
                        file_types=[".mp4", ".avi", ".mov", ".mkv"],
                        type="filepath"
                    )
                    video_preview = gr.Image(
                        label="Video Preview",
                        interactive=False,
                        height=300
                    )
                    # Fixed preview status box (hidden); only a .then() target.
                    preview_status = gr.Textbox(
                        label="Preview Status",
                        interactive=False,
                        visible=False,
                        elem_classes=["status"]
                    )
                    video_status = gr.Textbox(
                        label="Video Status",
                        interactive=False,
                        elem_classes=["status"]
                    )

                with gr.Group():
                    gr.HTML("<h3>🎨 Background Selection</h3>")

                    gr.HTML("""
                    <div style='background: #f0f8ff; padding: 10px; border-radius: 5px; margin-bottom: 15px;'>
                        <b>Choose your background method:</b><br>
                        • <b>Upload:</b> Use your own image<br>
                        • <b>AI Generate:</b> Create with AI prompt<br>
                        • <b>Gradient/Solid/Unsplash:</b> Quick generation
                    </div>
                    """)

                    # (label, value) pairs; values match handle_background_generation's dispatch.
                    background_type = gr.Radio(
                        choices=[
                            ("📤 Upload Image", "upload"),
                            ("🤖 AI Generate", "ai_generate"),
                            ("🌈 Gradient", "gradient"),
                            ("🎯 Solid Color", "solid"),
                            ("📸 Unsplash Photo", "unsplash")
                        ],
                        label="Background Type",
                        value="upload"
                    )

                    # Visible only for the "upload" type (toggled by the change handler).
                    custom_bg_upload = gr.Image(
                        label="Upload Custom Background",
                        type="pil",
                        interactive=True,
                        height=250,
                        visible=True
                    )

                    # Hidden initially; shown for generated background types.
                    background_prompt = gr.Textbox(
                        label="Background Prompt",
                        placeholder=("AI: 'futuristic city', 'tropical beach' | Gradient: 'sunset', 'ocean' | "
                                     "Solid: 'red', 'blue' | Unsplash: 'mountain landscape'"),
                        value="futuristic city skyline at sunset",
                        visible=False
                    )

                    generate_bg_btn = gr.Button(
                        "Generate Background",
                        variant="secondary",
                    )

                    background_preview = gr.Image(
                        label="Background Preview",
                        interactive=False,
                        height=300
                    )

                    background_status = gr.Textbox(
                        label="Background Status",
                        interactive=False,
                        elem_classes=["status"]
                    )

            with gr.Column(scale=1):
                with gr.Group():
                    gr.HTML("<h3>⚡ Processing</h3>")

                    process_btn = gr.Button(
                        "🚀 Process Video",
                        variant="primary",
                    )

                    processing_status = gr.Textbox(
                        label="Processing Status",
                        interactive=False,
                        elem_classes=["status"]
                    )

                with gr.Group():
                    gr.HTML("<h3>📽️ Results</h3>")

                    result_video = gr.Video(
                        label="Processed Video",
                        height=400
                    )

                    # Real downloadable output; revealed once a result path exists.
                    download_btn = gr.DownloadButton(
                        "📥 Download Result",
                        visible=False
                    )

        with gr.Accordion("🔧 System Information", open=False):
            # NOTE(review): f-string evaluated once at interface build time,
            # not per page load.
            system_info = gr.HTML(f"""
            <div class="system-info">
                <p><strong>Device:</strong> {get_device()}</p>
                <p><strong>Torch Version:</strong> {torch.__version__}</p>
                <p><strong>CUDA Available:</strong> {torch.cuda.is_available()}</p>
                <p><strong>Job Directory:</strong> {JOB_ROOT}</p>
                <p><strong>App Root:</strong> {APP_ROOT}</p>
            </div>
            """)

        # =========================
        # Event Handlers (4.42.x)
        # =========================

        # Lightweight; no queue needed
        background_type.change(
            fn=handle_background_type_change,
            inputs=[background_type],
            outputs=[custom_bg_upload, background_prompt, generate_bg_btn],
            queue=False,
            concurrency_limit=4,
        )

        # Small, immediate state update; no queue
        custom_bg_upload.change(
            fn=handle_custom_background_upload,
            inputs=[custom_bg_upload],
            outputs=[background_image_state, background_status],
            queue=False,
            concurrency_limit=2,
        ).then(
            # Mirror the stored background into the preview pane.
            fn=lambda img: img,
            inputs=[background_image_state],
            outputs=[background_preview],
            queue=False,
        )

        # Copy to job dir + probe video info; keep queued but single flight
        video_upload.change(
            fn=handle_video_upload,
            inputs=[video_upload],
            outputs=[video_path_state, video_status],
            queue=True,
            concurrency_limit=1,
        ).then(
            fn=handle_preview_generation,
            inputs=[video_path_state],
            outputs=[video_preview, preview_status],
            queue=False,
        )

        # Background generation can be heavier; single-flight
        generate_bg_btn.click(
            fn=handle_background_generation,
            inputs=[background_type, background_prompt, video_path_state],
            outputs=[background_image_state, background_status],
            queue=True,
            concurrency_limit=1,
        ).then(
            fn=lambda img: img,
            inputs=[background_image_state],
            outputs=[background_preview],
            queue=False,
        )

        # The heavy pipeline — single-flight
        process_btn.click(
            fn=handle_video_processing,
            inputs=[
                video_path_state,
                background_image_state,
                background_type,
                background_prompt
            ],
            outputs=[result_video, processing_status],
            queue=True,
            concurrency_limit=1,
        ).then(
            # Wire the download button (set value=path and visibility)
            fn=lambda path: gr.update(value=path, visible=bool(path)),
            inputs=[result_video],
            outputs=[download_btn],
            queue=False,
        )

    return demo
VideoBackgroundReplacer2/update_pins.py ADDED
@@ -0,0 +1,197 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ #!/usr/bin/env python3
2
+ """
3
+ update_pins.py
4
+ - Fetch newest SHAs (release tag or default branch) for SAM2 + MatAnyone
5
+ - Update ARG lines in Dockerfile: SAM2_SHA / MATANYONE_SHA
6
+ - Supports dry-run and manual pins
7
+ - Uses GitHub API; set GITHUB_TOKEN to avoid rate limits (optional)
8
+ """
9
+
10
+ import os
11
+ import re
12
+ import sys
13
+ import json
14
+ import argparse
15
+ from urllib.parse import urlparse
16
+ import requests
17
+ from datetime import datetime, timezone
18
+ from shutil import copyfile
19
+
20
# Default target file; overridable via --dockerfile.
DOCKERFILE_PATH = "Dockerfile"

# Default repos (must match your Dockerfile ARGs)
SAM2_REPO_URL = "https://github.com/facebookresearch/segment-anything-2"
MATANY_REPO_URL = "https://github.com/pq-yang/MatAnyone"

# Shared HTTP session for all GitHub API calls; an optional GITHUB_TOKEN
# raises the unauthenticated rate limit.
SESSION = requests.Session()
if os.getenv("GITHUB_TOKEN"):
    SESSION.headers.update({"Authorization": f"Bearer {os.environ['GITHUB_TOKEN']}"})
SESSION.headers.update({
    "Accept": "application/vnd.github+json",
    "User-Agent": "update-pins-script"
})
33
+
34
def gh_owner_repo(repo_url: str):
    """Split a GitHub repository URL into its (owner, repo) path components."""
    segments = urlparse(repo_url).path.strip("/").split("/")
    if len(segments) < 2:
        raise ValueError(f"Invalid repo URL: {repo_url}")
    owner, repo = segments[0], segments[1]
    return owner, repo
40
+
41
def gh_api(path: str):
    """GET a GitHub REST endpoint and return the decoded JSON payload.

    Raises RuntimeError for any 4xx/5xx response.
    """
    response = SESSION.get(f"https://api.github.com{path}", timeout=30)
    if response.status_code >= 400:
        raise RuntimeError(f"GitHub API error {response.status_code}: {response.text}")
    return response.json()
47
+
48
def get_latest_release_sha(repo_url: str) -> tuple[str, str]:
    """Return (ref_desc, commit_sha) using latest release tag."""
    owner, repo = gh_owner_repo(repo_url)
    try:
        tag = gh_api(f"/repos/{owner}/{repo}/releases/latest")["tag_name"]
        ref_obj = gh_api(f"/repos/{owner}/{repo}/git/ref/tags/{tag}")["object"]
        # Annotated tags point at a tag object that must be dereferenced to
        # reach the underlying commit; lightweight tags point at it directly.
        if ref_obj["type"] == "tag":
            sha = gh_api(f"/repos/{owner}/{repo}/git/tags/{ref_obj['sha']}")["object"]["sha"]
        else:
            sha = ref_obj["sha"]
        return (f"release:{tag}", sha)
    except Exception as e:
        raise RuntimeError(f"Could not get latest release for {repo}: {e}")
65
+
66
def get_latest_default_branch_sha(repo_url: str) -> tuple[str, str]:
    """Return (ref_desc, commit_sha) using the default branch head."""
    owner, repo = gh_owner_repo(repo_url)
    default_branch = gh_api(f"/repos/{owner}/{repo}")["default_branch"]
    head_sha = gh_api(f"/repos/{owner}/{repo}/branches/{default_branch}")["commit"]["sha"]
    return (f"branch:{default_branch}", head_sha)
74
+
75
def get_sha_for_ref(repo_url: str, ref: str) -> tuple[str, str]:
    """
    Resolve any Git ref (branch name, tag name, or commit SHA) to a commit SHA.
    """
    owner, repo = gh_owner_repo(repo_url)

    # A full 40-hex SHA needs no API round-trip.
    if re.fullmatch(r"[0-9a-f]{40}", ref):
        return (f"commit:{ref[:7]}", ref)

    # Probe branch, then tag, then bare commit; first successful lookup wins.
    candidates = (
        ("branch", f"/repos/{owner}/{repo}/branches/{ref}"),
        ("tag", f"/repos/{owner}/{repo}/git/ref/tags/{ref}"),
        ("commit", f"/repos/{owner}/{repo}/commits/{ref}"),
    )
    for kind, endpoint in candidates:
        try:
            payload = gh_api(endpoint)
            if kind == "branch":
                return (f"branch:{ref}", payload["commit"]["sha"])
            if kind == "tag":
                obj = payload["object"]
                if obj["type"] == "tag":
                    # Annotated tag: dereference to the tagged commit.
                    tag_obj = gh_api(f"/repos/{owner}/{repo}/git/tags/{obj['sha']}")
                    return (f"tag:{ref}", tag_obj["object"]["sha"])
                return (f"tag:{ref}", obj["sha"])
            return (f"commit:{ref[:7]}", payload["sha"])
        except Exception:
            # Any failure for this kind just means "try the next one".
            continue
    raise RuntimeError(f"Could not resolve ref '{ref}' for {repo}")
105
+
106
def update_dockerfile_arg(dockerfile_text: str, arg_name: str, new_value: str) -> str:
    """Rewrite the value of an `ARG <arg_name>=...` line in Dockerfile text.

    Replaces every matching line's value with *new_value* and returns the
    updated text. Raises RuntimeError when no such ARG line exists.
    """
    arg_line = re.compile(rf"^(ARG\s+{re.escape(arg_name)}=).*$", re.MULTILINE)
    # Callable replacement avoids backreference ambiguity (e.g. \12).
    updated, hits = arg_line.subn(lambda m: m.group(1) + new_value, dockerfile_text)
    if hits == 0:
        raise RuntimeError(f"ARG {arg_name}=… line not found in Dockerfile.")
    return updated
123
+
124
def main():
    """CLI entry point: resolve pins and rewrite the Dockerfile ARG lines.

    Flow: parse args -> resolve one commit SHA per repo (an explicit
    --*-ref overrides --mode) -> print the pins (text or JSON) -> patch the
    Dockerfile in place (with optional .bak backup), unless --dry-run.
    """
    ap = argparse.ArgumentParser(description="Update pinned SHAs in Dockerfile.")
    ap.add_argument("--mode", choices=["release", "default-branch"], default="release",
                    help="Where to pull pins from (latest GitHub release tag or default branch head).")
    ap.add_argument("--sam2-ref", help="Explicit ref for SAM2 (tag/branch/sha). Overrides --mode.")
    ap.add_argument("--matany-ref", help="Explicit ref for MatAnyone (tag/branch/sha). Overrides --mode.")
    ap.add_argument("--dockerfile", default=DOCKERFILE_PATH, help="Path to Dockerfile.")
    ap.add_argument("--dry-run", action="store_true", help="Show changes but do not write file.")
    ap.add_argument("--json", action="store_true", help="Print resulting pins as JSON.")
    ap.add_argument("--no-backup", action="store_true", help="Do not create a Dockerfile.bak backup.")
    args = ap.parse_args()

    # Resolve SHAs
    if args.sam2_ref:
        sam2_refdesc, sam2_sha = get_sha_for_ref(SAM2_REPO_URL, args.sam2_ref)
    else:
        sam2_refdesc, sam2_sha = (
            get_latest_release_sha(SAM2_REPO_URL) if args.mode == "release"
            else get_latest_default_branch_sha(SAM2_REPO_URL)
        )

    if args.matany_ref:
        mat_refdesc, mat_sha = get_sha_for_ref(MATANY_REPO_URL, args.matany_ref)
    else:
        mat_refdesc, mat_sha = (
            get_latest_release_sha(MATANY_REPO_URL) if args.mode == "release"
            else get_latest_default_branch_sha(MATANY_REPO_URL)
        )

    # Summary record; also the JSON output shape.
    result = {
        "timestamp": datetime.now(timezone.utc).isoformat(),
        "mode": args.mode,
        "SAM2": {"repo": SAM2_REPO_URL, "ref": sam2_refdesc, "sha": sam2_sha},
        "MatAnyone": {"repo": MATANY_REPO_URL, "ref": mat_refdesc, "sha": mat_sha},
    }

    # Show pins
    if args.json:
        print(json.dumps(result, indent=2))
    else:
        print(f"[Pins] SAM2 -> {sam2_refdesc} -> {sam2_sha}")
        print(f"[Pins] MatAnyone -> {mat_refdesc} -> {mat_sha}")

    # Read Dockerfile
    if not os.path.isfile(args.dockerfile):
        raise FileNotFoundError(f"Dockerfile not found at: {args.dockerfile}")
    with open(args.dockerfile, "r", encoding="utf-8") as f:
        text = f.read()

    # Update lines
    text = update_dockerfile_arg(text, "SAM2_SHA", sam2_sha)
    text = update_dockerfile_arg(text, "MATANYONE_SHA", mat_sha)

    if args.dry_run:
        print("\n--- Dockerfile (preview) ---\n")
        print(text)
        return

    # Backup
    if not args.no_backup:
        copyfile(args.dockerfile, args.dockerfile + ".bak")

    # Write
    with open(args.dockerfile, "w", encoding="utf-8") as f:
        f.write(text)

    print(f"\n✅ Updated {args.dockerfile} with new pins.")
191
+
192
if __name__ == "__main__":
    # Surface any failure as a single stderr line and a non-zero exit code.
    try:
        main()
    except Exception as e:
        print(f"\n❌ Error: {e}", file=sys.stderr)
        sys.exit(1)
VideoBackgroundReplacer2/utils/__init__.py ADDED
File without changes
VideoBackgroundReplacer2/utils/paths.py ADDED
@@ -0,0 +1,29 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
# utils/paths.py
from pathlib import Path
import os, re, uuid, shutil

# APP_ROOT = repository root (one level above this utils/ package).
APP_ROOT = Path(__file__).resolve().parents[1]
DATA_ROOT = APP_ROOT / "data"
TMP_ROOT = APP_ROOT / "tmp"
# Ensure all writable locations exist at import time, before any consumer
# tries to use them.
for p in (DATA_ROOT, TMP_ROOT, APP_ROOT / ".hf", APP_ROOT / ".torch"):
    p.mkdir(parents=True, exist_ok=True)

# Point HF/torch caches inside the app tree unless the environment already
# chose locations.
os.environ.setdefault("HF_HOME", str(APP_ROOT / ".hf"))
os.environ.setdefault("TORCH_HOME", str(APP_ROOT / ".torch"))
13
+
14
def safe_name(name: str, default="file"):
    """Sanitize a filename: keep [A-Za-z0-9._-], collapse runs of anything
    else to '_', fall back to *default* when empty, cap at 120 chars."""
    candidate = name or default
    sanitized = re.sub(r"[^A-Za-z0-9._-]+", "_", candidate)
    if not sanitized:
        sanitized = default
    return sanitized[:120]
17
+
18
def job_dir(prefix="job"):
    """Create and return a uniquely named job directory under DATA_ROOT."""
    path = DATA_ROOT / f"{prefix}-{uuid.uuid4().hex[:8]}"
    path.mkdir(parents=True, exist_ok=True)
    return path
22
+
23
def disk_stats(p: Path = APP_ROOT) -> str:
    """Return a one-line human-readable summary of disk usage at *p* (in MB)."""
    try:
        usage = shutil.disk_usage(str(p))
    except Exception:
        return "disk(n/a)"
    total_mb, used_mb, free_mb = (x // (1024 * 1024) for x in usage)
    return f"disk(total={total_mb}MB, used={used_mb}MB, free={free_mb}MB)"
VideoBackgroundReplacer2/utils/perf_tuning.py ADDED
@@ -0,0 +1,21 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
# utils/perf_tuning.py
import os, logging
# cv2 is optional at runtime; fall back to None so apply() can skip it.
try:
    import cv2
except Exception:
    cv2 = None
import torch

def apply():
    """Apply best-effort performance defaults: CPU thread caps and cuDNN autotune."""
    # Respect an operator-provided value; only supply a default.
    os.environ.setdefault("OMP_NUM_THREADS", "4")
    if cv2:
        try:
            cv2.setNumThreads(4)
        except Exception as e:
            logging.info("cv2 threads not set: %s", e)
    if torch.cuda.is_available():
        # cuDNN autotunes kernels; pays off when input sizes are stable.
        torch.backends.cudnn.benchmark = True
        try:
            logging.info("CUDA device %s — cuDNN benchmark ON", torch.cuda.get_device_name(0))
        except Exception:
            logging.info("CUDA available — cuDNN benchmark ON")
app.py CHANGED
@@ -1,300 +1,570 @@
1
- #!/usr/bin/env python3
2
- """
3
- VideoBackgroundReplacer2 - SAM2 + MatAnyone Integration
4
- =======================================================
5
- - Sets up Gradio UI and launches pipeline
6
- - Aligned with torch/cu121 stack; runs on HF Spaces (Docker)
7
-
8
- Changes (2025-09-18):
9
- - Added precise web-stack probes (FastAPI/Starlette/Pydantic/etc. versions + file paths)
10
- - Added toggleable "mount mode": run Gradio inside our own FastAPI app
11
- and provide a safe /config route shim (uses demo.get_config_file()).
12
- - Kept your startup diagnostics, GPU logging, and heartbeats
13
- """
14
-
15
- print("=== APP STARTUP: Initializing VideoBackgroundReplacer2 ===")
16
-
17
- # ---------------------------------------------------------------------
18
- # Imports & basic setup
19
- # ---------------------------------------------------------------------
20
- import sys
21
  import os
22
- import gc
23
- import json
24
- import logging
25
- import threading
26
  import time
27
- import warnings
28
- import traceback
29
- import subprocess
30
  from pathlib import Path
31
- from loguru import logger
32
-
33
- # Logging (loguru to stderr)
34
- logger.remove()
35
- logger.add(
36
- sys.stderr,
37
- format="<green>{time:YYYY-MM-DD HH:mm:ss}</green> | <level>{level: <8}</level> "
38
- "| <cyan>{name}</cyan>:<cyan>{function}</cyan>:<cyan>{line}</cyan> - <level>{message}</level>"
 
 
 
 
 
 
 
 
 
 
 
 
39
  )
40
 
41
- # Warnings
42
- warnings.filterwarnings("ignore", category=UserWarning)
43
- warnings.filterwarnings("ignore", category=FutureWarning)
44
- warnings.filterwarnings("ignore", module="torchvision.io._video_deprecation_warning")
45
-
46
- # Environment (lightweight & safe in Spaces)
47
- os.environ.setdefault("OMP_NUM_THREADS", "1")
48
- os.environ.setdefault("TOKENIZERS_PARALLELISM", "false")
49
-
50
- # Paths
51
- BASE_DIR = Path(__file__).parent.absolute()
52
- THIRD_PARTY_DIR = BASE_DIR / "third_party"
53
- SAM2_DIR = THIRD_PARTY_DIR / "sam2"
54
- CHECKPOINTS_DIR = BASE_DIR / "checkpoints"
55
-
56
- # Python path extends
57
- for p in (str(THIRD_PARTY_DIR), str(SAM2_DIR)):
58
- if p not in sys.path:
59
- sys.path.insert(0, p)
60
-
61
- logger.info(f"Base directory: {BASE_DIR}")
62
- logger.info(f"Python path[0:5]: {sys.path[:5]}")
63
-
64
- # ---------------------------------------------------------------------
65
- # GPU / Torch diagnostics (non-blocking)
66
- # ---------------------------------------------------------------------
67
- try:
68
- import torch
69
- except Exception as e:
70
- logger.warning("Torch import failed at startup: %s", e)
71
- torch = None
72
-
73
- DEVICE = "cuda" if (torch and torch.cuda.is_available()) else "cpu"
74
- if DEVICE == "cuda":
75
- os.environ["SAM2_DEVICE"] = "cuda"
76
- os.environ["MATANY_DEVICE"] = "cuda"
77
- os.environ.setdefault("CUDA_LAUNCH_BLOCKING", "0")
78
- try:
79
- logger.info(f"CUDA available: {torch.cuda.get_device_name(0)}")
80
- except Exception:
81
- logger.info("CUDA device name not available at startup.")
82
- else:
83
- os.environ["SAM2_DEVICE"] = "cpu"
84
- os.environ["MATANY_DEVICE"] = "cpu"
85
- logger.warning("CUDA not available, falling back to CPU")
86
-
87
- def verify_models():
88
- """Verify critical model files exist and are loadable (cheap checks)."""
89
- results = {"status": "success", "details": {}}
90
- try:
91
- sam2_model_path = os.getenv("SAM2_MODEL_PATH", str(CHECKPOINTS_DIR / "sam2_hiera_large.pt"))
92
- if not os.path.exists(sam2_model_path):
93
- raise FileNotFoundError(f"SAM2 model not found at {sam2_model_path}")
94
- # Cheap load test (map to CPU to avoid VRAM use during boot)
95
- if torch:
96
- sd = torch.load(sam2_model_path, map_location="cpu")
97
- if not isinstance(sd, dict):
98
- raise ValueError("Invalid SAM2 checkpoint format")
99
- results["details"]["sam2"] = {
100
- "status": "success",
101
- "path": sam2_model_path,
102
- "size_mb": round(os.path.getsize(sam2_model_path) / (1024 * 1024), 2),
103
- }
104
- except Exception as e:
105
- results["status"] = "error"
106
- results["details"]["sam2"] = {
107
- "status": "error",
108
- "error": str(e),
109
- "traceback": traceback.format_exc(),
110
- }
111
- return results
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
112
 
113
- def run_startup_diagnostics():
114
- diag = {
115
- "system": {
116
- "python": sys.version,
117
- "pytorch": getattr(torch, "__version__", None) if torch else None,
118
- "cuda_available": bool(torch and torch.cuda.is_available()),
119
- "device_count": (torch.cuda.device_count() if torch and torch.cuda.is_available() else 0),
120
- "cuda_version": getattr(getattr(torch, "version", None), "cuda", None) if torch else None,
121
- },
122
- "paths": {
123
- "base_dir": str(BASE_DIR),
124
- "checkpoints_dir": str(CHECKPOINTS_DIR),
125
- "sam2_dir": str(SAM2_DIR),
126
- },
127
- "env_subset": {k: v for k, v in os.environ.items() if k in ("HOST", "PORT", "SPACE_ID", "SPACE_AUTHOR_NAME")},
128
  }
129
- diag["model_verification"] = verify_models()
130
- return diag
131
-
132
- startup_diag = run_startup_diagnostics()
133
- logger.info("Startup diagnostics completed")
134
-
135
- # Noisy heartbeat so logs show life during import time
136
- def _heartbeat():
137
- i = 0
138
- while True:
139
- i += 1
140
- print(f"[startup-heartbeat] {i*5}s…", flush=True)
141
- time.sleep(5)
142
-
143
- threading.Thread(target=_heartbeat, daemon=True).start()
144
-
145
- # Optional perf tuning import (non-fatal)
146
- try:
147
- import perf_tuning # noqa: F401
148
- logger.info("perf_tuning imported successfully.")
149
- except Exception as e:
150
- logger.info("perf_tuning not available: %s", e)
151
-
152
- # MatAnyone non-instantiating probe
153
- try:
154
- import inspect
155
- from matanyone.inference import inference_core as ic # type: ignore
156
- sigs = {}
157
- for name in ("InferenceCore",):
158
- obj = getattr(ic, name, None)
159
- if obj:
160
- sigs[name] = "callable" if callable(obj) else "present"
161
- logger.info(f"[MATANY] probe (non-instantiating): {sigs}")
162
- except Exception as e:
163
- logger.info(f"[MATANY] probe skipped: {e}")
164
-
165
- # ---------------------------------------------------------------------
166
- # Gradio import and web-stack probes
167
- # ---------------------------------------------------------------------
168
- import gradio as gr
169
-
170
- # Standard logger for some libs that use stdlib logging
171
- py_logger = logging.getLogger("backgroundfx_pro")
172
- if not py_logger.handlers:
173
- h = logging.StreamHandler()
174
- h.setFormatter(logging.Formatter("[%(asctime)s] %(levelname)s: %(message)s"))
175
- py_logger.addHandler(h)
176
- py_logger.setLevel(logging.INFO)
177
-
178
- def _log_web_stack_versions_and_paths():
179
- import inspect
180
- try:
181
- import fastapi, starlette, pydantic, httpx, anyio
182
- try:
183
- import pydantic_core
184
- pc_ver = pydantic_core.__version__
185
- except Exception:
186
- pc_ver = "unknown"
187
- logger.info(
188
- "[WEB-STACK] fastapi=%s | starlette=%s | pydantic=%s | pydantic-core=%s | httpx=%s | anyio=%s",
189
- getattr(fastapi, "__version__", "?"),
190
- getattr(starlette, "__version__", "?"),
191
- getattr(pydantic, "__version__", "?"),
192
- pc_ver,
193
- getattr(httpx, "__version__", "?"),
194
- getattr(anyio, "__version__", "?"),
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
195
  )
196
- except Exception as e:
197
- logger.warning("[WEB-STACK] version probe failed: %s", e)
198
-
199
- try:
200
- import gradio
201
- import gradio.routes as gr_routes
202
- import gradio.queueing as gr_queueing
203
- logger.info("[PATH] gradio.__file__ = %s", getattr(gradio, "__file__", "?"))
204
- logger.info("[PATH] gradio.routes = %s", inspect.getfile(gr_routes))
205
- logger.info("[PATH] gradio.queueing = %s", inspect.getfile(gr_queueing))
206
- import starlette.exceptions as st_exc
207
- logger.info("[PATH] starlette.exceptions= %s", inspect.getfile(st_exc))
208
- except Exception as e:
209
- logger.warning("[PATH] probe failed: %s", e)
210
-
211
- def _post_launch_diag():
212
- try:
213
- if not torch:
214
- return
215
- avail = torch.cuda.is_available()
216
- logger.info("CUDA available (post-launch): %s", avail)
217
- if avail:
218
- idx = torch.cuda.current_device()
219
- name = torch.cuda.get_device_name(idx)
220
- cap = torch.cuda.get_device_capability(idx)
221
- logger.info("CUDA device %d: %s (cc %d.%d)", idx, name, cap[0], cap[1])
222
- except Exception as e:
223
- logger.warning("Post-launch CUDA diag failed: %s", e)
224
-
225
- # ---------------------------------------------------------------------
226
- # UI factory (uses your existing builder)
227
- # ---------------------------------------------------------------------
228
- def build_ui() -> gr.Blocks:
229
- # FIX: import from ui_core_interface (not from ui)
230
- from ui_core_interface import create_interface
231
- return create_interface()
232
-
233
- # ---------------------------------------------------------------------
234
- # Optional: custom FastAPI mount mode
235
- # ---------------------------------------------------------------------
236
- def build_fastapi_with_gradio(demo: gr.Blocks):
237
  """
238
- Returns a FastAPI app with Gradio mounted at root.
239
- Also exposes JSON health and a config shim using demo.get_config_file().
240
  """
241
- from fastapi import FastAPI
242
- from fastapi.responses import JSONResponse
243
-
244
- app = FastAPI(title="VideoBackgroundReplacer2")
245
-
246
- @app.get("/healthz")
247
- def _healthz():
248
- return {"ok": True, "ts": time.time()}
249
-
250
- @app.get("/config")
251
- def _config():
252
- try:
253
- cfg = demo.get_config_file()
254
- return JSONResponse(content=cfg)
255
- except Exception as e:
256
- return JSONResponse(
257
- status_code=500,
258
- content={"error": "config_generation_failed", "detail": str(e)},
259
- )
260
-
261
- # Mount Gradio UI at root; our /config route remains at parent level
262
- app = gr.mount_gradio_app(app, demo, path="/")
263
- return app
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
264
 
265
- # ---------------------------------------------------------------------
266
- # Entrypoint
267
- # ---------------------------------------------------------------------
268
  if __name__ == "__main__":
269
- host = os.environ.get("HOST", "0.0.0.0")
270
- port = int(os.environ.get("PORT", "7860"))
271
- mount_mode = os.environ.get("GRADIO_MOUNT_MODE", "0") == "1"
272
-
273
- logger.info("Launching on %s:%s (mount_mode=%s)…", host, port, mount_mode)
274
- _log_web_stack_versions_and_paths()
275
-
276
- demo = build_ui()
277
- demo.queue(max_size=16, api_open=False)
278
-
279
- threading.Thread(target=_post_launch_diag, daemon=True).start()
280
-
281
- if mount_mode:
282
- try:
283
- from uvicorn import run as uvicorn_run
284
- except Exception:
285
- logger.error("uvicorn is not installed; mount mode cannot start.")
286
- raise
287
-
288
- app = build_fastapi_with_gradio(demo)
289
- uvicorn_run(app=app, host=host, port=port, log_level="info")
290
- else:
291
- demo.launch(
292
- server_name=host,
293
- server_port=port,
294
- share=False,
295
- show_api=False,
296
- show_error=True,
297
- quiet=False,
298
- debug=True,
299
- max_threads=1,
300
- )
 
1
# Streamlit front-end bootstrap: imports, project path, logging, page config.
import streamlit as st
import os
import sys
import tempfile
import time
from pathlib import Path
import cv2
import numpy as np
from PIL import Image
import logging
import base64
from io import BytesIO

# Add project root to path
sys.path.append(str(Path(__file__).parent.absolute()))

# Configure logging
logging.basicConfig(level=logging.INFO)
logger = logging.getLogger(__name__)

# Set page config
# NOTE(review): st.set_page_config must be the first Streamlit call in the
# script — keep it ahead of any other st.* usage.
st.set_page_config(
    page_title="MyAvatar - Video Background Replacer",
    page_icon="🎥",
    layout="wide",
    initial_sidebar_state="expanded"
)
28
 
29
+ # Custom CSS for better UI with logo
30
def add_logo():
    """Inject the app's custom CSS and render the MyAvatar logo top-right.

    The logo asset is optional: if ``myavatar_logo.png`` is absent the app
    keeps running without it (previously the bare ``open(...)`` raised
    FileNotFoundError at startup and also leaked the file handle).
    """
    st.markdown(
        """
        <style>
        .main .block-container {
            padding-top: 2rem;
            padding-bottom: 2rem;
        }
        .stButton>button {
            width: 100%;
            background-color: #4CAF50;
            color: white;
            font-weight: bold;
            transition: all 0.3s;
        }
        .stButton>button:hover {
            background-color: #45a049;
        }
        .stProgress > div > div > div > div {
            background-color: #4CAF50;
        }
        .stAlert {
            border-radius: 10px;
        }
        .stTabs [data-baseweb="tab-list"] {
            gap: 10px;
        }
        .stTabs [data-baseweb="tab"] {
            height: 50px;
            white-space: pre;
            background-color: #f0f2f6;
            border-radius: 4px 4px 0 0;
            padding: 10px 20px;
            margin-right: 5px;
        }
        .stTabs [aria-selected="true"] {
            background-color: #4CAF50;
            color: white;
        }
        .video-container {
            border: 2px dashed #4CAF50;
            border-radius: 10px;
            padding: 10px;
            margin-bottom: 20px;
        }
        .logo-container {
            display: flex;
            justify-content: flex-end;
            padding: 10px 20px 0 0;
        }
        .logo {
            height: 50px;
            width: auto;
            margin-bottom: -20px;
        }
        .title-container {
            text-align: center;
            margin-bottom: 30px;
        }
        .color-swatch {
            display: inline-block;
            width: 30px;
            height: 30px;
            margin: 5px;
            border: 2px solid #ddd;
            border-radius: 4px;
            cursor: pointer;
            transition: transform 0.2s;
        }
        .color-swatch:hover {
            transform: scale(1.1);
            border-color: #4CAF50;
        }
        .background-option {
            padding: 10px;
            margin: 5px 0;
            border-radius: 5px;
            background-color: #f8f9fa;
            border-left: 4px solid #4CAF50;
        }
        </style>
        """,
        unsafe_allow_html=True
    )

    # Add logo to the top right; skip silently (with a log line) if the
    # asset was not shipped with the Space instead of crashing the UI.
    logo_path = "myavatar_logo.png"
    if os.path.exists(logo_path):
        with open(logo_path, "rb") as f:
            encoded_logo = base64.b64encode(f.read()).decode()
        st.markdown(
            """
            <div class="logo-container">
                <img src="data:image/png;base64,{}" class="logo">
            </div>
            """.format(encoded_logo),
            unsafe_allow_html=True
        )
    else:
        logger.warning("Logo file %s not found; skipping logo render.", logo_path)
124
+
125
+ def initialize_session_state():
126
+ """Initialize all session state variables"""
127
+ if 'uploaded_video' not in st.session_state:
128
+ st.session_state.uploaded_video = None
129
+ if 'bg_image' not in st.session_state:
130
+ st.session_state.bg_image = None
131
+ if 'bg_color' not in st.session_state:
132
+ st.session_state.bg_color = "#00FF00"
133
+ if 'bg_type' not in st.session_state:
134
+ st.session_state.bg_type = "image"
135
+ if 'processed_video_path' not in st.session_state:
136
+ st.session_state.processed_video_path = None
137
+ if 'processing' not in st.session_state:
138
+ st.session_state.processing = False
139
+ if 'progress' not in st.session_state:
140
+ st.session_state.progress = 0
141
+ if 'progress_text' not in st.session_state:
142
+ st.session_state.progress_text = "Ready"
143
+
144
+ def handle_video_upload():
145
+ """Handle video file upload"""
146
+ uploaded = st.file_uploader(
147
+ "πŸ“Ή Upload Video",
148
+ type=["mp4", "mov", "avi"],
149
+ key="video_uploader"
150
+ )
151
+ if uploaded is not None:
152
+ st.session_state.uploaded_video = uploaded
153
+
154
+ def show_video_preview():
155
+ """Show video preview in the UI"""
156
+ st.markdown("### Video Preview")
157
+ if st.session_state.uploaded_video is not None:
158
+ video_bytes = st.session_state.uploaded_video.getvalue()
159
+ st.video(video_bytes)
160
+ st.session_state.uploaded_video.seek(0)
161
+
162
+ def handle_background_selection():
163
+ """Handle background selection UI with all options"""
164
+ st.markdown("### Background Options")
165
+
166
+ # Background type selection
167
+ bg_type = st.radio(
168
+ "Select Background Type:",
169
+ ["Image", "Color", "Blur", "Professional Backgrounds", "AI Generated"],
170
+ horizontal=True,
171
+ key="bg_type_radio"
172
+ )
173
+
174
+ st.session_state.bg_type = bg_type.lower()
175
+
176
+ # Show appropriate controls based on selection
177
+ if bg_type == "Image":
178
+ handle_image_background()
179
+ elif bg_type == "Color":
180
+ handle_color_background()
181
+ elif bg_type == "Blur":
182
+ handle_blur_background()
183
+ elif bg_type == "Professional Backgrounds":
184
+ handle_professional_backgrounds()
185
+ elif bg_type == "AI Generated":
186
+ handle_ai_generated_background()
187
+
188
+ def handle_image_background():
189
+ """Handle image background selection"""
190
+ bg_image = st.file_uploader(
191
+ "πŸ–ΌοΈ Upload Background Image",
192
+ type=["jpg", "png", "jpeg"],
193
+ key="bg_image_uploader"
194
+ )
195
+ if bg_image is not None:
196
+ st.session_state.bg_image = Image.open(bg_image)
197
+ st.image(
198
+ st.session_state.bg_image,
199
+ caption="Selected Background",
200
+ use_container_width=True
201
+ )
202
 
203
+ def handle_color_background():
204
+ """Handle color background selection with presets"""
205
+ st.markdown("#### Select a Color")
206
+
207
+ # Color presets
208
+ color_presets = {
209
+ "Pure White": "#FFFFFF",
210
+ "Pure Black": "#000000",
211
+ "Light Gray": "#F5F5F5",
212
+ "Dark Gray": "#333333",
213
+ "Professional Blue": "#0078D4",
214
+ "Corporate Green": "#107C10",
215
+ "Warm Beige": "#F5F5DC",
216
+ "Custom": st.session_state.get('bg_color', "#00FF00")
 
217
  }
218
+
219
+ # Create color swatches
220
+ cols = st.columns(4)
221
+ selected_color = None
222
+
223
+ for i, (name, color) in enumerate(color_presets.items()):
224
+ with cols[i % 4]:
225
+ if name == "Custom":
226
+ # Show color picker for custom color
227
+ st.session_state.bg_color = st.color_picker(
228
+ "Custom Color",
229
+ st.session_state.get('bg_color', "#00FF00"),
230
+ key="custom_color_picker"
231
+ )
232
+ else:
233
+ # Create a color swatch
234
+ if st.button(
235
+ "",
236
+ key=f"color_{name}",
237
+ help=name,
238
+ type="secondary",
239
+ use_container_width=True
240
+ ):
241
+ st.session_state.bg_color = color
242
+
243
+ # Show the color preview
244
+ st.markdown(
245
+ f'<div style="background-color:{color}; height:30px; border-radius:4px; margin-top:-10px;"></div>',
246
+ unsafe_allow_html=True
247
+ )
248
+ st.caption(name)
249
+
250
+ def handle_blur_background():
251
+ """Handle blur background selection"""
252
+ blur_strength = st.select_slider(
253
+ "Blur Strength:",
254
+ options=["Subtle", "Medium", "Strong", "Maximum"],
255
+ value="Medium",
256
+ key="blur_strength"
257
+ )
258
+
259
+ # Show preview of blur effect
260
+ st.markdown("**Preview**")
261
+ preview_img = np.zeros((100, 200, 3), dtype=np.uint8)
262
+ cv2.putText(
263
+ preview_img,
264
+ "Blur Effect",
265
+ (20, 50),
266
+ cv2.FONT_HERSHEY_SIMPLEX,
267
+ 0.8,
268
+ (255, 255, 255),
269
+ 2
270
+ )
271
+
272
+ # Apply blur based on selection
273
+ if blur_strength == "Subtle":
274
+ preview_img = cv2.GaussianBlur(preview_img, (15, 15), 5)
275
+ elif blur_strength == "Medium":
276
+ preview_img = cv2.GaussianBlur(preview_img, (25, 25), 10)
277
+ elif blur_strength == "Strong":
278
+ preview_img = cv2.GaussianBlur(preview_img, (35, 35), 15)
279
+ else: # Maximum
280
+ preview_img = cv2.GaussianBlur(preview_img, (51, 51), 20)
281
+
282
+ st.image(preview_img, use_container_width=True)
283
+ st.caption(f"Selected: {blur_strength} blur")
284
+
285
+ def handle_professional_backgrounds():
286
+ """Handle professional background selection"""
287
+ categories = {
288
+ "Office Settings": ["Modern Office", "Executive Office", "Home Office", "Conference Room"],
289
+ "Virtual Backgrounds": ["Professional", "Minimalist", "Creative", "Branded"],
290
+ "Nature Scenes": ["Forest", "Beach", "Mountain", "City Skyline"],
291
+ "Abstract Designs": ["Gradient", "Geometric", "Particles", "Bokeh"]
292
+ }
293
+
294
+ # Category selection
295
+ selected_category = st.selectbox(
296
+ "Select Category:",
297
+ list(categories.keys()),
298
+ key="bg_category"
299
+ )
300
+
301
+ # Show thumbnails for selected category
302
+ st.markdown("#### Available Backgrounds")
303
+ cols = st.columns(2)
304
+
305
+ for i, bg in enumerate(categories[selected_category]):
306
+ with cols[i % 2]:
307
+ # Create a placeholder image (replace with actual thumbnails)
308
+ img = np.zeros((120, 200, 3), dtype=np.uint8)
309
+ cv2.putText(
310
+ img,
311
+ bg,
312
+ (20, 60),
313
+ cv2.FONT_HERSHEY_SIMPLEX,
314
+ 0.7,
315
+ (255, 255, 255),
316
+ 2
317
+ )
318
+
319
+ if st.button(
320
+ f"Use {bg}",
321
+ key=f"prof_bg_{bg}",
322
+ use_container_width=True
323
+ ):
324
+ st.session_state.selected_bg = bg
325
+ st.success(f"Selected: {bg}")
326
+
327
+ st.image(img, use_container_width=True)
328
+
329
+ def handle_ai_generated_background():
330
+ """Handle AI generated background selection"""
331
+ ai_prompts = [
332
+ "Professional office with bookshelf",
333
+ "Modern co-working space",
334
+ "Neutral abstract background",
335
+ "City skyline at night",
336
+ "Minimalist home office setup",
337
+ "Corporate meeting room",
338
+ "Creative studio background",
339
+ "Custom prompt..."
340
+ ]
341
+
342
+ # Prompt selection
343
+ selected_prompt = st.selectbox(
344
+ "Select a prompt or create your own:",
345
+ ai_prompts,
346
+ key="ai_prompt_select"
347
+ )
348
+
349
+ if selected_prompt == "Custom prompt...":
350
+ custom_prompt = st.text_input(
351
+ "Enter your custom prompt:",
352
+ key="custom_ai_prompt"
353
  )
354
+ if custom_prompt:
355
+ selected_prompt = custom_prompt
356
+
357
+ # Generate button
358
+ if st.button(
359
+ "🎨 Generate Background",
360
+ key="generate_ai_bg",
361
+ use_container_width=True
362
+ ):
363
+ with st.spinner(f"Generating '{selected_prompt}'..."):
364
+ # Simulate generation
365
+ time.sleep(2)
366
+
367
+ # Create a placeholder for the generated image
368
+ img = np.zeros((300, 500, 3), dtype=np.uint8)
369
+ cv2.putText(
370
+ img,
371
+ f"AI Generated:\n{selected_prompt}",
372
+ (50, 150),
373
+ cv2.FONT_HERSHEY_SIMPLEX,
374
+ 0.8,
375
+ (255, 255, 255),
376
+ 2,
377
+ cv2.LINE_AA
378
+ )
379
+
380
+ # Show the "generated" image
381
+ st.image(img, use_container_width=True)
382
+
383
+ # Add use button
384
+ if st.button(
385
+ "Use This Background",
386
+ key="use_ai_bg",
387
+ use_container_width=True
388
+ ):
389
+ st.session_state.bg_image = Image.fromarray(img)
390
+ st.success("Background selected!")
391
+
392
def process_video(input_file, background, bg_type="image"):
    """
    Mock video processing that works without SAM2/MatAnyone.

    Applies a simple colored-border effect to every frame to simulate
    background replacement.

    Args:
        input_file: Uploaded file object (must support ``.getvalue()``).
        background: Selected background (unused by this mock effect).
        bg_type: ``"color"`` uses ``st.session_state.bg_color`` for the
            border; any other value uses a green border.

    Returns:
        Path to the processed video file, or ``None`` on failure.

    Bug fixes vs. previous version:
        * ``cv2.VideoWriter_fourcentCC`` was a typo (AttributeError);
          the OpenCV function is ``cv2.VideoWriter_fourcc``.
        * The output file used to live inside the ``TemporaryDirectory``
          and was deleted the moment this function returned, so the
          caller's ``os.path.exists(output_path)`` always failed. The
          output now goes to a temp file that outlives this call.
    """
    try:
        # Persistent output location -- must survive after this function
        # returns so the caller can display/download it.
        out_fd, output_path = tempfile.mkstemp(suffix=".mp4")
        os.close(out_fd)

        # Create a temporary directory for intermediate files only.
        with tempfile.TemporaryDirectory() as temp_dir:
            temp_dir = Path(temp_dir)

            # Save the uploaded video to a temporary file
            input_path = str(temp_dir / "input.mp4")
            with open(input_path, "wb") as f:
                f.write(input_file.getvalue())

            # Set up progress bar
            progress_bar = st.progress(0)
            status_text = st.empty()

            def update_progress(progress, message):
                progress = max(0, min(1, progress))
                progress_bar.progress(progress)
                status_text.text(f"Status: {message}")

            # Simulate processing steps
            update_progress(0.1, "Loading video...")
            time.sleep(1)

            update_progress(0.3, "Processing frames...")
            time.sleep(2)

            # Create a simple output video that just adds a colored border
            cap = cv2.VideoCapture(input_path)
            fps = int(cap.get(cv2.CAP_PROP_FPS)) or 30  # guard: some files report 0 fps
            width = int(cap.get(cv2.CAP_PROP_FRAME_WIDTH))
            height = int(cap.get(cv2.CAP_PROP_FRAME_HEIGHT))

            fourcc = cv2.VideoWriter_fourcc(*'mp4v')
            out = cv2.VideoWriter(output_path, fourcc, fps, (width, height))

            frame_count = int(cap.get(cv2.CAP_PROP_FRAME_COUNT))

            # Border colour is loop-invariant: compute it once.
            if bg_type == "color":
                color_hex = st.session_state.bg_color.lstrip('#')
                # RRGGBB hex -> BGR tuple for OpenCV
                color_bgr = tuple(int(color_hex[i:i + 2], 16) for i in (4, 2, 0))
            else:
                color_bgr = (0, 255, 0)  # Default green border

            border_size = 20
            for i in range(frame_count):
                ret, frame = cap.read()
                if not ret:
                    break

                # Simple effect: add a colored border to simulate processing
                frame = cv2.copyMakeBorder(
                    frame,
                    border_size, border_size, border_size, border_size,
                    cv2.BORDER_CONSTANT,
                    value=color_bgr
                )

                # Resize back to original dimensions
                frame = cv2.resize(frame, (width, height))

                out.write(frame)

                # Update progress
                if i % 10 == 0:
                    update_progress(0.3 + 0.7 * (i / frame_count), f"Processing frame {i}/{frame_count}")

            cap.release()
            out.release()

            update_progress(1.0, "Processing complete!")
            time.sleep(0.5)

        return output_path

    except Exception as e:
        logger.error(f"Error in mock video processing: {str(e)}", exc_info=True)
        st.error(f"An error occurred during processing: {str(e)}")
        return None
476
+
477
+ def main():
478
+ # Add custom CSS and logo
479
+ add_logo()
480
+
481
+ # Title
482
+ st.markdown(
483
+ """
484
+ <div class="title-container">
485
+ <h1>πŸŽ₯ Video Background Replacer</h1>
486
+ </div>
487
+ """,
488
+ unsafe_allow_html=True
489
+ )
490
+
491
+ st.markdown("---")
492
+
493
+ # Initialize session state
494
+ initialize_session_state()
495
+
496
+ # Main layout
497
+ col1, col2 = st.columns([1, 1], gap="large")
498
+
499
+ with col1:
500
+ st.header("1. Upload Video")
501
+ handle_video_upload()
502
+ show_video_preview()
503
+
504
+ with col2:
505
+ st.header("2. Background Settings")
506
+ handle_background_selection()
507
+
508
+ st.header("3. Process & Download")
509
+ if st.button(
510
+ "πŸš€ Process Video",
511
+ type="primary",
512
+ disabled=not st.session_state.uploaded_video or st.session_state.processing,
513
+ use_container_width=True
514
+ ):
515
+ with st.spinner("Processing video (this may take a few minutes)..."):
516
+ st.session_state.processing = True
517
+
518
+ try:
519
+ # Prepare background based on type
520
+ background = None
521
+ if st.session_state.bg_type == "image" and 'bg_image' in st.session_state and st.session_state.bg_image is not None:
522
+ background = st.session_state.bg_image
523
+ elif st.session_state.bg_type == "color" and 'bg_color' in st.session_state:
524
+ background = st.session_state.bg_color
525
+
526
+ # Process the video
527
+ output_path = process_video(
528
+ st.session_state.uploaded_video,
529
+ background,
530
+ bg_type=st.session_state.bg_type
531
+ )
532
+
533
+ if output_path and os.path.exists(output_path):
534
+ # Store the path to the processed video
535
+ st.session_state.processed_video_path = output_path
536
+ st.success("βœ… Video processing complete!")
537
+ else:
538
+ st.error("❌ Failed to process video. Please check the logs for details.")
539
+
540
+ except Exception as e:
541
+ st.error(f"❌ An error occurred: {str(e)}")
542
+ logger.exception("Video processing failed")
543
+
544
+ finally:
545
+ st.session_state.processing = False
546
+
547
+ # Show processed video if available
548
+ if 'processed_video_path' in st.session_state and st.session_state.processed_video_path:
549
+ st.markdown("### Processed Video")
550
+
551
+ try:
552
+ # Display the video directly from the file
553
+ with open(st.session_state.processed_video_path, 'rb') as f:
554
+ video_bytes = f.read()
555
+ st.video(video_bytes)
556
+
557
+ # Download button
558
+ st.download_button(
559
+ label="πŸ’Ύ Download Processed Video",
560
+ data=video_bytes,
561
+ file_name="processed_video.mp4",
562
+ mime="video/mp4",
563
+ use_container_width=True
564
+ )
565
+ except Exception as e:
566
+ st.error(f"Error displaying video: {str(e)}")
567
+ logger.error(f"Error displaying video: {str(e)}", exc_info=True)
568
 
 
 
 
569
  if __name__ == "__main__":
570
+ main()
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
app_backup.py ADDED
@@ -0,0 +1,300 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ #!/usr/bin/env python3
2
+ """
3
+ VideoBackgroundReplacer2 - SAM2 + MatAnyone Integration
4
+ =======================================================
5
+ - Sets up Gradio UI and launches pipeline
6
+ - Aligned with torch/cu121 stack; runs on HF Spaces (Docker)
7
+
8
+ Changes (2025-09-18):
9
+ - Added precise web-stack probes (FastAPI/Starlette/Pydantic/etc. versions + file paths)
10
+ - Added toggleable "mount mode": run Gradio inside our own FastAPI app
11
+ and provide a safe /config route shim (uses demo.get_config_file()).
12
+ - Kept your startup diagnostics, GPU logging, and heartbeats
13
+ """
14
+
15
+ print("=== APP STARTUP: Initializing VideoBackgroundReplacer2 ===")
16
+
17
+ # ---------------------------------------------------------------------
18
+ # Imports & basic setup
19
+ # ---------------------------------------------------------------------
20
+ import sys
21
+ import os
22
+ import gc
23
+ import json
24
+ import logging
25
+ import threading
26
+ import time
27
+ import warnings
28
+ import traceback
29
+ import subprocess
30
+ from pathlib import Path
31
+ from loguru import logger
32
+
33
+ # Logging (loguru to stderr)
34
+ logger.remove()
35
+ logger.add(
36
+ sys.stderr,
37
+ format="<green>{time:YYYY-MM-DD HH:mm:ss}</green> | <level>{level: <8}</level> "
38
+ "| <cyan>{name}</cyan>:<cyan>{function}</cyan>:<cyan>{line}</cyan> - <level>{message}</level>"
39
+ )
40
+
41
+ # Warnings
42
+ warnings.filterwarnings("ignore", category=UserWarning)
43
+ warnings.filterwarnings("ignore", category=FutureWarning)
44
+ warnings.filterwarnings("ignore", module="torchvision.io._video_deprecation_warning")
45
+
46
+ # Environment (lightweight & safe in Spaces)
47
+ os.environ.setdefault("OMP_NUM_THREADS", "1")
48
+ os.environ.setdefault("TOKENIZERS_PARALLELISM", "false")
49
+
50
+ # Paths
51
+ BASE_DIR = Path(__file__).parent.absolute()
52
+ THIRD_PARTY_DIR = BASE_DIR / "third_party"
53
+ SAM2_DIR = THIRD_PARTY_DIR / "sam2"
54
+ CHECKPOINTS_DIR = BASE_DIR / "checkpoints"
55
+
56
+ # Python path extends
57
+ for p in (str(THIRD_PARTY_DIR), str(SAM2_DIR)):
58
+ if p not in sys.path:
59
+ sys.path.insert(0, p)
60
+
61
+ logger.info(f"Base directory: {BASE_DIR}")
62
+ logger.info(f"Python path[0:5]: {sys.path[:5]}")
63
+
64
+ # ---------------------------------------------------------------------
65
+ # GPU / Torch diagnostics (non-blocking)
66
+ # ---------------------------------------------------------------------
67
+ try:
68
+ import torch
69
+ except Exception as e:
70
+ logger.warning("Torch import failed at startup: %s", e)
71
+ torch = None
72
+
73
+ DEVICE = "cuda" if (torch and torch.cuda.is_available()) else "cpu"
74
+ if DEVICE == "cuda":
75
+ os.environ["SAM2_DEVICE"] = "cuda"
76
+ os.environ["MATANY_DEVICE"] = "cuda"
77
+ os.environ.setdefault("CUDA_LAUNCH_BLOCKING", "0")
78
+ try:
79
+ logger.info(f"CUDA available: {torch.cuda.get_device_name(0)}")
80
+ except Exception:
81
+ logger.info("CUDA device name not available at startup.")
82
+ else:
83
+ os.environ["SAM2_DEVICE"] = "cpu"
84
+ os.environ["MATANY_DEVICE"] = "cpu"
85
+ logger.warning("CUDA not available, falling back to CPU")
86
+
87
+ def verify_models():
88
+ """Verify critical model files exist and are loadable (cheap checks)."""
89
+ results = {"status": "success", "details": {}}
90
+ try:
91
+ sam2_model_path = os.getenv("SAM2_MODEL_PATH", str(CHECKPOINTS_DIR / "sam2_hiera_large.pt"))
92
+ if not os.path.exists(sam2_model_path):
93
+ raise FileNotFoundError(f"SAM2 model not found at {sam2_model_path}")
94
+ # Cheap load test (map to CPU to avoid VRAM use during boot)
95
+ if torch:
96
+ sd = torch.load(sam2_model_path, map_location="cpu")
97
+ if not isinstance(sd, dict):
98
+ raise ValueError("Invalid SAM2 checkpoint format")
99
+ results["details"]["sam2"] = {
100
+ "status": "success",
101
+ "path": sam2_model_path,
102
+ "size_mb": round(os.path.getsize(sam2_model_path) / (1024 * 1024), 2),
103
+ }
104
+ except Exception as e:
105
+ results["status"] = "error"
106
+ results["details"]["sam2"] = {
107
+ "status": "error",
108
+ "error": str(e),
109
+ "traceback": traceback.format_exc(),
110
+ }
111
+ return results
112
+
113
+ def run_startup_diagnostics():
114
+ diag = {
115
+ "system": {
116
+ "python": sys.version,
117
+ "pytorch": getattr(torch, "__version__", None) if torch else None,
118
+ "cuda_available": bool(torch and torch.cuda.is_available()),
119
+ "device_count": (torch.cuda.device_count() if torch and torch.cuda.is_available() else 0),
120
+ "cuda_version": getattr(getattr(torch, "version", None), "cuda", None) if torch else None,
121
+ },
122
+ "paths": {
123
+ "base_dir": str(BASE_DIR),
124
+ "checkpoints_dir": str(CHECKPOINTS_DIR),
125
+ "sam2_dir": str(SAM2_DIR),
126
+ },
127
+ "env_subset": {k: v for k, v in os.environ.items() if k in ("HOST", "PORT", "SPACE_ID", "SPACE_AUTHOR_NAME")},
128
+ }
129
+ diag["model_verification"] = verify_models()
130
+ return diag
131
+
132
+ startup_diag = run_startup_diagnostics()
133
+ logger.info("Startup diagnostics completed")
134
+
135
+ # Noisy heartbeat so logs show life during import time
136
+ def _heartbeat():
137
+ i = 0
138
+ while True:
139
+ i += 1
140
+ print(f"[startup-heartbeat] {i*5}s…", flush=True)
141
+ time.sleep(5)
142
+
143
+ threading.Thread(target=_heartbeat, daemon=True).start()
144
+
145
+ # Optional perf tuning import (non-fatal)
146
+ try:
147
+ import perf_tuning # noqa: F401
148
+ logger.info("perf_tuning imported successfully.")
149
+ except Exception as e:
150
+ logger.info("perf_tuning not available: %s", e)
151
+
152
+ # MatAnyone non-instantiating probe
153
+ try:
154
+ import inspect
155
+ from matanyone.inference import inference_core as ic # type: ignore
156
+ sigs = {}
157
+ for name in ("InferenceCore",):
158
+ obj = getattr(ic, name, None)
159
+ if obj:
160
+ sigs[name] = "callable" if callable(obj) else "present"
161
+ logger.info(f"[MATANY] probe (non-instantiating): {sigs}")
162
+ except Exception as e:
163
+ logger.info(f"[MATANY] probe skipped: {e}")
164
+
165
+ # ---------------------------------------------------------------------
166
+ # Gradio import and web-stack probes
167
+ # ---------------------------------------------------------------------
168
+ import gradio as gr
169
+
170
+ # Standard logger for some libs that use stdlib logging
171
+ py_logger = logging.getLogger("backgroundfx_pro")
172
+ if not py_logger.handlers:
173
+ h = logging.StreamHandler()
174
+ h.setFormatter(logging.Formatter("[%(asctime)s] %(levelname)s: %(message)s"))
175
+ py_logger.addHandler(h)
176
+ py_logger.setLevel(logging.INFO)
177
+
178
+ def _log_web_stack_versions_and_paths():
179
+ import inspect
180
+ try:
181
+ import fastapi, starlette, pydantic, httpx, anyio
182
+ try:
183
+ import pydantic_core
184
+ pc_ver = pydantic_core.__version__
185
+ except Exception:
186
+ pc_ver = "unknown"
187
+ logger.info(
188
+ "[WEB-STACK] fastapi=%s | starlette=%s | pydantic=%s | pydantic-core=%s | httpx=%s | anyio=%s",
189
+ getattr(fastapi, "__version__", "?"),
190
+ getattr(starlette, "__version__", "?"),
191
+ getattr(pydantic, "__version__", "?"),
192
+ pc_ver,
193
+ getattr(httpx, "__version__", "?"),
194
+ getattr(anyio, "__version__", "?"),
195
+ )
196
+ except Exception as e:
197
+ logger.warning("[WEB-STACK] version probe failed: %s", e)
198
+
199
+ try:
200
+ import gradio
201
+ import gradio.routes as gr_routes
202
+ import gradio.queueing as gr_queueing
203
+ logger.info("[PATH] gradio.__file__ = %s", getattr(gradio, "__file__", "?"))
204
+ logger.info("[PATH] gradio.routes = %s", inspect.getfile(gr_routes))
205
+ logger.info("[PATH] gradio.queueing = %s", inspect.getfile(gr_queueing))
206
+ import starlette.exceptions as st_exc
207
+ logger.info("[PATH] starlette.exceptions= %s", inspect.getfile(st_exc))
208
+ except Exception as e:
209
+ logger.warning("[PATH] probe failed: %s", e)
210
+
211
+ def _post_launch_diag():
212
+ try:
213
+ if not torch:
214
+ return
215
+ avail = torch.cuda.is_available()
216
+ logger.info("CUDA available (post-launch): %s", avail)
217
+ if avail:
218
+ idx = torch.cuda.current_device()
219
+ name = torch.cuda.get_device_name(idx)
220
+ cap = torch.cuda.get_device_capability(idx)
221
+ logger.info("CUDA device %d: %s (cc %d.%d)", idx, name, cap[0], cap[1])
222
+ except Exception as e:
223
+ logger.warning("Post-launch CUDA diag failed: %s", e)
224
+
225
+ # ---------------------------------------------------------------------
226
+ # UI factory (uses your existing builder)
227
+ # ---------------------------------------------------------------------
228
+ def build_ui() -> gr.Blocks:
229
+ # FIX: import from ui_core_interface (not from ui)
230
+ from ui_core_interface import create_interface
231
+ return create_interface()
232
+
233
+ # ---------------------------------------------------------------------
234
+ # Optional: custom FastAPI mount mode
235
+ # ---------------------------------------------------------------------
236
+ def build_fastapi_with_gradio(demo: gr.Blocks):
237
+ """
238
+ Returns a FastAPI app with Gradio mounted at root.
239
+ Also exposes JSON health and a config shim using demo.get_config_file().
240
+ """
241
+ from fastapi import FastAPI
242
+ from fastapi.responses import JSONResponse
243
+
244
+ app = FastAPI(title="VideoBackgroundReplacer2")
245
+
246
+ @app.get("/healthz")
247
+ def _healthz():
248
+ return {"ok": True, "ts": time.time()}
249
+
250
+ @app.get("/config")
251
+ def _config():
252
+ try:
253
+ cfg = demo.get_config_file()
254
+ return JSONResponse(content=cfg)
255
+ except Exception as e:
256
+ return JSONResponse(
257
+ status_code=500,
258
+ content={"error": "config_generation_failed", "detail": str(e)},
259
+ )
260
+
261
+ # Mount Gradio UI at root; our /config route remains at parent level
262
+ app = gr.mount_gradio_app(app, demo, path="/")
263
+ return app
264
+
265
+ # ---------------------------------------------------------------------
266
+ # Entrypoint
267
+ # ---------------------------------------------------------------------
268
+ if __name__ == "__main__":
269
+ host = os.environ.get("HOST", "0.0.0.0")
270
+ port = int(os.environ.get("PORT", "7860"))
271
+ mount_mode = os.environ.get("GRADIO_MOUNT_MODE", "0") == "1"
272
+
273
+ logger.info("Launching on %s:%s (mount_mode=%s)…", host, port, mount_mode)
274
+ _log_web_stack_versions_and_paths()
275
+
276
+ demo = build_ui()
277
+ demo.queue(max_size=16, api_open=False)
278
+
279
+ threading.Thread(target=_post_launch_diag, daemon=True).start()
280
+
281
+ if mount_mode:
282
+ try:
283
+ from uvicorn import run as uvicorn_run
284
+ except Exception:
285
+ logger.error("uvicorn is not installed; mount mode cannot start.")
286
+ raise
287
+
288
+ app = build_fastapi_with_gradio(demo)
289
+ uvicorn_run(app=app, host=host, port=port, log_level="info")
290
+ else:
291
+ demo.launch(
292
+ server_name=host,
293
+ server_port=port,
294
+ share=False,
295
+ show_api=False,
296
+ show_error=True,
297
+ quiet=False,
298
+ debug=True,
299
+ max_threads=1,
300
+ )
pipeline_utils.py ADDED
@@ -0,0 +1,191 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ import os
2
+ import cv2
3
+ import numpy as np
4
+ import tempfile
5
+ from pathlib import Path
6
+ from typing import Optional, Union, Callable
7
+ import logging
8
+ from PIL import Image
9
+
10
+ # Configure logging
11
+ logging.basicConfig(level=logging.INFO)
12
+ logger = logging.getLogger(__name__)
13
+
14
+ class VideoProcessor:
15
+ def __init__(self, temp_dir: Optional[str] = None):
16
+ """
17
+ Initialize the video processor.
18
+
19
+ Args:
20
+ temp_dir: Directory for temporary files. If None, creates a temp directory.
21
+ """
22
+ self.temp_dir = Path(temp_dir) if temp_dir else Path(tempfile.mkdtemp(prefix="bg_replace_"))
23
+ self.temp_dir.mkdir(parents=True, exist_ok=True)
24
+ self.device = self._get_device()
25
+ logger.info(f"Initialized VideoProcessor with device: {self.device}")
26
+
27
+ def _get_device(self) -> str:
28
+ """Check if CUDA is available."""
29
+ try:
30
+ import torch
31
+ return "cuda" if torch.cuda.is_available() else "cpu"
32
+ except ImportError:
33
+ return "cpu"
34
+
35
+ def _create_static_bg_video(
36
+ self,
37
+ bg_image: np.ndarray,
38
+ reference_video: str,
39
+ output_path: str
40
+ ) -> str:
41
+ """
42
+ Create a static background video matching the input video's duration.
43
+ """
44
+ cap = cv2.VideoCapture(reference_video)
45
+ width = int(cap.get(cv2.CAP_PROP_FRAME_WIDTH))
46
+ height = int(cap.get(cv2.CAP_PROP_FRAME_HEIGHT))
47
+ fps = cap.get(cv2.CAP_PROP_FPS)
48
+ total_frames = int(cap.get(cv2.CAP_PROP_FRAME_COUNT))
49
+ cap.release()
50
+
51
+ # Resize background image
52
+ bg_image = cv2.resize(bg_image, (width, height))
53
+
54
+ # Write video
55
+ fourcc = cv2.VideoWriter_fourcc(*'mp4v')
56
+ out = cv2.VideoWriter(output_path, fourcc, fps, (width, height))
57
+
58
+ for _ in range(total_frames):
59
+ out.write(bg_image)
60
+
61
+ out.release()
62
+ return output_path
63
+
64
+ def _process_with_pipeline(
65
+ self,
66
+ input_video: str,
67
+ background: Optional[Union[str, np.ndarray]] = None,
68
+ bg_type: str = "blur",
69
+ progress_callback: Optional[Callable] = None
70
+ ) -> str:
71
+ """
72
+ Process video using the two-stage pipeline.
73
+ """
74
+ try:
75
+ # Import the pipeline
76
+ from integrated_pipeline import TwoStageProcessor
77
+
78
+ # Update progress
79
+ if progress_callback:
80
+ progress_callback(0.1, "Initializing pipeline...")
81
+
82
+ # Handle background
83
+ bg_video_path = ""
84
+ if bg_type == "image" and background is not None:
85
+ if isinstance(background, str):
86
+ bg_image = cv2.imread(background)
87
+ else:
88
+ bg_image = background
89
+
90
+ bg_video_path = str(self.temp_dir / "background.mp4")
91
+ self._create_static_bg_video(bg_image, input_video, bg_video_path)
92
+
93
+ # Initialize processor
94
+ processor = TwoStageProcessor(temp_dir=str(self.temp_dir))
95
+
96
+ # Process video
97
+ output_path = str(self.temp_dir / "output.mp4")
98
+
99
+ # Mock click points (center of frame)
100
+ click_points = [[0.5, 0.5]]
101
+
102
+ # Process
103
+ success = processor.process_video(
104
+ input_video=input_video,
105
+ background_video=bg_video_path if bg_type == "image" else "",
106
+ click_points=click_points,
107
+ output_path=output_path,
108
+ use_matanyone=True,
109
+ progress_callback=progress_callback
110
+ )
111
+
112
+ if not success:
113
+ raise RuntimeError("Video processing failed")
114
+
115
+ return output_path
116
+
117
+ except Exception as e:
118
+ logger.error(f"Error in pipeline: {str(e)}")
119
+ raise
120
+
121
+ def process_video(
122
+ self,
123
+ input_path: Union[str, bytes],
124
+ background: Optional[Union[str, np.ndarray]] = None,
125
+ bg_type: str = "blur",
126
+ progress_callback: Optional[Callable] = None
127
+ ) -> bytes:
128
+ """
129
+ Process a video with the given background.
130
+
131
+ Args:
132
+ input_path: Path to input video or bytes
133
+ background: Background image path or numpy array
134
+ bg_type: Type of background ("image", "color", or "blur")
135
+ progress_callback: Optional callback for progress updates
136
+
137
+ Returns:
138
+ Processed video as bytes
139
+ """
140
+ try:
141
+ # Save input to temp file if it's bytes
142
+ if isinstance(input_path, bytes):
143
+ input_video = str(self.temp_dir / "input.mp4")
144
+ with open(input_video, "wb") as f:
145
+ f.write(input_path)
146
+ else:
147
+ input_video = input_path
148
+
149
+ # Process the video
150
+ output_path = self._process_with_pipeline(
151
+ input_video,
152
+ background,
153
+ bg_type,
154
+ progress_callback
155
+ )
156
+
157
+ # Read the output file
158
+ with open(output_path, "rb") as f:
159
+ return f.read()
160
+
161
+ except Exception as e:
162
+ logger.error(f"Error processing video: {str(e)}")
163
+ raise
164
+
165
+ # Global instance
166
+ video_processor = VideoProcessor()
167
+
168
+ def process_video_pipeline(
169
+ input_data: Union[str, bytes],
170
+ background: Optional[Union[str, np.ndarray]] = None,
171
+ bg_type: str = "blur",
172
+ progress_callback: Optional[Callable] = None
173
+ ) -> bytes:
174
+ """
175
+ High-level function to process a video.
176
+
177
+ Args:
178
+ input_data: Input video path or bytes
179
+ background: Background image path or numpy array
180
+ bg_type: Type of background ("image", "color", or "blur")
181
+ progress_callback: Optional progress callback
182
+
183
+ Returns:
184
+ Processed video as bytes
185
+ """
186
+ return video_processor.process_video(
187
+ input_data,
188
+ background,
189
+ bg_type,
190
+ progress_callback
191
+ )
requirements.txt CHANGED
@@ -35,22 +35,21 @@ iopath>=0.1.10,<0.2.0
35
  kornia>=0.7.0,<0.8.0
36
  tqdm>=4.60.0,<5.0.0
37
 
38
- # ===== UI and API =====
39
- # Bump to avoid gradio_client 1.3.0 bug ("bool is not iterable")
40
- gradio==4.42.0
41
 
42
- # ===== Web stack pins for Gradio 4.42.0 =====
43
- fastapi==0.109.2
44
- starlette==0.36.3
45
- uvicorn==0.29.0
46
- httpx==0.27.2
47
- anyio==4.4.0
48
  orjson>=3.10.0
49
 
50
  # ===== Pydantic family (avoid breaking core 2.23.x) =====
51
  pydantic==2.8.2
52
  pydantic-core==2.20.1
53
- annotated-types==0.6.0
54
  typing-extensions==4.12.2
55
 
56
  # ===== Helpers and Utilities =====
@@ -69,4 +68,4 @@ nvidia-ml-py3>=7.352.0,<12.0.0
69
  loguru>=0.6.0,<1.0.0
70
 
71
  # File handling
72
- python-multipart>=0.0.5,<1.0.0
 
35
  kornia>=0.7.0,<0.8.0
36
  tqdm>=4.60.0,<5.0.0
37
 
38
+ # ===== Streamlit UI =====
39
+ streamlit>=1.32.0
40
+ streamlit-webrtc>=0.50.0 # For real-time video processing
41
 
42
+ # ===== Web stack =====
43
+ fastapi>=0.104.0
44
+ uvicorn>=0.24.0
45
+ httpx>=0.25.0
46
+ anyio>=4.0.0
 
47
  orjson>=3.10.0
48
 
49
  # ===== Pydantic family (avoid breaking core 2.23.x) =====
50
  pydantic==2.8.2
51
  pydantic-core==2.20.1
52
+ annotated-types==0.6.0
53
  typing-extensions==4.12.2
54
 
55
  # ===== Helpers and Utilities =====
 
68
  loguru>=0.6.0,<1.0.0
69
 
70
  # File handling
71
+ python-multipart>=0.0.5,<1.0.0
streamlit_app.py ADDED
@@ -0,0 +1,301 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
# streamlit_app.py — Streamlit UI for the video background replacer.
import streamlit as st
import os
import sys
import tempfile
import time
from pathlib import Path
import cv2
import numpy as np
from PIL import Image
import logging
import io

# Add project root to path so sibling modules (e.g. integrated_pipeline)
# resolve regardless of the working directory Streamlit launches from.
sys.path.append(str(Path(__file__).parent.absolute()))

# Configure module-level logging.
logging.basicConfig(level=logging.INFO)
logger = logging.getLogger(__name__)

# Set page config — must be the first Streamlit call in the script.
st.set_page_config(
    page_title="🎬 Advanced Video Background Replacer",
    page_icon="🎥",
    layout="wide",
    initial_sidebar_state="expanded"
)

# Custom CSS for better UI: green primary buttons/progress bar,
# pill-style tabs, and a dashed border around video previews.
st.markdown("""
<style>
    .main .block-container {
        padding-top: 2rem;
        padding-bottom: 2rem;
    }
    .stButton>button {
        width: 100%;
        background-color: #4CAF50;
        color: white;
        font-weight: bold;
        transition: all 0.3s;
    }
    .stButton>button:hover {
        background-color: #45a049;
    }
    .stProgress > div > div > div > div {
        background-color: #4CAF50;
    }
    .stAlert {
        border-radius: 10px;
    }
    .stTabs [data-baseweb="tab-list"] {
        gap: 10px;
    }
    .stTabs [data-baseweb="tab"] {
        height: 50px;
        white-space: pre;
        background-color: #f0f2f6;
        border-radius: 4px 4px 0 0;
        padding: 10px 20px;
        margin-right: 5px;
    }
    .stTabs [aria-selected="true"] {
        background-color: #4CAF50;
        color: white;
    }
    .video-container {
        border: 2px dashed #4CAF50;
        border-radius: 10px;
        padding: 10px;
        margin-bottom: 20px;
    }
</style>
""", unsafe_allow_html=True)
76
def initialize_session_state():
    """Seed every session-state key the app reads with a safe default.

    Only missing keys are written, so values survive Streamlit reruns.
    """
    defaults = {
        'uploaded_video': None,
        'bg_image': None,
        'bg_color': "#00FF00",
        'processed_video_path': None,
        'processing': False,
        'progress': 0,
        'progress_text': "Ready",
    }
    for key, value in defaults.items():
        if key not in st.session_state:
            st.session_state[key] = value
92
+
93
def handle_video_upload():
    """Render the video uploader widget and stash the file in session state."""
    uploaded_file = st.file_uploader(
        "📹 Upload Video",
        type=["mp4", "mov", "avi"],
        key="video_uploader"
    )
    if uploaded_file is None:
        return
    st.session_state.uploaded_video = uploaded_file
102
+
103
def show_video_preview():
    """Render a preview of the currently uploaded video, if any."""
    st.markdown("### Video Preview")
    video = st.session_state.uploaded_video
    if video is None:
        return
    st.video(video.getvalue())
    # Rewind so the later processing pass reads from the start again.
    video.seek(0)
110
+
111
def handle_background_selection():
    """Render the background-type controls.

    For "Image" the chosen picture is stored in ``st.session_state.bg_image``;
    for "Color" the hex value is stored in ``st.session_state.bg_color`` and a
    swatch is previewed. "Blur" needs no extra input.

    Returns:
        The selected background type as a lowercase string
        ("image", "color", or "blur").
    """
    st.markdown("### Background Options")
    bg_type = st.radio(
        "Select Background Type:",
        ["Image", "Color", "Blur"],
        horizontal=True,
        index=0
    )

    if bg_type == "Image":
        bg_image = st.file_uploader(
            "🖼️ Upload Background Image",
            type=["jpg", "png", "jpeg"],
            key="bg_image_uploader"
        )
        if bg_image is not None:
            st.session_state.bg_image = Image.open(bg_image)
            st.image(
                st.session_state.bg_image,
                caption="Selected Background",
                use_container_width=True
            )

    elif bg_type == "Color":
        st.session_state.bg_color = st.color_picker(
            "🎨 Choose Background Color",
            st.session_state.bg_color
        )
        color_rgb = tuple(int(st.session_state.bg_color.lstrip('#')[i:i + 2], 16) for i in (0, 2, 4))
        # BUGFIX: st.image interprets numpy arrays as RGB by default, so the
        # swatch must be built in RGB order. The original reversed to BGR
        # (an OpenCV-I/O convention), which displayed red/blue swapped.
        color_display = np.full((100, 100, 3), color_rgb, dtype=np.uint8)
        st.image(color_display, caption="Selected Color", width=200)

    return bg_type.lower()
146
+
147
def process_video(input_file, background, bg_type="image"):
    """
    Process video with the selected background using SAM2 and MatAnyone pipeline.

    Args:
        input_file: Uploaded file object (must support ``.getvalue()``).
        background: PIL image when ``bg_type`` is "image"; ignored otherwise.
        bg_type: "image", "color", or "blur".

    Returns:
        Path to the processed video file (a persistent temp file the caller
        may read/delete), or None on failure.
    """
    import shutil  # local import: only needed to copy the final result out

    try:
        # Create a temporary directory for processing. NOTE: everything in it
        # is deleted when the ``with`` block exits, so the finished video is
        # copied to a persistent temp file before returning — the original
        # code returned a path inside this directory, which was already
        # deleted by the time the caller checked os.path.exists() (bug).
        with tempfile.TemporaryDirectory() as work_dir:
            temp_dir = Path(work_dir)

            # Save the uploaded video to a temporary file
            input_path = str(temp_dir / "input.mp4")
            with open(input_path, "wb") as f:
                f.write(input_file.getvalue())

            # Prepare the background image on disk (for "image" and "color")
            bg_path = None
            if bg_type == "image" and background is not None:
                # Convert PIL Image (RGB) to OpenCV's BGR before writing
                bg_cv = cv2.cvtColor(np.array(background), cv2.COLOR_RGB2BGR)
                bg_path = str(temp_dir / "background.jpg")
                cv2.imwrite(bg_path, bg_cv)
            elif bg_type == "color" and hasattr(st.session_state, 'bg_color'):
                # Create a solid-colour image; BGR order for OpenCV, and an
                # explicit uint8 dtype (ones * tuple would promote to int64).
                color_hex = st.session_state.bg_color.lstrip('#')
                color_rgb = tuple(int(color_hex[i:i + 2], 16) for i in (0, 2, 4))
                bg_path = str(temp_dir / "background.jpg")
                cv2.imwrite(bg_path, np.full((100, 100, 3), color_rgb[::-1], dtype=np.uint8))

            # Progress UI plus a callback bridging pipeline progress into it
            progress_bar = st.progress(0)
            status_text = st.empty()

            def progress_callback(progress, message):
                progress = max(0, min(1, float(progress)))
                progress_bar.progress(progress)
                status_text.text(f"Status: {message}")
                st.session_state.progress = int(progress * 100)
                st.session_state.progress_text = message

            output_path = str(temp_dir / "output.mp4")

            # Mock click points (center of the frame) — TODO: let the user pick
            click_points = [[0.5, 0.5]]

            # Imported lazily: pulls in the heavy SAM2/MatAnyone stack
            from integrated_pipeline import TwoStageProcessor

            processor = TwoStageProcessor(temp_dir=str(temp_dir))

            # Pass the prepared background for both "image" and "color"; the
            # original built bg_path for "color" but never handed it to the
            # pipeline, so colour backgrounds were silently ignored.
            success = processor.process_video(
                input_video=input_path,
                background_video=bg_path if bg_path else "",
                click_points=click_points,
                output_path=output_path,
                use_matanyone=True,
                progress_callback=progress_callback
            )

            if not success:
                raise RuntimeError("Video processing failed")

            # Copy the result to a persistent temp file so it survives the
            # TemporaryDirectory cleanup above.
            fd, persistent_path = tempfile.mkstemp(suffix=".mp4")
            os.close(fd)
            shutil.copyfile(output_path, persistent_path)

        return persistent_path

    except Exception as e:
        logger.error(f"Error in video processing: {str(e)}", exc_info=True)
        st.error(f"An error occurred during processing: {str(e)}")
        return None
219
+
220
def main():
    """Top-level Streamlit page: upload → background choice → process → download."""
    st.title("🎬 Advanced Video Background Replacer")
    st.markdown("---")

    # Initialize session state before any widget reads from it.
    initialize_session_state()

    # Main layout: upload/preview on the left, settings/actions on the right.
    col1, col2 = st.columns([1, 1], gap="large")

    with col1:
        st.header("1. Upload Video")
        handle_video_upload()
        show_video_preview()

    with col2:
        st.header("2. Background Settings")
        bg_type = handle_background_selection()

        st.header("3. Process & Download")
        # Button stays disabled until a video is uploaded and no run is active.
        if st.button(
            "🚀 Process Video",
            type="primary",
            disabled=not st.session_state.uploaded_video or st.session_state.processing,
            use_container_width=True
        ):
            with st.spinner("Processing video (this may take a few minutes)..."):
                st.session_state.processing = True

                try:
                    # Prepare background based on type; "blur" needs no value.
                    background = None
                    if bg_type == "image" and 'bg_image' in st.session_state and st.session_state.bg_image is not None:
                        background = st.session_state.bg_image
                    elif bg_type == "color" and 'bg_color' in st.session_state:
                        background = st.session_state.bg_color

                    # Run the heavy pipeline; returns a file path or None.
                    output_path = process_video(
                        st.session_state.uploaded_video,
                        background,
                        bg_type=bg_type
                    )

                    if output_path and os.path.exists(output_path):
                        # Store the path so the result persists across reruns.
                        st.session_state.processed_video_path = output_path
                        st.success("✅ Video processing complete!")
                    else:
                        st.error("❌ Failed to process video. Please check the logs for details.")

                except Exception as e:
                    st.error(f"❌ An error occurred: {str(e)}")
                    logger.exception("Video processing failed")

                finally:
                    # Always clear the flag so the button re-enables on rerun.
                    st.session_state.processing = False

    # Show processed video if available (survives subsequent reruns).
    if 'processed_video_path' in st.session_state and st.session_state.processed_video_path:
        st.markdown("### Processed Video")

        try:
            # Display the video directly from the file on disk.
            with open(st.session_state.processed_video_path, 'rb') as f:
                video_bytes = f.read()
            st.video(video_bytes)

            # Download button re-uses the bytes already read above.
            st.download_button(
                label="💾 Download Processed Video",
                data=video_bytes,
                file_name="processed_video.mp4",
                mime="video/mp4",
                use_container_width=True
            )
        except Exception as e:
            st.error(f"Error displaying video: {str(e)}")
            logger.error(f"Error displaying video: {str(e)}", exc_info=True)

if __name__ == "__main__":
    main()