Spaces:

lukeafullard
/

ImageProcessing

Sleeping

App Files Files Community

lukeafullard commited on Jan 3

Commit

dbc4275

verified ·

1 Parent(s): 7670112

Update src/streamlit_app.py

Browse files

Files changed (1) hide show

src/streamlit_app.py +59 -88

src/streamlit_app.py CHANGED Viewed

@@ -1,50 +1,62 @@
 import streamlit as st
 from PIL import Image, ImageEnhance
-from rembg import remove
-import io
 import torch
 import numpy as np
-from transformers import AutoImageProcessor, Swin2SRForImageSuperResolution, pipeline
 # Page Configuration
 st.set_page_config(layout="wide", page_title="AI Image Lab")
 # --- Caching AI Models ---
-# We use separate functions for 2x and 4x to avoid loading both into memory if not needed.
 @st.cache_resource
-def load_upscaler_x2():
-    """Loads the Swin2SR model for 2x upscale."""
-    model_id = "caidas/swin2SR-classical-sr-x2-64"
-    processor = AutoImageProcessor.from_pretrained(model_id)
-    model = Swin2SRForImageSuperResolution.from_pretrained(model_id)
-    return processor, model
-@st.cache_resource
-def load_upscaler_x4():
-    """Loads the Swin2SR model for 4x upscale."""
-    # This model is heavier and takes longer to run
-    model_id = "caidas/swin2SR-classical-sr-x4-63"
-    processor = AutoImageProcessor.from_pretrained(model_id)
-    model = Swin2SRForImageSuperResolution.from_pretrained(model_id)
-    return processor, model
-@st.cache_resource
-def load_depth_pipeline():
-    """Loads a lightweight Depth Estimation pipeline."""
-    pipe = pipeline(task="depth-estimation", model="vinvino02/glpn-nyu")
-    return pipe
-def ai_upscale(image, processor, model):
-    """Runs the super-resolution model."""
-    inputs = processor(image, return_tensors="pt")
     with torch.no_grad():
-        outputs = model(**inputs)
-    output = outputs.reconstruction.data.squeeze().float().cpu().clamp_(0, 1).numpy()
-    output = np.moveaxis(output, 0, -1)
-    output = (output * 255.0).round().astype(np.uint8)
-    return Image.fromarray(output)
 def convert_image_to_bytes(img):
     buf = io.BytesIO()
@@ -52,98 +64,57 @@ def convert_image_to_bytes(img):
     return buf.getvalue()
 def main():
-    st.title("✨ AI Image Lab: Transformers Edition")
-    st.markdown("Processing pipeline: **Background Removal** → **AI Modifiers** → **Geometry**")
     # --- Sidebar Controls ---
     st.sidebar.header("Processing Pipeline")
-    # 1. Background
-    st.sidebar.subheader("1. Cleanup")
-    remove_bg = st.sidebar.checkbox("Remove Background (rembg)", value=False)
-    # 2. AI Enhancements
-    st.sidebar.subheader("2. AI Enhancements")
-    ai_mode = st.sidebar.radio(
-        "Choose AI Modification:",
-        ["None", "AI Super-Resolution (2x)", "AI Super-Resolution (4x)", "Depth Estimation"]
-    )
-    # 3. Geometry & Color
-    st.sidebar.subheader("3. Final Adjustments")
     rotate_angle = st.sidebar.slider("Rotate", -180, 180, 0, 1)
-    contrast_val = st.sidebar.slider("Contrast", 0.5, 1.5, 1.0, 0.1)
     # --- Main Content ---
     uploaded_file = st.file_uploader("Upload an image...", type=["jpg", "jpeg", "png", "webp"])
     if uploaded_file is not None:
         image = Image.open(uploaded_file).convert("RGB")
         processed_image = image.copy()
         # --- STEP 1: Background Removal ---
         if remove_bg:
-            with st.spinner("Removing background..."):
-                processed_image = remove(processed_image)
-        # --- STEP 2: AI Enhancements ---
-        if ai_mode == "AI Super-Resolution (2x)":
-            st.info("Loading Swin2SR (2x) model... (Fast)")
-            try:
-                processor, model = load_upscaler_x2()
-                with st.spinner("Upscaling (2x)..."):
-                    processed_image = ai_upscale(processed_image, processor, model)
-            except Exception as e:
-                st.error(f"Error loading Upscaler: {e}")
-        elif ai_mode == "AI Super-Resolution (4x)":
-            st.warning("Loading Swin2SR (4x) model... (This is computationally heavy!)")
-            # Added a warning because 4x on CPU can be quite slow for large images
-            try:
-                processor, model = load_upscaler_x4()
-                with st.spinner("Upscaling (4x)... please wait"):
-                    processed_image = ai_upscale(processed_image, processor, model)
-            except Exception as e:
-                st.error(f"Error loading Upscaler: {e}")
-        elif ai_mode == "Depth Estimation":
-            st.info("Generating Depth Map...")
             try:
-                depth_pipe = load_depth_pipeline()
-                with st.spinner("Estimating depth..."):
-                    result = depth_pipe(processed_image)
-                    processed_image = result["depth"]
             except Exception as e:
-                st.error(f"Error loading Depth Model: {e}")
-        # --- STEP 3: Geometry/Color ---
-        # Rotation
         if rotate_angle != 0:
             processed_image = processed_image.rotate(rotate_angle, expand=True)
-        # Contrast
-        if contrast_val != 1.0:
-            enhancer = ImageEnhance.Contrast(processed_image)
-            processed_image = enhancer.enhance(contrast_val)
         # --- Display ---
         col1, col2 = st.columns(2)
         with col1:
             st.subheader("Original")
             st.image(image, use_container_width=True)
-            st.caption(f"Size: {image.size}")
         with col2:
             st.subheader("Result")
             st.image(processed_image, use_container_width=True)
-            st.caption(f"Size: {processed_image.size}")
         # --- Download ---
         st.markdown("---")
         btn = st.download_button(
             label="💾 Download Result",
             data=convert_image_to_bytes(processed_image),
-            file_name="ai_enhanced_image.png",
             mime="image/png",
         )

 import streamlit as st
 from PIL import Image, ImageEnhance
 import torch
+import torch.nn.functional as F
+from torchvision import transforms
+from transformers import AutoModelForImageSegmentation
+import io
 import numpy as np
 # Page Configuration
 st.set_page_config(layout="wide", page_title="AI Image Lab")
 # --- Caching AI Models ---
 @st.cache_resource
+def load_birefnet_model():
+    """
+    Loads the RMBG-1.4 model for Background Removal (Pure PyTorch).
+    """
+    # We use 'briaai/RMBG-1.4' which is SOTA for background removal
+    model = AutoModelForImageSegmentation.from_pretrained("briaai/RMBG-1.4", trust_remote_code=True)
+    # Move to GPU if available, otherwise CPU
+    device = torch.device("cuda" if torch.cuda.is_available() else "cpu")
+    model.to(device)
+    return model, device
+# ... (Previous Upscalers kept for reference, you can re-add them if you wish) ...
+def remove_background_torch(image, model, device):
+    """
+    Runs background removal using RMBG-1.4 on PyTorch.
+    """
+    # 1. Prepare input
+    w, h = image.size
+    # The model expects specific normalization and size
+    transform_image = transforms.Compose([
+        transforms.Resize((1024, 1024)),
+        transforms.ToTensor(),
+        transforms.Normalize([0.485, 0.456, 0.406], [0.229, 0.224, 0.225])
+    ])
+    input_images = transform_image(image).unsqueeze(0).to(device)
+    # 2. Inference
     with torch.no_grad():
+        preds = model(input_images)[-1].sigmoid().cpu()
+    # 3. Post-process mask
+    pred = preds[0].squeeze()
+    # Convert mask to PIL and resize back to original dimensions
+    pred_pil = transforms.ToPILImage()(pred)
+    mask = pred_pil.resize((w, h))
+    # 4. Apply mask to original image
+    image.putalpha(mask)
+    return image
 def convert_image_to_bytes(img):
     buf = io.BytesIO()
     return buf.getvalue()
 def main():
+    st.title("✨ AI Image Lab: Pure PyTorch Edition")
+    st.markdown("Processing pipeline: **RMBG-1.4 (No ONNX)**")
     # --- Sidebar Controls ---
     st.sidebar.header("Processing Pipeline")
+    remove_bg = st.sidebar.checkbox("Remove Background (RMBG-1.4)", value=False)
+    st.sidebar.subheader("Final Adjustments")
     rotate_angle = st.sidebar.slider("Rotate", -180, 180, 0, 1)
     # --- Main Content ---
     uploaded_file = st.file_uploader("Upload an image...", type=["jpg", "jpeg", "png", "webp"])
     if uploaded_file is not None:
+        # Important: RMBG model works best if we ensure RGB mode
         image = Image.open(uploaded_file).convert("RGB")
         processed_image = image.copy()
         # --- STEP 1: Background Removal ---
         if remove_bg:
+            st.info("Loading RMBG-1.4 Model (First run will download ~170MB)...")
             try:
+                # Load Model
+                model, device = load_birefnet_model()
+                with st.spinner("Removing background using PyTorch..."):
+                    processed_image = remove_background_torch(processed_image, model, device)
             except Exception as e:
+                st.error(f"Error during background removal: {e}")
+        # --- STEP 2: Geometry/Color ---
         if rotate_angle != 0:
             processed_image = processed_image.rotate(rotate_angle, expand=True)
         # --- Display ---
         col1, col2 = st.columns(2)
         with col1:
             st.subheader("Original")
             st.image(image, use_container_width=True)
         with col2:
             st.subheader("Result")
             st.image(processed_image, use_container_width=True)
         # --- Download ---
         st.markdown("---")
         btn = st.download_button(
             label="💾 Download Result",
             data=convert_image_to_bytes(processed_image),
+            file_name="nobg_image.png",
             mime="image/png",
         )