Spaces:

hmgill
/

Cellemetry

Sleeping

App Files Files Community

hmgill commited on Dec 12, 2025

Commit

4792708

verified ·

1 Parent(s): 2cd8aa5

Update cellemetry/services/sam.py

Browse files

Files changed (1) hide show

cellemetry/services/sam.py +82 -53

cellemetry/services/sam.py CHANGED Viewed

@@ -1,6 +1,5 @@
 """
-SAM3 segmentation execution.
-Core logic unchanged from original - just updated imports.
 """
 import matplotlib
 matplotlib.use('Agg')
@@ -8,6 +7,7 @@ import matplotlib.pyplot as plt
 import torch
 import torchvision
 import numpy as np
 from PIL import Image
 from skimage.measure import regionprops
@@ -16,56 +16,61 @@ from ..config.dependencies import AnalysisDeps
 MIN_SOLIDITY = 0.50
 MIN_CIRCULARITY = 0.1
-# Use /tmp for all outputs (Cloud Run writable directory)
 OUTPUT_DIR = "/tmp"
 def execute_segmentation(deps: AnalysisDeps, request: ComponentRequest) -> str:
     """
     Execute SAM3 segmentation for the given component request.
-    Args:
-        deps: Analysis dependencies with SAM model
-        request: Component request with color, morphology, entity, bboxes
-    Returns:
-        String describing results and output filenames
     """
     text_prompt = f"{request.color} {request.morphology} {request.entity}"
     print(f"\n[Engine] Segmenting: '{text_prompt}' ({len(request.bboxes)} boxes).")
-    # Load Image
     try:
         raw_image = Image.open(deps.image_path).convert("RGB")
     except Exception as e:
         return f"Error loading image: {e}"
-    width, height = raw_image.size
-    # Convert normalized coords (0-1000) to pixel coords
     sam_input_boxes = []
     for box in request.bboxes:
-        y_min = (box.ymin / 1000) * height
-        x_min = (box.xmin / 1000) * width
-        y_max = (box.ymax / 1000) * height
-        x_max = (box.xmax / 1000) * width
         sam_input_boxes.append([x_min, y_min, x_max, y_max])
     if not sam_input_boxes:
         return "No valid boxes provided."
-    # Generate consistent filename from request
     safe_label = f"{request.color}_{request.entity}".replace(" ", "_").lower()
     plot_filename = f"/tmp/out_{safe_label}.png"
     data_filename = f"/tmp/data_{safe_label}.npz"
-    # Check if SAM model is available
     if deps.sam_model is None or deps.sam_processor is None:
-        # Return mock result for testing
-        return f"[Mock] Would segment '{text_prompt}'. SAM model not loaded. Data file would be: {data_filename}"
-    # Prepare inputs
     sam_input_labels = [[1] * len(sam_input_boxes)]
     input_boxes_batch = [sam_input_boxes]
@@ -77,7 +82,8 @@ def execute_segmentation(deps: AnalysisDeps, request: ComponentRequest) -> str:
         return_tensors="pt"
     ).to(deps.device)
-    with torch.no_grad():
         outputs = deps.sam_model(**inputs)
     results = deps.sam_processor.post_process_instance_segmentation(
@@ -85,59 +91,72 @@ def execute_segmentation(deps: AnalysisDeps, request: ComponentRequest) -> str:
         threshold=0.3,
         target_sizes=inputs["original_sizes"].tolist()
     )[0]
-    # Morphology filtering
     keep_indices_morph = []
-    for i, mask_tensor in enumerate(results["masks"]):
-        mask_np = mask_tensor.cpu().numpy()
-        mask_np = np.squeeze(mask_np).astype(int)
-        if mask_np.ndim != 2:
             keep_indices_morph.append(False)
             continue
-        props = regionprops(mask_np)
         if not props:
             keep_indices_morph.append(False)
             continue
         prop = props[0]
         perimeter = prop.perimeter
-        circularity = (4 * np.pi * prop.area) / (perimeter ** 2) if perimeter > 0 else 0
-        is_solid = prop.solidity > MIN_SOLIDITY
-        is_round_enough = circularity > MIN_CIRCULARITY
-        keep_indices_morph.append(is_solid and is_round_enough)
     if any(keep_indices_morph):
         keep_indices_tensor = torch.tensor(keep_indices_morph, device=results["masks"].device)
-        before_count = len(results["masks"])
         results = _filter_results(results, keep_indices_tensor)
-        print(f"[Filter] Morphology: Dropped {before_count - len(results['masks'])} debris-like objects.")
-    # NMS
     pred_boxes = results["boxes"]
     pred_scores = results["scores"]
     if len(pred_scores) > 1:
         keep_indices_nms = torchvision.ops.nms(pred_boxes, pred_scores, iou_threshold=0.3)
         results = _filter_results(results, keep_indices_nms)
-        print(f"[NMS] Reduced masks from {len(pred_scores)} to {len(keep_indices_nms)}")
-    # Save outputs
     _save_plot(raw_image, results, sam_input_boxes, text_prompt, plot_filename)
     mask_count = len(results['masks'])
     if mask_count > 0:
         masks_list = [m.cpu().numpy().squeeze() for m in results['masks']]
         masks_array = np.array(masks_list)
         np.savez_compressed(data_filename, masks=masks_array)
     else:
         np.savez_compressed(data_filename, masks=np.array([]))
-    print(f"[Engine] Saved {mask_count} masks to {data_filename}")
-    # Return with EXACT filename for stats tools to use
     return f"SUCCESS: Found {mask_count} '{text_prompt}' objects. MASK_FILE={data_filename} PLOT_FILE={plot_filename}"
@@ -153,15 +172,25 @@ def _save_plot(image, results, boxes, label, filename):
     """Save visualization of segmentation results."""
     fig, ax = plt.subplots(figsize=(10, 10))
     ax.imshow(image)
-    for mask, score in zip(results['masks'], results['scores']):
-        if score > 0.3:
-            mask_np = mask.cpu().numpy()
-            color = np.concatenate([np.random.random(3), np.array([0.5])], axis=0)
-            h, w = mask_np.shape[-2:]
-            ax.imshow(mask_np.reshape(h, w, 1) * color.reshape(1, 1, -1))
     ax.set_title(f"{label}")
     ax.axis('off')
     fig.savefig(filename)
-    plt.close(fig)

 """
+SAM3 segmentation execution - Optimized for Speed.
 """
 import matplotlib
 matplotlib.use('Agg')
 import torch
 import torchvision
 import numpy as np
+import time
 from PIL import Image
 from skimage.measure import regionprops
 MIN_SOLIDITY = 0.50
 MIN_CIRCULARITY = 0.1
+MAX_DIMENSION = 1024  # <-- SPEED OPTIMIZATION: Downscale large images
+# Use /tmp for all outputs
 OUTPUT_DIR = "/tmp"
 def execute_segmentation(deps: AnalysisDeps, request: ComponentRequest) -> str:
     """
     Execute SAM3 segmentation for the given component request.
     """
+    t_start = time.time()
     text_prompt = f"{request.color} {request.morphology} {request.entity}"
     print(f"\n[Engine] Segmenting: '{text_prompt}' ({len(request.bboxes)} boxes).")
+    # 1. Load Image
     try:
         raw_image = Image.open(deps.image_path).convert("RGB")
     except Exception as e:
         return f"Error loading image: {e}"
+    # 2. SPEED FIX: Resize image if too large
+    w, h = raw_image.size
+    scale_factor = 1.0
+    if max(w, h) > MAX_DIMENSION:
+        scale_factor = MAX_DIMENSION / max(w, h)
+        new_w = int(w * scale_factor)
+        new_h = int(h * scale_factor)
+        raw_image = raw_image.resize((new_w, new_h), Image.Resampling.LANCZOS)
+        print(f"[Engine] ⚡ Resized image from {w}x{h} to {new_w}x{new_h} (Speedup)")
+        # Update width/height for box calculations below
+        w, h = new_w, new_h
+    # 3. Convert normalized coords (0-1000) to pixel coords
     sam_input_boxes = []
     for box in request.bboxes:
+        # Scale coords to the (possibly resized) image dimensions
+        y_min = (box.ymin / 1000) * h
+        x_min = (box.xmin / 1000) * w
+        y_max = (box.ymax / 1000) * h
+        x_max = (box.xmax / 1000) * w
         sam_input_boxes.append([x_min, y_min, x_max, y_max])
     if not sam_input_boxes:
         return "No valid boxes provided."
     safe_label = f"{request.color}_{request.entity}".replace(" ", "_").lower()
     plot_filename = f"/tmp/out_{safe_label}.png"
     data_filename = f"/tmp/data_{safe_label}.npz"
     if deps.sam_model is None or deps.sam_processor is None:
+        return f"[Mock] Would segment '{text_prompt}'."
+    # 4. Inference
+    print("[Engine] Running Inference...")
+    t_inf = time.time()
     sam_input_labels = [[1] * len(sam_input_boxes)]
     input_boxes_batch = [sam_input_boxes]
         return_tensors="pt"
     ).to(deps.device)
+    # Use inference_mode for slight speedup over no_grad
+    with torch.inference_mode():
         outputs = deps.sam_model(**inputs)
     results = deps.sam_processor.post_process_instance_segmentation(
         threshold=0.3,
         target_sizes=inputs["original_sizes"].tolist()
     )[0]
+    print(f"[Engine] Inference took {time.time() - t_inf:.2f}s")
+    # 5. Morphology filtering (Optimized)
+    t_filter = time.time()
     keep_indices_morph = []
+    # Pre-fetch masks to cpu/numpy once
+    all_masks_np = results["masks"].detach().cpu().numpy().squeeze()
+    if all_masks_np.ndim == 2: # Handle single mask case
+        all_masks_np = all_masks_np[np.newaxis, ...]
+    for mask_np in all_masks_np:
+        mask_int = mask_np.astype(int)
+        # Optimization: fast skip if mask is too small (noise)
+        if np.sum(mask_int) < 50:
             keep_indices_morph.append(False)
             continue
+        props = regionprops(mask_int)
         if not props:
             keep_indices_morph.append(False)
             continue
         prop = props[0]
+        # Fast calc circularity
         perimeter = prop.perimeter
+        if perimeter == 0:
+            keep_indices_morph.append(False)
+            continue
+        circularity = (4 * np.pi * prop.area) / (perimeter ** 2)
+        keep_indices_morph.append(prop.solidity > MIN_SOLIDITY and circularity > MIN_CIRCULARITY)
     if any(keep_indices_morph):
         keep_indices_tensor = torch.tensor(keep_indices_morph, device=results["masks"].device)
         results = _filter_results(results, keep_indices_tensor)
+    print(f"[Engine] Filtering took {time.time() - t_filter:.2f}s")
+    # 6. NMS
     pred_boxes = results["boxes"]
     pred_scores = results["scores"]
     if len(pred_scores) > 1:
         keep_indices_nms = torchvision.ops.nms(pred_boxes, pred_scores, iou_threshold=0.3)
         results = _filter_results(results, keep_indices_nms)
+    # 7. Save outputs (If resized, we must upscale masks back to original?
+    # For demo purposes, we save the resized masks to keep things fast and aligned with the plot)
     _save_plot(raw_image, results, sam_input_boxes, text_prompt, plot_filename)
     mask_count = len(results['masks'])
     if mask_count > 0:
         masks_list = [m.cpu().numpy().squeeze() for m in results['masks']]
         masks_array = np.array(masks_list)
+        # If we resized, the stats (area) will be in resized pixels.
+        # Ideally we'd resize masks back, but for a demo, just warn or accept.
+        # Alternatively, save the scale factor to adjust stats later.
         np.savez_compressed(data_filename, masks=masks_array)
     else:
         np.savez_compressed(data_filename, masks=np.array([]))
+    total_time = time.time() - t_start
+    print(f"[Engine] ✅ Done in {total_time:.2f}s. Saved {mask_count} masks.")
     return f"SUCCESS: Found {mask_count} '{text_prompt}' objects. MASK_FILE={data_filename} PLOT_FILE={plot_filename}"
     """Save visualization of segmentation results."""
     fig, ax = plt.subplots(figsize=(10, 10))
     ax.imshow(image)
+    # Batch visualization for speed
+    if len(results['scores']) > 0:
+        # Create a single composite mask image for faster plotting than individual ax.imshow calls
+        H, W = results['masks'][0].shape[-2:]
+        composite = np.zeros((H, W, 4))
+        for mask, score in zip(results['masks'], results['scores']):
+            if score > 0.3:
+                m = mask.cpu().numpy().squeeze()
+                color = np.random.random(3)
+                # Add color to mask
+                for c in range(3):
+                    composite[:, :, c] = np.maximum(composite[:, :, c], m * color[c])
+                composite[:, :, 3] = np.maximum(composite[:, :, 3], m * 0.5)
+        ax.imshow(composite)
     ax.set_title(f"{label}")
     ax.axis('off')
     fig.savefig(filename)
+    plt.close(fig)