AnikS22
/

MidasMap

+"""
+PyTorch Dataset for immunogold particle detection.
+Implements patch-based training with:
+- 70% hard mining (patches centered near particles)
+- 30% random patches (background recognition)
+- Copy-paste augmentation with Gaussian-blended bead bank
+- Albumentations pipeline with keypoint co-transforms
+"""
+import random
+from pathlib import Path
+from typing import Dict, List, Optional, Tuple
+import albumentations as A
+import cv2
+import numpy as np
+import torch
+from torch.utils.data import Dataset
+from src.heatmap import generate_heatmap_gt
+from src.preprocessing import (
+    SynapseRecord,
+    load_all_annotations,
+    load_image,
+    load_mask,
+)
+# ---------------------------------------------------------------------------
+# Augmentation pipeline
+# ---------------------------------------------------------------------------
def get_train_augmentation() -> A.Compose:
    """
    Build the augmentation pipeline applied to training patches.

    Geometric transforms come first and co-transform the keypoints;
    intensity transforms follow and only touch the image. Brightness and
    contrast limits are deliberately small (0.08 rather than the library
    default of 0.2). Cutout/Mixup/JPEG artifacts are intentionally absent:
    per the original design note they destroy or mimic particles.

    Returns:
        An ``A.Compose`` expecting ``image``, ``keypoints`` (``xy`` format)
        and ``class_labels``; keypoints that leave the frame are dropped.
    """
    geometric_steps = [
        # Right-angle rotation is always applied (EM is rotation invariant).
        A.RandomRotate90(p=1.0),
        A.HorizontalFlip(p=0.5),
        A.VerticalFlip(p=0.5),
        # Small free rotation only (±10°) to limit interpolation artifacts.
        A.Rotate(limit=10, border_mode=cv2.BORDER_REFLECT_101, p=0.5),
        # Mild elastic deformation.
        A.ElasticTransform(alpha=30, sigma=5, p=0.3),
    ]
    intensity_steps = [
        A.RandomBrightnessContrast(
            brightness_limit=0.08,
            contrast_limit=0.08,
            p=0.7,
        ),
        # Noise with library-default strength.
        A.GaussNoise(p=0.5),
        # Fixed 3x3 blur kernel, applied rarely.
        A.GaussianBlur(blur_limit=(3, 3), p=0.2),
    ]
    keypoint_config = A.KeypointParams(
        format="xy",
        remove_invisible=True,
        label_fields=["class_labels"],
    )
    return A.Compose(
        geometric_steps + intensity_steps,
        keypoint_params=keypoint_config,
    )
def get_val_augmentation() -> A.Compose:
    """
    Build the validation pipeline: an empty (identity) transform list.

    The keypoint configuration matches the training pipeline so both can be
    called with the same ``image`` / ``keypoints`` / ``class_labels``
    arguments.
    """
    keypoint_config = A.KeypointParams(
        format="xy",
        remove_invisible=True,
        label_fields=["class_labels"],
    )
    no_transforms = []
    return A.Compose(no_transforms, keypoint_params=keypoint_config)
+# ---------------------------------------------------------------------------
+# Bead bank for copy-paste augmentation
+# ---------------------------------------------------------------------------
class BeadBank:
    """
    Pre-extracted particle crops for copy-paste augmentation.

    Stores small square patches centered on annotated particles from
    training images. During training, random beads are pasted onto patches
    to increase particle density and address class imbalance.
    """

    def __init__(self):
        # class name -> list of (crop, half) tuples, where crop is a square
        # array of side crop_sizes[cls] and half == crop_sizes[cls] // 2.
        self.crops: Dict[str, List[Tuple[np.ndarray, int]]] = {
            "6nm": [],
            "12nm": [],
        }
        # Side length in pixels of the crop stored for each class.
        self.crop_sizes = {"6nm": 32, "12nm": 48}

    @staticmethod
    def _alpha_mask(crop_size: int) -> np.ndarray:
        """Return the (crop_size, crop_size) Gaussian blending weights."""
        half = crop_size // 2
        yy, xx = np.mgrid[:crop_size, :crop_size]
        # The particle sits at index `half` of the crop (see
        # extract_from_image), which equals crop_size / 2 for even sizes.
        center = crop_size / 2
        sigma = half * 0.7
        return np.exp(-((xx - center) ** 2 + (yy - center) ** 2) / (2 * sigma ** 2))

    def extract_from_image(
        self,
        image: np.ndarray,
        annotations: Dict[str, np.ndarray],
    ):
        """
        Extract bead crops from a training image and add them to the bank.

        Args:
            image: source image; only 2-D images yield crops because a crop
                is kept only when its shape is exactly
                ``(crop_size, crop_size)``.
            annotations: class name -> iterable of ``(x, y)`` coordinates.
                Classes without an entry in ``crop_sizes`` are ignored.
        """
        h, w = image.shape[:2]
        for cls, coords in annotations.items():
            crop_size = self.crop_sizes.get(cls)
            if crop_size is None:
                # Unknown class: nothing to extract (previously a KeyError).
                continue
            half = crop_size // 2
            bucket = self.crops.setdefault(cls, [])
            for x, y in coords:
                xi, yi = int(round(x)), int(round(y))
                # Skip particles whose crop would cross the image border.
                if yi - half < 0 or yi + half > h or xi - half < 0 or xi + half > w:
                    continue
                crop = image[yi - half : yi + half, xi - half : xi + half].copy()
                if crop.shape == (crop_size, crop_size):
                    bucket.append((crop, half))

    def paste_beads(
        self,
        image: np.ndarray,
        coords_6nm: List[Tuple[float, float]],
        coords_12nm: List[Tuple[float, float]],
        class_labels: List[str],
        mask: Optional[np.ndarray] = None,
        n_paste_per_class: int = 5,
        rng: Optional[np.random.Generator] = None,
    ) -> Tuple[np.ndarray, List[Tuple[float, float]], List[Tuple[float, float]], List[str]]:
        """
        Paste random beads onto a copy of ``image`` with Gaussian alpha blending.

        For each class, up to ``min(n_paste_per_class, bank size)`` paste
        attempts are made. An attempt is dropped (not retried) when the
        location is outside ``mask``, too close to an existing particle, or
        the target region does not match the crop shape.

        Args:
            image: patch to augment; it is not modified in place.
            coords_6nm: existing 6nm particle ``(x, y)`` coordinates.
            coords_12nm: existing 12nm particle ``(x, y)`` coordinates.
            class_labels: existing labels; pasted class names are appended.
            mask: optional array indexed as ``mask[y, x]``; beads are only
                pasted where it is truthy. Locations outside its extent
                are rejected.
            n_paste_per_class: maximum paste attempts per class.
            rng: random generator; a fresh unseeded one is created if None.

        Returns:
            ``(image, coords_6nm, coords_12nm, class_labels)`` — the
            augmented copy and new lists including the pasted beads.
        """
        if rng is None:
            rng = np.random.default_rng()
        image = image.copy()
        h, w = image.shape[:2]
        new_coords_6nm = list(coords_6nm)
        new_coords_12nm = list(coords_12nm)
        new_labels = list(class_labels)
        for cls in ("6nm", "12nm"):
            bank = self.crops[cls]
            if not bank:
                continue
            crop_size = self.crop_sizes[cls]
            half = crop_size // 2
            # Valid centre range keeps the crop plus a 5 px margin inside
            # the image. rng.integers raises when the range is empty, so an
            # image too small for this class is skipped.
            x_lo, x_hi = half + 5, w - half - 5
            y_lo, y_hi = half + 5, h - half - 5
            if x_hi <= x_lo or y_hi <= y_lo:
                continue
            # Loop-invariant per class: blending weights and distance limit.
            alpha = self._alpha_mask(crop_size)
            min_dist_sq = (half * 1.5) ** 2
            n_paste = min(n_paste_per_class, len(bank))
            for _ in range(n_paste):
                # Random paste location (within image bounds)
                px = rng.integers(x_lo, x_hi)
                py = rng.integers(y_lo, y_hi)
                # Skip if outside tissue mask
                if mask is not None:
                    if py >= mask.shape[0] or px >= mask.shape[1] or not mask[py, px]:
                        continue
                # Keep a minimum distance from every existing particle,
                # including beads pasted earlier in this call.
                too_close = any(
                    (ex - px) ** 2 + (ey - py) ** 2 < min_dist_sq
                    for ex, ey in new_coords_6nm + new_coords_12nm
                )
                if too_close:
                    continue
                # Select random crop
                crop, _ = bank[rng.integers(len(bank))]
                region = image[py - half : py + half, px - half : px + half]
                if region.shape != crop.shape:
                    continue
                # Convex combination stays inside the input value range.
                blended = (alpha * crop + (1 - alpha) * region).astype(np.uint8)
                image[py - half : py + half, px - half : px + half] = blended
                # Add to annotations
                if cls == "6nm":
                    new_coords_6nm.append((float(px), float(py)))
                else:
                    new_coords_12nm.append((float(px), float(py)))
                new_labels.append(cls)
        return image, new_coords_6nm, new_coords_12nm, new_labels
+# ---------------------------------------------------------------------------
+# Dataset
+# ---------------------------------------------------------------------------
class ImmunogoldDataset(Dataset):
    """
    Patch-based dataset for immunogold particle detection.

    Sampling strategy (``mode == "train"``):
    - ``hard_mining_fraction`` of patches (70% by default) are centered on
      a randomly chosen annotated particle, jittered by up to ±128 px per
      axis (hard mining)
    - the remaining patches are centered at uniformly random locations
      (background recognition)
    In any other mode every patch is taken at a random location.

    The intent is that the model sees particles in most batches even though
    particles cover only a tiny fraction of the image area.

    All images, masks and annotations of the selected records are loaded
    into memory at construction time.
    """

    # Multiplier separating the seed ranges of different epochs; larger than
    # the (idx + torch-seed) part of the per-item seed for typical epoch sizes.
    _EPOCH_SEED_STRIDE = 1000003

    def __init__(
        self,
        records: "List[SynapseRecord]",
        fold_id: str,
        mode: str = "train",
        patch_size: int = 512,
        stride: int = 2,
        hard_mining_fraction: float = 0.7,
        copy_paste_per_class: int = 5,
        sigmas: Optional[Dict[str, float]] = None,
        samples_per_epoch: int = 200,
        seed: int = 42,
    ):
        """
        Args:
            records: all SynapseRecord entries
            fold_id: synapse_id of the held-out record. ``mode="train"``
                keeps every record except this one, ``mode="val"`` keeps
                only this one, any other mode keeps all records.
            mode: 'train' or 'val' (other values use all records with the
                validation transform)
            patch_size: training patch size
            stride: model output stride
            hard_mining_fraction: fraction of patches near particles
            copy_paste_per_class: beads to paste per class (forced to 0
                outside train mode)
            sigmas: heatmap Gaussian sigmas per class; defaults to
                ``{"6nm": 1.0, "12nm": 1.5}``
            samples_per_epoch: virtual epoch size (value of ``len()``)
            seed: base random seed
        """
        super().__init__()
        self.patch_size = patch_size
        self.stride = stride
        self.hard_mining_fraction = hard_mining_fraction
        self.copy_paste_per_class = copy_paste_per_class if mode == "train" else 0
        self.sigmas = sigmas or {"6nm": 1.0, "12nm": 1.5}
        self.samples_per_epoch = samples_per_epoch
        self.mode = mode
        self._base_seed = seed
        self._epoch = 0
        self.rng = np.random.default_rng(seed)
        # Split records
        if mode == "train":
            self.records = [r for r in records if r.synapse_id != fold_id]
        elif mode == "val":
            self.records = [r for r in records if r.synapse_id == fold_id]
        else:
            self.records = records
        # Pre-load all images, masks and annotations, keyed by synapse_id.
        self.images = {}
        self.masks = {}
        self.annotations = {}
        for record in self.records:
            sid = record.synapse_id
            self.images[sid] = load_image(record.image_path)
            if record.mask_path:
                self.masks[sid] = load_mask(record.mask_path)
            self.annotations[sid] = load_all_annotations(record, self.images[sid].shape)
        # Build particle index for hard mining
        self._build_particle_index()
        # Build bead bank for copy-paste (stays empty outside train mode)
        self.bead_bank = BeadBank()
        if mode == "train":
            for sid in self.images:
                self.bead_bank.extract_from_image(
                    self.images[sid], self.annotations[sid]
                )
        # Augmentation
        if mode == "train":
            self.transform = get_train_augmentation()
        else:
            self.transform = get_val_augmentation()

    def _build_particle_index(self):
        """Build flat index of all particles for hard mining."""
        self.particle_list = []  # (synapse_id, x, y, class)
        for sid, annots in self.annotations.items():
            for cls in ["6nm", "12nm"]:
                for x, y in annots[cls]:
                    self.particle_list.append((sid, x, y, cls))

    @staticmethod
    def worker_init_fn(worker_id: int):
        """
        Re-seed the global RNGs per DataLoader worker.

        Seeds NumPy's legacy global RNG and the stdlib ``random`` module
        from the torch seed plus ``worker_id``. The modulo is applied after
        adding ``worker_id`` so the value always fits the 32-bit range that
        ``np.random.seed`` accepts.
        """
        seed = (torch.initial_seed() + worker_id) % (2**32)
        np.random.seed(seed)
        random.seed(seed)

    def set_epoch(self, epoch: int) -> None:
        """
        Fold an epoch number into the per-item sampling seed.

        ``__getitem__`` derives its seed from ``seed + idx`` and
        ``torch.initial_seed()``. When the torch seed does not change
        between epochs (e.g. ``num_workers=0``), the same patch locations
        are drawn every epoch. Calling this once per epoch makes them
        differ. With the default epoch 0 the seed is unchanged.

        Raises:
            ValueError: if ``epoch`` is negative.
        """
        if epoch < 0:
            raise ValueError(f"epoch must be non-negative, got {epoch}")
        self._epoch = int(epoch)

    def __len__(self) -> int:
        return self.samples_per_epoch

    def _sample_center(self):
        """Pick ``(synapse_id, cx, cy)`` for the next patch using ``self.rng``."""
        do_hard = (self.rng.random() < self.hard_mining_fraction
                   and len(self.particle_list) > 0
                   and self.mode == "train")
        if do_hard:
            # Pick random particle, center patch on it with jitter
            pidx = self.rng.integers(len(self.particle_list))
            sid, px, py, _ = self.particle_list[pidx]
            # Jitter center up to 128px
            jitter = 128
            cx = int(px + self.rng.integers(-jitter, jitter + 1))
            cy = int(py + self.rng.integers(-jitter, jitter + 1))
            return sid, cx, cy
        # Random image and location
        sid = list(self.images.keys())[self.rng.integers(len(self.images))]
        h, w = self.images[sid].shape[:2]
        half = self.patch_size // 2
        # rng.integers needs high > low; images no larger than the patch
        # get the only possible center and are padded during extraction.
        cx = self.rng.integers(half, max(w - half, half + 1))
        cy = self.rng.integers(half, max(h - half, half + 1))
        return sid, cx, cy

    def _extract_patch(self, image: np.ndarray, cx: int, cy: int):
        """
        Crop a patch around ``(cx, cy)``, clamped to the image and zero-padded.

        Returns:
            ``(patch, x0, y0, x1, y1)`` where the box is in image coordinates.
        """
        h, w = image.shape[:2]
        half = self.patch_size // 2
        # Clamp to image bounds
        cx = max(half, min(w - half, cx))
        cy = max(half, min(h - half, cy))
        x0, x1 = cx - half, cx + half
        y0, y1 = cy - half, cy + half
        patch = image[y0:y1, x0:x1].copy()
        # Pad on the bottom/right if the crop is short (image smaller than
        # the patch, or odd patch_size).
        if patch.shape[0] != self.patch_size or patch.shape[1] != self.patch_size:
            padded = np.zeros(
                (self.patch_size, self.patch_size) + patch.shape[2:],
                dtype=patch.dtype,
            )
            ph, pw = patch.shape[:2]
            padded[:ph, :pw] = patch
            patch = padded
        return patch, x0, y0, x1, y1

    def _local_keypoints(self, sid, x0, y0):
        """Collect annotations of ``sid`` inside the patch, in patch-local coords."""
        keypoints = []
        class_labels = []
        for cls in ["6nm", "12nm"]:
            for ax, ay in self.annotations[sid][cls]:
                lx = ax - x0
                ly = ay - y0
                if 0 <= lx < self.patch_size and 0 <= ly < self.patch_size:
                    keypoints.append((lx, ly))
                    class_labels.append(cls)
        return keypoints, class_labels

    def __getitem__(self, idx: int) -> dict:
        """
        Sample a patch with ground truth heatmap.

        The RNG is re-seeded from ``idx`` on every call, so ``idx`` selects a
        random patch rather than a fixed location.

        Returns dict with (shapes as documented for generate_heatmap_gt):
            'image': (1, patch_size, patch_size) float32 tensor in [0, 1]
            'heatmap': (2, patch_size//stride, patch_size//stride) float32
            'offsets': (2, patch_size//stride, patch_size//stride) float32
            'offset_mask': (patch_size//stride, patch_size//stride) bool
            'conf_map': (2, patch_size//stride, patch_size//stride) float32

        Raises:
            ValueError: if the dataset holds no images.
        """
        if not self.images:
            raise ValueError(
                f"ImmunogoldDataset(mode={self.mode!r}) has no images to sample from"
            )
        # Reseed RNG using idx so each call produces a unique patch.
        # The torch seed differs per DataLoader worker; the epoch term (0
        # unless set_epoch was called) varies patches across epochs.
        self.rng = np.random.default_rng(
            self._base_seed
            + idx
            + int(torch.initial_seed() % 100000)
            + self._EPOCH_SEED_STRIDE * getattr(self, "_epoch", 0)
        )
        sid, cx, cy = self._sample_center()
        patch, x0, y0, x1, y1 = self._extract_patch(self.images[sid], cx, cy)
        # Get annotations within this patch (patch-local coordinates)
        keypoints, class_labels = self._local_keypoints(sid, x0, y0)
        # Copy-paste augmentation (before geometric transforms)
        if self.copy_paste_per_class > 0 and self.mode == "train":
            local_6nm = [(x, y) for (x, y), c in zip(keypoints, class_labels) if c == "6nm"]
            local_12nm = [(x, y) for (x, y), c in zip(keypoints, class_labels) if c == "12nm"]
            mask_patch = None
            if sid in self.masks:
                mask_patch = self.masks[sid][y0:y1, x0:x1]
            patch, local_6nm, local_12nm, class_labels = self.bead_bank.paste_beads(
                patch, local_6nm, local_12nm, class_labels,
                mask=mask_patch,
                n_paste_per_class=self.copy_paste_per_class,
                rng=self.rng,
            )
            # Rebuild keypoints and labels so both are grouped by class.
            keypoints = list(local_6nm) + list(local_12nm)
            class_labels = ["6nm"] * len(local_6nm) + ["12nm"] * len(local_12nm)
        # Apply augmentation (co-transforms keypoints)
        transformed = self.transform(
            image=patch,
            keypoints=keypoints,
            class_labels=class_labels,
        )
        patch_aug = transformed["image"]
        kp_aug = transformed["keypoints"]
        cl_aug = transformed["class_labels"]
        # Separate keypoints by class
        coords_6nm = np.array(
            [(x, y) for (x, y), c in zip(kp_aug, cl_aug) if c == "6nm"],
            dtype=np.float64,
        ).reshape(-1, 2)
        coords_12nm = np.array(
            [(x, y) for (x, y), c in zip(kp_aug, cl_aug) if c == "12nm"],
            dtype=np.float64,
        ).reshape(-1, 2)
        # Generate heatmap GT from TRANSFORMED coordinates (never warp heatmap)
        heatmap, offsets, offset_mask, conf_map = generate_heatmap_gt(
            coords_6nm, coords_12nm,
            self.patch_size, self.patch_size,
            sigmas=self.sigmas,
            stride=self.stride,
        )
        # torch.from_numpy rejects negative strides, so force a contiguous
        # array in case a transform returned a flipped/rotated view.
        patch_tensor = (
            torch.from_numpy(np.ascontiguousarray(patch_aug)).float().unsqueeze(0) / 255.0
        )
        return {
            "image": patch_tensor,
            "heatmap": torch.from_numpy(heatmap),
            "offsets": torch.from_numpy(offsets),
            "offset_mask": torch.from_numpy(offset_mask),
            "conf_map": torch.from_numpy(conf_map),
        }