# MidasMap / src/dataset.py
# Uploaded by AnikS22 — "Deploy MidasMap Gradio app, src, requirements, checkpoint"
# Commit 86c24cb (verified)
"""
PyTorch Dataset for immunogold particle detection.
Implements patch-based training with:
- 70% hard mining (patches centered near particles)
- 30% random patches (background recognition)
- Copy-paste augmentation with Gaussian-blended bead bank
- Albumentations pipeline with keypoint co-transforms
"""
import random
from pathlib import Path
from typing import Dict, List, Optional, Tuple
import albumentations as A
import cv2
import numpy as np
import torch
from torch.utils.data import Dataset
from src.heatmap import generate_heatmap_gt
from src.preprocessing import (
SynapseRecord,
load_all_annotations,
load_image,
load_mask,
)
# ---------------------------------------------------------------------------
# Augmentation pipeline
# ---------------------------------------------------------------------------
def get_train_augmentation() -> A.Compose:
    """
    Training augmentation pipeline.

    Conservative intensity limits: contrast delta is only 11-39 units on uint8.
    DO NOT use Cutout/Mixup/JPEG artifacts — they destroy or mimic particles.
    """
    # Geometric transforms (keypoints are co-transformed by Compose)
    geometric = [
        A.RandomRotate90(p=1.0),  # EM is rotation invariant
        A.HorizontalFlip(p=0.5),
        A.VerticalFlip(p=0.5),
        # Only ±10° to avoid interpolation artifacts that destroy contrast
        A.Rotate(limit=10, border_mode=cv2.BORDER_REFLECT_101, p=0.5),
        # Mild elastic deformation (simulates section flatness variation)
        A.ElasticTransform(alpha=30, sigma=5, p=0.3),
    ]
    # Intensity transforms (image only)
    intensity = [
        A.RandomBrightnessContrast(
            brightness_limit=0.08,  # NOT default 0.2
            contrast_limit=0.08,
            p=0.7,
        ),
        A.GaussNoise(p=0.5),  # EM shot noise simulation
        A.GaussianBlur(blur_limit=(3, 3), p=0.2),  # simulate slight defocus
    ]
    return A.Compose(
        geometric + intensity,
        keypoint_params=A.KeypointParams(
            format="xy",
            remove_invisible=True,
            label_fields=["class_labels"],
        ),
    )
def get_val_augmentation() -> A.Compose:
    """No augmentation for validation — identity transform."""
    # Keypoint handling must match training so downstream code sees the
    # same dict keys regardless of mode.
    keypoint_params = A.KeypointParams(
        format="xy",
        remove_invisible=True,
        label_fields=["class_labels"],
    )
    return A.Compose([], keypoint_params=keypoint_params)
# ---------------------------------------------------------------------------
# Bead bank for copy-paste augmentation
# ---------------------------------------------------------------------------
class BeadBank:
    """
    Pre-extracted particle crops for copy-paste augmentation.

    Stores small patches centered on annotated particles from training
    images. During training, random beads are pasted onto patches to
    increase particle density and address class imbalance.
    """

    def __init__(self):
        # Crops keyed by particle class; each entry is (crop, half_size_px).
        self.crops: Dict[str, List[Tuple[np.ndarray, int]]] = {
            "6nm": [],
            "12nm": [],
        }
        # Square crop side length per class (px); 12nm beads need a larger window.
        self.crop_sizes = {"6nm": 32, "12nm": 48}

    def extract_from_image(
        self,
        image: np.ndarray,
        annotations: Dict[str, np.ndarray],
    ):
        """
        Extract bead crops from a training image.

        Args:
            image: 2-D grayscale uint8 image.
            annotations: class name -> (N, 2) array of (x, y) particle centers.

        Particles whose crop window would extend past the image border are
        skipped — only full-size crops are banked.
        """
        h, w = image.shape[:2]
        for cls, coords in annotations.items():
            crop_size = self.crop_sizes[cls]
            half = crop_size // 2
            for x, y in coords:
                xi, yi = int(round(x)), int(round(y))
                # Skip if too close to edge for a full crop
                if yi - half < 0 or yi + half > h or xi - half < 0 or xi + half > w:
                    continue
                crop = image[yi - half : yi + half, xi - half : xi + half].copy()
                # Shape check assumes a 2-D (grayscale) input image.
                if crop.shape == (crop_size, crop_size):
                    self.crops[cls].append((crop, half))

    def paste_beads(
        self,
        image: np.ndarray,
        coords_6nm: List[Tuple[float, float]],
        coords_12nm: List[Tuple[float, float]],
        class_labels: List[str],
        mask: Optional[np.ndarray] = None,
        n_paste_per_class: int = 5,
        rng: Optional[np.random.Generator] = None,
    ) -> Tuple[np.ndarray, List[Tuple[float, float]], List[Tuple[float, float]], List[str]]:
        """
        Paste random beads onto image with Gaussian alpha blending.

        Args:
            image: 2-D grayscale uint8 patch (the input is not modified;
                a copy is augmented and returned).
            coords_6nm / coords_12nm: existing particle centers per class.
            class_labels: existing labels; one label is appended per paste.
            mask: optional boolean tissue mask — pastes landing outside it
                are skipped.
            n_paste_per_class: max beads to paste per class.
            rng: numpy Generator (a fresh default_rng() if omitted).

        Returns:
            (augmented image, updated 6nm coords, updated 12nm coords,
            updated labels).
        """
        if rng is None:
            rng = np.random.default_rng()
        image = image.copy()
        h, w = image.shape[:2]
        new_coords_6nm = list(coords_6nm)
        new_coords_12nm = list(coords_12nm)
        new_labels = list(class_labels)
        for cls in ["6nm", "12nm"]:
            if not self.crops[cls]:
                continue
            crop_size = self.crop_sizes[cls]
            half = crop_size // 2
            # FIX: skip classes whose crop (plus the 5px margin) cannot fit
            # in this image — rng.integers(low, high) raises ValueError when
            # low >= high, which previously crashed on small patches.
            if half + 5 >= w - half - 5 or half + 5 >= h - half - 5:
                continue
            # The Gaussian alpha mask is identical for every paste of this
            # class — hoisted out of the per-paste loop.
            yy, xx = np.mgrid[:crop_size, :crop_size]
            center = crop_size / 2
            sigma = half * 0.7
            alpha = np.exp(-((xx - center) ** 2 + (yy - center) ** 2) / (2 * sigma ** 2))
            n_paste = min(n_paste_per_class, len(self.crops[cls]))
            for _ in range(n_paste):
                # Random paste location (within image bounds)
                px = rng.integers(half + 5, w - half - 5)
                py = rng.integers(half + 5, h - half - 5)
                # Skip if outside tissue mask
                if mask is not None:
                    if py >= mask.shape[0] or px >= mask.shape[1] or not mask[py, px]:
                        continue
                # Check minimum distance from existing particles (avoid overlap)
                too_close = False
                all_existing = new_coords_6nm + new_coords_12nm
                for ex, ey in all_existing:
                    if (ex - px) ** 2 + (ey - py) ** 2 < (half * 1.5) ** 2:
                        too_close = True
                        break
                if too_close:
                    continue
                # Select random crop
                crop, _ = self.crops[cls][rng.integers(len(self.crops[cls]))]
                # Blend the crop over the target region with the soft mask
                region = image[py - half : py + half, px - half : px + half]
                if region.shape != crop.shape:
                    continue
                blended = (alpha * crop + (1 - alpha) * region).astype(np.uint8)
                image[py - half : py + half, px - half : px + half] = blended
                # Record the new particle
                if cls == "6nm":
                    new_coords_6nm.append((float(px), float(py)))
                else:
                    new_coords_12nm.append((float(px), float(py)))
                new_labels.append(cls)
        return image, new_coords_6nm, new_coords_12nm, new_labels
# ---------------------------------------------------------------------------
# Dataset
# ---------------------------------------------------------------------------
class ImmunogoldDataset(Dataset):
    """
    Patch-based dataset for immunogold particle detection.

    Sampling strategy:
      - 70% of patches centered within 100px of a known particle (hard mining)
      - 30% of patches at random locations (background recognition)

    This ensures the model sees particles in nearly every batch despite
    particles occupying <0.1% of image area.
    """

    def __init__(
        self,
        records: List[SynapseRecord],
        fold_id: str,
        mode: str = "train",
        patch_size: int = 512,
        stride: int = 2,
        hard_mining_fraction: float = 0.7,
        copy_paste_per_class: int = 5,
        sigmas: Optional[Dict[str, float]] = None,
        samples_per_epoch: int = 200,
        seed: int = 42,
    ):
        """
        Args:
            records: all SynapseRecord entries
            fold_id: synapse_id to hold out (test set)
            mode: 'train' or 'val'
            patch_size: training patch size
            stride: model output stride
            hard_mining_fraction: fraction of patches near particles
            copy_paste_per_class: beads to paste per class
            sigmas: heatmap Gaussian sigmas per class
            samples_per_epoch: virtual epoch size
            seed: random seed
        """
        super().__init__()
        self.patch_size = patch_size
        self.stride = stride
        self.hard_mining_fraction = hard_mining_fraction
        # Copy-paste augmentation only applies to training patches.
        self.copy_paste_per_class = copy_paste_per_class if mode == "train" else 0
        self.sigmas = sigmas or {"6nm": 1.0, "12nm": 1.5}
        self.samples_per_epoch = samples_per_epoch
        self.mode = mode
        self._base_seed = seed
        self.rng = np.random.default_rng(seed)

        # Leave-one-synapse-out split: 'train' excludes fold_id, 'val' is
        # exactly fold_id, anything else keeps all records.
        if mode == "train":
            self.records = [r for r in records if r.synapse_id != fold_id]
        elif mode == "val":
            self.records = [r for r in records if r.synapse_id == fold_id]
        else:
            self.records = records

        # Pre-load all images and annotations into memory (~4MB each × 10 = 40MB)
        self.images = {}
        self.masks = {}
        self.annotations = {}
        for record in self.records:
            sid = record.synapse_id
            self.images[sid] = load_image(record.image_path)
            if record.mask_path:
                self.masks[sid] = load_mask(record.mask_path)
            self.annotations[sid] = load_all_annotations(record, self.images[sid].shape)

        # Build particle index for hard mining
        self._build_particle_index()

        # Build bead bank for copy-paste (training only)
        self.bead_bank = BeadBank()
        if mode == "train":
            for sid in self.images:
                self.bead_bank.extract_from_image(
                    self.images[sid], self.annotations[sid]
                )

        # Augmentation pipeline (identity transform for non-train modes)
        if mode == "train":
            self.transform = get_train_augmentation()
        else:
            self.transform = get_val_augmentation()

    def _build_particle_index(self):
        """Build flat index of all particles for hard mining."""
        self.particle_list = []  # (synapse_id, x, y, class)
        for sid, annots in self.annotations.items():
            for cls in ["6nm", "12nm"]:
                for x, y in annots[cls]:
                    self.particle_list.append((sid, x, y, cls))

    @staticmethod
    def worker_init_fn(worker_id: int):
        """Re-seed numpy's global RNG per DataLoader worker to avoid
        identical sequences across workers.

        NOTE: this seeds np.random (global), not the dataset's own
        Generator — __getitem__ reseeds self.rng per sample itself.
        """
        # torch is already imported at module level; no local import needed.
        seed = torch.initial_seed() % (2**32) + worker_id
        np.random.seed(seed)

    def __len__(self) -> int:
        # Virtual epoch length — patches are sampled, not enumerated.
        return self.samples_per_epoch

    def _sample_center(self) -> Tuple[str, int, int]:
        """Pick (synapse_id, cx, cy): hard-mined near a particle with jitter,
        or a uniformly random location. Caller clamps to image bounds."""
        do_hard = (self.rng.random() < self.hard_mining_fraction
                   and len(self.particle_list) > 0
                   and self.mode == "train")
        if do_hard:
            # Pick random particle, center patch on it with jitter
            pidx = self.rng.integers(len(self.particle_list))
            sid, px, py, _ = self.particle_list[pidx]
            jitter = 128  # jitter center up to 128px
            cx = int(px + self.rng.integers(-jitter, jitter + 1))
            cy = int(py + self.rng.integers(-jitter, jitter + 1))
        else:
            # Random image and location
            sid = list(self.images.keys())[self.rng.integers(len(self.images))]
            h, w = self.images[sid].shape[:2]
            half = self.patch_size // 2
            # FIX: rng.integers(low, high) raises when low >= high, which
            # happened for images no larger than the patch. Fall back to the
            # only valid (clamped) center in that case.
            cx = int(self.rng.integers(half, w - half)) if w - half > half else half
            cy = int(self.rng.integers(half, h - half)) if h - half > half else half
        return sid, cx, cy

    def _local_keypoints(
        self, sid: str, x0: int, y0: int
    ) -> Tuple[List[Tuple[float, float]], List[str]]:
        """Collect annotations falling inside the patch, converted to
        patch-local coordinates, plus their parallel class labels."""
        keypoints: List[Tuple[float, float]] = []
        class_labels: List[str] = []
        for cls in ["6nm", "12nm"]:
            for ax, ay in self.annotations[sid][cls]:
                lx = ax - x0
                ly = ay - y0
                if 0 <= lx < self.patch_size and 0 <= ly < self.patch_size:
                    keypoints.append((lx, ly))
                    class_labels.append(cls)
        return keypoints, class_labels

    def __getitem__(self, idx: int) -> dict:
        """
        Sample a patch with ground truth heatmap.

        Returns dict with:
            'image': (1, patch_size, patch_size) float32 tensor
            'heatmap': (2, patch_size//stride, patch_size//stride) float32
            'offsets': (2, patch_size//stride, patch_size//stride) float32
            'offset_mask': (patch_size//stride, patch_size//stride) bool
            'conf_map': (2, patch_size//stride, patch_size//stride) float32
        """
        # Reseed RNG using idx so each call produces a unique patch.
        # Without this, the same 200 patches repeat every epoch → instant
        # overfitting. torch.initial_seed() differs per worker/epoch.
        self.rng = np.random.default_rng(
            self._base_seed + idx + int(torch.initial_seed() % 100000)
        )
        sid, cx, cy = self._sample_center()
        image = self.images[sid]
        h, w = image.shape[:2]
        half = self.patch_size // 2
        # Clamp center so the patch stays within image bounds
        cx = max(half, min(w - half, cx))
        cy = max(half, min(h - half, cy))
        x0, x1 = cx - half, cx + half
        y0, y1 = cy - half, cy + half
        patch = image[y0:y1, x0:x1].copy()
        # Zero-pad if the source image is smaller than the patch (edge cases)
        if patch.shape[0] != self.patch_size or patch.shape[1] != self.patch_size:
            padded = np.zeros((self.patch_size, self.patch_size), dtype=np.uint8)
            ph, pw = patch.shape[:2]
            padded[:ph, :pw] = patch
            patch = padded

        # Annotations inside this patch, in patch-local coordinates
        keypoints, class_labels = self._local_keypoints(sid, x0, y0)

        # Copy-paste augmentation (before geometric transforms)
        if self.copy_paste_per_class > 0 and self.mode == "train":
            local_6nm = [(x, y) for (x, y), c in zip(keypoints, class_labels) if c == "6nm"]
            local_12nm = [(x, y) for (x, y), c in zip(keypoints, class_labels) if c == "12nm"]
            mask_patch = self.masks[sid][y0:y1, x0:x1] if sid in self.masks else None
            patch, local_6nm, local_12nm, class_labels = self.bead_bank.paste_beads(
                patch, local_6nm, local_12nm, class_labels,
                mask=mask_patch,
                n_paste_per_class=self.copy_paste_per_class,
                rng=self.rng,
            )
            # Rebuild keypoints/labels from the updated per-class coords
            keypoints = list(local_6nm) + list(local_12nm)
            class_labels = ["6nm"] * len(local_6nm) + ["12nm"] * len(local_12nm)

        # Apply augmentation (co-transforms keypoints)
        transformed = self.transform(
            image=patch,
            keypoints=keypoints,
            class_labels=class_labels,
        )
        patch_aug = transformed["image"]
        kp_aug = transformed["keypoints"]
        cl_aug = transformed["class_labels"]

        # Separate keypoints by class
        coords_6nm = np.array(
            [(x, y) for (x, y), c in zip(kp_aug, cl_aug) if c == "6nm"],
            dtype=np.float64,
        ).reshape(-1, 2)
        coords_12nm = np.array(
            [(x, y) for (x, y), c in zip(kp_aug, cl_aug) if c == "12nm"],
            dtype=np.float64,
        ).reshape(-1, 2)

        # Generate heatmap GT from TRANSFORMED coordinates (never warp heatmap)
        heatmap, offsets, offset_mask, conf_map = generate_heatmap_gt(
            coords_6nm, coords_12nm,
            self.patch_size, self.patch_size,
            sigmas=self.sigmas,
            stride=self.stride,
        )

        # Normalize uint8 → [0, 1] float and add a channel dimension
        patch_tensor = torch.from_numpy(patch_aug).float().unsqueeze(0) / 255.0
        return {
            "image": patch_tensor,
            "heatmap": torch.from_numpy(heatmap),
            "offsets": torch.from_numpy(offsets),
            "offset_mask": torch.from_numpy(offset_mask),
            "conf_map": torch.from_numpy(conf_map),
        }