Spaces:

muhammadhabibna
/

glaucoma-api-idsc

Sleeping

App Files Files Community

glaucoma-api-idsc / preprocessing.py

muhammadhabibna

Fix(critical): Pretrained ImageNet CNN Weights and Strict Clinical Validation Gates

329abd1 3 months ago

Raw

History Blame Contribute Delete

16 kB

	"""
	preprocessing.py
	Multi-gate fundus validation + preprocessing pipeline.

	Gate 1 — Fundus Shape Gate:
	Retinal fundus photos have a distinct circular/oval bright region
	on a very dark (near-black) background. Non-fundus images fail this.

	Gate 2 — Color Profile Gate:
	Fundus images are dominated by warm reddish-orange tones (blood vessels,
	retinal tissue). Screenshots, selfies, and random photos fail this.

	Gate 3 — Quality Gate:
	Sharpness measured via Laplacian variance inside the fundus ROI.
	Low sharpness = blurry / out-of-focus scan → reject.

	Inference transform (no augmentation, exact test_transform from notebook):
	Resize 380×380 → ImageNet Normalize → Tensor
	"""

	import cv2
	import numpy as np
	import base64
	from PIL import Image
	import albumentations as A
	from albumentations.pytorch import ToTensorV2

	# Side length (pixels) that both transforms below resize to.
	IMG_SIZE = 380 # EfficientNet-B4 input size
	# Side length (pixels) of the `cdr_img_rgb` image produced by preprocess_image.
	CDR_SIZE = 512 # Notebook Step 4: CDR computed on 512×512
	# Per-channel mean / std handed to A.Normalize in test_transform.
	IMAGENET_MEAN = [0.485, 0.456, 0.406]
	IMAGENET_STD = [0.229, 0.224, 0.225]

	# ─── Inference transform (described as the notebook's exact test_transform) ──
	# Resize to IMG_SIZE×IMG_SIZE, normalize with the statistics above, then
	# convert to a tensor. preprocess_image stores the result under 'tensor'.
	test_transform = A.Compose([
	A.Resize(IMG_SIZE, IMG_SIZE),
	A.Normalize(mean=IMAGENET_MEAN, std=IMAGENET_STD),
	ToTensorV2()
	])

	# ─── Display transform: resize + CLAHE (always applied), no normalization ────
	# preprocess_image encodes the result as the 'preprocessed_b64' preview image.
	display_transform = A.Compose([
	A.Resize(IMG_SIZE, IMG_SIZE),
	A.CLAHE(clip_limit=2.0, p=1.0),
	])


	# ═══════════════════════════════════════════════════════════════════════════
	# GATE 1 — Fundus Shape Gate
	# ═══════════════════════════════════════════════════════════════════════════

	def check_fundus_shape(img_rgb: np.ndarray) -> tuple:
	    """
	    Gate 1: decide whether the image looks like a retinal fundus photo,
	    i.e. a roughly round bright region surrounded by a near-black border.

	    Checks, in order (the first failure returns immediately with score 0.0):
	      a) Dark border: at least 20% of all pixels must have a LAB lightness
	         channel value below 30.
	      b) Bright region: lightness is thresholded at 30, the mask is cleaned
	         with a 15x15 elliptical close followed by an open, and the largest
	         external contour must cover between 15% and 80% of the image area.
	      c) Roundness: the bounding box of that contour must have a
	         width/height ratio between 0.7 and 1.3.

	    Returns: (passed: bool, reason: str, score: float 0–1)
	        On success the reason is "OK" and the score is the mean of a
	        dark-border score (saturating once 40% of pixels are dark) and a
	        circularity score (1.0 for a square bounding box, falling to 0.0 at
	        the 0.7 / 1.3 limits), rounded to three decimals.
	    """
	    rows, cols = img_rgb.shape[:2]
	    total_pixels = rows * cols

	    lightness = cv2.cvtColor(img_rgb, cv2.COLOR_RGB2LAB)[:, :, 0]

	    # ── a) Dark border check ─────────────────────────────────────────────
	    dark_ratio = np.sum(lightness < 30) / total_pixels
	    if dark_ratio < 0.20:
	        # Too little near-black surround for a camera-aperture border.
	        return (
	            False,
	            f"Tidak terdeteksi sebagai foto fundus retina (dark border terlalu kecil: {dark_ratio:.0%})",
	            0.0,
	        )

	    # ── b) Bright region check ───────────────────────────────────────────
	    _, bright_mask = cv2.threshold(lightness, 30, 255, cv2.THRESH_BINARY)
	    kernel = cv2.getStructuringElement(cv2.MORPH_ELLIPSE, (15, 15))
	    # Close first (fill small holes), then open (drop small specks).
	    for morph_op in (cv2.MORPH_CLOSE, cv2.MORPH_OPEN):
	        bright_mask = cv2.morphologyEx(bright_mask, morph_op, kernel)

	    contours, _ = cv2.findContours(bright_mask, cv2.RETR_EXTERNAL, cv2.CHAIN_APPROX_SIMPLE)
	    if not contours:
	        return False, "Tidak ditemukan region cerah (bukan foto fundus retina)", 0.0

	    largest = max(contours, key=cv2.contourArea)
	    bright_ratio = cv2.contourArea(largest) / total_pixels

	    if bright_ratio < 0.15:
	        return False, f"Region retina terlalu kecil (area: {bright_ratio:.0%} dari gambar)", 0.0
	    if bright_ratio > 0.80:
	        return (
	            False,
	            f"Seluruh gambar terang — bukan foto fundus dengan bingkai hitam ({bright_ratio:.0%})",
	            0.0,
	        )

	    # ── c) Roundness check on the bounding box ───────────────────────────
	    _, _, box_w, box_h = cv2.boundingRect(largest)
	    if box_h > 0:
	        aspect = box_w / box_h
	    else:
	        aspect = 0
	    if not (0.7 <= aspect <= 1.3):
	        return (
	            False,
	            f"Bentuk region tidak bulat sempurna (aspect ratio: {aspect:.2f}) — bukan fundus retina",
	            0.0,
	        )

	    # ── Score: mean of dark-border score and circularity score ───────────
	    dark_score = min(dark_ratio / 0.40, 1.0)
	    circ_score = 1.0 - abs(aspect - 1.0) / 0.3  # 1.0 when the box is square
	    mean_score = (dark_score + circ_score) / 2
	    shape_score = round(max(mean_score, 0.0), 3)

	    return True, "OK", shape_score


	# ═══════════════════════════════════════════════════════════════════════════
	# GATE 2 — Color Profile Gate
	# ═══════════════════════════════════════════════════════════════════════════

	def check_fundus_color(img_rgb: np.ndarray) -> tuple:
	    """
	    Gate 2: verify the image has the warm reddish-orange colour profile
	    typical of retinal fundus photography.

	    Only pixels with HSV value > 40 are analysed (near-black pixels are
	    ignored). Within those pixels:
	      * the mean saturation must be at least 35, and
	      * at least 35% of the pixels must have a "warm" hue, meaning an
	        OpenCV hue of 0–35 (red through orange-yellow) or 160 and above
	        (red wrapping around the end of the hue scale).

	    Each pixel is counted at most once, so the warm ratio always lies in
	    [0, 1].

	    Assumes img_rgb is an 8-bit RGB image (so hue follows OpenCV's 8-bit
	    HSV convention) — confirm against the caller if other dtypes are used.

	    Returns: (passed: bool, reason: str, score: float 0–1)
	        On success the reason is "OK" and the score is
	        min(warm_ratio / 0.60, 1) * min(mean_saturation / 90, 1),
	        rounded to three decimals. On failure the score is 0.0.
	    """
	    img_hsv = cv2.cvtColor(img_rgb, cv2.COLOR_RGB2HSV)
	    H = img_hsv[:, :, 0]
	    S = img_hsv[:, :, 1]
	    V = img_hsv[:, :, 2]

	    # Only look at pixels that aren't near-black (part of the fundus ROI)
	    roi_mask = V > 40
	    if roi_mask.sum() < 1000:
	        return False, "Gambar terlalu gelap untuk dianalisis warnanya", 0.0

	    H_roi = H[roi_mask]
	    S_roi = S[roi_mask]

	    # ── Warm hue check ───────────────────────────────────────────────────
	    # One union mask: red/orange/orange-yellow (hue <= 35) plus the red
	    # wrap-around (hue >= 160). Summing two overlapping masks would count
	    # hues 11–20 twice and push the ratio above 100%.
	    warm_mask = (H_roi <= 35) | (H_roi >= 160)
	    warm_ratio = np.count_nonzero(warm_mask) / warm_mask.size

	    # ── Saturation check ─────────────────────────────────────────────────
	    mean_saturation = S_roi.mean()

	    # Grayscale images or weakly colored diagrams: saturation is low
	    if mean_saturation < 35:
	        return False, f"Gambar tidak memiliki ketajaman warna fundus (saturasi: {mean_saturation:.0f} < 35)", 0.0

	    if warm_ratio < 0.35:
	        return False, (
	            f"Warna tidak dominan merah/oranye fundus "
	            f"(warm hue: {warm_ratio:.0%}, harusnya ≥35%). "
	            f"Bukan foto medis retina yang valid."
	        ), 0.0

	    color_score = round(min(warm_ratio / 0.60, 1.0) * min(mean_saturation / 90, 1.0), 3)
	    return True, "OK", color_score


	# ═══════════════════════════════════════════════════════════════════════════
	# GATE 3 — Quality Gate (Sharpness within fundus ROI)
	# ═══════════════════════════════════════════════════════════════════════════

	def compute_quality_score(img_rgb: np.ndarray) -> float:
	    """
	    Gate 3: sharpness-based quality score on a 1–5 scale.

	    The image is converted to grayscale and resized to 300x300, and the
	    variance of its Laplacian is taken over the bright region (LAB
	    lightness above 30, resized the same way). If the resized mask sums to
	    5000 or less, the variance of the whole Laplacian is used instead.

	    The variance is printed and then mapped to a score:
	        < 3.0 → 1.0, < 8.0 → 2.0, < 15.0 → 3.0, < 30.0 → 4.0, else 5.0

	    The caller treats scores below 3 as a rejection.
	    """
	    target_size = (300, 300)

	    lightness = cv2.cvtColor(img_rgb, cv2.COLOR_RGB2LAB)[:, :, 0]
	    _, bright_region = cv2.threshold(lightness, 30, 255, cv2.THRESH_BINARY)
	    region_small = cv2.resize(bright_region, target_size)

	    gray_small = cv2.resize(cv2.cvtColor(img_rgb, cv2.COLOR_RGB2GRAY), target_size)
	    laplacian = cv2.Laplacian(gray_small, cv2.CV_64F)

	    # Prefer the bright region; fall back to the full image when the mask
	    # is (almost) empty.
	    has_region = region_small.sum() > 5000
	    lap_var = laplacian[region_small > 0].var() if has_region else laplacian.var()

	    print(f"[Preprocessing] Laplacian Variance (ROI): {lap_var:.2f}")

	    # (exclusive upper bound on the variance, score awarded below it)
	    score_bands = (
	        (3.0, 1.0),   # Extremely blurry
	        (8.0, 2.0),   # Blurry → reject
	        (15.0, 3.0),  # Acceptable
	        (30.0, 4.0),  # Good
	    )
	    for upper_bound, score in score_bands:
	        if lap_var < upper_bound:
	            return score
	    return 5.0  # Excellent


	# ═══════════════════════════════════════════════════════════════════════════
	# Auto-crop Fundus ROI
	# ═══════════════════════════════════════════════════════════════════════════

	def auto_crop_fundus(img_rgb: np.ndarray) -> np.ndarray:
	    """
	    Crop the image to the bounding box of its largest bright region.

	    The bright region is found by thresholding LAB lightness at 30 and
	    cleaning the mask with a 20x20 elliptical close followed by an open.
	    The bounding box of the largest external contour is grown by 10 pixels
	    on every side and clipped to the image bounds.

	    Returns the input image unchanged when no contour is found or the crop
	    would be empty.
	    """
	    lightness = cv2.cvtColor(img_rgb, cv2.COLOR_RGB2LAB)[:, :, 0]
	    _, region_mask = cv2.threshold(lightness, 30, 255, cv2.THRESH_BINARY)

	    kernel = cv2.getStructuringElement(cv2.MORPH_ELLIPSE, (20, 20))
	    for morph_op in (cv2.MORPH_CLOSE, cv2.MORPH_OPEN):
	        region_mask = cv2.morphologyEx(region_mask, morph_op, kernel)

	    contours, _ = cv2.findContours(region_mask, cv2.RETR_EXTERNAL, cv2.CHAIN_APPROX_SIMPLE)
	    if not contours:
	        return img_rgb

	    box_x, box_y, box_w, box_h = cv2.boundingRect(max(contours, key=cv2.contourArea))

	    margin = 10
	    img_h, img_w = img_rgb.shape[0], img_rgb.shape[1]
	    left = max(0, box_x - margin)
	    top = max(0, box_y - margin)
	    right = min(img_w, box_x + box_w + margin)
	    bottom = min(img_h, box_y + box_h + margin)

	    cropped = img_rgb[top:bottom, left:right]
	    if cropped.size > 0:
	        return cropped
	    return img_rgb


	# ═══════════════════════════════════════════════════════════════════════════
	# Main Preprocessing Pipeline
	# ═══════════════════════════════════════════════════════════════════════════

	def preprocess_image(img_bytes: bytes) -> dict:
	    """
	    Full multi-gate preprocessing pipeline for an uploaded image.

	    Gate 1 — Fundus Shape: circular bright region on dark background
	    Gate 2 — Color Profile: reddish-orange dominant (retinal tissue)
	    Gate 3 — Quality: sharpness score ≥ 3.0 inside fundus ROI

	    The gates run in that order and the first failure short-circuits into
	    a rejection dict. When all gates pass, the image is cropped to the
	    fundus region and the display images, model tensor and CDR image are
	    built from that crop.

	    Args:
	        img_bytes: encoded image file contents.

	    Returns dict with:
	        passed_gate      : bool
	        gate_failed      : str | None ('shape' | 'color' | 'quality' | None)
	        rejection_reason : str | None
	        quality_score    : float (1–5; 0.0 if the quality gate was not reached)
	        shape_score      : float (0–1)
	        color_score      : float (0–1)
	        original_b64, preprocessed_b64, tensor, cdr_img_rgb
	        (tensor and cdr_img_rgb are None on rejection)

	    Raises:
	        ValueError: if img_bytes is empty/None or cannot be decoded as an
	            image.
	    """
	    # ── Decode ───────────────────────────────────────────────────────────
	    # Reject an empty upload up front with the same ValueError used for
	    # undecodable data, instead of handing an empty buffer to cv2.imdecode.
	    if not img_bytes:
	        raise ValueError("Tidak dapat membaca gambar. Upload file JPEG/PNG yang valid.")
	    nparr = np.frombuffer(img_bytes, np.uint8)
	    img_bgr = cv2.imdecode(nparr, cv2.IMREAD_COLOR)
	    if img_bgr is None:
	        raise ValueError("Tidak dapat membaca gambar. Upload file JPEG/PNG yang valid.")
	    img_rgb = cv2.cvtColor(img_bgr, cv2.COLOR_BGR2RGB)

	    # ── Gate 1: Fundus Shape ─────────────────────────────────────────────
	    shape_ok, shape_reason, shape_score = check_fundus_shape(img_rgb)
	    print(f"[Gate 1 - Shape] passed={shape_ok}, score={shape_score}, reason={shape_reason}")
	    if not shape_ok:
	        return _rejection_response(img_rgb, 'shape', shape_reason, shape_score, 0.0, 0.0)

	    # ── Gate 2: Color Profile ────────────────────────────────────────────
	    color_ok, color_reason, color_score = check_fundus_color(img_rgb)
	    print(f"[Gate 2 - Color] passed={color_ok}, score={color_score}, reason={color_reason}")
	    if not color_ok:
	        return _rejection_response(img_rgb, 'color', color_reason, shape_score, color_score, 0.0)

	    # ── Gate 3: Quality ──────────────────────────────────────────────────
	    quality_score = compute_quality_score(img_rgb)
	    quality_ok = quality_score >= 3.0
	    print(f"[Gate 3 - Quality] passed={quality_ok}, score={quality_score}/5.0")
	    if not quality_ok:
	        reason = (
	            f"Kualitas gambar terlalu rendah (skor {quality_score}/5.0). "
	            f"Gambar terlalu blur atau tidak fokus. Gunakan hasil scan fundus yang jelas."
	        )
	        return _rejection_response(img_rgb, 'quality', reason, shape_score, color_score, quality_score)

	    # ── All gates passed → process ───────────────────────────────────────
	    cropped = auto_crop_fundus(img_rgb)

	    # Plain resized crop shown as the "original" preview.
	    original_display = cv2.resize(cropped, (IMG_SIZE, IMG_SIZE))
	    original_b64 = ndarray_to_b64(original_display)

	    # Resized + CLAHE-enhanced crop shown as the "preprocessed" preview.
	    display_result = display_transform(image=cropped)
	    preprocessed_b64 = ndarray_to_b64(display_result['image'])

	    # Normalized tensor for the classifier.
	    test_result = test_transform(image=cropped)
	    tensor = test_result['image']

	    # Separate CDR_SIZE×CDR_SIZE copy for the CDR computation.
	    cdr_img_rgb = cv2.resize(cropped, (CDR_SIZE, CDR_SIZE))

	    return {
	        'passed_gate': True,
	        'gate_failed': None,
	        'rejection_reason': None,
	        'quality_score': quality_score,
	        'shape_score': shape_score,
	        'color_score': color_score,
	        'original_b64': original_b64,
	        'preprocessed_b64': preprocessed_b64,
	        'tensor': tensor,
	        'cdr_img_rgb': cdr_img_rgb,
	    }


	def _rejection_response(img_rgb: np.ndarray, gate: str, reason: str,
	                        shape_score: float, color_score: float,
	                        quality_score: float) -> dict:
	    """
	    Build the result dict for an image that failed a validation gate.

	    The dict has the same keys as a successful result. 'passed_gate' is
	    False, 'gate_failed' and 'rejection_reason' carry the given gate name
	    and message, the three scores are passed through, and 'tensor' /
	    'cdr_img_rgb' are None. Both preview fields hold the same base64 JPEG
	    of the upload resized to IMG_SIZE×IMG_SIZE, so the user still sees
	    what they submitted.
	    """
	    preview_b64 = ndarray_to_b64(cv2.resize(img_rgb, (IMG_SIZE, IMG_SIZE)))

	    response = {
	        'passed_gate': False,
	        'gate_failed': gate,
	        'rejection_reason': reason,
	        'quality_score': quality_score,
	        'shape_score': shape_score,
	        'color_score': color_score,
	    }
	    # No processed image exists on rejection, so reuse the same thumbnail
	    # for both preview fields.
	    response['original_b64'] = preview_b64
	    response['preprocessed_b64'] = preview_b64
	    response['tensor'] = None
	    response['cdr_img_rgb'] = None
	    return response


	def ndarray_to_b64(img_rgb: np.ndarray) -> str:
	    """
	    Encode an RGB image array as a base64 string of its JPEG bytes.

	    The array is converted from RGB to BGR channel order, JPEG-encoded at
	    quality 90, and the encoded bytes are returned as a base64 UTF-8
	    string.
	    """
	    jpeg_params = [cv2.IMWRITE_JPEG_QUALITY, 90]
	    bgr_image = cv2.cvtColor(img_rgb, cv2.COLOR_RGB2BGR)
	    _, jpeg_buffer = cv2.imencode('.jpg', bgr_image, jpeg_params)
	    encoded = base64.b64encode(jpeg_buffer)
	    return encoded.decode('utf-8')