Spaces:

Kinzaaa
/

flood-risk-detection

Sleeping

flood-risk-detection / app /model_utils.py

Kinzaaa

Initial deployment: Attention UNet + ZoeDepth + Grad-CAM + Risk Assessment

3fd6082 28 days ago

21.8 kB

	"""
	model_utils.py — loads the .pkl metadata + .keras model and exposes inference helpers.
	ZoeDepth is loaded from HuggingFace Hub (CPU) for flood depth estimation.

	PKL structure (from flood_model_production.pkl):
	model_name, model_keras_path, input_shape, output_shape, threshold,
	preprocessing, gradcam_layer, metrics, risk_thresholds, custom_objects_keys
	"""
	import os
	import pickle
	import numpy as np
	import cv2
	import tensorflow as tf
	from PIL import Image
	import torch

	# ── HuggingFace token ──────────────────────────────────────────────────────────
	# Taken from the HF_TOKEN environment variable at import time; an empty string
	# means no token was supplied. Keep secrets out of the source tree.
	HF_TOKEN = os.getenv("HF_TOKEN", "")

	# ── Custom Keras objects ───────────────────────────────────────────────────────
	def iou_metric(y_true, y_pred):
	    """
	    Intersection-over-union between y_true and y_pred binarised at 0.5.

	    Sums are taken over every element of the tensors (no per-sample axis),
	    and 1e-7 is added to the denominator so an empty union does not divide
	    by zero.
	    """
	    hard_pred = tf.cast(y_pred > 0.5, tf.float32)
	    overlap = tf.reduce_sum(y_true * hard_pred)
	    combined = tf.reduce_sum(y_true) + tf.reduce_sum(hard_pred)
	    return overlap / (combined - overlap + 1e-7)

	def dice_loss(y_true, y_pred, smooth=1e-7):
	    """
	    Soft Dice loss: 1 - (2·|A∩B| + smooth) / (|A| + |B| + smooth).

	    Uses the raw (un-thresholded) predictions; `smooth` is added to both the
	    numerator and the denominator.
	    """
	    overlap = tf.reduce_sum(y_true * y_pred)
	    numerator = 2.0 * overlap + smooth
	    denominator = tf.reduce_sum(y_true) + tf.reduce_sum(y_pred) + smooth
	    return 1.0 - numerator / denominator

	def bce_dice_loss(y_true, y_pred):
	    """Sum of Keras binary cross-entropy and the soft Dice loss."""
	    return tf.keras.losses.binary_crossentropy(y_true, y_pred) + dice_loss(
	        y_true, y_pred
	    )

	# Name → callable registry passed as `custom_objects` when the Keras model is
	# loaded; each key is the function's own name.
	CUSTOM_OBJECTS = {
	    fn.__name__: fn for fn in (iou_metric, dice_loss, bce_dice_loss)
	}

	# Size handed to the PIL / OpenCV resize calls throughout this module.
	IMAGE_SIZE = (512, 512)

	# ── Singletons ─────────────────────────────────────────────────────────────────
	# Lazily-filled module caches; each stays None until its loader first runs:
	#   _seg_model — Attention UNet (TF/Keras)
	#   _zoe_model — ZoeDepth (PyTorch, CPU)
	#   _metadata  — dict from pkl
	_seg_model = _zoe_model = _metadata = None


	# ── Metadata ───────────────────────────────────────────────────────────────────
	def _load_metadata() -> dict:
	    """
	    Return the model metadata, reading it from disk on first use.

	    The path comes from the MODEL_PKL environment variable (default
	    "models/flood_model_production.pkl"). When no file exists at that path an
	    empty dict is cached instead, so callers fall back to their own defaults.
	    """
	    global _metadata
	    if _metadata is None:
	        pkl_path = os.environ.get("MODEL_PKL", "models/flood_model_production.pkl")
	        if not os.path.exists(pkl_path):
	            _metadata = {}
	        else:
	            # NOTE(security): pickle.load executes code embedded in the file —
	            # MODEL_PKL must only ever point at a trusted artefact.
	            with open(pkl_path, "rb") as handle:
	                _metadata = pickle.load(handle)
	    return _metadata


	# ── Attention UNet loader ──────────────────────────────────────────────────────
	def load_seg_model():
	    """
	    Return the cached segmentation model, loading it on first call.

	    The file path is read from the MODEL_KERAS environment variable (default
	    "models/flood_best_model_export.keras") and the model is loaded with
	    CUSTOM_OBJECTS so the custom loss/metric names resolve.

	    Raises:
	    FileNotFoundError — nothing exists at the resolved path.
	    """
	    global _seg_model
	    if _seg_model is None:
	        keras_path = os.environ.get(
	            "MODEL_KERAS", "models/flood_best_model_export.keras"
	        )
	        if not os.path.exists(keras_path):
	            message = (
	                f"Keras model not found at '{keras_path}'. "
	                "Set MODEL_KERAS env var to the correct path."
	            )
	            raise FileNotFoundError(message)
	        _seg_model = tf.keras.models.load_model(
	            keras_path, custom_objects=CUSTOM_OBJECTS
	        )
	    return _seg_model


	# ── ZoeDepth loader (CPU, HF Hub) ─────────────────────────────────────────────
	def load_zoe_model():
	    """
	    Return the cached depth-estimation pipeline, building it on first call.

	    Creates a `transformers` "depth-estimation" pipeline for the
	    "Intel/zoedepth-nyu" checkpoint, pinned to the CPU. `transformers` is
	    imported only when the pipeline actually has to be built. The token is
	    HF_TOKEN as read at import time, else the current HF_TOKEN environment
	    variable; when neither is set, None is passed.
	    """
	    global _zoe_model
	    if _zoe_model is None:
	        from transformers import pipeline as hf_pipeline

	        token = HF_TOKEN or os.environ.get("HF_TOKEN", "")

	        print("[ZoeDepth] Loading from HuggingFace Hub (CPU)...")
	        _zoe_model = hf_pipeline(
	            task="depth-estimation",
	            model="Intel/zoedepth-nyu",
	            device="cpu",  # never place the model on an accelerator
	            token=token or None,
	        )
	        print("[ZoeDepth] Loaded OK.")
	    return _zoe_model


	# ── Preprocessing ──────────────────────────────────────────────────────────────
	def preprocess_image(image: Image.Image) -> np.ndarray:
	    """
	    Turn a PIL image into the network's input batch.

	    The image is converted to RGB, resized to IMAGE_SIZE, scaled to [0, 1] as
	    float32 and given a leading batch axis, yielding shape (1, H, W, 3).
	    """
	    resized = image.convert("RGB").resize(IMAGE_SIZE)
	    pixels = np.asarray(resized, dtype=np.float32)
	    scaled = pixels / 255.0
	    return scaled[np.newaxis, ...]  # (1, H, W, 3)


	# ── OOD / scene validation ─────────────────────────────────────────────────────
	def _is_flood_scene(image: Image.Image, pred: np.ndarray, threshold: float) -> tuple:
	    """
	    Heuristic gate that flags out-of-distribution (non-flood) images.

	    Checks run in this order and the first failure wins:
	    1. Brightness — mean RGB intensity below 15 or above 240 is rejected.
	    2. Spatial coherence — when more than 0.5% of pixels are flooded, the mask
	       is rejected if its largest connected region holds under 25% of the
	       flood pixels AND there are at least 50 separate regions.
	    3. Coverage — more than 90% of pixels flooded is rejected.
	    4. Colour cross-check — more than 40% flooded while under 15% of the image
	       has water-like colours (blue, low-saturation grey, brown) is rejected.

	    Args:
	    image     : source PIL image (used only for colour statistics)
	    pred      : 2-D array of per-pixel flood scores from the model
	    threshold : score above which a pixel counts as flooded

	    Returns:
	    is_valid : bool — True if the image passed every check
	    reason   : str — explanation when invalid, "" otherwise
	    """
	    img_rgb = np.array(image.convert("RGB").resize(IMAGE_SIZE), dtype=np.float32)
	    mask = (pred > threshold).astype(np.uint8)

	    # ── Check 1: overall brightness ───────────────────────────────────────────
	    # Average of the three per-channel means (0–255 scale).
	    brightness = float(img_rgb.mean(axis=(0, 1)).mean())
	    if brightness < 15 or brightness > 240:
	        return False, "Image too dark or too bright for flood analysis"

	    # ── Check 2: spatial coherence of the predicted mask ──────────────────────
	    flood_pct = float(mask.mean() * 100)

	    if flood_pct > 0.5:  # below this there is nothing meaningful to analyse
	        num_labels, _, stats, _ = cv2.connectedComponentsWithStats(
	            mask, connectivity=8
	        )
	        # Label 0 is the background, so it is not a flood region.
	        n_regions = num_labels - 1
	        if n_regions > 0:
	            largest_area = int(stats[1:, cv2.CC_STAT_AREA].max())
	            total_flood_px = int(mask.sum())
	            # Fraction of all flood pixels that sit in the biggest region.
	            coherence = largest_area / (total_flood_px + 1e-8)

	            if coherence < 0.25 and n_regions >= 50:
	                return False, (
	                    f"Flood mask is fragmented ({n_regions} disconnected regions)"
	                    " — likely not a flood scene"
	                )

	    # ── Check 3: implausibly high coverage ────────────────────────────────────
	    if flood_pct > 90:
	        return False, (
	            f"Flood coverage {flood_pct:.1f}% is implausibly high"
	            " — image may not be a flood scene"
	        )

	    # ── Check 4: colour / coverage cross-check ────────────────────────────────
	    if flood_pct > 40:
	        hsv = cv2.cvtColor(img_rgb.astype(np.uint8), cv2.COLOR_RGB2HSV)
	        hue = hsv[:, :, 0]  # 0-179 in OpenCV
	        sat = hsv[:, :, 1]  # 0-255

	        # Water-like colours: blue (hue 100-130), grey (any hue, low
	        # saturation) and brown (hue 8-22).
	        blue_mask = (hue >= 100) & (hue <= 130) & (sat > 30)
	        grey_mask = sat < 40
	        brown_mask = (hue >= 8) & (hue <= 22) & (sat > 40)
	        water_px = float((blue_mask | grey_mask | brown_mask).mean() * 100)

	        if water_px < 15:
	            return False, (
	                f"High flood coverage ({flood_pct:.1f}%) but only {water_px:.1f}% "
	                "water-like colours detected — image does not appear to be a flood scene"
	            )

	    return True, ""


	# ── Segmentation prediction ────────────────────────────────────────────────────
	def predict_mask(image: Image.Image) -> tuple:
	    """
	    Run the segmentation model on one image and gate the result with the
	    out-of-distribution check.

	    Returns a 5-tuple:
	    mask       : (H, W) float32 array of 0/1 values (all zeros when gated)
	    flood_pct  : share of pixels marked flooded, 0-100 (0.0 when gated)
	    confidence : mean distance of the scores from 0.5, scaled to 0-100 and
	                 rounded to one decimal
	    low_conf   : bool, True when the OOD check rejected the image
	    ood_reason : str, the rejection reason ("" when accepted)
	    """
	    threshold = _load_metadata().get("threshold", 0.5)
	    seg_model = load_seg_model()
	    batch = preprocess_image(image)
	    pred = seg_model.predict(batch, verbose=0)[0, :, :, 0]  # (H, W)

	    # Decisiveness of the raw scores: 0 when all are 0.5, 1 when all are 0 or 1.
	    confidence_raw = float(np.mean(np.abs(pred - 0.5)) * 2)
	    confidence_pct = round(confidence_raw * 100, 1)

	    is_valid, ood_reason = _is_flood_scene(image, pred, threshold)
	    low_conf = not is_valid

	    if low_conf:
	        # Suppress the prediction entirely for rejected images.
	        mask = np.zeros_like(pred, dtype=np.float32)
	        flood_pct = 0.0
	    else:
	        mask = (pred > threshold).astype(np.float32)
	        flood_pct = float(mask.mean() * 100)

	    return mask, flood_pct, confidence_pct, low_conf, ood_reason


	# ── Grad-CAM ───────────────────────────────────────────────────────────────────
	def compute_gradcam(image: Image.Image) -> np.ndarray:
	    """
	    Build a Grad-CAM heatmap and blend it over the resized input image.

	    The target layer is the one named by the metadata key "gradcam_layer"
	    (default "conv2d_130"); if the model has no layer of that name, the last
	    Conv2D layer is used instead. When no Conv2D layer exists at all, the
	    plain resized RGB image is returned.

	    Returns:
	    (H, W, 3) uint8 RGB array.
	    """
	    meta = _load_metadata()
	    model = load_seg_model()
	    inp = preprocess_image(image)
	    layer_name = meta.get("gradcam_layer", "conv2d_130")

	    if layer_name not in {layer.name for layer in model.layers}:
	        # Configured layer is absent — fall back to the last Conv2D, if any.
	        layer_name = next(
	            (
	                layer.name
	                for layer in reversed(model.layers)
	                if isinstance(layer, tf.keras.layers.Conv2D)
	            ),
	            None,
	        )

	    if layer_name is None:
	        return np.array(image.convert("RGB").resize(IMAGE_SIZE))

	    # Auxiliary model exposing both the target activations and the output.
	    grad_model = tf.keras.models.Model(
	        inputs=model.inputs,
	        outputs=[model.get_layer(layer_name).output, model.output],
	    )

	    with tf.GradientTape() as tape:
	        inp_tensor = tf.cast(inp, tf.float32)
	        activations, predictions = grad_model(inp_tensor)
	        target = tf.reduce_mean(predictions)

	    # Channel weights = gradient of the mean prediction, averaged spatially.
	    gradients = tape.gradient(target, activations)
	    channel_weights = tf.reduce_mean(gradients, axis=(0, 1, 2))
	    cam = tf.reduce_sum(activations[0] * channel_weights, axis=-1).numpy()
	    cam = np.maximum(cam, 0)
	    cam = cam / (cam.max() + 1e-8)

	    # Upsample to the display size, then blur to soften blocky edges.
	    cam_smooth = cv2.GaussianBlur(cv2.resize(cam, IMAGE_SIZE), (15, 15), 0)

	    # JET colour map: blue (low) through green/yellow to red (high).
	    heatmap_bgr = cv2.applyColorMap(np.uint8(255 * cam_smooth), cv2.COLORMAP_JET)
	    heatmap_rgb = cv2.cvtColor(heatmap_bgr, cv2.COLOR_BGR2RGB).astype(np.float32)

	    # 45% original + 55% heatmap keeps the scene visible underneath.
	    orig = np.array(image.convert("RGB").resize(IMAGE_SIZE), dtype=np.float32)
	    return (orig * 0.45 + heatmap_rgb * 0.55).clip(0, 255).astype(np.uint8)


	# ── ZoeDepth flood depth estimation ───────────────────────────────────────────
	def estimate_flood_depth(image: Image.Image, mask: np.ndarray) -> dict:
	    """
	    Run the depth pipeline on the image and summarise depth inside the flood mask.

	    The pipeline's "depth" output is min-max normalised over the whole image
	    and then linearly mapped onto a 0–3 m scale. The reported metre values are
	    therefore a heuristic relative estimate, not a calibrated measurement.

	    Args:
	    image : source PIL image (any size)
	    mask  : (H, W) array, non-zero where flooded; the depth map is resized to
	            this shape, so any mask resolution is accepted

	    Returns a dict with:
	    depth_map_vis  : (H, W, 3) uint8 — PLASMA-colourised depth map (RGB)
	    depth_overlay  : (H, W, 3) uint8 — same map with non-flooded pixels greyed
	    avg_depth_m    : float — mean estimate over flooded pixels, rounded to 3 dp
	    max_depth_m    : float — max estimate over flooded pixels, rounded to 3 dp
	    depth_category : str — shallow / moderate / deep / very deep label
	    """
	    FLOOD_DEPTH_MAX_M = 3.0  # top of the heuristic depth scale
	    MIN_FLOOD_PIXELS = 50  # fewer flooded pixels than this counts as "no flood"

	    zoe = load_zoe_model()
	    depth_result = zoe(image.convert("RGB"))
	    depth_arr = np.array(depth_result["depth"], dtype=np.float32)  # (h, w)

	    # Resize to the mask's own resolution (cv2 takes (width, height)) so the
	    # boolean indexing below always lines up, whatever size the mask is.
	    mask_h, mask_w = mask.shape[:2]
	    depth_resized = cv2.resize(
	        depth_arr, (mask_w, mask_h), interpolation=cv2.INTER_LINEAR
	    )

	    # Min-max normalise across the whole image → [0, 1]; the epsilon guards a
	    # perfectly flat depth map.
	    d_min, d_max = depth_resized.min(), depth_resized.max()
	    depth_norm = (depth_resized - d_min) / (d_max - d_min + 1e-8)
	    depth_metres = depth_norm * FLOOD_DEPTH_MAX_M

	    # Colourised full depth map (OpenCV returns BGR, callers expect RGB).
	    depth_vis = cv2.applyColorMap(np.uint8(255 * depth_norm), cv2.COLORMAP_PLASMA)
	    depth_vis = cv2.cvtColor(depth_vis, cv2.COLOR_BGR2RGB)

	    # Depth statistics restricted to flooded pixels.
	    flood_mask_bool = mask.astype(bool)
	    flooded_depths = depth_metres[flood_mask_bool]

	    if flooded_depths.size < MIN_FLOOD_PIXELS:
	        avg_depth_m = 0.0
	        max_depth_m = 0.0
	    else:
	        avg_depth_m = float(flooded_depths.mean())
	        max_depth_m = float(flooded_depths.max())

	    # Category bands on the heuristic metre scale.
	    if avg_depth_m < 0.3:
	        depth_category = "Shallow (< 30 cm)"
	    elif avg_depth_m < 0.8:
	        depth_category = "Moderate (30 cm – 80 cm)"
	    elif avg_depth_m < 1.5:
	        depth_category = "Deep (80 cm – 1.5 m)"
	    else:
	        depth_category = "Very Deep (> 1.5 m — life-threatening)"

	    # Overlay: keep the depth colours inside the flood, flat grey elsewhere.
	    flood_depth_overlay = depth_vis.copy()
	    flood_depth_overlay[~flood_mask_bool] = 128

	    return {
	        "depth_map_vis": depth_vis,  # (H, W, 3) uint8
	        "depth_overlay": flood_depth_overlay,  # (H, W, 3) uint8
	        "avg_depth_m": round(avg_depth_m, 3),
	        "max_depth_m": round(max_depth_m, 3),
	        "depth_category": depth_category,
	    }


	# ── Risk assessment (uses thresholds from PKL + ZoeDepth depth) ───────────────
	def assess_risk(flood_pct: float, avg_depth_m: float = 0.0) -> dict:
	    """
	    Combine flood coverage and estimated depth into a risk level and score.

	    Each input is mapped to a level 0-3 and the higher of the two wins:
	        coverage : < low / < medium / < high / otherwise, where the bounds
	                   come from metadata "risk_thresholds"[...]["max_flood_pct"]
	                   (defaults 15 / 35 / 60)
	        depth    : < 0.3 m / < 0.8 m / < 1.5 m / otherwise (fixed in code;
	                   depth values stored in the metadata are not used)
	    Depth is ignored entirely when flood_pct is below 2%.

	    The score is 0.7 × coverage (capped at 100) + 0.3 × depth expressed as a
	    percentage of 3 m (capped at 100), rounded to one decimal.

	    Args:
	    flood_pct   : percentage of the image covered by flood (0-100)
	    avg_depth_m : mean estimated depth over the flooded area, in metres

	    Returns a dict with risk_level, risk_score, colour, flood_pct,
	    avg_depth_m, recommendations and model_metrics.
	    """
	    meta = _load_metadata()
	    # `or {}` also covers metadata that stores an explicit None.
	    thresholds = meta.get("risk_thresholds") or {}

	    pct_bounds = (
	        thresholds.get("low", {}).get("max_flood_pct", 15),
	        thresholds.get("medium", {}).get("max_flood_pct", 35),
	        thresholds.get("high", {}).get("max_flood_pct", 60),
	    )
	    # Same 0.3 / 0.8 / 1.5 m bands as the depth categories.
	    depth_bounds = (0.3, 0.8, 1.5)

	    # Depth only contributes when there is meaningful coverage; below 2% the
	    # mask is treated as noise.
	    effective_depth = avg_depth_m if flood_pct >= 2.0 else 0.0

	    def _level(value, bounds):
	        # Index of the first bound the value is strictly below, else len(bounds).
	        return next(
	            (idx for idx, bound in enumerate(bounds) if value < bound),
	            len(bounds),
	        )

	    level_idx = max(_level(flood_pct, pct_bounds), _level(effective_depth, depth_bounds))
	    level = ("Low", "Moderate", "High", "Critical")[level_idx]
	    colour = ("#2ecc71", "#f39c12", "#e67e22", "#e74c3c")[level_idx]

	    # Score: flood coverage drives 70%, depth drives 30%.
	    pct_score = min(flood_pct, 100)
	    depth_score = min(effective_depth / 3.0 * 100, 100)  # 3 m = top of scale
	    score = round(pct_score * 0.7 + depth_score * 0.3, 1)

	    recs_map = {
	        "Low": [
	            "Monitor water levels periodically.",
	            "Ensure drainage channels are clear.",
	            "No immediate evacuation required.",
	        ],
	        "Moderate": [
	            "Alert local emergency services.",
	            "Move valuables to higher ground.",
	            "Prepare emergency kit.",
	            "Monitor weather forecasts closely.",
	        ],
	        "High": [
	            "Initiate partial evacuation of vulnerable populations.",
	            "Deploy flood barriers where possible.",
	            "Activate emergency response teams.",
	            "Avoid flooded roads and areas.",
	        ],
	        "Critical": [
	            "IMMEDIATE EVACUATION REQUIRED.",
	            "Contact emergency services (911 / local disaster hotline).",
	            "Do not attempt to cross flooded areas.",
	            "Seek shelter on highest available ground.",
	            "Follow official evacuation routes only.",
	        ],
	    }

	    deployed_metrics = meta.get("metrics", {}).get("deployed", {})

	    return {
	        "risk_level": level,
	        "risk_score": score,
	        "colour": colour,
	        "flood_pct": round(flood_pct, 2),
	        "avg_depth_m": round(avg_depth_m, 3),
	        "recommendations": recs_map[level],
	        "model_metrics": deployed_metrics,
	    }


	# ── Full pipeline ──────────────────────────────────────────────────────────────
	def run_pipeline(image: Image.Image) -> dict:
	    """
	    Run every analysis stage on one image and bundle the results.

	    Stages, in order:
	    1. predict_mask          → flood mask, coverage, confidence, OOD flag
	    2. compute_gradcam       → explainability heatmap
	    3. estimate_flood_depth  → depth visualisations and depth statistics
	    4. assess_risk           → level, score, recommendations

	    Returns a dict with keys mask, overlay, gradcam, depth_map, depth_overlay,
	    depth_info and risk. The risk dict additionally carries confidence,
	    low_conf and a warning string (empty unless the image was flagged).
	    """
	    mask, flood_pct, confidence, low_conf, ood_reason = predict_mask(image)
	    gradcam_img = compute_gradcam(image)
	    depth_info = estimate_flood_depth(image, mask)
	    risk = assess_risk(flood_pct, avg_depth_m=depth_info["avg_depth_m"])

	    # Attach the out-of-distribution details for display.
	    if low_conf:
	        warning = (
	            f"⚠️ Out-of-distribution image detected: {ood_reason}. "
	            "Results suppressed."
	        )
	    else:
	        warning = ""
	    risk.update(confidence=confidence, low_conf=low_conf, warning=warning)

	    # Blue-tinted flood overlay: 70% original, 30% (R=0, G=100, B=255) tint
	    # wherever the mask is set.
	    base = np.array(image.convert("RGB").resize(IMAGE_SIZE), dtype=np.uint8)
	    tint = np.stack([mask * 0, mask * 100, mask * 255], axis=-1).astype(np.uint8)
	    overlay = cv2.addWeighted(base, 0.7, tint, 0.3, 0)

	    return {
	        "mask": mask,
	        "overlay": overlay,
	        "gradcam": gradcam_img,
	        "depth_map": depth_info["depth_map_vis"],
	        "depth_overlay": depth_info["depth_overlay"],
	        "depth_info": depth_info,
	        "risk": risk,
	    }