# NOTE(review): the three lines below look like repository-page artifacts
# (branch name, commit message, short commit hash) accidentally pasted into
# the module; commented out so the file remains valid Python.
# root
# Clean upload with correct folder structure
# ea234dc
import torch
import copy
import matplotlib.pyplot as plt
from torchvision.transforms import v2
from typing import Union, Tuple
from torch.utils.data import Subset, Dataset
# --- Rich Imports ---
from rich.console import Console
from rich.tree import Tree
from rich.panel import Panel
from rich.text import Text
from rich.syntax import Syntax
# Shared Rich console used by the pretty-printing helpers in this module.
console = Console()
def print_transform_summary(
    name: str, geometric_sync: v2.Compose, haze_only: v2.Compose, common: v2.Compose
):
    """
    Renders a Rich tree summarizing the three augmentation stages
    (geometric, hazy-only appearance, common tensor/normalize) inside a panel.
    """
    summary = Tree(f"[bold cyan]{name}[/]")
    # (branch title, explanatory note, transform) triplets, one per stage.
    stages = (
        (
            "[bold magenta]1. Geometric (Synchronous)[/]",
            "[dim]Applies identically to CLEAR & HAZY for alignment[/]",
            geometric_sync,
        ),
        (
            "[bold yellow]2. Appearance (Hazy-Only)[/]",
            "[dim]Simulates real-world haze variations[/]",
            haze_only,
        ),
        (
            "[bold green]3. Common (Tensor & Norm)[/]",
            "[dim]Final prep: ToTensor, Normalize[/]",
            common,
        ),
    )
    for title, note, transform in stages:
        branch = summary.add(title)
        branch.add(note)
        branch.add(str(transform))
    console.print(Panel(summary, title="[bold]Augmentation Pipeline[/]", expand=False, border_style="blue"))
def restandardize_tensor(
    tensor: torch.Tensor,
    mean: Union[torch.Tensor, Tuple[float, float, float]] = (0.5, 0.5, 0.5),
    std: Union[torch.Tensor, Tuple[float, float, float]] = (0.5, 0.5, 0.5),
) -> torch.Tensor:
    """
    Reverses normalization (z-score) -> (Tensor * STD) + MEAN.

    Args:
        tensor: Normalized image tensor, either (C, H, W) or (B, C, H, W).
        mean: Per-channel mean used for the original normalization.
            If a pre-built tensor is passed, it must already be broadcastable
            against ``tensor`` (sequences are reshaped to (-1, 1, 1) here).
        std: Per-channel std used for the original normalization; same
            broadcasting rules as ``mean``.

    Returns:
        De-normalized tensor clipped to [0, 1].
    """
    # NOTE: defaults are tuples (not lists) to avoid the shared mutable
    # default-argument pitfall; values are unchanged.
    if not isinstance(mean, torch.Tensor):
        mean = torch.tensor(mean, dtype=tensor.dtype, device=tensor.device).view(-1, 1, 1)
    if not isinstance(std, torch.Tensor):
        std = torch.tensor(std, dtype=tensor.dtype, device=tensor.device).view(-1, 1, 1)
    # Add a leading batch dim so (C,1,1) stats broadcast over (B,C,H,W) input.
    if tensor.dim() == 4:
        mean = mean.unsqueeze(0)
        std = std.unsqueeze(0)
    de_normalized_tensor = (tensor * std) + mean
    final_tensor = torch.clamp(de_normalized_tensor, 0.0, 1.0)
    return final_tensor
def get_haze_transforms(
    dataset_name: str,
    resize_size: int = 640,
    split: str = "train",
    verbose: bool = False,
):
    """
    Builds a paired (clear, hazy) transform callable using torchvision v2.

    Training: random-crops both images to ``resize_size``, applies synced
    geometric augmentation plus hazy-only appearance jitter, then converts
    to float tensors and normalizes.
    Sanity: strictly deterministic — tensor conversion + normalization only.
    Validation/Test: DOES NOT RESIZE (keeps original resolution); tensor
    conversion + normalization only.

    Args:
        dataset_name: One of "OHAZE", "DENSEHAZE", "NHHAZE",
            "RESIDE-INDOOR", "HAZE4K", "RESIDE-OUTDOOR".
        resize_size: Crop side length used during training.
        split: "train", "sanity", or any other value for val/test.
        verbose: If True, print a summary of the chosen pipeline.

    Returns:
        A callable ``(clear_img, hazy_img) -> (clear_tensor, hazy_tensor)``.

    Raises:
        ValueError: If ``dataset_name`` is unknown (train split only).
    """
    # --- 1. Common block (shared by every split): tensor conversion +
    # normalization mapping [0, 1] to [-1, 1].
    # NOTE: no resizing happens here — the RandomCrop below is the only
    # size-changing operation, so val/test keeps the original resolution.
    common_transforms = v2.Compose([
        v2.ToImage(),
        v2.ToDtype(torch.float32, scale=True),
        v2.Normalize(mean=(0.5, 0.5, 0.5), std=(0.5, 0.5, 0.5)),
    ])
    # --- 2. Sanity-check logic: STRICTLY DETERMINISTIC ---
    # No RandomCrop. No Flips. No Jitter. Just tensor conversion & Normalize.
    if split == "sanity":
        def sanity_transform(clear_img, hazy_img):
            clean_img = common_transforms(clear_img)
            hazy_img = common_transforms(hazy_img)
            return clean_img, hazy_img
        if verbose:
            print("Transform Mode: SANITY (Deterministic Resize)")
        return sanity_transform
    # --- 3. Training logic ---
    if split == "train":
        # Geometric ops are applied to (clear, hazy) jointly so the pair
        # stays pixel-aligned.
        geometric_sync_transforms = v2.Compose([
            v2.RandomCrop(resize_size, pad_if_needed=True),
            v2.RandomHorizontalFlip(p=0.5),
            v2.RandomVerticalFlip(p=0.5),
        ])
        # Dataset-specific appearance augmentation (hazy image only).
        # Intensity is kept deliberately low: the goal is
        # "Domain Randomization" (robustness), not "Data Distortion".
        if dataset_name == "OHAZE":
            haze_only_transforms = v2.Compose([
                v2.ColorJitter(brightness=0.05, contrast=0.05, saturation=0.05, hue=0.0),
            ])
        elif dataset_name == "DENSEHAZE":
            haze_only_transforms = v2.Compose([
                v2.ColorJitter(brightness=0.05, contrast=0.05, saturation=0.05, hue=0.0),
                v2.RandomGrayscale(p=0.2),
            ])
        elif dataset_name == "NHHAZE":
            # NH-HAZE is non-homogeneous and very small (~55 pairs).
            # We need slightly more aggressive augmentation to prevent
            # overfitting, but we must be careful not to destroy the
            # 'patchy' haze structure.
            haze_only_transforms = v2.Compose([
                v2.ColorJitter(
                    brightness=0.1,  # Moderate brightness changes
                    contrast=0.1,    # Moderate contrast
                    saturation=0.1,  # Haze affects saturation significantly
                    hue=0.0          # Keep hue 0 to preserve realistic outdoor colors
                ),
                # Grayscale helps the model focus on structure/texture rather
                # than memorizing the specific color cast of the few training images.
                v2.RandomGrayscale(p=0.15),
            ])
        elif dataset_name in ["RESIDE-INDOOR", "HAZE4K"]:
            haze_only_transforms = v2.Compose([
                v2.ColorJitter(
                    brightness=0.15,
                    contrast=0.15,
                    saturation=0.15,
                    hue=0.01
                )
            ])
        # Increase the saturation and hue jitter to force the model to
        # generalize to different weather conditions / times of day.
        elif dataset_name == "RESIDE-OUTDOOR":
            haze_only_transforms = v2.Compose([
                v2.ColorJitter(
                    brightness=0.2,
                    contrast=0.2,
                    saturation=0.2,  # Stronger saturation jitter
                    hue=0.05         # Allow slight color shifting (simulates time-of-day)
                ),
                # Optional: Occasional Grayscale forces reliance on structure, not just color
                v2.RandomGrayscale(p=0.1),
            ])
        else:
            raise ValueError(f"Unknown dataset: {dataset_name}")

        def haze_transform(clear_img, hazy_img):
            # Apply geometric (sync), appearance (hazy only), then common (norm)
            clean_img, hazy_img = geometric_sync_transforms(clear_img, hazy_img)
            hazy_img = haze_only_transforms(hazy_img)
            clean_img = common_transforms(clean_img)
            hazy_img = common_transforms(hazy_img)
            return clean_img, hazy_img
        if verbose:
            print_transform_summary(
                f"{dataset_name} | TRAIN | {resize_size}x{resize_size}",
                geometric_sync_transforms,
                haze_only_transforms,
                common_transforms,
            )
        return haze_transform
    # --- 4. Validation / test logic ---
    else:
        def val_transform(clear_img, hazy_img):
            # Only apply normalization, NO RESIZING
            clean_img = common_transforms(clear_img)
            hazy_img = common_transforms(hazy_img)
            return clean_img, hazy_img
        if verbose:
            print_transform_summary(
                f"{dataset_name} | VAL/TEST | Original Size",
                v2.Identity(),
                v2.Identity(),
                common_transforms,
            )
        return val_transform
def partition_dataset(dataset, train_transform, val_transform, train_ratio=0.8, generator=None):
    """
    Randomly splits a dataset into train/val Subsets with independent transforms.

    Args:
        dataset: A map-style dataset exposing ``__len__`` and a ``transform``
            attribute — TODO confirm callers always set/expect ``.transform``.
        train_transform: Transform assigned to the training copy.
        val_transform: Transform assigned to the validation copy.
        train_ratio: Fraction of samples assigned to the training split.
        generator: Optional ``torch.Generator`` for a reproducible shuffle;
            when None, torch's global RNG state is used (original behavior).

    Returns:
        (train_subset, val_subset) as ``torch.utils.data.Subset`` objects.
    """
    indices = torch.randperm(len(dataset), generator=generator).tolist()
    num_train = int(len(dataset) * train_ratio)
    # Deep copies so each split carries its own transform without mutating
    # the caller's dataset (or the other split).
    train_subset = Subset(copy.deepcopy(dataset), indices[:num_train])
    val_subset = Subset(copy.deepcopy(dataset), indices[num_train:])
    # Inject transforms
    train_subset.dataset.transform = train_transform
    val_subset.dataset.transform = val_transform
    return train_subset, val_subset
def plotting_pair_images(dataset, num_instances=3, start_index=0, save_figure=False):
    """
    Plots ``num_instances`` (clean, hazy) pairs side by side for visual inspection.

    Args:
        dataset: Indexable dataset returning normalized (clean, hazy) tensor
            pairs — assumes (C, H, W) tensors normalized with mean/std 0.5.
        num_instances: Number of rows (pairs) to display.
        start_index: First dataset index to plot.
        save_figure: If True, also save the figure as a PNG.
    """
    N_COLS = 2
    N_ROWS = num_instances
    end_index = start_index + num_instances
    # squeeze=False keeps `axes` a 2-D array even when num_instances == 1,
    # so the axes[row][col] indexing below never breaks.
    fig, axes = plt.subplots(N_ROWS, N_COLS, figsize=(8, 5 * N_ROWS), squeeze=False)
    fig.suptitle("GT vs Haze Comparison", fontsize=16)
    for row_index, i in enumerate(range(start_index, end_index)):
        clean, hazy = dataset[i]
        # Undo the (0.5, 0.5, 0.5) normalization so imshow gets [0, 1] data.
        clean = restandardize_tensor(clean)
        hazy = restandardize_tensor(hazy)
        axes[row_index][0].imshow(clean.permute(1, 2, 0))
        axes[row_index][0].set_title(f"Clean {i}")
        axes[row_index][0].axis("off")
        axes[row_index][1].imshow(hazy.permute(1, 2, 0))
        axes[row_index][1].set_title(f"Hazy {i}")
        axes[row_index][1].axis("off")
    plt.tight_layout(rect=[0, 0.03, 1, 0.95])
    if save_figure:
        path = "hazy_clear_comparison.png"
        console.print(f"[bold green]Saving visualization to: {path}[/]")
        plt.savefig(path, dpi=300, bbox_inches="tight")
    plt.show()