Upload baselines/predict_nnunet.py with huggingface_hub

fa5bb00 verified 3 months ago

4.62 kB

	"""
	nnU-Net prediction script that loads the trained model checkpoint
	and generates predictions compatible with evaluate.py.

	Usage:
	python baselines/predict_nnunet.py \
	--nnunet_results /workspace/data/nnUNet_results \
	--test_dir data/flat_test \
	--output_dir results/nnunet \
	--num_samples 16
	"""
	import argparse
	import os
	import sys
	import glob
	import numpy as np
	import torch
	from PIL import Image
	from tqdm import tqdm


	def load_nnunet_model(nnunet_results, fold=0):
	"""Load nnU-Net model from checkpoint."""
	from nnunetv2.inference.predict_from_raw_data import nnUNetPredictor

	# Find the trainer folder
	dataset_dir = os.path.join(nnunet_results, "Dataset001_LIDC")
	trainer_dirs = [d for d in os.listdir(dataset_dir) if os.path.isdir(os.path.join(dataset_dir, d))]
	trainer_name = trainer_dirs[0] # e.g., nnUNetTrainer200epochs__nnUNetPlans__2d
	model_folder = os.path.join(dataset_dir, trainer_name)

	print(f"Loading nnU-Net model from: {model_folder}")

	predictor = nnUNetPredictor(
	tile_step_size=0.5,
	use_gaussian=True,
	use_mirroring=True,
	perform_everything_on_device=True,
	device=torch.device('cuda') if torch.cuda.is_available() else torch.device('cpu'),
	verbose=False,
	verbose_preprocessing=False,
	allow_tqdm=False,
	)
	predictor.initialize_from_trained_model_folder(
	model_folder,
	use_folds=(fold,),
	checkpoint_name='checkpoint_best.pth',
	)
	return predictor


	def predict_single_image(predictor, image_path):
	"""Run nnU-Net prediction on a single image and return binary mask."""
	# Load image as numpy array
	img = np.array(Image.open(image_path).convert('L')) # (H, W)
	# nnU-Net expects (C, Z, Y, X) for 3D or is handled internally
	# For 2D nnU-Net, we need to pass the image properly
	# Use the predictor's predict_single_npy_array method
	img_input = img[np.newaxis, np.newaxis].astype(np.float32) # (1, 1, H, W)

	# nnU-Net properties dict for 2D data
	props = {
	'spacing': [999.0, 1.0, 1.0],
	'shape_after_cropping': img_input.shape[1:],
	'bbox_used_for_cropping': [[0, s] for s in img_input.shape[1:]],
	'shape_before_cropping': img_input.shape[1:],
	'class_locations': {},
	}

	# Run prediction
	prediction = predictor.predict_single_npy_array(
	input_image=img_input[0], # (1, H, W) - single channel
	image_properties=props,
	segmentation_previous_stage=None,
	output_file_or_dir=None,
	save_or_return_probabilities=False,
	)

	# prediction is a numpy array with segmentation labels
	binary_mask = (prediction > 0).astype(np.uint8)

	# Remove z dimension if present
	if binary_mask.ndim == 3:
	binary_mask = binary_mask[0]

	return binary_mask


	def main():
	parser = argparse.ArgumentParser(description="nnU-Net Prediction")
	parser.add_argument("--nnunet_results", type=str, required=True)
	parser.add_argument("--test_dir", type=str, required=True)
	parser.add_argument("--output_dir", type=str, required=True)
	parser.add_argument("--num_samples", type=int, default=16)
	parser.add_argument("--fold", type=int, default=0)
	args = parser.parse_args()

	os.makedirs(args.output_dir, exist_ok=True)

	# Load model
	predictor = load_nnunet_model(args.nnunet_results, args.fold)

	# Get test images
	image_files = sorted(glob.glob(os.path.join(args.test_dir, "*.png")))
	# Filter to only images (not masks)
	image_files = [f for f in image_files if "_mask" not in os.path.basename(f)]
	print(f"Test dataset: {len(image_files)} images from {args.test_dir}")

	total_saved = 0
	for img_path in tqdm(image_files, desc="Predicting"):
	basename = os.path.splitext(os.path.basename(img_path))[0]

	# Get prediction
	mask = predict_single_image(predictor, img_path)

	# Save N replicated samples (deterministic model = same prediction)
	for s in range(args.num_samples):
	out_path = os.path.join(args.output_dir, f"{basename}_sample{s:02d}.png")
	Image.fromarray(mask * 255).save(out_path)
	total_saved += 1

	print(f"\nSaved {len(image_files)} predictions × {args.num_samples} samples = {total_saved} files")
	print(f"\nPredictions saved to {args.output_dir}")
	print(f"Ready for evaluation:")
	print(f" python evaluate.py --samples_dir {args.output_dir} --gt_dir data/testing --results_file results/nnunet_eval.csv")


	if __name__ == "__main__":
	main()