# IR_expeiment/PART2/PromptIR/utils/dataset_utils.py
import os
import random
import copy
from PIL import Image
import numpy as np
from torch.utils.data import Dataset
from torchvision.transforms import ToPILImage, Compose, RandomCrop, ToTensor
import torch
from utils.image_utils import random_augmentation, crop_img
from utils.degradation_utils import Degradation
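# Degradation-type indices used throughout this file (see de_dict in PromptTrainDataset):
# 0/1/2 = Gaussian denoising at sigma 15/25/50, 3 = deraining, 4 = dehazing, 5 = deblurring.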
class PromptTrainDataset(Dataset):
def __init__(self, args):
super(PromptTrainDataset, self).__init__()
self.args = args
self.rs_ids = []
self.hazy_ids = []
self.D = Degradation(args)
self.de_temp = 0
self.de_type = self.args.de_type
print(self.de_type)
self.de_dict = {'denoise_15': 0, 'denoise_25': 1, 'denoise_50': 2, 'derain': 3, 'dehaze': 4, 'deblur' : 5}
self._init_ids()
self._merge_ids()
self.crop_transform = Compose([
ToPILImage(),
RandomCrop(args.patch_size),
])
self.toTensor = ToTensor()
def _init_ids(self):
if 'denoise_15' in self.de_type or 'denoise_25' in self.de_type or 'denoise_50' in self.de_type:
self._init_clean_ids()
if 'derain' in self.de_type:
self._init_rs_ids()
if 'dehaze' in self.de_type:
self._init_hazy_ids()
random.shuffle(self.de_type)
def _init_clean_ids(self):
ref_file = self.args.data_file_dir + "noisy/denoise_airnet.txt"
temp_ids = []
temp_ids+= [id_.strip() for id_ in open(ref_file)]
clean_ids = []
name_list = os.listdir(self.args.denoise_dir)
clean_ids += [self.args.denoise_dir + id_ for id_ in name_list if id_.strip() in temp_ids]
if 'denoise_15' in self.de_type:
self.s15_ids = [{"clean_id": x,"de_type":0} for x in clean_ids]
            self.s15_ids = self.s15_ids * 3  # repeat the list to oversample the denoising pairs 3x
random.shuffle(self.s15_ids)
self.s15_counter = 0
if 'denoise_25' in self.de_type:
self.s25_ids = [{"clean_id": x,"de_type":1} for x in clean_ids]
self.s25_ids = self.s25_ids * 3
random.shuffle(self.s25_ids)
self.s25_counter = 0
if 'denoise_50' in self.de_type:
self.s50_ids = [{"clean_id": x,"de_type":2} for x in clean_ids]
self.s50_ids = self.s50_ids * 3
random.shuffle(self.s50_ids)
self.s50_counter = 0
self.num_clean = len(clean_ids)
print("Total Denoise Ids : {}".format(self.num_clean))
def _init_hazy_ids(self):
temp_ids = []
hazy = self.args.data_file_dir + "hazy/hazy_outside.txt"
temp_ids+= [self.args.dehaze_dir + id_.strip() for id_ in open(hazy)]
self.hazy_ids = [{"clean_id" : x,"de_type":4} for x in temp_ids]
self.hazy_counter = 0
self.num_hazy = len(self.hazy_ids)
print("Total Hazy Ids : {}".format(self.num_hazy))
def _init_rs_ids(self):
temp_ids = []
rs = self.args.data_file_dir + "rainy/rainTrain.txt"
temp_ids+= [self.args.derain_dir + id_.strip() for id_ in open(rs)]
self.rs_ids = [{"clean_id":x,"de_type":3} for x in temp_ids]
        self.rs_ids = self.rs_ids * 120  # repeat the (small) rain set 120x to balance it against the other tasks
self.rl_counter = 0
self.num_rl = len(self.rs_ids)
print("Total Rainy Ids : {}".format(self.num_rl))
def _crop_patch(self, img_1, img_2):
H = img_1.shape[0]
W = img_1.shape[1]
ind_H = random.randint(0, H - self.args.patch_size)
ind_W = random.randint(0, W - self.args.patch_size)
patch_1 = img_1[ind_H:ind_H + self.args.patch_size, ind_W:ind_W + self.args.patch_size]
patch_2 = img_2[ind_H:ind_H + self.args.patch_size, ind_W:ind_W + self.args.patch_size]
return patch_1, patch_2
def _get_gt_name(self, rainy_name):
gt_name = rainy_name.split("rainy")[0] + 'gt/norain-' + rainy_name.split('rain-')[-1]
return gt_name
def _get_nonhazy_name(self, hazy_name):
dir_name = hazy_name.split("synthetic")[0] + 'original/'
name = hazy_name.split('/')[-1].split('_')[0]
suffix = '.' + hazy_name.split('.')[-1]
nonhazy_name = dir_name + name + suffix
return nonhazy_name
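    # Filename conventions assumed by the two helpers above (inferred from the string splits;
    # the concrete names are illustrative only):
    #   rainy input  .../rainy/rain-123.png      ->  GT  .../gt/norain-123.png
    #   hazy input   .../synthetic/0001_0.8.jpg  ->  GT  .../original/0001.jpg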
def _merge_ids(self):
self.sample_ids = []
if "denoise_15" in self.de_type:
self.sample_ids += self.s15_ids
self.sample_ids += self.s25_ids
self.sample_ids += self.s50_ids
if "derain" in self.de_type:
self.sample_ids+= self.rs_ids
if "dehaze" in self.de_type:
self.sample_ids+= self.hazy_ids
print(len(self.sample_ids))
def __getitem__(self, idx):
sample = self.sample_ids[idx]
de_id = sample["de_type"]
        if de_id < 3:
            # de_id 0/1/2 are the three denoise settings; they all read the same clean image
            clean_id = sample["clean_id"]
clean_img = crop_img(np.array(Image.open(clean_id).convert('RGB')), base=16)
clean_patch = self.crop_transform(clean_img)
clean_patch= np.array(clean_patch)
clean_name = clean_id.split("/")[-1].split('.')[0]
clean_patch = random_augmentation(clean_patch)[0]
degrad_patch = self.D.single_degrade(clean_patch, de_id)
else:
if de_id == 3:
# Rain Streak Removal
degrad_img = crop_img(np.array(Image.open(sample["clean_id"]).convert('RGB')), base=16)
clean_name = self._get_gt_name(sample["clean_id"])
clean_img = crop_img(np.array(Image.open(clean_name).convert('RGB')), base=16)
elif de_id == 4:
# Dehazing with SOTS outdoor training set
degrad_img = crop_img(np.array(Image.open(sample["clean_id"]).convert('RGB')), base=16)
clean_name = self._get_nonhazy_name(sample["clean_id"])
clean_img = crop_img(np.array(Image.open(clean_name).convert('RGB')), base=16)
degrad_patch, clean_patch = random_augmentation(*self._crop_patch(degrad_img, clean_img))
clean_patch = self.toTensor(clean_patch)
degrad_patch = self.toTensor(degrad_patch)
return [clean_name, de_id], degrad_patch, clean_patch
def __len__(self):
return len(self.sample_ids)
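# Example usage sketch for PromptTrainDataset (commented out; the directory layout and
# hyperparameter values below are assumptions for illustration only, and Degradation(args)
# may require further fields, see utils/degradation_utils.py):
#
#   from argparse import Namespace
#   from torch.utils.data import DataLoader
#
#   args = Namespace(
#       de_type=['denoise_15', 'denoise_25', 'denoise_50', 'derain', 'dehaze'],
#       data_file_dir='data_dir/',          # must contain noisy/denoise_airnet.txt, rainy/rainTrain.txt, hazy/hazy_outside.txt
#       denoise_dir='data/Train/Denoise/',
#       derain_dir='data/Train/Derain/',
#       dehaze_dir='data/Train/Dehaze/',
#       patch_size=128,
#   )
#   trainset = PromptTrainDataset(args)
#   loader = DataLoader(trainset, batch_size=8, shuffle=True, num_workers=4)
#   (clean_name, de_id), degrad_patch, clean_patch = next(iter(loader))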
class DenoiseTestDataset(Dataset):
def __init__(self, args):
super(DenoiseTestDataset, self).__init__()
self.args = args
self.clean_ids = []
self.sigma = 15
self._init_clean_ids()
self.toTensor = ToTensor()
def _init_clean_ids(self):
name_list = os.listdir(self.args.denoise_path)
self.clean_ids += [self.args.denoise_path + id_ for id_ in name_list]
self.num_clean = len(self.clean_ids)
def _add_gaussian_noise(self, clean_patch):
noise = np.random.randn(*clean_patch.shape)
noisy_patch = np.clip(clean_patch + noise * self.sigma, 0, 255).astype(np.uint8)
return noisy_patch, clean_patch
def set_sigma(self, sigma):
self.sigma = sigma
def __getitem__(self, clean_id):
clean_img = crop_img(np.array(Image.open(self.clean_ids[clean_id]).convert('RGB')), base=16)
clean_name = self.clean_ids[clean_id].split("/")[-1].split('.')[0]
noisy_img, _ = self._add_gaussian_noise(clean_img)
clean_img, noisy_img = self.toTensor(clean_img), self.toTensor(noisy_img)
return [clean_name], noisy_img, clean_img
    def tile_degrad(input_, tile=128, tile_overlap=0):
        # Tile-wise processing helper; note it takes no `self`, and with the model call
        # commented out below it simply copies each input tile to the output.
        sigma_dict = {0: 0, 1: 15, 2: 25, 3: 50}  # de_type index -> noise sigma (unused here)
b, c, h, w = input_.shape
tile = min(tile, h, w)
assert tile % 8 == 0, "tile size should be multiple of 8"
stride = tile - tile_overlap
h_idx_list = list(range(0, h-tile, stride)) + [h-tile]
w_idx_list = list(range(0, w-tile, stride)) + [w-tile]
E = torch.zeros(b, c, h, w).type_as(input_)
W = torch.zeros_like(E)
s = 0
for h_idx in h_idx_list:
for w_idx in w_idx_list:
in_patch = input_[..., h_idx:h_idx+tile, w_idx:w_idx+tile]
out_patch = in_patch
# out_patch = model(in_patch)
out_patch_mask = torch.ones_like(in_patch)
E[..., h_idx:(h_idx+tile), w_idx:(w_idx+tile)].add_(out_patch)
W[..., h_idx:(h_idx+tile), w_idx:(w_idx+tile)].add_(out_patch_mask)
        restored = E.div_(W)  # average overlapping tile contributions
        restored = torch.clamp(restored, 0, 1)
return restored
def __len__(self):
return self.num_clean
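# Example usage sketch for DenoiseTestDataset (commented out; the value of
# `denoise_path` is an assumption, not part of this file):
#
#   from argparse import Namespace
#
#   args = Namespace(denoise_path='test/denoise/bsd68/')
#   testset = DenoiseTestDataset(args)
#   testset.set_sigma(25)                       # choose the test noise level (default is 15)
#   [name], noisy_img, clean_img = testset[0]   # float tensors in [0, 1], cropped to multiples of 16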
class DerainDehazeDataset(Dataset):
def __init__(self, args, task="derain",addnoise = False,sigma = None):
super(DerainDehazeDataset, self).__init__()
self.ids = []
self.task_idx = 0
self.args = args
self.task_dict = {'derain': 0, 'dehaze': 1}
self.toTensor = ToTensor()
self.addnoise = addnoise
self.sigma = sigma
self.set_dataset(task)
def _add_gaussian_noise(self, clean_patch):
noise = np.random.randn(*clean_patch.shape)
noisy_patch = np.clip(clean_patch + noise * self.sigma, 0, 255).astype(np.uint8)
return noisy_patch, clean_patch
def _init_input_ids(self):
if self.task_idx == 0:
self.ids = []
name_list = os.listdir(self.args.derain_path + 'input/')
# print(name_list)
print(self.args.derain_path)
self.ids += [self.args.derain_path + 'input/' + id_ for id_ in name_list]
elif self.task_idx == 1:
self.ids = []
name_list = os.listdir(self.args.dehaze_path + 'input/')
self.ids += [self.args.dehaze_path + 'input/' + id_ for id_ in name_list]
self.length = len(self.ids)
def _get_gt_path(self, degraded_name):
if self.task_idx == 0:
gt_name = degraded_name.replace("input", "target")
elif self.task_idx == 1:
dir_name = degraded_name.split("input")[0] + 'target/'
name = degraded_name.split('/')[-1].split('_')[0] + '.png'
gt_name = dir_name + name
return gt_name
def set_dataset(self, task):
self.task_idx = self.task_dict[task]
self._init_input_ids()
def __getitem__(self, idx):
degraded_path = self.ids[idx]
clean_path = self._get_gt_path(degraded_path)
degraded_img = crop_img(np.array(Image.open(degraded_path).convert('RGB')), base=16)
if self.addnoise:
degraded_img,_ = self._add_gaussian_noise(degraded_img)
clean_img = crop_img(np.array(Image.open(clean_path).convert('RGB')), base=16)
clean_img, degraded_img = self.toTensor(clean_img), self.toTensor(degraded_img)
degraded_name = degraded_path.split('/')[-1][:-4]
return [degraded_name], degraded_img, clean_img
def __len__(self):
return self.length
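# Example usage sketch for DerainDehazeDataset (commented out; both paths are assumptions,
# each expected to contain input/ and target/ subfolders):
#
#   from argparse import Namespace
#
#   args = Namespace(derain_path='test/derain/Rain100L/', dehaze_path='test/dehaze/outdoor/')
#   testset = DerainDehazeDataset(args, task='derain')
#   testset.set_dataset('dehaze')               # switch task; re-scans <dehaze_path>/input/
#   [name], degraded_img, clean_img = testset[0]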
class TestSpecificDataset(Dataset):
def __init__(self, args):
super(TestSpecificDataset, self).__init__()
self.args = args
self.degraded_ids = []
self._init_clean_ids(args.test_path)
self.toTensor = ToTensor()
def _init_clean_ids(self, root):
extensions = ['jpg', 'JPG', 'png', 'PNG', 'jpeg', 'JPEG', 'bmp', 'BMP']
if os.path.isdir(root):
name_list = []
for image_file in os.listdir(root):
if any([image_file.endswith(ext) for ext in extensions]):
name_list.append(image_file)
if len(name_list) == 0:
raise Exception('The input directory does not contain any image files')
self.degraded_ids += [root + id_ for id_ in name_list]
else:
if any([root.endswith(ext) for ext in extensions]):
name_list = [root]
else:
raise Exception('Please pass an Image file')
self.degraded_ids = name_list
print("Total Images : {}".format(name_list))
self.num_img = len(self.degraded_ids)
def __getitem__(self, idx):
degraded_img = crop_img(np.array(Image.open(self.degraded_ids[idx]).convert('RGB')), base=16)
name = self.degraded_ids[idx].split('/')[-1][:-4]
degraded_img = self.toTensor(degraded_img)
return [name], degraded_img
def __len__(self):
return self.num_img
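# Example usage sketch for TestSpecificDataset (commented out; the test path is an assumption):
#
#   from argparse import Namespace
#
#   args = Namespace(test_path='demo_images/')  # a directory of images or a single image file
#   dataset = TestSpecificDataset(args)
#   [name], degraded_img = dataset[0]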