VQualA-SR / ImageDataset2.py
import os
import torch
import functools
import numpy as np
import pandas as pd
from PIL import Image, ImageFile
from torch.utils.data import Dataset
IMG_EXTENSIONS = ['.jpg', '.jpeg', '.png', '.ppm', '.bmp', '.pgm', '.tif']
ImageFile.LOAD_TRUNCATED_IMAGES = True
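# Dataset helpers for image quality assessment (IQA). Most classes below
# share the same recipe: load an image, run a preprocessing transform, slide
# a 224x224 window over it with torch.Tensor.unfold, and return a fixed
# number of patches (evenly spaced at test time, random otherwise) together
# with the MOS and auxiliary annotations from the csv/xlsx/txt file.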
def has_file_allowed_extension(filename, extensions):
"""Checks if a file is an allowed extension.
Args:
filename (string): path to a file
extensions (iterable of strings): extensions to consider (lowercase)
Returns:
bool: True if the filename ends with one of given extensions
"""
filename_lower = filename.lower()
return any(filename_lower.endswith(ext) for ext in extensions)
def image_loader(image_name):
    if has_file_allowed_extension(image_name, IMG_EXTENSIONS):
        I = Image.open(image_name)
        return I.convert('RGB')
    # fail loudly instead of silently returning None for unsupported files
    raise ValueError('Unsupported image extension: %s' % image_name)
def get_default_img_loader():
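    # functools.partial with no bound arguments is a thin pass-through; the
    # indirection lets datasets accept any zero-argument loader factory.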
return functools.partial(image_loader)
class ImageDataset2(Dataset):
def __init__(self, csv_file,
img_dir,
preprocess,
num_patch,
test,
get_loader=get_default_img_loader):
"""
Args:
csv_file (string): Path to the csv file with annotations.
img_dir (string): Directory of the images.
transform (callable, optional): transform to be applied on a sample.
"""
self.data = pd.read_csv(csv_file, sep='\t', header=None)
print('%d csv data successfully loaded!' % self.__len__())
self.img_dir = img_dir
self.loader = get_loader()
self.preprocess = preprocess
self.num_patch = num_patch
self.test = test
def __getitem__(self, index):
"""
Args:
index (int): Index
Returns:
samples: a Tensor that represents a video segment.
"""
image_name = os.path.join(self.img_dir, self.data.iloc[index, 0])
I = self.loader(image_name)
I = self.preprocess(I)
I = I.unsqueeze(0)
n_channels = 3
kernel_h = 224
kernel_w = 224
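        # Coarser stride on large images keeps the number of candidate patches
        # manageable; unfold below slides a 224x224 window over the height and
        # width dimensions with this stride.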
        if I.size(2) >= 1024 or I.size(3) >= 1024:
step = 48
else:
step = 32
patches = I.unfold(2, kernel_h, step).unfold(3, kernel_w, step).permute(0, 2, 3, 1, 4, 5).reshape(-1,
n_channels,
kernel_h,
kernel_w)
assert patches.size(0) >= self.num_patch
#self.num_patch = np.minimum(patches.size(0), self.num_patch)
        if self.test:
            # evenly spaced patch positions for deterministic evaluation
            sel_step = patches.size(0) // self.num_patch
            sel = torch.arange(self.num_patch) * sel_step
        else:
            # random patch positions for training-time augmentation
            sel = torch.randint(low=0, high=patches.size(0), size=(self.num_patch,))
patches = patches[sel, ...]
mos = self.data.iloc[index, 1]
dist_type = self.data.iloc[index, 2]
scene_content1 = self.data.iloc[index, 3]
scene_content2 = self.data.iloc[index, 4]
scene_content3 = self.data.iloc[index, 5]
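        # 'valid' counts how many of the three scene labels are usable; unused
        # slots apparently hold the string 'invalid'.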
if scene_content2 == 'invalid':
valid = 1
elif scene_content3 == 'invalid':
valid = 2
else:
valid = 3
sample = {'I': patches, 'mos': float(mos), 'dist_type': dist_type, 'scene_content1': scene_content1,
'scene_content2':scene_content2, 'scene_content3':scene_content3, 'valid':valid}
return sample
def __len__(self):
return len(self.data.index)
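# Example usage of ImageDataset2 (a minimal sketch; the annotation path,
# image directory, and transform below are hypothetical placeholders, and
# images must be at least 224x224 after preprocessing for unfold to work):
#
#   from torchvision import transforms
#   from torch.utils.data import DataLoader
#
#   preprocess = transforms.ToTensor()
#   dataset = ImageDataset2('train_annotations.txt', 'images/', preprocess,
#                           num_patch=8, test=False)
#   loader = DataLoader(dataset, batch_size=4, shuffle=True)
#   batch = next(iter(loader))
#   # batch['I'] has shape (4, 8, 3, 224, 224)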
class ImageDataset_qonly(Dataset):
def __init__(self, csv_file,
img_dir,
preprocess,
num_patch,
set,
test,
get_loader=get_default_img_loader):
"""
Args:
csv_file (string): Path to the csv file with annotations.
img_dir (string): Directory of the images.
transform (callable, optional): transform to be applied on a sample.
"""
if csv_file[-3:] == 'txt':
data = pd.read_csv(csv_file, sep='\t', header=None)
self.data = data
self.mos_col = 1
elif csv_file[-4:] == 'xlsx':
data = pd.read_excel(csv_file, header=0)
self.data = data
self.mos_col = 1
else:
data = pd.read_csv(csv_file, header=0)
            if 'split' in data.columns and set != 3:
self.data = data[data.split==set]
else:
self.data = data
self.mos_col = 1
print('%d csv data successfully loaded!' % self.__len__())
self.img_dir = img_dir
self.loader = get_loader()
self.preprocess = preprocess
self.num_patch = num_patch
self.test = test
def __getitem__(self, index):
"""
Args:
index (int): Index
Returns:
samples: a Tensor that represents a video segment.
"""
image_name = os.path.join(self.img_dir, self.data.iloc[index, 0])
image_name = image_name.replace('\\', '/')
I = self.loader(image_name)
I = self.preprocess(I)
I = I.unsqueeze(0)
n_channels = 3
kernel_h = 224
kernel_w = 224
        if I.size(2) >= 1024 or I.size(3) >= 1024:
step = 48
else:
step = 32
patches = I.unfold(2, kernel_h, step).unfold(3, kernel_w, step).permute(0, 2, 3, 1, 4, 5).reshape(-1,
n_channels,
kernel_h,
kernel_w)
assert patches.size(0) >= self.num_patch
#self.num_patch = np.minimum(patches.size(0), self.num_patch)
        if self.test:
            # evenly spaced patch positions for deterministic evaluation
            sel_step = patches.size(0) // self.num_patch
            sel = torch.arange(self.num_patch) * sel_step
        else:
            # random patch positions for training-time augmentation
            sel = torch.randint(low=0, high=patches.size(0), size=(self.num_patch,))
patches = patches[sel, ...]
mos = self.data.iloc[index, self.mos_col]
        if self.data.shape[1] == 23:  # LLIE layout (23 cols): distortion ratings in every other column after the MOS
distortions = self.data.iloc[index, self.mos_col+1::2]
distortions = distortions.to_numpy(dtype=float)
distortions = torch.from_numpy(distortions)
else:
distortions = 0
sample = {'I': patches, 'mos': float(mos), 'dists':distortions}
return sample
    def __len__(self):
        return len(self.data.index)
class ImageDataset_llie(Dataset):
def __init__(self, csv_file,
img_dir,
spatialFeat,
preprocess,
num_patch,
set,
test,
get_loader=get_default_img_loader):
"""
Args:
csv_file (string): Path to the csv file with annotations.
img_dir (string): Directory of the images.
transform (callable, optional): transform to be applied on a sample.
"""
if csv_file[-3:] == 'txt':
data = pd.read_csv(csv_file, sep='\t', header=None)
self.data = data
self.mos_col = 1
elif csv_file[-4:] == 'xlsx':
data = pd.read_excel(csv_file, header=0)
self.data = data
self.mos_col = 1
else:
data = pd.read_csv(csv_file, header=0)
            if 'split' in data.columns and set != 3:
self.data = data[data.split==set]
else:
self.data = data
self.mos_col = 1
print('%d csv data successfully loaded!' % self.__len__())
self.img_dir = img_dir
self.loader = get_loader()
self.preprocess = preprocess
self.num_patch = num_patch
self.test = test
self.spatialFeat = spatialFeat
def __getitem__(self, index):
"""
Args:
index (int): Index
Returns:
samples: a Tensor that represents a video segment.
"""
image_name = os.path.join(self.img_dir, self.data.iloc[index, 0])
image_name = image_name.replace('\\', '/')
I = self.loader(image_name)
I = self.preprocess(I)
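        # look up the precomputed spatial feature saved as '<image stem>.npy'
        # under self.spatialFeat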
tmp = image_name.split('/')[-1]
tmp = tmp.split('.')[0]
spatial_feat = torch.from_numpy(np.load(os.path.join(self.spatialFeat, f'{tmp}.npy'))).view(-1)
I = I.unsqueeze(0)
n_channels = 3
kernel_h = 224
kernel_w = 224
        if I.size(2) >= 1024 or I.size(3) >= 1024:
step = 48
else:
step = 32
patches = I.unfold(2, kernel_h, step).unfold(3, kernel_w, step).permute(0, 2, 3, 1, 4, 5).reshape(-1,
n_channels,
kernel_h,
kernel_w)
        assert patches.size(0) >= self.num_patch
        # use a local copy so __getitem__ never mutates shared dataset state
        num_patch = min(patches.size(0), self.num_patch)
        if self.test:
            # evenly spaced patch positions for deterministic evaluation
            sel_step = patches.size(0) // num_patch
            sel = torch.arange(num_patch) * sel_step
        else:
            # random patch positions for training-time augmentation
            sel = torch.randint(low=0, high=patches.size(0), size=(num_patch,))
patches = patches[sel, ...]
mos = self.data.iloc[index, self.mos_col]
        if self.data.shape[1] == 23:  # LLIE layout (23 cols): distortion ratings in every other column after the MOS
distortions = self.data.iloc[index, self.mos_col+1::2]
distortions = distortions.to_numpy(dtype=float)
distortions = torch.from_numpy(distortions)
else:
distortions = 0
sample = {'I': patches, 'spatial_feat':spatial_feat, 'mos': float(mos), 'dists':distortions}
return sample
    def __len__(self):
        return len(self.data.index)
class ImageDataset_llie_naflex(Dataset):
def __init__(self, csv_file,
img_dir,
preprocess,
num_patch,
set,
test,
get_loader=get_default_img_loader):
"""
Args:
csv_file (string): Path to the csv file with annotations.
img_dir (string): Directory of the images.
transform (callable, optional): transform to be applied on a sample.
"""
if csv_file[-3:] == 'txt':
data = pd.read_csv(csv_file, sep='\t', header=None)
self.data = data
self.mos_col = 1
elif csv_file[-4:] == 'xlsx':
data = pd.read_excel(csv_file, header=0)
self.data = data
self.mos_col = 1
else:
data = pd.read_csv(csv_file, header=0)
            if 'split' in data.columns and set != 3:
self.data = data[data.split==set]
else:
self.data = data
self.mos_col = 1
print('%d csv data successfully loaded!' % self.__len__())
self.img_dir = img_dir
self.loader = get_loader()
self.preprocess = preprocess
self.num_patch = num_patch
self.test = test
def __getitem__(self, index):
"""
Args:
index (int): Index
Returns:
samples: a Tensor that represents a video segment.
"""
image_name = os.path.join(self.img_dir, self.data.iloc[index, 0])
image_name = image_name.replace('\\', '/')
I = self.loader(image_name)
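        # The NaFlex-style variants return the raw PIL image; self.preprocess
        # is stored but not applied here, presumably because variable-resolution
        # packing happens later in the collate/processor step.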
mos = self.data.iloc[index, self.mos_col]
        if self.data.shape[1] == 23:  # LLIE layout (23 cols): distortion ratings in every other column after the MOS
distortions = self.data.iloc[index, self.mos_col+1::2]
distortions = distortions.to_numpy(dtype=float)
distortions = torch.from_numpy(distortions)
else:
distortions = 0
#sample = {'I': I, 'mos': float(mos), 'dists':distortions}
return I, float(mos), distortions
    def __len__(self):
        return len(self.data.index)
class ImageDataset_sr_naflex(Dataset):
def __init__(self, csv_file,
img_dir,
preprocess,
num_patch,
set,
test,
get_loader=get_default_img_loader):
"""
Args:
csv_file (string): Path to the csv file with annotations.
img_dir (string): Directory of the images.
transform (callable, optional): transform to be applied on a sample.
"""
data = pd.read_excel(csv_file, header=0)
self.data = data
        print('%d annotation rows successfully loaded!' % self.__len__())
self.img_dir = img_dir
self.loader = get_loader()
self.preprocess = preprocess
self.num_patch = num_patch
self.test = test
def __getitem__(self, index):
"""
Args:
index (int): Index
Returns:
samples: a Tensor that represents a video segment.
"""
image_name = os.path.join(self.img_dir, 'SR', self.data.iloc[index, 0])
image_name = image_name.replace('\\', '/')
I = self.loader(image_name)
mos = self.data.iloc[index, 3]
return I, float(mos)
    def __len__(self):
        return len(self.data.index)
class ImageDataset_diqa_naflex(Dataset):
def __init__(self, csv_file,
img_dir,
preprocess,
num_patch,
set,
test,
get_loader=get_default_img_loader):
"""
Args:
csv_file (string): Path to the csv file with annotations.
img_dir (string): Directory of the images.
transform (callable, optional): transform to be applied on a sample.
"""
data = pd.read_csv(csv_file, header=0)
self.data = data
print('%d csv data successfully loaded!' % self.__len__())
self.img_dir = img_dir
self.loader = get_loader()
self.preprocess = preprocess
self.num_patch = num_patch
self.test = test
def __getitem__(self, index):
"""
Args:
index (int): Index
Returns:
samples: a Tensor that represents a video segment.
"""
image_name = os.path.join(self.img_dir, 'res', self.data.iloc[index, 0])
image_name = image_name.replace('\\', '/')
I = self.loader(image_name)
        if self.data.shape[1] == 5:
            image_name2 = os.path.join(self.img_dir, 'ori', self.data.iloc[index, 1])
            image_name2 = image_name2.replace('\\', '/')
            I_ref = self.loader(image_name2)
            # linear rescale of the raw scores (presumably onto a 1-5 MOS range)
            overall_mos = 0.8 * self.data.iloc[index, 2] + 1
            sharp_mos = 0.8 * self.data.iloc[index, 3] + 1
            color_mos = 0.8 * self.data.iloc[index, 4] + 1
        else:
            # no reference column: fall back to the image itself
            I_ref = I
            overall_mos = 0.8 * self.data.iloc[index, 1] + 1
            sharp_mos = 0.8 * self.data.iloc[index, 2] + 1
            color_mos = 0.8 * self.data.iloc[index, 3] + 1
return I, I_ref, float(overall_mos), float(sharp_mos), float(color_mos)
    def __len__(self):
        return len(self.data.index)
class ImageDataset_llie2(Dataset):
def __init__(self, csv_file,
img_dir,
preprocess,
num_patch,
set,
test,
get_loader=get_default_img_loader):
"""
Args:
csv_file (string): Path to the csv file with annotations.
img_dir (string): Directory of the images.
transform (callable, optional): transform to be applied on a sample.
"""
if csv_file[-3:] == 'txt':
data = pd.read_csv(csv_file, sep='\t', header=None)
self.data = data
self.mos_col = 1
elif csv_file[-4:] == 'xlsx':
data = pd.read_excel(csv_file, header=0)
self.data = data
self.mos_col = 1
else:
data = pd.read_csv(csv_file, header=0)
            if 'split' in data.columns and set != 3:
self.data = data[data.split==set]
else:
self.data = data
self.mos_col = 1
print('%d csv data successfully loaded!' % self.__len__())
self.img_dir = img_dir
self.loader = get_loader()
self.preprocess = preprocess
self.num_patch = num_patch
self.test = test
def __getitem__(self, index):
"""
Args:
index (int): Index
Returns:
samples: a Tensor that represents a video segment.
"""
image_name = os.path.join(self.img_dir, self.data.iloc[index, 0])
image_name = image_name.replace('\\', '/')
I = self.loader(image_name)
I = self.preprocess(I)
I = I.unsqueeze(0)
n_channels = 3
kernel_h = 224
kernel_w = 224
        if I.size(2) >= 1024 or I.size(3) >= 1024:
step = 48
else:
step = 32
patches = I.unfold(2, kernel_h, step).unfold(3, kernel_w, step).permute(0, 2, 3, 1, 4, 5).reshape(-1,
n_channels,
kernel_h,
kernel_w)
        assert patches.size(0) >= self.num_patch
        # use a local copy so __getitem__ never mutates shared dataset state
        num_patch = min(patches.size(0), self.num_patch)
        if self.test:
            # evenly spaced patch positions for deterministic evaluation
            sel_step = patches.size(0) // num_patch
            sel = torch.arange(num_patch) * sel_step
        else:
            # random patch positions for training-time augmentation
            sel = torch.randint(low=0, high=patches.size(0), size=(num_patch,))
patches = patches[sel, ...]
mos = self.data.iloc[index, self.mos_col]
        if self.data.shape[1] == 23:  # LLIE layout (23 cols): distortion ratings in every other column after the MOS
distortions = self.data.iloc[index, self.mos_col+1::2]
distortions = distortions.to_numpy(dtype=float)
distortions = torch.from_numpy(distortions)
else:
distortions = 0
sample = {'I': patches, 'mos': float(mos), 'dists':distortions}
return sample
    def __len__(self):
        return len(self.data.index)
class ImageDataset_pseudo_label(Dataset):
def __init__(self, csv_file,
img_dir,
preprocess,
num_patch,
set,
test,
pseudo_label,
get_loader=get_default_img_loader):
"""
Args:
csv_file (string): Path to the csv file with annotations.
img_dir (string): Directory of the images.
"""
self.data = pd.read_csv(csv_file, header=None)
print('%d csv data successfully loaded!' % self.__len__())
self.img_dir = img_dir
self.loader = get_loader()
self.preprocess = preprocess
self.num_patch = num_patch
self.pseudo_label = pseudo_label
self.test = test
def __getitem__(self, index):
"""
Args:
index (int): Index
Returns:
samples: A list of dicts with keys 'I' and 'mos'
"""
image_name = self.data.iloc[index, 0]
labels = []
all_patches = []
methods = list(self.pseudo_label.keys())
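        # Outputs of each enhancement method live under img_dir/<method>/;
        # 'GT' reuses the original file name, while NeRCo saves its results
        # with a '_fake_B.png' suffix.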
for method in methods:
if method == 'GT':
llie_name = image_name
elif method == 'NeRCo':
llie_name = method + '_' + image_name[:-4] + '_fake_B.png'
else:
llie_name = method + '_' + image_name
image_path = os.path.join(self.img_dir, method, llie_name)
I = self.loader(image_path)
I = self.preprocess(I)
label = self.pseudo_label[method]
I = I.unsqueeze(0)
n_channels = 3
kernel_h = 224
kernel_w = 224
            if I.size(2) >= 1024 or I.size(3) >= 1024:
step = 48
else:
step = 32
patches = I.unfold(2, kernel_h, step).unfold(3, kernel_w, step).permute(0, 2, 3, 1, 4, 5).reshape(-1,
n_channels,
kernel_h,
kernel_w)
            assert patches.size(0) >= self.num_patch
            # use a local copy so __getitem__ never mutates shared dataset state
            num_patch = min(patches.size(0), self.num_patch)
            if self.test:
                # evenly spaced patch positions for deterministic evaluation
                sel_step = patches.size(0) // num_patch
                sel = torch.arange(num_patch) * sel_step
            else:
                # random patch positions for training-time augmentation
                sel = torch.randint(low=0, high=patches.size(0), size=(num_patch,))
patches = patches[sel, ...]
labels.append(label)
all_patches.append(patches)
I = torch.cat(all_patches, dim=0)
labels = torch.tensor(labels)
sample = {'I': I, 'mos': labels}
return sample
def __len__(self):
return len(self.data.index)
# level = {'mild':0, 'moderate':1, 'severe': 2}
#
# tone_issues = {'global over-exposure':0, 'global under-exposure':1, 'global reverse-tone':2, 'global hazy': 3,
# 'global high-contrast': 4, 'global low-exposure':5, 'local over-exposure': 6, 'local under-exposure': 7,
# 'local hazy': 8, 'local high-contrast': 9, 'local low-contrast': 10}
#
# color_issues = {'global yellow tint':0, 'global cold tint':1, 'global green tint':2, 'global red tint': 3,
# 'global yellow-green tint': 4, 'global purple tint':5, 'global cyan tint': 6, 'global over-saturated': 7,
# 'global under-saturated': 8, 'local yellow tint':9, 'local cold tint':10, 'local green tint':11,
# 'local red tint': 12, 'local yellow-green tint': 13, 'local purple tint':14, 'local cyan tint': 15,
# 'local over-saturated': 16,'local under-saturated': 17, 'local magenta tint':18, 'local blue tint':19}
#
# local_areas = {'highlight area':0, 'bright area':1, 'mid-dark area':2, 'dark area':3, 'black area':4, 'human area':5,
# 'face area':6, 'hair area':7, 'cloth area':8, 'plant area': 9, 'sky area': 10, 'ground area': 11,
# 'water area': 12, 'lamp area':13, 'background area':13, 'background shadows':14, 'no area':15}
#
# tasks = {'tone':0, 'color':1}
#
# scene = {'food':0, 'mixed-light':1, 'outdoor':2, 'indoor':3, 'sunset':4, 'blue tone': 5, 'nighttime':6}
class ImageDataset_oppo(Dataset):
def __init__(self, csv_file,
img_dir,
preprocess,
num_patch,
test,
get_loader=get_default_img_loader):
"""
Args:
csv_file (string): Path to the csv file with annotations.
img_dir (string): Directory of the images.
transform (callable, optional): transform to be applied on a sample.
"""
self.data = pd.read_csv(csv_file, header=0)
print('%d csv data successfully loaded!' % self.__len__())
self.img_dir = img_dir
self.loader = get_loader()
self.preprocess = preprocess
self.num_patch = num_patch
self.test = test
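    # Missing annotation cells (NaN) are mapped to the token 'free',
    # presumably meaning no issue was reported for that field.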
def __convertnan__(self, value):
if pd.isna(value):
value = 'free'
return value
def __getitem__(self, index):
"""
Args:
index (int): Index
Returns:
samples: a Tensor that represents a video segment.
"""
image_name = os.path.join(self.img_dir, self.data.iloc[index, 0])
I = self.loader(image_name)
I = self.preprocess(I)
I = I.unsqueeze(0)
n_channels = 3
kernel_h = 224
kernel_w = 224
        if I.size(2) >= 1024 or I.size(3) >= 1024:
step = 48
else:
step = 32
patches = I.unfold(2, kernel_h, step).unfold(3, kernel_w, step).permute(0, 2, 3, 1, 4, 5).reshape(-1,
n_channels,
kernel_h,
kernel_w)
assert patches.size(0) >= self.num_patch
#self.num_patch = np.minimum(patches.size(0), self.num_patch)
        if self.test:
            # evenly spaced patch positions for deterministic evaluation
            sel_step = patches.size(0) // self.num_patch
            sel = torch.arange(self.num_patch) * sel_step
        else:
            # random patch positions for training-time augmentation
            sel = torch.randint(low=0, high=patches.size(0), size=(self.num_patch,))
patches = patches[sel, ...]
scene = self.data.iloc[index, 1]
mode = self.data.iloc[index, 2]
focal_length = self.data.iloc[index, 3]
compare_x200p = self.data.iloc[index, 4]
tone_level = self.__convertnan__(self.data.iloc[index, 5])
tone_global_issue = self.__convertnan__(self.data.iloc[index, 6])
tone_local_issue = self.__convertnan__(self.data.iloc[index, 7])
tone_local_issue_region = self.__convertnan__(self.data.iloc[index, 8])
color_level = self.__convertnan__(self.data.iloc[index, 9])
color_global_issue = self.__convertnan__(self.data.iloc[index, 10])
color_local_issue = self.__convertnan__(self.data.iloc[index, 11])
color_local_issue_region = self.__convertnan__(self.data.iloc[index, 12])
sample = {'I': patches, 'scene': scene.lower(), 'mode': mode.lower(), 'focal_length':focal_length.lower(), 'compare_x200p':compare_x200p.lower(),
'tone_level':tone_level.lower(), 'tone_global_issue':tone_global_issue.lower(), 'tone_local_issue':tone_local_issue.lower(),
'tone_local_issue_region':tone_local_issue_region.lower(), 'color_level':color_level.lower(),
'color_global_issue':color_global_issue.lower(), 'color_local_issue':color_local_issue.lower(),
'color_local_issue_region':color_local_issue_region.lower()}
return sample
def __len__(self):
return len(self.data.index)
class ImageDataset_llie_general(Dataset):
def __init__(self, csv_file,
img_dir,
preprocess,
set,
test,
get_loader=get_default_img_loader):
"""
Args:
csv_file (string): Path to the csv file with annotations.
img_dir (string): Directory of the images.
transform (callable, optional): transform to be applied on a sample.
"""
if csv_file[-3:] == 'txt':
data = pd.read_csv(csv_file, sep='\t', header=None)
self.data = data
self.mos_col = 1
elif csv_file[-4:] == 'xlsx':
data = pd.read_excel(csv_file, header=0)
self.data = data
self.mos_col = 1
else:
data = pd.read_csv(csv_file, header=0)
            if 'split' in data.columns and set != 3:
self.data = data[data.split==set]
else:
self.data = data
self.mos_col = 1
print('%d csv data successfully loaded!' % self.__len__())
self.img_dir = img_dir
self.loader = get_loader()
self.preprocess = preprocess
self.test = test
def __getitem__(self, index):
"""
Args:
index (int): Index
Returns:
samples: a Tensor that represents a video segment.
"""
image_name = os.path.join(self.img_dir, self.data.iloc[index, 0])
image_name = image_name.replace('\\', '/')
I = self.loader(image_name)
I = self.preprocess(I)
mos = self.data.iloc[index, self.mos_col]
sample = {'I': I, 'mos': float(mos)}
return sample
    def __len__(self):
        return len(self.data.index)
class ImageDataset_ms(Dataset):
def __init__(self, csv_file,
img_dir,
preprocess1,
preprocess2,
preprocess3,
num_patch,
set,
test,
get_loader=get_default_img_loader):
"""
Args:
csv_file (string): Path to the csv file with annotations.
img_dir (string): Directory of the images.
transform (callable, optional): transform to be applied on a sample.
"""
if csv_file[-3:] == 'txt':
data = pd.read_csv(csv_file, sep='\t', header=None)
self.data = data
self.mos_col = 1
elif csv_file[-4:] == 'xlsx':
data = pd.read_excel(csv_file, header=0)
self.data = data
self.mos_col = 1
else:
data = pd.read_csv(csv_file, header=0)
            if 'split' in data.columns and set != 3:
self.data = data[data.split==set]
else:
self.data = data
self.mos_col = 1
print('%d csv data successfully loaded!' % self.__len__())
self.img_dir = img_dir
self.loader = get_loader()
self.preprocess1 = preprocess1
self.preprocess2 = preprocess2
self.preprocess3 = preprocess3
self.num_patch = num_patch
self.test = test
def __getitem__(self, index):
"""
Args:
index (int): Index
Returns:
samples: a Tensor that represents a video segment.
"""
image_name = os.path.join(self.img_dir, self.data.iloc[index, 0])
I = self.loader(image_name)
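        # Patch budget: one globally resized view plus two scales of local
        # patches, splitting the remaining budget evenly between the scales.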
num_patch_per_scale = (self.num_patch - 1) // 2
        I1 = self.preprocess1(I)  # global resized view
        I1 = I1.unsqueeze(0)
        I2 = self.preprocess2(I)  # scale for stride-16 patches
        I2 = I2.unsqueeze(0)
        I3 = self.preprocess3(I)  # scale for stride-32 patches
        I3 = I3.unsqueeze(0)
I_global = I1
n_channels = 3
kernel_h = 224
kernel_w = 224
all_patches = [I_global] # insert global resized image (PaQ-2-PiQ)
step = 16
patches = I2.unfold(2, kernel_h, step).unfold(3, kernel_w, step).permute(0, 2, 3, 1, 4, 5).reshape(-1,
n_channels,
kernel_h,
kernel_w)
        if self.test:
            # evenly spaced patch positions for deterministic evaluation
            sel_step = patches.size(0) // num_patch_per_scale
            sel = torch.arange(num_patch_per_scale) * sel_step
        else:
            # random patch positions for training-time augmentation
            sel = torch.randint(low=0, high=patches.size(0), size=(num_patch_per_scale,))
patches = patches[sel, ...]
all_patches.append(patches)
step = 32
patches = I3.unfold(2, kernel_h, step).unfold(3, kernel_w, step).permute(0, 2, 3, 1, 4, 5).reshape(-1,
n_channels,
kernel_h,
kernel_w)
        if self.test:
            # evenly spaced patch positions for deterministic evaluation
            sel_step = patches.size(0) // num_patch_per_scale
            sel = torch.arange(num_patch_per_scale) * sel_step
        else:
            # random patch positions for training-time augmentation
            sel = torch.randint(low=0, high=patches.size(0), size=(num_patch_per_scale,))
patches = patches[sel, ...]
all_patches.append(patches)
all_patches = torch.cat(all_patches, 0)
        mos = self.data.iloc[index, self.mos_col]
        if self.data.shape[1] == 23:  # LLIE layout (23 cols): distortion ratings in every other column after the MOS
distortions = self.data.iloc[index, self.mos_col + 1::2]
distortions = distortions.to_numpy(dtype=float)
distortions = torch.from_numpy(distortions)
else:
distortions = 0
sample = {'I': all_patches, 'mos': float(mos), 'dists': distortions}
return sample
def __len__(self):
return len(self.data)
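# Example usage of ImageDataset_ms (a minimal sketch; paths and transforms are
# hypothetical placeholders; each preprocess must keep the image at least
# 224x224, and preprocess1 should resize to exactly 224x224 so the global
# view can be concatenated with the local patches):
#
#   from torchvision import transforms
#
#   to_global = transforms.Compose([transforms.Resize((224, 224)), transforms.ToTensor()])
#   to_fine = transforms.Compose([transforms.Resize(384), transforms.ToTensor()])
#   to_coarse = transforms.Compose([transforms.Resize(512), transforms.ToTensor()])
#   dataset = ImageDataset_ms('annotations.csv', 'images/', to_global, to_fine,
#                             to_coarse, num_patch=9, set=0, test=True)
#   sample = dataset[0]
#   # sample['I']: 1 global view + 2 * ((9 - 1) // 2) = 9 patches of 3x224x224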