# File size: 34,406 Bytes

# 28c2184

import os
import torch
import functools
import numpy as np
import pandas as pd
from PIL import Image, ImageFile
from torch.utils.data import Dataset
from tqdm import tqdm
import re
# Lowercase filename suffixes that image_loader accepts.
IMG_EXTENSIONS = ['.jpg', '.jpeg', '.png', '.ppm', '.bmp', '.pgm', '.tif']

# Module-level PIL switch: tolerate image files whose data is truncated
# instead of failing while decoding them.
ImageFile.LOAD_TRUNCATED_IMAGES = True
def has_file_allowed_extension(filename, extensions):
    """Tell whether ``filename`` ends with one of the given extensions.

    Only the filename is lowercased before comparing, so the entries of
    ``extensions`` are expected to be lowercase already.

    Args:
        filename (string): path to a file
        extensions (iterable of strings): suffixes to accept (lowercase)
    Returns:
        bool: True when the lowercased filename ends with any suffix,
        False otherwise (including when ``extensions`` is empty)
    """
    lowered = filename.lower()
    for suffix in extensions:
        if lowered.endswith(suffix):
            return True
    return False


def image_loader(image_name):
    """Load an image file and return it converted to RGB.

    Args:
        image_name (string): path to the image; its suffix must be one of
            IMG_EXTENSIONS (compared case-insensitively).
    Returns:
        PIL.Image.Image: a new image in 'RGB' mode.
    Raises:
        ValueError: if the file suffix is not listed in IMG_EXTENSIONS.
            (Previously this path failed with an UnboundLocalError because
            the image variable was never assigned.)
    """
    if not has_file_allowed_extension(image_name, IMG_EXTENSIONS):
        raise ValueError(
            'Unsupported image extension for %r; expected one of %s'
            % (image_name, ', '.join(IMG_EXTENSIONS)))
    # convert() decodes the pixel data and returns a separate image object,
    # so the underlying file can be closed as soon as it returns.
    with Image.open(image_name) as img:
        return img.convert('RGB')


def get_default_img_loader():
    """Return the default image-loading callable.

    Returns:
        functools.partial: ``image_loader`` wrapped with no pre-bound
        arguments; call it with an image path.
    """
    default_loader = functools.partial(image_loader)
    return default_loader


class ImageDataset2(Dataset):
    """Patch dataset read from a tab-separated, header-less annotation file.

    Columns are addressed by position: 0 image path (relative to
    ``img_dir``), 1 MOS, 2 distortion type, 3-5 scene contents.
    """

    def __init__(self, csv_file,
                 img_dir,
                 preprocess,
                 num_patch,
                 test,
                 get_loader=get_default_img_loader):
        """
        Args:
            csv_file (string): Path to the tab-separated annotation file.
            img_dir (string): Directory of the images.
            preprocess (callable): applied to the loaded image; its result
                must support ``unsqueeze``/``unfold`` (a tensor).
            num_patch (int): number of patches returned per image.
            test (bool): True selects evenly spaced patches, False draws
                random patch indices.
            get_loader (callable): zero-argument factory returning the
                function used to load an image from its path.
        """
        self.data = pd.read_csv(csv_file, sep='\t', header=None)
        print('%d csv data successfully loaded!' % len(self))
        self.img_dir = img_dir
        self.loader = get_loader()
        self.preprocess = preprocess
        self.num_patch = num_patch
        self.test = test

    def __getitem__(self, index):
        """
        Args:
            index (int): positional row index into the annotation table
        Returns:
            dict: 'I' (selected patches, shape (num_patch, 3, 224, 224)),
            'mos' (float), 'dist_type', 'scene_content1..3', and 'valid'
            (how many leading scene-content fields are not 'invalid').
        """
        path = os.path.join(self.img_dir, self.data.iloc[index, 0])
        # Leading batch axis so the two spatial axes sit at dims 2 and 3
        # (assumes preprocess returns a (C, H, W) tensor -- TODO confirm).
        image = self.preprocess(self.loader(path)).unsqueeze(0)

        channels, patch_h, patch_w = 3, 224, 224
        # Coarser stride once either spatial side reaches 1024.
        stride = 48 if max(image.size(2), image.size(3)) >= 1024 else 32
        windows = image.unfold(2, patch_h, stride).unfold(3, patch_w, stride)
        patches = windows.permute(0, 2, 3, 1, 4, 5).reshape(-1, channels, patch_h, patch_w)

        assert patches.size(0) >= self.num_patch
        if self.test:
            # Deterministic, evenly spaced indices: 0, s, 2s, ...
            spacing = patches.size(0) // self.num_patch
            chosen = torch.arange(self.num_patch) * spacing
        else:
            # Random indices, drawn with replacement.
            chosen = torch.randint(low=0, high=patches.size(0), size=(self.num_patch, ))
        patches = patches[chosen, ...]

        mos = self.data.iloc[index, 1]
        dist_type = self.data.iloc[index, 2]
        scene_content1 = self.data.iloc[index, 3]
        scene_content2 = self.data.iloc[index, 4]
        scene_content3 = self.data.iloc[index, 5]

        # Count the usable scene-content entries; the first is always counted.
        valid = 3
        if scene_content2 == 'invalid':
            valid = 1
        elif scene_content3 == 'invalid':
            valid = 2

        return {
            'I': patches,
            'mos': float(mos),
            'dist_type': dist_type,
            'scene_content1': scene_content1,
            'scene_content2': scene_content2,
            'scene_content3': scene_content3,
            'valid': valid,
        }

    def __len__(self):
        """Number of annotation rows."""
        return len(self.data.index)
        
class ImageDataset_qonly(Dataset):
    """Patch dataset returning quality scores (and optional distortion scores).

    The annotation file may be a tab-separated '.txt' (no header), an
    '.xlsx' workbook, or a comma-separated file with a header row.
    Column 0 is the image path and column ``mos_col`` (1) the MOS.
    """

    def __init__(self, csv_file,
                 img_dir,
                 preprocess,
                 num_patch,
                 set,
                 test,
                 get_loader=get_default_img_loader):
        """
        Args:
            csv_file (string): Path to the annotation file.
            img_dir (string): Directory of the images.
            preprocess (callable): applied to the loaded image; must return
                a tensor.
            num_patch (int): number of patches returned per image.
            set: value matched against the 'split' column of header CSVs;
                3 disables the filtering.
            test (bool): True selects evenly spaced patches, False draws
                random patch indices.
            get_loader (callable): zero-argument factory returning the
                image-loading function.
        """
        if csv_file.endswith('txt'):
            self.data = pd.read_csv(csv_file, sep='\t', header=None)
        elif csv_file.endswith('xlsx'):
            self.data = pd.read_excel(csv_file, header=0)
        else:
            data = pd.read_csv(csv_file, header=0)
            # Keep only the requested split unless the file has no 'split'
            # column or set == 3.
            if 'split' in data.columns and set != 3:
                data = data[data['split'] == set]
            self.data = data
        self.mos_col = 1
        print('%d csv data successfully loaded!' % len(self))
        self.img_dir = img_dir
        self.loader = get_loader()
        self.preprocess = preprocess
        self.num_patch = num_patch
        self.test = test

    def __getitem__(self, index):
        """
        Args:
            index (int): positional row index into the annotation table
        Returns:
            dict: 'I' (patches, shape (num_patch, 3, 224, 224)), 'mos'
            (float) and 'dists' (float64 tensor of distortion scores for
            23-column tables, otherwise the integer 0).
        """
        image_name = os.path.join(self.img_dir, self.data.iloc[index, 0])
        image_name = image_name.replace('\\', '/')
        # Leading batch axis so the spatial axes are dims 2 and 3
        # (assumes preprocess returns a (C, H, W) tensor -- TODO confirm).
        I = self.preprocess(self.loader(image_name)).unsqueeze(0)

        n_channels, kernel_h, kernel_w = 3, 224, 224
        # Coarser stride once either spatial side reaches 1024.
        step = 48 if (I.size(2) >= 1024 or I.size(3) >= 1024) else 32
        # Slide a 224x224 window over both spatial axes, then flatten the
        # window grid into a batch of patches.
        patches = (I.unfold(2, kernel_h, step)
                   .unfold(3, kernel_w, step)
                   .permute(0, 2, 3, 1, 4, 5)
                   .reshape(-1, n_channels, kernel_h, kernel_w))

        assert patches.size(0) >= self.num_patch, \
            'image yields fewer patches than num_patch'
        if self.test:
            # Deterministic, evenly spaced indices: 0, s, 2s, ...
            sel_step = patches.size(0) // self.num_patch
            sel = torch.arange(self.num_patch) * sel_step
        else:
            # Random indices, drawn with replacement.
            sel = torch.randint(low=0, high=patches.size(0), size=(self.num_patch, ))
        patches = patches[sel, ...]

        mos = self.data.iloc[index, self.mos_col]
        if self.data.shape[1] == 23:  # llie
            # Every second column after the MOS column.
            distortions = torch.from_numpy(
                self.data.iloc[index, self.mos_col + 1::2].to_numpy(dtype=float))
        else:
            distortions = 0

        return {'I': patches, 'mos': float(mos), 'dists': distortions}

    def __len__(self):
        """Number of annotation rows (after any split filtering)."""
        return len(self.data.index)


class ImageDataset_llie(Dataset):
    """Patch dataset that also returns a precomputed spatial feature vector.

    The annotation file may be a tab-separated '.txt' (no header), an
    '.xlsx' workbook, or a comma-separated file with a header row.
    Column 0 is the image path and column ``mos_col`` (1) the MOS.
    """

    def __init__(self, csv_file,
                 img_dir,
                 spatialFeat,
                 preprocess,
                 num_patch,
                 set,
                 test,
                 get_loader=get_default_img_loader):
        """
        Args:
            csv_file (string): Path to the annotation file.
            img_dir (string): Directory of the images.
            spatialFeat (string): Directory holding one '<image stem>.npy'
                feature file per image.
            preprocess (callable): applied to the loaded image; must return
                a tensor.
            num_patch (int): number of patches returned per image.
            set: value matched against the 'split' column of header CSVs;
                3 disables the filtering.
            test (bool): True selects evenly spaced patches, False draws
                random patch indices.
            get_loader (callable): zero-argument factory returning the
                image-loading function.
        """
        if csv_file.endswith('txt'):
            self.data = pd.read_csv(csv_file, sep='\t', header=None)
        elif csv_file.endswith('xlsx'):
            self.data = pd.read_excel(csv_file, header=0)
        else:
            data = pd.read_csv(csv_file, header=0)
            # Keep only the requested split unless the file has no 'split'
            # column or set == 3.
            if 'split' in data.columns and set != 3:
                data = data[data['split'] == set]
            self.data = data
        self.mos_col = 1
        print('%d csv data successfully loaded!' % len(self))
        self.img_dir = img_dir
        self.loader = get_loader()
        self.preprocess = preprocess
        self.num_patch = num_patch
        self.test = test
        self.spatialFeat = spatialFeat

    def __getitem__(self, index):
        """
        Args:
            index (int): positional row index into the annotation table
        Returns:
            dict: 'I' (patches, shape (num_patch, 3, 224, 224)),
            'spatial_feat' (flattened tensor loaded from the .npy file),
            'mos' (float) and 'dists' (float64 tensor of distortion scores
            for 23-column tables, otherwise the integer 0).
        """
        image_name = os.path.join(self.img_dir, self.data.iloc[index, 0])
        image_name = image_name.replace('\\', '/')
        I = self.preprocess(self.loader(image_name))

        # Feature file is named after the image's base name up to its
        # first dot.
        stem = image_name.rsplit('/', 1)[-1].split('.', 1)[0]
        spatial_feat = torch.from_numpy(
            np.load(os.path.join(self.spatialFeat, f'{stem}.npy'))).view(-1)

        # Leading batch axis so the spatial axes are dims 2 and 3
        # (assumes preprocess returns a (C, H, W) tensor -- TODO confirm).
        I = I.unsqueeze(0)
        n_channels, kernel_h, kernel_w = 3, 224, 224
        # Coarser stride once either spatial side reaches 1024.
        step = 48 if (I.size(2) >= 1024 or I.size(3) >= 1024) else 32
        patches = (I.unfold(2, kernel_h, step)
                   .unfold(3, kernel_w, step)
                   .permute(0, 2, 3, 1, 4, 5)
                   .reshape(-1, n_channels, kernel_h, kernel_w))

        assert patches.size(0) >= self.num_patch, \
            'image yields fewer patches than num_patch'
        # Clamp into a local: writing the result back to self.num_patch
        # would change the patch count for every later item.
        num_patch = min(patches.size(0), self.num_patch)
        if self.test:
            # Deterministic, evenly spaced indices: 0, s, 2s, ...
            sel_step = patches.size(0) // num_patch
            sel = torch.arange(num_patch) * sel_step
        else:
            # Random indices, drawn with replacement.
            sel = torch.randint(low=0, high=patches.size(0), size=(num_patch, ))
        patches = patches[sel, ...]

        mos = self.data.iloc[index, self.mos_col]
        if self.data.shape[1] == 23:  # llie
            # Every second column after the MOS column.
            distortions = torch.from_numpy(
                self.data.iloc[index, self.mos_col + 1::2].to_numpy(dtype=float))
        else:
            distortions = 0

        return {'I': patches, 'spatial_feat': spatial_feat, 'mos': float(mos), 'dists': distortions}

    def __len__(self):
        """Number of annotation rows (after any split filtering)."""
        return len(self.data.index)


class ImageDataset_llie_naflex(Dataset):
    """Dataset returning the loaded image itself together with its scores.

    No preprocessing or patch extraction happens here; ``preprocess`` and
    ``num_patch`` are only stored on the instance.
    """

    def __init__(self, csv_file,
                 img_dir,
                 preprocess,
                 num_patch,
                 set,
                 test,
                 get_loader=get_default_img_loader):
        """
        Args:
            csv_file (string): Path to the annotation file ('.txt'
                tab-separated without header, '.xlsx', or header CSV).
            img_dir (string): Directory of the images.
            preprocess: stored as ``self.preprocess``; not applied here.
            num_patch: stored as ``self.num_patch``; not used here.
            set: value matched against the 'split' column of header CSVs;
                3 disables the filtering.
            test: stored as ``self.test``.
            get_loader (callable): zero-argument factory returning the
                image-loading function.
        """
        if csv_file.endswith('txt'):
            self.data = pd.read_csv(csv_file, sep='\t', header=None)
        elif csv_file.endswith('xlsx'):
            self.data = pd.read_excel(csv_file, header=0)
        else:
            data = pd.read_csv(csv_file, header=0)
            # Keep only the requested split unless the file has no 'split'
            # column or set == 3.
            if 'split' in data.columns and set != 3:
                data = data[data['split'] == set]
            self.data = data
        self.mos_col = 1
        print('%d csv data successfully loaded!' % len(self))
        self.img_dir = img_dir
        self.loader = get_loader()
        self.preprocess = preprocess
        self.num_patch = num_patch
        self.test = test

    def __getitem__(self, index):
        """
        Args:
            index (int): positional row index into the annotation table
        Returns:
            tuple: (image as returned by the loader, MOS as float,
            distortion scores as a float64 tensor for 23-column tables or
            the integer 0 otherwise).
        """
        image_name = os.path.join(self.img_dir, self.data.iloc[index, 0])
        image_name = image_name.replace('\\', '/')
        I = self.loader(image_name)

        mos = self.data.iloc[index, self.mos_col]
        if self.data.shape[1] == 23:  # llie
            # Every second column after the MOS column.
            distortions = torch.from_numpy(
                self.data.iloc[index, self.mos_col + 1::2].to_numpy(dtype=float))
        else:
            distortions = 0

        return I, float(mos), distortions

    def __len__(self):
        """Number of annotation rows (after any split filtering)."""
        return len(self.data.index)
    
class ImageDataset_sr_naflex(Dataset):
    """Dataset of images under ``img_dir/SR`` annotated in an Excel sheet.

    Column 0 of the sheet is the image file name and column 3 the MOS.
    """

    def __init__(self, csv_file,
                 img_dir,
                 preprocess,
                 num_patch,
                 set,
                 test,
                 get_loader=get_default_img_loader):
        """
        Args:
            csv_file (string): Path to the Excel annotation file (read with
                ``pd.read_excel``, first row as header).
            img_dir (string): Directory containing the 'SR' image folder.
            preprocess: stored as ``self.preprocess``; not applied here.
            num_patch: stored as ``self.num_patch``; not used here.
            set: accepted for signature parity; not used.
            test: stored as ``self.test``.
            get_loader (callable): zero-argument factory returning the
                image-loading function.
        """
        self.data = pd.read_excel(csv_file, header=0)

        print('%d csv data successfully loaded!' % len(self))
        self.img_dir = img_dir
        self.loader = get_loader()
        self.preprocess = preprocess
        self.num_patch = num_patch
        self.test = test

    def __getitem__(self, index):
        """
        Args:
            index (int): positional row index into the annotation table
        Returns:
            tuple: (image as returned by the loader, MOS as float)
        """
        image_name = os.path.join(self.img_dir, 'SR', self.data.iloc[index, 0])
        image_name = image_name.replace('\\', '/')

        I = self.loader(image_name)
        mos = self.data.iloc[index, 3]

        return I, float(mos)

    def __len__(self):
        """Number of annotation rows."""
        return len(self.data.index)

class ImageDataset_diqa_naflex(Dataset):
    """Dataset returning an image, a reference image and three scores.

    With a 5-column table the columns are: 0 image name (under
    ``img_dir/res``), 1 reference name (under ``img_dir/ori``), 2-4 the
    overall / sharpness / colour scores. Otherwise columns 1-3 hold the
    scores and the image doubles as its own reference.
    """

    def __init__(self, csv_file,
                 img_dir,
                 preprocess,
                 num_patch,
                 set,
                 test,
                 get_loader=get_default_img_loader):
        """
        Args:
            csv_file (string): Path to the comma-separated annotation file
                (first row is the header).
            img_dir (string): Directory containing the 'res' (and, for
                5-column tables, 'ori') image folders.
            preprocess: stored as ``self.preprocess``; not applied here.
            num_patch: stored as ``self.num_patch``; not used here.
            set: accepted for signature parity; not used.
            test: stored as ``self.test``.
            get_loader (callable): zero-argument factory returning the
                image-loading function.
        """
        self.data = pd.read_csv(csv_file, header=0)

        print('%d csv data successfully loaded!' % len(self))
        self.img_dir = img_dir
        self.loader = get_loader()
        self.preprocess = preprocess
        self.num_patch = num_patch
        self.test = test

    def __getitem__(self, index):
        """
        Args:
            index (int): positional row index into the annotation table
        Returns:
            tuple: (image, reference image, overall score, sharpness
            score, colour score); the scores are floats after the
            ``0.8 * raw + 1`` rescaling.
        """
        image_name = os.path.join(self.img_dir, 'res', self.data.iloc[index, 0])
        image_name = image_name.replace('\\', '/')
        I = self.loader(image_name)

        if self.data.shape[1] == 5:
            image_name2 = os.path.join(self.img_dir, 'ori', self.data.iloc[index, 1])
            # Normalise the *reference* path. The previous code normalised
            # image_name here, so the reference was silently the distorted
            # image again.
            image_name2 = image_name2.replace('\\', '/')
            I_ref = self.loader(image_name2)
            first_score_col = 2
        else:
            # No reference column: the image serves as its own reference.
            I_ref = I
            first_score_col = 1

        # Same affine rescaling for all three raw scores.
        overall_mos = 0.8 * self.data.iloc[index, first_score_col] + 1
        sharp_mos = 0.8 * self.data.iloc[index, first_score_col + 1] + 1
        color_mos = 0.8 * self.data.iloc[index, first_score_col + 2] + 1

        return I, I_ref, float(overall_mos), float(sharp_mos), float(color_mos)

    def __len__(self):
        """Number of annotation rows."""
        return len(self.data.index)




class ImageDataset_llie2(Dataset):
    """Patch dataset returning quality scores (and optional distortion scores).

    The annotation file may be a tab-separated '.txt' (no header), an
    '.xlsx' workbook, or a comma-separated file with a header row.
    Column 0 is the image path and column ``mos_col`` (1) the MOS.
    """

    def __init__(self, csv_file,
                 img_dir,
                 preprocess,
                 num_patch,
                 set,
                 test,
                 get_loader=get_default_img_loader):
        """
        Args:
            csv_file (string): Path to the annotation file.
            img_dir (string): Directory of the images.
            preprocess (callable): applied to the loaded image; must return
                a tensor.
            num_patch (int): number of patches returned per image.
            set: value matched against the 'split' column of header CSVs;
                3 disables the filtering.
            test (bool): True selects evenly spaced patches, False draws
                random patch indices.
            get_loader (callable): zero-argument factory returning the
                image-loading function.
        """
        if csv_file.endswith('txt'):
            self.data = pd.read_csv(csv_file, sep='\t', header=None)
        elif csv_file.endswith('xlsx'):
            self.data = pd.read_excel(csv_file, header=0)
        else:
            data = pd.read_csv(csv_file, header=0)
            # Keep only the requested split unless the file has no 'split'
            # column or set == 3.
            if 'split' in data.columns and set != 3:
                data = data[data['split'] == set]
            self.data = data
        self.mos_col = 1
        print('%d csv data successfully loaded!' % len(self))
        self.img_dir = img_dir
        self.loader = get_loader()
        self.preprocess = preprocess
        self.num_patch = num_patch
        self.test = test

    def __getitem__(self, index):
        """
        Args:
            index (int): positional row index into the annotation table
        Returns:
            dict: 'I' (patches, shape (num_patch, 3, 224, 224)), 'mos'
            (float) and 'dists' (float64 tensor of distortion scores for
            23-column tables, otherwise the integer 0).
        """
        image_name = os.path.join(self.img_dir, self.data.iloc[index, 0])
        image_name = image_name.replace('\\', '/')
        # Leading batch axis so the spatial axes are dims 2 and 3
        # (assumes preprocess returns a (C, H, W) tensor -- TODO confirm).
        I = self.preprocess(self.loader(image_name)).unsqueeze(0)

        n_channels, kernel_h, kernel_w = 3, 224, 224
        # Coarser stride once either spatial side reaches 1024.
        step = 48 if (I.size(2) >= 1024 or I.size(3) >= 1024) else 32
        patches = (I.unfold(2, kernel_h, step)
                   .unfold(3, kernel_w, step)
                   .permute(0, 2, 3, 1, 4, 5)
                   .reshape(-1, n_channels, kernel_h, kernel_w))

        assert patches.size(0) >= self.num_patch, \
            'image yields fewer patches than num_patch'
        # Clamp into a local: writing the result back to self.num_patch
        # would change the patch count for every later item.
        num_patch = min(patches.size(0), self.num_patch)
        if self.test:
            # Deterministic, evenly spaced indices: 0, s, 2s, ...
            sel_step = patches.size(0) // num_patch
            sel = torch.arange(num_patch) * sel_step
        else:
            # Random indices, drawn with replacement.
            sel = torch.randint(low=0, high=patches.size(0), size=(num_patch, ))
        patches = patches[sel, ...]

        mos = self.data.iloc[index, self.mos_col]
        if self.data.shape[1] == 23:  # llie
            # Every second column after the MOS column.
            distortions = torch.from_numpy(
                self.data.iloc[index, self.mos_col + 1::2].to_numpy(dtype=float))
        else:
            distortions = 0

        return {'I': patches, 'mos': float(mos), 'dists': distortions}

    def __len__(self):
        """Number of annotation rows (after any split filtering)."""
        return len(self.data.index)


class ImageDataset_pseudo_label(Dataset):
    """Dataset that pairs each image name with one variant per method.

    For every key of ``pseudo_label`` the matching image is loaded from
    ``img_dir/<method>/`` and labelled with ``pseudo_label[method]``.
    """

    def __init__(self, csv_file,
                 img_dir,
                 preprocess,
                 num_patch,
                 set,
                 test,
                 pseudo_label,
                 get_loader=get_default_img_loader):
        """
        Args:
            csv_file (string): Path to the header-less csv file; column 0
                holds the image file names.
            img_dir (string): Directory with one sub-folder per method.
            preprocess (callable): applied to each loaded image; must
                return a tensor.
            num_patch (int): number of patches taken from each image.
            set: accepted for signature parity; not used.
            test (bool): True selects evenly spaced patches, False draws
                random patch indices.
            pseudo_label (dict): maps method name to its label.
            get_loader (callable): zero-argument factory returning the
                image-loading function.
        """
        self.data = pd.read_csv(csv_file, header=None)
        print('%d csv data successfully loaded!' % len(self))
        self.img_dir = img_dir
        self.loader = get_loader()
        self.preprocess = preprocess
        self.num_patch = num_patch
        self.pseudo_label = pseudo_label
        self.test = test

    def __getitem__(self, index):
        """
        Args:
            index (int): positional row index into the annotation table
        Returns:
            dict: 'I' holds the patches of all methods concatenated along
            dim 0 (num_patch per method, in ``pseudo_label`` order) and
            'mos' a tensor with one label per method.
        """
        image_name = self.data.iloc[index, 0]
        n_channels, kernel_h, kernel_w = 3, 224, 224
        labels = []
        all_patches = []
        for method, label in list(self.pseudo_label.items()):
            if method == 'GT':
                llie_name = image_name
            elif method == 'NeRCo':
                # Drops the last four characters of the name -- presumably
                # a three-letter extension plus its dot; verify for others.
                llie_name = method + '_' + image_name[:-4] + '_fake_B.png'
            else:
                llie_name = method + '_' + image_name
            image_path = os.path.join(self.img_dir, method, llie_name)
            # Leading batch axis so the spatial axes are dims 2 and 3
            # (assumes preprocess returns a (C, H, W) tensor -- TODO confirm).
            I = self.preprocess(self.loader(image_path)).unsqueeze(0)

            # Coarser stride once either spatial side reaches 1024.
            step = 48 if (I.size(2) >= 1024 or I.size(3) >= 1024) else 32
            patches = (I.unfold(2, kernel_h, step)
                       .unfold(3, kernel_w, step)
                       .permute(0, 2, 3, 1, 4, 5)
                       .reshape(-1, n_channels, kernel_h, kernel_w))

            assert patches.size(0) >= self.num_patch, \
                'image yields fewer patches than num_patch'
            # Clamp into a local: writing the result back to self.num_patch
            # would change the patch count for later methods and items.
            num_patch = min(patches.size(0), self.num_patch)
            if self.test:
                # Deterministic, evenly spaced indices: 0, s, 2s, ...
                sel_step = patches.size(0) // num_patch
                sel = torch.arange(num_patch) * sel_step
            else:
                # Random indices, drawn with replacement.
                sel = torch.randint(low=0, high=patches.size(0), size=(num_patch,))

            labels.append(label)
            all_patches.append(patches[sel, ...])

        I = torch.cat(all_patches, dim=0)
        labels = torch.tensor(labels)
        return {'I': I, 'mos': labels}

    def __len__(self):
        """Number of annotation rows."""
        return len(self.data.index)


# level = {'mild':0, 'moderate':1, 'severe': 2}
#
# tone_issues = {'global over-exposure':0, 'global under-exposure':1, 'global reverse-tone':2, 'global hazy': 3,
#                'global high-contrast': 4, 'global low-exposure':5, 'local over-exposure': 6, 'local under-exposure': 7,
#                'local hazy': 8, 'local high-contrast': 9, 'local low-contrast': 10}
#
# color_issues = {'global yellow tint':0, 'global cold tint':1, 'global green tint':2, 'global red tint': 3,
#                'global yellow-green tint': 4, 'global purple tint':5, 'global cyan tint': 6, 'global over-saturated': 7,
#                'global under-saturated': 8, 'local yellow tint':9, 'local cold tint':10, 'local green tint':11,
#                 'local red tint': 12, 'local yellow-green tint': 13, 'local purple tint':14, 'local cyan tint': 15,
#                 'local over-saturated': 16,'local under-saturated': 17, 'local magenta tint':18, 'local blue tint':19}
#
# local_areas = {'highlight area':0, 'bright area':1, 'mid-dark area':2, 'dark area':3, 'black area':4, 'human area':5,
#               'face area':6, 'hair area':7, 'cloth area':8, 'plant area': 9, 'sky area': 10, 'ground area': 11,
#               'water area': 12, 'lamp area':13, 'background area':13, 'background shadows':14, 'no area':15}
#
# tasks = {'tone':0, 'color':1}
#
# scene = {'food':0, 'mixed-light':1, 'outdoor':2, 'indoor':3, 'sunset':4, 'blue tone': 5, 'nighttime':6}



class ImageDataset_oppo(Dataset):
    """Patch dataset with textual scene / tone / colour annotations.

    The annotation csv has a header row; columns are read by position:
    0 image path, 1-4 scene, mode, focal length and comparison fields,
    5-8 tone fields, 9-12 colour fields.
    """

    def __init__(self, csv_file,
                 img_dir,
                 preprocess,
                 num_patch,
                 test,
                 get_loader=get_default_img_loader):
        """
        Args:
            csv_file (string): Path to the csv file with annotations.
            img_dir (string): Directory of the images.
            preprocess (callable): applied to the loaded image; must return
                a tensor.
            num_patch (int): number of patches returned per image.
            test (bool): True selects evenly spaced patches, False draws
                random patch indices.
            get_loader (callable): zero-argument factory returning the
                image-loading function.
        """
        self.data = pd.read_csv(csv_file, header=0)
        print('%d csv data successfully loaded!' % len(self))
        self.img_dir = img_dir
        self.loader = get_loader()
        self.preprocess = preprocess
        self.num_patch = num_patch
        self.test = test


    def __convertnan__(self, value):
        """Return 'free' for a missing (NaN) cell, the value itself otherwise."""
        return 'free' if pd.isna(value) else value

    def __getitem__(self, index):
        """
        Args:
            index (int): positional row index into the annotation table
        Returns:
            dict: 'I' (patches, shape (num_patch, 3, 224, 224)) plus the
            twelve annotation fields, each lowercased.
        """
        path = os.path.join(self.img_dir, self.data.iloc[index, 0])
        # Leading batch axis so the two spatial axes sit at dims 2 and 3
        # (assumes preprocess returns a (C, H, W) tensor -- TODO confirm).
        image = self.preprocess(self.loader(path)).unsqueeze(0)

        channels, patch_h, patch_w = 3, 224, 224
        # Coarser stride once either spatial side reaches 1024.
        stride = 48 if max(image.size(2), image.size(3)) >= 1024 else 32
        windows = image.unfold(2, patch_h, stride).unfold(3, patch_w, stride)
        patches = windows.permute(0, 2, 3, 1, 4, 5).reshape(-1, channels, patch_h, patch_w)

        assert patches.size(0) >= self.num_patch
        if self.test:
            # Deterministic, evenly spaced indices: 0, s, 2s, ...
            spacing = patches.size(0) // self.num_patch
            chosen = torch.arange(self.num_patch) * spacing
        else:
            # Random indices, drawn with replacement.
            chosen = torch.randint(low=0, high=patches.size(0), size=(self.num_patch, ))
        patches = patches[chosen, ...]

        # Columns 1-4 are taken as-is; columns 5-12 may be empty and are
        # mapped to 'free' in that case.
        raw_keys = ('scene', 'mode', 'focal_length', 'compare_x200p')
        nan_safe_keys = ('tone_level', 'tone_global_issue', 'tone_local_issue',
                         'tone_local_issue_region', 'color_level',
                         'color_global_issue', 'color_local_issue',
                         'color_local_issue_region')
        values = [self.data.iloc[index, col] for col in range(1, 5)]
        values += [self.__convertnan__(self.data.iloc[index, col]) for col in range(5, 13)]

        sample = {'I': patches}
        for key, value in zip(raw_keys + nan_safe_keys, values):
            sample[key] = value.lower()

        return sample

    def __len__(self):
        """Number of annotation rows."""
        return len(self.data.index)



class ImageDataset_llie_general(Dataset):
    """Dataset returning the whole preprocessed image and its MOS.

    The annotation file may be a tab-separated '.txt' (no header), an
    '.xlsx' workbook, or a comma-separated file with a header row.
    Column 0 is the image path and column ``mos_col`` (1) the MOS.
    """

    def __init__(self, csv_file,
                 img_dir,
                 preprocess,
                 set,
                 test,
                 get_loader=get_default_img_loader):
        """
        Args:
            csv_file (string): Path to the annotation file.
            img_dir (string): Directory of the images.
            preprocess (callable): applied to the loaded image.
            set: value matched against the 'split' column of header CSVs;
                3 disables the filtering.
            test: stored as ``self.test``.
            get_loader (callable): zero-argument factory returning the
                image-loading function.
        """
        if csv_file.endswith('txt'):
            self.data = pd.read_csv(csv_file, sep='\t', header=None)
        elif csv_file.endswith('xlsx'):
            self.data = pd.read_excel(csv_file, header=0)
        else:
            data = pd.read_csv(csv_file, header=0)
            # Keep only the requested split unless the file has no 'split'
            # column or set == 3.
            if 'split' in data.columns and set != 3:
                data = data[data['split'] == set]
            self.data = data
        self.mos_col = 1
        print('%d csv data successfully loaded!' % len(self))
        self.img_dir = img_dir
        self.loader = get_loader()
        self.preprocess = preprocess
        self.test = test

    def __getitem__(self, index):
        """
        Args:
            index (int): positional row index into the annotation table
        Returns:
            dict: 'I' (the preprocessed image) and 'mos' (float)
        """
        image_name = os.path.join(self.img_dir, self.data.iloc[index, 0])
        image_name = image_name.replace('\\', '/')
        I = self.preprocess(self.loader(image_name))

        mos = self.data.iloc[index, self.mos_col]
        return {'I': I, 'mos': float(mos)}

    def __len__(self):
        """Number of annotation rows (after any split filtering)."""
        return len(self.data.index)


class ImageDataset_ms(Dataset):
    """Multi-scale patch dataset: one global view plus patches at two scales.

    The annotation file may be a tab-separated '.txt' (no header), an
    '.xlsx' workbook, or a comma-separated file with a header row.
    Column 0 is the image path and column ``mos_col`` (1) the MOS.
    """

    def __init__(self, csv_file,
                 img_dir,
                 preprocess1,
                 preprocess2,
                 preprocess3,
                 num_patch,
                 set,
                 test,
                 get_loader=get_default_img_loader):
        """
        Args:
            csv_file (string): Path to the annotation file.
            img_dir (string): Directory of the images.
            preprocess1 (callable): produces the global view; its output
                must be a (3, 224, 224) tensor so it can be concatenated
                with the patches.
            preprocess2 (callable or None): produces the image cut with
                stride 16; None falls back to ``preprocess1``.
            preprocess3 (callable or None): produces the image cut with
                stride 32; None falls back to ``preprocess1``.
            num_patch (int): total sample budget; each patch scale gets
                ``(num_patch - 1) // 2`` patches.
            set: value matched against the 'split' column of header CSVs;
                3 disables the filtering.
            test (bool): True selects evenly spaced patches, False draws
                random patch indices.
            get_loader (callable): zero-argument factory returning the
                image-loading function.
        """
        if csv_file.endswith('txt'):
            self.data = pd.read_csv(csv_file, sep='\t', header=None)
        elif csv_file.endswith('xlsx'):
            self.data = pd.read_excel(csv_file, header=0)
        else:
            data = pd.read_csv(csv_file, header=0)
            # Keep only the requested split unless the file has no 'split'
            # column or set == 3.
            if 'split' in data.columns and set != 3:
                data = data[data['split'] == set]
            self.data = data
        self.mos_col = 1
        print('%d csv data successfully loaded!' % len(self))
        self.img_dir = img_dir
        self.loader = get_loader()
        self.preprocess1 = preprocess1
        self.preprocess2 = preprocess2
        self.preprocess3 = preprocess3
        self.num_patch = num_patch
        self.test = test

    def _sample_patches(self, image, step, count):
        """Cut ``image`` (1, 3, H, W) into 224x224 patches and keep ``count``."""
        n_channels, kernel_h, kernel_w = 3, 224, 224
        patches = (image.unfold(2, kernel_h, step)
                   .unfold(3, kernel_w, step)
                   .permute(0, 2, 3, 1, 4, 5)
                   .reshape(-1, n_channels, kernel_h, kernel_w))
        if self.test:
            # Deterministic, evenly spaced indices: 0, s, 2s, ...
            sel_step = patches.size(0) // count
            sel = torch.arange(count) * sel_step
        else:
            # Random indices, drawn with replacement.
            sel = torch.randint(low=0, high=patches.size(0), size=(count,))
        return patches[sel, ...]

    def __getitem__(self, index):
        """
        Args:
            index (int): positional row index into the annotation table
        Returns:
            dict: 'I' (global view followed by the stride-16 and stride-32
            patches, concatenated along dim 0), 'mos' (float) and 'dists'
            (float64 tensor of distortion scores for 23-column tables,
            otherwise the integer 0).
        """
        image_name = os.path.join(self.img_dir, self.data.iloc[index, 0])
        I = self.loader(image_name)

        num_patch_per_scale = (self.num_patch - 1) // 2

        # Each scale uses its own preprocessing. Previously preprocess1 was
        # applied three times and preprocess2/preprocess3 were never used.
        scale2 = self.preprocess2 if self.preprocess2 is not None else self.preprocess1
        scale3 = self.preprocess3 if self.preprocess3 is not None else self.preprocess1
        I1 = self.preprocess1(I).unsqueeze(0)
        I2 = scale2(I).unsqueeze(0)
        I3 = scale3(I).unsqueeze(0)

        all_patches = [
            I1,  # insert global resized image (PaQ-2-PiQ)
            self._sample_patches(I2, 16, num_patch_per_scale),
            self._sample_patches(I3, 32, num_patch_per_scale),
        ]
        all_patches = torch.cat(all_patches, 0)

        mos = self.data.iloc[index, self.mos_col]
        if self.data.shape[1] == 23:  # llie
            # Every second column after the MOS column.
            distortions = torch.from_numpy(
                self.data.iloc[index, self.mos_col + 1::2].to_numpy(dtype=float))
        else:
            distortions = 0

        return {'I': all_patches, 'mos': float(mos), 'dists': distortions}

    def __len__(self):
        """Number of annotation rows (after any split filtering)."""
        return len(self.data)