Spaces:

rhfeiyang
/

Opt-In-Art

Running on Zero

App Files Files Community

Opt-In-Art / custom_datasets /sam.py

rhfeiyang

Upload folder using huggingface_hub

262b155 verified about 1 year ago

raw

history blame

6.54 kB

	# Authors: Hui Ren (rhfeiyang.github.io)
	import os.path
	import sys
	from typing import Any, Callable, List, Optional, Tuple

	import tqdm
	from PIL import Image

	from torch.utils.data import Dataset
	import pickle
	from torchvision import transforms
	# import torch
	# import torchvision
	# import re


	class SamDataset(Dataset):
	def __init__(self, image_folder_path:str, caption_folder_path:str, id_file:str = "data/sam/clip_filtered_ids.pickle",id_dict_file:str =None , transforms: Optional[Callable] = None,
	resolution=None,
	get_img=True,
	get_cap=True,):
	if id_dict_file is not None:
	with open(id_dict_file, 'rb') as f:
	print(f"Loading id_dict from {id_dict_file}", flush=True)
	self.id_dict = pickle.load(f)
	print(f"Loaded id_dict from {id_dict_file}", flush=True)
	else:
	self.id_dict = None
	if isinstance(id_file, list):
	self.ids = id_file
	elif isinstance(id_file, str):
	with open(id_file, 'rb') as f:
	print(f"Loading ids from {id_file}", flush=True)
	self.ids = pickle.load(f)
	print(f"Loaded ids from {id_file}", flush=True)
	self.resolution = resolution
	self.ori_image_folder_path = image_folder_path
	if self.resolution is not None:
	if os.path.exists("/var/jomat/datasets/"):
	# self.image_folder_path = f"/var/jomat/datasets/SAM_{resolution}"
	self.image_folder_path = f"{image_folder_path}_{resolution}"
	else:
	self.image_folder_path = f"{image_folder_path}_{resolution}"
	os.makedirs(self.image_folder_path, exist_ok=True)
	else:
	self.image_folder_path = image_folder_path
	self.caption_folder_path = caption_folder_path
	self.transforms = transforms
	self.column_names = ["image", "text"]
	self.get_img = get_img
	self.get_cap = get_cap

	def __len__(self):
	# return 100
	return len(self.ids)

	def __getitem__(self, index: int):
	id = self.ids[index]
	ret={"id":id}
	try:
	# if index == 1:
	# raise Exception("test")
	if self.get_img:
	image = self._load_image(id)
	ret["image"]=image
	if self.get_cap:
	target = self._load_caption(id)
	ret["text"] = [target]
	if self.transforms is not None:
	ret = self.transforms(ret)
	return ret
	except Exception as e:
	raise e
	print(f"Error loading image and caption for id {id}, error: {e}, redirecting to index 0", flush=True)
	ret = self[0]
	return ret

	def define_resolution(self, resolution: int):
	self.resolution = resolution
	if os.path.exists("/var/jomat/datasets/"):
	self.image_folder_path = f"/var/jomat/datasets/SAM_{resolution}"
	# self.image_folder_path = f"{self.ori_image_folder_path}_{resolution}"
	else:
	self.image_folder_path = f"{self.ori_image_folder_path}_{resolution}"
	print(f"SamDataset resolution defined to {resolution}, new image folder path: {self.image_folder_path}")
	def _load_image(self, id: int) -> Image.Image:
	if self.id_dict is not None:
	subfolder = self.id_dict[id]
	image_path = f"{self.image_folder_path}/{subfolder}/sa_{id}.jpg"
	else:
	image_path = f"{self.image_folder_path}/sa_{id}.jpg"

	try:
	with open(image_path, 'rb') as f:
	img = Image.open(f).convert("RGB")
	# return img
	except:
	# load original image
	if self.id_dict is not None:
	subfolder = self.id_dict[id]
	ori_image_path = f"{self.ori_image_folder_path}/{subfolder}/sa_{id}.jpg"
	else:
	ori_image_path = f"{self.ori_image_folder_path}/sa_{id}.jpg"
	assert os.path.exists(ori_image_path)
	with open(ori_image_path, 'rb') as f:
	img = Image.open(f).convert("RGB")
	# resize image keep aspect ratio
	if self.resolution is not None:
	img = transforms.Resize(self.resolution, interpolation=transforms.InterpolationMode.BICUBIC)(img)
	# write image
	os.makedirs(os.path.dirname(image_path), exist_ok=True)
	img.save(image_path)

	return img


	def _load_caption(self, id: int):
	caption_path = f"{self.caption_folder_path}/sa_{id}.txt"
	if not os.path.exists(caption_path):
	return None
	try:
	with open(caption_path, 'r', encoding="utf-8") as f:
	content = f.read()
	except Exception as e:
	raise e
	print(f"Error reading caption file {caption_path}, error: {e}")
	return None
	sentences = content.split('.')
	# remove empty sentences and sentences with "black and white"(too many false prediction)
	sentences = [sentence.strip() for sentence in sentences if sentence.strip() and "black and white" not in sentence]
	# join sentence
	sentences = ". ".join(sentences)
	if len(sentences) > 0 and sentences[-1] != '.':
	sentences += '.'

	return sentences

	def with_transform(self, transform):
	self.transforms = transform
	return self

	def subsample(self, n: int = 10000):
	if n is None or n == -1:
	return self
	ori_len = len(self)
	assert n <= ori_len
	# equal interval subsample
	ids = self.ids[::ori_len // n][:n]
	self.ids = ids
	print(f"SAM dataset subsampled from {ori_len} to {len(self)}")
	return self


	if __name__ == "__main__":
	# sam_filt(caption_filt=False, clip_filt=False, clip_logit=True)
	from custom_datasets.sam_caption.mypath import MyPath
	dataset = SamDataset(image_folder_path=MyPath.db_root_dir("sam_images"), caption_folder_path=MyPath.db_root_dir("sam_captions"), id_file=MyPath.db_root_dir("sam_whole_filtered_ids_train"), id_dict_file=MyPath.db_root_dir("sam_id_dict"))
	dataset.get_img = False
	for i in tqdm.tqdm(dataset):
	a=i['text']