Spaces:

Yarflam
/

UnderWater

Paused

App Files Files Community

Yarflam committed on Dec 8, 2024

Commit

a15cce2

1 Parent(s): c954f09

Load Image

Browse files

Files changed (2) hide show

ModelLoader.py +20 -2
util/get_transform.py +142 -0

ModelLoader.py CHANGED Viewed

@@ -1,4 +1,6 @@
 from models import create_model
 import os
 ckp_path = os.path.join(os.path.dirname(__file__), 'checkpoints')
@@ -14,6 +16,7 @@ class Options(object):
 class ModelLoader:
     def __init__(self) -> None:
         self.opt = Options({
             'name': 'original',
             'checkpoints_dir': ckp_path,
             'gpu_ids': [],
@@ -28,7 +31,8 @@ class ModelLoader:
             'ndf': 64,
             'netD': 'basic',
             'netG': 'resnet_9blocks',
-            'netF': 'reshape',
             'ngf': 64,
             'no_antialias_up': None,
             'no_antialias': None,
@@ -41,12 +45,26 @@ class ModelLoader:
             'serial_batches': True, # disable data shuffling; comment this line if results on randomly chosen images are needed.
             'no_flip': True, # no flip; comment this line if results on flipped images are needed.
             'display_id': -1, # no visdom display; the test code saves the results to a HTML file.
         })
     def load(self) -> None:
         self.model = create_model(self.opt)
         self.model.load_networks('latest')
     def inference(self, src=''):
         if not os.path.isfile(src):
             raise Exception('The image %s is not found!' % src)
-        # if exist_file()
         print('Loading the image %s' % src)

 from models import create_model
+from util.get_transform import get_transform
+from PIL import Image
 import os
 ckp_path = os.path.join(os.path.dirname(__file__), 'checkpoints')
 class ModelLoader:
     def __init__(self) -> None:
         self.opt = Options({
+            'isGradio': True, # Custom
             'name': 'original',
             'checkpoints_dir': ckp_path,
             'gpu_ids': [],
             'ndf': 64,
             'netD': 'basic',
             'netG': 'resnet_9blocks',
+            'netF': 'mlp_sample',
+            'netF_nc': 256,
             'ngf': 64,
             'no_antialias_up': None,
             'no_antialias': None,
             'serial_batches': True, # disable data shuffling; comment this line if results on randomly chosen images are needed.
             'no_flip': True, # no flip; comment this line if results on flipped images are needed.
             'display_id': -1, # no visdom display; the test code saves the results to a HTML file.
+            'direction': 'AtoB', # inference
+            'flip_equivariance': False,
+            'load_size': 1680,
+            'crop_size': 512,
         })
+        self.transform = get_transform(self.opt, grayscale=False)
+        self.model = None
     def load(self) -> None:
+        """Create the model from ``self.opt`` and call its ``load_networks('latest')``."""
         self.model = create_model(self.opt)
         self.model.load_networks('latest')
     def inference(self, src=''):
+        if self.model == None: self.load()
         if not os.path.isfile(src):
             raise Exception('The image %s is not found!' % src)
+        # Loading
         print('Loading the image %s' % src)
+        source = Image.open(src).convert('RGB')
+        img = self.transform(source)
+        print(img.shape)
+        # Inference
+        self.model.set_input({ 'A': img, 'B': img, 'A_paths': src })
+        self.model.forward()
+        print(self.model)

util/get_transform.py ADDED Viewed

	@@ -0,0 +1,142 @@

+import torchvision.transforms as transforms
+from PIL import Image
+import numpy as np
+def get_transform(opt, params=None, grayscale=False, method=Image.BICUBIC, convert=True):
+    """Assemble a ``transforms.Compose`` pipeline from the options in ``opt``.
+
+    Steps are appended in a fixed order, each one enabled by an ``in`` test
+    against ``opt.preprocess``: fixsize, then one of resize / scale_width /
+    scale_shortside, then zoom, crop, patch and trim. A multiple-of-4 resize
+    is always appended, followed by an optional flip and the tensor
+    conversion.
+
+    Args:
+        opt: options object; ``preprocess``, ``load_size``, ``crop_size`` and
+            ``no_flip`` are read here, plus ``dataroot`` when 'resize' is
+            enabled.
+        params: optional dict of fixed values ('size', 'scale_factor',
+            'crop_pos', 'patch_index', 'flip'). The 'fixsize' and 'patch'
+            steps index it unconditionally; zoom, crop and flip use their
+            random variants when it is None.
+        grayscale: when true, prepend ``Grayscale(1)`` and normalize a single
+            channel.
+        method: resampling filter handed to every resize step.
+        convert: when true, append ``ToTensor`` and a 0.5 / 0.5 ``Normalize``.
+
+    Returns:
+        The composed transform.
+    """
+    transform_list = []
+    if grayscale:
+        transform_list.append(transforms.Grayscale(1))
+    # Fixed-size resize; needs params["size"].
+    if 'fixsize' in opt.preprocess:
+        transform_list.append(transforms.Resize(params["size"], method))
+    # Exactly one of the three scaling strategies is applied, in this priority.
+    if 'resize' in opt.preprocess:
+        osize = [opt.load_size, opt.load_size]
+        # Special case: the first entry of the size is halved for this dataroot.
+        if "gta2cityscapes" in opt.dataroot:
+            osize[0] = opt.load_size // 2
+        transform_list.append(transforms.Resize(osize, method))
+    elif 'scale_width' in opt.preprocess:
+        transform_list.append(transforms.Lambda(lambda img: __scale_width(img, opt.load_size, opt.crop_size, method)))
+    elif 'scale_shortside' in opt.preprocess:
+        transform_list.append(transforms.Lambda(lambda img: __scale_shortside(img, opt.load_size, opt.crop_size, method)))
+    # Zoom: random factor without params, otherwise params["scale_factor"].
+    if 'zoom' in opt.preprocess:
+        if params is None:
+            transform_list.append(transforms.Lambda(lambda img: __random_zoom(img, opt.load_size, opt.crop_size, method)))
+        else:
+            transform_list.append(transforms.Lambda(lambda img: __random_zoom(img, opt.load_size, opt.crop_size, method, factor=params["scale_factor"])))
+    # Crop: random position unless params provides 'crop_pos'.
+    if 'crop' in opt.preprocess:
+        if params is None or 'crop_pos' not in params:
+            transform_list.append(transforms.RandomCrop(opt.crop_size))
+        else:
+            transform_list.append(transforms.Lambda(lambda img: __crop(img, params['crop_pos'], opt.crop_size)))
+    # Patch extraction; needs params['patch_index'].
+    if 'patch' in opt.preprocess:
+        transform_list.append(transforms.Lambda(lambda img: __patch(img, params['patch_index'], opt.crop_size)))
+    if 'trim' in opt.preprocess:
+        transform_list.append(transforms.Lambda(lambda img: __trim(img, opt.crop_size)))
+    # if opt.preprocess == 'none':
+    # Applied unconditionally: round both sides to a multiple of 4.
+    transform_list.append(transforms.Lambda(lambda img: __make_power_2(img, base=4, method=method)))
+    # Flip: random unless params fixes it through 'flip'.
+    if not opt.no_flip:
+        if params is None or 'flip' not in params:
+            transform_list.append(transforms.RandomHorizontalFlip())
+        elif 'flip' in params:
+            transform_list.append(transforms.Lambda(lambda img: __flip(img, params['flip'])))
+    # Tensor conversion, with one normalization value per channel.
+    if convert:
+        transform_list += [transforms.ToTensor()]
+        if grayscale:
+            transform_list += [transforms.Normalize((0.5,), (0.5,))]
+        else:
+            transform_list += [transforms.Normalize((0.5, 0.5, 0.5), (0.5, 0.5, 0.5))]
+    return transforms.Compose(transform_list)
+def __make_power_2(img, base, method=Image.BICUBIC):
+    ow, oh = img.size
+    h = int(round(oh / base) * base)
+    w = int(round(ow / base) * base)
+    if h == oh and w == ow:
+        return img
+    return img.resize((w, h), method)
+def __random_zoom(img, target_width, crop_width, method=Image.BICUBIC, factor=None):
+    if factor is None:
+        zoom_level = np.random.uniform(0.8, 1.0, size=[2])
+    else:
+        zoom_level = (factor[0], factor[1])
+    iw, ih = img.size
+    zoomw = max(crop_width, iw * zoom_level[0])
+    zoomh = max(crop_width, ih * zoom_level[1])
+    img = img.resize((int(round(zoomw)), int(round(zoomh))), method)
+    return img
+def __scale_shortside(img, target_width, crop_width, method=Image.BICUBIC):
+    ow, oh = img.size
+    shortside = min(ow, oh)
+    if shortside >= target_width:
+        return img
+    else:
+        scale = target_width / shortside
+        return img.resize((round(ow * scale), round(oh * scale)), method)
+def __trim(img, trim_width):
+    ow, oh = img.size
+    if ow > trim_width:
+        xstart = np.random.randint(ow - trim_width)
+        xend = xstart + trim_width
+    else:
+        xstart = 0
+        xend = ow
+    if oh > trim_width:
+        ystart = np.random.randint(oh - trim_width)
+        yend = ystart + trim_width
+    else:
+        ystart = 0
+        yend = oh
+    return img.crop((xstart, ystart, xend, yend))
+def __scale_width(img, target_width, crop_width, method=Image.BICUBIC):
+    ow, oh = img.size
+    if ow == target_width and oh >= crop_width:
+        return img
+    w = target_width
+    h = int(max(target_width * oh / ow, crop_width))
+    return img.resize((w, h), method)
+def __crop(img, pos, size):
+    ow, oh = img.size
+    x1, y1 = pos
+    tw = th = size
+    if (ow > tw or oh > th):
+        return img.crop((x1, y1, x1 + tw, y1 + th))
+    return img
+def __patch(img, index, size):
+    ow, oh = img.size
+    nw, nh = ow // size, oh // size
+    roomx = ow - nw * size
+    roomy = oh - nh * size
+    startx = np.random.randint(int(roomx) + 1)
+    starty = np.random.randint(int(roomy) + 1)
+    index = index % (nw * nh)
+    ix = index // nh
+    iy = index % nh
+    gridx = startx + ix * size
+    gridy = starty + iy * size
+    return img.crop((gridx, gridy, gridx + size, gridy + size))
+def __flip(img, flip):
+    if flip:
+        return img.transpose(Image.FLIP_LEFT_RIGHT)
+    return img