update tile
- app.py +2 -1
- sam2edit.py +5 -8
- sam2edit_beauty.py +5 -8
- sam2edit_handsome.py +4 -7
- sam2edit_lora.py +104 -48
app.py
CHANGED

@@ -41,7 +41,8 @@ with gr.Blocks() as demo:
             lora_model_path=lora_model_path, use_blip=True, extra_inpaint=True,
             sam_generator=sam_generator,
             blip_processor=blip_processor,
-            blip_model=blip_model
+            blip_model=blip_model,
+            lora_weight=0.5,
         )
         create_demo_beauty(model.process)
     with gr.TabItem('👨‍🌾Handsome Edit/Generation'):
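For context, lora_weight is threaded through to the multiplier argument of load_lora_weights in sam2edit_lora.py (diff further below), so 0.5 applies the LoRA at half strength. A rough sketch of what such a multiplier does in a conventional LoRA merge (W' = W + multiplier * up @ down); this is a hypothetical helper for illustration, not the repo's loader:

import torch

def merge_lora_layer(base_weight: torch.Tensor,
                     lora_up: torch.Tensor,
                     lora_down: torch.Tensor,
                     multiplier: float = 0.5) -> torch.Tensor:
    """Sketch: merge one LoRA layer into a base weight matrix.

    base_weight: (out, in), lora_up: (out, r), lora_down: (r, in).
    multiplier 0.0 disables the LoRA; 1.0 applies it at full strength.
    """
    delta = lora_up @ lora_down            # low-rank update, shape (out, in)
    return base_weight + multiplier * delta

# Toy usage: a 0.5 multiplier applies half of the LoRA update.
W = torch.zeros(4, 4)
up, down = torch.randn(4, 2), torch.randn(2, 4)
W_half = merge_lora_layer(W, up, down, multiplier=0.5)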
sam2edit.py
CHANGED

@@ -16,7 +16,7 @@ def create_demo(process):
     with block as demo:
         with gr.Row():
             gr.Markdown(
-                "##
+                "## EditAnything https://github.com/sail-sg/EditAnything ")
         with gr.Row():
             with gr.Column():
                 source_image = gr.Image(

@@ -38,12 +38,9 @@ def create_demo(process):
                     label="Images", minimum=1, maximum=12, value=2, step=1)
                 seed = gr.Slider(label="Seed", minimum=-1,
                                  maximum=2147483647, step=1, randomize=True)
+                enable_tile = gr.Checkbox(
+                    label='Tile refinement for high resolution generation.', value=True)
                 with gr.Accordion("Advanced options", open=False):
-                    condition_model = gr.Dropdown(choices=list(config_dict.keys()),
-                                                  value=list(
-                                                      config_dict.keys())[1],
-                                                  label='Model',
-                                                  multiselect=False)
                     mask_image = gr.Image(
                         source='upload', label="(Optional) Upload a predefined mask of edit region if you do not want to write your prompt.", type="numpy", value=None)
                     image_resolution = gr.Slider(

@@ -63,8 +60,8 @@ def create_demo(process):
             result_gallery = gr.Gallery(
                 label='Output', show_label=False, elem_id="gallery").style(grid=2, height='auto')
             result_text = gr.Text(label='BLIP2+Human Prompt Text')
-        ips = [source_image, enable_all_generate, mask_image, control_scale, condition_model, enable_auto_prompt, prompt, a_prompt, n_prompt, num_samples, image_resolution,
-               detect_resolution, ddim_steps, guess_mode, strength, scale, seed, eta]
+        ips = [source_image, enable_all_generate, mask_image, control_scale, enable_auto_prompt, prompt, a_prompt, n_prompt, num_samples, image_resolution,
+               detect_resolution, ddim_steps, guess_mode, strength, scale, seed, eta, enable_tile]
        run_button.click(fn=process, inputs=ips, outputs=[
            result_gallery, result_text])
        # with gr.Row():
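Note that ips is positional: Gradio passes the component values to fn in list order, so the enable_tile entry appended to ips must line up with the new trailing enable_tile=True parameter of process (see the sam2edit_lora.py diff below). A minimal standalone sketch of the same wiring pattern, with hypothetical component names:

import gradio as gr

def process(prompt, enable_tile=True):
    # Values arrive in the same order as the `inputs` list below.
    return f"prompt={prompt!r}, tile refinement={'on' if enable_tile else 'off'}"

with gr.Blocks() as demo:
    prompt = gr.Textbox(label="Prompt")
    enable_tile = gr.Checkbox(
        label='Tile refinement for high resolution generation.', value=True)
    out = gr.Text(label="Result")
    run = gr.Button("Run")
    ips = [prompt, enable_tile]   # order must match process()'s signature
    run.click(fn=process, inputs=ips, outputs=out)

# demo.launch()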
sam2edit_beauty.py
CHANGED

@@ -49,12 +49,9 @@ def create_demo(process):
                     label="Images", minimum=1, maximum=12, value=2, step=1)
                 seed = gr.Slider(label="Seed", minimum=-1,
                                  maximum=2147483647, step=1, randomize=True)
+                enable_tile = gr.Checkbox(
+                    label='Tile refinement for high resolution generation.', value=True)
                 with gr.Accordion("Advanced options", open=False):
-                    condition_model = gr.Dropdown(choices=list(config_dict.keys()),
-                                                  value=list(
-                                                      config_dict.keys())[0],
-                                                  label='Model',
-                                                  multiselect=False)
                     mask_image = gr.Image(
                         source='upload', label="(Optional) Upload a predefined mask of edit region if you do not want to write your prompt.", type="numpy", value=None)
                     image_resolution = gr.Slider(

@@ -74,8 +71,8 @@ def create_demo(process):
             result_gallery = gr.Gallery(
                 label='Output', show_label=False, elem_id="gallery").style(grid=2, height='auto')
             result_text = gr.Text(label='BLIP2+Human Prompt Text')
-        ips = [source_image, enable_all_generate, mask_image, control_scale, condition_model, enable_auto_prompt, prompt, a_prompt, n_prompt, num_samples, image_resolution,
-               detect_resolution, ddim_steps, guess_mode, strength, scale, seed, eta]
+        ips = [source_image, enable_all_generate, mask_image, control_scale, enable_auto_prompt, prompt, a_prompt, n_prompt, num_samples, image_resolution,
+               detect_resolution, ddim_steps, guess_mode, strength, scale, seed, eta, enable_tile]
        run_button.click(fn=process, inputs=ips, outputs=[
            result_gallery, result_text])
        with gr.Row():

@@ -90,6 +87,6 @@ def create_demo(process):
 
 if __name__ == '__main__':
     model = EditAnythingLoraModel(base_model_path='../chilloutmix_NiPrunedFp32Fix',
-                                  lora_model_path='../40806/mix4', use_blip=True)
+                                  lora_model_path='../40806/mix4', use_blip=True, lora_weight=0.5)
     demo = create_demo(model.process)
     demo.queue().launch(server_name='0.0.0.0')
sam2edit_handsome.py
CHANGED

@@ -43,12 +43,9 @@ def create_demo(process):
                     label="Images", minimum=1, maximum=12, value=2, step=1)
                 seed = gr.Slider(label="Seed", minimum=-1,
                                  maximum=2147483647, step=1, randomize=True)
+                enable_tile = gr.Checkbox(
+                    label='Tile refinement for high resolution generation.', value=True)
                 with gr.Accordion("Advanced options", open=False):
-                    condition_model = gr.Dropdown(choices=list(config_dict.keys()),
-                                                  value=list(
-                                                      config_dict.keys())[0],
-                                                  label='Model',
-                                                  multiselect=False)
                     mask_image = gr.Image(
                         source='upload', label="(Optional) Upload a predefined mask of edit region if you do not want to write your prompt.", type="numpy", value=None)
                     image_resolution = gr.Slider(

@@ -68,8 +65,8 @@ def create_demo(process):
             result_gallery = gr.Gallery(
                 label='Output', show_label=False, elem_id="gallery").style(grid=2, height='auto')
             result_text = gr.Text(label='BLIP2+Human Prompt Text')
-        ips = [source_image, enable_all_generate, mask_image, control_scale, condition_model, enable_auto_prompt, prompt, a_prompt, n_prompt, num_samples, image_resolution,
-               detect_resolution, ddim_steps, guess_mode, strength, scale, seed, eta]
+        ips = [source_image, enable_all_generate, mask_image, control_scale, enable_auto_prompt, prompt, a_prompt, n_prompt, num_samples, image_resolution,
+               detect_resolution, ddim_steps, guess_mode, strength, scale, seed, eta, enable_tile]
        run_button.click(fn=process, inputs=ips, outputs=[
            result_gallery, result_text])
        with gr.Row():
sam2edit_lora.py
CHANGED

@@ -26,6 +26,8 @@ from utils.stable_diffusion_controlnet_inpaint import StableDiffusionControlNetInpaintPipeline
 # need the latest transformers
 # pip install git+https://github.com/huggingface/transformers.git
 from transformers import AutoProcessor, Blip2ForConditionalGeneration
+from diffusers import ControlNetModel, DiffusionPipeline
+import PIL.Image
 
 # Segment-Anything init.
 # pip install git+https://github.com/facebookresearch/segment-anything.git

@@ -110,6 +112,7 @@ def get_pipeline_embeds(pipeline, prompt, negative_prompt, device):
     return torch.cat(concat_embeds, dim=1), torch.cat(neg_embeds, dim=1)
 
 
+
 def load_lora_weights(pipeline, checkpoint_path, multiplier, device, dtype):
     LORA_PREFIX_UNET = "lora_unet"
     LORA_PREFIX_TEXT_ENCODER = "lora_te"

@@ -238,34 +241,51 @@ def make_inpaint_condition(image, image_mask):
     image = torch.from_numpy(image)
     return image
 
 
-def obtain_generation_model(base_model_path, lora_model_path, controlnet_path, generation_only=False, extra_inpaint=True):
-    if generation_only and extra_inpaint:
-        controlnet = ControlNetModel.from_pretrained(
-            controlnet_path, torch_dtype=torch.float16)
+def obtain_generation_model(base_model_path, lora_model_path, controlnet_path, generation_only=False, extra_inpaint=True, lora_weight=1.0):
+    controlnet = []
+    controlnet.append(ControlNetModel.from_pretrained(
+        controlnet_path, torch_dtype=torch.float16))  # sam control
+    if (not generation_only) and extra_inpaint:  # inpainting control
+        print("Warning: ControlNet based inpainting model only support SD1.5 for now.")
+        controlnet.append(
+            ControlNetModel.from_pretrained(
+                'lllyasviel/control_v11p_sd15_inpaint', torch_dtype=torch.float16)  # inpainting controlnet
+        )
+
+    if generation_only:
         pipe = StableDiffusionControlNetPipeline.from_pretrained(
             base_model_path, controlnet=controlnet, torch_dtype=torch.float16, safety_checker=None
         )
-    elif extra_inpaint:
-        print("Warning: ControlNet based inpainting model only support SD1.5 for now.")
-        controlnet = [
-            ControlNetModel.from_pretrained(
-                controlnet_path, torch_dtype=torch.float16),
-            ControlNetModel.from_pretrained(
-                'lllyasviel/control_v11p_sd15_inpaint', torch_dtype=torch.float16),  # inpainting controlnet
-        ]
+    else:
         pipe = StableDiffusionControlNetInpaintPipeline.from_pretrained(
             base_model_path, controlnet=controlnet, torch_dtype=torch.float16, safety_checker=None
         )
-    else:
-        controlnet = ControlNetModel.from_pretrained(
-            controlnet_path, torch_dtype=torch.float16)
-        pipe = StableDiffusionControlNetInpaintPipeline.from_pretrained(
-            base_model_path, controlnet=controlnet, torch_dtype=torch.float16, safety_checker=None
-        )
+    if lora_model_path is not None:
+        pipe = load_lora_weights(
+            pipe, [lora_model_path], lora_weight, 'cpu', torch.float32)
+    # speed up diffusion process with faster scheduler and memory optimization
+    pipe.scheduler = UniPCMultistepScheduler.from_config(
+        pipe.scheduler.config)
+    # remove following line if xformers is not installed
+    pipe.enable_xformers_memory_efficient_attention()
+
+    pipe.enable_model_cpu_offload()
+    return pipe
+
+
+def obtain_tile_model(base_model_path, lora_model_path, lora_weight=1.0):
+    controlnet = ControlNetModel.from_pretrained(
+        'lllyasviel/control_v11f1e_sd15_tile', torch_dtype=torch.float16)  # tile controlnet
+    if base_model_path == 'runwayml/stable-diffusion-v1-5' or base_model_path == 'stabilityai/stable-diffusion-2-inpainting':
+        print("base_model_path", base_model_path)
+        pipe = StableDiffusionControlNetPipeline.from_pretrained(
+            "runwayml/stable-diffusion-v1-5", controlnet=controlnet, torch_dtype=torch.float16, safety_checker=None
+        )
+    else:
+        pipe = StableDiffusionControlNetPipeline.from_pretrained(
+            base_model_path, controlnet=controlnet, torch_dtype=torch.float16, safety_checker=None
+        )
     if lora_model_path is not None:
         pipe = load_lora_weights(
-            pipe, [lora_model_path], 1.0, 'cpu', torch.float32)
+            pipe, [lora_model_path], lora_weight, 'cpu', torch.float32)
     # speed up diffusion process with faster scheduler and memory optimization
     pipe.scheduler = UniPCMultistepScheduler.from_config(
         pipe.scheduler.config)

@@ -276,6 +296,7 @@ def obtain_generation_model(base_model_path, lora_model_path, controlnet_path, generation_only=False, extra_inpaint=True):
     return pipe
 
 
+
 def show_anns(anns):
     if len(anns) == 0:
         return
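A note on the rewritten obtain_generation_model: building controlnet as a list (the SAM control first, optionally the inpainting control) uses diffusers' multi-ControlNet convention, where a list of ControlNetModel instances means the pipeline call expects a matching list of conditioning images and, optionally, a list of per-control scales. A minimal sketch of that convention, assuming the public checkpoints named in the diff; sam_controlnet_path is a placeholder for the repo's config_dict entry:

import torch
from diffusers import ControlNetModel, StableDiffusionControlNetPipeline

sam_controlnet_path = "..."  # placeholder for the repo's controlnet_path

# Two controls -> pipeline calls take same-length lists of images/scales.
controlnet = [
    ControlNetModel.from_pretrained(
        sam_controlnet_path, torch_dtype=torch.float16),
    ControlNetModel.from_pretrained(
        "lllyasviel/control_v11p_sd15_inpaint", torch_dtype=torch.float16),
]
pipe = StableDiffusionControlNetPipeline.from_pretrained(
    "runwayml/stable-diffusion-v1-5",
    controlnet=controlnet, torch_dtype=torch.float16, safety_checker=None)

# images = [sam_condition, inpaint_condition]   # one image per control
# out = pipe(prompt, image=images,
#            controlnet_conditioning_scale=[1.0, 1.0]).images[0]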
@@ -310,8 +331,9 @@ class EditAnythingLoraModel:
                  blip_model=None,
                  sam_generator=None,
                  controlmodel_name='LAION Pretrained(v0-4)-SD15',
-                 # used when the base model is not an inpainting model.
-                 extra_inpaint=True,
+                 extra_inpaint=True,  # used when the base model is not an inpainting model.
+                 tile_model=None,
+                 lora_weight=1.0,
                  ):
         self.device = device
         self.use_blip = use_blip

@@ -323,7 +345,7 @@ class EditAnythingLoraModel:
         self.defalut_enable_all_generate = False
         self.extra_inpaint = extra_inpaint
         self.pipe = obtain_generation_model(
-            base_model_path, lora_model_path, self.default_controlnet_path, generation_only=False, extra_inpaint=extra_inpaint)
+            base_model_path, lora_model_path, self.default_controlnet_path, generation_only=False, extra_inpaint=extra_inpaint, lora_weight=lora_weight)
 
         # Segment-Anything init.
         if sam_generator is not None:

@@ -343,6 +365,12 @@ class EditAnythingLoraModel:
         else:
             self.blip_model = init_blip_model()
 
+        # tile model init.
+        if tile_model is not None:
+            self.tile_pipe = tile_model
+        else:
+            self.tile_pipe = obtain_tile_model(base_model_path, lora_model_path, lora_weight=lora_weight)
+
     def get_blip2_text(self, image):
         inputs = self.blip_processor(image, return_tensors="pt").to(
             self.device, torch.float16)
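Since tile_model can now be injected, one tile pipeline can presumably be shared by several EditAnythingLoraModel instances, the same way app.py already shares sam_generator and the BLIP modules across tabs. A hedged sketch of that reuse, with the paths copied from the sam2edit_beauty.py __main__ example above:

from sam2edit_lora import EditAnythingLoraModel, obtain_tile_model

# Build the tile ControlNet pipeline once...
tile_pipe = obtain_tile_model(
    base_model_path='../chilloutmix_NiPrunedFp32Fix',
    lora_model_path='../40806/mix4', lora_weight=0.5)

# ...then hand the same object to every demo tab instead of letting
# each constructor load its own copy of control_v11f1e_sd15_tile.
beauty = EditAnythingLoraModel(
    base_model_path='../chilloutmix_NiPrunedFp32Fix',
    lora_model_path='../40806/mix4', use_blip=True,
    lora_weight=0.5, tile_model=tile_pipe)
handsome = EditAnythingLoraModel(
    base_model_path='../chilloutmix_NiPrunedFp32Fix',
    lora_model_path='../40806/mix4', use_blip=True,
    lora_weight=0.5, tile_model=tile_pipe)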
@@ -357,13 +385,23 @@ class EditAnythingLoraModel:
         return full_img, res
 
     @torch.inference_mode()
-    def process(self, source_image, enable_all_generate, mask_image, control_scale, condition_model, enable_auto_prompt, prompt, a_prompt, n_prompt,
-                num_samples, image_resolution, detect_resolution, ddim_steps, guess_mode, strength, scale, seed, eta):
+    def process(self, source_image, enable_all_generate, mask_image,
+                control_scale,
+                enable_auto_prompt, prompt, a_prompt, n_prompt,
+                num_samples, image_resolution, detect_resolution,
+                ddim_steps, guess_mode, strength, scale, seed, eta,
+                enable_tile=True, condition_model=None):
+
+        if condition_model is None:
+            this_controlnet_path = self.default_controlnet_path
+        else:
+            this_controlnet_path = config_dict[condition_model]
         input_image = source_image["image"]
         if mask_image is None:
             if enable_all_generate != self.defalut_enable_all_generate:
                 self.pipe = obtain_generation_model(
-                    self.base_model_path, self.lora_model_path, config_dict[condition_model], enable_all_generate, self.extra_inpaint)
+                    self.base_model_path, self.lora_model_path, this_controlnet_path, enable_all_generate, self.extra_inpaint)
+
                 self.defalut_enable_all_generate = enable_all_generate
             if enable_all_generate:
                 print("source_image",

@@ -372,13 +410,13 @@ class EditAnythingLoraModel:
                     (input_image.shape[0], input_image.shape[1], 3))*255
         else:
             mask_image = source_image["mask"]
-        if self.default_controlnet_path != config_dict[condition_model]:
-            print("To Use:", config_dict[condition_model],
+        if self.default_controlnet_path != this_controlnet_path:
+            print("To Use:", this_controlnet_path,
                   "Current:", self.default_controlnet_path)
-            print("Change condition model to:", config_dict[condition_model])
+            print("Change condition model to:", this_controlnet_path)
             self.pipe = obtain_generation_model(
-                self.base_model_path, self.lora_model_path, config_dict[condition_model], enable_all_generate, self.extra_inpaint)
-            self.default_controlnet_path = config_dict[condition_model]
+                self.base_model_path, self.lora_model_path, this_controlnet_path, enable_all_generate, self.extra_inpaint)
+            self.default_controlnet_path = this_controlnet_path
         torch.cuda.empty_cache()
 
         with torch.no_grad():

@@ -411,11 +449,9 @@ class EditAnythingLoraModel:
         control = einops.rearrange(control, 'b h w c -> b c h w').clone()
 
         mask_image = HWC3(mask_image.astype(np.uint8))
-        mask_image = cv2.resize(
+        mask_image_tmp = cv2.resize(
             mask_image, (W, H), interpolation=cv2.INTER_LINEAR)
-        if self.extra_inpaint:
-            inpaint_image = make_inpaint_condition(img, mask_image)
-        mask_image = Image.fromarray(mask_image)
+        mask_image = Image.fromarray(mask_image_tmp)
 
         if seed == -1:
             seed = random.randint(0, 65535)

@@ -429,7 +465,6 @@ class EditAnythingLoraModel:
             negative_prompt_embeds = torch.cat(
                 [negative_prompt_embeds] * num_samples, dim=0)
             if enable_all_generate and self.extra_inpaint:
-                print(control.shape, control_scale)
                 self.pipe.safety_checker = lambda images, clip_input: (
                     images, False)
                 x_samples = self.pipe(

@@ -439,10 +474,19 @@ class EditAnythingLoraModel:
                     generator=generator,
                     height=H,
                     width=W,
-                    image=control.type(torch.float16),
-                    controlnet_conditioning_scale=float(control_scale),
+                    image=[control.type(torch.float16)],
+                    controlnet_conditioning_scale=[float(control_scale)],
                 ).images
-            elif self.extra_inpaint:
+            else:
+                multi_condition_image = []
+                multi_condition_scale = []
+                multi_condition_image.append(control.type(torch.float16))
+                multi_condition_scale.append(float(control_scale))
+                if self.extra_inpaint:
+                    inpaint_image = make_inpaint_condition(img, mask_image_tmp)
+                    print(inpaint_image.shape)
+                    multi_condition_image.append(inpaint_image.type(torch.float16))
+                    multi_condition_scale.append(1.0)
                 x_samples = self.pipe(
                     image=img,
                     mask_image=mask_image,

@@ -450,27 +494,39 @@ class EditAnythingLoraModel:
                     num_images_per_prompt=num_samples,
                     num_inference_steps=ddim_steps,
                     generator=generator,
-                    controlnet_conditioning_image=[control.type(
-                        torch.float16), inpaint_image.type(torch.float16)],
+                    controlnet_conditioning_image=multi_condition_image,
                     height=H,
                     width=W,
-                    controlnet_conditioning_scale=[float(control_scale), 1.0],
+                    controlnet_conditioning_scale=multi_condition_scale,
                 ).images
-            else:
-                x_samples = self.pipe(
-                    image=img,
-                    mask_image=mask_image,
-                    prompt_embeds=prompt_embeds, negative_prompt_embeds=negative_prompt_embeds,
-                    num_images_per_prompt=num_samples,
-                    num_inference_steps=ddim_steps,
-                    generator=generator,
-                    controlnet_conditioning_image=control.type(torch.float16),
-                    height=H,
-                    width=W,
-                    controlnet_conditioning_scale=float(control_scale),
-                ).images
-
-            results = [x_samples[i] for i in range(num_samples)]
+            results = [x_samples[i] for i in range(num_samples)]
+
+            if True:
+                img_tile = [PIL.Image.fromarray(resize_image(np.array(x_samples[i]), 1024)) for i in range(num_samples)]
+                # for each in img_tile:
+                #     print("tile", each.size)
+                prompt_embeds, negative_prompt_embeds = get_pipeline_embeds(
+                    self.tile_pipe, postive_prompt, negative_prompt, "cuda")
+                prompt_embeds = torch.cat([prompt_embeds] * num_samples, dim=0)
+                negative_prompt_embeds = torch.cat(
+                    [negative_prompt_embeds] * num_samples, dim=0)
+                x_samples_tile = self.tile_pipe(
+                    prompt_embeds=prompt_embeds, negative_prompt_embeds=negative_prompt_embeds,
+                    num_images_per_prompt=num_samples,
+                    num_inference_steps=ddim_steps,
+                    generator=generator,
+                    height=img_tile[0].size[1],
+                    width=img_tile[0].size[0],
+                    image=img_tile,
+                    controlnet_conditioning_scale=1.0,
+                ).images
+
+                results_tile = [x_samples_tile[i] for i in range(num_samples)]
+                results = results_tile + results
+
             return [full_segmask, mask_image] + results, prompt
 
 def download_image(url):
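For reference, the make_inpaint_condition helper whose tail appears in the hunk above follows the convention of the diffusers ControlNet-inpaint examples: masked pixels are set to -1.0 so the inpainting ControlNet can tell them apart from valid image content. A sketch of that conventional implementation (the repo's actual version may differ in input handling):

import numpy as np
import torch

def make_inpaint_condition_sketch(image: np.ndarray,
                                  image_mask: np.ndarray) -> torch.Tensor:
    """image: HxWx3 uint8; image_mask: HxW (or HxWx3) uint8.

    Returns a 1x3xHxW float tensor with masked pixels marked as -1.0.
    """
    image = image.astype(np.float32) / 255.0
    mask = image_mask.astype(np.float32) / 255.0
    if mask.ndim == 3:
        mask = mask[..., 0]
    image[mask > 0.5] = -1.0            # mark masked pixels for the controlnet
    image = np.expand_dims(image, 0).transpose(0, 3, 1, 2)  # NHWC -> NCHW
    return torch.from_numpy(image)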
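The new tile stage in process upscales each first-pass sample to the 1024-pixel range (via resize_image), then runs it back through the tile ControlNet with the same prompt embeddings, so the second pass adds detail at high resolution rather than re-composing the image. A standalone sketch of the same two-stage idea, assuming only the public checkpoints named in the diff and a generic resize in place of the repo's resize_image:

import torch
import PIL.Image
from diffusers import (ControlNetModel, StableDiffusionControlNetPipeline,
                       UniPCMultistepScheduler)

tile_controlnet = ControlNetModel.from_pretrained(
    "lllyasviel/control_v11f1e_sd15_tile", torch_dtype=torch.float16)
tile_pipe = StableDiffusionControlNetPipeline.from_pretrained(
    "runwayml/stable-diffusion-v1-5",
    controlnet=tile_controlnet, torch_dtype=torch.float16, safety_checker=None)
tile_pipe.scheduler = UniPCMultistepScheduler.from_config(
    tile_pipe.scheduler.config)
tile_pipe.enable_model_cpu_offload()

def refine(sample: PIL.Image.Image, prompt: str,
           target: int = 1024) -> PIL.Image.Image:
    """Upscale a first-pass sample, then let the tile ControlNet re-detail it."""
    scale = target / max(sample.size)
    # Stable Diffusion expects sizes divisible by 8.
    hi = sample.resize((round(sample.width * scale) // 8 * 8,
                        round(sample.height * scale) // 8 * 8))
    return tile_pipe(prompt, image=hi,
                     height=hi.height, width=hi.width,
                     num_inference_steps=20,
                     controlnet_conditioning_scale=1.0).images[0]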