tokenflow

Runtime error

App Files Files Community

cocktailpeanut committed on Sep 4, 2023

Commit

ad2d8cc

1 Parent(s): 7a86a0a

update

Browse files

Files changed (3) hide show

app.py +9 -3
preprocess_utils.py +4 -48
tokenflow_pnp.py +2 -2

app.py CHANGED Viewed

@@ -7,7 +7,13 @@ from tokenflow_pnp import TokenFlow
 from preprocess_utils import *
 from tokenflow_utils import *
 # load sd model
-device = torch.device("cuda" if torch.cuda.is_available() else "cpu")
 model_id = "stabilityai/stable-diffusion-2-1-base"
 # components for the Preprocessor
@@ -21,7 +27,7 @@ unet = UNet2DConditionModel.from_pretrained(model_id, subfolder="unet", revision
                                            torch_dtype=torch.float16).to(device)
 # pipe for TokenFlow
-tokenflow_pipe = StableDiffusionPipeline.from_pretrained(model_id, torch_dtype=torch.float16).to("cuda")
 tokenflow_pipe.enable_xformers_memory_efficient_attention()
 def randomize_seed_fn():
@@ -371,4 +377,4 @@ with gr.Blocks(css="style.css") as demo:
     )
 demo.queue()
-demo.launch()

 from preprocess_utils import *
 from tokenflow_utils import *
 # load sd model
+#device = torch.device("cuda" if torch.cuda.is_available() else "cpu")
+if torch.cuda.is_available():
+    device = "cuda"
+elif torch.backends.mps.is_available():
+    device = "mps"
+else:
+    device = "cpu"
 model_id = "stabilityai/stable-diffusion-2-1-base"
 # components for the Preprocessor
                                            torch_dtype=torch.float16).to(device)
 # pipe for TokenFlow
+tokenflow_pipe = StableDiffusionPipeline.from_pretrained(model_id, torch_dtype=torch.float16).to(device)
 tokenflow_pipe.enable_xformers_memory_efficient_attention()
 def randomize_seed_fn():
     )
 demo.queue()
+demo.launch()

preprocess_utils.py CHANGED Viewed

@@ -92,7 +92,7 @@ class Preprocess(nn.Module):
     def prepare_depth_maps(self, model_type='DPT_Large', device='cuda'):
         depth_maps = []
         midas = torch.hub.load("intel-isl/MiDaS", model_type)
-        midas.to(device)
         midas.eval()
         midas_transforms = torch.hub.load("intel-isl/MiDaS", "transforms")
@@ -109,7 +109,7 @@ class Preprocess(nn.Module):
             latent_h = img.shape[0] // 8
             latent_w = img.shape[1] // 8
-            input_batch = transform(img).to(device)
             prediction = midas(input_batch)
             depth_map = torch.nn.functional.interpolate(
@@ -167,10 +167,10 @@ class Preprocess(nn.Module):
     def get_text_embeds(self, prompt, negative_prompt, device="cuda"):
         text_input = self.tokenizer(prompt, padding='max_length', max_length=self.tokenizer.model_max_length,
                                     truncation=True, return_tensors='pt')
-        text_embeddings = self.text_encoder(text_input.input_ids.to(device))[0]
         uncond_input = self.tokenizer(negative_prompt, padding='max_length', max_length=self.tokenizer.model_max_length,
                                       return_tensors='pt')
-        uncond_embeddings = self.text_encoder(uncond_input.input_ids.to(device))[0]
         text_embeddings = torch.cat([uncond_embeddings, text_embeddings])
         return text_embeddings
@@ -329,47 +329,3 @@ class Preprocess(nn.Module):
         return self.frames, self.latents, self.total_inverted_latents, None
-def prep(opt):
-    # timesteps to save
-    if opt["sd_version"] == '2.1':
-        model_key = "stabilityai/stable-diffusion-2-1-base"
-    elif opt["sd_version"] == '2.0':
-        model_key = "stabilityai/stable-diffusion-2-base"
-    elif opt["sd_version"] == '1.5' or opt["sd_version"] == 'ControlNet':
-        model_key = "runwayml/stable-diffusion-v1-5"
-    elif opt["sd_version"] == 'depth':
-        model_key = "stabilityai/stable-diffusion-2-depth"
-    toy_scheduler = DDIMScheduler.from_pretrained(model_key, subfolder="scheduler")
-    toy_scheduler.set_timesteps(opt["save_steps"])
-    timesteps_to_save, num_inference_steps = get_timesteps(toy_scheduler, num_inference_steps=opt["save_steps"],
-                                                           strength=1.0,
-                                                           device=device)
-    seed_everything(opt["seed"])
-    if not opt["frames"]: # original non demo setting
-        save_path = os.path.join(opt["save_dir"],
-                                 f'sd_{opt["sd_version"]}',
-                                 Path(opt["data_path"]).stem,
-                                 f'steps_{opt["steps"]}',
-                                 f'nframes_{opt["n_frames"]}')
-        os.makedirs(os.path.join(save_path, f'latents'), exist_ok=True)
-        add_dict_to_yaml_file(os.path.join(opt["save_dir"], 'inversion_prompts.yaml'), Path(opt["data_path"]).stem, opt["inversion_prompt"])
-        # save inversion prompt in a txt file
-        with open(os.path.join(save_path, 'inversion_prompt.txt'), 'w') as f:
-            f.write(opt["inversion_prompt"])
-    else:
-        save_path = None
-    model = Preprocess(device, opt)
-    frames, latents, total_inverted_latents, rgb_reconstruction = model.extract_latents(
-                                         num_steps=model.config["steps"],
-                                         save_path=save_path,
-                                         batch_size=model.config["batch_size"],
-                                         timesteps_to_save=timesteps_to_save,
-                                         inversion_prompt=model.config["inversion_prompt"],
-    )
-    return frames, latents, total_inverted_latents, rgb_reconstruction

     def prepare_depth_maps(self, model_type='DPT_Large', device='cuda'):
         depth_maps = []
         midas = torch.hub.load("intel-isl/MiDaS", model_type)
+        midas.to(self.device)
         midas.eval()
         midas_transforms = torch.hub.load("intel-isl/MiDaS", "transforms")
             latent_h = img.shape[0] // 8
             latent_w = img.shape[1] // 8
+            input_batch = transform(img).to(self.device)
             prediction = midas(input_batch)
             depth_map = torch.nn.functional.interpolate(
     def get_text_embeds(self, prompt, negative_prompt, device="cuda"):
         text_input = self.tokenizer(prompt, padding='max_length', max_length=self.tokenizer.model_max_length,
                                     truncation=True, return_tensors='pt')
+        text_embeddings = self.text_encoder(text_input.input_ids.to(self.device))[0]
         uncond_input = self.tokenizer(negative_prompt, padding='max_length', max_length=self.tokenizer.model_max_length,
                                       return_tensors='pt')
+        uncond_embeddings = self.text_encoder(uncond_input.input_ids.to(self.device))[0]
         text_embeddings = torch.cat([uncond_embeddings, text_embeddings])
         return text_embeddings
         return self.frames, self.latents, self.total_inverted_latents, None

tokenflow_pnp.py CHANGED Viewed

@@ -78,7 +78,7 @@ class TokenFlow(nn.Module):
     def prepare_depth_maps(self, model_type='DPT_Large', device='cuda'):
         depth_maps = []
         midas = torch.hub.load("intel-isl/MiDaS", model_type)
-        midas.to(device)
         midas.eval()
         midas_transforms = torch.hub.load("intel-isl/MiDaS", "transforms")
@@ -95,7 +95,7 @@ class TokenFlow(nn.Module):
             latent_h = img.shape[0] // 8
             latent_w = img.shape[1] // 8
-            input_batch = transform(img).to(device)
             prediction = midas(input_batch)
             depth_map = torch.nn.functional.interpolate(

     def prepare_depth_maps(self, model_type='DPT_Large', device='cuda'):
         depth_maps = []
         midas = torch.hub.load("intel-isl/MiDaS", model_type)
+        midas.to(self.device)
         midas.eval()
         midas_transforms = torch.hub.load("intel-isl/MiDaS", "transforms")
             latent_h = img.shape[0] // 8
             latent_w = img.shape[1] // 8
+            input_batch = transform(img).to(self.device)
             prediction = midas(input_batch)
             depth_map = torch.nn.functional.interpolate(