Spaces:

ellemac
/

avantGAN

Build error

App Files Files Community

Elle McFarlane committed on Jun 25, 2024

Commit

19ec9f5

1 Parent(s): 48c898d

update to multi-model selection

Browse files

Files changed (3) hide show

app.py +59 -127
model.py +211 -0
requirements.txt +1 -1

app.py CHANGED Viewed

@@ -1,146 +1,78 @@
 import gradio as gr
 import numpy as np
-import random
-from diffusers import DiffusionPipeline
-import torch
-device = "cuda" if torch.cuda.is_available() else "cpu"
-if torch.cuda.is_available():
-    torch.cuda.max_memory_allocated(device=device)
-    pipe = DiffusionPipeline.from_pretrained("stabilityai/sdxl-turbo", torch_dtype=torch.float16, variant="fp16", use_safetensors=True)
-    pipe.enable_xformers_memory_efficient_attention()
-    pipe = pipe.to(device)
-else:
-    pipe = DiffusionPipeline.from_pretrained("stabilityai/sdxl-turbo", use_safetensors=True)
-    pipe = pipe.to(device)
-MAX_SEED = np.iinfo(np.int32).max
-MAX_IMAGE_SIZE = 1024
-def infer(prompt, negative_prompt, seed, randomize_seed, width, height, guidance_scale, num_inference_steps):
-    if randomize_seed:
-        seed = random.randint(0, MAX_SEED)
-    generator = torch.Generator().manual_seed(seed)
-    image = pipe(
-        prompt = prompt,
-        negative_prompt = negative_prompt,
-        guidance_scale = guidance_scale,
-        num_inference_steps = num_inference_steps,
-        width = width,
-        height = height,
-        generator = generator
-    ).images[0]
-    return image
-examples = [
-    "Astronaut in a jungle, cold color palette, muted colors, detailed, 8k",
-    "An astronaut riding a green horse",
-    "A delicious ceviche cheesecake slice",
-]
-css="""
-#col-container {
-    margin: 0 auto;
-    max-width: 520px;
-}
-"""
-if torch.cuda.is_available():
-    power_device = "GPU"
-else:
-    power_device = "CPU"
-with gr.Blocks(css=css) as demo:
-    with gr.Column(elem_id="col-container"):
-        gr.Markdown(f"""
-        # Text-to-Image Gradio Template
-        Currently running on {power_device}.
-        """)
-        with gr.Row():
-            prompt = gr.Text(
-                label="Prompt",
-                show_label=False,
-                max_lines=1,
-                placeholder="Enter your prompt",
-                container=False,
-            )
-            run_button = gr.Button("Run", scale=0)
-        result = gr.Image(label="Result", show_label=False)
-        with gr.Accordion("Advanced Settings", open=False):
-            negative_prompt = gr.Text(
-                label="Negative prompt",
-                max_lines=1,
-                placeholder="Enter a negative prompt",
-                visible=False,
-            )
-            seed = gr.Slider(
-                label="Seed",
-                minimum=0,
-                maximum=MAX_SEED,
-                step=1,
-                value=0,
-            )
-            randomize_seed = gr.Checkbox(label="Randomize seed", value=True)
             with gr.Row():
-                width = gr.Slider(
-                    label="Width",
-                    minimum=256,
-                    maximum=MAX_IMAGE_SIZE,
-                    step=32,
-                    value=512,
-                )
-                height = gr.Slider(
-                    label="Height",
-                    minimum=256,
-                    maximum=MAX_IMAGE_SIZE,
-                    step=32,
-                    value=512,
-                )
             with gr.Row():
-                guidance_scale = gr.Slider(
-                    label="Guidance scale",
-                    minimum=0.0,
-                    maximum=10.0,
-                    step=0.1,
-                    value=0.0,
-                )
-                num_inference_steps = gr.Slider(
-                    label="Number of inference steps",
-                    minimum=1,
-                    maximum=12,
-                    step=1,
-                    value=2,
                 )
-        gr.Examples(
-            examples = examples,
-            inputs = [prompt]
-        )
     run_button.click(
-        fn = infer,
-        inputs = [prompt, negative_prompt, seed, randomize_seed, width, height, guidance_scale, num_inference_steps],
-        outputs = [result]
     )
-demo.queue().launch()

+#!/usr/bin/env python
+from __future__ import annotations
 import gradio as gr
 import numpy as np
+from model import Model
+# Markdown heading rendered at the top of the page by gr.Markdown(DESCRIPTION) below.
+DESCRIPTION = "# [AvantGAN](https://github.com/ellemcfarlane/AvantGAN)"
+def get_sample_image_url(name: str) -> str:
+    sample_image_dir = "https://huggingface.co/spaces/ellemac/avantGAN/resolve/main/samples"
+    return f"{sample_image_dir}/{name}.png"
+def get_sample_image_markdown(name: str) -> str:
+    url = get_sample_image_url(name)
+    size = 128 if ("stylegan3" in name or "original" in name) else 64
+    return f"""
+    - size: {size}x{size}
+    ![sample images]({url})"""
+# Single shared model wrapper, created at import time; the "Run" click handler below calls into it.
+model = Model()
+# UI layout: a page heading followed by two tabs ("App" and "Sample Images").
+with gr.Blocks(css="style.css") as demo:
+    gr.Markdown(DESCRIPTION)
+    with gr.Tabs():
+        # Tab 1: pick a model and a seed on the left, see the generated image on the right.
+        with gr.TabItem("App"):
             with gr.Row():
+                with gr.Column():
+                    # Choices come straight from the checkpoints registered in Model.MODEL_DICT.
+                    model_name = gr.Dropdown(
+                        label="Model", choices=list(model.MODEL_DICT.keys()), value="stylegan3-abstract"
+                    )
+                    seed = gr.Slider(label="Seed", minimum=0, maximum=np.iinfo(np.uint32).max, step=1, value=0)
+                    run_button = gr.Button()
+                with gr.Column():
+                    result = gr.Image(label="Result", elem_id="result", width=300, height=300)
+                    # NOTE(review): looks like a leftover debug print (dumps the component's __dict__
+                    # to stdout while the UI is being built) - confirm it can be removed.
+                    print("RESULT", result, type(result), result.__dict__)
+        # Tab 2: static sample sheets; the list is spelled out here because it also offers
+        # "original-training-data", which is not a key of Model.MODEL_DICT.
+        with gr.TabItem("Sample Images"):
             with gr.Row():
+                model_name2 = gr.Dropdown(
+                    [
+                        "stylegan3-abstract",
+                        "stylegan3-high-fidelity",
+                        "ada-dcgan",
+                        "original-training-data",
+                    ],
+                    value="stylegan3-abstract",
+                    label="Model",
                 )
+            with gr.Row():
+                # Initial Markdown for the dropdown's default value; refreshed by the change handler below.
+                text = get_sample_image_markdown(model_name2.value)
+                sample_images = gr.Markdown(text)
+    # "Run": switch to the selected model if needed and render one image for the chosen seed.
+    # Only model_name and seed are passed, so the handler's other parameters keep their defaults.
     run_button.click(
+        fn=model.set_model_and_generate_image,
+        inputs=[
+            model_name,
+            seed,
+        ],
+        outputs=result,
+        api_name="run",
+    )
+    # Selecting another entry in the "Sample Images" dropdown swaps the displayed sample sheet.
+    model_name2.change(
+        fn=get_sample_image_markdown,
+        inputs=model_name2,
+        outputs=sample_images,
+        queue=False,
+        api_name=False,
     )
+# Launch only when executed as a script; at most 20 requests may wait in the queue.
+if __name__ == "__main__":
+    demo.queue(max_size=20).launch()

model.py ADDED Viewed

	@@ -0,0 +1,211 @@

+# from https://huggingface.co/spaces/hysts/StyleGAN3/blob/main/model.py
+import pathlib
+import pickle
+import sys
+import numpy as np
+import torch
+import torch.nn as nn
+from huggingface_hub import hf_hub_download
+import torch
+import torchvision.utils as vutils
+import matplotlib.pyplot as plt
+from io import BytesIO
+from PIL import Image
+# Put the "stylegan3" directory that sits next to this file at the front of sys.path.
+# NOTE(review): presumably needed so the pickled StyleGAN3 checkpoints can import the
+# modules they reference when unpickled - confirm.
+current_dir = pathlib.Path(__file__).parent
+submodule_dir = current_dir / "stylegan3"
+sys.path.insert(0, submodule_dir.as_posix())
+# Hugging Face Hub account that owns the model repos; combined with a repo name as "<user>/<repo>".
+user = "ellemac"
+# DCGAN configuration. `ngf` and `nc` are read by Generator below (channel-width multiplier
+# and number of output channels). `dcgan_gen_feats` is only referenced from commented-out code
+# in the visible part of this file.
+# NOTE(review): `dcgan_z_dim` / `dcgan_img_size` presumably describe the latent length and
+# the output resolution of the DCGAN generator - confirm against the training config.
+dcgan_z_dim = 100
+dcgan_gen_feats = 64
+ngf = 64
+dcgan_img_size = 64
+nc = 3
+class Generator(nn.Module):
+    def __init__(self, ngpu, nz):
+        super(Generator, self).__init__()
+        self.ngpu = ngpu
+        self.main = nn.Sequential(
+            # input is Z, going into a convolution
+            nn.ConvTranspose2d(     nz, ngf * 8, 4, 1, 0, bias=False),
+            nn.BatchNorm2d(ngf * 8),
+            nn.LeakyReLU(0.2, inplace=True),
+            # state size. (ngf*8) x 4 x 4
+            nn.ConvTranspose2d(ngf * 8, ngf * 4, 4, 2, 1, bias=False),
+            nn.BatchNorm2d(ngf * 4),
+            nn.LeakyReLU(0.2, inplace=True),
+            # state size. (ngf*4) x 8 x 8
+            nn.ConvTranspose2d(ngf * 4, ngf * 2, 4, 2, 1, bias=False),
+            nn.BatchNorm2d(ngf * 2),
+            nn.LeakyReLU(0.2, inplace=True),
+            # state size. (ngf*2) x 16 x 16
+            nn.ConvTranspose2d(ngf * 2,     ngf, 4, 2, 1, bias=False),
+            nn.BatchNorm2d(ngf),
+            nn.LeakyReLU(0.2, inplace=True),
+            # state size. (ngf) x 32 x 32
+            nn.ConvTranspose2d(    ngf,      nc, 4, 2, 1, bias=False),
+            nn.Tanh()
+            # state size. (nc) x 64 x 64
+        )
+    def forward(self, input):
+        return self.main(input)
+# class Generator(nn.Module):
+#     def __init__(self, n_gen_feats, n_gpu, z_dim, n_channels):
+#         super(Generator, self).__init__()
+#         self.n_gpu = n_gpu
+#         self.main = nn.Sequential(
+#             # input is Z, going into a convolution
+#             nn.ConvTranspose2d(z_dim, n_gen_feats * 8, 4, 1, 0, bias=False),
+#             nn.BatchNorm2d(n_gen_feats * 8),
+#             nn.LeakyReLU(0.2, inplace=True),
+#             # state size. (n_gen_feats*8) x 4 x 4
+#             nn.ConvTranspose2d(n_gen_feats * 8, n_gen_feats * 4, 4, 2, 1, bias=False),
+#             nn.BatchNorm2d(n_gen_feats * 4),
+#             nn.LeakyReLU(0.2, inplace=True),
+#             # state size. (n_gen_feats*4) x 8 x 8
+#             nn.ConvTranspose2d(n_gen_feats * 4, n_gen_feats * 2, 4, 2, 1, bias=False),
+#             nn.BatchNorm2d(n_gen_feats * 2),
+#             nn.LeakyReLU(0.2, inplace=True),
+#             # state size. (n_gen_feats*2) x 16 x 16
+#             nn.ConvTranspose2d(n_gen_feats * 2,     n_gen_feats, 4, 2, 1, bias=False),
+#             nn.BatchNorm2d(n_gen_feats),
+#             nn.LeakyReLU(0.2, inplace=True),
+#             # state size. (n_gen_feats) x 32 x 32
+#             nn.ConvTranspose2d(n_gen_feats, n_channels, 4, 2, 1, bias=False),
+#             nn.Tanh()
+#             # state size. (n_channels) x 64 x 64
+#         )
+#     def forward(self, input):
+#         return self.main(input)
+class Model:
+    MODEL_DICT = {
+        "stylegan3-abstract": {"name": "abstract-560eps.pkl", "repo": "avantStyleGAN3"},
+        "stylegan3-high-fidelity": {"name": "high-fidelity-1120eps.pkl", "repo": "avantStyleGAN3"},
+        "ada-dcgan": {"name": "gen_6kepoch.pt", "repo": "avantGAN"},
+    }
+    def __init__(self):
+        self.device = torch.device("cuda:0" if torch.cuda.is_available() else "cpu")
+        self._download_all_models()
+        self.model_name = "ada-dcgan" #stylegan3-abstract"
+        self.model = self._load_model(self.model_name)
+    def _load_model(self, model_name: str) -> nn.Module:
+        file_name = self.MODEL_DICT[model_name]["name"]
+        repo = self.MODEL_DICT[model_name]["repo"]
+        path = hf_hub_download(f"{user}/{repo}", file_name) # model repo-type
+        if "stylegan" in model_name:
+            with open(path, "rb") as f:
+                model = pickle.load(f)["G_ema"]
+        else:
+            # todo (elle): don't hardcode the config
+            # model = Generator(dcgan_gen_feats, 1, dcgan_z_dim, 3)
+            print("WAS HERE")
+            model = Generator(0, 100)
+        model.eval()
+        model.to(self.device)
+        return model
+    def set_model(self, model_name: str) -> None:
+        if model_name == self.model_name:
+            return
+        self.model_name = model_name
+        self.model = self._load_model(model_name)
+    def _download_all_models(self):
+        for name in self.MODEL_DICT.keys():
+            self._load_model(name)
+    @staticmethod
+    def make_transform(translate: tuple[float, float] = (0,0), angle: float = 0) -> np.ndarray:
+        mat = np.eye(3)
+        sin = np.sin(angle / 360 * np.pi * 2)
+        cos = np.cos(angle / 360 * np.pi * 2)
+        mat[0][0] = cos
+        mat[0][1] = sin
+        mat[0][2] = translate[0]
+        mat[1][0] = -sin
+        mat[1][1] = cos
+        mat[1][2] = translate[1]
+        return mat
+    def generate_z(self, seed: int) -> torch.Tensor:
+        seed = int(np.clip(seed, 0, np.iinfo(np.uint32).max))
+        z = np.random.RandomState(seed).randn(1, self.model.z_dim)
+        return torch.from_numpy(z).float().to(self.device)
+    def postprocess(self, tensor: torch.Tensor) -> np.ndarray:
+        tensor = (tensor.permute(0, 2, 3, 1) * 127.5 + 128).clamp(0, 255).to(torch.uint8)
+        return tensor.cpu().numpy()
+    def dcgan_postprocess(self, tensor: torch.Tensor) -> np.ndarray:
+        tensor = (tensor.permute(0, 2, 3, 1)).clamp(0, 255).to(torch.uint8)
+        return tensor.cpu().numpy()
+    def set_transform(self, tx: float = 0, ty: float = 0, angle: float = 0) -> None:
+        mat = self.make_transform((tx, ty), angle)
+        mat = np.linalg.inv(mat)
+        self.model.synthesis.input.transform.copy_(torch.from_numpy(mat))
+    @torch.inference_mode()
+    def generate(self, z: torch.Tensor, label: torch.Tensor, truncation_psi: float) -> torch.Tensor:
+        return self.model(z, label, truncation_psi=truncation_psi)
+    def generate_image(self, seed: int, truncation_psi: float = 0, tx: float = 0, ty: float = 0, angle: float = 0) -> np.ndarray:
+        self.set_transform(tx, ty, angle)
+        z = self.generate_z(seed)
+        label = torch.zeros([1, self.model.c_dim], device=self.device)
+        out = self.generate(z, label, truncation_psi)
+        out = self.postprocess(out)
+        return out[0]
+    def dcgan_generate_image(self, seed: int) -> np.ndarray:
+        dcgan_img_size = 64
+        dcgan_z_dim = 100
+        with torch.no_grad():
+            n_images = 1
+            z = torch.randn(n_images, dcgan_z_dim, 1, 1, device=self.device)
+            fake_images = self.model(z.to(self.device)).cpu()
+            fake_images = fake_images.view(fake_images.size(0), 3, dcgan_img_size, dcgan_img_size)
+            print('fake', fake_images)
+            print(fake_images.min(), fake_images.max())
+            # Create a grid of images
+            grid = vutils.make_grid(fake_images, normalize=True)
+            print('grid', grid)
+            # Plot the grid and save it to a buffer
+            fig, ax = plt.subplots()
+            ax.imshow(grid.permute(1, 2, 0))  # Convert from CHW to HWC for imshow
+            plt.axis('off')
+            # Save the plot to a buffer
+            buf = BytesIO()
+            plt.savefig(buf, format='png')
+            buf.seek(0)
+            # Load the buffer into a PIL Image
+            img = Image.open(buf)
+            return img
+    def set_model_and_generate_image(
+        self, model_name: str, seed: int, truncation_psi: float = 0, tx: float = 0, ty: float = 0, angle: float = 0
+    ) -> np.ndarray:
+        self.set_model(model_name)
+        if "stylegan3" in model_name:
+            return self.generate_image(seed, truncation_psi, tx, ty, angle)
+        else:
+            return self.dcgan_generate_image(seed)

requirements.txt CHANGED Viewed

@@ -3,4 +3,4 @@ diffusers
 invisible_watermark
 torch
 transformers
-xformers

 invisible_watermark
 torch
 transformers
+xformers