import os

import gradio as gr
import numpy as np
import PIL.Image
import spaces
import torch
from diffusers import AutoencoderKL, DiffusionPipeline

DESCRIPTION = "# SDXL"

MAX_SEED = np.iinfo(np.int32).max
MAX_IMAGE_SIZE = int(os.getenv("MAX_IMAGE_SIZE", "1024"))

device = torch.device("cuda:0" if torch.cuda.is_available() else "cpu")

vae = AutoencoderKL.from_pretrained("madebyollin/sdxl-vae-fp16-fix", torch_dtype=torch.float16)
pipe = DiffusionPipeline.from_pretrained(
    "stabilityai/stable-diffusion-xl-base-1.0",
    vae=vae,
    torch_dtype=torch.float16,
    use_safetensors=True,
    variant="fp16",
).to(device)
refiner = DiffusionPipeline.from_pretrained(
    "stabilityai/stable-diffusion-xl-refiner-1.0",
    vae=vae,
    torch_dtype=torch.float16,
    use_safetensors=True,
    variant="fp16",
).to(device)
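
# Optional memory savers (a sketch; not enabled in this Space). These diffusers
# helpers trade some throughput for lower peak VRAM and may help on smaller GPUs:
#   pipe.enable_model_cpu_offload()  # requires accelerate; keeps submodules on CPU until needed
#   pipe.enable_vae_slicing()        # decodes the VAE one slice at a time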


def get_seed(randomize_seed: bool, seed: int) -> int:
    """Determine the random seed to use for model generation or sampling.

    - MAX_SEED is the maximum value of a 32-bit integer (np.iinfo(np.int32).max).
    - Typically used to ensure reproducibility or to introduce randomness into generation.
    - The seed drives the stochastic parts of downstream model inference or sampling.

    Args:
        randomize_seed (bool): If True, a random seed (an integer in [0, MAX_SEED)) is
            drawn from NumPy's default random number generator. If False, the provided
            seed argument is returned as-is.
        seed (int): The seed value to use if randomize_seed is False.

    Returns:
        int: The selected seed value.
    """
    rng = np.random.default_rng()
    return int(rng.integers(0, MAX_SEED)) if randomize_seed else seed
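
# For example (illustrative values): get_seed(False, 42) returns 42 unchanged, while
# get_seed(True, 42) ignores the given seed and returns a fresh draw from [0, MAX_SEED).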


@spaces.GPU
def generate(
    prompt: str,
    negative_prompt: str = "",
    prompt_2: str = "",
    negative_prompt_2: str = "",
    use_negative_prompt: bool = False,
    use_prompt_2: bool = False,
    use_negative_prompt_2: bool = False,
    seed: int = 0,
    width: int = 1024,
    height: int = 1024,
    guidance_scale_base: float = 5.0,
    guidance_scale_refiner: float = 5.0,
    num_inference_steps_base: int = 25,
    num_inference_steps_refiner: int = 25,
    apply_refiner: bool = False,
    progress: gr.Progress = gr.Progress(track_tqdm=True),
) -> PIL.Image.Image:
    """Generate an image from a text prompt using the SDXL (Stable Diffusion XL) model.

    This function allows fine-grained control over image generation through prompts,
    negative prompts, and an optional refinement stage.

    Note:
        All prompt-related inputs (`prompt`, `negative_prompt`, `prompt_2`, and
        `negative_prompt_2`) must be written in English for proper model performance.

    Args:
        prompt (str): Main text prompt used to guide image generation.
        negative_prompt (str, optional): Text specifying elements to exclude from the image.
        prompt_2 (str, optional): Secondary prompt for additional guidance. Used only if `use_prompt_2` is True.
        negative_prompt_2 (str, optional): Secondary negative prompt. Used only if `use_negative_prompt_2` is True.
        use_negative_prompt (bool, optional): Whether to apply `negative_prompt` during generation.
        use_prompt_2 (bool, optional): Whether to apply `prompt_2` during generation.
        use_negative_prompt_2 (bool, optional): Whether to apply `negative_prompt_2` during generation.
        seed (int, optional): Seed for the random number generator; the same seed with the same settings reproduces the same image.
        width (int, optional): Width of the output image in pixels.
        height (int, optional): Height of the output image in pixels.
        guidance_scale_base (float, optional): Guidance scale for the base model. Higher values follow the prompt more closely.
        guidance_scale_refiner (float, optional): Guidance scale for the refiner model.
        num_inference_steps_base (int, optional): Number of inference steps for the base model.
        num_inference_steps_refiner (int, optional): Number of inference steps for the refiner model.
        apply_refiner (bool, optional): Whether to apply the refiner stage after the base image is generated.
        progress (gr.Progress, optional): Gradio progress object to show progress during generation.

    Returns:
        PIL.Image.Image: The generated image as a PIL Image object.
    """
    generator = torch.Generator().manual_seed(seed)

    if not use_negative_prompt:
        negative_prompt = None
    if not use_prompt_2:
        prompt_2 = None
    if not use_negative_prompt_2:
        negative_prompt_2 = None

    if not apply_refiner:
        return pipe(
            prompt=prompt,
            negative_prompt=negative_prompt,
            prompt_2=prompt_2,
            negative_prompt_2=negative_prompt_2,
            width=width,
            height=height,
            guidance_scale=guidance_scale_base,
            num_inference_steps=num_inference_steps_base,
            generator=generator,
            output_type="pil",
        ).images[0]

    # Run the base model in latent space, then hand the latents to the refiner.
    latents = pipe(
        prompt=prompt,
        negative_prompt=negative_prompt,
        prompt_2=prompt_2,
        negative_prompt_2=negative_prompt_2,
        width=width,
        height=height,
        guidance_scale=guidance_scale_base,
        num_inference_steps=num_inference_steps_base,
        generator=generator,
        output_type="latent",
    ).images
    images = refiner(
        prompt=prompt,
        negative_prompt=negative_prompt,
        prompt_2=prompt_2,
        negative_prompt_2=negative_prompt_2,
        guidance_scale=guidance_scale_refiner,
        num_inference_steps=num_inference_steps_refiner,
        image=latents,
        generator=generator,
    ).images
    return images[0]
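
# Minimal direct use (a sketch, assuming a CUDA GPU; the @spaces.GPU decorator is a
# no-op outside Hugging Face Spaces). The output filename is illustrative:
#   image = generate("An astronaut riding a green horse", seed=get_seed(True, 0))
#   image.save("astronaut.png")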


examples = [
    "Astronaut in a jungle, cold color palette, muted colors, detailed, 8k",
    "An astronaut riding a green horse",
]

with gr.Blocks(css_paths="style.css") as demo:
    gr.Markdown(DESCRIPTION)

    with gr.Group():
        with gr.Row():
            prompt = gr.Textbox(
                label="Prompt",
                show_label=False,
                max_lines=1,
                placeholder="Enter your prompt",
                submit_btn=True,
            )
        result = gr.Image(label="Result", show_label=False)
    with gr.Accordion("Advanced options", open=False):
        with gr.Row():
            use_negative_prompt = gr.Checkbox(label="Use negative prompt", value=False)
            use_prompt_2 = gr.Checkbox(label="Use prompt 2", value=False)
            use_negative_prompt_2 = gr.Checkbox(label="Use negative prompt 2", value=False)
        negative_prompt = gr.Textbox(
            label="Negative prompt",
            max_lines=1,
            placeholder="Enter a negative prompt",
            visible=False,
            value="",
        )
        prompt_2 = gr.Textbox(
            label="Prompt 2",
            max_lines=1,
            placeholder="Enter your prompt",
            visible=False,
            value="",
        )
        negative_prompt_2 = gr.Textbox(
            label="Negative prompt 2",
            max_lines=1,
            placeholder="Enter a negative prompt",
            visible=False,
            value="",
        )

        seed = gr.Slider(
            label="Seed",
            minimum=0,
            maximum=MAX_SEED,
            step=1,
            value=0,
        )
        randomize_seed = gr.Checkbox(label="Randomize seed", value=True)
        with gr.Row():
            width = gr.Slider(
                label="Width",
                minimum=256,
                maximum=MAX_IMAGE_SIZE,
                step=32,
                value=1024,
            )
            height = gr.Slider(
                label="Height",
                minimum=256,
                maximum=MAX_IMAGE_SIZE,
                step=32,
                value=1024,
            )
        apply_refiner = gr.Checkbox(label="Apply refiner", value=True)
        with gr.Row():
            guidance_scale_base = gr.Slider(
                label="Guidance scale for base",
                minimum=1,
                maximum=20,
                step=0.1,
                value=5.0,
            )
            num_inference_steps_base = gr.Slider(
                label="Number of inference steps for base",
                minimum=10,
                maximum=100,
                step=1,
                value=25,
            )
        with gr.Row() as refiner_params:
            guidance_scale_refiner = gr.Slider(
                label="Guidance scale for refiner",
                minimum=1,
                maximum=20,
                step=0.1,
                value=5.0,
            )
            num_inference_steps_refiner = gr.Slider(
                label="Number of inference steps for refiner",
                minimum=10,
                maximum=100,
                step=1,
                value=25,
            )

    gr.Examples(
        examples=examples,
        inputs=prompt,
        outputs=result,
        fn=generate,
    )
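
    # Each checkbox below toggles the visibility of its matching textbox (or, for
    # the refiner, the row of refiner sliders) by returning an updated component.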
    use_negative_prompt.change(
        fn=lambda x: gr.Textbox(visible=x),
        inputs=use_negative_prompt,
        outputs=negative_prompt,
        queue=False,
        api_name=False,
    )
    use_prompt_2.change(
        fn=lambda x: gr.Textbox(visible=x),
        inputs=use_prompt_2,
        outputs=prompt_2,
        queue=False,
        api_name=False,
    )
    use_negative_prompt_2.change(
        fn=lambda x: gr.Textbox(visible=x),
        inputs=use_negative_prompt_2,
        outputs=negative_prompt_2,
        queue=False,
        api_name=False,
    )
    apply_refiner.change(
        fn=lambda x: gr.Row(visible=x),
        inputs=apply_refiner,
        outputs=refiner_params,
        queue=False,
        api_name=False,
    )
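
    # Submitting any prompt field first resolves the seed (random or fixed) via
    # get_seed, then runs generate; api_name="predict" names the API endpoint.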
    gr.on(
        triggers=[
            prompt.submit,
            negative_prompt.submit,
            prompt_2.submit,
            negative_prompt_2.submit,
        ],
        fn=get_seed,
        inputs=[randomize_seed, seed],
        outputs=seed,
        queue=False,
    ).then(
        fn=generate,
        inputs=[
            prompt,
            negative_prompt,
            prompt_2,
            negative_prompt_2,
            use_negative_prompt,
            use_prompt_2,
            use_negative_prompt_2,
            seed,
            width,
            height,
            guidance_scale_base,
            guidance_scale_refiner,
            num_inference_steps_base,
            num_inference_steps_refiner,
            apply_refiner,
        ],
        outputs=result,
        api_name="predict",
    )
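
# With mcp_server=True below (recent Gradio with the gradio[mcp] extra), the named
# "predict" endpoint is also exposed as an MCP tool, using generate()'s docstring
# as the tool description.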
if __name__ == "__main__":
    demo.launch(mcp_server=True)