Spaces:

prithivMLmods
/

Qwen-Image-Diffusion

Running on Zero

App Files Files Community

Qwen-Image-Diffusion / app.py

prithivMLmods

update app

a5827fa verified about 1 month ago

raw

history blame

11.8 kB

	import gradio as gr
	import numpy as np
	import random
	import torch
	import spaces
	import os
	from PIL import Image

	from diffusers import FlowMatchEulerDiscreteScheduler
	from optimization import optimize_pipeline_
	from qwenimage.pipeline_qwenimage_edit_plus import QwenImageEditPlusPipeline
	from qwenimage.transformer_qwenimage import QwenImageTransformer2DModel
	from qwenimage.qwen_fa3_processor import QwenDoubleStreamAttnProcessorFA3

	from gradio.themes import Soft
	from gradio.themes.utils import colors, fonts, sizes

	colors.steel_blue = colors.Color(
	name="steel_blue",
	c50="#EBF3F8",
	c100="#D3E5F0",
	c200="#A8CCE1",
	c300="#7DB3D2",
	c400="#529AC3",
	c500="#4682B4",
	c600="#3E72A0",
	c700="#36638C",
	c800="#2E5378",
	c900="#264364",
	c950="#1E3450",
	)

	class SteelBlueTheme(Soft):
	def __init__(
	self,
	*,
	primary_hue: colors.Color \| str = colors.gray,
	secondary_hue: colors.Color \| str = colors.steel_blue,
	neutral_hue: colors.Color \| str = colors.slate,
	text_size: sizes.Size \| str = sizes.text_lg,
	font: fonts.Font \| str \| Iterable[fonts.Font \| str] = (
	fonts.GoogleFont("Outfit"), "Arial", "sans-serif",
	),
	font_mono: fonts.Font \| str \| Iterable[fonts.Font \| str] = (
	fonts.GoogleFont("IBM Plex Mono"), "ui-monospace", "monospace",
	),
	):
	super().__init__(
	primary_hue=primary_hue,
	secondary_hue=secondary_hue,
	neutral_hue=neutral_hue,
	text_size=text_size,
	font=font,
	font_mono=font_mono,
	)
	super().set(
	background_fill_primary="*primary_50",
	background_fill_primary_dark="*primary_900",
	body_background_fill="linear-gradient(135deg, primary_200, primary_100)",
	body_background_fill_dark="linear-gradient(135deg, primary_900, primary_800)",
	button_primary_text_color="white",
	button_primary_text_color_hover="white",
	button_primary_background_fill="linear-gradient(90deg, secondary_500, secondary_600)",
	button_primary_background_fill_hover="linear-gradient(90deg, secondary_600, secondary_700)",
	button_primary_background_fill_dark="linear-gradient(90deg, secondary_600, secondary_800)",
	button_primary_background_fill_hover_dark="linear-gradient(90deg, secondary_500, secondary_500)",
	button_secondary_text_color="black",
	button_secondary_text_color_hover="white",
	button_secondary_background_fill="linear-gradient(90deg, primary_300, primary_300)",
	button_secondary_background_fill_hover="linear-gradient(90deg, primary_400, primary_400)",
	button_secondary_background_fill_dark="linear-gradient(90deg, primary_500, primary_600)",
	button_secondary_background_fill_hover_dark="linear-gradient(90deg, primary_500, primary_500)",
	slider_color="*secondary_500",
	slider_color_dark="*secondary_600",
	block_title_text_weight="600",
	block_border_width="3px",
	block_shadow="*shadow_drop_lg",
	button_primary_shadow="*shadow_drop_lg",
	button_large_padding="11px",
	color_accent_soft="*primary_100",
	block_label_background_fill="*primary_200",
	)

	steel_blue_theme = SteelBlueTheme()

	# --- Constants and Setup ---
	MAX_SEED = np.iinfo(np.int32).max
	dtype = torch.bfloat16
	device = "cuda" if torch.cuda.is_available() else "cpu"

	# --- Model Loading ---
	# Load the base pipeline and the optimized transformer
	pipe = QwenImageEditPlusPipeline.from_pretrained(
	"Qwen/Qwen-Image-Edit-2509",
	transformer=QwenImageTransformer2DModel.from_pretrained(
	"linoyts/Qwen-Image-Edit-Rapid-AIO",
	subfolder='transformer',
	torch_dtype=dtype,
	device_map='cuda'
	),
	torch_dtype=dtype
	).to(device)

	# Load all LoRA adapters with unique names
	pipe.load_lora_weights(
	"dx8152/Qwen-Image-Edit-2509-Light_restoration",
	weight_name="移除光影.safetensors",
	adapter_name="light_restoration"
	)
	pipe.load_lora_weights(
	"dx8152/Qwen-Edit-2509-Multiple-angles",
	weight_name="镜头转换.safetensors",
	adapter_name="multiple_angles"
	)
	pipe.load_lora_weights(
	"autoweeb/Qwen-Image-Edit-2509-Photo-to-Anime",
	weight_name="Qwen-Image-Edit-2509-Photo-to-Anime_000001000.safetensors",
	adapter_name="photo_to_anime"
	)
	pipe.load_lora_weights(
	"dx8152/Qwen-Image-Edit-2509-Relight",
	weight_name="Qwen-Edit-Relight.safetensors",
	adapter_name="relight"
	)

	# Apply optimizations
	pipe.transformer.__class__ = QwenImageTransformer2DModel
	pipe.transformer.set_attn_processor(QwenDoubleStreamAttnProcessorFA3())
	optimize_pipeline_(pipe, image=[Image.new("RGB", (1024, 1024)), Image.new("RGB", (1024, 1024))], prompt="prompt")


	# --- Inference Logic ---
	@spaces.GPU
	def infer(
	image,
	prompt,
	lora_adapter,
	seed,
	randomize_seed,
	true_guidance_scale,
	num_inference_steps,
	height,
	width,
	progress=gr.Progress(track_tqdm=True)
	):
	if image is None:
	raise gr.Error("Please upload an image to get started.")

	# Set the active LoRA adapter based on user selection
	if lora_adapter == "Shadow/Light Restoration":
	pipe.set_adapters(["light_restoration"], adapter_weights=[1.0])
	elif lora_adapter == "Multiple Angles":
	pipe.set_adapters(["multiple_angles"], adapter_weights=[1.0])
	elif lora_adapter == "Photo to Anime":
	pipe.set_adapters(["photo_to_anime"], adapter_weights=[1.0])
	elif lora_adapter == "Advanced Relighting":
	pipe.set_adapters(["relight"], adapter_weights=[1.0])

	if randomize_seed:
	seed = random.randint(0, MAX_SEED)
	generator = torch.Generator(device=device).manual_seed(seed)

	result = pipe(
	image=image.convert("RGB"),
	prompt=prompt,
	height=height,
	width=width,
	num_inference_steps=num_inference_steps,
	generator=generator,
	true_cfg_scale=true_guidance_scale,
	num_images_per_prompt=1,
	).images[0]

	return result, seed

	# --- UI Helper Functions ---
	def update_dimensions_on_upload(image):
	"""Adjusts the height and width sliders to match the uploaded image's aspect ratio."""
	if image is None:
	return 1024, 1024

	original_width, original_height = image.size

	if original_width > original_height:
	new_width = 1024
	new_height = int(new_width * (original_height / original_width))
	else:
	new_height = 1024
	new_width = int(new_height * (original_width / original_height))

	# Ensure dimensions are multiples of 8 for model compatibility
	new_width = (new_width // 8) * 8
	new_height = (new_height // 8) * 8

	return new_width, new_height

	def update_prompt_on_adapter_change(adapter_name):
	"""Provides a suggested prompt when a new adapter is selected."""
	prompts = {
	"Shadow/Light Restoration": "Remove shadows and relight the image using soft lighting.",
	"Multiple Angles": "A photo of the scene from a top-down view.",
	"Photo to Anime": "Transform into anime, masterpiece, best quality.",
	"Advanced Relighting": "Relight the image using soft, diffused lighting that simulates sunlight filtering through curtains."
	}
	return prompts.get(adapter_name, "")

	# --- Gradio UI ---
	css = '''
	#col-container {
	max-width: 960px;
	margin: 0 auto;
	font-family: -apple-system, BlinkMacSystemFont, "Segoe UI", Roboto, Helvetica, Arial, sans-serif;
	}
	.dark .progress-text { color: white !important }
	#examples { max-width: 960px; margin: 0 auto; }
	.gradio-container {
	background: linear-gradient(135deg, #f5f7fa 0%, #c3cfe2 100%);
	}
	.gr-button-primary {
	background: linear-gradient(135deg, #667eea 0%, #764ba2 100%) !important;
	border: none !important;
	border-radius: 12px !important;
	padding: 12px 24px !important;
	font-weight: 600 !important;
	}
	.gr-box {
	border-radius: 16px !important;
	box-shadow: 0 4px 6px rgba(0, 0, 0, 0.1) !important;
	}
	'''

	with gr.Blocks(theme=steel_blue_theme, css=css) as demo:
	with gr.Column(elem_id="col-container"):
	gr.Markdown("# Qwen Image Edit - Fast LoRA")
	with gr.Row():
	with gr.Column(scale=1):
	image = gr.Image(label="Upload Image", type="pil", height=450)

	lora_adapter = gr.Dropdown(
	label="Choose an Editing Tool",
	choices=[
	"Shadow/Light Restoration",
	"Multiple Angles",
	"Photo to Anime",
	"Advanced Relighting"
	],
	value="Shadow/Light Restoration"
	)

	prompt = gr.Textbox(
	label="Prompt",
	value="Remove shadows and relight the image using soft lighting.",
	lines=2
	)

	run_btn = gr.Button("Generate", variant="primary", size="lg")

	with gr.Accordion("⚙️ Advanced Settings", open=False):
	seed = gr.Slider(label="Seed", minimum=0, maximum=MAX_SEED, step=1, value=0)
	randomize_seed = gr.Checkbox(label="Randomize Seed", value=True)
	true_guidance_scale = gr.Slider(label="Guidance Scale", minimum=1.0, maximum=10.0, step=0.1, value=1.0)
	num_inference_steps = gr.Slider(label="Inference Steps", minimum=1, maximum=40, step=1, value=4)
	height = gr.Slider(label="Height", minimum=256, maximum=2048, step=8, value=1024)
	width = gr.Slider(label="Width", minimum=256, maximum=2048, step=8, value=1024)

	with gr.Column(scale=1):
	result = gr.Image(label="Output Image", interactive=False, height=500, format="png")

	gr.Examples(
	elem_id="examples",
	examples=[
	[
	"examples/example1.png",
	"A photo of the scene from a low angle shot.",
	"Multiple Angles",
	],
	[
	"examples/example2.png",
	"Remove shadows and relight the image using soft lighting.",
	"Shadow/Light Restoration",
	],
	[
	"examples/example3.png",
	"Transform into anime, masterpiece, best quality, girl with cherry blossoms.",
	"Photo to Anime",
	],
	[
	"examples/example4.png",
	"Relight the image using soft, diffused lighting that simulates sunlight filtering through curtains.",
	"Advanced Relighting",
	],
	],
	inputs=[image, prompt, lora_adapter],
	outputs=[result, seed],
	fn=infer,
	cache_examples=False
	)

	# --- Event Handlers ---
	run_btn.click(
	fn=infer,
	inputs=[image, prompt, lora_adapter, seed, randomize_seed, true_guidance_scale, num_inference_steps, height, width],
	outputs=[result, seed]
	)

	image.upload(
	fn=update_dimensions_on_upload,
	inputs=[image],
	outputs=[width, height]
	)

	lora_adapter.change(
	fn=update_prompt_on_adapter_change,
	inputs=[lora_adapter],
	outputs=[prompt]
	)

	demo.launch(mcp_server=True, ssr_mode=False, show_error=True)