Spaces:
Paused
Paused
File size: 22,701 Bytes
c50111a c3cd30b f09a9f1 a77e2f8 f09a9f1 a77e2f8 f09a9f1 a77e2f8 f09a9f1 a77e2f8 f09a9f1 a77e2f8 f09a9f1 a77e2f8 c3cd30b f09a9f1 a77e2f8 f09a9f1 a77e2f8 f09a9f1 a77e2f8 f09a9f1 a77e2f8 f09a9f1 c3cd30b a77e2f8 f09a9f1 a77e2f8 f09a9f1 a77e2f8 f09a9f1 a77e2f8 f09a9f1 a77e2f8 f09a9f1 a77e2f8 f09a9f1 a77e2f8 f09a9f1 a77e2f8 f09a9f1 a77e2f8 f09a9f1 a77e2f8 f09a9f1 a77e2f8 f09a9f1 a77e2f8 f09a9f1 c3cd30b f09a9f1 a77e2f8 f09a9f1 c3cd30b a77e2f8 f09a9f1 a77e2f8 f09a9f1 c3cd30b f09a9f1 a77e2f8 f09a9f1 c3cd30b f09a9f1 c3cd30b f09a9f1 a77e2f8 f09a9f1 c3cd30b f09a9f1 e422165 f09a9f1 a77e2f8 f09a9f1 a77e2f8 c3cd30b f09a9f1 |
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24 25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48 49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72 73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96 97 98 99 100 101 102 103 104 105 106 107 108 109 110 111 112 113 114 115 116 117 118 119 120 121 122 123 124 125 126 127 128 129 130 131 132 133 134 135 136 137 138 139 140 141 142 143 144 145 146 147 148 149 150 151 152 153 154 155 156 157 158 159 160 161 162 163 164 165 166 167 168 169 170 171 172 173 174 175 176 177 178 179 180 181 182 183 184 185 186 187 188 189 190 191 192 193 194 195 196 197 198 199 200 201 202 203 204 205 206 207 208 209 210 211 212 213 214 215 216 217 218 219 220 221 222 223 224 225 226 227 228 229 230 231 232 233 234 235 236 237 238 239 240 241 242 243 244 245 246 247 248 249 250 251 252 253 254 255 256 257 258 259 260 261 262 263 264 265 266 267 268 269 270 271 272 273 274 275 276 277 278 279 280 281 282 283 284 285 286 287 288 289 290 291 292 293 294 295 296 297 298 299 300 301 302 303 304 305 306 307 308 309 310 311 312 313 314 315 316 317 318 319 320 321 322 323 324 325 326 327 328 329 330 331 332 333 334 335 336 337 338 339 340 341 342 343 344 345 346 347 348 349 350 351 352 353 354 355 356 357 358 359 360 361 362 363 364 365 366 367 368 369 370 371 372 373 374 375 376 377 378 379 380 381 382 383 384 385 386 387 388 389 390 391 392 393 394 395 396 397 398 399 400 401 402 403 404 405 406 407 408 409 410 411 412 413 414 415 416 417 418 419 420 421 422 423 424 425 426 427 428 429 430 431 432 433 434 435 436 437 438 439 440 441 442 443 444 445 446 447 448 449 450 451 452 453 454 455 456 457 458 459 460 461 462 463 464 465 466 467 468 469 470 471 472 473 474 475 476 477 478 479 480 481 482 483 484 485 486 487 488 489 490 491 492 493 494 495 496 497 498 499 500 501 502 503 504 505 506 507 508 509 510 511 512 513 514 515 516 517 518 519 520 521 522 523 524 525 526 527 528 529 530 531 532 533 534 535 536 537 538 539 540 541 542 543 544 545 546 547 548 549 550 551 552 553 554 555 556 557 558 559 560 561 562 563 564 565 566 567 568 569 570 571 572 573 574 575 576 577 578 579 580 581 582 583 584 585 586 587 588 589 590 591 592 593 594 595 596 597 598 599 600 601 602 603 604 605 606 607 608 609 610 611 612 613 614 615 616 617 618 619 620 621 622 623 624 625 626 627 628 629 630 631 632 633 634 635 636 637 638 639 |
try:
import spaces
SPACES_AVAILABLE = True
print("β
Spaces available - ZeroGPU mode")
except ImportError:
SPACES_AVAILABLE = False
print("β οΈ Spaces not available - running in regular mode")
import gradio as gr
import torch
from diffusers import DiffusionPipeline, StableDiffusionXLPipeline
from PIL import Image
import datetime
import io
import json
import os
import re
from typing import Optional, List, Dict
import numpy as np
# ======================
# Configuration Section (Modify here to expand)
# ======================
# 1. Base Model - Illustrious XL v1.0
BASE_MODEL = "OnomaAIResearch/Illustrious-XL-v1.0"
# 2. Fixed LoRAs (Auto-loaded, not user-selectable)
FIXED_LORAS = {
"quality_enhancer": {
"repo_id": "stabilityai/stable-diffusion-xl-base-1.0",
"filename": "sd_xl_base_1.0.safetensors",
"weight": 0.8,
"trigger_words": "high quality, detailed, sharp"
},
"pose_control": {
"repo_id": "latent-consistency/lcm-lora-sdxl",
"filename": None,
"weight": 0.7,
"trigger_words": "perfect anatomy, natural pose"
}
}
# 3. Style Templates (Auto-prepended to user prompts)
STYLE_PROMPTS = {
"None": "",
"Realistic": "photorealistic, ultra-detailed skin, natural lighting, 8k uhd, professional photography, DSLR, soft lighting, high quality, film grain, Fujifilm XT3, masterpiece, ",
"Anime": "anime style, cel shading, vibrant colors, detailed eyes, studio ghibli style, manga style, trending on pixiv, masterpiece, ",
"Comic": "comic book style, bold outlines, dynamic angles, comic panel, Marvel DC style, inked lines, pop art, masterpiece, ",
"Watercolor": "watercolor painting, soft brush strokes, translucent layers, artistic, painterly, paper texture, traditional art, masterpiece, ",
}
# 4. Optional LoRAs (User-selectable via dropdown, can select multiple)
OPTIONAL_LORAS = {
"None": {
"repo_id": None,
"weight": 0.0,
"trigger_words": "",
"description": "No additional LoRA"
},
"Detail Enhancement": {
"repo_id": "ByteDance/SDXL-Lightning",
"weight": 0.8,
"trigger_words": "extremely detailed, intricate details, hyperdetailed",
"description": "Enhances fine details and textures"
},
"Portrait Master": {
"repo_id": "ostris/face-helper-sdxl-lora",
"weight": 0.9,
"trigger_words": "perfect face, beautiful eyes, detailed skin texture",
"description": "Specializes in realistic portraits"
},
"Cinematic Style": {
"repo_id": "goofyai/cyborg_style_xl",
"weight": 0.7,
"trigger_words": "cinematic lighting, dramatic shadows, film noir",
"description": "Adds cinematic atmosphere"
},
"Vintage Photo": {
"repo_id": "artificialguybr/LogoRedmond-LogoLoraForSDXL-V2",
"weight": 0.6,
"trigger_words": "vintage photo, retro style, film photography",
"description": "Vintage photography effects"
},
"Art Nouveau": {
"repo_id": "ostris/super-cereal-sdxl-lora",
"weight": 0.8,
"trigger_words": "art nouveau style, ornate decorations, flowing lines",
"description": "Art Nouveau artistic style"
}
}
# Default Parameters
DEFAULT_SEED = -1
DEFAULT_WIDTH = 1024
DEFAULT_HEIGHT = 1024
DEFAULT_LORA_SCALE = 0.8
DEFAULT_STEPS = 30
DEFAULT_CFG = 7.5
# Supported Languages (for future expansion)
SUPPORTED_LANGUAGES = {
"en": "English",
"zh": "δΈζ",
"ja": "ζ₯ζ¬θͺ",
"ko": "νκ΅μ΄"
}
# ======================
# Global Variables: Lazy Loading
# ======================
pipe = None
current_loras = {}
device = "cuda" if torch.cuda.is_available() else "cpu"
def load_pipeline():
"""Load the base Illustrious XL pipeline"""
global pipe
if pipe is None:
print("π Loading Illustrious XL base model...")
pipe = StableDiffusionXLPipeline.from_pretrained(
BASE_MODEL,
torch_dtype=torch.float16,
use_safetensors=True,
variant="fp16"
).to(device)
# Enable memory optimizations for ZeroGPU
pipe.enable_attention_slicing()
pipe.enable_vae_slicing()
pipe.enable_model_cpu_offload()
pipe.enable_xformers_memory_efficient_attention()
print("β
Illustrious XL model loaded successfully.")
return pipe
def unload_pipeline():
"""Unload pipeline to free memory"""
global pipe, current_loras
if pipe is not None:
# Clear any loaded LoRAs
try:
pipe.unload_lora_weights()
except:
pass
del pipe
torch.cuda.empty_cache()
pipe = None
current_loras = {}
print("ποΈ Pipeline unloaded.")
def load_lora_weights(lora_configs: List[Dict]):
"""Load multiple LoRA weights efficiently"""
global pipe, current_loras
if not lora_configs:
return
# Unload existing LoRAs if different
new_lora_ids = [config['repo_id'] for config in lora_configs if config['repo_id']]
if set(current_loras.keys()) != set(new_lora_ids):
try:
pipe.unload_lora_weights()
current_loras = {}
except:
pass
# Load new LoRAs
adapter_names = []
adapter_weights = []
for config in lora_configs:
if config['repo_id'] and config['repo_id'] not in current_loras:
try:
pipe.load_lora_weights(
config['repo_id'],
adapter_name=config['name']
)
current_loras[config['repo_id']] = config['name']
print(f"β
Loaded LoRA: {config['name']}")
except Exception as e:
print(f"β Failed to load LoRA {config['name']}: {e}")
continue
if config['repo_id']:
adapter_names.append(config['name'])
adapter_weights.append(config['weight'])
# Set adapter weights
if adapter_names:
try:
pipe.set_adapters(adapter_names, adapter_weights=adapter_weights)
except Exception as e:
print(f"β οΈ Warning setting adapter weights: {e}")
def process_long_prompt(prompt: str, max_length: int = 77) -> str:
"""Process long prompts by intelligent truncation and optimization"""
if len(prompt.split()) <= max_length:
return prompt
# Split into sentences and prioritize
sentences = re.split(r'[.!?]+', prompt)
sentences = [s.strip() for s in sentences if s.strip()]
# Keep most important parts (first sentence + key descriptors)
if sentences:
result = sentences[0]
remaining = max_length - len(result.split())
for sentence in sentences[1:]:
words = sentence.split()
if len(words) <= remaining:
result += ". " + sentence
remaining -= len(words)
else:
# Add partial sentence with most important words
important_words = [w for w in words if len(w) > 3][:remaining]
if important_words:
result += ". " + " ".join(important_words)
break
return result
return " ".join(prompt.split()[:max_length])
# ======================
# Main Generation Function
# ======================
@spaces.GPU(duration=60) if SPACES_AVAILABLE else lambda x: x
def generate_image(
prompt: str,
negative_prompt: str,
style: str,
seed: int,
width: int,
height: int,
selected_loras: List[str],
lora_scale: float,
steps: int,
cfg_scale: float,
language: str = "en"
):
"""Main image generation function with ZeroGPU optimization"""
global pipe
try:
# Load pipeline
pipe = load_pipeline()
# Handle seed
if seed == -1:
seed = torch.randint(0, 2**32, (1,)).item()
generator = torch.Generator(device=device).manual_seed(seed)
# Process prompts
style_prefix = STYLE_PROMPTS.get(style, "")
processed_prompt = process_long_prompt(style_prefix + prompt, max_length=150)
processed_negative = process_long_prompt(negative_prompt, max_length=100)
# Prepare LoRA configurations
lora_configs = []
active_trigger_words = []
# Add fixed LoRAs
for name, config in FIXED_LORAS.items():
if config["repo_id"]:
lora_configs.append({
'name': name,
'repo_id': config["repo_id"],
'weight': config["weight"]
})
if config["trigger_words"]:
active_trigger_words.append(config["trigger_words"])
# Add selected optional LoRAs
for lora_name in selected_loras:
if lora_name != "None" and lora_name in OPTIONAL_LORAS:
config = OPTIONAL_LORAS[lora_name]
if config["repo_id"]:
lora_configs.append({
'name': lora_name,
'repo_id': config["repo_id"],
'weight': config["weight"] * lora_scale
})
if config["trigger_words"]:
active_trigger_words.append(config["trigger_words"])
# Load LoRAs
load_lora_weights(lora_configs)
# Combine trigger words with prompt
if active_trigger_words:
trigger_text = ", ".join(active_trigger_words)
final_prompt = f"{processed_prompt}, {trigger_text}"
else:
final_prompt = processed_prompt
# Generate image
with torch.autocast(device):
image = pipe(
prompt=final_prompt,
negative_prompt=processed_negative,
num_inference_steps=steps,
guidance_scale=cfg_scale,
width=width,
height=height,
generator=generator,
).images[0]
# Generate metadata
timestamp = datetime.datetime.now()
metadata = {
"prompt": final_prompt,
"original_prompt": prompt,
"negative_prompt": processed_negative,
"base_model": BASE_MODEL,
"style": style,
"fixed_loras": [name for name in FIXED_LORAS.keys()],
"selected_loras": [name for name in selected_loras if name != "None"],
"lora_scale": lora_scale,
"seed": seed,
"steps": steps,
"cfg_scale": cfg_scale,
"width": width,
"height": height,
"language": language,
"timestamp": timestamp.isoformat(),
"trigger_words": active_trigger_words
}
# Generate filenames
timestamp_str = timestamp.strftime("%y%m%d%H%M")
filename_base = f"{seed}-{timestamp_str}"
# Save image as WebP
img_buffer = io.BytesIO()
image.save(img_buffer, format="WEBP", quality=95, method=6)
img_buffer.seek(0)
# Save metadata as JSON
metadata_str = json.dumps(metadata, indent=2, ensure_ascii=False)
return (
image,
metadata_str,
f"{filename_base}.webp",
f"{filename_base}.txt"
)
except Exception as e:
error_msg = f"Generation failed: {str(e)}"
print(f"β {error_msg}")
return None, error_msg, "", ""
# ======================
# Gradio Interface
# ======================
def create_interface():
"""Create the Gradio interface"""
with gr.Blocks(
theme=gr.themes.Soft(
primary_hue="blue",
secondary_hue="green",
neutral_hue="slate",
).set(
body_background_fill="linear-gradient(135deg, #1e40af, #059669)",
button_primary_background_fill="white",
button_primary_text_color="#1e40af",
input_background_fill="rgba(255,255,255,0.9)",
block_background_fill="rgba(255,255,255,0.1)",
),
css="""
body {
font-family: 'Segoe UI', 'Arial', sans-serif;
background: linear-gradient(135deg, #1e40af, #059669);
}
.gr-button {
font-family: 'Segoe UI', 'Arial', sans-serif;
font-weight: 600;
border-radius: 8px;
}
.gr-textbox {
font-family: 'Consolas', 'Monaco', 'Courier New', monospace;
border-radius: 8px;
}
.gr-dropdown, .gr-slider, .gr-radio {
border-radius: 8px;
}
.gr-form {
background: rgba(255,255,255,0.05);
border-radius: 16px;
padding: 20px;
margin: 10px;
}
""",
title="AI Photo Generator - Illustrious XL"
) as demo:
gr.Markdown("""
# π¨ AI Photo Generator (Illustrious XL + Multi-LoRA)
**PRO + ZeroGPU Optimized | Multi-LoRA Support | Style Templates | Metadata Export | 1536x1536 Native Resolution**
""")
with gr.Row():
# Left Column - Controls
with gr.Column(scale=3, elem_classes=["gr-form"]):
# a. Prompt Input
prompt_input = gr.Textbox(
label="Prompt (Positive)",
placeholder="A beautiful woman with flowing hair, golden hour lighting, cinematic composition, high detail...",
lines=6,
max_lines=20,
elem_classes=["gr-textbox"]
)
# b. Negative Prompt Input
negative_prompt_input = gr.Textbox(
label="Negative Prompt",
value="blurry, low quality, deformed, cartoon, anime, text, watermark, signature, username, worst quality, low res, bad anatomy, bad hands, error, missing fingers, extra digit, fewer digits, cropped, jpeg artifacts, bad feet, extra fingers, mutated hands, poorly drawn hands, bad proportions, extra limbs, disfigured, ugly, gross proportions, malformed limbs",
lines=4,
max_lines=15,
elem_classes=["gr-textbox"]
)
# c. Style Selection
style_radio = gr.Radio(
choices=list(STYLE_PROMPTS.keys()),
label="Style Template",
value="Realistic",
elem_classes=["gr-radio"]
)
# Multi-row controls
with gr.Row():
# d. Seed Control
with gr.Column():
seed_input = gr.Slider(
minimum=-1,
maximum=99999999,
step=1,
value=DEFAULT_SEED,
label="Seed (-1 = Random)"
)
seed_reset = gr.Button("Reset Seed", size="sm")
with gr.Row():
# e. Width Control
with gr.Column():
width_input = gr.Slider(
minimum=512,
maximum=1536,
step=64,
value=DEFAULT_WIDTH,
label="Width"
)
width_reset = gr.Button("Reset Width", size="sm")
# f. Height Control
with gr.Column():
height_input = gr.Slider(
minimum=512,
maximum=1536,
step=64,
value=DEFAULT_HEIGHT,
label="Height"
)
height_reset = gr.Button("Reset Height", size="sm")
# g. LoRA Selection (Multi-select)
lora_dropdown = gr.Dropdown(
choices=list(OPTIONAL_LORAS.keys()),
label="Optional LoRAs (Multi-select)",
value=["None"],
multiselect=True,
elem_classes=["gr-dropdown"]
)
# h. LoRA Scale Control
with gr.Row():
lora_scale_slider = gr.Slider(
minimum=0.0,
maximum=1.5,
step=0.05,
value=DEFAULT_LORA_SCALE,
label="LoRA Scale"
)
lora_reset = gr.Button("Reset LoRA", size="sm")
# i. Generation Controls
with gr.Row():
steps_slider = gr.Slider(
minimum=10,
maximum=100,
step=1,
value=DEFAULT_STEPS,
label="Steps"
)
cfg_slider = gr.Slider(
minimum=1.0,
maximum=20.0,
step=0.5,
value=DEFAULT_CFG,
label="CFG Scale"
)
gen_reset = gr.Button("Reset Generation", size="sm")
# Language Selection (Optional)
language_dropdown = gr.Dropdown(
choices=list(SUPPORTED_LANGUAGES.keys()),
label="Language (Optional)",
value="en",
visible=False # Hidden for now, can be enabled later
)
# m. Generate Button
generate_btn = gr.Button(
"β¨ Generate Image",
variant="primary",
size="lg",
elem_classes=["gr-button"]
)
# Right Column - Outputs
with gr.Column(scale=2):
# j. Image Display
image_output = gr.Image(
label="Generated Image",
height=600,
format="webp"
)
# l. Download Buttons (between image and metadata)
with gr.Row():
download_img_btn = gr.DownloadButton(
"β¬οΈ Download Image (WebP)",
variant="secondary"
)
download_meta_btn = gr.DownloadButton(
"β¬οΈ Download Metadata (TXT)",
variant="secondary"
)
# k. Metadata Display
metadata_output = gr.Textbox(
label="Generation Metadata (JSON)",
lines=15,
max_lines=25,
elem_classes=["gr-textbox"]
)
# ======================
# Event Handlers
# ======================
# Reset buttons
seed_reset.click(fn=lambda: -1, outputs=seed_input)
width_reset.click(fn=lambda: DEFAULT_WIDTH, outputs=width_input)
height_reset.click(fn=lambda: DEFAULT_HEIGHT, outputs=height_input)
lora_reset.click(fn=lambda: DEFAULT_LORA_SCALE, outputs=lora_scale_slider)
gen_reset.click(
fn=lambda: (DEFAULT_STEPS, DEFAULT_CFG),
outputs=[steps_slider, cfg_slider]
)
# Main generation function
def generate_and_prepare_downloads(*args):
result = generate_image(*args)
if result[0] is not None: # Success
image, metadata, img_filename, meta_filename = result
# Prepare download files
img_buffer = io.BytesIO()
image.save(img_buffer, format="WEBP", quality=95)
img_buffer.seek(0)
meta_buffer = io.BytesIO()
meta_buffer.write(metadata.encode('utf-8'))
meta_buffer.seek(0)
return (
image,
metadata,
gr.DownloadButton.update(value=img_buffer.getvalue(), filename=img_filename),
gr.DownloadButton.update(value=meta_buffer.getvalue(), filename=meta_filename)
)
else: # Error
return result[0], result[1], None, None
# Generate button click
generate_btn.click(
fn=generate_and_prepare_downloads,
inputs=[
prompt_input, negative_prompt_input, style_radio,
seed_input, width_input, height_input,
lora_dropdown, lora_scale_slider,
steps_slider, cfg_slider, language_dropdown
],
outputs=[
image_output, metadata_output,
download_img_btn, download_meta_btn
]
)
# Show LoRA descriptions
def show_lora_info(selected_loras):
if not selected_loras or selected_loras == ["None"]:
return "No LoRAs selected"
info = "Selected LoRAs:\n"
for lora_name in selected_loras:
if lora_name in OPTIONAL_LORAS:
config = OPTIONAL_LORAS[lora_name]
info += f"β’ {lora_name}: {config['description']}\n"
if config['trigger_words']:
info += f" Triggers: {config['trigger_words']}\n"
return info
lora_dropdown.change(
fn=show_lora_info,
inputs=[lora_dropdown],
outputs=[gr.Textbox(label="LoRA Information", visible=False)]
)
return demo
# ======================
# Launch Application
# ======================
if __name__ == "__main__":
demo = create_interface()
demo.queue(max_size=20)
demo.launch(
server_name="0.0.0.0",
server_port=7860,
share=False,
show_error=True
) |