import os
import io
import re
import random

import requests
import numpy as np
import torch
import gradio as gr
from PIL import Image
from openai import OpenAI
from diffusers import (
    StableDiffusionXLPipeline,
    StableDiffusionPipeline,
    EulerAncestralDiscreteScheduler,
    DPMSolverMultistepScheduler,
    KDPM2AncestralDiscreteScheduler,
)

# ------------------------------------------------------------
# DEVICE
# ------------------------------------------------------------
device = torch.device("cuda" if torch.cuda.is_available() else "cpu")
IS_CPU = device.type == "cpu"
DTYPE = torch.float32 if IS_CPU else torch.float16
print(f"[INFO] Device: {device} | dtype: {DTYPE}")

# app = gr.mount_gradio_app(
#     FastAPI(),
#     demo,
#     path="/"
# )

# ------------------------------------------------------------
# MODELS
# ------------------------------------------------------------
SDXL_MODELS = {
    # "Tongyi-MAI/Z-Image-Turbo": "Z-Image Turbo ⚡",
    "Heartsync/NSFW-Uncensored": "NSFW Uncensored",
    "stabilityai/stable-diffusion-xl-base-1.0": "SDXL Base 1.0",
    "RunDiffusion/Juggernaut-XL-v9": "Juggernaut XL v9",
    "SG161222/RealVisXL_V4.0": "RealVisXL V4.0",
    "cagliostrolab/animagine-xl-3.1": "Animagine XL 3.1",
    "Lykon/dreamshaper-xl-1-0": "DreamShaper XL",
    "playgroundai/playground-v2.5-1024px-aesthetic": "Playground v2.5",
    "dataautogpt3/OpenDalleV1.1": "OpenDalle V1.1",
    "fluently/Fluently-XL-Final": "Fluently XL",
    "Corcelio/mobius": "Mobius",
}

SD15_MODELS = {
    "Tongyi-MAI/Z-Image-Turbo": "Z-Image Turbo ⚡",
    "runwayml/stable-diffusion-v1-5": "SD 1.5 (Lightweight)",
    "Lykon/dreamshaper-8": "DreamShaper 8",
    "stablediffusionapi/realistic-vision-v51": "Realistic Vision v5.1",
    "stablediffusionapi/anything-v5": "Anything v5 (Anime)",
    "stablediffusionapi/chilloutmix": "ChilloutMix",
    "digiplay/AbsoluteReality_v1.8.1": "AbsoluteReality v1.8",
}

AVAILABLE_MODELS = {**SDXL_MODELS, **SD15_MODELS}

TURBO_MODELS = {
    "Tongyi-MAI/Z-Image-Turbo",
}

# ------------------------------------------------------------
# SCHEDULERS
# ------------------------------------------------------------
SCHEDULERS = {
    "Euler Ancestral": "EulerAncestral",
    "DPM++ 2M Karras": "DPM++2MKarras",
    "KDPM2 Ancestral": "KDPM2Ancestral",
}


def set_scheduler(pipe, key):
    """Swap the pipeline's scheduler in place, reusing its existing config."""
    if key == "EulerAncestral":
        pipe.scheduler = EulerAncestralDiscreteScheduler.from_config(pipe.scheduler.config)
    elif key == "DPM++2MKarras":
        pipe.scheduler = DPMSolverMultistepScheduler.from_config(
            pipe.scheduler.config, use_karras_sigmas=True
        )
    elif key == "KDPM2Ancestral":
        pipe.scheduler = KDPM2AncestralDiscreteScheduler.from_config(pipe.scheduler.config)
    return pipe


# ------------------------------------------------------------
# PIPELINE CACHE
# ------------------------------------------------------------
loaded_pipelines = {}


def load_pipeline(model_id):
    """Load a pipeline once and cache it, retrying with progressively fewer kwargs."""
    if model_id in loaded_pipelines:
        return loaded_pipelines[model_id]

    print(f"[INFO] Loading: {model_id}")
    is_xl = model_id in SDXL_MODELS
    PipeClass = StableDiffusionXLPipeline if is_xl else StableDiffusionPipeline

    for kwargs in [
        {"torch_dtype": DTYPE, "variant": "fp16" if not IS_CPU else None, "use_safetensors": True},
        {"torch_dtype": DTYPE, "use_safetensors": True},
        {"torch_dtype": DTYPE},
    ]:
        try:
            kwargs = {k: v for k, v in kwargs.items() if v is not None}
            pipe = PipeClass.from_pretrained(model_id, **kwargs)
            break
        except Exception as e:
            print(f"[WARN] Load attempt failed: {e}")
            continue
    else:
        raise RuntimeError(f"Failed to load model: {model_id}")

    pipe.scheduler = EulerAncestralDiscreteScheduler.from_config(pipe.scheduler.config)
    pipe.to(device)
    if IS_CPU:
        pipe.enable_attention_slicing()

    loaded_pipelines[model_id] = pipe
    print(f"[INFO] Loaded: {model_id}")
    return pipe
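
# Optional warm-up sketch (a hypothetical helper; nothing in the app calls it).
# Preloading a small model at startup hides the first-request download and load
# latency; any id from AVAILABLE_MODELS works. Failures are logged and skipped
# so startup never blocks.
def warm_cache(model_ids=("Lykon/dreamshaper-8",)):
    for mid in model_ids:
        try:
            load_pipeline(mid)  # downloads once, then served from loaded_pipelines
        except Exception as e:
            print(f"[WARN] Warm-up skipped for {mid}: {e}")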
# ------------------------------------------------------------
# OPENROUTER
# ------------------------------------------------------------
or_api_key = os.getenv("OPENROUTER_API_KEY")
or_client = None
if or_api_key:
    try:
        or_client = OpenAI(base_url="https://openrouter.ai/api/v1", api_key=or_api_key)
        print("[INFO] OpenRouter ready")
    except Exception as e:
        print(f"[ERROR] OpenRouter: {e}")

HF_TOKEN = os.getenv("HF_TOKEN")
LLM_MODEL = "google/gemini-2.0-flash-001"


# ------------------------------------------------------------
# LANGUAGE
# ------------------------------------------------------------
def is_non_english(text):
    """Heuristic: treat any Hangul, Kana, CJK, or other non-ASCII text as non-English."""
    if not text:
        return False
    for pattern in [r'[\uac00-\ud7a3]', r'[\u3040-\u30ff]', r'[\u4e00-\u9fff]', r'[^\x00-\x7F]']:
        if re.search(pattern, text):
            return True
    return False


def translate_to_english(text):
    """Translate via the LLM; fall back to the original text on any failure."""
    if not or_client or not is_non_english(text):
        return text
    try:
        resp = or_client.chat.completions.create(
            model=LLM_MODEL,
            messages=[
                {"role": "system", "content": "Translate to English. Only provide translation."},
                {"role": "user", "content": text},
            ],
            temperature=0.1,
        )
        result = resp.choices[0].message.content.strip()
        return result if len(result) > 3 else text
    except Exception as e:
        print(f"[ERROR] Translate: {e}")
        return text


# ------------------------------------------------------------
# EXAMPLES & TEMPLATES
# ------------------------------------------------------------
prompt_examples = [
    "Hyperrealistic portrait of a beautiful woman, studio lighting, 8k photography",
    "Anime girl with long silver hair, school uniform, cherry blossoms, detailed art",
    "A couple sharing a passionate kiss in Paris at night, Eiffel Tower glowing, cinematic",
    "Digital art, fantasy woman warrior, detailed armor, epic lighting, concept art",
    "Mature anime woman, elegant kimono, traditional Japanese setting, high quality",
    "Watercolor illustration, graceful woman, flowing dress, soft pastel colors",
    "Fashion photography, elegant model, dramatic lighting, high fashion, detailed",
    "Two lovers walking on a moonlit beach, waves crashing, intimate moment",
    "Moody anime scene, neon lights, rain, two characters, sensual atmosphere",
    "Oil painting style, figure study, classical art, soft colors, detailed brushwork",
]

TEMPLATES = {
    "🎭 Romantic": [
        "A couple in a passionate embrace, soft candlelight, romantic atmosphere, detailed",
        "Two lovers walking on a moonlit beach, waves crashing, intimate moment, photorealistic",
        "A woman in elegant evening dress, soft lighting, romantic dinner setting, beautiful",
    ],
    "🌸 Anime": [
        "Anime girl with long silver hair, school uniform, cherry blossoms, detailed anime art",
        "Mature anime woman, elegant kimono, traditional Japanese setting, high quality",
        "Moody anime scene, neon lights, rain, two characters, sensual atmosphere",
    ],
    "📸 Realistic": [
        "Hyperrealistic portrait of a beautiful woman, studio lighting, 8k photography",
        "Cinematic shot, beautiful woman, soft natural light, photorealistic, high detail",
        "Fashion photography, elegant model, dramatic lighting, high fashion, detailed",
    ],
    "🎨 Artistic": [
        "Oil painting style, figure study, classical art, soft colors, detailed brushwork",
        "Digital art, fantasy woman warrior, detailed armor, epic lighting, concept art",
        "Watercolor illustration, graceful woman, flowing dress, soft pastel colors",
    ],
}
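
# Hypothetical convenience accessor (an illustrative sketch; the UI is assumed to
# wire template buttons directly): fetch one template prompt by category, falling
# back to a random example so callers never hit a KeyError or IndexError.
def get_template_prompt(category, index=0):
    prompts = TEMPLATES.get(category)
    if not prompts:
        return random.choice(prompt_examples)
    return prompts[index % len(prompts)]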
# ------------------------------------------------------------
# BOOST
# ------------------------------------------------------------
def boost_prompt(keyword):
    """Expand a short keyword into a detailed English image prompt via the LLM."""
    if not keyword or not keyword.strip():
        return "Please enter a keyword first."
    if is_non_english(keyword):
        keyword = translate_to_english(keyword)
    if not or_client:
        return f"{keyword}, highly detailed, beautiful, masterpiece, best quality, 8k"
    try:
        resp = or_client.chat.completions.create(
            model=LLM_MODEL,
            messages=[
                {"role": "system", "content": "Generate ONE detailed image prompt in English. 1-3 sentences. No prefixes. Just the prompt."},
                {"role": "user", "content": keyword},
            ],
            temperature=0.8,
        )
        result = resp.choices[0].message.content.strip()
        result = re.sub(r'^(Prompt:|Output:|Result:)\s*', '', result, flags=re.IGNORECASE)
        if is_non_english(result):
            result = translate_to_english(result)
        return result if len(result) > 10 else f"{keyword}, detailed, high quality"
    except Exception as e:
        print(f"[ERROR] Boost: {e}")
        return f"{keyword}, highly detailed, beautiful, masterpiece"


def get_random_prompt():
    return random.choice(prompt_examples)


# ------------------------------------------------------------
# HF INFERENCE API
# ------------------------------------------------------------
HF_API_SUPPORTED = {
    # "Tongyi-MAI/Z-Image-Turbo",
    "stabilityai/stable-diffusion-xl-base-1.0",
    "runwayml/stable-diffusion-v1-5",
    "Lykon/dreamshaper-8",
    "Lykon/dreamshaper-xl-1-0",
    "cagliostrolab/animagine-xl-3.1",
    "dataautogpt3/OpenDalleV1.1",
}


def infer_via_api(prompt, negative_prompt, model_id, width, height, steps, guidance):
    """Try the hosted HF Inference API first; return None on any failure."""
    if not HF_TOKEN or model_id not in HF_API_SUPPORTED:
        return None
    try:
        print(f"[INFO] HF API: {model_id}")
        r = requests.post(
            f"https://api-inference.huggingface.co/models/{model_id}",
            headers={"Authorization": f"Bearer {HF_TOKEN}"},
            json={
                "inputs": prompt,
                "parameters": {
                    "negative_prompt": negative_prompt,
                    "width": min(width, 1024),
                    "height": min(height, 1024),
                    "num_inference_steps": steps,
                    "guidance_scale": guidance,
                },
            },
            timeout=120,
        )
        if r.status_code == 200:
            print("[INFO] HF API success")
            return Image.open(io.BytesIO(r.content))
        print(f"[WARN] HF API {r.status_code}")
        return None
    except Exception as e:
        print(f"[ERROR] HF API: {e}")
        return None


# ------------------------------------------------------------
# LOCAL INFERENCE
# ------------------------------------------------------------
def infer_local(prompt, negative_prompt, model_id, seed, width, height,
                guidance, steps, scheduler_key, clip_skip):
    """Run a locally loaded pipeline; return None if loading or inference fails."""
    try:
        pipe = load_pipeline(model_id)
        pipe = set_scheduler(pipe, scheduler_key)
    except Exception as e:
        print(f"[ERROR] Load model: {e}")
        return None

    # Turbo models: automatically reduce steps and cap guidance
    if model_id in TURBO_MODELS:
        steps = min(steps, 8)
        guidance = min(guidance, 5.0)
        print(f"[INFO] Turbo mode: steps={steps}, guidance={guidance}")

    generator = torch.Generator(device=device).manual_seed(seed)
    kwargs = dict(
        prompt=prompt,
        negative_prompt=negative_prompt,
        guidance_scale=guidance,
        num_inference_steps=steps,
        width=width,
        height=height,
        generator=generator,
    )
    if clip_skip > 1 and model_id in SDXL_MODELS:
        kwargs["clip_skip"] = clip_skip

    try:
        return pipe(**kwargs).images[0]
    except RuntimeError as e:
        print(f"[ERROR] Inference: {e}")
        return None
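
# Hypothetical eviction helper (a sketch; the app never calls it): the
# loaded_pipelines cache grows without bound as users switch models, which can
# exhaust RAM/VRAM on small machines. Popping an entry lets Python free it once
# no other references remain.
def unload_pipeline(model_id):
    pipe = loaded_pipelines.pop(model_id, None)
    if pipe is None:
        return
    del pipe
    if device.type == "cuda":
        torch.cuda.empty_cache()  # return cached CUDA blocks to the driver
    print(f"[INFO] Unloaded: {model_id}")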
# ------------------------------------------------------------
# MAIN INFER
# ------------------------------------------------------------
MAX_SEED = np.iinfo(np.int32).max
MAX_IMAGE_SIZE = 1216


def infer(model_id, prompt, negative_prompt, seed, randomize_seed, width, height,
          guidance_scale, num_inference_steps, scheduler_name, clip_skip):
    """Translate prompts if needed, then try the HF API with a local fallback."""
    if is_non_english(prompt):
        prompt = translate_to_english(prompt)
    if is_non_english(negative_prompt):
        negative_prompt = translate_to_english(negative_prompt)
    if randomize_seed:
        seed = random.randint(0, MAX_SEED)

    scheduler_key = SCHEDULERS.get(scheduler_name, "EulerAncestral")
    print(f"[INFO] Model: {model_id} | Seed: {seed}")
    print(f"[INFO] Prompt: {prompt[:80]}")

    # 1. HF API
    image = infer_via_api(
        prompt, negative_prompt, model_id, width, height,
        num_inference_steps, guidance_scale
    )

    # 2. Local fallback
    if image is None:
        print("[INFO] Fallback to local")
        image = infer_local(
            prompt, negative_prompt, model_id, seed, width, height,
            guidance_scale, num_inference_steps, scheduler_key, clip_skip
        )

    # 3. Last resort: a dark placeholder so the UI never shows an error
    if image is None:
        image = Image.new("RGB", (512, 512), color=(15, 15, 20))

    return image, seed
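
# Smoke-test sketch (illustrative, commented out on purpose: running it would
# download a model). The keyword names match infer()'s signature above; the
# model id and prompt are arbitrary examples.
#
#   img, used_seed = infer(
#       model_id="runwayml/stable-diffusion-v1-5",
#       prompt="a lighthouse at dawn, watercolor",
#       negative_prompt="blurry, low quality",
#       seed=0, randomize_seed=True,
#       width=512, height=512,
#       guidance_scale=7.0, num_inference_steps=20,
#       scheduler_name="Euler Ancestral", clip_skip=1,
#   )
#   img.save("smoke_test.png")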
# ------------------------------------------------------------
# CSS
# ------------------------------------------------------------
css = """
@import url('https://fonts.googleapis.com/css2?family=Inter:wght@300;400;500;600&display=swap');

* { box-sizing: border-box; margin: 0; padding: 0; }
body { background: #0c0c10; color: #e0dff0; font-family: 'Inter', sans-serif; }
footer { display: none !important; }
#main { max-width: 700px; margin: 0 auto; padding: 24px 16px 48px; }

.hdr { text-align: center; margin-bottom: 24px; padding-bottom: 18px; border-bottom: 1px solid rgba(255,255,255,0.05); }
.hdr h1 { font-size: 1.4rem; font-weight: 600; color: #fff; letter-spacing: -0.02em; }
.hdr h1 span { color: #a78bfa; }
.hdr p { font-size: 0.72rem; color: rgba(255,255,255,0.25); margin-top: 3px; }

.sec { background: rgba(255,255,255,0.025); border: 1px solid rgba(255,255,255,0.055); border-radius: 11px; padding: 13px; margin-bottom: 9px; }
.sec-title { font-size: 0.63rem; font-weight: 600; text-transform: uppercase; letter-spacing: 0.1em; color: rgba(255,255,255,0.2); margin-bottom: 9px; }

.tpl-btn { background: rgba(255,255,255,0.02) !important; border: 1px solid rgba(255,255,255,0.06) !important; color: rgba(255,255,255,0.4) !important; border-radius: 7px !important; font-size: 0.71rem !important; padding: 7px 10px !important; cursor: pointer !important; text-align: left !important; transition: all 0.15s !important; }
.tpl-btn:hover { background: rgba(167,139,250,0.07) !important; border-color: rgba(167,139,250,0.2) !important; color: rgba(255,255,255,0.65) !important; }

#prompt-input textarea { background: rgba(255,255,255,0.04) !important; border: 1px solid rgba(255,255,255,0.08) !important; border-radius: 9px !important; color: #f0eeff !important; font-size: 0.88rem !important; min-height: 80px !important; }
#prompt-input textarea:focus { border-color: rgba(167,139,250,0.4) !important; }
#prompt-input label { display: none !important; }

#boost-btn { background: rgba(251,146,60,0.1) !important; border: 1px solid rgba(251,146,60,0.25) !important; color: #fb923c !important; border-radius: 8px !important; font-size: 0.75rem !important; }
#boost-btn:hover { background: rgba(251,146,60,0.2) !important; }
#random-btn { background: rgba(96,165,250,0.08) !important; border: 1px solid rgba(96,165,250,0.2) !important; color: #60a5fa !important; border-radius: 8px !important; font-size: 0.75rem !important; }

#gen-btn { background: linear-gradient(135deg, #7c3aed, #a78bfa) !important; border: none !important; border-radius: 10px !important; color: #fff !important; font-size: 0.9rem !important; font-weight: 600 !important; padding: 13px !important; box-shadow: 0 4px 18px rgba(124,58,237,0.3) !important; margin-top: 2px !important; }
#gen-btn:hover { transform: translateY(-1px) !important; box-shadow: 0 6px 24px rgba(124,58,237,0.45) !important; }

#out-img { border-radius: 10px !important; border: 1px solid rgba(255,255,255,0.07) !important; margin-top: 10px !important; }

.gr-accordion { background: rgba(255,255,255,0.02) !important; border: 1px solid rgba(255,255,255,0.06) !important; border-radius: 10px !important; margin-top: 10px !important; }
.gr-accordion .label-wrap { color: rgba(255,255,255,0.3) !important; font-size: 0.72rem !important; text-transform: uppercase !important; letter-spacing: 0.1em !important; }

label { color: rgba(255,255,255,0.35) !important; font-size: 0.72rem !important; }
select { background: rgba(255,255,255,0.05) !important; border: 1px solid rgba(255,255,255,0.1) !important; border-radius: 7px !important; color: #e0dff0 !important; }
input[type="checkbox"] { accent-color: #7c3aed !important; }

.cpu-warn { background: rgba(251,146,60,0.07); border: 1px solid rgba(251,146,60,0.18); border-radius: 8px; padding: 8px 12px; font-size: 0.7rem; color: #fb923c; margin-bottom: 10px; }
.div { height: 1px; background: rgba(255,255,255,0.04); margin: 10px 0; }

::-webkit-scrollbar { width: 3px; }
::-webkit-scrollbar-thumb { background: rgba(124,58,237,0.25); border-radius: 4px; }
"""

# ------------------------------------------------------------
# UI
# ------------------------------------------------------------
with gr.Blocks(css=css, theme=gr.themes.Base()) as demo:
    gr.HTML("""
        <div class="hdr">
            <p>Multi-model · CPU friendly · Auto-translate</p>
        </div>