Qwen-Image-Edit-2509-LoRAs-Fast

Running on Zero

App Files Files Community

Opera8 committed on Dec 9, 2025

Commit

2210ab4

verified ·

1 Parent(s): ad1b5e0

Update app.py

Browse files

Files changed (1) hide show

app.py +114 -69

app.py CHANGED Viewed

@@ -8,7 +8,9 @@ from PIL import Image
 from typing import Iterable
 from gradio.themes import Soft
 from gradio.themes.utils import colors, fonts, sizes
 colors.steel_blue = colors.Color(
     name="steel_blue",
     c50="#EBF3F8",
@@ -33,7 +35,7 @@ class SteelBlueTheme(Soft):
         neutral_hue: colors.Color | str = colors.slate,
         text_size: sizes.Size | str = sizes.text_lg,
         font: fonts.Font | str | Iterable[fonts.Font | str] = (
-            fonts.GoogleFont("Outfit"), "Arial", "sans-serif",
         ),
         font_mono: fonts.Font | str | Iterable[fonts.Font | str] = (
             fonts.GoogleFont("IBM Plex Mono"), "ui-monospace", "monospace",
@@ -79,17 +81,7 @@ steel_blue_theme = SteelBlueTheme()
 device = torch.device("cuda" if torch.cuda.is_available() else "cpu")
-print("CUDA_VISIBLE_DEVICES=", os.environ.get("CUDA_VISIBLE_DEVICES"))
-print("torch.__version__ =", torch.__version__)
-print("torch.version.cuda =", torch.version.cuda)
-print("cuda available:", torch.cuda.is_available())
-print("cuda device count:", torch.cuda.device_count())
-if torch.cuda.is_available():
-    print("current device:", torch.cuda.current_device())
-    print("device name:", torch.cuda.get_device_name(torch.cuda.current_device()))
-print("Using device:", device)
 from diffusers import FlowMatchEulerDiscreteScheduler
 from qwenimage.pipeline_qwenimage_edit_plus import QwenImageEditPlusPipeline
 from qwenimage.transformer_qwenimage import QwenImageTransformer2DModel
@@ -98,10 +90,11 @@ from qwenimage.qwen_fa3_processor import QwenDoubleStreamAttnProcessorFA3
 dtype = torch.bfloat16
 device = "cuda" if torch.cuda.is_available() else "cpu"
 pipe = QwenImageEditPlusPipeline.from_pretrained(
     "Qwen/Qwen-Image-Edit-2509",
     transformer=QwenImageTransformer2DModel.from_pretrained(
-        "linoyts/Qwen-Image-Edit-Rapid-AIO", # [transformer weights extracted from: Phr00t/Qwen-Image-Edit-Rapid-AIO]
         subfolder='transformer',
         torch_dtype=dtype,
         device_map='cuda'
@@ -109,6 +102,7 @@ pipe = QwenImageEditPlusPipeline.from_pretrained(
     torch_dtype=dtype
 ).to(device)
 pipe.load_lora_weights("autoweeb/Qwen-Image-Edit-2509-Photo-to-Anime",
                        weight_name="Qwen-Image-Edit-2509-Photo-to-Anime_000001000.safetensors",
                        adapter_name="anime")
@@ -137,6 +131,31 @@ pipe.load_lora_weights("vafipas663/Qwen-Edit-2509-Upscale-LoRA",
 pipe.transformer.set_attn_processor(QwenDoubleStreamAttnProcessorFA3())
 MAX_SEED = np.iinfo(np.int32).max
 def update_dimensions_on_upload(image):
     if image is None:
         return 1024, 1024
@@ -162,7 +181,7 @@ def update_dimensions_on_upload(image):
 def infer(
     input_image,
     prompt,
-    lora_adapter,
     seed,
     randomize_seed,
     guidance_scale,
@@ -170,39 +189,34 @@ def infer(
     progress=gr.Progress(track_tqdm=True)
 ):
     if input_image is None:
-        raise gr.Error("Please upload an image to edit.")
-    if lora_adapter == "Photo-to-Anime":
-        pipe.set_adapters(["anime"], adapter_weights=[1.0])
-    elif lora_adapter == "Multiple-Angles":
-        pipe.set_adapters(["multiple-angles"], adapter_weights=[1.0])
-    elif lora_adapter == "Light-Restoration":
-        pipe.set_adapters(["light-restoration"], adapter_weights=[1.0])
-    elif lora_adapter == "Relight":
-        pipe.set_adapters(["relight"], adapter_weights=[1.0])
-    elif lora_adapter == "Multi-Angle-Lighting":
-        pipe.set_adapters(["multi-angle-lighting"], adapter_weights=[1.0])
-    elif lora_adapter == "Edit-Skin":
-        pipe.set_adapters(["edit-skin"], adapter_weights=[1.0])
-    elif lora_adapter == "Next-Scene":
-        pipe.set_adapters(["next-scene"], adapter_weights=[1.0])
-    elif lora_adapter == "Upscale-Image":
-        pipe.set_adapters(["upscale-image"], adapter_weights=[1.0])
     if randomize_seed:
         seed = random.randint(0, MAX_SEED)
     generator = torch.Generator(device=device).manual_seed(seed)
     negative_prompt = "worst quality, low quality, bad anatomy, bad hands, text, error, missing fingers, extra digit, fewer digits, cropped, jpeg artifacts, signature, watermark, username, blurry"
     original_image = input_image.convert("RGB")
-    # Use the new function to update dimensions
     width, height = update_dimensions_on_upload(original_image)
     result = pipe(
         image=original_image,
-        prompt=prompt,
         negative_prompt=negative_prompt,
         height=height,
         width=width,
@@ -218,73 +232,104 @@ def infer_example(input_image, prompt, lora_adapter):
     input_pil = input_image.convert("RGB")
     guidance_scale = 1.0
     steps = 4
     result, seed = infer(input_pil, prompt, lora_adapter, 0, True, guidance_scale, steps)
     return result, seed
 css="""
 #col-container {
     margin: 0 auto;
     max-width: 960px;
 }
-#main-title h1 {font-size: 2.1em !important;}
 """
-with gr.Blocks() as demo:
     with gr.Column(elem_id="col-container"):
-        gr.Markdown("# **Qwen-Image-Edit-2509-LoRAs-Fast**", elem_id="main-title")
-        gr.Markdown("Perform diverse image edits using specialized [LoRA](https://huggingface.co/models?other=base_model:adapter:Qwen/Qwen-Image-Edit-2509) adapters for the [Qwen-Image-Edit](https://huggingface.co/Qwen/Qwen-Image-Edit-2509) model.")
         with gr.Row(equal_height=True):
             with gr.Column():
-                input_image = gr.Image(label="Upload Image", type="pil", height=290)
                 prompt = gr.Text(
-                    label="Edit Prompt",
                     show_label=True,
-                    placeholder="e.g., transform into anime..",
                 )
-                run_button = gr.Button("Edit Image", variant="primary")
             with gr.Column():
-                output_image = gr.Image(label="Output Image", interactive=False, format="png", height=353)
                 with gr.Row():
                     lora_adapter = gr.Dropdown(
-                        label="Choose Editing Style",
-                        choices=["Photo-to-Anime", "Multiple-Angles", "Light-Restoration", "Multi-Angle-Lighting", "Upscale-Image", "Relight", "Next-Scene", "Edit-Skin"],
-                        value="Photo-to-Anime"
                     )
-                with gr.Accordion("Advanced Settings", open=False, visible=False):
-                    seed = gr.Slider(label="Seed", minimum=0, maximum=MAX_SEED, step=1, value=0)
-                    randomize_seed = gr.Checkbox(label="Randomize Seed", value=True)
-                    guidance_scale = gr.Slider(label="Guidance Scale", minimum=1.0, maximum=10.0, step=0.1, value=1.0)
-                    steps = gr.Slider(label="Inference Steps", minimum=1, maximum=50, step=1, value=4)
         gr.Examples(
             examples=[
-                ["examples/1.jpg", "Transform into anime.", "Photo-to-Anime"],
-                ["examples/5.jpg", "Remove shadows and relight the image using soft lighting.", "Light-Restoration"],
-                ["examples/4.jpg", "Use a subtle golden-hour filter with smooth light diffusion.", "Relight"],
-                ["examples/2.jpeg", "Rotate the camera 45 degrees to the left.", "Multiple-Angles"],
-                ["examples/7.jpg", "Light source from the Right Rear", "Multi-Angle-Lighting"],
-                ["examples/10.jpeg", "Upscale the image.", "Upscale-Image"],
-                ["examples/7.jpg", "Light source from the Below", "Multi-Angle-Lighting"],
-                ["examples/2.jpeg", "Switch the camera to a top-down right corner view.", "Multiple-Angles"],
-                ["examples/9.jpg", "The camera moves slightly forward as sunlight breaks through the clouds, casting a soft glow around the character's silhouette in the mist. Realistic cinematic style, atmospheric depth.", "Next-Scene"],
-                ["examples/8.jpg", "Make the subjects skin details more prominent and natural.", "Edit-Skin"],
-                ["examples/6.jpg", "Switch the camera to a bottom-up view.", "Multiple-Angles"],
-                ["examples/6.jpg", "Rotate the camera 180 degrees upside down.", "Multiple-Angles"],
-                ["examples/4.jpg", "Rotate the camera 45 degrees to the right.", "Multiple-Angles"],
-                ["examples/4.jpg", "Switch the camera to a top-down view.", "Multiple-Angles"],
-                ["examples/4.jpg", "Switch the camera to a wide-angle lens.", "Multiple-Angles"],
             ],
             inputs=[input_image, prompt, lora_adapter],
             outputs=[output_image, seed],
             fn=infer_example,
             cache_examples=False,
-            label="Examples"
         )
     run_button.click(
@@ -294,4 +339,4 @@ with gr.Blocks() as demo:
     )
 if __name__ == "__main__":
-    demo.queue(max_size=30).launch(css=css, theme=steel_blue_theme, mcp_server=True, ssr_mode=False, show_error=True)

 from typing import Iterable
 from gradio.themes import Soft
 from gradio.themes.utils import colors, fonts, sizes
+from deep_translator import GoogleTranslator  # کتابخانه ترجمه اضافه شد
+# --- تنظیمات تم ---
 colors.steel_blue = colors.Color(
     name="steel_blue",
     c50="#EBF3F8",
         neutral_hue: colors.Color | str = colors.slate,
         text_size: sizes.Size | str = sizes.text_lg,
         font: fonts.Font | str | Iterable[fonts.Font | str] = (
+            fonts.GoogleFont("Vazirmatn"), "Arial", "sans-serif", # فونت وزیر برای فارسی بهتر است
         ),
         font_mono: fonts.Font | str | Iterable[fonts.Font | str] = (
             fonts.GoogleFont("IBM Plex Mono"), "ui-monospace", "monospace",
 device = torch.device("cuda" if torch.cuda.is_available() else "cpu")
+# --- بارگذاری مدل ---
 from diffusers import FlowMatchEulerDiscreteScheduler
 from qwenimage.pipeline_qwenimage_edit_plus import QwenImageEditPlusPipeline
 from qwenimage.transformer_qwenimage import QwenImageTransformer2DModel
 dtype = torch.bfloat16
 device = "cuda" if torch.cuda.is_available() else "cpu"
+print("Loading pipeline...")
 pipe = QwenImageEditPlusPipeline.from_pretrained(
     "Qwen/Qwen-Image-Edit-2509",
     transformer=QwenImageTransformer2DModel.from_pretrained(
+        "linoyts/Qwen-Image-Edit-Rapid-AIO",
         subfolder='transformer',
         torch_dtype=dtype,
         device_map='cuda'
     torch_dtype=dtype
 ).to(device)
+# بارگذاری LoRA ها
 pipe.load_lora_weights("autoweeb/Qwen-Image-Edit-2509-Photo-to-Anime",
                        weight_name="Qwen-Image-Edit-2509-Photo-to-Anime_000001000.safetensors",
                        adapter_name="anime")
 pipe.transformer.set_attn_processor(QwenDoubleStreamAttnProcessorFA3())
 MAX_SEED = np.iinfo(np.int32).max
+# --- نگاشت نام‌های فارسی به نام‌های داخلی مدل ---
+LORA_MAPPING = {
+    "تبدیل عکس به انیمه": "anime",
+    "تغییر زاویه دید": "multiple-angles",
+    "اصلاح نور و سایه": "light-restoration",
+    "نورپردازی مجدد (Relight)": "relight",
+    "نورپردازی چند زاویه‌ای": "multi-angle-lighting",
+    "روتوش پوست": "edit-skin",
+    "صحنه بعدی (سینمایی)": "next-scene",
+    "افزایش کیفیت (Upscale)": "upscale-image"
+}
+def translate_prompt(text):
+    """Translate ``text`` to English using GoogleTranslator.
+
+    The source language is auto-detected (``source='auto'``). An empty or
+    otherwise falsy ``text`` yields ``""`` without calling the translator.
+    If the translation call raises, the error is printed and the original
+    ``text`` is returned unchanged so the caller can still proceed.
+    """
+    if not text:
+        return ""
+    try:
+        # Text that is already English may not need translating, but the 'auto' source setting handles that case
+        translated = GoogleTranslator(source='auto', target='en').translate(text)
+        print(f"Original: {text} -> Translated: {translated}")
+        return translated
+    except Exception as e:
+        print(f"Translation Error: {e}")
+        return text # on error, fall back to the original text
 def update_dimensions_on_upload(image):
     if image is None:
         return 1024, 1024
 def infer(
     input_image,
     prompt,
+    lora_adapter_persian, # ورودی نام فارسی است
     seed,
     randomize_seed,
     guidance_scale,
     progress=gr.Progress(track_tqdm=True)
 ):
     if input_image is None:
+        raise gr.Error("لطفاً یک تصویر برای ویرایش بارگذاری کنید.")
+    # ترجمه متن کاربر
+    english_prompt = translate_prompt(prompt)
+    # انتخاب آداپتور بر اساس نام فارسی
+    adapter_internal_name = LORA_MAPPING.get(lora_adapter_persian)
+    # غیرفعال کردن همه آداپتورها ابتدا (برای اطمینان)
+    # pipe.disable_lora() # متد دقیق ممکن است متفاوت باشد اما set_adapters جایگزین می‌کند
+    if adapter_internal_name:
+        pipe.set_adapters([adapter_internal_name], adapter_weights=[1.0])
     if randomize_seed:
         seed = random.randint(0, MAX_SEED)
     generator = torch.Generator(device=device).manual_seed(seed)
+    # پرامپت منفی به انگلیسی (ثابت)
     negative_prompt = "worst quality, low quality, bad anatomy, bad hands, text, error, missing fingers, extra digit, fewer digits, cropped, jpeg artifacts, signature, watermark, username, blurry"
     original_image = input_image.convert("RGB")
     width, height = update_dimensions_on_upload(original_image)
     result = pipe(
         image=original_image,
+        prompt=english_prompt, # استفاده از متن ترجمه شده
         negative_prompt=negative_prompt,
         height=height,
         width=width,
     input_pil = input_image.convert("RGB")
     guidance_scale = 1.0
     steps = 4
+    # infer به صورت خودکار ترجمه را انجام می‌دهد
     result, seed = infer(input_pil, prompt, lora_adapter, 0, True, guidance_scale, steps)
     return result, seed
+# استایل CSS برای راست‌چین کردن (RTL) و فونت فارسی
 css="""
+@import url('https://fonts.googleapis.com/css2?family=Vazirmatn:wght@400;700&display=swap');
+body, .gradio-container {
+    font-family: 'Vazirmatn', sans-serif !important;
+}
 #col-container {
     margin: 0 auto;
     max-width: 960px;
+    direction: rtl; /* راست‌چین */
+    text-align: right;
+}
+#main-title h1 {
+    font-size: 2.1em !important;
+    text-align: center;
+}
+#main-description {
+    text-align: center;
+    font-size: 1.1em;
+    margin-bottom: 20px;
+}
+/* اصلاح جهت ورودی‌ها و لیست‌ها */
+.gr-dropdown, .gr-textbox, .gr-slider, .gr-checkbox {
+    direction: rtl;
+    text-align: right;
+}
+.gr-input-label {
+    text-align: right !important;
 }
 """
+with gr.Blocks(css=css, theme=steel_blue_theme) as demo:
     with gr.Column(elem_id="col-container"):
+        gr.Markdown("# **Qwen-Image-Edit-2509: ویرایشگر هوشمند تصاویر**", elem_id="main-title")
+        gr.Markdown(
+            "ویرایش تصاویر با استفاده از مدل قدرتمند [Qwen-Image-Edit](https://huggingface.co/Qwen/Qwen-Image-Edit-2509) و آداپتورهای اختصاصی LoRA. "
+            "شما می‌توانید دستورات خود را به **فارسی** بنویسید.",
+            elem_id="main-description"
+        )
         with gr.Row(equal_height=True):
             with gr.Column():
+                input_image = gr.Image(label="بارگذاری تصویر", type="pil", height=290)
                 prompt = gr.Text(
+                    label="دستور ویرایش (به فارسی)",
                     show_label=True,
+                    placeholder="مثال: تصویر را به سبک انیمه تبدیل کن...",
+                    rtl=True # فعال کردن RTL برای ورودی متن
                 )
+                run_button = gr.Button("شروع ویرایش تصویر", variant="primary")
             with gr.Column():
+                output_image = gr.Image(label="تصویر خروجی", interactive=False, format="png", height=353)
                 with gr.Row():
                     lora_adapter = gr.Dropdown(
+                        label="انتخاب سبک ویرایش (LoRA)",
+                        choices=list(LORA_MAPPING.keys()), # نمایش نام‌های فارسی
+                        value="تبدیل عکس به انیمه"
                     )
+                with gr.Accordion("تنظیمات پیشرفته", open=False, visible=True): # Accordion visible
+                    seed = gr.Slider(label="دانه تصادفی (Seed)", minimum=0, maximum=MAX_SEED, step=1, value=0)
+                    randomize_seed = gr.Checkbox(label="استفاده از Seed تصادفی", value=True)
+                    guidance_scale = gr.Slider(label="میزان وفاداری به متن (Guidance Scale)", minimum=1.0, maximum=10.0, step=0.1, value=1.0)
+                    steps = gr.Slider(label="تعداد مراحل پردازش (Steps)", minimum=1, maximum=50, step=1, value=4)
+        # مثال‌های فارسی شده
         gr.Examples(
             examples=[
+                ["examples/1.jpg", "تبدیل به انیمه کن.", "تبدیل عکس به انیمه"],
+                ["examples/5.jpg", "سایه‌ها را حذف کن و نورپردازی نرم به تصویر بده.", "اصلاح نور و سایه"],
+                ["examples/4.jpg", "از فیلتر ساعت طلایی با پخش نور ملایم استفاده کن.", "نورپردازی مجدد (Relight)"],
+                ["examples/2.jpeg", "دوربین را ۴۵ درجه به سمت چپ بچرخان.", "تغییر زاویه دید"],
+                ["examples/7.jpg", "منبع نور را از سمت راست عقب قرار بده.", "نورپردازی چند زاویه‌ای"],
+                ["examples/10.jpeg", "کیفیت تصویر را افزایش بده (Upscale).", "افزایش کیفیت (Upscale)"],
+                ["examples/7.jpg", "منبع نور را از پایین بتابان.", "نورپردازی چند زاویه‌ای"],
+                ["examples/2.jpeg", "زاویه دوربین را به نمای بالا گوشه راست تغییر بده.", "تغییر زاویه دید"],
+                ["examples/9.jpg", "دوربین کمی به جلو حرکت می‌کند در حالی که نور خورشید از میان ابرها می‌تابد و درخششی نرم اطراف شبح شخصیت در مه ایجاد می‌کند. سبک سینمایی واقعی.", "صحنه بعدی (سینمایی)"],
+                ["examples/8.jpg", "جزئیات پوست سوژه را برجسته‌تر و طبیعی‌تر کن.", "روتوش پوست"],
+                ["examples/6.jpg", "دوربین را به نمای پایین به بالا تغییر بده.", "تغییر زاویه دید"],
             ],
             inputs=[input_image, prompt, lora_adapter],
             outputs=[output_image, seed],
             fn=infer_example,
             cache_examples=False,
+            label="نمونه‌ها"
         )
     run_button.click(
     )
 if __name__ == "__main__":
+    demo.queue(max_size=30).launch(show_error=True)