Qwen-Image-2512-Fast

Paused

App Files Files Community

linoyts HF Staff committed on Dec 30, 2025

Commit

8cde3cb

verified ·

1 Parent(s): c10249f

Update app.py

Browse files

Files changed (1) hide show

app.py +34 -6

app.py CHANGED Viewed

@@ -5,7 +5,7 @@ import torch
 import spaces
 from PIL import Image
-from diffusers import QwenImagePipeline
 from qwenimage.qwen_fa3_processor import QwenDoubleStreamAttnProcessorFA3
 from optimization import optimize_pipeline_
 import os
@@ -333,8 +333,30 @@ def rewrite(input_prompt):
 dtype = torch.bfloat16
 device = "cuda" if torch.cuda.is_available() else "cpu"
 # Load the model pipeline
-pipe = QwenImagePipeline.from_pretrained("Qwen/Qwen-Image-2512", torch_dtype=dtype).to(device)
 pipe.transformer.set_attn_processor(QwenDoubleStreamAttnProcessorFA3())
 # --- Ahead-of-time compilation ---
@@ -433,7 +455,13 @@ css = """
 with gr.Blocks(css=css) as demo:
     with gr.Column(elem_id="col-container"):
-        gr.Markdown('<img src="https://qianwen-res.oss-cn-beijing.aliyuncs.com/Qwen-Image/qwen_image_logo.png" alt="Qwen-Image Logo" width="400" style="display: block; margin: 0 auto;">')
         gr.Markdown("[Learn more](https://github.com/QwenLM/Qwen-Image) about the Qwen-Image series. Try on [Qwen Chat](https://chat.qwen.ai/), or [download model](https://huggingface.co/Qwen/Qwen-Image) to run locally with ComfyUI or diffusers.")
         with gr.Row():
             prompt = gr.Text(
@@ -473,15 +501,15 @@ with gr.Blocks(css=css) as demo:
                     minimum=0.0,
                     maximum=10.0,
                     step=0.1,
-                    value=4.0,
                 )
                 num_inference_steps = gr.Slider(
                     label="Number of inference steps",
                     minimum=1,
-                    maximum=50,
                     step=1,
-                    value=50,
                 )
         gr.Examples(examples=examples, inputs=[prompt], outputs=[result, seed], fn=infer, cache_examples=False)

 import spaces
 from PIL import Image
+from diffusers import QwenImagePipeline, FlowMatchEulerDiscreteScheduler
 from qwenimage.qwen_fa3_processor import QwenDoubleStreamAttnProcessorFA3
 from optimization import optimize_pipeline_
 import os
 dtype = torch.bfloat16
 device = "cuda" if torch.cuda.is_available() else "cpu"
+scheduler_config = {
+    "base_image_seq_len": 256,
+    "base_shift": math.log(3),  # We use shift=3 in distillation
+    "invert_sigmas": False,
+    "max_image_seq_len": 8192,
+    "max_shift": math.log(3),  # We use shift=3 in distillation
+    "num_train_timesteps": 1000,
+    "shift": 1.0,
+    "shift_terminal": None,  # set shift_terminal to None
+    "stochastic_sampling": False,
+    "time_shift_type": "exponential",
+    "use_beta_sigmas": False,
+    "use_dynamic_shifting": True,
+    "use_exponential_sigmas": False,
+    "use_karras_sigmas": False,
+}
+scheduler = FlowMatchEulerDiscreteScheduler.from_config(scheduler_config)
 # Load the model pipeline
+pipe = QwenImagePipeline.from_pretrained("Qwen/Qwen-Image-2512", scheduler=scheduler, torch_dtype=dtype).to(device)
+pipe.load_lora_weights(
+    "lightx2v/Qwen-Image-Lightning", weight_name="Qwen-Image-Lightning-4steps-V2.0-bf16.safetensors"
+)
+pipe.fuse_lora()
 pipe.transformer.set_attn_processor(QwenDoubleStreamAttnProcessorFA3())
 # --- Ahead-of-time compilation ---
 with gr.Blocks(css=css) as demo:
     with gr.Column(elem_id="col-container"):
+        #gr.Markdown('<img src="https://qianwen-res.oss-cn-beijing.aliyuncs.com/Qwen-Image/qwen_image_logo.png" alt="Qwen-Image Logo" width="400" style="display: block; margin: 0 auto;">')
+        gr.HTML("""
+        <div id="logo-title">
+            <img src="https://qianwen-res.oss-cn-beijing.aliyuncs.com/Qwen-Image/qwen_image_logo.png" alt="Qwen-Image Logo" width="400" style="display: block; margin: 0 auto;">
+            <h2 style="font-style: italic;color: #5b47d1;margin-top: -33px !important;margin-left: 133px;">Fast, 4-steps with Lightining LoRA</h2>
+        </div>
+        """)
         gr.Markdown("[Learn more](https://github.com/QwenLM/Qwen-Image) about the Qwen-Image series. Try on [Qwen Chat](https://chat.qwen.ai/), or [download model](https://huggingface.co/Qwen/Qwen-Image) to run locally with ComfyUI or diffusers.")
         with gr.Row():
             prompt = gr.Text(
                     minimum=0.0,
                     maximum=10.0,
                     step=0.1,
+                    value=1.0,
                 )
                 num_inference_steps = gr.Slider(
                     label="Number of inference steps",
                     minimum=1,
+                    maximum=20,
                     step=1,
+                    value=4,
                 )
         gr.Examples(examples=examples, inputs=[prompt], outputs=[result, seed], fn=infer, cache_examples=False)