Darius Morawiec committed
Commit 053d37b · 1 Parent(s): 2ac61e9

Add video of denoising steps

Files changed (5):
  1. .gitignore +4 -0
  2. app.py +138 -78
  3. pyproject.toml +2 -1
  4. requirements.txt +4 -1
  5. uv.lock +31 -13
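
In short: app.py moves the per-step callback onto the Model class, decodes the intermediate latents to one PNG per denoising step, stitches the PNGs into an MP4 with OpenCV, and returns the video alongside the final image through a new gr.Video output. A minimal standalone sketch of the stitching half, assuming frames named step_*.png as in this commit (the helper images_to_video is illustrative, not code from the commit):

from pathlib import Path

import cv2

def images_to_video(images_dir: Path, video_path: Path, fps: int = 10) -> None:
    # Collect the per-step frames written by the pipeline callback, in step order.
    frames = sorted(images_dir.glob("step_*.png"))
    if not frames:
        return
    # All frames share the dimensions of the decoded latents, so size the
    # writer from the first one.
    height, width, _ = cv2.imread(str(frames[0])).shape
    writer = cv2.VideoWriter(
        str(video_path), cv2.VideoWriter_fourcc(*"mp4v"), fps, (width, height)
    )
    for frame in frames:
        writer.write(cv2.imread(str(frame)))
    writer.release()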
.gitignore CHANGED
@@ -1,3 +1,7 @@
+.gradio
+.vscode
+output
+
 # Created by https://www.toptal.com/developers/gitignore/api/linux,macos,dotenv,python,windows,intellij,visualstudio,visualstudiocode
 # Edit at https://www.toptal.com/developers/gitignore?templates=linux,macos,dotenv,python,windows,intellij,visualstudio,visualstudiocode
 
app.py CHANGED
@@ -1,13 +1,14 @@
-# from pathlib import Path
-
+import shutil
+import time
 from pathlib import Path
 
+import cv2
 import gradio as gr
 import PIL.Image
 import torch
 from diffusers import (
     DiffusionPipeline,  # type: ignore
-    QwenImageEditPlusPipeline,
+    QwenImageEditPlusPipeline,  # type: ignore
 )
 
 # from diffusers.utils import load_image
@@ -20,49 +21,18 @@ RANK = 128
 TRANSFORMER_ID = f"nunchaku-tech/nunchaku-qwen-image-edit-2509/svdq-{get_precision()}_r{RANK}-qwen-image-edit-2509.safetensors"
 PIPELINE_ID = "Qwen/Qwen-Image-Edit-2509"
 
-
-def callback(
-    pipeline: DiffusionPipeline,
-    step: int,
-    timestep: int,
-    callback_kwargs: dict,
-):
-    print(f"Step {step}, Timestep {timestep}, Kwargs: {callback_kwargs.keys()}")
-    latents = callback_kwargs.get("latents", None)
-
-    height = callback_kwargs.get("height", 800)
-    width = callback_kwargs.get("width", 512)
-
-    if latents is not None:
-        print(f"Latents shape: {latents.shape}, dtype: {latents.dtype}")
-
-        latents = pipeline._unpack_latents(
-            latents, height, width, pipeline.vae_scale_factor
-        )
-        latents = latents.to(pipeline.vae.dtype)
-        latents_mean = (
-            torch.tensor(pipeline.vae.config.latents_mean)
-            .view(1, pipeline.vae.config.z_dim, 1, 1, 1)
-            .to(latents.device, latents.dtype)
-        )
-        latents_std = 1.0 / torch.tensor(pipeline.vae.config.latents_std).view(
-            1, pipeline.vae.config.z_dim, 1, 1, 1
-        ).to(latents.device, latents.dtype)
-        latents = latents / latents_std + latents_mean
-        image = pipeline.vae.decode(latents, return_dict=False)[0][:, :, 0]
-        image = pipeline.image_processor.postprocess(image, output_type="pil")
-        image = image[0]
-
-        image_filename = f"step_{step:03d}_t{timestep}.png"
-        output_dir = Path(__file__).parent / "output"
-        output_dir.mkdir(parents=True, exist_ok=True)
-        image.save(output_dir / image_filename)
-
-    return {}
+OUTPUT_DIR = Path(__file__).parent / "output"
+IMAGES_DIR = OUTPUT_DIR / "images"
+IMAGES_DIR.mkdir(parents=True, exist_ok=True)
+VIDEO_PATH = OUTPUT_DIR / "video.mp4"
 
 
 class Model:
     def __init__(self):
+        self.progress = gr.Progress()
+        self.num_inference_steps = 50
+        self.current_inference_step = 0
+
         transformer = NunchakuQwenImageTransformer2DModel.from_pretrained(
             TRANSFORMER_ID
         )
@@ -95,7 +65,14 @@ class Model:
         num_inference_steps: int = 40,
         image_width: int = 512,
         image_height: int = 512,
-    ) -> PIL.Image.Image:
+    ) -> tuple[PIL.Image.Image, Path]:
+        self.num_inference_steps = num_inference_steps
+        self.current_inference_step = 0
+        self.progress((self.current_inference_step, self.num_inference_steps))
+
+        shutil.rmtree(IMAGES_DIR, ignore_errors=True)
+        IMAGES_DIR.mkdir(parents=True, exist_ok=True)
+
         # Validate inputs
         if not images:
             raise gr.Error("No images provided. Please upload at least one image.")
@@ -116,49 +93,81 @@ class Model:
             width=image_width,
             height=image_height,
             generator=torch.manual_seed(0),
-            callback_on_step_end=callback,
+            callback_on_step_end=self.callback,
             # output_type="latent"
         )
         output = self.pipeline(**inputs)
         output_image = output.images[0]
-        return output_image
 
+        # Create video from saved images
+
+        print(list(IMAGES_DIR.glob("*.png")))
+
+        # Get all PNG files and sort them
+        image_files = sorted(IMAGES_DIR.glob("step_*.png"))
+
+        if image_files:
+            # Read first image to get dimensions
+            first_img = cv2.imread(str(image_files[0]))
+            height, width, _ = first_img.shape
+
+            # Create video writer
+            fourcc = cv2.VideoWriter_fourcc(*"mp4v")
+            fps = 10  # Adjust frame rate as needed
+            video_writer = cv2.VideoWriter(
+                str(VIDEO_PATH.absolute()), fourcc, fps, (width, height)
+            )
+
+            # Add each image to video
+            for img_path in image_files:
+                img = cv2.imread(str(img_path))
+                video_writer.write(img)
+
+            video_writer.release()
+            print(f"Video saved to: {VIDEO_PATH}")
+
+        time.sleep(3)
+
+        return output_image, VIDEO_PATH
-
-
-model = Model()
-
-
-def process_images(
-    images,
-    prompt,
-    negative_prompt,
-    true_cfg_scale,
-    num_inference_steps,
-    image_width,
-    image_height,
-):
-    """Wrapper function to handle errors gracefully"""
-
-    pil_images = []
-
-    for contents in images:
-        for content in contents:
-            if isinstance(content, PIL.Image.Image):
-                pil_images.append(content)
-            break
-
-    try:
-        return model.compute(
-            pil_images,
-            prompt,
-            negative_prompt,
-            true_cfg_scale,
-            num_inference_steps,
-            image_width,
-            image_height,
-        )
-    except Exception as e:
-        print(f"Error processing images: {e}")
-        raise gr.Error(f"Failed to process images: {str(e)}")
+
+    def callback(
+        self,
+        pipeline: DiffusionPipeline,
+        step: int,
+        timestep: int,
+        callback_kwargs: dict,
+    ):
+        latents = callback_kwargs.get("latents", None)
+
+        height = callback_kwargs.get("height", 800)
+        width = callback_kwargs.get("width", 512)
+
+        if latents is not None:
+            print(f"Latents shape: {latents.shape}, dtype: {latents.dtype}")
+
+            latents = pipeline._unpack_latents(
+                latents, height, width, pipeline.vae_scale_factor
+            )
+            latents = latents.to(pipeline.vae.dtype)
+            latents_mean = (
+                torch.tensor(pipeline.vae.config.latents_mean)
+                .view(1, pipeline.vae.config.z_dim, 1, 1, 1)
+                .to(latents.device, latents.dtype)
+            )
+            latents_std = 1.0 / torch.tensor(pipeline.vae.config.latents_std).view(
+                1, pipeline.vae.config.z_dim, 1, 1, 1
+            ).to(latents.device, latents.dtype)
+            latents = latents / latents_std + latents_mean
+            image = pipeline.vae.decode(latents, return_dict=False)[0][:, :, 0]
+            image = pipeline.image_processor.postprocess(image, output_type="pil")
+            image = image[0]
+
+            image.save(IMAGES_DIR / f"step_{step:03d}.png")
+
+            self.current_inference_step += 1
+            self.progress((self.current_inference_step, self.num_inference_steps))
+
+        return {}
 
 
 with gr.Blocks() as demo:
@@ -189,6 +198,18 @@ with gr.Blocks() as demo:
                 format="png",
             )
 
+        with gr.Column():
+            gr.Markdown("## Output Video")
+
+            video_output = gr.Video(
+                label="Output Video",
+                format="mp4",
+                show_download_button=True,
+                streaming=True,
+                autoplay=True,
+                loop=False,
+            )
+
     with gr.Row():
         with gr.Column():
             gr.Markdown("## Prompts")
@@ -210,8 +231,8 @@ with gr.Blocks() as demo:
 
             num_inference_steps = gr.Slider(
                 1,
-                100,
-                value=40,
+                300,
+                value=50,
                 step=1,
                 interactive=True,
                 label="Number of denoising steps:",
@@ -238,6 +259,41 @@ with gr.Blocks() as demo:
     with gr.Row():
         run_button = gr.Button("Run")
 
+    model = Model()
+
+    def process_images(
+        images,
+        prompt,
+        negative_prompt,
+        true_cfg_scale,
+        num_inference_steps,
+        image_width,
+        image_height,
+    ):
+        """Wrapper function to handle errors gracefully"""
+
+        pil_images = []
+
+        for contents in images:
+            for content in contents:
+                if isinstance(content, PIL.Image.Image):
+                    pil_images.append(content)
+                break
+
+        try:
+            return model.compute(
+                pil_images,
+                prompt,
+                negative_prompt,
+                true_cfg_scale,
+                num_inference_steps,
+                image_width,
+                image_height,
+            )
+        except Exception as e:
+            print(f"Error processing images: {e}")
+            raise gr.Error(f"Failed to process images: {str(e)}")
+
     # Connect the button to the detection function
     run_button.click(
         fn=process_images,
@@ -252,9 +308,13 @@ with gr.Blocks() as demo:
         ],
         outputs=[
             image_output,
+            video_output,
         ],
     )
 
 
 if __name__ == "__main__":
-    demo.launch()
+    demo.launch(
+        allowed_paths=["output/video.mp4"],
+        share=True,
+    )
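
For context on the other half of the change: diffusers invokes callback_on_step_end after every denoising step with the pipeline, the step index, the current timestep, and a dict of requested tensors ("latents" is among the defaults), and expects a dict of tensor overrides back (empty to change nothing). A minimal sketch of that contract, with pipeline loading elided and save_frame as an illustrative name:

from diffusers import DiffusionPipeline

def save_frame(
    pipeline: DiffusionPipeline, step: int, timestep: int, callback_kwargs: dict
) -> dict:
    # Runs after each denoising step; the commit's Model.callback does its
    # latent decoding and PNG writing at exactly this point.
    latents = callback_kwargs.get("latents")
    if latents is not None:
        print(f"step {step}, timestep {timestep}, latents {tuple(latents.shape)}")
    return {}  # no tensor overrides

# Usage (assumes a loaded pipeline):
# pipe = QwenImageEditPlusPipeline.from_pretrained(PIPELINE_ID, ...)
# pipe(image=..., prompt="...", callback_on_step_end=save_frame)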
pyproject.toml CHANGED
@@ -7,7 +7,8 @@ dependencies = [
     "nunchaku",
     "torch~=2.7.0",
     "transformers[torch]>=4.57.0",
-    "gradio~=5.49.1"
+    "gradio~=5.49.1",
+    "opencv-python-headless>=4.12.0.88",
 ]
 
 [tool.uv.sources]
requirements.txt CHANGED
@@ -101,11 +101,12 @@ mpmath==1.3.0
     # via sympy
 networkx==3.5
     # via torch
-numpy==2.3.3
+numpy==2.2.6
     # via
     #   accelerate
     #   diffusers
     #   gradio
+    #   opencv-python-headless
     #   pandas
     #   peft
     #   torchvision
@@ -149,6 +150,8 @@ nvidia-nvjitlink-cu12==12.6.85
     #   torch
 nvidia-nvtx-cu12==12.6.77
     # via torch
+opencv-python-headless==4.12.0.88
+    # via nunchaku-qwen-image-edit-2509 (pyproject.toml)
 orjson==3.11.3
     # via gradio
 packaging==25.0
uv.lock CHANGED
@@ -423,21 +423,20 @@ wheels = [
 
 [[package]]
 name = "numpy"
-version = "2.3.3"
+version = "2.2.6"
 source = { registry = "https://pypi.org/simple" }
-sdist = { url = "https://files.pythonhosted.org/packages/d0/19/95b3d357407220ed24c139018d2518fab0a61a948e68286a25f1a4d049ff/numpy-2.3.3.tar.gz", hash = "sha256:ddc7c39727ba62b80dfdbedf400d1c10ddfa8eefbd7ec8dcb118be8b56d31029", size = 20576648, upload-time = "2025-09-09T16:54:12.543Z" }
+sdist = { url = "https://files.pythonhosted.org/packages/76/21/7d2a95e4bba9dc13d043ee156a356c0a8f0c6309dff6b21b4d71a073b8a8/numpy-2.2.6.tar.gz", hash = "sha256:e29554e2bef54a90aa5cc07da6ce955accb83f21ab5de01a62c8478897b264fd", size = 20276440, upload-time = "2025-05-17T22:38:04.611Z" }
 wheels = [
-    { url = "https://files.pythonhosted.org/packages/51/5d/bb7fc075b762c96329147799e1bcc9176ab07ca6375ea976c475482ad5b3/numpy-2.3.3-cp312-cp312-macosx_10_13_x86_64.whl", hash = "sha256:cfdd09f9c84a1a934cde1eec2267f0a43a7cd44b2cca4ff95b7c0d14d144b0bf", size = 20957014, upload-time = "2025-09-09T15:56:29.966Z" },
-    { url = "https://files.pythonhosted.org/packages/6b/0e/c6211bb92af26517acd52125a237a92afe9c3124c6a68d3b9f81b62a0568/numpy-2.3.3-cp312-cp312-macosx_11_0_arm64.whl", hash = "sha256:cb32e3cf0f762aee47ad1ddc6672988f7f27045b0783c887190545baba73aa25", size = 14185220, upload-time = "2025-09-09T15:56:32.175Z" },
-    { url = "https://files.pythonhosted.org/packages/22/f2/07bb754eb2ede9073f4054f7c0286b0d9d2e23982e090a80d478b26d35ca/numpy-2.3.3-cp312-cp312-macosx_14_0_arm64.whl", hash = "sha256:396b254daeb0a57b1fe0ecb5e3cff6fa79a380fa97c8f7781a6d08cd429418fe", size = 5113918, upload-time = "2025-09-09T15:56:34.175Z" },
-    { url = "https://files.pythonhosted.org/packages/81/0a/afa51697e9fb74642f231ea36aca80fa17c8fb89f7a82abd5174023c3960/numpy-2.3.3-cp312-cp312-macosx_14_0_x86_64.whl", hash = "sha256:067e3d7159a5d8f8a0b46ee11148fc35ca9b21f61e3c49fbd0a027450e65a33b", size = 6647922, upload-time = "2025-09-09T15:56:36.149Z" },
-    { url = "https://files.pythonhosted.org/packages/5d/f5/122d9cdb3f51c520d150fef6e87df9279e33d19a9611a87c0d2cf78a89f4/numpy-2.3.3-cp312-cp312-manylinux_2_27_aarch64.manylinux_2_28_aarch64.whl", hash = "sha256:1c02d0629d25d426585fb2e45a66154081b9fa677bc92a881ff1d216bc9919a8", size = 14281991, upload-time = "2025-09-09T15:56:40.548Z" },
-    { url = "https://files.pythonhosted.org/packages/51/64/7de3c91e821a2debf77c92962ea3fe6ac2bc45d0778c1cbe15d4fce2fd94/numpy-2.3.3-cp312-cp312-manylinux_2_27_x86_64.manylinux_2_28_x86_64.whl", hash = "sha256:d9192da52b9745f7f0766531dcfa978b7763916f158bb63bdb8a1eca0068ab20", size = 16641643, upload-time = "2025-09-09T15:56:43.343Z" },
-    { url = "https://files.pythonhosted.org/packages/30/e4/961a5fa681502cd0d68907818b69f67542695b74e3ceaa513918103b7e80/numpy-2.3.3-cp312-cp312-musllinux_1_2_aarch64.whl", hash = "sha256:cd7de500a5b66319db419dc3c345244404a164beae0d0937283b907d8152e6ea", size = 16056787, upload-time = "2025-09-09T15:56:46.141Z" },
-    { url = "https://files.pythonhosted.org/packages/99/26/92c912b966e47fbbdf2ad556cb17e3a3088e2e1292b9833be1dfa5361a1a/numpy-2.3.3-cp312-cp312-musllinux_1_2_x86_64.whl", hash = "sha256:93d4962d8f82af58f0b2eb85daaf1b3ca23fe0a85d0be8f1f2b7bb46034e56d7", size = 18579598, upload-time = "2025-09-09T15:56:49.844Z" },
-    { url = "https://files.pythonhosted.org/packages/17/b6/fc8f82cb3520768718834f310c37d96380d9dc61bfdaf05fe5c0b7653e01/numpy-2.3.3-cp312-cp312-win32.whl", hash = "sha256:5534ed6b92f9b7dca6c0a19d6df12d41c68b991cef051d108f6dbff3babc4ebf", size = 6320800, upload-time = "2025-09-09T15:56:52.499Z" },
-    { url = "https://files.pythonhosted.org/packages/32/ee/de999f2625b80d043d6d2d628c07d0d5555a677a3cf78fdf868d409b8766/numpy-2.3.3-cp312-cp312-win_amd64.whl", hash = "sha256:497d7cad08e7092dba36e3d296fe4c97708c93daf26643a1ae4b03f6294d30eb", size = 12786615, upload-time = "2025-09-09T15:56:54.422Z" },
-    { url = "https://files.pythonhosted.org/packages/49/6e/b479032f8a43559c383acb20816644f5f91c88f633d9271ee84f3b3a996c/numpy-2.3.3-cp312-cp312-win_arm64.whl", hash = "sha256:ca0309a18d4dfea6fc6262a66d06c26cfe4640c3926ceec90e57791a82b6eee5", size = 10195936, upload-time = "2025-09-09T15:56:56.541Z" },
+    { url = "https://files.pythonhosted.org/packages/82/5d/c00588b6cf18e1da539b45d3598d3557084990dcc4331960c15ee776ee41/numpy-2.2.6-cp312-cp312-macosx_10_13_x86_64.whl", hash = "sha256:41c5a21f4a04fa86436124d388f6ed60a9343a6f767fced1a8a71c3fbca038ff", size = 20875348, upload-time = "2025-05-17T21:34:39.648Z" },
+    { url = "https://files.pythonhosted.org/packages/66/ee/560deadcdde6c2f90200450d5938f63a34b37e27ebff162810f716f6a230/numpy-2.2.6-cp312-cp312-macosx_11_0_arm64.whl", hash = "sha256:de749064336d37e340f640b05f24e9e3dd678c57318c7289d222a8a2f543e90c", size = 14119362, upload-time = "2025-05-17T21:35:01.241Z" },
+    { url = "https://files.pythonhosted.org/packages/3c/65/4baa99f1c53b30adf0acd9a5519078871ddde8d2339dc5a7fde80d9d87da/numpy-2.2.6-cp312-cp312-macosx_14_0_arm64.whl", hash = "sha256:894b3a42502226a1cac872f840030665f33326fc3dac8e57c607905773cdcde3", size = 5084103, upload-time = "2025-05-17T21:35:10.622Z" },
+    { url = "https://files.pythonhosted.org/packages/cc/89/e5a34c071a0570cc40c9a54eb472d113eea6d002e9ae12bb3a8407fb912e/numpy-2.2.6-cp312-cp312-macosx_14_0_x86_64.whl", hash = "sha256:71594f7c51a18e728451bb50cc60a3ce4e6538822731b2933209a1f3614e9282", size = 6625382, upload-time = "2025-05-17T21:35:21.414Z" },
+    { url = "https://files.pythonhosted.org/packages/f8/35/8c80729f1ff76b3921d5c9487c7ac3de9b2a103b1cd05e905b3090513510/numpy-2.2.6-cp312-cp312-manylinux_2_17_aarch64.manylinux2014_aarch64.whl", hash = "sha256:f2618db89be1b4e05f7a1a847a9c1c0abd63e63a1607d892dd54668dd92faf87", size = 14018462, upload-time = "2025-05-17T21:35:42.174Z" },
+    { url = "https://files.pythonhosted.org/packages/8c/3d/1e1db36cfd41f895d266b103df00ca5b3cbe965184df824dec5c08c6b803/numpy-2.2.6-cp312-cp312-manylinux_2_17_x86_64.manylinux2014_x86_64.whl", hash = "sha256:fd83c01228a688733f1ded5201c678f0c53ecc1006ffbc404db9f7a899ac6249", size = 16527618, upload-time = "2025-05-17T21:36:06.711Z" },
+    { url = "https://files.pythonhosted.org/packages/61/c6/03ed30992602c85aa3cd95b9070a514f8b3c33e31124694438d88809ae36/numpy-2.2.6-cp312-cp312-musllinux_1_2_aarch64.whl", hash = "sha256:37c0ca431f82cd5fa716eca9506aefcabc247fb27ba69c5062a6d3ade8cf8f49", size = 15505511, upload-time = "2025-05-17T21:36:29.965Z" },
+    { url = "https://files.pythonhosted.org/packages/b7/25/5761d832a81df431e260719ec45de696414266613c9ee268394dd5ad8236/numpy-2.2.6-cp312-cp312-musllinux_1_2_x86_64.whl", hash = "sha256:fe27749d33bb772c80dcd84ae7e8df2adc920ae8297400dabec45f0dedb3f6de", size = 18313783, upload-time = "2025-05-17T21:36:56.883Z" },
+    { url = "https://files.pythonhosted.org/packages/57/0a/72d5a3527c5ebffcd47bde9162c39fae1f90138c961e5296491ce778e682/numpy-2.2.6-cp312-cp312-win32.whl", hash = "sha256:4eeaae00d789f66c7a25ac5f34b71a7035bb474e679f410e5e1a94deb24cf2d4", size = 6246506, upload-time = "2025-05-17T21:37:07.368Z" },
+    { url = "https://files.pythonhosted.org/packages/36/fa/8c9210162ca1b88529ab76b41ba02d433fd54fecaf6feb70ef9f124683f1/numpy-2.2.6-cp312-cp312-win_amd64.whl", hash = "sha256:c1f9540be57940698ed329904db803cf7a402f3fc200bfe599334c9bd84a40b2", size = 12614190, upload-time = "2025-05-17T21:37:26.213Z" },
 ]
 
 [[package]]
@@ -531,6 +530,7 @@ dependencies = [
     { name = "diffusers" },
     { name = "gradio" },
     { name = "nunchaku" },
+    { name = "opencv-python-headless" },
     { name = "torch" },
     { name = "transformers", extra = ["torch"] },
 ]
@@ -540,6 +540,7 @@ requires-dist = [
     { name = "diffusers", git = "https://github.com/huggingface/diffusers?rev=a519272d97f011332588e1aaa73d32952d80f3f5" },
     { name = "gradio", specifier = "~=5.49.1" },
     { name = "nunchaku", url = "https://github.com/nunchaku-tech/nunchaku/releases/download/v1.0.1/nunchaku-1.0.1+torch2.7-cp312-cp312-linux_x86_64.whl" },
+    { name = "opencv-python-headless", specifier = ">=4.12.0.88" },
     { name = "torch", specifier = "~=2.7.0" },
     { name = "transformers", extras = ["torch"], specifier = ">=4.57.0" },
 ]
@@ -677,6 +678,23 @@ wheels = [
     { url = "https://files.pythonhosted.org/packages/9e/4e/0d0c945463719429b7bd21dece907ad0bde437a2ff12b9b12fee94722ab0/nvidia_nvtx_cu12-12.6.77-py3-none-manylinux2014_x86_64.whl", hash = "sha256:6574241a3ec5fdc9334353ab8c479fe75841dbe8f4532a8fc97ce63503330ba1", size = 89265, upload-time = "2024-10-01T17:00:38.172Z" },
 ]
 
+[[package]]
+name = "opencv-python-headless"
+version = "4.12.0.88"
+source = { registry = "https://pypi.org/simple" }
+dependencies = [
+    { name = "numpy" },
+]
+sdist = { url = "https://files.pythonhosted.org/packages/a4/63/6861102ec149c3cd298f4d1ea7ce9d6adbc7529221606ff1dab991a19adb/opencv-python-headless-4.12.0.88.tar.gz", hash = "sha256:cfdc017ddf2e59b6c2f53bc12d74b6b0be7ded4ec59083ea70763921af2b6c09", size = 95379675, upload-time = "2025-07-07T09:21:06.815Z" }
+wheels = [
+    { url = "https://files.pythonhosted.org/packages/f7/7d/414e243c5c8216a5277afd104a319cc1291c5e23f5eeef512db5629ee7f4/opencv_python_headless-4.12.0.88-cp37-abi3-macosx_13_0_arm64.whl", hash = "sha256:1e58d664809b3350c1123484dd441e1667cd7bed3086db1b9ea1b6f6cb20b50e", size = 37877864, upload-time = "2025-07-07T09:14:41.693Z" },
+    { url = "https://files.pythonhosted.org/packages/05/14/7e162714beed1cd5e7b5eb66fcbcba2f065c51b1d9da2463024c84d2f7c0/opencv_python_headless-4.12.0.88-cp37-abi3-macosx_13_0_x86_64.whl", hash = "sha256:365bb2e486b50feffc2d07a405b953a8f3e8eaa63865bc650034e5c71e7a5154", size = 57326608, upload-time = "2025-07-07T09:14:51.885Z" },
+    { url = "https://files.pythonhosted.org/packages/69/4e/116720df7f1f7f3b59abc608ca30fbec9d2b3ae810afe4e4d26483d9dfa0/opencv_python_headless-4.12.0.88-cp37-abi3-manylinux2014_aarch64.manylinux_2_17_aarch64.whl", hash = "sha256:aeb4b13ecb8b4a0beb2668ea07928160ea7c2cd2d9b5ef571bbee6bafe9cc8d0", size = 33145800, upload-time = "2025-07-07T09:15:00.367Z" },
+    { url = "https://files.pythonhosted.org/packages/89/53/e19c21e0c4eb1275c3e2c97b081103b6dfb3938172264d283a519bf728b9/opencv_python_headless-4.12.0.88-cp37-abi3-manylinux2014_x86_64.manylinux_2_17_x86_64.whl", hash = "sha256:236c8df54a90f4d02076e6f9c1cc763d794542e886c576a6fee46ec8ff75a7a9", size = 54023419, upload-time = "2025-07-07T09:15:10.164Z" },
+    { url = "https://files.pythonhosted.org/packages/bf/9c/a76fd5414de6ec9f21f763a600058a0c3e290053cea87e0275692b1375c0/opencv_python_headless-4.12.0.88-cp37-abi3-win32.whl", hash = "sha256:fde2cf5c51e4def5f2132d78e0c08f9c14783cd67356922182c6845b9af87dbd", size = 30225230, upload-time = "2025-07-07T09:15:17.045Z" },
+    { url = "https://files.pythonhosted.org/packages/f2/35/0858e9e71b36948eafbc5e835874b63e515179dc3b742cbe3d76bc683439/opencv_python_headless-4.12.0.88-cp37-abi3-win_amd64.whl", hash = "sha256:86b413bdd6c6bf497832e346cd5371995de148e579b9774f8eba686dee3f5528", size = 38923559, upload-time = "2025-07-07T09:15:25.229Z" },
+]
+
 [[package]]
 name = "orjson"
 version = "3.11.3"