prithivMLmods committed on
Commit
d1e8913
·
verified ·
1 Parent(s): d3a73a2

update app

Browse files
Files changed (1) hide show
  1. app.py +8 -8
app.py CHANGED
@@ -349,11 +349,11 @@ css="""
349
  """
350
 
351
  with gr.Blocks() as demo:
352
- gr.Markdown("# **Molmo2 HF Demo🖥️**", elem_id="main-title")
353
- gr.Markdown("Perform multi-image QA, pointing, general video QA, and tracking using the [Molmo2](https://huggingface.co/allenai/Molmo2-8B) multimodal model.")
354
 
355
  with gr.Tabs():
356
- with gr.Tab("Images (QA & Pointing)"):
357
  with gr.Row():
358
  with gr.Column():
359
  img_input = gr.Gallery(label="Input Images", type="filepath", height=400)
@@ -367,9 +367,9 @@ with gr.Blocks() as demo:
367
  gr.Examples(
368
  examples=[
369
  [["example-images/compare1.jpg", "example-images/compare2.jpeg"], "Compare these two images."],
370
- [["example-images/cat1.jpg", "example-images/cat2.jpg", "example-images/dog1.jpg"], "Point to the cats."],
371
- [["example-images/candy.JPG"], "Point to all the candies."],
372
- [["example-images/premium_photo-1691752881339-d78da354ee7e.jpg"], "Point to the girls."],
373
  ],
374
  inputs=[img_input, img_prompt],
375
  label="Image Examples"
@@ -380,7 +380,7 @@ with gr.Blocks() as demo:
380
  outputs=[img_text_out, img_out]
381
  )
382
 
383
- with gr.Tab("Video (QA, Pointing & Tracking)"):
384
  gr.Markdown("**Note:** Video processing takes longer as frames are sampled.")
385
  with gr.Row():
386
  with gr.Column():
@@ -394,7 +394,7 @@ with gr.Blocks() as demo:
394
 
395
  gr.Examples(
396
  examples=[
397
- ["example-videos/sample_video.mp4", "Track the football."],
398
  ["example-videos/drink.mp4", "Explain the video."],
399
  ],
400
  inputs=[vid_input, vid_prompt],
 
349
  """
350
 
351
  with gr.Blocks() as demo:
352
+ gr.Markdown("# **Qwen3-VL-4B-Abliterated🔥**", elem_id="main-title")
353
+ gr.Markdown("Perform multi-image QA, general video QA, and Analysis using the [Qwen3-VL-4B-Instruct-abliterated-v1](https://huggingface.co/prithivMLmods/Qwen3-VL-4B-Instruct-abliterated-v1) multimodal model.")
354
 
355
  with gr.Tabs():
356
+ with gr.Tab("Multi-Image QA"):
357
  with gr.Row():
358
  with gr.Column():
359
  img_input = gr.Gallery(label="Input Images", type="filepath", height=400)
 
367
  gr.Examples(
368
  examples=[
369
  [["example-images/compare1.jpg", "example-images/compare2.jpeg"], "Compare these two images."],
370
+ [["example-images/cat1.jpg", "example-images/cat2.jpg", "example-images/dog1.jpg"], "Odd one out."],
371
+ [["example-images/candy.JPG"], "Mention the coordinates of the candies."],
372
+ [["example-images/premium_photo-1691752881339-d78da354ee7e.jpg"], "Analyze the image in detail."],
373
  ],
374
  inputs=[img_input, img_prompt],
375
  label="Image Examples"
 
380
  outputs=[img_text_out, img_out]
381
  )
382
 
383
+ with gr.Tab("Video QA"):
384
  gr.Markdown("**Note:** Video processing takes longer as frames are sampled.")
385
  with gr.Row():
386
  with gr.Column():
 
394
 
395
  gr.Examples(
396
  examples=[
397
+ ["example-videos/sample_video.mp4", "Analyze the football movements."],
398
  ["example-videos/drink.mp4", "Explain the video."],
399
  ],
400
  inputs=[vid_input, vid_prompt],