Spaces:

Werli
/

Multi-Tagger

Running

App Files Community

Werli committed on Apr 12, 2025

Commit

bf666fd

verified ·

1 Parent(s): e44cf4f

Update app.py

Browse files

Files changed (1) hide show

app.py +3 -5

app.py CHANGED Viewed

@@ -70,14 +70,12 @@ else:
 TITLE = "Multi-Tagger"
 DESCRIPTION = """
 Multi-Tagger is a powerful and versatile application that integrates two cutting-edge models: Waifu Diffusion and Florence 2. This app is designed to provide comprehensive image analysis and captioning capabilities, making it a valuable tool for AI artists, researchers, and enthusiasts.
 Features:
 - Supports batch processing of multiple images.
 - Tags images with multiple categories: general tags, character tags, and ratings.
 - Displays categorized tags in a structured format.
 - Includes a separate tab for image captioning using Florence 2. This model supports CUDA, MPS or CPU if one of them is available.
 - Supports various captioning tasks (e.g., Caption, Detailed Caption, Object Detection), as well it can display output text and images for tasks that generate visual outputs.
 Example image by [me.](https://huggingface.co/Werli)
 """
 colormap = ['blue','orange','green','purple','brown','pink','gray','olive','cyan','red',
@@ -215,7 +213,6 @@ class Llama3Reorganize:
         loadModel: bool = False,
     ):
         """Initializes the Llama model.
         Args:
           repoId: LLAMA model repo.
           device: Device to use for computation (cpu, cuda, ipu, xpu, mkldnn, opengl, opencl,
@@ -1023,6 +1020,7 @@ with gr.Blocks(title=TITLE, css=css, theme="Werli/Multi-Tagger", fill_width=True
                     [
                         download_file,
                         sorted_general_strings,
                         categorized,
                         rating,
                         character_res,
@@ -1037,7 +1035,7 @@ with gr.Blocks(title=TITLE, css=css, theme="Werli/Multi-Tagger", fill_width=True
             upload_button.upload(extend_gallery, inputs=[gallery, upload_button], outputs=gallery)
             # Event to update the selected image when an image is clicked in the gallery
             selected_image = gr.Textbox(label="Selected Image", visible=False)
-            gallery.select(get_selection_from_gallery, inputs=[gallery, tag_results], outputs=[selected_image, sorted_general_strings, categorized, rating, character_res, general_res, unclassified])
             # Event to remove a selected image from the gallery
             remove_button.click(remove_image_from_gallery, inputs=[gallery, selected_image], outputs=gallery)
         submit.click(
@@ -1055,7 +1053,7 @@ with gr.Blocks(title=TITLE, css=css, theme="Werli/Multi-Tagger", fill_width=True
                 additional_tags_append,
                 tag_results,
             ],
-            outputs=[download_file, sorted_general_strings, categorized, rating, character_res, general_res, unclassified, tag_results,  categorized_output,],
         )
         gr.Examples(
             [["images/1girl.png", VIT_LARGE_MODEL_DSV3_REPO, 0.35, False, 0.85, False]],

 TITLE = "Multi-Tagger"
 DESCRIPTION = """
 Multi-Tagger is a powerful and versatile application that integrates two cutting-edge models: Waifu Diffusion and Florence 2. This app is designed to provide comprehensive image analysis and captioning capabilities, making it a valuable tool for AI artists, researchers, and enthusiasts.
 Features:
 - Supports batch processing of multiple images.
 - Tags images with multiple categories: general tags, character tags, and ratings.
 - Displays categorized tags in a structured format.
 - Includes a separate tab for image captioning using Florence 2. This model supports CUDA, MPS or CPU if one of them is available.
 - Supports various captioning tasks (e.g., Caption, Detailed Caption, Object Detection), as well it can display output text and images for tasks that generate visual outputs.
 Example image by [me.](https://huggingface.co/Werli)
 """
 colormap = ['blue','orange','green','purple','brown','pink','gray','olive','cyan','red',
         loadModel: bool = False,
     ):
         """Initializes the Llama model.
         Args:
           repoId: LLAMA model repo.
           device: Device to use for computation (cpu, cuda, ipu, xpu, mkldnn, opengl, opencl,
                     [
                         download_file,
                         sorted_general_strings,
+                        categorized_output,
                         categorized,
                         rating,
                         character_res,
             upload_button.upload(extend_gallery, inputs=[gallery, upload_button], outputs=gallery)
             # Event to update the selected image when an image is clicked in the gallery
             selected_image = gr.Textbox(label="Selected Image", visible=False)
+            gallery.select(get_selection_from_gallery, inputs=[gallery, tag_results], outputs=[selected_image, sorted_general_strings, categorized, categorized_output, rating, character_res, general_res, unclassified])
             # Event to remove a selected image from the gallery
             remove_button.click(remove_image_from_gallery, inputs=[gallery, selected_image], outputs=gallery)
         submit.click(
                 additional_tags_append,
                 tag_results,
             ],
+            outputs=[download_file, sorted_general_strings, categorized, categorized_output, rating, character_res, general_res, unclassified, tag_results,  categorized_output,],
         )
         gr.Examples(
             [["images/1girl.png", VIT_LARGE_MODEL_DSV3_REPO, 0.35, False, 0.85, False]],