Spaces:

bakyt92
/

Image_manager

Sleeping

App Files Files Community

bakyt92 committed on Jun 22, 2025

Commit

978622c

1 Parent(s): 18839b3

Update app.py - add Pillow

Browse files

Files changed (1) hide show

app.py +113 -50

app.py CHANGED Viewed

@@ -1,9 +1,8 @@
 import gradio as gr
 import requests
-from PIL import Image
 import io
 import openai
-from gradio_image_annotation import image_annotator
 # Image Generation Functions
 def generate_ideogram_image(api_key, prompt, aspect_ratio="ASPECT_1_1"):
@@ -73,21 +72,70 @@ def process_uploaded_image(image):
         return None, "No image uploaded"
     return image, "Image uploaded successfully!"
-# Image Annotation Functions
-def get_annotations_json(annotations):
-    """Extract annotations as JSON"""
-    return annotations.get("boxes", [])
-def save_annotated_image(annotations):
-    """Return the annotated image"""
-    if annotations and annotations.get("image") is not None:
-        return annotations["image"]
-    return None
 # Create the Gradio Interface
-with gr.Blocks(title="AI Image Generator & Annotator MCP Server") as demo:
-    gr.Markdown("# 🎨 AI Image Generator & Annotator")
-    gr.Markdown("Generate images with AI or upload your own, then add annotations!")
     # Tab 1: Image Generation
     with gr.Tab("🖼️ Image Generation", id="generation_tab"):
@@ -161,56 +209,71 @@ with gr.Blocks(title="AI Image Generator & Annotator MCP Server") as demo:
             outputs=[generated_image, status_message]
         )
-    # Tab 2: Image Annotation
-    with gr.Tab("📝 Image Annotation", id="annotation_tab"):
-        gr.Markdown("## Add Signs and Annotations to Images")
-        gr.Markdown("Upload an image or use one from the generation tab, then add bounding boxes and labels.")
         with gr.Row():
             with gr.Column():
-                # Image annotation component
-                annotator = image_annotator(
-                    label="Image Annotator",
-                    label_list=["Person", "Object", "Vehicle", "Animal", "Building", "Sign", "Text", "Custom"],
-                    label_colors=[
-                        (255, 0, 0),    # Red for Person
-                        (0, 255, 0),    # Green for Object
-                        (0, 0, 255),    # Blue for Vehicle
-                        (255, 255, 0),  # Yellow for Animal
-                        (255, 0, 255),  # Magenta for Building
-                        (0, 255, 255),  # Cyan for Sign
-                        (128, 0, 128),  # Purple for Text
-                        (255, 165, 0)   # Orange for Custom
                     ],
-                    image_type="pil"
                 )
                 with gr.Row():
-                    get_annotations_btn = gr.Button("📊 Get Annotations", variant="secondary")
-                    save_image_btn = gr.Button("💾 Save Annotated Image", variant="primary")
             with gr.Column():
-                # Outputs
-                annotated_output = gr.Image(label="Annotated Image")
-                annotations_json = gr.JSON(label="Annotations Data")
-        # Event handlers for Tab 2
-        get_annotations_btn.click(
-            get_annotations_json,
-            inputs=[annotator],
-            outputs=[annotations_json]
-        )
-        save_image_btn.click(
-            save_annotated_image,
-            inputs=[annotator],
-            outputs=[annotated_output]
         )
-# Launch as MCP Server
 if __name__ == "__main__":
     demo.launch(
-        share=True,       # Create public link for testing
         server_name="0.0.0.0",
         server_port=7860
     )

 import gradio as gr
 import requests
+from PIL import Image, ImageDraw, ImageFont
 import io
 import openai
 # Image Generation Functions
 def generate_ideogram_image(api_key, prompt, aspect_ratio="ASPECT_1_1"):
         return None, "No image uploaded"
     return image, "Image uploaded successfully!"
+# Text Overlay Functions
# Vertical anchor of each text line, as a fraction of the image height,
# keyed by layout slug. Every line is centred horizontally.
_TEXT_LAYOUTS = {
    "2-lines-top": (0.10, 0.20),
    "2-lines-center": (0.45, 0.55),
    "2-lines-bottom": (0.80, 0.90),
    "3-lines-top": (0.10, 0.20, 0.30),
    "3-lines-center": (0.40, 0.50, 0.60),
    "3-lines-bottom": (0.70, 0.80, 0.90),
}

# Font files tried in order; the first one that loads is used.
_FONT_CANDIDATES = (
    "DejaVuSans-Bold.ttf",
    "arial.ttf",  # Windows
    "/System/Library/Fonts/Arial.ttf",  # macOS
    "/usr/share/fonts/truetype/dejavu/DejaVuSans-Bold.ttf",  # Linux
)


def _normalize_pattern(pattern):
    """Reduce a layout name to slug form, e.g. "2 lines - Top" -> "2-lines-top"."""
    if not isinstance(pattern, str):
        return None
    # Treat hyphens and whitespace alike so that both the slug and the
    # human-readable label collapse to the same key.
    return "-".join(pattern.lower().replace("-", " ").split())


def _load_overlay_font(font_size):
    """Return the first candidate font that loads, else PIL's default font."""
    for candidate in _FONT_CANDIDATES:
        try:
            return ImageFont.truetype(candidate, font_size)
        except OSError:  # IOError is an alias of OSError on Python 3
            continue
    # Last resort; note that font_size is not passed to the default font.
    return ImageFont.load_default()


def add_text_to_image(img, pattern, line1, line2, line3, font_size, color):
    """Overlay 2- or 3-line text on the image in a preset layout.

    Args:
        img: Source image. A PIL image is used as-is; anything else is
            handed to ``Image.fromarray`` (Gradio's ``gr.Image`` delivers
            numpy arrays unless it is configured with ``type="pil"``).
        pattern: Layout name. Accepted either as a slug ("2-lines-top") or
            as the matching label ("2 lines - Top"). The Dropdown that feeds
            this function lists its choices as (slug, label) tuples, and
            Gradio forwards the second tuple element, so the label form is
            what actually arrives from the UI.
        line1, line2, line3: Text lines. Blank or ``None`` lines are skipped;
            ``line3`` is ignored by the 2-line layouts.
        font_size: Font size in points; coerced to ``int``.
        color: Fill colour in any form PIL accepts (e.g. "#FFFFFF").

    Returns:
        An ``(image, status_message)`` tuple. ``image`` is ``None`` when no
        image was supplied, and the untouched input when ``pattern`` is not a
        known layout; otherwise it is a new image in the input's mode.
    """
    if img is None:
        return None, "Please supply an image first."

    # Validate the layout before doing any image work, so an unknown pattern
    # is reported instead of silently drawing nothing and claiming success.
    fractions = _TEXT_LAYOUTS.get(_normalize_pattern(pattern))
    if fractions is None:
        return img, f"Unknown layout pattern: {pattern!r}"

    if not isinstance(img, Image.Image):
        img = Image.fromarray(img)

    # Draw on an RGBA copy so the caller's image is never modified.
    original_mode = img.mode
    image = img.convert("RGBA")
    draw = ImageDraw.Draw(image)
    font = _load_overlay_font(int(font_size))

    w, h = image.size
    # zip() stops at the layout's line count, so 2-line layouts drop line3.
    for fraction, txt in zip(fractions, (line1, line2, line3)):
        if txt and txt.strip():  # Only draw non-empty text
            draw.text((w / 2, h * fraction), txt, fill=color, font=font, anchor="mm")

    # Convert back to original mode if needed
    if original_mode != "RGBA":
        image = image.convert(original_mode)
    return image, "Text added successfully!"
 # Create the Gradio Interface
+with gr.Blocks(title="AI Image Generator & Text Overlay") as demo:
+    gr.Markdown("# 🎨 AI Image Generator & Text Overlay")
+    gr.Markdown("Generate images with AI or upload your own, then add custom text overlays!")
     # Tab 1: Image Generation
     with gr.Tab("🖼️ Image Generation", id="generation_tab"):
             outputs=[generated_image, status_message]
         )
+    # Tab 2: Add Text Overlay
+    with gr.Tab("📝 Add Text", id="text_tab"):
+        gr.Markdown("## Overlay Text on Images")
+        gr.Markdown("Choose a layout pattern, type your text, and render it on the current image.")
         with gr.Row():
             with gr.Column():
+                # Text pattern selection
+                pattern = gr.Dropdown(
+                    choices=[
+                        ("2-lines-top", "2 lines - Top"),
+                        ("2-lines-center", "2 lines - Center"),
+                        ("2-lines-bottom", "2 lines - Bottom"),
+                        ("3-lines-top", "3 lines - Top"),
+                        ("3-lines-center", "3 lines - Center"),
+                        ("3-lines-bottom", "3 lines - Bottom")
                     ],
+                    value="2-lines-top",
+                    label="Layout Pattern"
+                )
+                # Text input fields
+                line1_inp = gr.Textbox(
+                    label="Line 1",
+                    placeholder="Enter first line of text..."
+                )
+                line2_inp = gr.Textbox(
+                    label="Line 2",
+                    placeholder="Enter second line of text..."
+                )
+                line3_inp = gr.Textbox(
+                    label="Line 3",
+                    placeholder="Enter third line of text..."
                 )
+                # Styling options
                 with gr.Row():
+                    font_size = gr.Slider(
+                        minimum=12,
+                        maximum=120,
+                        value=48,
+                        step=2,
+                        label="Font Size"
+                    )
+                    color = gr.ColorPicker(
+                        label="Text Color",
+                        value="#FFFFFF"
+                    )
+                add_text_btn = gr.Button("✨ Add Text to Image", variant="primary")
             with gr.Column():
+                # Output
+                text_image = gr.Image(label="Image with Text Overlay")
+        # Event handler for Tab 2
+        add_text_btn.click(
+            add_text_to_image,
+            inputs=[generated_image, pattern, line1_inp, line2_inp, line3_inp, font_size, color],
+            outputs=[text_image, status_message]
         )
+# Launch the application
 if __name__ == "__main__":
     demo.launch(
         server_name="0.0.0.0",
         server_port=7860
     )