Spaces:

AkashKumarave
/

11

Running

App Files Files Community

AkashKumarave commited on Sep 4

Commit

0a3b563

verified ·

1 Parent(s): 3380cf2

Update app.py

Browse files

Files changed (1) hide show

app.py +193 -196

app.py CHANGED Viewed

@@ -1,197 +1,194 @@
-import json
-import os
-import time
-import uuid
-import tempfile
-from PIL import Image, ImageDraw, ImageFont
-import gradio as gr
-import base64
-import mimetypes
-from io import BytesIO
-from google import genai
-from google.genai import types
-def generate(text, images, api_key, model="gemini-2.5-flash-image-preview"):
-    # Initialize client using provided api_key (or fallback to env variable)
-    client = genai.Client(api_key=(api_key.strip() if api_key and api_key.strip() != ""
-                                     else os.environ.get("GEMINI_API_KEY")))
-    # Prepare contents with images first, then text
-    contents = images + [text]
-    response = client.models.generate_content(
-        model=model,
-        contents=contents,
-    )
-    text_response = ""
-    image_path = None
-    for part in response.candidates[0].content.parts:
-        if part.text is not None:
-            text_response += part.text + "\n"
-        elif part.inline_data is not None:
-            # Create a temporary file to store the generated image
-            with tempfile.NamedTemporaryFile(suffix=".png", delete=False) as tmp:
-                temp_path = tmp.name
-                generated_image = Image.open(BytesIO(part.inline_data.data))
-                generated_image.save(temp_path)
-                image_path = temp_path
-                print(f"Generated image saved to: {temp_path} with prompt: {text}")
-    return image_path, text_response
-def load_uploaded_images(uploaded_files):
-    """Load and display uploaded images immediately"""
-    uploaded_images = []
-    if uploaded_files:
-        for file in uploaded_files:
-            if file.name.lower().endswith(('.png', '.jpg', '.jpeg', '.webp')):
-                img = Image.open(file.name)
-                if img.mode == "RGBA":
-                    img = img.convert("RGBA")
-                uploaded_images.append(img)
-    return uploaded_images
-def process_image_and_prompt(uploaded_files, prompt, gemini_api_key):
-    try:
-        input_text = prompt
-        model = "gemini-2.5-flash-image-preview"
-        # Load images from uploaded files
-        images = []
-        uploaded_images = []
-        if uploaded_files:
-            for file in uploaded_files:
-                if file.name.lower().endswith(('.png', '.jpg', '.jpeg', '.webp')):
-                    img = Image.open(file.name)
-                    if img.mode == "RGBA":
-                        img = img.convert("RGBA")
-                    images.append(img)
-                    uploaded_images.append(img)
-        if not images:
-            raise gr.Error("Please upload at least one image", duration=5)
-        # Format: [dress_image, model_image, text_input] or [image1, image2, ..., text_input]
-        image_path, text_response = generate(text=input_text, images=images, api_key=gemini_api_key, model=model)
-        if image_path:
-            # Load and convert the image if needed.
-            result_img = Image.open(image_path)
-            if result_img.mode == "RGBA":
-                result_img = result_img.convert("RGBA")
-            return uploaded_images, [result_img], ""  # Return uploaded images, generated image, and empty text output.
-        else:
-            # Return uploaded images, no generated image, and the text response.
-            return uploaded_images, None, text_response
-    except Exception as e:
-        raise gr.Error(f"Error Getting {e}", duration=5)
-# Build a Blocks-based interface with a custom HTML header and CSS
-with gr.Blocks(css_paths="style.css",) as demo:
-    # Custom HTML header with proper class for styling
-    gr.HTML(
-    """
-    <div class="header-container">
-      <div>
-          <img src="https://www.gstatic.com/lamda/images/gemini_favicon_f069958c85030456e93de685481c559f160ea06b.png" alt="Gemini logo">
-      </div>
-      <div>
-          <h1>Gemini for Image Editing</h1>
-          <p>Powered by <a href="https://gradio.app/">Gradio</a>⚡️|
-          <a href="https://huggingface.co/spaces/ameerazam08/Gemini-Image-Edit?duplicate=true">Duplicate</a> this Repo |
-          <a href="https://aistudio.google.com/apikey">Get an API Key</a> |
-          Follow me on Twitter: <a href="https://x.com/Ameerazam18">Ameerazam18</a></p>
-      </div>
-    </div>
-    """
-    )
-    with gr.Accordion("⚠️ API Configuration ⚠️", open=False, elem_classes="config-accordion"):
-        gr.Markdown("""
-    - **Issue:** ❗ Sometimes the model returns text instead of an image.
-    ### 🔧 Steps to Address:
-    1. **🛠️ Duplicate the Repository**
-       - Create a separate copy for modifications.
-    2. **🔑 Use Your Own Gemini API Key**
-       - You **must** configure your own Gemini key for generation!
-    """)
-    with gr.Accordion("📌 Usage Instructions", open=False, elem_classes="instructions-accordion"):
-        gr.Markdown("""
-    ### 📌 Usage
-    - Upload an image and enter a prompt to generate outputs.
-    - If text is returned instead of an image, it will appear in the text output.
-    - Upload Only PNG Image
-    - ❌ **Do not use NSFW images!**
-    """)
-    with gr.Row(elem_classes="main-content"):
-        with gr.Column(elem_classes="input-column"):
-            image_input = gr.File(
-                file_types=["image"],
-                file_count="multiple",
-                label="Upload Images ",
-                elem_id="image-input",
-                elem_classes="upload-box"
-            )
-            gemini_api_key = gr.Textbox(
-                lines=1,
-                placeholder="Enter Gemini API Key (optional)",
-                label="Gemini API Key (optional)",
-                elem_classes="api-key-input"
-            )
-            prompt_input = gr.Textbox(
-                lines=2,
-                placeholder="Enter prompt here...",
-                label="Prompt",
-                elem_classes="prompt-input"
-            )
-            submit_btn = gr.Button("Generate", elem_classes="generate-btn")
-        with gr.Column(elem_classes="output-column"):
-            uploaded_gallery = gr.Gallery(label="Uploaded Images", elem_classes="uploaded-gallery")
-            output_gallery = gr.Gallery(label="Generated Outputs", elem_classes="output-gallery")
-            output_text = gr.Textbox(
-                label="Gemini Output",
-                placeholder="Text response will appear here if no image is generated.",
-                elem_classes="output-text"
-            )
-    # Set up the interaction with three outputs.
-    submit_btn.click(
-        fn=process_image_and_prompt,
-        inputs=[image_input, prompt_input, gemini_api_key],
-        outputs=[uploaded_gallery, output_gallery, output_text],
-    )
-    # Update uploaded gallery immediately when files are uploaded
-    image_input.upload(
-        fn=load_uploaded_images,
-        inputs=[image_input],
-        outputs=[uploaded_gallery],
-    )
-    gr.Markdown("## Try these examples", elem_classes="gr-examples-header")
-    examples = [
-        ["data/1.webp", 'change text to "AMEER"'],
-        ["data/2.webp", "remove the spoon from hand only"],
-        ["data/3.webp", 'change text to "Make it "'],
-        ["data/1.jpg", "add joker style only on face"],
-        ["data/1777043.jpg", "add joker style only on face"],
-        ["data/2807615.jpg", "add lipstick on lip only"],
-        ["data/76860.jpg", "add lipstick on lip only"],
-        ["data/2807615.jpg", "make it happy looking face only"],
-    ]
-    gr.Examples(
-        examples=examples,
-        inputs=[image_input, prompt_input,],
-        elem_id="examples-grid"
-    )
 demo.queue(max_size=50).launch(mcp_server=True, share=True)

+import json
+import os
+import time
+import uuid
+import tempfile
+from PIL import Image
+import gradio as gr
+import base64
+import mimetypes
+from io import BytesIO
+from google import genai
+def generate(text, images, api_key=None, model="gemini-2.5-flash-image-preview"):
+    # Initialize client using provided api_key or fallback to environment variable
+    api_key = api_key.strip() if api_key and api_key.strip() != "" else os.environ.get("GEMINI_API_KEY", "AIzaSyDL5Rilo7ptJpUOZdY6wy8PJYUcVcnDADs")
+    client = genai.Client(api_key=api_key)
+    # Prepare contents with images first, then text
+    contents = images + [text]
+    response = client.models.generate_content(
+        model=model,
+        contents=contents,
+    )
+    text_response = ""
+    image_path = None
+    for part in response.candidates[0].content.parts:
+        if part.text is not None:
+            text_response += part.text + "\n"
+        elif part.inline_data is not None:
+            # Create a temporary file to store the generated image
+            with tempfile.NamedTemporaryFile(suffix=".png", delete=False) as tmp:
+                temp_path = tmp.name
+                generated_image = Image.open(BytesIO(part.inline_data.data))
+                generated_image.save(temp_path)
+                image_path = temp_path
+                print(f"Generated image saved to: {temp_path} with prompt: {text}")
+    return image_path, text_response
+def load_uploaded_images(uploaded_files):
+    """Load and display uploaded images immediately"""
+    uploaded_images = []
+    if uploaded_files:
+        for file in uploaded_files:
+            if file.name.lower().endswith(('.png', '.jpg', '.jpeg', '.webp')):
+                img = Image.open(file.name)
+                if img.mode == "RGBA":
+                    img = img.convert("RGBA")
+                uploaded_images.append(img)
+    return uploaded_images
+def process_image_and_prompt(uploaded_files, prompt, gemini_api_key):
+    try:
+        input_text = prompt
+        model = "gemini-2.5-flash-image-preview"
+        # Load images from uploaded files
+        images = []
+        uploaded_images = []
+        if uploaded_files:
+            for file in uploaded_files:
+                if file.name.lower().endswith(('.png', '.jpg', '.jpeg', '.webp')):
+                    img = Image.open(file.name)
+                    if img.mode == "RGBA":
+                        img = img.convert("RGBA")
+                    images.append(img)
+                    uploaded_images.append(img)
+        if not images:
+            raise gr.Error("Please upload at least one image", duration=5)
+        # Call generate with images and prompt
+        image_path, text_response = generate(text=input_text, images=images, api_key=gemini_api_key, model=model)
+        if image_path:
+            # Load and convert the generated image if needed
+            result_img = Image.open(image_path)
+            if result_img.mode == "RGBA":
+                result_img = result_img.convert("RGBA")
+            return uploaded_images, [result_img], ""  # Return uploaded images, generated image, and empty text output
+        else:
+            # Return uploaded images, no generated image, and the text response
+            return uploaded_images, None, text_response
+    except Exception as e:
+        raise gr.Error(f"Error: {e}", duration=5)
+# Build a Blocks-based interface with a custom HTML header and CSS
+with gr.Blocks(css="style.css") as demo:
+    # Custom HTML header with proper class for styling
+    gr.HTML(
+        """
+        <div class="header-container">
+          <div>
+              <img src="https://www.gstatic.com/lamda/images/gemini_favicon_f069958c85030456e93de685481c559f160ea06b.png" alt="Gemini logo">
+          </div>
+          <div>
+              <h1>Gemini for Image Editing</h1>
+              <p>Powered by <a href="https://gradio.app/">Gradio</a> |
+              <a href="https://huggingface.co/spaces/ameerazam08/Gemini-Image-Edit?duplicate=true">Duplicate</a> this Repo |
+              <a href="https://aistudio.google.com/apikey">Get an API Key</a> |
+              Follow me on Twitter: <a href="https://x.com/Ameerazam18">Ameerazam18</a></p>
+          </div>
+        </div>
+        """
+    )
+    with gr.Accordion("API Configuration", open=False, elem_classes="config-accordion"):
+        gr.Markdown("""
+        - **Issue:** Sometimes the model returns text instead of an image.
+        ### Steps to Address:
+        1. **Duplicate the Repository**
+           - Create a separate copy for modifications.
+        2. **Use Your Own Gemini API Key**
+           - You **must** configure your own Gemini key for generation!
+        """)
+    with gr.Accordion("Usage Instructions", open=False, elem_classes="instructions-accordion"):
+        gr.Markdown("""
+        ### Usage
+        - Upload an image and enter a prompt to generate outputs.
+        - If text is returned instead of an image, it will appear in the text output.
+        - Upload only PNG, JPG, JPEG, or WEBP images.
+        - **Do not use NSFW images!**
+        """)
+    with gr.Row(elem_classes="main-content"):
+        with gr.Column(elem_classes="input-column"):
+            image_input = gr.File(
+                file_types=["image"],
+                file_count="multiple",
+                label="Upload Images",
+                elem_id="image-input",
+                elem_classes="upload-box"
+            )
+            gemini_api_key = gr.Textbox(
+                lines=1,
+                placeholder="Enter Gemini API Key (optional)",
+                label="Gemini API Key (optional)",
+                elem_classes="api-key-input"
+            )
+            prompt_input = gr.Textbox(
+                lines=2,
+                placeholder="Enter prompt here...",
+                label="Prompt",
+                elem_classes="prompt-input"
+            )
+            submit_btn = gr.Button("Generate", elem_classes="generate-btn")
+        with gr.Column(elem_classes="output-column"):
+            uploaded_gallery = gr.Gallery(label="Uploaded Images", elem_classes="uploaded-gallery")
+            output_gallery = gr.Gallery(label="Generated Outputs", elem_classes="output-gallery")
+            output_text = gr.Textbox(
+                label="Gemini Output",
+                placeholder="Text response will appear here if no image is generated.",
+                elem_classes="output-text"
+            )
+    # Set up the interaction with three outputs
+    submit_btn.click(
+        fn=process_image_and_prompt,
+        inputs=[image_input, prompt_input, gemini_api_key],
+        outputs=[uploaded_gallery, output_gallery, output_text],
+    )
+    # Update uploaded gallery immediately when files are uploaded
+    image_input.upload(
+        fn=load_uploaded_images,
+        inputs=[image_input],
+        outputs=[uploaded_gallery],
+    )
+    gr.Markdown("## Try these examples", elem_classes="gr-examples-header")
+    examples = [
+        ["data/1.webp", 'change text to "AMEER"'],
+        ["data/2.webp", "remove the spoon from hand only"],
+        ["data/3.webp", 'change text to "Make it "'],
+        ["data/1.jpg", "add joker style only on face"],
+        ["data/1777043.jpg", "add joker style only on face"],
+        ["data/2807615.jpg", "add lipstick on lip only"],
+        ["data/76860.jpg", "add lipstick on lip only"],
+        ["data/2807615.jpg", "make it happy looking face only"],
+    ]
+    gr.Examples(
+        examples=examples,
+        inputs=[image_input, prompt_input],
+        elem_id="examples-grid"
+    )
 demo.queue(max_size=50).launch(mcp_server=True, share=True)