Spaces:

scmlewis
/

image_edit_generation

Sleeping

App Files Files Community

scmlewis committed on Oct 21, 2025

Commit

56cc452

verified ·

1 Parent(s): 85c6816

Update app.py

Browse files

Files changed (1) hide show

app.py +57 -172

app.py CHANGED Viewed

@@ -1,6 +1,5 @@
 import os
 import tempfile
-import time
 from PIL import Image
 import gradio as gr
 from google import genai
@@ -12,15 +11,10 @@ def save_binary_file(file_name, data):
         f.write(data)
 def generate_edit(prompt, pil_image, api_key, model="gemini-2.0-flash-exp"):
-    # Initialize client
     client = genai.Client(api_key=(api_key.strip() if api_key and api_key.strip() != "" else os.environ.get("GEMINI_API_KEY")))
-    # Save image to a temp path for upload
     with tempfile.NamedTemporaryFile(suffix=".png", delete=False) as tmp_img:
         image_path = tmp_img.name
         pil_image.save(image_path)
-    # Upload and prepare content
     files = [client.files.upload(file=image_path)]
     contents = [
         types.Content(
@@ -31,8 +25,6 @@ def generate_edit(prompt, pil_image, api_key, model="gemini-2.0-flash-exp"):
             ],
         ),
     ]
-    # Config with image + text modalities
     generate_content_config = types.GenerateContentConfig(
         temperature=1,
         top_p=0.95,
@@ -41,11 +33,8 @@ def generate_edit(prompt, pil_image, api_key, model="gemini-2.0-flash-exp"):
         response_modalities=["image", "text"],
         response_mime_type="text/plain",
     )
     text_response = ""
     image_out_path = None
-    # Streamed generation to capture inline image data
     with tempfile.NamedTemporaryFile(suffix=".png", delete=False) as tmp_out:
         out_path = tmp_out.name
         for chunk in client.models.generate_content_stream(
@@ -62,17 +51,11 @@ def generate_edit(prompt, pil_image, api_key, model="gemini-2.0-flash-exp"):
                 break
             else:
                 text_response += chunk.text + "\n"
-    # Cleanup
-    try:
-        del files
-    except Exception:
-        pass
     return image_out_path, text_response
 def process_image_and_prompt(pil_image, prompt, api_key, progress_callback=None):
     try:
-        # Indicate starting
         if progress_callback:
             progress_callback("Generating…")
         image_path, text_out = generate_edit(prompt, pil_image, api_key)
@@ -80,12 +63,10 @@ def process_image_and_prompt(pil_image, prompt, api_key, progress_callback=None)
             img = Image.open(image_path)
             if img.mode == "RGBA":
                 img = img.convert("RGB")
-            # success
             if progress_callback:
                 progress_callback("Done ✓")
             return img, "Image generated successfully!", None
         else:
-            # fail to generate image
             if progress_callback:
                 progress_callback("Failed to generate image")
             return None, f"⚠️ {text_out.strip()}", None
@@ -97,146 +78,47 @@ def process_image_and_prompt(pil_image, prompt, api_key, progress_callback=None)
 def reset_inputs(api_key_value=None):
     return None, "", api_key_value or "", ""
-# Styles
 css_style = """
-:root {
-  --bg: #14161c;
-  --panel: #1e1f25;
-  --text: #e8eaf6;
-  --muted: #a0aec0;
-  --accent: #6a8efd;
-}
-body, .app-container {
-  background: var(--bg);
-  color: var(--text);
-}
-.header-block {
-  width: 100%;
-  display: flex;
-  align-items: center;
-  justify-content: center;
-  padding: 18px;
-}
-.header-gradient {
-  width: 100%;
-  padding: 28px 0;
-  border-radius: 14px;
-  background: linear-gradient(90deg, #6a8efd, #44abc7);
-  box-shadow: 0 2px 12px rgb(50 50 70 / 12%);
-  text-align: center;
-}
-.header-title {
-  margin: 0;
-  font-size: 2.8rem;
-  font-weight: 900;
-  color: #fff;
-  text-shadow: 1px 3px 12px rgba(0,0,0,.25);
-}
-.header-subtitle {
-  margin-top: 6px;
-  font-size: 1.05rem;
-  color: #e8f2ff;
-}
-.gradient-button {
-  background: linear-gradient(90deg, #44abc7, #6a8efd);
-  color: white;
-  font-weight: 700;
-  border: none;
-  padding: 12px 28px;
-  border-radius: 10px;
-  cursor: pointer;
-  transition: background 0.25s ease;
-}
-.gradient-button:hover {
-  background: linear-gradient(90deg, #6a8efd, #44abc7);
-}
-.main {
-  display: flex;
-  gap: 22px;
-}
-.sidebar {
-  background: #1f2230;
-  padding: 20px;
-  border-radius: 12px;
-  min-height: 360px;
-  width: 320px;
-  box-shadow: 0 2px 10px rgb(0 0 0 / 0.25);
-}
-.sidebar h2 {
-  color: #8ab4ff;
-  font-size: 1rem;
-  margin: 6px 0 8px;
-}
-.sidebar ul {
-  margin: 0;
-  padding-left: 18px;
-  color: #dbeafe;
-  line-height: 1.8;
-}
-.sidebar a { color: #97b7ff; text-decoration: none; }
-.sidebar a:hover { text-decoration: underline; }
-.main-panel {
-  flex: 1;
-  min-width: 0;
-}
-.section-header {
-  font-size: 1.15rem;
-  font-weight: 700;
-  color: #cbd5e1;
-  margin: 8px 0;
-}
-.input-area, .output-area {
-  background: #1b1e28;
-  border-radius: 12px;
-  padding: 14px;
-  box-shadow: inset 0 0 0 rgba(0,0,0,0.0);
-}
-.input-area { margin-bottom: 12px; }
-.output-area { margin-top: 6px; text-align: center; }
-#status-text {
-  height: 1.2em;
-  line-height: 1.2em;
-  font-weight: 600;
-  text-align: left;
-  overflow: hidden;
-  white-space: nowrap;
-  padding: 0;
-  border: none;
-  background: transparent;
-  color: #cbd5e1;
-}
-#output-image {
-  display: flex;
-  justify-content: center;
-  align-items: center;
-}
-#output-image img {
-  max-width: 100%;
-  max-height: 420px;
-  width: auto;
-  height: auto;
-  object-fit: contain;
-  border-radius: 12px;
-  background: #23252b;
 }
 """
-# Layout
 with gr.Blocks(css=css_style) as app:
-    gr.HTML(
-        """
-        <div class='header-block'>
-          <div class='header-gradient'>
-            <h1 class='header-title'>🖼️ Image Editor <span style="font-size:1.1em;">(Powered by Gemini)</span> 🔮</h1>
-            <div class='header-subtitle'>Step-by-step prompts with a persistent status banner and progress feedback</div>
-          </div>
-        </div>
-        """
-    )
     with gr.Row():
-        # Sidebar (instructions)
         with gr.Column(scale=3, elem_classes="sidebar"):
             gr.Markdown(
                 """
@@ -251,28 +133,31 @@ with gr.Blocks(css=css_style) as app:
                 <div>Get your key here: <a href="https://aistudio.google.com/apikey" target="_blank">Get your Google API key</a></div>
                 """
             )
-        # Main panel (steps and outputs)
         with gr.Column(scale=9, elem_classes="main-panel"):
-            with gr.Column():
-                # Step 1: Upload Image
-                gr.Markdown("<div class='section-header'>Step 1: Upload Image</div>")
-                image_input = gr.Image(type="pil", label=None, image_mode="RGBA")
-                # Step 2: Prompt + API Key
-                gr.Markdown("<div class='section-header'>Step 2: Enter Editing Prompt</div>")
-                prompt_input = gr.Textbox(label="Edit Prompt", placeholder="Describe how to edit the image", lines=2)
-                api_key_input = gr.Textbox(label="Gemini API Key (required)", placeholder="Enter your Gemini API key here", type="password")
-                with gr.Row():
-                    submit_btn = gr.Button("Generate Edit", elem_classes="gradient-button")
-                    reset_btn = gr.Button("Reset Inputs")
-                # Step 3: Output
-                gr.Markdown("<div class='section-header'>Step 3: Image Output</div>")
-                output_image = gr.Image(label=None, show_label=False, type="pil")
-                status_text = gr.Textbox(label="Status", interactive=False, lines=1, elem_id="status-text")
-            # Callback wiring
             def on_submit(pil_img, prompt, key, progress=None):
                 if not key or key.strip() == "":
                     raise gr.Error("Gemini API Key is required!")
@@ -282,13 +167,13 @@ with gr.Blocks(css=css_style) as app:
             submit_btn.click(
                 fn=on_submit,
                 inputs=[image_input, prompt_input, api_key_input],
-                outputs=[output_image, status_text]
             )
             reset_btn.click(
                 fn=reset_inputs,
                 inputs=[api_key_input],
-                outputs=[image_input, prompt_input, api_key_input, status_text]
             )
 app.launch()

 import os
 import tempfile
 from PIL import Image
 import gradio as gr
 from google import genai
         f.write(data)
 def generate_edit(prompt, pil_image, api_key, model="gemini-2.0-flash-exp"):
     client = genai.Client(api_key=(api_key.strip() if api_key and api_key.strip() != "" else os.environ.get("GEMINI_API_KEY")))
     with tempfile.NamedTemporaryFile(suffix=".png", delete=False) as tmp_img:
         image_path = tmp_img.name
         pil_image.save(image_path)
     files = [client.files.upload(file=image_path)]
     contents = [
         types.Content(
             ],
         ),
     ]
     generate_content_config = types.GenerateContentConfig(
         temperature=1,
         top_p=0.95,
         response_modalities=["image", "text"],
         response_mime_type="text/plain",
     )
     text_response = ""
     image_out_path = None
     with tempfile.NamedTemporaryFile(suffix=".png", delete=False) as tmp_out:
         out_path = tmp_out.name
         for chunk in client.models.generate_content_stream(
                 break
             else:
                 text_response += chunk.text + "\n"
+    del files
     return image_out_path, text_response
 def process_image_and_prompt(pil_image, prompt, api_key, progress_callback=None):
     try:
         if progress_callback:
             progress_callback("Generating…")
         image_path, text_out = generate_edit(prompt, pil_image, api_key)
             img = Image.open(image_path)
             if img.mode == "RGBA":
                 img = img.convert("RGB")
             if progress_callback:
                 progress_callback("Done ✓")
             return img, "Image generated successfully!", None
         else:
             if progress_callback:
                 progress_callback("Failed to generate image")
             return None, f"⚠️ {text_out.strip()}", None
 def reset_inputs(api_key_value=None):
     return None, "", api_key_value or "", ""
 css_style = """
+:root { --bg:#0f111a; --panel:#151a24; --text:#e9eefc; --muted:#9fb3c8; --accent:#6a8efd; }
+body, .app-container { background: var(--bg); color: var(--text); }
+.header-block { width: 100%; display: flex; justify-content: center; padding: 12px 0; }
+.header-gradient { width: 100%; padding: 22px 0; border-radius: 12px; background: linear-gradient(90deg, #6a8efd, #44abc7); box-shadow: 0 2px 12px rgb(50 50 70 / 12%); text-align: center; }
+.header-title { margin: 0; font-size: 2.6rem; font-weight: 900; color: #fff; text-shadow: 0 2px 8px rgba(0,0,0,.25); }
+.header-subtitle { margin-top: 6px; font-size: 1.05rem; color: #e8f0ff; }
+.main { display: flex; gap: 20px; align-items: stretch; padding: 0 16px; }
+.sidebar { width: 320px; background: #1b1f2b; padding: 16px; border-radius: 12px; }
+.sidebar h2 { color: #89b4ff; font-size: 1rem; margin: 8px 0; }
+.sidebar ul { margin: 0; padding-left: 20px; color: #d6e3ff; line-height: 1.9; }
+.main-panel { flex: 1; display: flex; flex-direction: column; gap: 12px; }
+.layout-row { display: flex; gap: 16px; align-items: flex-start; }
+.left, .right { flex: 1; min-width: 0; }
+.section-header { font-weight: 800; font-size: 1.05rem; color: #cbd5e1; margin: 0 0 6px 0; }
+.input-area, .output-area { background: #202533; border-radius: 12px; padding: 12px; }
+#status-text { height: 1.6em; line-height: 1.6em; white-space: nowrap; overflow: hidden; text-overflow: ellipsis; padding: 0 8px; border: none; background: transparent; color: #cbd5e1; font-weight: 700; }
+#output-viewport { display: flex; justify-content: center; align-items: center; min-height: 260px; }
+#output-image { width: 100%; display: flex; justify-content: center; align-items: center; }
+#output-image img { max-width: 100%; max-height: 420px; object-fit: contain; border-radius: 12px; background: #23252b; }
+@media (max-width: 1100px) {
+  .main { flex-direction: column; }
+  .sidebar { display: none; }
 }
 """
 with gr.Blocks(css=css_style) as app:
+    gr.HTML("""
+    <div class='header-block'>
+      <div class='header-gradient'>
+        <h1 class='header-title'>🖼️ Image Editor <span style="font-size:1.1em;">(Powered by Gemini)</span> 🔮</h1>
+        <div class='header-subtitle'>Step-by-step prompts with a persistent status banner and progress feedback</div>
+      </div>
+    </div>
+    """)
     with gr.Row():
         with gr.Column(scale=3, elem_classes="sidebar"):
             gr.Markdown(
                 """
                 <div>Get your key here: <a href="https://aistudio.google.com/apikey" target="_blank">Get your Google API key</a></div>
                 """
             )
         with gr.Column(scale=9, elem_classes="main-panel"):
+            # Step 1: Upload on left; Step 3: Output on right
+            # We’ll implement side-by-side using a two-column sub-layout
+            with gr.Row(class_name="layout-row"):
+                with gr.Column(class_name="left"):
+                    gr.Markdown("<div class='section-header'>Step 1: Upload Image</div>")
+                    image_input = gr.Image(type="pil", label=None, image_mode="RGBA")
+                with gr.Column(class_name="right"):
+                    gr.Markdown("<div class='section-header'>Step 3: Image Output</div>")
+                    output_image = gr.Image(label=None, show_label=False, type="pil")
+            # Step 2 area (prompt + API)
+            gr.Markdown("<div class='section-header'>Step 2: Enter Editing Prompt</div>")
+            prompt_input = gr.Textbox(label="Edit Prompt", placeholder="Describe how to edit the image", lines=2)
+            api_key_input = gr.Textbox(label="Gemini API Key (required)", placeholder="Enter your Gemini API key here", type="password")
+            with gr.Row():
+                submit_btn = gr.Button("Generate Edit", elem_classes="gradient-button")
+                reset_btn = gr.Button("Reset Inputs")
+            with gr.Row():
+                # Status bar (persistent)
+                status_bar = gr.Textbox(label="Status", interactive=False, lines=1, elem_id="status-text")
+            # Wire callbacks
             def on_submit(pil_img, prompt, key, progress=None):
                 if not key or key.strip() == "":
                     raise gr.Error("Gemini API Key is required!")
             submit_btn.click(
                 fn=on_submit,
                 inputs=[image_input, prompt_input, api_key_input],
+                outputs=[output_image, status_bar]
             )
             reset_btn.click(
                 fn=reset_inputs,
                 inputs=[api_key_input],
+                outputs=[image_input, prompt_input, api_key_input, status_bar]
             )
 app.launch()