Spaces:

Abs6187
/

BuildTheFuture

Sleeping

App Files Files Community

Abs6187 committed on Sep 7

Commit

f63aea2

verified ·

1 Parent(s): 8a31836

Update app.py

Browse files

Files changed (1) hide show

app.py +432 -389

app.py CHANGED Viewed

@@ -1,390 +1,433 @@
-import gradio as gr
-import google.generativeai as genai
-import cv2
-import numpy as np
-from PIL import Image, ImageDraw, ImageFont
-import os
-import base64
-import io
-import logging
-import time
-from typing import Optional, Tuple
-import warnings
-warnings.filterwarnings("ignore")
-logging.basicConfig(level=logging.INFO)
-logger = logging.getLogger(__name__)
-GEMINI_API_KEY = os.getenv("GEMINI_API_KEY")
-ELEVENLABS_API_KEY = os.getenv("ELEVENLABS_API_KEY")
-MAX_IMAGE_SIZE = 1024
-RATE_LIMIT_DELAY = 3
-API_RETRY_COUNT = 3
-if GEMINI_API_KEY:
-    genai.configure(api_key=GEMINI_API_KEY)
-    logger.info("Gemini API configured")
-else:
-    logger.warning("GEMINI_API_KEY not found - using demo mode")
-try:
-    from elevenlabs import generate, set_api_key
-    if ELEVENLABS_API_KEY:
-        set_api_key(ELEVENLABS_API_KEY)
-        logger.info("ElevenLabs configured")
-    else:
-        logger.info("ElevenLabs not configured - optional feature")
-except ImportError:
-    logger.info("ElevenLabs not available - optional feature")
-try:
-    from ultralytics import YOLO
-    yolo_available = True
-except ImportError:
-    yolo_available = False
-    logger.info("YOLO not available - optional feature")
-class NanoBananaApp:
-    def __init__(self):
-        self.gemini_model = None
-        self.yolo_model = None
-        self._initialize_gemini()
-    def _initialize_gemini(self):
-        if not GEMINI_API_KEY:
-            logger.warning("No API key - demo mode")
-            return
-        try:
-            self.gemini_model = genai.GenerativeModel('gemini-2.0-flash-exp')
-            logger.info("Nano Banana (Gemini 2.5 Flash Image) initialized")
-        except Exception as e:
-            logger.error(f"Failed to initialize Gemini: {e}")
-    def _resize_image_if_needed(self, image):
-        if image.width > MAX_IMAGE_SIZE or image.height > MAX_IMAGE_SIZE:
-            ratio = min(MAX_IMAGE_SIZE / image.width, MAX_IMAGE_SIZE / image.height)
-            new_size = (int(image.width * ratio), int(image.height * ratio))
-            return image.resize(new_size, Image.Resampling.LANCZOS)
-        return image
-    def _apply_rate_limiting(self):
-        time.sleep(RATE_LIMIT_DELAY)
-    def load_yolo_optional(self):
-        if not yolo_available:
-            return False
-        try:
-            model_path = 'best.pt' if os.path.exists('best.pt') else 'yolov11n.pt'
-            self.yolo_model = YOLO(model_path)
-            return True
-        except Exception as e:
-            logger.warning(f"YOLO loading failed: {e}")
-            return False
-    def detect_structures_optional(self, image):
-        if not self.yolo_model and not self.load_yolo_optional():
-            return image, "Structure detection unavailable (optional feature)"
-        try:
-            img_cv = cv2.cvtColor(np.array(image), cv2.COLOR_RGB2BGR)
-            results = self.yolo_model(img_cv)
-            annotated_img = results[0].plot()
-            annotated_pil = Image.fromarray(cv2.cvtColor(annotated_img, cv2.COLOR_BGR2RGB))
-            return annotated_pil, "Structures detected"
-        except Exception as e:
-            return image, f"Detection failed: {str(e)}"
-    def nano_banana_edit(self, image, prompt, style="realistic", editing_mode="complete"):
-        if not self.gemini_model:
-            if not GEMINI_API_KEY:
-                return image, "🔑 API key required for Nano Banana. Add GEMINI_API_KEY to use this feature."
-            return image, "Gemini Nano Banana not available"
-        if not prompt.strip():
-            return image, "Please provide a transformation prompt"
-        try:
-            image = self._resize_image_if_needed(image)
-            self._apply_rate_limiting()
-            if editing_mode == "complete":
-                base_prompt = self._get_completion_prompt(style)
-                full_prompt = f"{base_prompt} {prompt}"
-            elif editing_mode == "edit":
-                full_prompt = f"Edit this image: {prompt}. Make the changes look natural and maintain image quality."
-            elif editing_mode == "blend":
-                full_prompt = f"Blend and transform this image: {prompt}. Create a seamless fusion of elements."
-            else:
-                full_prompt = prompt
-            for attempt in range(API_RETRY_COUNT):
-                try:
-                    buffered = io.BytesIO()
-                    image.save(buffered, format='PNG', quality=85)
-                    image_bytes = buffered.getvalue()
-                    if len(image_bytes) > 10 * 1024 * 1024:
-                        return image, "Image too large. Please use a smaller image."
-                    response = self.gemini_model.generate_content([
-                        full_prompt,
-                        {
-                            'mime_type': 'image/png',
-                            'data': base64.b64encode(image_bytes).decode('utf-8')
-                        }
-                    ])
-                    if hasattr(response, 'candidates') and response.candidates:
-                        for part in response.candidates[0].content.parts:
-                            if hasattr(part, 'inline_data') and part.inline_data:
-                                if hasattr(part.inline_data, 'data'):
-                                    image_data = base64.b64decode(part.inline_data.data)
-                                    result_image = Image.open(io.BytesIO(image_data)).convert('RGB')
-                                    return result_image, f"✨ Nano Banana: {editing_mode} mode with {style} style"
-                    if attempt < API_RETRY_COUNT - 1:
-                        time.sleep(2 ** attempt)
-                        continue
-                    return image, "No image generated - please try a different prompt"
-                except Exception as retry_error:
-                    if attempt < API_RETRY_COUNT - 1:
-                        logger.warning(f"Attempt {attempt + 1} failed: {retry_error}")
-                        time.sleep(2 ** attempt)
-                        continue
-                    raise retry_error
-        except Exception as e:
-            logger.error(f"Nano Banana error: {e}")
-            if "quota" in str(e).lower() or "limit" in str(e).lower():
-                return image, "⏱️ API rate limit reached. Please try again in a few minutes."
-            return image, f"Processing failed: {str(e)}"
-    def _get_completion_prompt(self, style):
-        prompts = {
-            "realistic": "Complete this unfinished construction realistically with proper materials and architectural details.",
-            "futuristic": "Transform this construction into a futuristic high-tech building with modern elements.",
-            "artistic": "Complete this construction with creative artistic elements and unique design features."
-        }
-        return prompts.get(style, prompts["realistic"])
-    def generate_voice_optional(self, text):
-        if not ELEVENLABS_API_KEY:
-            return None
-        try:
-            audio = generate(text=text, voice="Rachel", model="eleven_monolingual_v1")
-            return audio
-        except Exception as e:
-            logger.warning(f"Voice generation failed: {e}")
-            return None
-    def create_comparison(self, original, processed):
-        if not original or not processed:
-            return None
-        try:
-            height = min(original.height, processed.height, 512)
-            width = min(original.width, processed.width, 512)
-            orig_resized = original.resize((width, height), Image.Resampling.LANCZOS)
-            proc_resized = processed.resize((width, height), Image.Resampling.LANCZOS)
-            comparison = Image.new('RGB', (width * 2 + 20, height + 40), 'white')
-            comparison.paste(orig_resized, (0, 20))
-            comparison.paste(proc_resized, (width + 20, 20))
-            draw = ImageDraw.Draw(comparison)
-            try:
-                font = ImageFont.load_default()
-                draw.text((width//2 - 30, 5), "BEFORE", fill='black', font=font)
-                draw.text((width + 20 + width//2 - 30, 5), "AFTER", fill='black', font=font)
-            except:
-                pass
-            return comparison
-        except Exception as e:
-            logger.warning(f"Comparison creation failed: {e}")
-            return None
-app = NanoBananaApp()
-def process_nano_banana(image, prompt, style, editing_mode, enable_detection, enable_voice):
-    if not image:
-        return None, None, None, None, "📷 Please upload an image to get started", None
-    if not prompt or not prompt.strip():
-        return image, image, image, None, "💭 Please provide a transformation prompt", None
-    try:
-        detection_result = image
-        detection_msg = "Detection disabled"
-        if enable_detection:
-            detection_result, detection_msg = app.detect_structures_optional(image)
-        processed_image, process_msg = app.nano_banana_edit(image, prompt, style, editing_mode)
-        if processed_image == image and "API key required" in process_msg:
-            return image, detection_result, image, None, f"🔑 {process_msg}", None
-        comparison = app.create_comparison(image, processed_image)
-        audio = None
-        voice_msg = ""
-        if enable_voice:
-            if processed_image != image:
-                voice_text = f"Image transformed using Nano Banana with {editing_mode} mode and {style} style. {prompt}"
-                audio = app.generate_voice_optional(voice_text)
-                voice_msg = "🔊 Voice generated" if audio else "🔇 Voice unavailable"
-            else:
-                voice_msg = "🔇 Voice skipped (no changes)"
-        status_parts = [f"🍌 {process_msg}"]
-        if enable_detection:
-            status_parts.append(f"📍 Detection: {detection_msg}")
-        if enable_voice:
-            status_parts.append(f"🎵 Voice: {voice_msg}")
-        status = "\n".join(status_parts)
-        return image, detection_result, processed_image, comparison, status, audio
-    except Exception as e:
-        logger.error(f"Processing error: {e}")
-        return image, image, image, None, f"❌ Unexpected error: {str(e)}", None
-custom_css = """
-.nano-banner {
-    background: linear-gradient(45deg, #ff6b6b, #feca57, #48dbfb, #ff9ff3);
-    background-size: 400% 400%;
-    animation: gradient 15s ease infinite;
-    padding: 20px;
-    border-radius: 10px;
-    text-align: center;
-    margin-bottom: 20px;
-}
-@keyframes gradient {
-    0% { background-position: 0% 50%; }
-    50% { background-position: 100% 50%; }
-    100% { background-position: 0% 50%; }
-}
-.feature-highlight {
-    border: 2px solid #4CAF50;
-    border-radius: 8px;
-    padding: 15px;
-    margin: 10px 0;
-}
-"""
-demo_mode_notice = ""
-if not GEMINI_API_KEY:
-    demo_mode_notice = """
-    <div style="background: #ffebee; border: 1px solid #f44336; border-radius: 8px; padding: 15px; margin: 10px 0;">
-        <h3>🔑 API Key Required</h3>
-        <p>To use Nano Banana features, add your <strong>GEMINI_API_KEY</strong> in the Space settings.</p>
-        <p>Get your free API key from <a href="https://makersuite.google.com/app/apikey" target="_blank">Google AI Studio</a></p>
-    </div>
-    """
-with gr.Blocks(title="🍌 Nano Banana - Dynamic Image Creation", theme=gr.themes.Soft(), css=custom_css) as demo:
-    gr.HTML(f"""
-    <div class="nano-banner">
-        <h1>🍌 Nano Banana: Dynamic Image Creation</h1>
-        <p><strong>Powered by Gemini 2.5 Flash Image Preview</strong></p>
-        <p>Edit with words • Blend realities • Transform visuals</p>
-    </div>
-    {demo_mode_notice}
-    """)
-    with gr.Row():
-        with gr.Column(scale=1):
-            with gr.Group():
-                gr.Markdown("### 🎨 Core Nano Banana Features")
-                image_input = gr.Image(label="Upload Image", type="pil", height=300)
-                prompt_input = gr.Textbox(
-                    label="Transformation Prompt",
-                    placeholder="Describe how you want to transform this image...",
-                    lines=3
-                )
-                editing_mode = gr.Radio(
-                    choices=["complete", "edit", "blend"],
-                    value="edit",
-                    label="Nano Banana Mode",
-                    info="Complete: Finish construction • Edit: Modify image • Blend: Fuse elements"
-                )
-                style_selector = gr.Radio(
-                    choices=["realistic", "futuristic", "artistic"],
-                    value="realistic",
-                    label="Style",
-                    info="Choose the aesthetic approach"
-                )
-            with gr.Group():
-                gr.Markdown("### ⚙️ Optional Features")
-                enable_detection = gr.Checkbox(
-                    label="🔍 Structure Detection (YOLO)",
-                    value=False,
-                    info="Optional: Detect and highlight structures"
-                )
-                enable_voice = gr.Checkbox(
-                    label="🔊 Voice Narration (ElevenLabs)",
-                    value=False,
-                    info="Optional: Generate audio description"
-                )
-            process_btn = gr.Button("🚀 Transform with Nano Banana", variant="primary", size="lg")
-            status_output = gr.Textbox(label="Status", interactive=False, lines=4)
-        with gr.Column(scale=2):
-            with gr.Tabs():
-                with gr.Tab("📷 Original"):
-                    original_output = gr.Image(label="Original Image", height=400)
-                with gr.Tab("🔍 Detection (Optional)"):
-                    detection_output = gr.Image(label="Structure Detection", height=400)
-                with gr.Tab("🍌 Nano Banana Result"):
-                    result_output = gr.Image(label="Transformed Image", height=400, elem_classes=["feature-highlight"])
-                with gr.Tab("📊 Before/After"):
-                    comparison_output = gr.Image(label="Comparison View", height=400)
-    with gr.Row():
-        audio_output = gr.Audio(label="🔊 Voice Description (Optional)", visible=True)
-    with gr.Row():
-        gr.Examples(
-            examples=[
-                ["samples_imagen/skyscraper_construction.jpg", "Complete this modern skyscraper with glass facades", "futuristic", "complete", True, False],
-                ["samples_imagen/suspension_bridge.jpg", "Add a golden sunset reflection on the bridge", "artistic", "edit", False, True],
-                ["samples_imagen/highway_construction.jpg", "Transform into a smart highway with digital elements", "futuristic", "blend", True, False],
-                ["samples_imagen/residential_construction.jpg", "Complete as a sustainable eco-friendly home", "realistic", "complete", False, False]
-            ],
-            inputs=[image_input, prompt_input, style_selector, editing_mode, enable_detection, enable_voice],
-            label="🎯 Try These Examples"
-        )
-    gr.Markdown("""
-    ### 🏆 Competition Features
-    - **Nano Banana Core**: Gemini 2.5 Flash Image for dynamic creation
-    - **Word-Based Editing**: Transform images with natural language
-    - **Reality Blending**: Seamlessly fuse different visual elements
-    - **Optional Enhancements**: Structure detection and voice narration
-    - **Real-time Processing**: Fast image transformations
-    """)
-    process_btn.click(
-        fn=process_nano_banana,
-        inputs=[image_input, prompt_input, style_selector, editing_mode, enable_detection, enable_voice],
-        outputs=[original_output, detection_output, result_output, comparison_output, status_output, audio_output]
-    )
-if __name__ == "__main__":
-    demo.launch(
-        server_name="0.0.0.0",
-        server_port=7860,
-        share=True
     )

+import gradio as gr
+import google.generativeai as genai
+import cv2
+import numpy as np
+from PIL import Image, ImageDraw, ImageFont
+import os
+import base64
+import io
+import logging
+import time
+from typing import Optional, Tuple
+import warnings
+# Suppress every warning category process-wide.
+warnings.filterwarnings("ignore")
+logging.basicConfig(level=logging.INFO)
+logger = logging.getLogger(__name__)
+# API credentials come from the environment; either may be unset (None).
+GEMINI_API_KEY = os.getenv("GEMINI_API_KEY")
+ELEVENLABS_API_KEY = os.getenv("ELEVENLABS_API_KEY")
+# Longest allowed image side in pixels before an upload is scaled down.
+MAX_IMAGE_SIZE = 1024
+# Seconds slept before each Gemini request.
+RATE_LIMIT_DELAY = 3
+# Number of attempts made for one Gemini request.
+API_RETRY_COUNT = 3
+# Configure the Gemini SDK only when a key is present; otherwise the app
+# runs without a model ("demo mode").
+if GEMINI_API_KEY:
+    genai.configure(api_key=GEMINI_API_KEY)
+    logger.info("Gemini API configured")
+else:
+    logger.warning("GEMINI_API_KEY not found - using demo mode")
+# ElevenLabs is optional: when the import fails, `generate` and
+# `set_api_key` are simply never defined.
+try:
+    from elevenlabs import generate, set_api_key
+    if ELEVENLABS_API_KEY:
+        set_api_key(ELEVENLABS_API_KEY)
+        logger.info("ElevenLabs configured")
+    else:
+        logger.info("ElevenLabs not configured - optional feature")
+except ImportError:
+    logger.info("ElevenLabs not available - optional feature")
+# Ultralytics YOLO is optional too; `yolo_available` records whether the
+# import succeeded.
+try:
+    from ultralytics import YOLO
+    yolo_available = True
+except ImportError:
+    yolo_available = False
+    logger.info("YOLO not available - optional feature")
+class NanoBananaApp:
+    """Backend for the Nano Banana demo.
+
+    Wraps a Gemini model that analyses an uploaded image, plus the optional
+    YOLO structure detector, ElevenLabs narration and a before/after
+    comparison helper. ``gemini_model`` stays ``None`` when no API key is
+    configured; ``yolo_model`` is loaded on the first detection request.
+    """
+    def __init__(self):
+        self.gemini_model = None
+        self.yolo_model = None
+        self._initialize_gemini()
+    def _initialize_gemini(self):
+        """Create the Gemini model handle, trying Flash first and Pro as a fallback."""
+        if not GEMINI_API_KEY:
+            logger.warning("No API key - demo mode")
+            return
+        try:
+            self.gemini_model = genai.GenerativeModel('gemini-1.5-flash')
+            logger.info("Nano Banana (Gemini 1.5 Flash) initialized")
+        except Exception as e:
+            logger.error(f"Failed to initialize Gemini: {e}")
+            try:
+                self.gemini_model = genai.GenerativeModel('gemini-1.5-pro')
+                logger.info("Fallback: Gemini 1.5 Pro initialized")
+            except Exception as e2:
+                logger.error(f"Fallback also failed: {e2}")
+    def _resize_image_if_needed(self, image):
+        """Return ``image`` scaled down so that neither side exceeds MAX_IMAGE_SIZE.
+
+        Images already within the limit are returned unchanged (same object).
+        """
+        if image.width <= MAX_IMAGE_SIZE and image.height <= MAX_IMAGE_SIZE:
+            return image
+        ratio = min(MAX_IMAGE_SIZE / image.width, MAX_IMAGE_SIZE / image.height)
+        # Clamp to one pixel: with an extreme aspect ratio the short side
+        # would otherwise truncate to 0, which Image.resize rejects.
+        new_size = (max(1, int(image.width * ratio)), max(1, int(image.height * ratio)))
+        return image.resize(new_size, Image.Resampling.LANCZOS)
+    def _apply_rate_limiting(self):
+        """Sleep RATE_LIMIT_DELAY seconds before a Gemini request."""
+        time.sleep(RATE_LIMIT_DELAY)
+    def load_yolo_optional(self):
+        """Load the YOLO detector; return True on success, False otherwise.
+
+        A local ``best.pt`` is preferred; otherwise the stock YOLO11 nano
+        weights are requested by their published name.
+        """
+        if not yolo_available:
+            return False
+        try:
+            # Ultralytics names the YOLO11 weights "yolo11n.pt" (no "v"), so
+            # the previous "yolov11n.pt" could never be resolved.
+            model_path = 'best.pt' if os.path.exists('best.pt') else 'yolo11n.pt'
+            self.yolo_model = YOLO(model_path)
+            return True
+        except Exception as e:
+            logger.warning(f"YOLO loading failed: {e}")
+            return False
+    def detect_structures_optional(self, image):
+        """Run YOLO on ``image`` and return ``(annotated_image, status_message)``.
+
+        When the detector is unavailable or fails, the input image is
+        returned unchanged together with an explanatory message.
+        """
+        if self.yolo_model is None and not self.load_yolo_optional():
+            return image, "Structure detection unavailable (optional feature)"
+        try:
+            # Force three channels first: COLOR_RGB2BGR rejects RGBA,
+            # palette and greyscale arrays.
+            rgb_pixels = np.array(image.convert('RGB'))
+            img_cv = cv2.cvtColor(rgb_pixels, cv2.COLOR_RGB2BGR)
+            results = self.yolo_model(img_cv)
+            annotated_img = results[0].plot()
+            annotated_pil = Image.fromarray(cv2.cvtColor(annotated_img, cv2.COLOR_BGR2RGB))
+            return annotated_pil, "Structures detected"
+        except Exception as e:
+            logger.warning(f"Structure detection failed: {e}")
+            return image, f"Detection failed: {str(e)}"
+    def _build_analysis_prompt(self, prompt, style, editing_mode):
+        """Compose the text instruction sent to Gemini for the chosen editing mode."""
+        if editing_mode == "complete":
+            base_prompt = self._get_completion_prompt(style)
+            return f"Analyze this construction image and describe how to {base_prompt.lower()} User request: {prompt}. Provide detailed description of the completed construction."
+        if editing_mode == "edit":
+            return f"Analyze this construction image and describe how to edit it: {prompt}. Explain the changes that would transform this image."
+        if editing_mode == "blend":
+            return f"Analyze this construction image and describe how to blend and transform it: {prompt}. Explain how to create a seamless fusion."
+        return f"Analyze this construction image: {prompt}"
+    def nano_banana_edit(self, image, prompt, style="realistic", editing_mode="complete"):
+        """Ask Gemini to analyse ``image`` and return ``(result_image, status_message)``.
+
+        On success the result is the (possibly downscaled) input with a demo
+        overlay and the message starts with a sparkle emoji. On any failure
+        an image without overlay is returned with a message describing the
+        problem; this method does not raise.
+        """
+        if not self.gemini_model:
+            if not GEMINI_API_KEY:
+                return image, "🔑 API key required for Nano Banana. Add GEMINI_API_KEY to use this feature."
+            return image, "Gemini Nano Banana not available"
+        # A missing prompt (None) is treated the same as a blank one.
+        if not prompt or not prompt.strip():
+            return image, "Please provide a transformation prompt"
+        try:
+            image = self._resize_image_if_needed(image)
+            self._apply_rate_limiting()
+            analysis_prompt = self._build_analysis_prompt(prompt, style, editing_mode)
+            # Encode once, outside the retry loop. PNG is lossless, so no
+            # "quality" option applies.
+            buffered = io.BytesIO()
+            image.save(buffered, format='PNG')
+            image_bytes = buffered.getvalue()
+            if len(image_bytes) > 10 * 1024 * 1024:
+                return image, "Image too large. Please use a smaller image."
+            # The SDK's blob form takes the raw bytes; no base64 round trip.
+            request = [analysis_prompt, {'mime_type': 'image/png', 'data': image_bytes}]
+            for attempt in range(API_RETRY_COUNT):
+                is_last_attempt = attempt >= API_RETRY_COUNT - 1
+                try:
+                    response = self.gemini_model.generate_content(request)
+                    if hasattr(response, 'text') and response.text:
+                        processed_image = self._create_nano_banana_demo(image, response.text, style, editing_mode)
+                        return processed_image, f"✨ Nano Banana Analysis: {editing_mode} mode with {style} style"
+                    if is_last_attempt:
+                        return image, "No analysis generated - please try a different prompt"
+                except Exception as retry_error:
+                    if is_last_attempt:
+                        raise
+                    logger.warning(f"Attempt {attempt + 1} failed: {retry_error}")
+                # Exponential back-off before the next attempt: 1s, 2s, ...
+                time.sleep(2 ** attempt)
+            # Only reached when API_RETRY_COUNT is configured as 0.
+            return image, "No analysis generated - please try a different prompt"
+        except Exception as e:
+            logger.error(f"Nano Banana error: {e}")
+            if "quota" in str(e).lower() or "limit" in str(e).lower():
+                return image, "⏱️ API rate limit reached. Please try again in a few minutes."
+            return image, f"Processing failed: {str(e)}"
+    def _create_nano_banana_demo(self, image, analysis_text, style, editing_mode):
+        """Return a copy of ``image`` with a coloured border and a caption bar.
+
+        ``analysis_text`` is accepted for interface compatibility but is not
+        rendered. If the overlay cannot be built, the input image is returned.
+        """
+        try:
+            style_colors = {
+                "realistic": (34, 139, 34),
+                "futuristic": (0, 191, 255),
+                "artistic": (255, 20, 147)
+            }
+            color = style_colors.get(style, (100, 100, 100))
+            width, height = image.size
+            overlay = Image.new('RGBA', (width, height), (0, 0, 0, 0))
+            overlay_draw = ImageDraw.Draw(overlay)
+            border_width = 8
+            # Rectangle corners are inclusive, so the far corner of the image
+            # is (width - 1, height - 1).
+            overlay_draw.rectangle([0, 0, width - 1, height - 1], outline=color + (180,), width=border_width)
+            text_bg_height = 60
+            overlay_draw.rectangle([0, max(0, height - text_bg_height), width - 1, height - 1], fill=color + (200,))
+            # ASCII-only caption: the default font has no emoji glyph, and
+            # the old emoji caption could be dropped silently.
+            caption = f"Nano Banana: {editing_mode.title()} - {style.title()}"
+            try:
+                font = ImageFont.load_default()
+                text_width = overlay_draw.textlength(caption, font=font)
+                text_x = max(0, (width - text_width) // 2)
+                overlay_draw.text((text_x, height - 35), caption, fill=(255, 255, 255), font=font)
+            except Exception as e:
+                # The caption is best-effort; keep the border and bar.
+                logger.warning(f"Demo caption skipped: {e}")
+            return Image.alpha_composite(image.convert('RGBA'), overlay).convert('RGB')
+        except Exception as e:
+            logger.warning(f"Demo overlay failed: {e}")
+            return image
+    def _get_completion_prompt(self, style):
+        """Return the base completion instruction for ``style`` (defaults to realistic)."""
+        prompts = {
+            "realistic": "Complete this unfinished construction realistically with proper materials and architectural details.",
+            "futuristic": "Transform this construction into a futuristic high-tech building with modern elements.",
+            "artistic": "Complete this construction with creative artistic elements and unique design features."
+        }
+        return prompts.get(style, prompts["realistic"])
+    def generate_voice_optional(self, text):
+        """Return ElevenLabs audio for ``text``, or None when narration is unavailable.
+
+        If the ``elevenlabs`` import failed at module load, ``generate`` is
+        undefined; the resulting NameError is caught below like any other
+        failure.
+        """
+        if not ELEVENLABS_API_KEY:
+            return None
+        try:
+            audio = generate(text=text, voice="Rachel", model="eleven_monolingual_v1")
+            return audio
+        except Exception as e:
+            logger.warning(f"Voice generation failed: {e}")
+            return None
+    def create_comparison(self, original, processed):
+        """Return a side-by-side BEFORE/AFTER image, or None if it cannot be built.
+
+        Both images are resized to the same box (at most 512x512) and pasted
+        onto a white canvas with a 20px gap and a 20px label strip on top.
+        """
+        if original is None or processed is None:
+            return None
+        try:
+            height = min(original.height, processed.height, 512)
+            width = min(original.width, processed.width, 512)
+            orig_resized = original.resize((width, height), Image.Resampling.LANCZOS)
+            proc_resized = processed.resize((width, height), Image.Resampling.LANCZOS)
+            comparison = Image.new('RGB', (width * 2 + 20, height + 40), 'white')
+            comparison.paste(orig_resized, (0, 20))
+            comparison.paste(proc_resized, (width + 20, 20))
+            draw = ImageDraw.Draw(comparison)
+            try:
+                font = ImageFont.load_default()
+                draw.text((width//2 - 30, 5), "BEFORE", fill='black', font=font)
+                draw.text((width + 20 + width//2 - 30, 5), "AFTER", fill='black', font=font)
+            except Exception as e:
+                # Labels are best-effort; the comparison is still usable.
+                logger.warning(f"Comparison labels skipped: {e}")
+            return comparison
+        except Exception as e:
+            logger.warning(f"Comparison creation failed: {e}")
+            return None
+# Module-level backend instance; process_nano_banana calls its methods.
+app = NanoBananaApp()
+def process_nano_banana(image, prompt, style, editing_mode, enable_detection, enable_voice):
+    """Gradio click handler: optional detection, Gemini analysis, optional narration.
+
+    Returns a 6-tuple in the order of the click handler's outputs:
+    ``(original, detection_image, result_image, comparison, status, audio)``.
+    Any unexpected error is reported through the status text instead of
+    being raised.
+    """
+    if image is None:
+        return None, None, None, None, "📷 Please upload an image to get started", None
+    if not prompt or not prompt.strip():
+        return image, image, image, None, "💭 Please provide a transformation prompt", None
+    try:
+        detection_result = image
+        detection_msg = "Detection disabled"
+        if enable_detection:
+            detection_result, detection_msg = app.detect_structures_optional(image)
+        processed_image, process_msg = app.nano_banana_edit(image, prompt, style, editing_mode)
+        if "API key required" in process_msg:
+            # The backend message already starts with the key emoji, so it is
+            # passed through as-is instead of being prefixed a second time.
+            return image, detection_result, image, None, process_msg, None
+        # nano_banana_edit marks success with a sparkle prefix. Comparing the
+        # images is unreliable: a failed call can return a resized copy.
+        transformed = process_msg.startswith("✨")
+        comparison = app.create_comparison(image, processed_image)
+        audio = None
+        voice_msg = ""
+        if enable_voice:
+            if transformed:
+                voice_text = f"Nano Banana analyzed this construction image using {editing_mode} mode with {style} style. The AI has processed the request: {prompt}"
+                audio = app.generate_voice_optional(voice_text)
+                voice_msg = "🔊 Voice generated" if audio else "🔇 Voice unavailable"
+            else:
+                voice_msg = "🔇 Voice skipped (no changes)"
+        status_parts = [f"🍌 {process_msg}"]
+        if enable_detection:
+            status_parts.append(f"📍 Detection: {detection_msg}")
+        if enable_voice:
+            status_parts.append(f"🎵 Voice: {voice_msg}")
+        status = "\n".join(status_parts)
+        return image, detection_result, processed_image, comparison, status, audio
+    except Exception as e:
+        logger.error(f"Processing error: {e}")
+        return image, image, image, None, f"❌ Unexpected error: {str(e)}", None
+# Stylesheet handed to gr.Blocks: an animated gradient banner
+# (.nano-banner) and a green frame (.feature-highlight).
+custom_css = """
+.nano-banner {
+    background: linear-gradient(45deg, #ff6b6b, #feca57, #48dbfb, #ff9ff3);
+    background-size: 400% 400%;
+    animation: gradient 15s ease infinite;
+    padding: 20px;
+    border-radius: 10px;
+    text-align: center;
+    margin-bottom: 20px;
+}
+@keyframes gradient {
+    0% { background-position: 0% 50%; }
+    50% { background-position: 100% 50%; }
+    100% { background-position: 0% 50%; }
+}
+.feature-highlight {
+    border: 2px solid #4CAF50;
+    border-radius: 8px;
+    padding: 15px;
+    margin: 10px 0;
+}
+"""
+# HTML notice appended to the banner; stays empty when GEMINI_API_KEY is set.
+demo_mode_notice = ""
+if not GEMINI_API_KEY:
+    demo_mode_notice = """
+    <div style="background: #ffebee; border: 1px solid #f44336; border-radius: 8px; padding: 15px; margin: 10px 0;">
+        <h3>🔑 API Key Required</h3>
+        <p>To use Nano Banana features, add your <strong>GEMINI_API_KEY</strong> in the Space settings.</p>
+        <p>Get your free API key from <a href="https://makersuite.google.com/app/apikey" target="_blank">Google AI Studio</a></p>
+    </div>
+    """
+# Gradio UI: inputs and status on the left, tabbed image outputs on the
+# right, followed by the audio player, example rows and a feature list.
+with gr.Blocks(title="🍌 Nano Banana - Dynamic Image Creation", theme=gr.themes.Soft(), css=custom_css) as demo:
+    # Banner, plus the API-key notice when no key is configured.
+    gr.HTML(f"""
+    <div class="nano-banner">
+        <h1>🍌 Nano Banana: Dynamic Image Creation</h1>
+        <p><strong>Powered by Gemini 2.5 Flash Image Preview</strong></p>
+        <p>Edit with words • Blend realities • Transform visuals</p>
+    </div>
+    {demo_mode_notice}
+    """)
+    with gr.Row():
+        with gr.Column(scale=1):
+            with gr.Group():
+                gr.Markdown("### 🎨 Core Nano Banana Features")
+                # type="pil" makes the callback receive a PIL image.
+                image_input = gr.Image(label="Upload Image", type="pil", height=300)
+                prompt_input = gr.Textbox(
+                    label="Transformation Prompt",
+                    placeholder="Describe how you want to transform this image...",
+                    lines=3
+                )
+                editing_mode = gr.Radio(
+                    choices=["complete", "edit", "blend"],
+                    value="edit",
+                    label="Nano Banana Mode",
+                    info="Complete: Finish construction • Edit: Modify image • Blend: Fuse elements"
+                )
+                style_selector = gr.Radio(
+                    choices=["realistic", "futuristic", "artistic"],
+                    value="realistic",
+                    label="Style",
+                    info="Choose the aesthetic approach"
+                )
+            with gr.Group():
+                gr.Markdown("### ⚙️ Optional Features")
+                enable_detection = gr.Checkbox(
+                    label="🔍 Structure Detection (YOLO)",
+                    value=False,
+                    info="Optional: Detect and highlight structures"
+                )
+                enable_voice = gr.Checkbox(
+                    label="🔊 Voice Narration (ElevenLabs)",
+                    value=False,
+                    info="Optional: Generate audio description"
+                )
+            process_btn = gr.Button("🚀 Transform with Nano Banana", variant="primary", size="lg")
+            status_output = gr.Textbox(label="Status", interactive=False, lines=4)
+        with gr.Column(scale=2):
+            with gr.Tabs():
+                with gr.Tab("📷 Original"):
+                    original_output = gr.Image(label="Original Image", height=400)
+                with gr.Tab("🔍 Detection (Optional)"):
+                    detection_output = gr.Image(label="Structure Detection", height=400)
+                with gr.Tab("🍌 Nano Banana Result"):
+                    result_output = gr.Image(label="Transformed Image", height=400, elem_classes=["feature-highlight"])
+                with gr.Tab("📊 Before/After"):
+                    comparison_output = gr.Image(label="Comparison View", height=400)
+    with gr.Row():
+        audio_output = gr.Audio(label="🔊 Voice Description (Optional)", visible=True)
+    with gr.Row():
+        # Each example row follows the order of `inputs` below:
+        # image path, prompt, style, mode, detection flag, voice flag.
+        # NOTE(review): the samples/ files are not part of this diff - confirm they exist.
+        gr.Examples(
+            examples=[
+                ["samples/building_001.jpg", "Complete this modern building with glass facade", "realistic", "complete", False, False],
+                ["samples/bridge_049.jpg", "Transform into futuristic suspension bridge", "futuristic", "edit", True, False],
+                ["samples/road_088.jpg", "Complete as smart highway with LED lights", "futuristic", "blend", False, True],
+                ["samples/construction_019.jpg", "Add artistic elements and colorful design", "artistic", "edit", False, False],
+                ["samples/infrastructure_015.jpg", "Complete with sustainable green technology", "realistic", "complete", True, False],
+                ["samples/residential_004.jpg", "Transform into eco-friendly smart home", "futuristic", "blend", False, False],
+                ["samples/commercial_010.jpg", "Add modern commercial design elements", "realistic", "edit", False, False],
+                ["samples/construction_111.jpg", "Complete with artistic architectural details", "artistic", "complete", False, True]
+            ],
+            inputs=[image_input, prompt_input, style_selector, editing_mode, enable_detection, enable_voice],
+            label="🎯 Try These Examples"
+        )
+    gr.Markdown("""
+    ### 🏆 Competition Features
+    - **Nano Banana Core**: Gemini 2.5 Flash Image for dynamic creation
+    - **Word-Based Editing**: Transform images with natural language
+    - **Reality Blending**: Seamlessly fuse different visual elements
+    - **Optional Enhancements**: Structure detection and voice narration
+    - **Real-time Processing**: Fast image transformations
+    """)
+    # The six outputs line up with the 6-tuple returned by process_nano_banana.
+    process_btn.click(
+        fn=process_nano_banana,
+        inputs=[image_input, prompt_input, style_selector, editing_mode, enable_detection, enable_voice],
+        outputs=[original_output, detection_output, result_output, comparison_output, status_output, audio_output]
+    )
+if __name__ == "__main__":
+    # Listen on all interfaces on port 7860.
+    # share=False: Hugging Face Spaces does not support share links, and
+    # elsewhere share=True would expose the app through a public tunnel.
+    demo.launch(
+        server_name="0.0.0.0",
+        server_port=7860,
+        share=False
     )