Spaces:

bhatanerohan
/

SAM3d

Running

App Files Files Community

bhatanerohan committed on Dec 2, 2025

Commit

70fa0ce

verified ·

1 Parent(s): 0e13096

Update app.py

Browse files

Files changed (1) hide show

app.py +48 -61

app.py CHANGED Viewed

@@ -6,6 +6,7 @@ MCP Server + Gradio UI for MCP Hackathon
 import os
 import io
 import json
 import tempfile
 import gradio as gr
 from google import genai
@@ -55,7 +56,7 @@ def generate_3d_model(prompt: str) -> str:
         prompt: Text description of the object to generate (e.g., "a red sports car", "a wooden chair")
     Returns:
-        JSON string with paths to generated files
     """
     if not client:
         if not init_gemini():
@@ -78,7 +79,7 @@ def generate_3d_model(prompt: str) -> str:
                 break
         if initial_image is None:
-            return json.dumps({"error": "Image generation failed"})
         # STEP 2: Remove background
         edit_prompt = "Remove the background completely, make the background transparent. Preserve the object's shadow for realism."
@@ -100,7 +101,7 @@ def generate_3d_model(prompt: str) -> str:
                 break
         if final_image is None:
-            return json.dumps({"error": "Background removal failed"})
         # STEP 3: Create grayscale mask
         gray = final_image.convert("L")
@@ -108,59 +109,52 @@ def generate_3d_model(prompt: str) -> str:
         # STEP 4: Run SAM-3D
         ply_bytes, glb_bytes = run_sam3d(final_image, gray)
-        # Save all outputs
-        temp_dir = tempfile.mkdtemp()
-        original_path = os.path.join(temp_dir, "original.png")
-        nobg_path = os.path.join(temp_dir, "transparent.png")
-        mask_path = os.path.join(temp_dir, "mask.png")
-        ply_path = os.path.join(temp_dir, "model.ply")
-        initial_image.save(original_path)
-        final_image.save(nobg_path)
-        gray.save(mask_path)
-        with open(ply_path, 'wb') as f:
-            f.write(ply_bytes)
-        glb_path = None
-        if glb_bytes:
-            glb_path = os.path.join(temp_dir, "model.glb")
-            with open(glb_path, 'wb') as f:
-                f.write(glb_bytes)
         return json.dumps({
             "success": True,
             "prompt": prompt,
-            "original_image": original_path,
-            "transparent_image": nobg_path,
-            "mask_image": mask_path,
-            "ply_model": ply_path,
-            "glb_model": glb_path,
-            "message": f"Successfully generated 3D model for: {prompt}"
         })
     except Exception as e:
-        return json.dumps({"error": str(e)})
-def edit_3d_model(edit_prompt: str, transparent_image_path: str) -> str:
     """
     Edit an existing 3D model by modifying its transparent image and regenerating.
     Args:
         edit_prompt: Description of the edit to apply (e.g., "remove the wings", "change color to blue")
-        transparent_image_path: Path to the transparent PNG image from a previous generation
     Returns:
-        JSON string with paths to the new edited files
     """
     if not client:
         if not init_gemini():
             return json.dumps({"error": "GEMINI_API_KEY not configured"})
     try:
-        current_image = Image.open(transparent_image_path)
         image_part = types.Part.from_bytes(
             data=image_to_bytes(current_image),
@@ -182,42 +176,35 @@ def edit_3d_model(edit_prompt: str, transparent_image_path: str) -> str:
                 break
         if edited_image is None:
-            return json.dumps({"error": "Edit failed"})
         gray = edited_image.convert("L")
         ply_bytes, glb_bytes = run_sam3d(edited_image, gray)
-        temp_dir = tempfile.mkdtemp()
-        nobg_path = os.path.join(temp_dir, "edited.png")
-        mask_path = os.path.join(temp_dir, "mask.png")
-        ply_path = os.path.join(temp_dir, "model.ply")
-        edited_image.save(nobg_path)
-        gray.save(mask_path)
-        with open(ply_path, 'wb') as f:
-            f.write(ply_bytes)
-        glb_path = None
-        if glb_bytes:
-            glb_path = os.path.join(temp_dir, "model.glb")
-            with open(glb_path, 'wb') as f:
-                f.write(glb_bytes)
         return json.dumps({
             "success": True,
             "edit_prompt": edit_prompt,
-            "transparent_image": nobg_path,
-            "mask_image": mask_path,
-            "ply_model": ply_path,
-            "glb_model": glb_path,
-            "message": f"Successfully applied edit: {edit_prompt}"
         })
     except Exception as e:
-        return json.dumps({"error": str(e)})
 # ============================================================
 # GRADIO UI FUNCTIONS
@@ -422,7 +409,7 @@ edit_tool = gr.Interface(
     fn=edit_3d_model,
     inputs=[
         gr.Textbox(label="Edit Prompt", placeholder="Remove the wings"),
-        gr.Textbox(label="Transparent Image Path", placeholder="/path/to/transparent.png")
     ],
     outputs=gr.Textbox(label="Result (JSON)"),
     api_name="edit_3d",

 import os
 import io
 import json
+import base64
 import tempfile
 import gradio as gr
 from google import genai
         prompt: Text description of the object to generate (e.g., "a red sports car", "a wooden chair")
     Returns:
+        JSON string with base64-encoded files
     """
     if not client:
         if not init_gemini():
                 break
         if initial_image is None:
+            return json.dumps({"error": "Image generation failed - no image in response"})
         # STEP 2: Remove background
         edit_prompt = "Remove the background completely, make the background transparent. Preserve the object's shadow for realism."
                 break
         if final_image is None:
+            return json.dumps({"error": "Background removal failed - no image in response"})
         # STEP 3: Create grayscale mask
         gray = final_image.convert("L")
         # STEP 4: Run SAM-3D
         ply_bytes, glb_bytes = run_sam3d(final_image, gray)
+        # STEP 5: Encode outputs as base64 (NO FILE PATHS!)
+        original_b64 = base64.b64encode(image_to_bytes(initial_image)).decode()
+        transparent_b64 = base64.b64encode(image_to_bytes(final_image)).decode()
+        mask_b64 = base64.b64encode(image_to_bytes(gray)).decode()
+        ply_b64 = base64.b64encode(ply_bytes).decode()
+        glb_b64 = base64.b64encode(glb_bytes).decode() if glb_bytes else None
         return json.dumps({
             "success": True,
             "prompt": prompt,
+            "message": f"✅ Successfully generated 3D model for: {prompt}",
+            "files": {
+                "original_image_base64": original_b64,
+                "transparent_image_base64": transparent_b64,
+                "mask_image_base64": mask_b64,
+                "ply_model_base64": ply_b64,
+                "glb_model_base64": glb_b64
+            },
+            "instructions": "Files are base64-encoded. To save: decode base64 and write to disk."
         })
     except Exception as e:
+        return json.dumps({
+            "error": str(e),
+            "error_type": type(e).__name__
+        })
+def edit_3d_model(edit_prompt: str, transparent_image_base64: str) -> str:
     """
     Edit an existing 3D model by modifying its transparent image and regenerating.
     Args:
         edit_prompt: Description of the edit to apply (e.g., "remove the wings", "change color to blue")
+        transparent_image_base64: Base64-encoded transparent PNG image from a previous generation
     Returns:
+        JSON string with base64-encoded edited files
     """
     if not client:
         if not init_gemini():
             return json.dumps({"error": "GEMINI_API_KEY not configured"})
     try:
+        # Decode base64 image (instead of reading file path)
+        image_bytes = base64.b64decode(transparent_image_base64)
+        current_image = Image.open(io.BytesIO(image_bytes))
         image_part = types.Part.from_bytes(
             data=image_to_bytes(current_image),
                 break
         if edited_image is None:
+            return json.dumps({"error": "Edit failed - no image in response"})
         gray = edited_image.convert("L")
         ply_bytes, glb_bytes = run_sam3d(edited_image, gray)
+        # Encode outputs as base64 (NO FILE PATHS!)
+        transparent_b64 = base64.b64encode(image_to_bytes(edited_image)).decode()
+        mask_b64 = base64.b64encode(image_to_bytes(gray)).decode()
+        ply_b64 = base64.b64encode(ply_bytes).decode()
+        glb_b64 = base64.b64encode(glb_bytes).decode() if glb_bytes else None
         return json.dumps({
             "success": True,
             "edit_prompt": edit_prompt,
+            "message": f"✅ Successfully applied edit: {edit_prompt}",
+            "files": {
+                "transparent_image_base64": transparent_b64,
+                "mask_image_base64": mask_b64,
+                "ply_model_base64": ply_b64,
+                "glb_model_base64": glb_b64
+            },
+            "instructions": "Files are base64-encoded. To save: decode base64 and write to disk."
         })
     except Exception as e:
+        return json.dumps({
+            "error": str(e),
+            "error_type": type(e).__name__
+        })
 # ============================================================
 # GRADIO UI FUNCTIONS
     fn=edit_3d_model,
     inputs=[
         gr.Textbox(label="Edit Prompt", placeholder="Remove the wings"),
+        gr.Textbox(label="Transparent Image (base64)", placeholder="Paste base64-encoded PNG from previous generation")
     ],
     outputs=gr.Textbox(label="Result (JSON)"),
     api_name="edit_3d",