File size: 9,644 Bytes
42bf28c
 
 
b151b8a
6954f98
a8b0d0d
42bf28c
 
 
6954f98
a8b0d0d
42bf28c
 
 
 
a8b0d0d
 
42bf28c
 
2f8f161
 
 
 
 
 
 
 
 
42bf28c
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
534b2bf
42bf28c
 
 
61e6e27
 
 
 
42bf28c
 
 
 
 
 
534b2bf
42bf28c
 
534b2bf
42bf28c
61e6e27
 
534b2bf
61e6e27
534b2bf
61e6e27
 
b5fbe5a
42bf28c
61e6e27
 
 
42bf28c
534b2bf
6954f98
534b2bf
 
6954f98
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
534b2bf
 
6954f98
534b2bf
 
 
42bf28c
534b2bf
42bf28c
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
61e6e27
42bf28c
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
534b2bf
42bf28c
 
534b2bf
 
42bf28c
 
534b2bf
 
 
 
 
 
 
42bf28c
 
 
 
 
534b2bf
42bf28c
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
534b2bf
61e6e27
 
 
 
 
42bf28c
 
 
 
 
 
 
 
 
af86f7f
42bf28c
 
 
6954f98
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
175
176
177
178
179
180
181
182
183
184
185
186
187
188
189
190
191
192
193
194
195
196
197
198
199
200
201
202
203
204
205
206
207
208
209
210
211
212
213
214
215
216
217
218
219
220
221
222
223
224
225
226
227
228
229
230
231
232
233
234
235
236
237
238
239
240
241
242
243
244
245
246
247
248
249
250
251
"""
Gradio web interface for CellposeAgent
"""
import os
import json
import gradio as gr
from pathlib import Path
from langfuse import get_client
from openinference.instrumentation.smolagents import SmolagentsInstrumentor
from smolagents.agents import ActionStep

from config import settings
from agents.agent import CellposeAgent
from stores import neo4j_store
from utils.prechecks import check_hf_persistent_storage


def setup_observability():
    """Set up Langfuse tracing and Smolagents instrumentation.

    Tracing is enabled only when both Langfuse API keys are present in the
    environment. Any initialization failure is reported on stdout but is
    never fatal to the application.
    """
    try:
        keys_present = os.getenv("LANGFUSE_PUBLIC_KEY") and os.getenv("LANGFUSE_SECRET_KEY")
        if not keys_present:
            # Run without observability rather than failing startup.
            print("⚠️  Langfuse keys not found. Observability disabled.")
            return
        get_client()
        SmolagentsInstrumentor().instrument()
        print("βœ“ Observability and instrumentation initialized.")
    except Exception as e:
        print(f"⚠️  Could not initialize observability: {e}")


def initialize_app():
    """Run startup prerequisites; return True when the app is ready.

    Steps: observability setup, LlamaIndex configuration, HF persistent
    storage checks for the Cellpose DB and the SAM checkpoint, then a
    Neo4j knowledge-graph sanity check.

    Returns:
        bool: True when every prerequisite passed, False otherwise.
    """
    print("\n--- Initializing Cellpose Agent Application ---")

    setup_observability()
    settings.configure_llama_index()

    # Required artifacts in HF persistent storage: (repo_id, target, kind).
    storage_artifacts = (
        ("hmgill/Cellpose-DB", "cellpose_db", "folder"),
        ("hmgill/Cellpose-SAM-Checkpoint", "sam_vit_h_4b8939.pth", "file"),
    )
    for repo_id, target, kind in storage_artifacts:
        check_hf_persistent_storage(
            repo_id=repo_id,
            target=target,
            file_or_folder=kind,
        )

    # The agent is unusable without a populated knowledge graph.
    try:
        node_count, _ = neo4j_store.check_graph_status()
    except Exception as e:
        print(f"❌ ERROR: Could not connect to Neo4j: {e}")
        print("Please ensure Neo4j is running and accessible.")
        return False

    if node_count == 0:
        print("\n❌ WARNING: The knowledge graph is empty.")
        print("Please run the setup script to build the knowledge graph:")
        print("\n    python setup_kg.py\n")
        return False

    print(f"βœ“ Knowledge graph is ready with {node_count} nodes.")
    return True


def process_image_task(image_path: str, task_text: str, agent: CellposeAgent) -> tuple[str, str | None]:
    """
    Process a user task with the CellposeAgent.
    
    The image_path is now passed SEPARATELY to agent.run() so it gets stored
    in global context. This prevents the LLM from needing to reproduce the 
    exact path string (which it often corrupts).
    
    Args:
        image_path: Path to the uploaded image file
        task_text: User's text prompt/question
        agent: Initialized CellposeAgent instance
    
    Returns:
        tuple: (agent's text response, path to segmented image or None)
    """
    if not image_path:
        return "⚠️ Please upload an image first.", None
    
    # Build task WITHOUT embedding the full path
    # The agent instructions tell it to use image_path="" and the tool will resolve from context
    if not task_text or task_text.strip() == "":
        task = "Analyze the uploaded image and recommend optimal segmentation parameters. Then run segmentation."
    else:
        # Don't include the path in the task - it will be available via context
        task = task_text
    
    try:
        # Pass image_path SEPARATELY - this stores it in global context
        # Tools will retrieve the correct path from context instead of relying on LLM
        result = agent.run(task=task, image_path=image_path)
        get_client().flush()
        
        # Extract output image path from agent's memory (more reliable than parsing text)
        output_image_path = None
        try:
            # Search through agent's memory steps in reverse order (most recent first)
            for step in reversed(agent.agent.memory.steps):
                if isinstance(step, ActionStep) and step.observations:
                    try:
                        obs_data = json.loads(step.observations)
                        
                        # Check if this step contains segmentation output
                        if obs_data.get("status") == "success" and "output_path" in obs_data:
                            candidate_path = obs_data["output_path"]
                            
                            # Verify the file exists
                            if Path(candidate_path).exists():
                                output_image_path = candidate_path
                                print(f"βœ“ Found segmentation output: {output_image_path}")
                                break
                                
                    except (json.JSONDecodeError, Exception) as parse_error:
                        continue
            
            if output_image_path is None:
                print("ℹ️ No segmentation output found in agent memory")
                    
        except Exception as e:
            print(f"Warning: Could not extract output image from agent memory: {e}")
        
        return result, output_image_path
        
    except Exception as e:
        return f"❌ Error processing task: {str(e)}", None


def create_gradio_interface() -> gr.Blocks:
    """Creates and configures the Gradio interface.

    Builds a two-column Blocks layout (image + task inputs on the left,
    agent response and segmentation overlay on the right) and wires the
    submit button to `process_image_task`. The agent is constructed once
    here and captured by the click handler's closure.

    Returns:
        gr.Blocks: the assembled (un-launched) demo.

    Raises:
        RuntimeError: if `initialize_app()` reports the app is not ready.
    """
    
    # Initialize the agent once at startup
    if not initialize_app():
        raise RuntimeError("Failed to initialize application. Please check logs.")
    
    agent = CellposeAgent()
    print("βœ“ CellposeAgent initialized and ready.")
    
    with gr.Blocks(title="Cellpose-SAM Agent", theme=gr.themes.Soft()) as demo:
        gr.Markdown(
            """
            # πŸ”¬ Cellpose-SAM Segmentation Agent
            
            Upload a microscopy image and ask the AI agent to recommend optimal segmentation parameters,
            run segmentation, or answer questions about the cellpose-sam pipeline.
            """
        )
        
        with gr.Row():
            with gr.Column(scale=1):
                # Image upload; type="filepath" hands a path (not an array)
                # to the handler, matching process_image_task's contract.
                image_input = gr.Image(
                    label="Upload Microscopy Image",
                    type="filepath",
                    height=300
                )
                
                # Task input (free text; empty falls back to a default task)
                task_input = gr.Textbox(
                    label="Task / Question",
                    placeholder="e.g., 'What parameters would work best?' or 'Run segmentation' (image path handled automatically)",
                    lines=3
                )
                
                # Submit button
                submit_btn = gr.Button("Run Agent", variant="primary", size="lg")
                
                # Example tasks (clicking fills task_input only)
                gr.Markdown("### πŸ’‘ Example Tasks")
                gr.Examples(
                    examples=[
                        ["What parameters would work best for this image?"],
                        ["Analyze this image and run segmentation with optimal parameters."],
                        ["What is the flow_threshold parameter and how does it affect segmentation?"],
                        ["Run segmentation with diameter=30, flow_threshold=0.5, cellprob_threshold=0, min_size=20"],
                    ],
                    inputs=task_input,
                    label="Click to use:"
                )
            
            with gr.Column(scale=1):
                # Text output
                output = gr.Textbox(
                    label="Agent Response",
                    lines=12,
                    max_lines=20,
                    show_copy_button=True
                )
                
                # Image output for segmentation results (filepath returned
                # by process_image_task, or None when no output was found)
                output_image = gr.Image(
                    label="Segmentation Result",
                    type="filepath",
                    height=400
                )
        
        # Event handler: the lambda closes over the single shared agent.
        submit_btn.click(
            fn=lambda img, task: process_image_task(img, task, agent),
            inputs=[image_input, task_input],
            outputs=[output, output_image]
        )
        
        gr.Markdown(
            """
            ---
            ### πŸ“š What can this agent do?
            
            - **Parameter Recommendation**: Analyzes your image and suggests optimal segmentation parameters
            - **Automated Segmentation**: Runs the full cellpose-sam pipeline with parameter refinement
            - **Visual Analysis**: Uses vision-language models to assess segmentation quality
            - **Documentation Search**: Answers questions about parameters using RAG and knowledge graphs
            - **Iterative Refinement**: Automatically adjusts parameters based on visual feedback
            
            ### πŸ” How it works
            
            1. Upload your microscopy image
            2. The agent finds similar images and recommends parameters
            3. Visually analyzes your image to validate recommendations
            4. Runs segmentation and checks quality
            5. Refines parameters if needed (up to 2 iterations)
            6. **Displays the segmented overlay image with colored cell masks**
            
            ### βš™οΈ Technical Note
            
            Image paths are handled automatically by the system - the agent doesn't need to 
            reproduce exact file paths, preventing common path corruption issues with LLMs.
            """
        )
    
    return demo


def main():
    """Entry point: build the Gradio app and serve it on port 7860."""
    create_gradio_interface().launch(server_port=7860)


if __name__ == "__main__":
    main()