"""
FastAPI endpoints for Ollama chat and donor/volunteer recommendation system.

Endpoints:
- /chat: Chat with Ollama model using LangGraph with memory
- /donors/register: Register a donor and generate embedding
- /volunteers/register: Register a volunteer and generate embedding
- /donors/recommend: Find similar donors based on query
- /volunteers/recommend: Find similar volunteers based on query
- /forms/{id}: Get/Delete a stored form
- /forms/stats/summary: Get form counts by type
"""

import os
import sys
import asyncio
from contextlib import asynccontextmanager
from typing import Optional, List, Dict, Any

# Make this file's directory importable so the local packages imported
# further down (encoders, recommender, graph, agents, tools) resolve no
# matter which working directory the server is started from.
APP_DIR = os.path.dirname(os.path.abspath(__file__))
if APP_DIR not in sys.path:
    sys.path.insert(0, APP_DIR)

from fastapi import FastAPI, HTTPException
from fastapi.responses import StreamingResponse
from fastapi.middleware.cors import CORSMiddleware
from pydantic import BaseModel, Field

# Windows-specific fix for psycopg async compatibility: at import time,
# switch asyncio to the selector-based event loop policy on win32 only.
if sys.platform == "win32":
    asyncio.set_event_loop_policy(asyncio.WindowsSelectorEventLoopPolicy())

# Load .env file for local development. python-dotenv is optional: when it
# is not installed the ImportError is ignored and configuration comes from
# the process environment only.
try:
    from dotenv import load_dotenv
    load_dotenv()
except ImportError:
    pass

# Module-level service handles. They stay None until init_services() assigns
# them at startup (its imports are deferred so a missing dependency does not
# break importing this module); endpoints answer 503 while they are unset.
encoder = None  # SeaLionEncoder instance
vector_store = None  # DonorVectorStore; only created when DB credentials are configured
pool = None  # AsyncConnectionPool backing the vector store
gis_recommender = None  # GISRecommender built from vector_store and encoder


# ============================================================================
# Pydantic Models
# ============================================================================

class ChatResponse(BaseModel):
    # Body returned by the non-streaming branch of POST /chat.
    response: str  # content of the last AI message seen, or "" when there was none


class DonorFormRequest(BaseModel):
    """Donor registration form."""
    # Request body of POST /donors/register. The handler turns it into text
    # with donor_form_to_text() for embedding and stores model_dump() as the
    # form data. `name` and `id` are stored but not part of the embedded text.
    id: str = Field(..., description="Unique identifier for the donor")
    name: str = Field(..., description="Donor name")
    donor_type: str = Field(..., description="Type: individual, corporate, foundation")
    country: str = Field(..., description="ASEAN country code (SG, MY, TH, VN, ID, PH, etc.)")
    preferred_language: str = Field(..., description="Primary language code")
    causes: List[str] = Field(default_factory=list, description="Interested causes")
    # Optional fields below are only added to the embedded text when non-empty.
    donation_frequency: Optional[str] = Field(None, description="one-time, monthly, quarterly, annual")
    amount_range: Optional[str] = Field(None, description="Preferred donation range")
    bio: Optional[str] = Field(None, description="Donor background")
    motivation: Optional[str] = Field(None, description="Why they want to donate")


class VolunteerFormRequest(BaseModel):
    """Volunteer registration form."""
    # Request body of POST /volunteers/register. The handler turns it into
    # text with volunteer_form_to_text() for embedding and stores
    # model_dump() as the form data. `name` and `id` are not embedded.
    id: str = Field(..., description="Unique identifier for the volunteer")
    name: str = Field(..., description="Volunteer name")
    volunteer_type: str = Field(..., description="Type: regular, event_based, skilled")
    country: str = Field(..., description="ASEAN country code")
    preferred_language: str = Field(..., description="Primary language code")
    languages_spoken: List[str] = Field(default_factory=list, description="All languages spoken")
    skills: List[str] = Field(default_factory=list, description="Professional/technical skills")
    # Required, unlike the other descriptive fields; always included in the embedded text.
    availability: str = Field(..., description="weekends, evenings, flexible, full_time")
    causes: List[str] = Field(default_factory=list, description="Interested causes")
    experience: Optional[str] = Field(None, description="Prior volunteer experience")
    goals: Optional[str] = Field(None, description="What they hope to achieve")


class RecommendRequest(BaseModel):
    """Request for recommendations based on a query form."""
    # Shared request body of POST /donors/recommend and /volunteers/recommend.
    # Either provide a form_id to use existing embedding, or provide form data
    form_id: Optional[str] = Field(None, description="Existing form ID to use as query")
    # Or provide inline form data; recommend_request_to_text() renders the
    # non-empty fields below into the text that gets embedded as the query.
    country: Optional[str] = None
    preferred_language: Optional[str] = None
    causes: List[str] = Field(default_factory=list)
    bio: Optional[str] = None
    motivation: Optional[str] = None
    # Search options (passed through to vector_store.find_similar)
    limit: int = Field(default=10, ge=1, le=50)  # validated to 1..50
    country_filter: Optional[str] = None
    exclude_ids: List[str] = Field(default_factory=list)  # empty list is sent as None


class FormResponse(BaseModel):
    """Response for form operations."""
    # Returned by the donor, volunteer and client registration endpoints.
    id: str
    form_type: str  # "donor", "volunteer" or "client" in this file
    message: str
    embedding_dimension: Optional[int] = None  # len() of the stored embedding


class ClientProfileRequest(BaseModel):
    """Client profile with spatial and behavioral data."""

    # Request body of POST /clients/register; the handler maps these fields
    # one-to-one onto recommender.gis_recommender.ClientProfile.
    user_id: str  # also used as the stored form id
    # Converted with tuple() by the handler; the list length is not validated here.
    coordinates: List[float] = Field(
        default=[1.3521, 103.8198], description="[lat, lng]"
    )
    planning_area: str = Field(default="central", description="Singapore planning area")
    # Passed to HousingType(...) by the handler, so it must be a valid enum value.
    housing_type: str = Field(
        default="hdb_4_room", description="Housing type for income proxy"
    )
    interests: List[str] = Field(default_factory=list)
    causes: List[str] = Field(default_factory=list)
    preferred_language: str = Field(default="en")
    is_donor: bool = False
    total_donated: float = 0.0
    donation_count: int = 0
    age_range: Optional[str] = None


class LookalikeRequest(BaseModel):
    """Request for lookalike client search."""

    # Request body of POST /clients/lookalike.
    seed_causes: List[str] = Field(..., description="Causes to find lookalikes for")
    seed_interests: List[str] = Field(default_factory=list)
    planning_area_filter: Optional[str] = Field(
        None, description="Geo-fence by planning area"
    )
    housing_type_filter: Optional[List[str]] = Field(
        None, description="Filter by housing types"
    )
    limit: int = Field(default=50, ge=1, le=200)  # validated to 1..200
    min_score: float = Field(default=0.0, ge=0.0, le=1.0)  # validated to 0.0..1.0
    include_geojson: bool = Field(
        default=True, description="Include GeoJSON for mapping"
    )


class ScoredClientResponse(BaseModel):
    """Single scored client result."""

    # Element type of LookalikeResponse.tiers.
    user_id: str
    planning_area: str
    housing_type: str
    causes: List[str]
    interests: List[str]
    is_donor: bool
    # Score fields; presumably final_score combines the three components
    # below - TODO confirm against the GIS recommender.
    final_score: float
    vector_similarity: float
    spatial_proxy: float
    proximity: float
    coordinates: Optional[List[float]] = None  # Reduced precision


class LookalikeResponse(BaseModel):
    """Response containing lookalike clients with optional GeoJSON."""

    # Response model of POST /clients/lookalike.
    seed_causes: List[str]
    total_found: int
    tiers: Dict[str, List[ScoredClientResponse]]  # scored clients grouped under a tier name
    geojson: Optional[Dict[str, Any]] = None  # optional mapping payload


class SingpassMockData(BaseModel):
    """Mock Singpass data for autofill."""

    # Value type of MOCK_SINGPASS_PROFILES and response model of the
    # /singpass/mock endpoints. Person-level fields are required; the
    # organization_* fields are optional.
    name: str
    nric_masked: str
    email: str
    mobile: str
    registered_address: str
    planning_area: str
    organization_name: Optional[str] = None
    organization_uen: Optional[str] = None
    organization_type: Optional[str] = None


class RecommendationResult(BaseModel):
    """Single recommendation result."""
    # Built field-by-field from each item returned by vector_store.find_similar().
    id: str
    form_type: str
    score: float
    distance: float
    form_data: Dict[str, Any]  # the stored form payload


class RecommendResponse(BaseModel):
    """Response containing recommendations."""
    # Response model of the donor and volunteer recommend endpoints.
    query_id: Optional[str]  # echoes RecommendRequest.form_id (may be None)
    results: List[RecommendationResult]
    total_found: int  # len(results)


class StatsResponse(BaseModel):
    """Form statistics response."""
    # Filled from vector_store.count_by_type(); a missing key is reported as 0.
    donor: int
    volunteer: int
    total: int


# ============================================================================
# Database & Encoder Setup
# ============================================================================

async def init_services():
    """Initialize the encoder and, when configured, the database services.

    Assigns the module globals ``encoder``, ``pool``, ``vector_store`` and
    ``gis_recommender``. The database-backed services are only created when
    SUPABASE_DB_HOST, SUPABASE_DB_USER and SUPABASE_DB_PASSWORD are all set.

    Initialization is best-effort: any exception (including a missing
    optional dependency) is reported on stdout and swallowed so the API can
    still start; affected endpoints then answer 503.
    """
    global encoder, vector_store, pool, gis_recommender

    try:
        from urllib.parse import quote

        from encoders.sealion import SeaLionEncoder
        from recommender.vector_store import DonorVectorStore
        from recommender.gis_recommender import GISRecommender
        from psycopg_pool import AsyncConnectionPool

        # Initialize encoder (reads SEALION_ENDPOINT from env)
        encoder = SeaLionEncoder()

        # Build connection string from env vars
        db_host = os.getenv("SUPABASE_DB_HOST")
        db_port = os.getenv("SUPABASE_DB_PORT", "6543")
        db_name = os.getenv("SUPABASE_DB_NAME", "postgres")
        db_user = os.getenv("SUPABASE_DB_USER")
        db_password = os.getenv("SUPABASE_DB_PASSWORD")
        db_sslmode = os.getenv("SUPABASE_DB_SSLMODE", "require")

        if db_host and db_user and db_password:
            # Credentials are embedded in a URI, so reserved characters such
            # as '@', ':', '/' or '#' must be percent-encoded; otherwise the
            # URI is split in the wrong place and the connection fails.
            uri_user = quote(db_user, safe="")
            uri_password = quote(db_password, safe="")
            conn_string = (
                f"postgresql://{uri_user}:{uri_password}@{db_host}:{db_port}/{db_name}"
                f"?sslmode={db_sslmode}"
            )
            pool = AsyncConnectionPool(
                conninfo=conn_string,
                max_size=10,
                kwargs={"autocommit": True, "prepare_threshold": None},
            )
            await pool.open()
            vector_store = DonorVectorStore(pool)
            gis_recommender = GISRecommender(vector_store=vector_store, encoder=encoder)
            print("[OK] Database connection pool initialized")
            print("[OK] GIS Recommender initialized")
        else:
            print("[WARN] Database credentials not configured, vector store disabled")

        print("[OK] SeaLion encoder initialized")

    except Exception as e:
        # Deliberate best-effort: report and keep the app bootable.
        print(f"[WARN] Service initialization error: {e}")
        print("  Some endpoints may not be available")


async def close_services():
    """Shut down the database connection pool, if one was created."""
    global pool
    if not pool:
        # Nothing was opened (credentials missing or startup failed).
        return
    await pool.close()
    print("[OK] Database connection pool closed")


@asynccontextmanager
async def lifespan(app: FastAPI):
    """Run startup and shutdown hooks around the application's lifetime.

    Startup initializes the encoder/database services and then the LangGraph
    chat graph. Shutdown closes the database pool.

    Args:
        app: The FastAPI application this lifespan is attached to (unused).
    """
    await init_services()
    try:
        await init_langgraph()
        yield
    finally:
        # Always release the pool, even when the context body exits with an
        # exception or cancellation instead of resuming normally.
        await close_services()


# ============================================================================
# FastAPI App
# ============================================================================

# The application object; startup/shutdown work is delegated to lifespan().
app = FastAPI(
    title="Donor Recommendation API",
    description="API for chat, donor/volunteer registration, and recommendations",
    version="1.0.0",
    lifespan=lifespan,
)

# CORS middleware
# NOTE(review): every origin, method and header is allowed while credentials
# are enabled as well. Confirm this is intended outside local development;
# otherwise restrict allow_origins to the known front-end origins.
app.add_middleware(
    CORSMiddleware,
    allow_origins=["*"],
    allow_credentials=True,
    allow_methods=["*"],
    allow_headers=["*"],
)


# ============================================================================
# LangGraph Chat Setup
# ============================================================================

# Global graph instance. Stays None until init_langgraph() succeeds at
# startup; POST /chat answers 503 while it is unset.
langgraph_chat = None


async def init_langgraph():
    """Build the LangGraph chat graph and publish it as ``langgraph_chat``.

    Failures are not raised: the error and its traceback are printed and
    ``langgraph_chat`` is left untouched, so /chat keeps answering 503.
    """
    global langgraph_chat
    try:
        from graph.builder import build_graph_with_memory

        # The builder returns three values; only the first (the graph) is kept.
        compiled_graph, _, _ = await build_graph_with_memory()
        langgraph_chat = compiled_graph
        print("[OK] LangGraph chat with memory initialized")
    except Exception as exc:
        import traceback

        print(f"[WARN] LangGraph initialization error: {exc}")
        traceback.print_exc()
        print("  /chat endpoint may not be available")


# ============================================================================
# Helper Functions
# ============================================================================

def donor_form_to_text(form: DonorFormRequest) -> str:
    """Render a donor form as the newline-separated text fed to the encoder.

    Donor type, country and preferred language are always present; causes,
    donation frequency, amount range, bio and motivation are included only
    when they are non-empty. ``id`` and ``name`` are never part of the text.
    """
    def labelled_lines():
        # Mandatory header lines, in a fixed order.
        yield f"Donor type: {form.donor_type}"
        yield f"Country: {form.country}"
        yield f"Preferred language: {form.preferred_language}"
        # Optional sections are skipped when the field is empty/None.
        if form.causes:
            yield f"Causes interested in: {', '.join(form.causes)}"
        if form.donation_frequency:
            yield f"Donation frequency: {form.donation_frequency}"
        if form.amount_range:
            yield f"Amount range: {form.amount_range}"
        if form.bio:
            yield f"Bio: {form.bio}"
        if form.motivation:
            yield f"Motivation: {form.motivation}"

    return "\n".join(labelled_lines())


def volunteer_form_to_text(form: VolunteerFormRequest) -> str:
    """Render a volunteer form as the newline-separated text fed to the encoder.

    Volunteer type, country, preferred language and availability are always
    present; languages spoken, skills, causes, experience and goals appear
    only when non-empty. Availability sits between skills and causes.
    """
    def labelled_lines():
        yield f"Volunteer type: {form.volunteer_type}"
        yield f"Country: {form.country}"
        yield f"Preferred language: {form.preferred_language}"
        if form.languages_spoken:
            yield f"Languages spoken: {', '.join(form.languages_spoken)}"
        if form.skills:
            yield f"Skills: {', '.join(form.skills)}"
        # Availability is a required field, so it is emitted unconditionally.
        yield f"Availability: {form.availability}"
        if form.causes:
            yield f"Causes interested in: {', '.join(form.causes)}"
        if form.experience:
            yield f"Experience: {form.experience}"
        if form.goals:
            yield f"Goals: {form.goals}"

    return "\n".join(labelled_lines())


def recommend_request_to_text(req: RecommendRequest) -> str:
    """Render the inline query fields of a recommend request as encoder text.

    Only non-empty fields contribute a line. When none of country, preferred
    language, causes, bio or motivation is set, the literal
    ``"General query"`` is returned instead of an empty string.
    """
    def labelled_lines():
        if req.country:
            yield f"Country: {req.country}"
        if req.preferred_language:
            yield f"Preferred language: {req.preferred_language}"
        if req.causes:
            yield f"Causes interested in: {', '.join(req.causes)}"
        if req.bio:
            yield f"Bio: {req.bio}"
        if req.motivation:
            yield f"Motivation: {req.motivation}"

    lines = list(labelled_lines())
    if not lines:
        # Nothing to describe: fall back to a fixed placeholder query.
        return "General query"
    return "\n".join(lines)


# ============================================================================
# Health Endpoints
# ============================================================================

@app.get("/")
def root():
    """Report that the API is up and which optional services are initialized."""
    # Each flag is True once the matching module-level handle has been set.
    service_flags = {
        "langgraph_chat": langgraph_chat is not None,
        "encoder": encoder is not None,
        "database": vector_store is not None,
    }
    return {
        "status": "healthy",
        "message": "Donor Recommendation API is running",
        "services": service_flags,
    }


@app.get("/health")
def health():
    """Health check endpoint.

    Always returns a fixed payload; it does not inspect the encoder,
    database or chat graph (use ``/`` for per-service status).
    """
    return {"status": "healthy"}


# ============================================================================
# Chat Endpoints
# ============================================================================

class ChatRequestWithMemory(BaseModel):
    # Request body of POST /chat.
    message: str  # sent to the graph as a single user-role message
    # user_id and thread_id are forwarded in the graph's "configurable" config.
    # NOTE(review): callers that omit them all share the same default values.
    user_id: str = "default_user"
    thread_id: str = "default_thread"
    stream: bool = False  # True -> StreamingResponse, False -> ChatResponse


@app.post("/chat")
async def chat(request: ChatRequestWithMemory):
    """Send one user message through the LangGraph chat graph.

    With ``stream=True`` the content of every AI message observed while the
    graph runs is streamed back; otherwise the content of the last AI
    message (or an empty string) is returned as a ``ChatResponse``.

    Raises:
        HTTPException: 503 when the graph was not initialized, 500 when the
            non-streaming run fails.
    """
    if not langgraph_chat:
        raise HTTPException(
            status_code=503,
            detail="LangGraph chat not initialized. Check server logs."
        )

    run_config = {
        "configurable": {
            "thread_id": request.thread_id,
            "user_id": request.user_id,
        }
    }

    async def ai_contents():
        # Shared by both modes: walk the graph's state snapshots and emit the
        # content of the newest message whenever that message is an AI reply.
        async for state in langgraph_chat.astream(
            {"messages": [{"role": "user", "content": request.message}]},
            run_config,
            stream_mode="values",
        ):
            history = state.get("messages")
            if not history:
                continue
            newest = history[-1]
            if hasattr(newest, 'content') and newest.type == 'ai':
                yield newest.content

    try:
        if request.stream:
            return StreamingResponse(
                ai_contents(),
                media_type="text/event-stream"
            )

        # Non-streaming: drain the run and keep only the final AI content.
        final_reply = ""
        async for content in ai_contents():
            final_reply = content
        return ChatResponse(response=final_reply)
    except Exception as exc:
        raise HTTPException(status_code=500, detail=str(exc))


# ============================================================================
# Agentic RAG Endpoints
# ============================================================================

# Global agentic RAG agent instance. Not created at startup: it is built on
# the first /rag/search request via init_agentic_rag().
agentic_rag_agent = None


class AgenticRAGRequest(BaseModel):
    """Request for Agentic RAG search."""
    query: str = Field(..., description="Natural language query for donor/volunteer search")
    # NOTE(review): validated to 1..20 here, but the /rag/search handler in
    # this file only passes `query` to the agent - confirm whether this
    # value is meant to be forwarded.
    max_iterations: int = Field(default=10, ge=1, le=20, description="Max tool call iterations")


class AgenticRAGResponse(BaseModel):
    """Response from Agentic RAG search."""
    # Each field is copied from the same-named key of the agent's result dict.
    response: str
    tool_calls: List[Dict[str, Any]]
    message_count: int


async def init_agentic_rag():
    """Create the Agentic RAG agent and publish it as ``agentic_rag_agent``.

    Does nothing (beyond a warning) when the encoder or vector store is not
    available. The LLM targets https://ollama.com with a bearer token when
    OLLAMA_API_KEY is set, and falls back to the default ChatOllama
    connection otherwise. Errors are printed with a traceback, not raised.
    """
    global agentic_rag_agent

    if encoder is None or vector_store is None:
        print("[WARN] Cannot initialize Agentic RAG: encoder or vector_store not available")
        return

    try:
        from agents.agentic_rag import AgenticRAGAgent
        from langchain_ollama import ChatOllama

        # Pick the LLM settings based on whether an API key is configured.
        token = os.getenv('OLLAMA_API_KEY')
        if token:
            llm_options = {
                "model": "gpt-oss:120b",
                "base_url": "https://ollama.com",
                "client_kwargs": {
                    "headers": {"Authorization": f"Bearer {token}"}
                },
            }
        else:
            llm_options = {"model": "gpt-oss:120b-cloud"}
        llm = ChatOllama(**llm_options)

        agentic_rag_agent = AgenticRAGAgent(llm, encoder, vector_store)
        print("[OK] Agentic RAG agent initialized")

    except Exception as exc:
        import traceback

        print(f"[WARN] Agentic RAG initialization error: {exc}")
        traceback.print_exc()


@app.post("/rag/search", response_model=AgenticRAGResponse)
async def agentic_rag_search(request: AgenticRAGRequest):
    """
    Agentic RAG search - the agent autonomously explores the vector store.

    The agent will:
    1. Analyze your query to understand what you're looking for
    2. Explore available categories in the database
    3. Perform semantic and/or filtered searches
    4. Iteratively refine results if needed
    5. Return detailed findings with reasoning

    Example queries:
    - "Find donors interested in education in Singapore"
    - "Show me corporate donors who focus on environmental causes"
    - "Find volunteers with tech skills available on weekends"

    The agent is created on first use. Responds 503 when it cannot be
    created and 500 when the search itself fails.
    """
    global agentic_rag_agent

    # First request: try to build the agent now.
    if agentic_rag_agent is None:
        await init_agentic_rag()

    # Still missing: initialization was skipped or failed.
    if agentic_rag_agent is None:
        raise HTTPException(
            status_code=503,
            detail="Agentic RAG not available. Ensure encoder and database are configured."
        )

    try:
        # NOTE(review): request.max_iterations is not forwarded to the agent.
        outcome = await agentic_rag_agent.search(request.query)
        payload = {
            "response": outcome["response"],
            "tool_calls": outcome["tool_calls"],
            "message_count": outcome["message_count"],
        }
        return AgenticRAGResponse(**payload)
    except Exception as exc:
        import traceback

        traceback.print_exc()
        raise HTTPException(status_code=500, detail=str(exc))


@app.get("/rag/tools")
async def list_rag_tools():
    """Return the name and description of every registered RAG tool, plus a count."""
    from tools.rag_tools import RAG_TOOLS

    summaries = [
        {"name": rag_tool.name, "description": rag_tool.description}
        for rag_tool in RAG_TOOLS
    ]
    return {"tools": summaries, "total": len(summaries)}


@app.get("/rag/categories")
async def get_rag_categories():
    """Return the filterable categories reported by the RAG category tool.

    Responds 503 without a database connection and 500 when the tool call or
    the decoding of its JSON output fails.
    """
    if not vector_store:
        raise HTTPException(status_code=503, detail="Database not connected")

    import json

    from tools.rag_tools import list_available_categories, set_rag_dependencies

    # The tool reads its encoder/store from module state, so hand them over
    # before invoking it.
    if encoder and vector_store:
        set_rag_dependencies(encoder, vector_store)

    try:
        raw_json = await list_available_categories.ainvoke({})
        return json.loads(raw_json)
    except Exception as exc:
        raise HTTPException(status_code=500, detail=str(exc))


# ============================================================================
# Donor Endpoints
# ============================================================================

@app.post("/donors/register", response_model=FormResponse)
async def register_donor(form: DonorFormRequest):
    """Embed a donor form and persist it in the vector store.

    Responds 503 when the encoder or database is unavailable and 500 when
    encoding or storing fails.
    """
    if not encoder:
        raise HTTPException(status_code=503, detail="Encoder not initialized")
    if not vector_store:
        raise HTTPException(status_code=503, detail="Database not connected")

    try:
        # Form -> text -> embedding vector.
        donor_vector = await encoder.encode(donor_form_to_text(form))

        # Persist the vector together with the complete form payload.
        payload = form.model_dump()
        await vector_store.store_embedding(
            form_id=form.id,
            form_type="donor",
            embedding=donor_vector,
            form_data=payload,
        )
    except Exception as exc:
        raise HTTPException(status_code=500, detail=str(exc))

    return FormResponse(
        id=form.id,
        form_type="donor",
        message="Donor registered successfully",
        embedding_dimension=len(donor_vector),
    )


@app.post("/donors/recommend", response_model=RecommendResponse)
async def recommend_donors(request: RecommendRequest):
    """Find donors similar to a query.

    The query text is built from the inline request fields. When ``form_id``
    is given, the stored form is loaded and any query field the request left
    empty (country, preferred_language, causes, bio, motivation) is filled
    from it, so a bare ``form_id`` searches with that form's data instead of
    a generic query. Inline fields always take precedence.

    Raises:
        HTTPException: 503 when the encoder or database is unavailable,
            404 when ``form_id`` does not exist, 500 on any other failure.
    """
    if not encoder:
        raise HTTPException(status_code=503, detail="Encoder not initialized")
    if not vector_store:
        raise HTTPException(status_code=503, detail="Database not connected")

    try:
        query = request
        if request.form_id:
            existing = await vector_store.get_embedding(request.form_id)
            if not existing:
                raise HTTPException(status_code=404, detail=f"Form {request.form_id} not found")

            # Only the form payload is relied on here; tolerate a missing or
            # non-dict payload by falling back to the inline fields alone.
            stored = existing.form_data if isinstance(existing.form_data, dict) else {}
            fill_ins = {
                field: stored[field]
                for field in ("country", "preferred_language", "causes", "bio", "motivation")
                if not getattr(request, field) and stored.get(field)
            }
            query = request.model_copy(update=fill_ins)

        text = recommend_request_to_text(query)
        query_embedding = await encoder.encode(text)

        # Find similar donors
        results = await vector_store.find_similar(
            query_embedding=query_embedding,
            form_type="donor",
            limit=request.limit,
            country_filter=request.country_filter,
            exclude_ids=request.exclude_ids if request.exclude_ids else None
        )

        return RecommendResponse(
            query_id=request.form_id,
            results=[
                RecommendationResult(
                    id=r.id,
                    form_type=r.form_type,
                    score=r.score,
                    distance=r.distance,
                    form_data=r.form_data
                )
                for r in results
            ],
            total_found=len(results)
        )

    except HTTPException:
        # Keep the deliberate 404 instead of masking it as a 500.
        raise
    except Exception as e:
        raise HTTPException(status_code=500, detail=str(e))


# ============================================================================
# Volunteer Endpoints
# ============================================================================

@app.post("/volunteers/register", response_model=FormResponse)
async def register_volunteer(form: VolunteerFormRequest):
    """Embed a volunteer form and persist it in the vector store.

    Responds 503 when the encoder or database is unavailable and 500 when
    encoding or storing fails.
    """
    if not encoder:
        raise HTTPException(status_code=503, detail="Encoder not initialized")
    if not vector_store:
        raise HTTPException(status_code=503, detail="Database not connected")

    try:
        # Form -> text -> embedding vector.
        volunteer_vector = await encoder.encode(volunteer_form_to_text(form))

        # Persist the vector together with the complete form payload.
        payload = form.model_dump()
        await vector_store.store_embedding(
            form_id=form.id,
            form_type="volunteer",
            embedding=volunteer_vector,
            form_data=payload,
        )
    except Exception as exc:
        raise HTTPException(status_code=500, detail=str(exc))

    return FormResponse(
        id=form.id,
        form_type="volunteer",
        message="Volunteer registered successfully",
        embedding_dimension=len(volunteer_vector),
    )


@app.post("/volunteers/recommend", response_model=RecommendResponse)
async def recommend_volunteers(request: RecommendRequest):
    """Find volunteers similar to a query.

    The query text is built from the inline request fields. When ``form_id``
    is given, the stored form is loaded and any query field the request left
    empty (country, preferred_language, causes, bio, motivation) is filled
    from it, matching the donor recommendation endpoint. Inline fields
    always take precedence.

    Raises:
        HTTPException: 503 when the encoder or database is unavailable,
            404 when ``form_id`` does not exist, 500 on any other failure.
    """
    if not encoder:
        raise HTTPException(status_code=503, detail="Encoder not initialized")
    if not vector_store:
        raise HTTPException(status_code=503, detail="Database not connected")

    try:
        query = request
        if request.form_id:
            existing = await vector_store.get_embedding(request.form_id)
            if not existing:
                raise HTTPException(status_code=404, detail=f"Form {request.form_id} not found")

            # Tolerate a missing or non-dict payload by falling back to the
            # inline fields alone.
            stored = existing.form_data if isinstance(existing.form_data, dict) else {}
            fill_ins = {
                field: stored[field]
                for field in ("country", "preferred_language", "causes", "bio", "motivation")
                if not getattr(request, field) and stored.get(field)
            }
            query = request.model_copy(update=fill_ins)

        # Generate query embedding
        text = recommend_request_to_text(query)
        query_embedding = await encoder.encode(text)

        # Find similar volunteers
        results = await vector_store.find_similar(
            query_embedding=query_embedding,
            form_type="volunteer",
            limit=request.limit,
            country_filter=request.country_filter,
            exclude_ids=request.exclude_ids if request.exclude_ids else None
        )

        return RecommendResponse(
            query_id=request.form_id,
            results=[
                RecommendationResult(
                    id=r.id,
                    form_type=r.form_type,
                    score=r.score,
                    distance=r.distance,
                    form_data=r.form_data
                )
                for r in results
            ],
            total_found=len(results)
        )

    except HTTPException:
        # Keep the deliberate 404 instead of masking it as a 500.
        raise
    except Exception as e:
        raise HTTPException(status_code=500, detail=str(e))


# ============================================================================
# Form Management Endpoints
# ============================================================================

@app.get("/forms/{form_id}")
async def get_form(form_id: str):
    """Return the id, type and stored payload of one form.

    Responds 503 without a database connection and 404 for an unknown id.
    """
    if not vector_store:
        raise HTTPException(status_code=503, detail="Database not connected")

    record = await vector_store.get_embedding(form_id)
    if record:
        return {
            "id": record.id,
            "form_type": record.form_type,
            "form_data": record.form_data,
        }

    raise HTTPException(status_code=404, detail=f"Form {form_id} not found")


@app.delete("/forms/{form_id}")
async def delete_form(form_id: str):
    """Remove one stored form.

    Responds 503 without a database connection and 404 when the store
    reports that nothing was deleted.
    """
    if not vector_store:
        raise HTTPException(status_code=503, detail="Database not connected")

    was_deleted = await vector_store.delete_embedding(form_id)
    if was_deleted:
        return {"message": f"Form {form_id} deleted successfully"}

    raise HTTPException(status_code=404, detail=f"Form {form_id} not found")


@app.get("/forms/stats/summary", response_model=StatsResponse)
async def get_form_stats():
    """Return how many donor and volunteer forms are stored, plus the total.

    Counts missing from the store's answer are reported as 0. Responds 503
    without a database connection and 500 when counting fails.
    """
    if not vector_store:
        raise HTTPException(status_code=503, detail="Database not connected")

    try:
        counts = await vector_store.count_by_type()
        return StatsResponse(
            **{bucket: counts.get(bucket, 0) for bucket in ("donor", "volunteer", "total")}
        )
    except Exception as exc:
        raise HTTPException(status_code=500, detail=str(exc))


# ============================================================================
# Cause-based Search Endpoint
# ============================================================================

@app.post("/forms/search/causes")
async def search_by_causes(
    causes: List[str],
    limit: int = 20
):
    """Find forms matching the given causes, ranked by embedding similarity.

    Responds 503 when the encoder or database is unavailable and 500 when
    encoding or searching fails.
    """
    if not encoder:
        raise HTTPException(status_code=503, detail="Encoder not initialized")
    if not vector_store:
        raise HTTPException(status_code=503, detail="Database not connected")

    try:
        # Embed a synthetic "causes" sentence so matches can be ranked.
        ranking_vector = await encoder.encode(
            f"Causes interested in: {', '.join(causes)}"
        )

        matches = await vector_store.find_by_causes(
            target_causes=causes,
            query_embedding=ranking_vector,
            limit=limit,
        )

        serialized = [
            {
                "id": match.id,
                "form_type": match.form_type,
                "score": match.score,
                "distance": match.distance,
                "form_data": match.form_data,
            }
            for match in matches
        ]
        return {
            "causes": causes,
            "results": serialized,
            "total_found": len(matches),
        }

    except Exception as exc:
        raise HTTPException(status_code=500, detail=str(exc))


# ============================================================================
# GIS & Client Targeting Endpoints
# ============================================================================

# Mock Singpass data for different organization profiles.
# Keyed by profile id; served by the /singpass/mock endpoints. "org_001" is
# also the fallback returned for unknown profile ids.
MOCK_SINGPASS_PROFILES = {
    "org_001": SingpassMockData(
        name="Sarah Tan Wei Ling",
        nric_masked="S****567A",
        email="sarah.tan@example.org",
        mobile="+65 9123 4567",
        registered_address="123 Orchard Road, #12-01, Singapore 238867",
        planning_area="orchard",
        organization_name="Hearts of Hope Foundation",
        organization_uen="201912345K",
        organization_type="charity",
    ),
    "org_002": SingpassMockData(
        name="Ahmad bin Ibrahim",
        nric_masked="S****234B",
        email="ahmad.ibrahim@greensg.org",
        mobile="+65 9876 5432",
        registered_address="45 Jurong East Ave 1, #05-12, Singapore 609788",
        planning_area="jurong_east",
        organization_name="Green Singapore Initiative",
        organization_uen="201823456M",
        organization_type="ngo",
    ),
    "org_003": SingpassMockData(
        name="Lee Mei Hua",
        nric_masked="S****789C",
        email="meihua@eldercare.sg",
        mobile="+65 8765 4321",
        registered_address="78 Toa Payoh Lorong 1, #08-22, Singapore 310078",
        planning_area="toa_payoh",
        organization_name="ElderCare Singapore",
        organization_uen="200934567N",
        organization_type="social_enterprise",
    ),
}


@app.get("/singpass/mock/{profile_id}", response_model=SingpassMockData)
async def get_singpass_mock_data(profile_id: str):
    """
    Get mock Singpass data for autofill demonstration.

    Available profiles: org_001, org_002, org_003.
    Unknown profile ids fall back to org_001.
    """
    profile = MOCK_SINGPASS_PROFILES.get(profile_id)
    if profile is None:
        # Unknown id: always serve the default profile (not a random one).
        profile = MOCK_SINGPASS_PROFILES["org_001"]
    return profile


@app.get("/singpass/mock", response_model=Dict[str, SingpassMockData])
async def list_singpass_mock_profiles():
    """List all available mock Singpass profiles, keyed by profile id."""
    return MOCK_SINGPASS_PROFILES


@app.get("/planning-areas")
async def get_planning_areas():
    """Get all Singapore planning areas with coordinates.

    Returns the recommender's PLANNING_AREAS constant unchanged.
    """
    # Imported on demand so this module still loads when the recommender
    # package (or one of its dependencies) is unavailable.
    from recommender.gis_recommender import PLANNING_AREAS

    return PLANNING_AREAS


@app.get("/housing-types")
async def get_housing_types():
    """List every housing type value and the income proxy score per type."""
    from recommender.gis_recommender import HOUSING_INCOME_PROXY, HousingType

    # Expose enum members by their string values so the payload is JSON-friendly.
    type_values = [member.value for member in HousingType]
    proxy_by_type = {
        member.value: score for member, score in HOUSING_INCOME_PROXY.items()
    }
    return {"types": type_values, "income_proxy": proxy_by_type}


@app.post("/clients/register", response_model=FormResponse)
async def register_client(profile: ClientProfileRequest):
    """
    Register a client profile with spatial and behavioral data.

    This creates an embedding combining interests/causes with spatial context.

    Raises:
        HTTPException: 503 when the encoder or database is unavailable,
            422 when ``coordinates`` is not a [lat, lng] pair or
            ``housing_type`` is not a known housing type, 500 on any other
            failure.
    """
    if not encoder:
        raise HTTPException(status_code=503, detail="Encoder not initialized")
    if not vector_store:
        raise HTTPException(status_code=503, detail="Database not connected")

    try:
        from recommender.gis_recommender import ClientProfile, HousingType

        # Reject malformed client input explicitly instead of letting it
        # surface as a generic 500 further down.
        if len(profile.coordinates) != 2:
            raise HTTPException(
                status_code=422,
                detail="coordinates must contain exactly two values: [lat, lng]",
            )
        try:
            housing_type = HousingType(profile.housing_type)
        except ValueError:
            raise HTTPException(
                status_code=422,
                detail=f"Unknown housing_type: {profile.housing_type!r}",
            ) from None

        # Create client profile
        client = ClientProfile(
            user_id=profile.user_id,
            coordinates=tuple(profile.coordinates),
            planning_area=profile.planning_area,
            housing_type=housing_type,
            interests=profile.interests,
            causes=profile.causes,
            preferred_language=profile.preferred_language,
            is_donor=profile.is_donor,
            total_donated=profile.total_donated,
            donation_count=profile.donation_count,
            age_range=profile.age_range,
        )

        # Generate embedding
        text = client.to_embedding_text()
        embedding = await encoder.encode(text)

        # Store in database
        form_data = client.to_dict()
        form_data["country"] = "SG"  # For existing filter compatibility

        await vector_store.store_embedding(
            form_id=profile.user_id,
            form_type="client",
            embedding=embedding,
            form_data=form_data,
        )

        return FormResponse(
            id=profile.user_id,
            form_type="client",
            message="Client profile registered successfully",
            embedding_dimension=len(embedding),
        )

    except HTTPException:
        # Keep the deliberate 422 responses instead of masking them as 500.
        raise
    except Exception as e:
        raise HTTPException(status_code=500, detail=str(e))


@app.post("/clients/lookalike", response_model=LookalikeResponse)
async def find_lookalike_clients(request: LookalikeRequest):
    """
    Find lookalike clients (potential donors) based on a seed profile.

    Steps:
    1. Build a seed profile from the request's causes and interests; when
       ``planning_area_filter`` names a known planning area, the seed is moved
       to that area's coordinates.
    2. If the global recommender, encoder and vector store are all available,
       search the database without filters and apply the planning-area and
       housing-type filters afterwards. A failing database search is printed
       and treated as "no database results".
    3. If fewer than ``max(limit // 2, 10)`` results remain AND the requested
       limit has not been reached yet, top up with mock candidates scored by
       the hybrid matcher.
    4. Sort by ``final_score``, truncate to ``limit`` and apply tiered
       targeting with ``min_score`` relaxed by 0.1 (never below 0).
    5. Return the tiers, plus GeoJSON when ``include_geojson`` is set.

    Note: Searches BOTH donors (from /donors/register) and clients
    (from /clients/register) to find potential matches.

    Raises:
        HTTPException(422): an entry of ``housing_type_filter`` is not a valid
            ``HousingType`` value.
        HTTPException(500): any other failure.
    """
    import traceback

    try:
        from recommender.gis_recommender import (
            PLANNING_AREAS,
            HousingType,
            GISRecommender,
            generate_seed_donor_profile,
            generate_mock_clients,
        )

        # Create seed profile from request
        seed = generate_seed_donor_profile(
            cause=request.seed_causes[0] if request.seed_causes else "education"
        )
        seed.causes = request.seed_causes
        seed.interests = request.seed_interests

        # Update seed coordinates if a known planning area was specified
        if (
            request.planning_area_filter
            and request.planning_area_filter in PLANNING_AREAS
        ):
            area = PLANNING_AREAS[request.planning_area_filter]
            seed.coordinates = (area["lat"], area["lng"])
            seed.planning_area = request.planning_area_filter

        # Regenerate embeddings for updated seed
        seed.embedding = None  # Force regeneration
        local_recommender = GISRecommender()
        seed.embedding = local_recommender._generate_fallback_embedding(seed)
        seed.compute_reduced_embeddings()

        # Convert housing type filter; an unknown value is a caller mistake,
        # so it is reported as a validation error instead of a 500.
        housing_filter = None
        if request.housing_type_filter:
            try:
                housing_filter = [HousingType(h) for h in request.housing_type_filter]
            except ValueError as e:
                raise HTTPException(
                    status_code=422,
                    detail=f"Invalid housing_type_filter: {e}",
                ) from e

        scored_clients = []
        db_results_count = 0

        # Try database search first if available
        if gis_recommender and encoder and vector_store:
            try:
                print(
                    f"Searching database for donors matching causes: {request.seed_causes}"
                )
                scored_clients = await gis_recommender.find_lookalikes(
                    seed_profile=seed,
                    k=request.limit * 2,  # Get more to allow for filtering
                    planning_area_filter=None,  # Remove strict filter for DB search
                    housing_type_filter=None,  # Filter after retrieval
                    use_hybrid=False,
                )
                db_results_count = len(scored_clients)
                print(f"Found {db_results_count} donors/clients from database")

                # Apply filters after retrieval for more flexible matching
                if request.planning_area_filter:
                    scored_clients = [
                        sc
                        for sc in scored_clients
                        if sc.client.planning_area == request.planning_area_filter
                    ]

                if housing_filter:
                    scored_clients = [
                        sc
                        for sc in scored_clients
                        if sc.client.housing_type in housing_filter
                    ]

            except Exception as e:
                # Best effort: a broken database must not block the mock fallback.
                print(f"Database search failed: {e}")
                traceback.print_exc()

        # If insufficient results from database, supplement with mock data
        min_results = max(request.limit // 2, 10)  # At least half the requested or 10
        # Number of slots still free. For small limits ``min_results`` can
        # exceed ``limit``, so without this guard the matcher could be asked
        # for zero or a negative number of results.
        shortfall = request.limit - len(scored_clients)
        if len(scored_clients) < min_results and shortfall > 0:
            print(f"Only {len(scored_clients)} from DB, supplementing with mock data")

            # Generate mock candidates
            fallback_candidates = generate_mock_clients(150)

            # Filter by causes for relevance, but only if enough candidates survive
            if request.seed_causes:
                cause_matched = [
                    c
                    for c in fallback_candidates
                    if any(cause in c.causes for cause in request.seed_causes)
                ]
                if len(cause_matched) >= 20:
                    fallback_candidates = cause_matched

            # Use hybrid matching on mock data
            mock_results = local_recommender.find_lookalikes_hybrid(
                seed_profile=seed,
                candidates=fallback_candidates,
                k=shortfall,
                planning_area_filter=request.planning_area_filter,
                housing_type_filter=housing_filter,
            )

            scored_clients.extend(mock_results)
            print(
                f"Added {len(mock_results)} mock results, total: {len(scored_clients)}"
            )

        # Sort combined results by score
        scored_clients.sort(key=lambda x: x.final_score, reverse=True)
        scored_clients = scored_clients[: request.limit]

        # Apply tiered targeting with relaxed min_score for small datasets
        effective_min_score = max(0, request.min_score - 0.1)  # Relax slightly
        tiered = local_recommender.apply_tiered_targeting(
            scored_clients, min_score=effective_min_score
        )

        # Convert to response format
        def to_response(sc):
            return ScoredClientResponse(
                user_id=sc.client.user_id,
                planning_area=sc.client.planning_area,
                housing_type=sc.client.housing_type.value,
                causes=sc.client.causes,
                interests=sc.client.interests,
                is_donor=sc.client.is_donor,
                final_score=round(sc.final_score, 3),
                vector_similarity=round(sc.vector_similarity_score, 3),
                spatial_proxy=round(sc.spatial_proxy_score, 3),
                proximity=round(sc.proximity_score, 3),
                # Coordinates are only exposed when the caller asked for map data.
                coordinates=(
                    list(sc.client.coordinates) if request.include_geojson else None
                ),
            )

        tiers_response = {
            "tier_1": [to_response(sc) for sc in tiered["tier_1"]],
            "tier_2": [to_response(sc) for sc in tiered["tier_2"]],
            "tier_3": [to_response(sc) for sc in tiered["tier_3"]],
        }

        # Generate GeoJSON if requested
        geojson = None
        if request.include_geojson:
            all_clients = tiered["tier_1"] + tiered["tier_2"] + tiered["tier_3"]
            geojson = local_recommender.to_geojson(all_clients)

        total = sum(len(t) for t in tiered.values())

        return LookalikeResponse(
            seed_causes=request.seed_causes,
            total_found=total,
            tiers=tiers_response,
            geojson=geojson,
        )

    except HTTPException:
        # Keep deliberate HTTP errors (e.g. the 422 above) intact.
        raise
    except Exception as e:
        traceback.print_exc()
        raise HTTPException(status_code=500, detail=str(e)) from e


async def _get_mock_lookalike_response(request: LookalikeRequest) -> LookalikeResponse:
    """
    Generate mock lookalike response when GIS recommender unavailable.

    100 mock clients are generated, filtered by shared causes and (optionally)
    planning area, and scored as
    ``0.5 * cause_match + 0.3 * housing income proxy + 0.2 * 0.5``
    (proximity is a fixed 0.5 placeholder). ALL matching candidates are
    scored and sorted before ``min_score`` and ``limit`` are applied, so the
    response holds the best ``limit`` candidates rather than the first
    ``limit`` generated ones. Results are split into three tiers of
    ``max(n // 3, 1)`` entries, the last tier taking the remainder.
    """
    from recommender.gis_recommender import (
        generate_mock_clients,
        HOUSING_INCOME_PROXY,
    )

    # Loop invariants for the scoring pass below.
    seed_cause_set = set(request.seed_causes)
    cause_denominator = max(len(request.seed_causes), 1)

    # Keep only mock clients sharing at least one cause with the seed
    candidates = [
        c
        for c in generate_mock_clients(100)
        if any(cause in c.causes for cause in request.seed_causes)
    ]

    # Apply planning area filter
    if request.planning_area_filter:
        candidates = [
            c for c in candidates if c.planning_area == request.planning_area_filter
        ]

    # Score every candidate; truncation happens only after sorting
    scored = []
    for client in candidates:
        cause_match = len(set(client.causes) & seed_cause_set) / cause_denominator
        spatial_score = HOUSING_INCOME_PROXY.get(client.housing_type, 0.5)
        final_score = 0.5 * cause_match + 0.3 * spatial_score + 0.2 * 0.5

        scored.append(
            {
                "client": client,
                "final_score": final_score,
                "vector_similarity": cause_match,
                "spatial_proxy": spatial_score,
                "proximity": 0.5,
            }
        )

    scored.sort(key=lambda x: x["final_score"], reverse=True)

    # Apply min score filter, then keep the top ``limit`` entries
    scored = [s for s in scored if s["final_score"] >= request.min_score]
    scored = scored[: request.limit]

    # Create tiers
    n = len(scored)
    tier_size = max(n // 3, 1)

    def to_response(s):
        c = s["client"]
        return ScoredClientResponse(
            user_id=c.user_id,
            planning_area=c.planning_area,
            housing_type=c.housing_type.value,
            causes=c.causes,
            interests=c.interests,
            is_donor=c.is_donor,
            final_score=round(s["final_score"], 3),
            vector_similarity=round(s["vector_similarity"], 3),
            spatial_proxy=round(s["spatial_proxy"], 3),
            proximity=round(s["proximity"], 3),
            coordinates=list(c.coordinates) if request.include_geojson else None,
        )

    tiers = {
        "tier_1": [to_response(s) for s in scored[:tier_size]],
        "tier_2": [to_response(s) for s in scored[tier_size : tier_size * 2]],
        "tier_3": [to_response(s) for s in scored[tier_size * 2 :]],
    }

    # Generate GeoJSON
    geojson = None
    if request.include_geojson:
        features = []
        for s in scored:
            c = s["client"]
            features.append(
                {
                    "type": "Feature",
                    "geometry": {
                        "type": "Point",
                        # Emitted as [coordinates[1], coordinates[0]];
                        # presumably (lat, lng) -> GeoJSON [lng, lat].
                        "coordinates": [
                            round(c.coordinates[1], 3),
                            round(c.coordinates[0], 3),
                        ],
                    },
                    "properties": {
                        "user_id": c.user_id,
                        "planning_area": c.planning_area,
                        "housing_type": c.housing_type.value,
                        "causes": c.causes,
                        "is_donor": c.is_donor,
                        "final_score": round(s["final_score"], 3),
                    },
                }
            )
        geojson = {"type": "FeatureCollection", "features": features}

    return LookalikeResponse(
        seed_causes=request.seed_causes,
        total_found=len(scored),
        tiers=tiers,
        geojson=geojson,
    )


@app.post("/clients/seed-mock-data")
async def seed_mock_client_data(count: int = 100):
    """
    Populate the vector store with generated mock client profiles for testing.

    Each profile from ``generate_mock_clients(count)`` is encoded and stored
    under form type ``"client"`` with ``country`` set to ``"SG"``. Responds
    with 503 when the encoder or database is unavailable and with 500 on any
    failure while seeding.
    """
    if not encoder:
        raise HTTPException(status_code=503, detail="Encoder not initialized")
    if not vector_store:
        raise HTTPException(status_code=503, detail="Database not connected")

    try:
        from recommender.gis_recommender import generate_mock_clients

        registered = 0
        mock_profiles = generate_mock_clients(count)

        # ``registered`` tracks the 1-based position of the profile being stored,
        # so after a complete loop it equals the number of stored profiles.
        for registered, mock_profile in enumerate(mock_profiles, start=1):
            vector = await encoder.encode(mock_profile.to_embedding_text())

            payload = mock_profile.to_dict()
            payload["country"] = "SG"

            await vector_store.store_embedding(
                form_id=mock_profile.user_id,
                form_type="client",
                embedding=vector,
                form_data=payload,
            )

        summary = {
            "message": f"Seeded {registered} mock client profiles",
            "count": registered,
        }
        return summary

    except Exception as e:
        raise HTTPException(status_code=500, detail=str(e))


@app.get("/debug/database-stats")
async def get_database_stats():
    """
    Debug endpoint reporting what is stored in the vector database.

    Returns the number of rows per ``form_type``, the overall total, and a
    short preview of the ten most recently inserted rows. Errors are reported
    in the response body instead of being raised.
    """
    if not vector_store:
        return {"error": "Database not connected", "stats": None}

    try:
        async with vector_store.pool.connection() as conn:
            async with conn.cursor() as cur:
                # Row counts grouped by form_type
                await cur.execute(
                    """
                    SELECT 
                        metadata->>'form_type' as form_type,
                        COUNT(*) as count
                    FROM my_embeddings
                    GROUP BY metadata->>'form_type'
                    ORDER BY count DESC
                """
                )
                count_rows = await cur.fetchall()

                # Latest rows with a truncated text preview
                await cur.execute(
                    """
                    SELECT source_id, metadata->>'form_type', 
                           LEFT(text_content::text, 200) as preview
                    FROM my_embeddings
                    ORDER BY id DESC
                    LIMIT 10
                """
                )
                latest_rows = await cur.fetchall()

        counts_by_type = {}
        for count_row in count_rows:
            counts_by_type[count_row[0]] = count_row[1]

        total_entries = sum(count_row[1] for count_row in count_rows)

        recent_entries = []
        for latest in latest_rows:
            recent_entries.append(
                {"id": latest[0], "form_type": latest[1], "preview": latest[2]}
            )

        return {
            "connected": True,
            "form_type_counts": counts_by_type,
            "total_entries": total_entries,
            "recent_entries": recent_entries,
        }
    except Exception as e:
        return {"error": str(e), "stats": None}


@app.get("/clients/map-demographics")
async def get_map_demographics(
    causes: Optional[str] = None,  # Comma-separated causes
    include_donors: bool = True,
    include_clients: bool = True,
):
    """
    Get aggregated demographics data for Singapore map visualization.

    Args:
        causes: Optional comma-separated cause names. Whitespace around each
            name is ignored; when given, only entries sharing at least one
            cause are included.
        include_donors: Include stored entries of form type ``"donor"``.
        include_clients: Include stored entries of form type ``"client"``.

    Returns:
    - Planning area aggregates (donor counts, cause distribution, housing breakdown)
    - Individual donor/client points with coordinates
    - Demographics summary for clusters

    Point coordinates are the planning-area centre plus a small offset derived
    from an MD5 digest of the entry id, so a given entry is drawn at the same
    place across processes and restarts (the builtin ``hash()`` of a string is
    salted per process). When the database is unavailable, or aggregation
    fails, mock data is returned instead.
    """
    import hashlib
    import traceback

    from recommender.gis_recommender import (
        PLANNING_AREAS,
        HousingType,
        HOUSING_INCOME_PROXY,
    )

    if not vector_store:
        # Return mock data if database not available
        return await _generate_mock_map_demographics(causes)

    # Fallback position for entries without a known planning area
    default_lat, default_lng = 1.3521, 103.8198  # Singapore center

    try:
        # Accept "education, health" as well as "education,health"; blank
        # items (e.g. from a trailing comma) are ignored.
        cause_list = None
        if causes:
            cause_list = [c.strip() for c in causes.split(",") if c.strip()] or None

        # Query all donors and clients from database
        all_entries = []

        if include_donors:
            donor_results = await vector_store.find_by_form_type("donor", limit=500)
            all_entries.extend(donor_results)

        if include_clients:
            client_results = await vector_store.find_by_form_type("client", limit=500)
            all_entries.extend(client_results)

        # Aggregate by planning area
        area_list = list(PLANNING_AREAS.keys())
        area_stats = {}
        individual_points = []

        for entry in all_entries:
            # Entries may be objects with attributes or plain dicts.
            if hasattr(entry, "form_data"):
                form_data = entry.form_data
            else:
                form_data = entry.get("form_data", {})
            form_data = form_data or {}
            entry_id = entry.id if hasattr(entry, "id") else entry.get("id", "")
            form_type = (
                entry.form_type
                if hasattr(entry, "form_type")
                else entry.get("form_type", "")
            )

            # One stable digest per entry drives both area inference and jitter.
            digest = hashlib.md5(str(entry_id).encode()).digest()

            # Get planning area (a stored null is treated like a missing value)
            planning_area = form_data.get("planning_area") or "unknown"
            if planning_area == "unknown" and form_data.get("country") == "SG":
                # Infer planning area from ID hash for donors without explicit area
                planning_area = area_list[
                    int.from_bytes(digest, "big") % len(area_list)
                ]

            # Get causes (a single string is treated as a one-item list)
            entry_causes = form_data.get("causes") or []
            if isinstance(entry_causes, str):
                entry_causes = [entry_causes]

            # Filter by causes if specified
            if cause_list and not any(c in entry_causes for c in cause_list):
                continue

            # Get housing type
            housing_type = form_data.get("housing_type", "hdb_4_room")
            if not housing_type or housing_type == "unknown":
                # Infer from amount_range; larger amounts are checked first
                # because "10000" contains "1000" and "5000" contains "500".
                amount_range = str(form_data.get("amount_range", ""))
                if "10000" in amount_range or "5000" in amount_range:
                    housing_type = "landed"
                elif "1000" in amount_range:
                    housing_type = "condo"
                elif "500" in amount_range:
                    housing_type = "hdb_executive"
                else:
                    housing_type = "hdb_4_room"

            # Get coordinates: area centre plus a deterministic offset of at
            # most 0.025 degrees per axis so points in one area do not overlap.
            area_info = PLANNING_AREAS.get(planning_area)
            if area_info is not None:
                lat_step = int.from_bytes(digest[:4], "big") % 100 - 50
                lng_step = int.from_bytes(digest[4:8], "big") % 100 - 50
                lat = area_info["lat"] + lat_step * 0.0005
                lng = area_info["lng"] + lng_step * 0.0005
            else:
                lat, lng = default_lat, default_lng

            # Aggregate by area
            if planning_area not in area_stats:
                known_area = PLANNING_AREAS.get(planning_area, {})
                area_stats[planning_area] = {
                    "name": known_area.get(
                        "name", planning_area.replace("_", " ").title()
                    ),
                    "lat": known_area.get("lat", default_lat),
                    "lng": known_area.get("lng", default_lng),
                    "total_count": 0,
                    "donor_count": 0,
                    "client_count": 0,
                    "causes": {},
                    "housing_breakdown": {},
                    "avg_income_proxy": 0,
                    "income_proxies": [],
                }

            stats = area_stats[planning_area]
            stats["total_count"] += 1
            if form_type == "donor":
                stats["donor_count"] += 1
            else:
                stats["client_count"] += 1

            # Count causes
            for cause in entry_causes:
                stats["causes"][cause] = stats["causes"].get(cause, 0) + 1

            # Count housing
            stats["housing_breakdown"][housing_type] = (
                stats["housing_breakdown"].get(housing_type, 0) + 1
            )

            # Track income proxy; housing values outside the enum score 0.5
            try:
                income_proxy = HOUSING_INCOME_PROXY.get(HousingType(housing_type), 0.5)
            except ValueError:
                income_proxy = 0.5
            stats["income_proxies"].append(income_proxy)

            # Add individual point
            individual_points.append(
                {
                    "id": entry_id,
                    "type": form_type,
                    "lat": lat,
                    "lng": lng,
                    "planning_area": planning_area,
                    "housing_type": housing_type,
                    "causes": entry_causes[:5],  # Limit for performance
                    "is_donor": form_type == "donor",
                }
            )

        # Calculate averages and drop the working list from the output
        for stats in area_stats.values():
            income_proxies = stats.pop("income_proxies")
            if income_proxies:
                stats["avg_income_proxy"] = round(
                    sum(income_proxies) / len(income_proxies), 3
                )

        # Create GeoJSON for areas (polygons would need actual boundary data,
        # so each area is represented by its centre point)
        area_geojson = {
            "type": "FeatureCollection",
            "features": [
                {
                    "type": "Feature",
                    "geometry": {
                        "type": "Point",
                        "coordinates": [stats["lng"], stats["lat"]],
                    },
                    "properties": {
                        "planning_area": area,
                        "name": stats["name"],
                        **{k: v for k, v in stats.items() if k not in ["lat", "lng"]},
                    },
                }
                for area, stats in area_stats.items()
            ],
        }

        # Create GeoJSON for individual points
        points_geojson = {
            "type": "FeatureCollection",
            "features": [
                {
                    "type": "Feature",
                    "geometry": {
                        "type": "Point",
                        "coordinates": [p["lng"], p["lat"]],
                    },
                    "properties": {
                        "id": p["id"],
                        "type": p["type"],
                        "planning_area": p["planning_area"],
                        "housing_type": p["housing_type"],
                        "causes": p["causes"],
                        "is_donor": p["is_donor"],
                    },
                }
                for p in individual_points
            ],
        }

        # Summary statistics
        all_causes = {}
        all_housing = {}
        for stats in area_stats.values():
            for cause, count in stats["causes"].items():
                all_causes[cause] = all_causes.get(cause, 0) + count
            for housing, count in stats["housing_breakdown"].items():
                all_housing[housing] = all_housing.get(housing, 0) + count

        return {
            "total_donors": sum(s["donor_count"] for s in area_stats.values()),
            "total_clients": sum(s["client_count"] for s in area_stats.values()),
            "areas_with_data": len(area_stats),
            "summary": {
                "top_causes": sorted(
                    all_causes.items(), key=lambda x: x[1], reverse=True
                )[:10],
                "housing_distribution": all_housing,
            },
            "area_aggregates": area_geojson,
            "individual_points": points_geojson,
            "planning_areas": PLANNING_AREAS,
        }

    except Exception:
        # Best effort: the map still renders (with mock data) when the
        # database query or aggregation fails; the error is printed.
        traceback.print_exc()
        return await _generate_mock_map_demographics(causes)


async def _generate_mock_map_demographics(causes: Optional[str] = None):
    """
    Build randomised demographics data for the map when real data is unavailable.

    Every planning area receives a random number of entries (3-25), a random
    donor/client split, random cause and housing counts, and that many points
    scattered within +/-0.01 degrees of the area centre. The result has the
    same top-level keys as the database-backed demographics response.
    """
    import random

    from recommender.gis_recommender import PLANNING_AREAS

    if causes:
        cause_list = causes.split(",")
    else:
        cause_list = ["education", "animals", "poverty", "environment", "health"]

    # Housing labels a mock point can be assigned
    housing_types = [
        "hdb_3_room",
        "hdb_4_room",
        "hdb_5_room",
        "hdb_executive",
        "condo",
        "landed",
    ]
    hidden_keys = ["lat", "lng"]  # carried by the geometry, not the properties

    area_stats = {}
    individual_points = []

    for area_id, area_info in PLANNING_AREAS.items():
        count = random.randint(3, 25)
        donors = random.randint(1, count)

        sampled_causes = random.sample(cause_list, min(3, len(cause_list)))
        cause_counts = {}
        for cause in sampled_causes:
            cause_counts[cause] = random.randint(1, count)

        housing_breakdown = {
            "hdb_4_room": random.randint(0, count // 2),
            "condo": random.randint(0, count // 3),
            "landed": random.randint(0, count // 4),
        }
        avg_income_proxy = round(random.uniform(0.3, 0.8), 3)

        area_stats[area_id] = {
            "name": area_info["name"],
            "lat": area_info["lat"],
            "lng": area_info["lng"],
            "total_count": count,
            "donor_count": donors,
            "client_count": count - donors,
            "causes": cause_counts,
            "housing_breakdown": housing_breakdown,
            "avg_income_proxy": avg_income_proxy,
        }

        # Generate individual points; the first ``donors`` of them are donors
        for i in range(count):
            lat = area_info["lat"] + (random.random() - 0.5) * 0.02
            lng = area_info["lng"] + (random.random() - 0.5) * 0.02
            is_donor = i < donors

            point = {
                "id": f"mock_{area_id}_{i}",
                "type": "donor" if is_donor else "client",
                "lat": lat,
                "lng": lng,
                "planning_area": area_id,
                "housing_type": random.choice(housing_types),
                "causes": random.sample(cause_list, min(2, len(cause_list))),
                "is_donor": is_donor,
            }
            individual_points.append(point)

    # Create GeoJSON for the per-area aggregates
    area_features = []
    for area, stats in area_stats.items():
        properties = {"planning_area": area, "name": stats["name"]}
        properties.update(
            {k: v for k, v in stats.items() if k not in hidden_keys}
        )
        area_features.append(
            {
                "type": "Feature",
                "geometry": {
                    "type": "Point",
                    "coordinates": [stats["lng"], stats["lat"]],
                },
                "properties": properties,
            }
        )
    area_geojson = {"type": "FeatureCollection", "features": area_features}

    # Create GeoJSON for the individual points
    point_features = []
    for p in individual_points:
        point_features.append(
            {
                "type": "Feature",
                "geometry": {"type": "Point", "coordinates": [p["lng"], p["lat"]]},
                "properties": {k: v for k, v in p.items() if k not in hidden_keys},
            }
        )
    points_geojson = {"type": "FeatureCollection", "features": point_features}

    total_donors = sum(s["donor_count"] for s in area_stats.values())
    total_clients = sum(s["client_count"] for s in area_stats.values())
    top_causes = [(c, random.randint(10, 50)) for c in cause_list[:5]]

    return {
        "total_donors": total_donors,
        "total_clients": total_clients,
        "areas_with_data": len(area_stats),
        "summary": {
            "top_causes": top_causes,
            "housing_distribution": {
                "hdb_4_room": 120,
                "condo": 45,
                "landed": 20,
                "hdb_5_room": 30,
            },
        },
        "area_aggregates": area_geojson,
        "individual_points": points_geojson,
        "planning_areas": PLANNING_AREAS,
    }


@app.get("/debug/search-donors")
async def debug_search_donors(cause: str = "education", limit: int = 10):
    """
    Debug endpoint that queries the vector store directly for a cause.

    The GIS recommender is bypassed: a query sentence built from ``cause`` is
    encoded and used for two similarity searches (form types ``donor`` and
    ``client``), each capped at ``limit``. Failures are returned in the
    response body together with the traceback.
    """
    if not (encoder and vector_store):
        return {"error": "Encoder or database not available"}

    try:
        # Create a simple query embedding
        query_text = f"Donor interested in {cause} causes, looking to support {cause} initiatives"
        query_vector = await encoder.encode(query_text)

        # Raw hits for donors first, then clients
        donor_hits = await vector_store.find_similar(
            query_embedding=query_vector,
            form_type="donor",
            limit=limit,
        )
        client_hits = await vector_store.find_similar(
            query_embedding=query_vector,
            form_type="client",
            limit=limit,
        )

        donor_rows = []
        for hit in donor_hits:
            donor_rows.append(
                {
                    "id": hit.id,
                    "form_type": hit.form_type,
                    "score": round(hit.score, 4),
                    "distance": round(hit.distance, 4),
                    "causes": hit.form_data.get("causes", []),
                    "country": hit.form_data.get("country"),
                }
            )

        client_rows = []
        for hit in client_hits:
            client_rows.append(
                {
                    "id": hit.id,
                    "form_type": hit.form_type,
                    "score": round(hit.score, 4),
                    "distance": round(hit.distance, 4),
                    "causes": hit.form_data.get("causes", []),
                    "planning_area": hit.form_data.get("planning_area"),
                }
            )

        return {
            "query_cause": cause,
            "donor_results": donor_rows,
            "client_results": client_rows,
            "total_donors": len(donor_hits),
            "total_clients": len(client_hits),
        }
    except Exception as e:
        import traceback

        return {"error": str(e), "traceback": traceback.format_exc()}


# ============================================================================
# Main
# ============================================================================

# Script entry point: serve the app with uvicorn when this file is run directly.
if __name__ == "__main__":
    # Imported here so uvicorn is only needed when running as a script.
    import uvicorn

    # Windows-specific fix: must be set before uvicorn starts its event loop
    # (same selector-loop policy the module applies at import time for psycopg).
    if sys.platform == "win32":
        asyncio.set_event_loop_policy(asyncio.WindowsSelectorEventLoopPolicy())

    # Listen on all interfaces, port 7860.
    uvicorn.run(app, host="0.0.0.0", port=7860)