"""
src/graphs/graph_factory.py

Factory function that builds a LangGraph StateGraph for any medical specialty.
Architecture: __start__ → information_retrieval → interpretation_generation → __end__
"""
from __future__ import annotations

import json
from typing import Any, Dict, List

from langchain_core.messages import AIMessage, HumanMessage
from langgraph.graph import END, StateGraph

from src.llms.groqllm import GroqLLM
from src.states.expert_subgraph_state import ExpertSubgraphState
from src.utils.prompts import get_expert_prompt
from src.utils.utils import EXPERT_TOOLS, get_today_str
from src.utils.vector_store import get_history, save_interpretation
from src.utils.db import insert_interpretation


def _as_mapping(value: Any) -> Dict[str, Any]:
    """Return *value* when it is a dict, otherwise a fresh empty dict."""
    return value if isinstance(value, dict) else {}


def _augment_with_ml_models(specialty: str, telemetry: Dict[str, Any]) -> Dict[str, str]:
    """
    Collect structured-model outputs (ECGFounder, respiratory CNN, fetal
    health, retinal classifiers, …) for the given specialty.

    Each branch gates on (a) a substring match against ``specialty``,
    (b) ``adapter.is_loaded`` and, where the code checks for it, (c) the
    snapshot carrying the modality data the adapter needs. Every adapter
    import + call lives in its own try/except, so one failing adapter
    never prevents the others from running; failures are logged at DEBUG
    level rather than dropped silently.

    Malformed snapshot blocks (e.g. ``imaging`` arriving as a list, or
    ``imaging["retinal"]`` as a bare string) are treated as absent instead
    of raising, so the per-adapter isolation also holds for bad input.

    Args:
        specialty: Specialty name; matched by substring ("Cardiology",
            "Pulmonary"/"Respiratory", "Neurology", "Dermatology",
            "Obstetrics"/"Gynecology", "Ocul…"). A falsy value matches
            nothing.
        telemetry: Telemetry snapshot. ``None`` or a non-dict value is
            treated as an empty snapshot.

    Returns:
        A dict of extra ``{tool_name: json_string}`` entries — empty when
        no adapter produced a prediction.
    """
    import logging

    logger = logging.getLogger(__name__)

    def log_skip(adapter_name: str) -> None:
        # Called from inside an ``except`` block, so exc_info picks up the
        # active exception. DEBUG keeps the "weights/module not available"
        # case quiet in normal operation.
        logger.debug(
            "ML adapter %s skipped for specialty %r",
            adapter_name,
            specialty,
            exc_info=True,
        )

    extras: Dict[str, str] = {}
    specialty = specialty or ""
    telemetry = _as_mapping(telemetry)
    waveform = _as_mapping(telemetry.get("waveform"))

    # ── Cardiology ───────────────────────────────────────────────────
    if "Cardiology" in specialty:
        if waveform:
            try:
                # numpy is only needed by the waveform adapters, so import it
                # here: a missing numpy must not disable the tabular adapters.
                import numpy as np
                from src.ml.ecgfounder_adapter import get_ecgfounder
                adapter = get_ecgfounder()
                if adapter.is_loaded and waveform.get("ecg_lead2"):
                    signal = np.asarray(waveform["ecg_lead2"], dtype=float)
                    pred = adapter.classify(signal, fs=waveform.get("fs", 40))
                    if pred is not None:
                        extras["ecgfounder_classification"] = json.dumps(pred)
            except Exception:
                log_skip("ecgfounder")
        # ECG arrhythmia tabular baseline — runs even without waveforms
        try:
            from src.ml.ecg_arrhythmia_adapter import get_ecg_arrhythmia
            adapter = get_ecg_arrhythmia()
            if adapter.is_loaded:
                pred = adapter.predict_dict(telemetry)
                if pred is not None:
                    extras["ecg_arrhythmia_prediction"] = json.dumps(pred)
        except Exception:
            log_skip("ecg_arrhythmia")
        # Cardiac age regression with delta-vs-chronological
        try:
            from src.ml.cardiac_age_adapter import get_cardiac_age
            adapter = get_cardiac_age()
            if adapter.is_loaded:
                pred = adapter.predict_with_chrono(telemetry)
                if pred is not None:
                    extras["cardiac_age_prediction"] = json.dumps(pred)
        except Exception:
            log_skip("cardiac_age")

    # ── Pulmonary ────────────────────────────────────────────────────
    if "Pulmonary" in specialty or "Respiratory" in specialty:
        if waveform:
            try:
                import numpy as np
                from src.ml.pulmonary_classifier import get_pulmonary_classifier
                clf = get_pulmonary_classifier()
                if clf.is_loaded and waveform.get("audio"):
                    audio = np.asarray(waveform["audio"], dtype=float)
                    # NOTE(review): the fallback sample rate (40) is the same
                    # one used for ECG above — confirm it is right for audio.
                    pred = clf.predict(audio, fs=waveform.get("fs", 40))
                    if pred is not None:
                        extras["respiratory_cnn_classification"] = json.dumps({
                            "label": pred.label,
                            "probs": pred.probs,
                            "confidence": pred.confidence,
                        })
            except Exception:
                log_skip("pulmonary_classifier")
        # Patient-level lung-sound diagnostic (Healthy / COPD / Asthma / etc.)
        try:
            from src.ml.lung_sound_adapter import get_lung_sound
            adapter = get_lung_sound()
            if adapter.is_loaded:
                pred = adapter.predict_dict(telemetry)
                if pred is not None:
                    extras["lung_sound_prediction"] = json.dumps(pred)
        except Exception:
            log_skip("lung_sound")

    # ── Neurology ────────────────────────────────────────────────────
    if "Neurology" in specialty:
        # Parkinson screener — only runs when voice features are supplied
        # (skipped when telemetry has no voice block; the adapter returns None)
        try:
            from src.ml.parkinson_screener_adapter import get_parkinson_screener
            adapter = get_parkinson_screener()
            if adapter.is_loaded:
                pred = adapter.predict_dict(telemetry)
                if pred is not None:
                    extras["parkinson_screener_prediction"] = json.dumps(pred)
        except Exception:
            log_skip("parkinson_screener")

    # ── Dermatology ──────────────────────────────────────────────────
    if "Dermatology" in specialty:
        imaging = _as_mapping(telemetry.get("imaging"))
        skin_path = _as_mapping(imaging.get("skin")).get("image_path")
        demographics = telemetry.get("patient") or {}
        try:
            from src.ml.skin_disease_adapter import get_skin_disease
            adapter = get_skin_disease()
            if adapter.is_loaded:
                pred = adapter.predict_with_image(demographics, image_path=skin_path)
                if pred is not None:
                    extras["skin_disease_prediction"] = json.dumps(pred)
        except Exception:
            log_skip("skin_disease")

    # ── Obstetrics: fetal_health + preterm_labour ────────────────────
    if "Obstetrics" in specialty or "Gynecology" in specialty:
        fetal_block = telemetry.get("fetal") or {}
        if fetal_block:
            try:
                from src.ml.fetal_health_adapter import get_fetal_health
                adapter = get_fetal_health()
                if adapter.is_loaded:
                    pred = adapter.predict_dict(fetal_block)
                    if pred is not None:
                        extras["fetal_health_prediction"] = json.dumps(pred)
            except Exception:
                log_skip("fetal_health")
            try:
                from src.ml.preterm_labour_adapter import get_preterm_labour
                adapter = get_preterm_labour()
                if adapter.is_loaded:
                    pred = adapter.predict_dict({
                        "fetal": fetal_block,
                        "patient": telemetry.get("patient") or {},
                    })
                    if pred is not None:
                        extras["preterm_labour_prediction"] = json.dumps(pred)
            except Exception:
                log_skip("preterm_labour")

    # ── Ocular: retinal_disease + retinal_age ────────────────────────
    # "Ocul" is a substring of "Ocular", so one test covers both spellings.
    if "Ocul" in specialty:
        imaging = _as_mapping(telemetry.get("imaging"))
        retinal_path = _as_mapping(imaging.get("retinal")).get("image_path")
        demographics = telemetry.get("patient") or {}
        if demographics or retinal_path:
            try:
                from src.ml.retinal_disease_adapter import get_retinal_disease
                adapter = get_retinal_disease()
                if adapter.is_loaded:
                    pred = adapter.predict_with_image(demographics, image_path=retinal_path)
                    if pred is not None:
                        extras["retinal_disease_prediction"] = json.dumps(pred)
            except Exception:
                log_skip("retinal_disease")
            try:
                from src.ml.retinal_age_adapter import get_retinal_age
                adapter = get_retinal_age()
                if adapter.is_loaded:
                    pred = adapter.predict_with_image(demographics, image_path=retinal_path)
                    if pred is not None:
                        extras["retinal_age_prediction"] = json.dumps(pred)
            except Exception:
                log_skip("retinal_age")

    return extras

def _get_model(specialty: str = None):
    """Build and return a fresh LLM for *specialty* via ``GroqLLM``.

    Intentionally not cached at module level: different specialties may
    use different keys, so a single shared instance would be wrong.
    """
    provider = GroqLLM(specialty)
    return provider.get_llm()


# ─── Node Factories ─────────────────────────────────────────────────────────


def _make_information_retrieval(specialty: str):
    """
    Build the ``information_retrieval`` node bound to one specialty.

    What the returned node does:
      • When ``state["sensor_telemetry"]` carries at least one non-empty
        ``vitals`` / ``waveform`` / ``imaging`` / ``fetal`` section, the
        mock retrieval tools are NOT run. A single ``live_telemetry``
        note is recorded instead, pointing the LLM at the telemetry
        context block of the prompt, so fabricated tool values cannot
        contradict the live data.
      • Otherwise every tool registered for the specialty in
        ``EXPERT_TOOLS`` is invoked with an empty input; a tool that
        raises contributes an ``"ERROR: …"`` string rather than failing
        the node.
      • In both cases the outputs of ``_augment_with_ml_models`` are
        merged in on a best-effort basis (any exception is ignored).

    The node returns ``tool_results``, a status ``AIMessage`` and one
    trace entry describing which result keys were produced.
    """
    specialty_tools = EXPERT_TOOLS.get(specialty, [])
    snapshot_sections = ("vitals", "waveform", "imaging", "fetal")

    def information_retrieval(state: ExpertSubgraphState) -> Dict[str, Any]:
        snapshot = state.get("sensor_telemetry") or {}
        # A snapshot only counts when one of the known sections has data.
        snapshot_present = bool(snapshot) and any(
            bool(snapshot.get(section)) for section in snapshot_sections
        )

        collected: Dict[str, str] = {}

        if not snapshot_present:
            # Nothing live to look at — fall back to the mock tools so the
            # LLM has structured input instead of an empty result set.
            for tool in specialty_tools:
                try:
                    output = tool.invoke({})
                    collected[tool.name] = output
                except Exception as exc:
                    collected[tool.name] = f"ERROR: {exc}"
        else:
            # Live data wins: leave the mock tools out and point the LLM
            # at the telemetry block of the prompt.
            collected["live_telemetry"] = (
                "Live telemetry attached to this request — see "
                "## LIVE TELEMETRY CONTEXT in the prompt below. Trust "
                "those numeric values over any other defaults."
            )

        # ML-adapter predictions are merged regardless of which branch ran;
        # a failure here must never take the node down.
        try:
            collected.update(_augment_with_ml_models(specialty, snapshot))
        except Exception:
            pass

        status_note = AIMessage(
            content=f"[{specialty}] Information retrieval complete. "
            f"{len(collected)} tools executed."
        )
        trace_entry = {
            "step": "information_retrieval",
            "specialty": specialty,
            "tools_called": list(collected.keys()),
            "snapshot_present": snapshot_present,
        }
        return {
            "tool_results": collected,
            "messages": [status_note],
            "traces": [trace_entry],
        }

    return information_retrieval


def _content_to_text(content: Any) -> str:
    """Flatten a message ``content`` value into plain text.

    Strings pass through unchanged and ``None`` becomes ``""``. A list is
    treated as a sequence of content parts: plain strings are kept, dict
    parts contribute their ``"text"`` value when that is a string, and the
    pieces are joined with newlines. Anything else goes through ``str()``.
    """
    if content is None:
        return ""
    if isinstance(content, str):
        return content
    if isinstance(content, list):
        pieces = []
        for part in content:
            if isinstance(part, str):
                pieces.append(part)
            elif isinstance(part, dict) and isinstance(part.get("text"), str):
                pieces.append(part["text"])
        return "\n".join(pieces)
    return str(content)


def _latest_user_message(messages: List[Any]) -> str:
    """Return the stripped text of the most recent user/human message, or ``""``."""
    # Walk backwards: the information_retrieval node appends its own
    # AIMessage after the user's question, so messages[-1] is the status
    # note, not the question.
    for msg in reversed(messages):
        if isinstance(msg, dict):
            role = msg.get("role") or msg.get("type") or ""
            content = msg.get("content", "")
        else:
            # langchain BaseMessage: HumanMessage.type == "human"
            role = getattr(msg, "type", "") or msg.__class__.__name__.lower()
            content = getattr(msg, "content", "")
        if role in ("user", "human", "humanmessage") and content:
            return _content_to_text(content).strip()
    return ""


def _parse_llm_payload(content: str, domain: str) -> Dict[str, Any]:
    """Extract the JSON object from an LLM reply, with a plain-text fallback.

    The span from the first ``{`` to the last ``}`` is parsed as JSON. If
    that fails, or the decoded value is not an object, the reply text
    (truncated to 1000 characters) is wrapped in a minimal payload instead.
    """
    import re

    text = content.strip()
    # Greedy match from first { to last }
    match = re.search(r"\{.*\}", text, re.DOTALL)
    candidate = match.group(0) if match else text
    try:
        parsed = json.loads(candidate)
    except (ValueError, RecursionError):
        # json.JSONDecodeError is a ValueError; RecursionError covers
        # pathologically nested input.
        parsed = None
    if isinstance(parsed, dict):
        return parsed
    # Also reached for valid-but-non-object JSON such as `42` or `"text"`.
    return {
        "expert": domain,
        "finding": text[:1000] + "..." if len(content) > 1000 else text,
        "severity": "unknown",
        "severity_score": 0.0,
        "confidence": 0.5,
    }


def _coerce_score(value: Any, default: float = 0.0) -> float:
    """Return *value* as a number; fall back to *default* when it is not numeric."""
    if isinstance(value, (int, float)):
        return value
    try:
        return float(value)
    except (TypeError, ValueError):
        return default


def _finding_text(finding: Any, fallback: str) -> str:
    """Return the ``finding`` field as a string (*fallback* when it is ``None``)."""
    if finding is None:
        return fallback
    if isinstance(finding, str):
        return finding
    if isinstance(finding, (dict, list)):
        return json.dumps(finding, ensure_ascii=False)
    return str(finding)


def _make_interpretation_generation(specialty: str):
    """
    Creates the interpretation_generation node for a given specialty.

    The returned node:
      1. Pulls the latest user question, tool results, shared context and
         telemetry out of the state.
      2. Retrieves prior session history via ``get_history`` (queried with
         the user's question when there is one).
      3. Builds the expert prompt with ``get_expert_prompt``, appends the
         user question, and invokes the specialty's LLM.
      4. Parses the reply into a ``final_expert_analysis`` dict. Non-object
         JSON, a non-string ``finding`` and a non-numeric
         ``severity_score`` are normalised instead of raising.
      5. Persists a summary via ``save_interpretation`` and
         ``insert_interpretation``. Both writes are best-effort: failures
         are logged as warnings and never fail the node.

    If the LLM call itself raises, the node returns an ``error_message``
    plus a placeholder analysis rather than propagating the exception.
    """
    import logging

    logger = logging.getLogger(__name__)

    def interpretation_generation(state: ExpertSubgraphState) -> Dict[str, Any]:
        domain = state.get("expert_domain") or specialty
        tool_results = state.get("tool_results") or {}
        shared = state.get("shared_context") or {}
        telemetry = state.get("sensor_telemetry") or {}

        # Pull the user's actual question out of state["messages"] so it
        # reaches the LLM. Without this the chat is just a generic
        # assessment regardless of what was typed.
        user_message = _latest_user_message(state.get("messages") or [])

        # Format tool results for the prompt
        tool_results_str = "\n".join(
            f"### {name}\n```json\n{result}\n```" for name, result in tool_results.items()
        )

        # Get patient ID for history lookup (from shared context or default)
        patient_id = shared.get("patient_id", "default_patient")

        # Retrieve past session history from vector store. RAG against the
        # user's question when present so the most relevant prior
        # interpretations come back first.
        rag_query = user_message or f"{domain} assessment current session"
        history = get_history(
            specialty=specialty,
            patient_id=patient_id,
            query=rag_query,
            k=5,
        )

        # Build the patient profile string. Accept either patient_profile
        # (current) or patient_base (legacy field name).
        patient_profile = (
            shared.get("patient_profile")
            or shared.get("patient_base")
            or ""
        )
        if isinstance(patient_profile, dict):
            patient_profile = json.dumps(patient_profile, indent=2)

        # Telemetry context — prefer the snapshot the client attached
        # (mobile sends real vest readings) over the mock tool defaults.
        telemetry_str = json.dumps(telemetry, indent=2) if telemetry else ""

        # Assemble the base expert system prompt (telemetry, tools, KB, history).
        system_prompt = get_expert_prompt(
            specialty=specialty,
            tool_results=tool_results_str,
            history=history if history else None,
            patient_profile=str(patient_profile),
            telemetry_context=telemetry_str,
        )

        # Append the user's question. Frame the JSON 'finding' field as
        # a direct, conversational answer rather than a generic write-up.
        if user_message:
            system_prompt += f"""

## USER QUESTION
The patient (or clinician) has asked the following. Answer it directly,
grounding every claim in the live telemetry, tool results, patient
profile, and clinical reference knowledge above. The 'finding' field
of your JSON output must be a substantive answer to THIS specific
question — not a generic assessment.

QUESTION: {user_message}
"""

        # Call the LLM
        try:
            resp = _get_model(specialty).invoke(
                [HumanMessage(content=system_prompt)]
            )
            # The reply content may be a list of parts rather than a plain
            # string; flatten it so the string handling below cannot raise.
            content = _content_to_text(getattr(resp, "content", None) or str(resp))
        except Exception as e:
            return {
                "error_message": f"{type(e).__name__}: {e}",
                "final_expert_analysis": {
                    "expert_domain": domain,
                    "clinical_findings": f"Interpretation failed: {e}",
                    "anomaly_detected": False,
                    "confidence_score": 0.0,
                },
                "messages": [
                    AIMessage(content=f"[{domain}] Interpretation generation failed.")
                ],
            }

        # Parse the LLM response (robust JSON extraction); always a dict.
        parsed = _parse_llm_payload(content, domain)

        # Normalise the two fields the rest of the node does arithmetic or
        # string operations on, so malformed model output cannot crash it.
        severity_score = _coerce_score(parsed.get("severity_score", 0.0))
        findings = _finding_text(parsed.get("finding"), content)

        # Build the final analysis
        analysis = {
            "expert_domain": domain,
            "clinical_findings": findings,
            "severity": parsed.get("severity", "unknown"),
            "severity_score": severity_score,
            "key_observations": parsed.get("key_observations", []),
            "recommendations": parsed.get("recommendations", []),
            "confidence_score": parsed.get("confidence", 0.6),
            "anomaly_detected": severity_score >= 5,
            "generated_at": get_today_str(),
        }

        # Save interpretation summary to vector store for future sessions
        summary = (
            f"[{domain}] Severity: {analysis['severity']} "
            f"(score: {analysis['severity_score']}). "
            f"Findings: {findings[:300]}"
        )
        try:
            save_interpretation(
                specialty=specialty,
                patient_id=patient_id,
                interpretation=content,
                summary=summary,
                metadata={
                    "severity": analysis["severity"],
                    "severity_score": analysis["severity_score"],
                    "generated_at": analysis["generated_at"],
                },
            )
        except Exception:
            # Don't fail the node if the vector store write fails
            logger.warning(
                "Vector-store save failed for specialty %r", specialty, exc_info=True
            )

        try:
            insert_interpretation(
                specialty=specialty,
                findings=analysis["clinical_findings"],
                severity=analysis["severity"],
                severity_score=analysis["severity_score"],
            )
        except Exception:
            # Same best-effort policy for the database write.
            logger.warning(
                "Database insert failed for specialty %r", specialty, exc_info=True
            )

        return {
            "final_expert_analysis": analysis,
            "messages": [
                AIMessage(content=findings.strip())
            ],
            "traces": [
                {
                    "step": "interpretation_generation",
                    "specialty": specialty,
                    "severity": analysis["severity"],
                    "severity_score": analysis["severity_score"],
                }
            ],
        }

    return interpretation_generation


# ─── Graph Builder ───────────────────────────────────────────────────────────


def build_expert_graph(specialty: str) -> StateGraph:
    """
    Assemble the two-node expert pipeline for one medical specialty.

    Topology:
        __start__ → information_retrieval → interpretation_generation → __end__

    Args:
        specialty: Key from EXPERT_TOOLS / EXPERT_SYSTEM_PROMPTS

    Returns:
        The StateGraph builder, not yet compiled — call .compile() on it.
    """
    graph = StateGraph(ExpertSubgraphState)

    # Node name → specialty-bound node function, in registration order.
    nodes = (
        ("information_retrieval", _make_information_retrieval(specialty)),
        ("interpretation_generation", _make_interpretation_generation(specialty)),
    )
    for node_name, node_fn in nodes:
        graph.add_node(node_name, node_fn)

    # Strictly linear flow from entry to exit.
    edges = (
        ("__start__", "information_retrieval"),
        ("information_retrieval", "interpretation_generation"),
        ("interpretation_generation", END),
    )
    for source, target in edges:
        graph.add_edge(source, target)

    return graph