"""
Extreme Heat Risk Engine — FastAPI Application

Serves synthetic demo data for the dashboard.
When the real pipeline has been run, serves pipeline results instead.
"""

try:
    from dotenv import load_dotenv
    load_dotenv()
except ImportError:
    pass

import asyncio
import logging
import os
import random
import threading
from contextlib import asynccontextmanager
from datetime import datetime, timedelta
from pathlib import Path

from fastapi import FastAPI, BackgroundTasks
from fastapi.middleware.cors import CORSMiddleware
from fastapi.responses import HTMLResponse

from config import ZONES, ZONE_MAP, CITIES, HEAT_THRESHOLDS, PAYOUT_PER_EVENT_USD
from src.indexing.heat_index import calculate_wbgt, calculate_heat_index, count_consecutive_days, count_trigger_days
from src.downscaling import get_uhi_corrector
from src.pricing.burn_analysis import BurnAnalysisPricer
from src.pricing.budget_optimizer import BudgetOptimizer
from src.database.crud import init_db, upsert_zone

# Module-level logger, named after this module.
logger = logging.getLogger(__name__)

# Database connection handle. Assigned by lifespan() at startup (left as None
# when init_db() raises or returns a falsy value), replaced by the pipeline
# runner when a reconnect is needed, and closed by lifespan() at shutdown.
_db_conn = None


def _prewarm_graphcast() -> None:
    """Warm up the GraphCast model ahead of the first pipeline trigger.

    Meant to be run on a background thread at startup so the ~30-120s
    download/init cost is paid before a pipeline run needs the model.
    Every exception is logged as a warning and swallowed, so a failed
    prewarm never takes the application down.
    """
    try:
        import time as _time
        from src.prediction.graphcast_inference import load_model

        started_at = _time.time()
        load_model()
        elapsed_s = _time.time() - started_at
        logger.info("[PREWARM] GraphCast loaded at startup (%.1fs)", elapsed_s)
    except Exception as err:
        logger.warning("[PREWARM] GraphCast prewarm threw: %s", err)


@asynccontextmanager
async def lifespan(app: FastAPI):
    """Application lifespan: start shared resources, then release them.

    Startup:
      1. Initialise the database (synchronously) and seed one row per
         configured zone. Any failure here is logged and treated as
         non-fatal; the app then runs with ``_db_conn`` set to ``None``.
      2. Kick off the GraphCast prewarm on a daemon thread.
      3. Start the scheduler.

    Shutdown (always executed, including when startup of the scheduler
    fails or the serving phase is interrupted): stop the scheduler without
    waiting for running jobs and close the database connection.
    """
    global _db_conn
    # Sync DB init — same pattern as Weather AI 2
    try:
        _db_conn = init_db()
        if _db_conn:
            seeded = 0
            for z in ZONES:
                try:
                    upsert_zone(_db_conn, {
                        "zone_id": z.zone_id, "name": z.name, "city": z.city,
                        "country": z.country, "latitude": z.latitude,
                        "longitude": z.longitude, "elevation_m": z.elevation_m,
                        "area_km2": z.area_km2, "population_est": z.population_est,
                        "settlement_type": z.settlement_type,
                        "worker_population_est": z.worker_population_est,
                        "outdoor_exposure_pct": z.outdoor_exposure_pct,
                        "heat_vulnerability": z.heat_vulnerability,
                        "hot_months": z.hot_months, "notes": z.notes,
                    })
                    seeded += 1
                except Exception as exc:
                    logger.warning("Failed to seed zone %s: %s", z.zone_id, exc)
            # Report how many zones were actually written, not how many
            # were attempted, so partial seeding is visible in the log.
            logger.info("Database ready (postgres, %d zones seeded)", seeded)
        else:
            logger.info("Database ready (in-memory)")
    except Exception as e:
        logger.warning("DB init failed (non-fatal): %s", e)
        _db_conn = None

    prewarm_thread = threading.Thread(
        target=_prewarm_graphcast, daemon=True, name="graphcast-prewarm",
    )
    prewarm_thread.start()

    scheduler = None
    try:
        scheduler = _start_scheduler()
        yield
    finally:
        # Teardown lives in ``finally`` so the scheduler and the DB
        # connection are released even if the scheduler fails to start or
        # an exception/cancellation is raised at the ``yield`` point.
        if scheduler:
            scheduler.shutdown(wait=False)
        if _db_conn:
            _db_conn.close()


app = FastAPI(title="Extreme Heat Risk Engine", version="1.0.0", lifespan=lifespan)

# CORS origins configurable via ALLOWED_ORIGINS (comma-separated).
# Defaults to "*" so local dev and HF Spaces preview stay permissive.
_allowed_origins_env = os.environ.get("ALLOWED_ORIGINS", "*").strip()
if _allowed_origins_env == "*" or not _allowed_origins_env:
    _allowed_origins = ["*"]
else:
    _allowed_origins = [o.strip() for o in _allowed_origins_env.split(",") if o.strip()]

# Credentialed cross-origin requests are only enabled when explicit origins
# are configured. The FastAPI CORS documentation states that a wildcard
# origin must not be combined with allow_credentials=True; doing so would
# effectively let any site make credentialed requests to this API.
_cors_allow_credentials = "*" not in _allowed_origins

app.add_middleware(
    CORSMiddleware,
    allow_origins=_allowed_origins,
    allow_credentials=_cors_allow_credentials,
    allow_methods=["*"],
    allow_headers=["*"],
)

# Fixed seed for the random.Random instance that drives the synthetic demo
# data, so repeated generations draw the same pseudo-random sequence.
SEED = 42


def _generate_demo_data():
    """Build the synthetic dataset served by the dashboard demo endpoints.

    A single ``random.Random(SEED)`` instance and a fixed reference time
    (2026-03-29 10:00) drive every pseudo-random draw, so the draw sequence
    is repeatable. Because all sections share that one generator, the ORDER
    of the ``rng`` calls below determines every generated value — reordering
    statements changes the output.

    Temperatures are passed through the UHI corrector returned by
    ``get_uhi_corrector()``; the result therefore also depends on that
    corrector (NOTE(review): confirm it is deterministic for a fixed input).

    Returns:
        dict with the keys ``zones``, ``indices``, ``triggers``,
        ``basis_risk``, ``notifications``, ``pipeline_runs`` and ``stats``.

    Raises:
        KeyError: if a zone's city is missing from the local climate table
            or its ``heat_vulnerability`` is not high/moderate/low.
    """
    rng = random.Random(SEED)
    # Fixed "current time" so generated dates do not drift between runs.
    now = datetime(2026, 3, 29, 10, 0, 0)

    # Initialize ML models (UHI_MODEL env var selects synthetic or lst)
    uhi_corrector = get_uhi_corrector()

    # City base temperatures (ERA5-Land grid-level — before UHI correction)
    city_climate = {
        "Dar es Salaam": {"base_temp": 31, "temp_var": 2.5, "base_hum": 78, "hum_var": 8},
        "Kampala": {"base_temp": 28, "temp_var": 2.5, "base_hum": 68, "hum_var": 10},
        "Nairobi": {"base_temp": 25, "temp_var": 2.5, "base_hum": 55, "hum_var": 12},
        "Kigali": {"base_temp": 25, "temp_var": 2, "base_hum": 60, "hum_var": 10},
    }

    # Generate 90 days of daily data per zone
    zones = []
    indices = []
    all_triggers = []
    tid = 1  # running counter for trigger IDs (TRG-0001, TRG-0002, ...)

    for z in ZONES:
        clim = city_climate[z.city]

        # Parallel per-day series; index i refers to the same day in each list.
        daily_grid_temps = []
        daily_temps = []
        daily_humidity = []
        daily_dates = []
        daily_wbgt = []
        daily_hi = []
        daily_uhi_deltas = []

        for d in range(90):
            # d=0 is 89 days before `now`; d=89 is `now` itself.
            date = now - timedelta(days=89 - d)
            month = date.month
            # Warm bias in the zone's configured hot months, cool bias otherwise.
            seasonal = 1.5 if month in z.hot_months else -0.5
            # Grid-level temperature (ERA5-Land equivalent — before UHI)
            grid_temp = clim["base_temp"] + seasonal + rng.gauss(0, clim["temp_var"] * 0.4)
            # Clamp to the range [18, 42].
            grid_temp = round(max(18, min(42, grid_temp)), 1)
            hum = clim["base_hum"] + rng.gauss(0, clim["hum_var"] * 0.3)
            # Clamp humidity to the range [30, 95].
            hum = round(max(30, min(95, hum)), 1)
            # ML UHI correction
            corrected, uhi_delta, _ = uhi_corrector.correct_temperature(z, grid_temp, hour=14, month=month)
            temp = round(corrected, 1)
            daily_grid_temps.append(grid_temp)
            # Heat indices are computed from the UHI-corrected temperature.
            wbgt = calculate_wbgt(temp, hum)
            hi = calculate_heat_index(temp, hum)

            daily_temps.append(temp)
            daily_humidity.append(hum)
            daily_dates.append(date.strftime("%Y-%m-%d"))
            daily_wbgt.append(wbgt)
            daily_hi.append(hi)
            daily_uhi_deltas.append(round(uhi_delta, 1))

        max_temp = max(daily_temps)
        max_wbgt = max(daily_wbgt)
        # "Recent" means the last 7 days of the 90-day window.
        recent_temps = daily_temps[-7:]
        recent_wbgt = daily_wbgt[-7:]
        current_temp = daily_temps[-1]
        current_wbgt = daily_wbgt[-1]
        current_hi = daily_hi[-1]
        watch_temp = HEAT_THRESHOLDS["watch"]["temp_c"]
        consec = count_consecutive_days(recent_temps, watch_temp)
        total_above = count_trigger_days(daily_temps, watch_temp)

        # Risk level from config thresholds. Levels are tested from most to
        # least severe and the first one whose temperature AND
        # consecutive-day requirements are both met wins.
        recent_max = max(recent_temps)
        risk_level = "normal"
        for level in ("critical", "warning", "watch"):
            ht = HEAT_THRESHOLDS[level]
            if recent_max >= ht["temp_c"] and consec >= ht["consecutive_days"]:
                risk_level = level
                break

        # Composite score: weighted blend of five components
        # (weights 0.3 / 0.25 / 0.2 / 0.15 / 0.1), clamped to [0, 100].
        temp_score = min(100, max(0, (max_temp - 28) * 10))
        wbgt_score = min(100, max(0, (max_wbgt - 25) * 12))
        vuln_score = {"high": 85, "moderate": 50, "low": 20}[z.heat_vulnerability]
        exposure_score = z.outdoor_exposure_pct * 100
        composite = round(temp_score * 0.3 + wbgt_score * 0.25 + consec * 10 * 0.2 + vuln_score * 0.15 + exposure_score * 0.1, 1)
        composite = min(100, max(0, composite))

        # Enrolment is a random 15-45% share of the zone's worker population.
        enrolled = int(z.worker_population_est * rng.uniform(0.15, 0.45))

        # Composite-driven trigger probability for demo shape. Not a model output.
        pred_prob = round(min(1.0, composite / 100), 2)
        pred_conf = 0.5
        pred_tier = "composite_heuristic"

        zone_data = {
            "zone_id": z.zone_id,
            "name": z.name,
            "city": z.city,
            "country": z.country,
            "latitude": z.latitude,
            "longitude": z.longitude,
            "elevation_m": z.elevation_m,
            "settlement_type": z.settlement_type,
            "worker_population_est": z.worker_population_est,
            "outdoor_exposure_pct": z.outdoor_exposure_pct,
            "heat_vulnerability": z.heat_vulnerability,
            "risk_level": risk_level,
            "current_temp_c": current_temp,
            "current_wbgt_c": current_wbgt,
            "current_heat_index_c": current_hi,
            "max_temp_c": round(max_temp, 1),
            "max_wbgt_c": round(max_wbgt, 1),
            "consecutive_hot_days": consec,
            # NOTE(review): the key says "33" but the count uses the watch
            # threshold from HEAT_THRESHOLDS — confirm the two agree.
            "total_days_above_33": total_above,
            "heat_risk_score": composite,
            "grid_temp_c": daily_grid_temps[-1],
            "uhi_delta_c": daily_uhi_deltas[-1],
            # `temp` is left over from the final iteration of the day loop,
            # so it holds the same value as current_temp.
            "corrected_temp_c": temp,
            "trigger_probability_7d": round(pred_prob, 2),
            "prediction_confidence": round(pred_conf, 2),
            "model_tier": pred_tier,
            "enrolled_workers": enrolled,
            "data_quality": round(rng.uniform(0.80, 0.98), 2),
            "last_updated": now.isoformat(),
        }
        zones.append(zone_data)

        # Index data with daily history
        indices.append({
            "zone_id": z.zone_id,
            "zone_name": z.name,
            "city": z.city,
            "risk_level": risk_level,
            "temp_current": current_temp,
            "wbgt_current": current_wbgt,
            "heat_index_current": current_hi,
            "consecutive_hot_days": consec,
            "heat_risk_score": composite,
            "grid_temp_c": daily_grid_temps[-1],
            "uhi_delta_c": daily_uhi_deltas[-1],
            "trigger_probability_7d": round(pred_prob, 2),
            "prediction_confidence": round(pred_conf, 2),
            "model_tier": pred_tier,
            # One record per generated day, oldest first.
            "daily_history": [
                {"date": daily_dates[i], "temp_c": daily_temps[i], "grid_temp_c": daily_grid_temps[i], "uhi_delta_c": daily_uhi_deltas[i], "humidity_pct": daily_humidity[i], "wbgt_c": daily_wbgt[i], "heat_index_c": daily_hi[i]}
                for i in range(90)
            ],
        })

        # Triggers: one active trigger per zone whose risk level is not normal.
        if risk_level != "normal":
            # Falls back to 5 when the level has no configured payout.
            payout = PAYOUT_PER_EVENT_USD.get(risk_level, 5)
            all_triggers.append({
                "trigger_id": f"TRG-{tid:04d}",
                "zone_id": z.zone_id,
                "zone_name": z.name,
                "city": z.city,
                "trigger_level": risk_level,
                # Trigger time is a random 2-48 hours before `now`.
                "trigger_date": (now - timedelta(hours=rng.randint(2, 48))).isoformat(),
                "heat_risk_score": composite,
                "max_temp_c": round(max_temp, 1),
                "max_wbgt_c": round(max_wbgt, 1),
                "consecutive_days": consec,
                "total_days_above": total_above,
                "settlement_type": z.settlement_type,
                "payout_per_worker_usd": payout,
                "enrolled_workers": enrolled,
                "total_payout_usd": payout * enrolled,
                "status": "active",
            })
            tid += 1

    # Basis risk: a random score per zone, drawn from a range that widens
    # with heat vulnerability (and further for informal settlements).
    basis_risk = []
    for z_data in zones:
        zone_obj = ZONE_MAP[z_data["zone_id"]]
        if zone_obj.heat_vulnerability == "high" and zone_obj.settlement_type == "informal":
            score = rng.uniform(0.25, 0.40)
        elif zone_obj.heat_vulnerability == "high":
            score = rng.uniform(0.18, 0.32)
        elif zone_obj.heat_vulnerability == "moderate":
            score = rng.uniform(0.10, 0.22)
        else:
            score = rng.uniform(0.05, 0.15)
        basis_risk.append({
            "zone_id": z_data["zone_id"],
            "zone_name": z_data["name"],
            "city": z_data["city"],
            "overall_score": round(score, 3),
            "false_positive_rate": round(score * rng.uniform(0.4, 0.7), 3),
            "false_negative_rate": round(score * rng.uniform(0.3, 0.6), 3),
            "correlation": round(1 - score * rng.uniform(0.8, 1.1), 3),
            "settlement_type": z_data["settlement_type"],
            "heat_vulnerability": z_data["heat_vulnerability"],
            # Chained conditional: informal settlements get the first text;
            # otherwise a score above 0.2 gets the second; else the third.
            "recommendation": (
                "Urban heat island effect significant — consider localized temperature sensors"
                if zone_obj.settlement_type == "informal"
                else "Station temperature may underestimate worker-experienced heat by 2-3°C"
                if score > 0.2
                else "Current calibration adequate for this zone"
            ),
        })

    # Notifications: only critical/warning triggers notify. Each such
    # trigger yields two records — one with a random channel and language
    # (English message text) and one fixed SMS in Swahili.
    notifications = []
    nid = 1  # running counter for notification IDs (NOT-0001, ...)
    for trigger in all_triggers:
        if trigger["trigger_level"] in ("critical", "warning"):
            notifications.append({
                "id": f"NOT-{nid:04d}",
                "zone_id": trigger["zone_id"],
                "zone_name": trigger["zone_name"],
                "city": trigger["city"],
                "trigger_level": trigger["trigger_level"],
                "channel": rng.choice(["sms", "whatsapp"]),
                "language": rng.choice(["en", "sw"]),
                "recipient_count": trigger["enrolled_workers"],
                "message_preview": (
                    f"HEAT ALERT [{trigger['trigger_level'].upper()}]: "
                    f"{trigger['zone_name']}, {trigger['city']}. "
                    f"Temperature {trigger['max_temp_c']}°C (WBGT {trigger['max_wbgt_c']}°C). "
                    f"Payout: ${trigger['payout_per_worker_usd']}."
                ),
                "status": "sent",
                "delivered_at": trigger["trigger_date"],
                # Flat 0.0075 per recipient.
                "cost_estimate": round(trigger["enrolled_workers"] * 0.0075, 2),
            })
            nid += 1
            notifications.append({
                "id": f"NOT-{nid:04d}",
                "zone_id": trigger["zone_id"],
                "zone_name": trigger["zone_name"],
                "city": trigger["city"],
                "trigger_level": trigger["trigger_level"],
                "channel": "sms",
                "language": "sw",
                "recipient_count": trigger["enrolled_workers"],
                "message_preview": (
                    f"TAHADHARI YA JOTO [{trigger['trigger_level'].upper()}]: "
                    f"{trigger['zone_name']}, {trigger['city']}. "
                    f"Joto {trigger['max_temp_c']}°C. "
                    f"Malipo: ${trigger['payout_per_worker_usd']}."
                ),
                "status": "sent",
                "delivered_at": trigger["trigger_date"],
                "cost_estimate": round(trigger["enrolled_workers"] * 0.0075, 2),
            })
            nid += 1

    # Pipeline runs: 15 fabricated runs, one every 2 days going back from
    # `now` (index 0 is the most recent).
    pipeline_runs = []
    for i in range(15):
        run_date = now - timedelta(days=i * 2)
        duration = rng.uniform(30, 120)
        cost = rng.uniform(0.06, 0.18)
        # Roughly 15% of runs are marked "partial".
        status = "ok" if rng.random() > 0.15 else "partial"
        pipeline_runs.append({
            "run_id": f"run-{1000 + i}",
            "started_at": run_date.isoformat(),
            "ended_at": (run_date + timedelta(seconds=duration)).isoformat(),
            "status": status,
            "duration_s": round(duration, 1),
            # NOTE(review): hard-coded, not derived from len(ZONES).
            "zones_processed": 20,
            "triggers_found": rng.randint(0, 8),
            "notifications_sent": rng.randint(0, 16),
            "total_cost_usd": round(cost, 4),
            # Every step reports "ok" with an equal sixth of the run
            # duration, regardless of the run's overall status.
            "steps": [
                {"step": s, "status": "ok", "duration_s": round(duration / 6, 1)}
                for s in ["ingest", "heal", "index", "calibrate", "explain", "notify"]
            ],
        })

    # Aggregate statistics derived from the collections built above.
    stats = {
        "total_runs": len(pipeline_runs),
        "successful_runs": sum(1 for r in pipeline_runs if r["status"] == "ok"),
        "success_rate": round(sum(1 for r in pipeline_runs if r["status"] == "ok") / len(pipeline_runs), 2),
        "zones_monitored": len(ZONES),
        "cities": len(CITIES),
        "active_triggers": len(all_triggers),
        "total_enrolled": sum(z["enrolled_workers"] for z in zones),
        "total_cost_usd": round(sum(r["total_cost_usd"] for r in pipeline_runs), 2),
        "avg_cost_per_run_usd": round(sum(r["total_cost_usd"] for r in pipeline_runs) / len(pipeline_runs), 4),
        # pipeline_runs[0] is the run dated `now`, i.e. the latest one.
        "last_run": pipeline_runs[0]["started_at"],
        "data_sources": ["NASA POWER"],
    }

    return {
        "zones": zones,
        "indices": indices,
        "triggers": all_triggers,
        "basis_risk": basis_risk,
        "notifications": notifications,
        "pipeline_runs": pipeline_runs,
        "stats": stats,
    }


# Cached demo dataset; stays None until the first call to _get_demo().
_demo = None


def _get_demo():
    """Return the demo dataset, generating and caching it on first use."""
    global _demo
    if _demo is not None:
        return _demo
    _demo = _generate_demo_data()
    return _demo


# Shared instances created once at import time so request handlers do not
# re-instantiate them per request. The pricer is used by both the
# coverage-recommendation and calibrate endpoints; the optimizer by calibrate.
_actuarial_pricer = BurnAnalysisPricer()
_budget_optimizer = BudgetOptimizer()


# ── API Endpoints ──────────────────────────────────────────────────────────

@app.get("/health")
def health():
    """Liveness probe returning a static service descriptor."""
    descriptor = {
        "status": "ok",
        "service": "extreme-heat-risk-engine",
        "version": "1.0.0",
    }
    return descriptor


@app.get("/api/zones")
def get_zones():
    """List every demo zone together with the zone count and known cities."""
    zone_rows = _get_demo()["zones"]
    return {
        "zones": zone_rows,
        "total": len(zone_rows),
        "cities": CITIES,
    }


@app.get("/api/indices")
def get_indices():
    """Return the per-zone heat index records and how many there are."""
    index_rows = _get_demo()["indices"]
    return {
        "indices": index_rows,
        "total": len(index_rows),
    }


@app.get("/api/triggers")
def get_triggers():
    """Return all demo triggers with active and per-level counts.

    ``by_level`` always contains the keys critical, warning and watch (in
    that order); triggers with any other level are not counted there.
    """
    trigger_rows = _get_demo()["triggers"]

    active_count = 0
    level_tally = {"critical": 0, "warning": 0, "watch": 0}
    for row in trigger_rows:
        if row["status"] == "active":
            active_count += 1
        row_level = row["trigger_level"]
        if row_level in level_tally:
            level_tally[row_level] += 1

    return {
        "triggers": trigger_rows,
        "total": len(trigger_rows),
        "active": active_count,
        "by_level": level_tally,
    }


@app.get("/api/basis-risk")
def get_basis_risk():
    """Return basis-risk assessments plus their mean overall score.

    The mean is rounded to three decimals and is 0 when there are no
    assessments (the divisor is floored at 1).
    """
    assessments = _get_demo()["basis_risk"]
    count = len(assessments)
    score_sum = sum(entry["overall_score"] for entry in assessments)
    mean_score = round(score_sum / max(1, count), 3)
    return {
        "assessments": assessments,
        "total": count,
        "avg_score": mean_score,
    }


@app.get("/api/notifications")
def get_notifications():
    """Return demo notifications with a count per language (en, sw)."""
    notification_rows = _get_demo()["notifications"]

    language_tally = {"en": 0, "sw": 0}
    for row in notification_rows:
        row_language = row["language"]
        if row_language in language_tally:
            language_tally[row_language] += 1

    return {
        "notifications": notification_rows,
        "total": len(notification_rows),
        "by_language": language_tally,
    }


@app.get("/api/enrolled-workers")
def get_enrolled():
    """Return enrolled-worker counts per zone and the overall total."""
    per_zone = []
    grand_total = 0
    for zone_row in _get_demo()["zones"]:
        headcount = zone_row["enrolled_workers"]
        per_zone.append({
            "zone_id": zone_row["zone_id"],
            "zone_name": zone_row["name"],
            "city": zone_row["city"],
            "enrolled": headcount,
        })
        grand_total += headcount
    return {"by_zone": per_zone, "total_enrolled": grand_total}


@app.get("/api/pipeline/runs")
def get_pipeline_runs():
    """Return the demo pipeline run history and the number of runs."""
    run_rows = _get_demo()["pipeline_runs"]
    return {
        "runs": run_rows,
        "total": len(run_rows),
    }


@app.get("/api/pipeline/stats")
def get_pipeline_stats():
    """Return the aggregate pipeline statistics from the demo dataset."""
    dataset = _get_demo()
    return dataset["stats"]


@app.get("/api/coverage-recommendation")
def get_coverage_recommendation(payout_usd: float = 10.0):
    """Recommend coverage and budget for every zone in the demo dataset.

    No budget is supplied by the caller: each zone is priced with the
    shared pricer and the endpoint reports what the annual and weekly
    budget would need to be.

    Args:
        payout_usd: payout per worker per trigger event.

    Returns:
        dict with ``recommendation`` (programme-level totals), ``zones``
        (per-zone rows sorted by urgency, then by descending annual cost)
        and ``cost_summary`` (cost-weighted percentage split). The
        neural-model fields in each row are populated only when the
        pricer's cost breakdown contains them.
    """
    snapshot = _get_demo()
    basis_lookup = {entry["zone_id"]: entry for entry in snapshot["basis_risk"]}
    index_lookup = {entry["zone_id"]: entry for entry in snapshot["indices"]}

    def _classify_urgency(probability, level):
        """Map a trigger probability and risk level onto an urgency label."""
        if probability > 0.7 or level == "critical":
            return "critical"
        if probability > 0.4 or level in ("warning", "high"):
            return "high"
        if probability > 0.15:
            return "moderate"
        return "low"

    recs = []
    budget_total = 0.0
    at_risk_total = 0
    enrolled_total = 0

    for row in snapshot["zones"]:
        zid = row["zone_id"]
        zone_cfg = ZONE_MAP.get(zid)
        if not zone_cfg:
            # Zones unknown to the configuration are left out entirely.
            continue

        daily = index_lookup.get(zid, {}).get("daily_history", [])
        basis_entry = basis_lookup.get(zid, {})

        # Current conditions, with defaults for any missing field.
        prob = row.get("trigger_probability_7d", 0)
        temp_now = row.get("corrected_temp_c", row.get("current_temp_c", 30))
        wbgt_now = row.get("current_wbgt_c", 28)
        hot_streak = row.get("consecutive_hot_days", 0)
        level = row.get("risk_level", "normal")
        workers = row.get("enrolled_workers", 0)

        # The pricer always sees at least one enrolled worker, and an
        # empty history is passed as None.
        priced = _actuarial_pricer.price_zone(
            zone=zone_cfg,
            predicted_frequency=row.get("events_per_year", 10),
            basis_risk_score=basis_entry.get("overall_score", 0.2),
            payout_per_event=payout_usd,
            enrolled=max(workers, 1),
            climate_history=daily or None,
        )

        # Workers expected to be affected this week.
        exposed = int(workers * prob * zone_cfg.outdoor_exposure_pct)
        payout_this_week = exposed * payout_usd
        yearly_cost = priced.cost_per_worker_year * workers

        budget_total += yearly_cost
        at_risk_total += exposed
        enrolled_total += workers

        # Cost shares; the divisor is floored at 1 to avoid dividing by zero.
        breakdown = priced.cost_breakdown
        share_divisor = max(yearly_cost, 1)
        workers_share = priced.expected_annual_payouts / share_divisor
        admin_share = priced.admin_loading / share_divisor
        basis_share = priced.basis_risk_loading / share_divisor

        recs.append({
            "zone_id": zid,
            "zone_name": zone_cfg.name,
            "city": zone_cfg.city,
            "settlement_type": zone_cfg.settlement_type,
            "heat_vulnerability": zone_cfg.heat_vulnerability,
            "urgency": _classify_urgency(prob, level),
            # Current conditions
            "current_temp_c": round(temp_now, 1),
            "current_wbgt_c": round(wbgt_now, 1),
            "consecutive_hot_days": hot_streak,
            "trigger_probability_7d": round(prob, 3),
            "risk_level": level,
            # Worker impact
            "enrolled_workers": workers,
            "outdoor_exposure_pct": zone_cfg.outdoor_exposure_pct,
            "workers_at_risk_this_week": exposed,
            # Cost
            "annual_cost_per_worker": round(priced.cost_per_worker_year, 2),
            "annual_cost_total": round(yearly_cost, 0),
            "weekly_recommended_payout": round(payout_this_week, 0),
            "payout_usd_per_event": payout_usd,
            # Decomposition
            "cost_to_workers_pct": round(workers_share * 100, 1),
            "cost_admin_pct": round(admin_share * 100, 1),
            "cost_basis_risk_pct": round(basis_share * 100, 1),
            # Neural model outputs (if available)
            "neural_model": breakdown.get("neural_correction_pct") is not None,
            "neural_correction_pct": breakdown.get("neural_correction_pct"),
            "learned_frequency": breakdown.get("learned_frequency"),
            "learned_basis_risk": breakdown.get("learned_basis_risk"),
            "productivity_loss_rate": breakdown.get("productivity_loss_rate"),
            "gpd_shape_xi": breakdown.get("gpd_shape_xi"),
        })

    # Most urgent first; within one urgency level, most expensive first.
    urgency_rank = {"critical": 0, "high": 1, "moderate": 2, "low": 3}

    def _sort_key(rec):
        return (urgency_rank.get(rec["urgency"], 9), -rec["annual_cost_total"])

    recs = sorted(recs, key=_sort_key)

    weekly_total = sum(rec["weekly_recommended_payout"] for rec in recs)
    urgent_zone_count = sum(1 for rec in recs if rec["urgency"] in ("critical", "high"))
    budget_divisor = max(budget_total, 1)

    def _weighted_pct(field):
        """Cost-weighted programme-level percentage for one share field."""
        weighted = sum(rec["annual_cost_total"] * rec[field] / 100 for rec in recs)
        return round(weighted / budget_divisor * 100, 1)

    return {
        "recommendation": {
            "annual_budget_needed": round(budget_total, 0),
            "weekly_budget_needed": round(weekly_total, 0),
            "total_workers_enrolled": enrolled_total,
            "workers_at_risk_this_week": at_risk_total,
            "zones_at_risk": urgent_zone_count,
            "payout_per_event": payout_usd,
            "model_type": "burn_analysis",
        },
        "zones": recs,
        "cost_summary": {
            "total_to_workers_pct": _weighted_pct("cost_to_workers_pct"),
            "total_admin_pct": _weighted_pct("cost_admin_pct"),
            "total_basis_risk_pct": _weighted_pct("cost_basis_risk_pct"),
        },
    }


def _count_heat_runs(temps, threshold, min_run):
    """Count runs of consecutive readings strictly above ``threshold``.

    Only maximal runs that last at least ``min_run`` readings are counted.
    ``min_run`` is floored at 1 so that a zero or negative value cannot
    turn every reading at or below the threshold into an event.
    """
    min_run = max(1, min_run)
    events = 0
    run_length = 0
    for reading in temps:
        if reading > threshold:
            run_length += 1
            continue
        if run_length >= min_run:
            events += 1
        run_length = 0
    # A run that is still open at the end of the series counts too.
    if run_length >= min_run:
        events += 1
    return events


@app.get("/api/calibrate")
def calibrate(
    temp_threshold: float = 35.0,
    consecutive_days: int = 2,
    wbgt_threshold: float = 30.0,
    payout_usd: float = 10.0,
    budget_usd: float = 500000.0,
    worker_contribution_usd: float = 0.0,
):
    """Interactive calibration endpoint.

    Re-scores every zone's daily history against caller-supplied
    thresholds, prices each zone with the shared pricer and allocates the
    given budget across zones with the shared optimizer.

    Args:
        temp_threshold: a day counts towards a trigger run when its
            temperature is strictly above this value.
        consecutive_days: minimum run length (in days) that makes a
            trigger event. Values below 1 are treated as 1.
        wbgt_threshold: threshold used for the reported WBGT day counts;
            it does not influence trigger events.
        payout_usd: payout per worker per trigger event.
        budget_usd: total budget handed to the optimizer.
        worker_contribution_usd: worker contribution handed to the optimizer.

    Returns:
        dict with ``zones`` (per-zone results sorted by priority rank),
        ``summary``, ``allocation`` and ``thresholds``. ``thresholds``
        echoes the effective ``consecutive_days`` that was applied.
    """
    # A trigger run must contain at least one day. Without this floor a
    # value of 0 (or less) would count every non-hot day as an event.
    min_run_days = max(1, consecutive_days)

    demo = _get_demo()
    zones_by_id = {z["zone_id"]: z for z in demo["zones"]}
    basis_by_id = {b["zone_id"]: b for b in demo["basis_risk"]}
    indices_by_id = {idx["zone_id"]: idx for idx in demo["indices"]}

    results = []
    total_trigger_days = 0
    total_annual_cost = 0.0
    zones_triggered = 0

    for idx_data in demo["indices"]:
        zone_id = idx_data["zone_id"]
        zone = ZONE_MAP.get(zone_id)
        if not zone:
            continue

        # Extract the daily series from the zone's history.
        history = idx_data.get("daily_history", [])
        temps = [d["temp_c"] for d in history]
        wbgts = [d["wbgt_c"] for d in history]

        # Apply custom thresholds
        days_above_temp = count_trigger_days(temps, temp_threshold)
        days_above_wbgt = count_trigger_days(wbgts, wbgt_threshold)
        consec_temp = count_consecutive_days(temps, temp_threshold)
        consec_wbgt = count_consecutive_days(wbgts, wbgt_threshold)

        # Count trigger events (consecutive runs above threshold)
        trigger_events = _count_heat_runs(temps, temp_threshold, min_run_days)

        # Annualize: scale the observed count by 365 / days of history
        # (the divisor is floored at 1 for an empty history).
        events_per_year = round(trigger_events * (365 / max(len(temps), 1)), 1)

        zone_demo = zones_by_id.get(zone_id, {})
        enrolled = zone_demo.get("enrolled_workers", 0)

        annual_payout = round(events_per_year * payout_usd * enrolled, 2)
        annual_per_worker = round(events_per_year * payout_usd, 2)

        br = basis_by_id.get(zone_id, {})
        basis_score = br.get("overall_score", 0.15)

        triggered = trigger_events > 0
        if triggered:
            zones_triggered += 1
        total_trigger_days += days_above_temp
        total_annual_cost += annual_payout

        results.append({
            "zone_id": zone_id,
            "zone_name": zone.name,
            "city": zone.city,
            "settlement_type": zone.settlement_type,
            "heat_vulnerability": zone.heat_vulnerability,
            "enrolled_workers": enrolled,
            "days_above_temp": days_above_temp,
            "days_above_wbgt": days_above_wbgt,
            "consecutive_days_temp": consec_temp,
            "consecutive_days_wbgt": consec_wbgt,
            "trigger_events": trigger_events,
            "events_per_year": events_per_year,
            "annual_payout_per_worker": annual_per_worker,
            "annual_payout_total": annual_payout,
            "basis_risk_score": basis_score,
            "triggered": triggered,
        })

    total_enrolled = sum(r["enrolled_workers"] for r in results)

    # Actuarial pricing per zone
    actuarial_results = []
    for r in results:
        zone = ZONE_MAP.get(r["zone_id"])
        if not zone:
            continue
        idx_data = indices_by_id.get(r["zone_id"])
        history = idx_data.get("daily_history") if idx_data else None
        ar = _actuarial_pricer.price_zone(
            zone=zone,
            predicted_frequency=r["events_per_year"],
            basis_risk_score=r["basis_risk_score"],
            payout_per_event=payout_usd,
            enrolled=r["enrolled_workers"],
            climate_history=history,
        )
        r["actuarial_cost_per_worker"] = round(ar.cost_per_worker_year, 2)
        r["cost_breakdown"] = ar.cost_breakdown
        actuarial_results.append(ar)

    # Budget allocation
    allocation = _budget_optimizer.optimize(
        budget_usd=budget_usd,
        actuarial_results=actuarial_results,
        payout_per_event=payout_usd,
        worker_contribution=worker_contribution_usd,
    )

    # Merge allocation into zone results; zones the optimizer did not
    # return get zeroed fields and the lowest priority (99).
    alloc_map = {a.zone_id: a for a in allocation.allocations}
    for r in results:
        a = alloc_map.get(r["zone_id"])
        if a:
            r["allocated_budget"] = round(a.allocated_budget, 2)
            r["workers_covered"] = a.workers_covered
            r["coverage_pct"] = round(a.coverage_pct, 1)
            r["priority_rank"] = a.priority_rank
        else:
            r["allocated_budget"] = 0
            r["workers_covered"] = 0
            r["coverage_pct"] = 0
            r["priority_rank"] = 99

    return {
        "zones": sorted(results, key=lambda r: r.get("priority_rank", 99)),
        "summary": {
            "total_zones": len(results),
            "zones_triggered": zones_triggered,
            "total_trigger_days": total_trigger_days,
            "avg_events_per_year": round(sum(r["events_per_year"] for r in results) / max(1, len(results)), 1),
            "total_annual_cost": round(total_annual_cost, 2),
            "avg_cost_per_worker": round(total_annual_cost / max(1, total_enrolled), 2),
            "total_enrolled": total_enrolled,
            "avg_basis_risk": round(sum(r["basis_risk_score"] for r in results) / max(1, len(results)), 3),
        },
        "allocation": {
            "budget_usd": budget_usd,
            "worker_contribution_usd": worker_contribution_usd,
            "workers_covered": allocation.total_workers_covered,
            "overall_coverage_pct": round(allocation.overall_coverage_pct, 1),
            "zones_fully_funded": allocation.zones_fully_funded,
            "zones_partially_funded": allocation.zones_partially_funded,
            "zones_unfunded": allocation.zones_unfunded,
            "stretch_analysis": allocation.stretch_analysis,
        },
        "thresholds": {
            "temp_threshold": temp_threshold,
            "consecutive_days": min_run_days,
            "wbgt_threshold": wbgt_threshold,
            "payout_usd": payout_usd,
        },
    }


# ── Pipeline trigger ──────────────────────────────────────────────────────

# Mutable, module-level progress record for the background pipeline run.
_pipeline_status = {
    # Set to True when a pipeline run starts.
    "running": False,
    # Name and index of the step reported by the pipeline's progress
    # callback; reset to None / 0 at the start of each run.
    "current_step": None,
    "current_step_index": 0,
    # Number of pipeline steps.
    "total_steps": 6,
    # NOTE(review): presumably filled in when a run finishes — the code that
    # writes these two fields is not visible here; confirm.
    "last_result": None,
    "last_run": None,
}


async def _run_pipeline_async():
    """Run the full pipeline in the background, writing results to Neon.

    The blocking ``run_pipeline_sync`` call is handed to the event loop's
    default executor so the loop stays responsive. Progress and the final
    outcome are published through the module-level ``_pipeline_status``
    dict; nothing is returned. A failure of the run itself is recorded in
    ``_pipeline_status["last_result"]`` instead of being raised.

    If a run is already marked as in progress, the call logs and returns
    without starting a second, overlapping run.
    """
    global _db_conn

    # Refuse to overlap. The HTTP endpoint checks this flag too, but the
    # background task only starts after the response is sent, and the weekly
    # scheduler calls this coroutine directly -- so the check has to live
    # here as well. There is no await between this check and the assignment
    # below, so two tasks on the same event loop cannot both pass it.
    # NOTE(review): the scheduler runs on its own thread; this flag is not
    # lock-protected across threads.
    if _pipeline_status["running"]:
        logger.info("[PIPELINE] Run requested while one is already in progress; skipping")
        return

    from src.pipeline import STEP_LABELS

    _pipeline_status["running"] = True
    _pipeline_status["current_step"] = None
    _pipeline_status["current_step_index"] = 0

    # Refresh the Neon connection before the run. _db_conn is created once
    # in lifespan, but between pipeline runs (the space can sit idle for
    # hours/days) Neon's autosuspend kills the underlying socket. Without
    # this refresh the first DB write would throw, _db_write would set
    # self.db=None inside the pipeline, and every downstream write would
    # silently no-op -- the pipeline reports status=ok but Neon has no row.
    if _db_conn is not None:
        try:
            _db_conn._refresh_conn()
        except Exception as exc:
            logger.warning("[PIPELINE] DB refresh failed, reconnecting: %s", exc)
            try:
                _db_conn.close()
            except Exception:
                # Best effort: the connection is already considered dead.
                pass
            try:
                _db_conn = init_db()
            except Exception as reconnect_exc:
                logger.warning("[PIPELINE] DB reconnect failed: %s", reconnect_exc)
                _db_conn = None

    # Single source of truth for the step count shown in progress output.
    total_steps = _pipeline_status["total_steps"]

    def _progress_cb(step_name, step_index):
        """Publish the step the pipeline just entered and echo it to stdout."""
        _pipeline_status["current_step"] = step_name
        _pipeline_status["current_step_index"] = step_index
        if step_name:
            label = STEP_LABELS.get(step_name, step_name)
            print(f"[PIPELINE] Step {step_index}/{total_steps}: {label}", flush=True)

    try:
        from src.pipeline import run_pipeline_sync

        # Claude-backed stages are enabled only when an API key is configured.
        claude_enabled = bool(os.environ.get("ANTHROPIC_API_KEY"))

        # get_running_loop() is the supported way to reach the loop from
        # inside a coroutine; it never creates a loop implicitly.
        loop = asyncio.get_running_loop()
        result = await loop.run_in_executor(
            None,
            lambda: run_pipeline_sync(
                days_back=14,
                use_claude_healer=claude_enabled,
                use_claude_explainer=claude_enabled,
                delivery_channel="console",
                db=_db_conn,
                progress_callback=_progress_cb,
            ),
        )
        _pipeline_status["last_result"] = {
            "run_id": result.run_id,
            "status": result.status,
            "zones_processed": result.zones_processed,
            "triggers_found": result.triggers_found,
            "duration_s": round(result.duration_s, 1),
        }
        # Kept as a naive UTC timestamp so the serialized format that status
        # consumers already see does not change.
        _pipeline_status["last_run"] = datetime.utcnow().isoformat()
        print(f"[PIPELINE] Complete: {result.status} — {result.zones_processed} zones, {result.triggers_found} triggers, {result.duration_s:.1f}s", flush=True)
    except Exception as e:
        print(f"[PIPELINE] FAILED: {e}", flush=True)
        # The print above carries only the message; keep the traceback too.
        logger.exception("[PIPELINE] Run failed")
        _pipeline_status["last_result"] = {"status": "failed", "error": str(e)}
    finally:
        # Always release the running flag so the next trigger is accepted.
        _pipeline_status["running"] = False
        _pipeline_status["current_step"] = None
        _pipeline_status["current_step_index"] = 0


@app.post("/api/pipeline/trigger")
async def trigger_pipeline(background_tasks: BackgroundTasks):
    """Queue a pipeline run and respond immediately.

    Responds with ``already_running`` when the status flag says a run is in
    flight; otherwise schedules the run as a background task and responds
    with ``started``.
    """
    if not _pipeline_status["running"]:
        background_tasks.add_task(_run_pipeline_async)
        return {"status": "started", "message": "Pipeline run started in background"}

    return {"status": "already_running", "message": "A pipeline run is already in progress"}


@app.get("/api/pipeline/status")
def pipeline_status():
    """Report the live pipeline state: running flag, current step, last result."""
    # Hands back the shared status dict itself, not a copy.
    current_state = _pipeline_status
    return current_state


# ── Scheduled pipeline runs ──────────────────────────────────────────────

def _start_scheduler():
    """Start the weekly pipeline scheduler (runs in a background thread).

    Registers one cron job that runs ``_run_pipeline_async`` every Tuesday
    at 00:30 UTC.

    Returns:
        The started ``BackgroundScheduler``, or ``None`` when apscheduler is
        not installed or the scheduler could not be set up.
    """
    # Only the import itself decides "not installed"; any later failure is
    # reported as a start-up failure instead of being mislabelled.
    try:
        from apscheduler.schedulers.background import BackgroundScheduler
    except ImportError:
        logger.info("apscheduler not installed — no scheduled runs")
        return None

    try:
        # Pin the scheduler to UTC. Without an explicit timezone apscheduler
        # uses the host's local zone, which would make the "00:30 UTC"
        # schedule (and the log line below) wrong on a non-UTC host.
        scheduler = BackgroundScheduler(timezone="UTC")
        scheduler.add_job(
            # The job is a plain callable, so the coroutine gets its own
            # event loop via asyncio.run.
            lambda: asyncio.run(_run_pipeline_async()),
            "cron",
            day_of_week="tue",
            hour=0, minute=30,
            id="weekly_pipeline",
        )
        scheduler.start()
        logger.info("Weekly pipeline scheduler started (Tuesdays 00:30 UTC)")
        return scheduler
    except Exception as e:
        logger.warning("Scheduler failed to start: %s", e)
        return None


# ── Status page (lightweight, no React build needed) ─────────────────────

_STEP_NAMES = {
    "ingest": "Collecting climate data",
    "heal": "Fixing data issues",
    "downscale": "Adjusting for urban heat",
    "predict": "Forecasting heat danger",
    "explain": "Generating alerts",
    "review": "AI review & recommendation",
}


_PIPELINE_STEPS = ["ingest", "heal", "downscale", "predict", "explain", "review"]


def _pipeline_tracker_html() -> str:
    """Render the vertical pipeline tracker: step dots, run button, last-run line.

    Reads the module-level ``_pipeline_status`` and produces one row per
    entry in ``_PIPELINE_STEPS``:

    * while a run is in progress, steps before the current one are ``done``,
      the current one is ``active`` and the rest are ``pending``;
    * when idle, every step is ``done`` if the last result's status was
      ``ok`` or ``partial``, otherwise every step is ``pending``.

    If the reported current step is missing or is not one of the tracked
    steps, all rows are rendered as ``pending`` rather than raising.

    Returns:
        An HTML fragment (a single ``div.pipeline-tracker``).
    """
    ps = _pipeline_status
    running = ps["running"]
    current = ps.get("current_step")
    last = ps.get("last_result")

    # Resolve the active step's position once. The step name comes from the
    # pipeline's progress callback, so it may be None between steps or a
    # name this page does not track; list.index raises ValueError for both.
    try:
        current_idx = _PIPELINE_STEPS.index(current)
    except ValueError:
        current_idx = None

    # When idle, the dots reflect the last run: all done on ok/partial.
    all_done = bool(last) and last.get("status") in ("ok", "partial") and not running

    # Build step rows
    row_parts = []
    for idx, step in enumerate(_PIPELINE_STEPS):
        label = _STEP_NAMES.get(step, step)
        if running:
            if current_idx is None:
                cls = "pending"
            elif idx < current_idx:
                cls = "done"
            elif idx == current_idx:
                cls = "active"
            else:
                cls = "pending"
        elif all_done:
            cls = "done"
        else:
            cls = "pending"
        row_parts.append(
            f'<div class="step-row"><div class="step-dot {cls}"></div><span class="step-name">{label}</span></div>\n'
        )
    rows = "".join(row_parts)

    # Last run info (hidden while a run is in progress)
    last_html = ""
    if last and not running:
        status = last.get("status", "unknown")
        dur = last.get("duration_s", 0)
        zones = last.get("zones_processed", 0)
        triggers = last.get("triggers_found", 0)
        cls = "ok" if status in ("ok", "partial") else "failed"
        last_html = f'<div class="last-run"><span class="{cls}">{status.upper()}</span> — {zones} zones, {triggers} triggers, {dur:.0f}s</div>'

    btn_disabled = "disabled" if running else ""
    btn_text = "Running..." if running else "Run Pipeline"

    return f"""
    <div class="pipeline-tracker">
      <h3>Pipeline</h3>
      {rows}
      <button class="trigger-btn" {btn_disabled} onclick="fetch('/api/pipeline/trigger',{{method:'POST'}}).then(()=>location.reload())">{btn_text}</button>
      {last_html}
    </div>"""


@app.get("/", response_class=HTMLResponse)
async def status_page():
    """Serve the standalone status page for the HF Space.

    The page embeds the pipeline tracker fragment and carries a meta-refresh
    tag so the browser reloads it every 5 seconds.
    """
    # Render the tracker up front; the template below only interpolates it.
    tracker_markup = _pipeline_tracker_html()
    return f"""<!DOCTYPE html>
<html lang="en">
<head>
<meta charset="utf-8">
<meta name="viewport" content="width=device-width, initial-scale=1">
<meta http-equiv="refresh" content="5">
<title>Heat Risk Engine</title>
<style>
  * {{ margin: 0; padding: 0; box-sizing: border-box; }}
  body {{ font-family: system-ui, -apple-system, sans-serif; background: #faf8f5; color: #1a1a1a; padding: 32px; max-width: 480px; margin: 0 auto; }}
  h1 {{ font-size: 1.4rem; font-weight: 700; margin-bottom: 4px; }}
  .subtitle {{ color: #888; font-size: 0.85rem; margin-bottom: 24px; }}
  .link {{ color: #e63946; text-decoration: none; font-weight: 600; }}
  .link:hover {{ text-decoration: underline; }}
  .pipeline-tracker {{ background: #fff; border: 1px solid #e0dcd5; border-radius: 8px; padding: 16px; margin-bottom: 24px; }}
  .pipeline-tracker h3 {{ font-size: 0.8rem; font-weight: 700; text-transform: uppercase; letter-spacing: 0.5px; color: #e63946; margin-bottom: 12px; }}
  .step-row {{ display: flex; align-items: center; gap: 10px; padding: 6px 0; font-size: 0.82rem; }}
  .step-dot {{ width: 10px; height: 10px; border-radius: 50%; flex-shrink: 0; }}
  .step-dot.done {{ background: #2a9d8f; }}
  .step-dot.active {{ background: #e63946; animation: pulse 1.2s infinite; }}
  .step-dot.pending {{ background: #e0dcd5; }}
  .step-dot.failed {{ background: #e63946; }}
  .step-name {{ font-weight: 600; min-width: 110px; }}
  .step-time {{ color: #888; font-size: 0.75rem; }}
  .trigger-btn {{ display: inline-block; margin-top: 12px; padding: 8px 20px; background: #e63946; color: #fff; border: none; border-radius: 6px; font-size: 0.8rem; font-weight: 600; letter-spacing: 0.5px; text-transform: uppercase; cursor: pointer; }}
  .trigger-btn:hover {{ background: #c5303c; }}
  .trigger-btn:disabled {{ opacity: 0.5; cursor: not-allowed; }}
  .last-run {{ font-size: 0.78rem; color: #888; margin-top: 8px; }}
  .last-run .ok {{ color: #2a9d8f; font-weight: 600; }}
  .last-run .failed {{ color: #e63946; font-weight: 600; }}
  @keyframes pulse {{ 0%, 100% {{ opacity: 1; }} 50% {{ opacity: 0.4; }} }}
</style>
</head>
<body>
  <h1>Heat Risk Engine</h1>
  <p class="subtitle"><a class="link" href="https://climate-risk-engine.vercel.app" target="_blank">Open Dashboard</a></p>

  {tracker_markup}
</body>
</html>"""