Spaces:

jtlevine
/

climate-risk-engine

Paused

jtlevine Claude Opus 4.6 (1M context) committed on Mar 31

Commit

8bec5a5

1 Parent(s): 406c2d9

Frontend upgrade: heat-red identity, danger banner, callout cards, richer detail

- Section headers use heat-red (#e63946) bottom borders instead of gold
- Sidebar logo and nav active state use heat-red accent
- Sidebar gradient shifts warm (#221a18) vs Weather AI 2's neutral (#222018)
- Dashboard: danger banner when triggers are active, callout cards explaining
UHI effect and AI prediction (matches Weather AI 2's detail level)
- Stage cards have colored top borders (blue/amber/red)
- Added CSS for callout cards, danger banner, temperature value colors
- Fixed missing Thermometer import in ProgramDesigner

Co-Authored-By: Claude Opus 4.6 (1M context) <noreply@anthropic.com>

Files changed (7) hide show

frontend/src/components/Sidebar.tsx +3 -3
frontend/src/index.css +58 -2
frontend/src/pages/Dashboard.tsx +38 -5
frontend/src/pages/HeatMonitor.tsx +8 -2
frontend/src/pages/ProgramDesigner.tsx +11 -2
frontend/src/pages/Zones.tsx +5 -0
scripts/train_on_era5.py +491 -0

frontend/src/components/Sidebar.tsx CHANGED Viewed

@@ -21,12 +21,12 @@ export default function Sidebar() {
   return (
     <aside
       className="fixed top-0 left-0 z-50 h-full w-56 flex flex-col"
-      style={{ background: 'linear-gradient(180deg, #1a1a1a 0%, #222018 100%)' }}
     >
       {/* Brand */}
       <div className="flex items-center h-16 px-5 border-b border-white/10">
         <NavLink to="/" className="flex items-center gap-2.5 no-underline">
-          <div className="w-8 h-8 rounded-lg bg-gold flex items-center justify-center">
             <Thermometer size={18} className="text-white" />
           </div>
           <div>
@@ -51,7 +51,7 @@ export default function Sidebar() {
             className={({ isActive }) =>
               `flex items-center gap-3 px-3 py-2.5 rounded-lg text-sm font-sans font-medium transition-colors duration-100 ${
                 isActive
-                  ? 'bg-gold/15 text-gold'
                   : 'text-[#e0dcd5] hover:bg-white/5 hover:text-white'
               }`
             }

   return (
     <aside
       className="fixed top-0 left-0 z-50 h-full w-56 flex flex-col"
+      style={{ background: 'linear-gradient(180deg, #1a1a1a 0%, #221a18 100%)' }}
     >
       {/* Brand */}
       <div className="flex items-center h-16 px-5 border-b border-white/10">
         <NavLink to="/" className="flex items-center gap-2.5 no-underline">
+          <div className="w-8 h-8 rounded-lg flex items-center justify-center" style={{ background: '#e63946' }}>
             <Thermometer size={18} className="text-white" />
           </div>
           <div>
             className={({ isActive }) =>
               `flex items-center gap-3 px-3 py-2.5 rounded-lg text-sm font-sans font-medium transition-colors duration-100 ${
                 isActive
+                  ? 'bg-[#e63946]/15 text-[#ff6b6b]'
                   : 'text-[#e0dcd5] hover:bg-white/5 hover:text-white'
               }`
             }

frontend/src/index.css CHANGED Viewed

@@ -255,12 +255,68 @@
     transform: translateY(-3px);
   }
-  /* ── Section headers ── */
   .section-header {
     @apply uppercase text-[0.78rem] font-sans font-semibold text-warm-muted pb-2 mb-4;
     letter-spacing: 1.5px;
-    border-bottom: 2px solid #d4a019;
   }
 }
 @layer utilities {

     transform: translateY(-3px);
   }
+  /* ── Section headers — heat-red accent (distinct from Weather AI 2's gold) ── */
   .section-header {
     @apply uppercase text-[0.78rem] font-sans font-semibold text-warm-muted pb-2 mb-4;
     letter-spacing: 1.5px;
+    border-bottom: 2px solid #e63946;
   }
+  /* ── Stage card top borders (heat-themed color coding) ── */
+  .stage-card[data-stage="data"] { border-top: 3px solid #1565C0; }
+  .stage-card[data-stage="forecast"] { border-top: 3px solid #e67e22; }
+  .stage-card[data-stage="program"] { border-top: 3px solid #e63946; }
+  /* ── Heat status indicators ── */
+  .heat-pill {
+    @apply inline-flex items-center gap-1.5 rounded-full px-2.5 py-1 text-[11px] font-semibold font-sans;
+  }
+  .heat-pill.safe { background: rgba(42, 157, 143, 0.15); color: #2a9d8f; }
+  .heat-pill.caution { background: rgba(212, 160, 25, 0.15); color: #d4a019; }
+  .heat-pill.warning { background: rgba(230, 126, 34, 0.15); color: #e67e22; }
+  .heat-pill.danger { background: rgba(230, 57, 70, 0.15); color: #e63946; }
+  /* ── Callout cards (left-border accent — distinct from Health Optimizer's teal) ── */
+  .callout {
+    @apply bg-white rounded-[10px] border border-warm-border p-4;
+    border-left: 3px solid #e63946;
+  }
+  .callout.amber { border-left-color: #e67e22; }
+  .callout.blue { border-left-color: #1565C0; }
+  .callout.green { border-left-color: #2a9d8f; }
+  .callout-title {
+    @apply text-[0.82rem] font-semibold font-sans text-[#1a1a1a] mb-1;
+  }
+  .callout-body {
+    @apply text-[0.78rem] text-warm-body leading-relaxed;
+  }
+  /* ── Danger banner ── */
+  .danger-banner {
+    @apply rounded-[10px] mb-6 flex items-center gap-3;
+    background: linear-gradient(135deg, rgba(230,57,70,0.06) 0%, rgba(230,126,34,0.04) 100%);
+    border: 1px solid rgba(230,57,70,0.15);
+    padding: 14px 20px;
+  }
+  .danger-dot {
+    width: 10px; height: 10px; border-radius: 50%; flex-shrink: 0;
+    background: #e63946;
+    box-shadow: 0 0 0 3px rgba(230,57,70,0.2);
+  }
+  .danger-text {
+    @apply text-[0.82rem] font-sans font-medium;
+    color: #e63946;
+  }
+  /* ── Temperature value colors ── */
+  .temp-safe { color: #2a9d8f; }
+  .temp-caution { color: #d4a019; }
+  .temp-warning { color: #e67e22; }
+  .temp-danger { color: #d35400; }
+  .temp-extreme { color: #e63946; }
 }
 @layer utilities {

frontend/src/pages/Dashboard.tsx CHANGED Viewed

@@ -4,17 +4,21 @@ import { Satellite, Thermometer, SlidersHorizontal, ChevronDown, ChevronRight, A
 import MetricCard from '../components/MetricCard'
 import StatusBadge from '../components/StatusBadge'
 import { LoadingSpinner, ErrorState } from '../components/LoadingState'
-import { usePipelineStats, usePipelineRuns } from '../lib/api'
 export default function Dashboard() {
   const stats = usePipelineStats()
   const runs = usePipelineRuns()
   const [showRuns, setShowRuns] = useState(false)
   if (stats.isLoading) return <LoadingSpinner />
   if (stats.isError) return <ErrorState onRetry={() => stats.refetch()} />
   const s = stats.data
   return (
     <div className="animate-slide-up">
@@ -26,11 +30,22 @@ export default function Dashboard() {
         </p>
       </div>
       {/* Stage Cards */}
       <div data-tour="stage-cards" className="mb-8">
         <div className="section-header">How It Works</div>
         <div className="grid grid-cols-1 md:grid-cols-3 gap-4 items-center">
-          <Link to="/heat-monitor" className="stage-card no-underline">
             <div className="flex items-center gap-3 mb-2">
               <div className="w-9 h-9 rounded-lg bg-blue-50 flex items-center justify-center">
                 <Satellite size={18} className="text-info" />
@@ -49,7 +64,7 @@ export default function Dashboard() {
             <ArrowRight size={20} className="text-warm-border" />
           </div>
-          <Link to="/heat-monitor" className="stage-card no-underline">
             <div className="flex items-center gap-3 mb-2">
               <div className="w-9 h-9 rounded-lg bg-amber-50 flex items-center justify-center">
                 <Thermometer size={18} className="text-warning" />
@@ -68,7 +83,7 @@ export default function Dashboard() {
             <ArrowRight size={20} className="text-warm-border" />
           </div>
-          <Link to="/calibrate" className="stage-card no-underline">
             <div className="flex items-center gap-3 mb-2">
               <div className="w-9 h-9 rounded-lg bg-red-50 flex items-center justify-center">
                 <SlidersHorizontal size={18} className="text-error" />
@@ -112,12 +127,30 @@ export default function Dashboard() {
         </div>
       </div>
       {/* Run History (collapsible) */}
       <div className="mb-8">
         <button
           onClick={() => setShowRuns(!showRuns)}
           className="flex items-center gap-2 section-header cursor-pointer w-full text-left border-b-0 pb-0 mb-0 bg-transparent border-none"
-          style={{ borderBottom: '2px solid #d4a019', paddingBottom: 8, marginBottom: 16 }}
         >
           {showRuns ? <ChevronDown size={14} /> : <ChevronRight size={14} />}
           Update History

 import MetricCard from '../components/MetricCard'
 import StatusBadge from '../components/StatusBadge'
 import { LoadingSpinner, ErrorState } from '../components/LoadingState'
+import { usePipelineStats, usePipelineRuns, useTriggers } from '../lib/api'
 export default function Dashboard() {
   const stats = usePipelineStats()
   const runs = usePipelineRuns()
+  const triggers = useTriggers()
   const [showRuns, setShowRuns] = useState(false)
   if (stats.isLoading) return <LoadingSpinner />
   if (stats.isError) return <ErrorState onRetry={() => stats.refetch()} />
   const s = stats.data
+  const activeTriggers = triggers.data?.triggers ?? []
+  const criticalZones = activeTriggers.filter((t) => t.trigger_level === 'critical')
+  const dangerNames = activeTriggers.slice(0, 3).map((t) => t.zone_name)
   return (
     <div className="animate-slide-up">
         </p>
       </div>
+      {/* Danger banner — shows when there are active triggers */}
+      {activeTriggers.length > 0 && (
+        <div className="danger-banner">
+          <div className="danger-dot" />
+          <div className="danger-text">
+            <strong>{activeTriggers.length} zone{activeTriggers.length !== 1 ? 's' : ''}</strong> currently exceeding safe heat levels
+            {dangerNames.length > 0 && <> — {dangerNames.join(', ')}{activeTriggers.length > 3 ? ` and ${activeTriggers.length - 3} more` : ''}</>}
+          </div>
+        </div>
+      )}
       {/* Stage Cards */}
       <div data-tour="stage-cards" className="mb-8">
         <div className="section-header">How It Works</div>
         <div className="grid grid-cols-1 md:grid-cols-3 gap-4 items-center">
+          <Link to="/heat-monitor" className="stage-card no-underline" data-stage="data">
             <div className="flex items-center gap-3 mb-2">
               <div className="w-9 h-9 rounded-lg bg-blue-50 flex items-center justify-center">
                 <Satellite size={18} className="text-info" />
             <ArrowRight size={20} className="text-warm-border" />
           </div>
+          <Link to="/heat-monitor" className="stage-card no-underline" data-stage="forecast">
             <div className="flex items-center gap-3 mb-2">
               <div className="w-9 h-9 rounded-lg bg-amber-50 flex items-center justify-center">
                 <Thermometer size={18} className="text-warning" />
             <ArrowRight size={20} className="text-warm-border" />
           </div>
+          <Link to="/calibrate" className="stage-card no-underline" data-stage="program">
             <div className="flex items-center gap-3 mb-2">
               <div className="w-9 h-9 rounded-lg bg-red-50 flex items-center justify-center">
                 <SlidersHorizontal size={18} className="text-error" />
         </div>
       </div>
+      {/* Explainer callouts */}
+      <div className="grid grid-cols-1 md:grid-cols-2 gap-3 mb-8">
+        <div className="callout amber">
+          <div className="callout-title">Urban Heat Island Effect</div>
+          <div className="callout-body">
+            Informal settlements with tin roofs can be 3-6°C hotter than surrounding areas.
+            The system adjusts satellite readings to reflect what workers actually experience on the ground.
+          </div>
+        </div>
+        <div className="callout blue">
+          <div className="callout-title">AI-Powered Prediction</div>
+          <div className="callout-body">
+            Two AI models work together to predict dangerous heat 7 days out.
+            When one model lacks data, the system automatically falls back to the next most reliable method.
+          </div>
+        </div>
+      </div>
       {/* Run History (collapsible) */}
       <div className="mb-8">
         <button
           onClick={() => setShowRuns(!showRuns)}
           className="flex items-center gap-2 section-header cursor-pointer w-full text-left border-b-0 pb-0 mb-0 bg-transparent border-none"
+          style={{ borderBottom: '2px solid #e63946', paddingBottom: 8, marginBottom: 16 }}
         >
           {showRuns ? <ChevronDown size={14} /> : <ChevronRight size={14} />}
           Update History

frontend/src/pages/HeatMonitor.tsx CHANGED Viewed

@@ -61,7 +61,10 @@ export default function HeatMonitor() {
       <div data-tour="heat-monitor-title" className="pt-2 pb-6">
         <h1 className="page-title">Heat Monitor</h1>
         <p className="page-caption">
-          Temperature, WBGT, and heat index tracking across all zones
         </p>
       </div>
@@ -235,8 +238,11 @@ export default function HeatMonitor() {
           {/* Temperature Chart */}
           <div className="card card-body">
             <h3 className="text-sm font-semibold font-sans text-[#1a1a1a] mb-1">
-              90-Day Temperature History: {selectedData?.zone_name}
             </h3>
             <p className="text-xs text-warm-muted mb-4">
               Current:{' '}
               <span style={{ color: tempColor(selectedData?.temp_current ?? 0) }} className="font-semibold">

       <div data-tour="heat-monitor-title" className="pt-2 pb-6">
         <h1 className="page-title">Heat Monitor</h1>
         <p className="page-caption">
+          Temperature, heat stress, and feels-like conditions across all zones
+        </p>
+        <p className="text-sm text-warm-body mt-2 leading-relaxed" style={{ maxWidth: '640px' }}>
+          Live readings from satellite sensors, adjusted for how hot each neighborhood actually feels to someone working outside. Red means danger — workers in those zones face unsafe conditions today.
         </p>
       </div>
           {/* Temperature Chart */}
           <div className="card card-body">
             <h3 className="text-sm font-semibold font-sans text-[#1a1a1a] mb-1">
+              How hot has it been? 90 days in {selectedData?.zone_name}
             </h3>
+            <p className="text-xs text-warm-body mb-1 leading-relaxed">
+              The solid red line is what workers actually feel (adjusted for local conditions). The dashed line is raw satellite data before adjustment. When the red line crosses the 35°C danger mark, outdoor work becomes unsafe.
+            </p>
             <p className="text-xs text-warm-muted mb-4">
               Current:{' '}
               <span style={{ color: tempColor(selectedData?.temp_current ?? 0) }} className="font-semibold">

frontend/src/pages/ProgramDesigner.tsx CHANGED Viewed

@@ -1,4 +1,5 @@
 import { useState, useEffect, useRef } from 'react'
 import MetricCard from '../components/MetricCard'
 import { LoadingSpinner, ErrorState } from '../components/LoadingState'
 import { useCalibrateQuery } from '../lib/api'
@@ -284,8 +285,16 @@ export default function ProgramDesigner() {
               </table>
             </div>
             {sortedZones.length === 0 && (
-              <div className="text-center py-12 text-warm-muted text-sm font-sans">
-                No zones triggered at current thresholds. Try lowering the temperature threshold.
               </div>
             )}
           </>

 import { useState, useEffect, useRef } from 'react'
+import { Thermometer } from 'lucide-react'
 import MetricCard from '../components/MetricCard'
 import { LoadingSpinner, ErrorState } from '../components/LoadingState'
 import { useCalibrateQuery } from '../lib/api'
               </table>
             </div>
             {sortedZones.length === 0 && (
+              <div className="text-center py-16 font-sans">
+                <div className="text-2xl mb-3">
+                  <Thermometer size={36} className="mx-auto text-warm-border" />
+                </div>
+                <p className="text-sm font-semibold text-[#1a1a1a] mb-2">
+                  No zones reached the danger threshold
+                </p>
+                <p className="text-sm text-warm-muted leading-relaxed max-w-md mx-auto">
+                  None of the monitored zones have experienced enough consecutive hot days at this temperature to trigger an alert. Try lowering the danger temperature, reducing the consecutive hot days requirement, or increasing your budget to cover more zones.
+                </p>
               </div>
             )}
           </>

frontend/src/pages/Zones.tsx CHANGED Viewed

@@ -192,6 +192,11 @@ export default function Zones() {
       {activeTab === 'exposure' && (
         <div className="animate-tab-enter">
           {enrolled.isLoading ? (
             <LoadingSpinner message="Loading enrollment data..." />
           ) : enrolled.isError ? (

       {activeTab === 'exposure' && (
         <div className="animate-tab-enter">
+          <div className="card card-body mb-6">
+            <p className="text-sm text-warm-body leading-relaxed m-0">
+              How many workers in each zone spend their day outdoors in the heat — and how many are enrolled in the protection program. Zones with high outdoor exposure but low enrollment are the biggest coverage gaps.
+            </p>
+          </div>
           {enrolled.isLoading ? (
             <LoadingSpinner message="Loading enrollment data..." />
           ) : enrolled.isError ? (

scripts/train_on_era5.py ADDED Viewed

	@@ -0,0 +1,491 @@

+"""
+Train all ML models on real ERA5 reanalysis data.
+Steps:
+1. Fetch 2 years of ERA5 data for all 20 zones via Google ARCO Zarr store
+2. Validate data quality (coverage, temp ranges, nulls)
+3. Retrain XGBoost heat predictor on real data
+4. Retrain LSTM on real data
+5. Verify UHI model works with real ERA5 temps
+"""
+import sys
+import os
+import time
+import logging
+import math
+import numpy as np
+# Project root on sys.path
+sys.path.insert(0, os.path.dirname(os.path.dirname(os.path.abspath(__file__))))
+from config import ZONES, ZONE_MAP
+from src.ingestion.era5_fetcher import fetch_era5_sync
+from src.ingestion.models import DailyReading
+from src.indexing.heat_index import calculate_wbgt
+# Configure logging for the script run: INFO level, time-only timestamps.
+logging.basicConfig(
+    level=logging.INFO,
+    format="%(asctime)s %(name)s %(levelname)s  %(message)s",
+    datefmt="%H:%M:%S",
+)
+# Logger shared by every step function in this script.
+log = logging.getLogger("train_era5")
+# Expected temp ranges per city (max daily temps, deg C)
+# validate_data() widens each bound by 5 degrees before flagging a zone and
+# falls back to (15, 42) for any city that is not listed here.
+EXPECTED_RANGES = {
+    "Nairobi":       (18, 35),
+    "Dar es Salaam": (25, 40),
+    "Kampala":       (22, 36),
+    "Kigali":        (20, 34),
+}
+# ======================================================================
+# Step 1: Fetch ERA5 data
+# ======================================================================
+def fetch_data():
+    log.info("=" * 60)
+    log.info("STEP 1: Fetching 2 years of ERA5 data for %d zones", len(ZONES))
+    log.info("=" * 60)
+    t0 = time.time()
+    data = fetch_era5_sync(ZONES, days_back=730)
+    elapsed = time.time() - t0
+    log.info("Fetch complete in %.1f seconds", elapsed)
+    return data
+# ======================================================================
+# Step 2: Validate data quality
+# ======================================================================
+def validate_data(data: dict[str, list[DailyReading]]):
+    log.info("=" * 60)
+    log.info("STEP 2: Validating ERA5 data quality")
+    log.info("=" * 60)
+    issues = []
+    stats = {}
+    for zone in ZONES:
+        zid = zone.zone_id
+        readings = data.get(zid, [])
+        if not readings:
+            issues.append(f"{zid}: NO DATA")
+            stats[zid] = {"days": 0, "issue": "no data"}
+            continue
+        temps = [r.temp_max_c for r in readings if r.temp_max_c is not None]
+        humids = [r.humidity_pct for r in readings if r.humidity_pct is not None]
+        winds = [r.wind_speed_ms for r in readings if r.wind_speed_ms is not None]
+        if not temps:
+            issues.append(f"{zid}: all temps are null")
+            stats[zid] = {"days": len(readings), "issue": "all null temps"}
+            continue
+        t_min, t_max = min(temps), max(temps)
+        t_mean = sum(temps) / len(temps)
+        # Check physical reasonableness
+        exp_lo, exp_hi = EXPECTED_RANGES.get(zone.city, (15, 42))
+        if t_min < exp_lo - 5 or t_max > exp_hi + 5:
+            issues.append(
+                f"{zid} ({zone.city}): temp range [{t_min:.1f}, {t_max:.1f}] "
+                f"outside expected [{exp_lo-5}, {exp_hi+5}]"
+            )
+        null_count = sum(1 for r in readings if r.temp_max_c is None)
+        stats[zid] = {
+            "days": len(readings),
+            "temp_days": len(temps),
+            "temp_min": round(t_min, 1),
+            "temp_max": round(t_max, 1),
+            "temp_mean": round(t_mean, 1),
+            "humidity_mean": round(sum(humids)/len(humids), 1) if humids else None,
+            "wind_mean": round(sum(winds)/len(winds), 1) if winds else None,
+            "null_temps": null_count,
+        }
+    # Print summary
+    print("\n--- ERA5 Data Summary ---")
+    print(f"{'Zone':<12} {'City':<16} {'Days':>5} {'Temp min':>9} {'Temp max':>9} {'Temp mean':>10} {'Humidity':>9} {'Nulls':>6}")
+    print("-" * 90)
+    by_city = {}
+    for zone in ZONES:
+        s = stats.get(zone.zone_id, {})
+        days = s.get("days", 0)
+        t_lo = s.get("temp_min", "N/A")
+        t_hi = s.get("temp_max", "N/A")
+        t_mn = s.get("temp_mean", "N/A")
+        hum = s.get("humidity_mean", "N/A")
+        nulls = s.get("null_temps", "N/A")
+        print(f"{zone.zone_id:<12} {zone.city:<16} {days:>5} {t_lo:>9} {t_hi:>9} {t_mn:>10} {hum:>9} {nulls:>6}")
+        city = zone.city
+        if city not in by_city:
+            by_city[city] = []
+        by_city[city].append(s)
+    print("\n--- Per-city aggregated temp ranges ---")
+    for city, zone_stats in by_city.items():
+        all_mins = [s["temp_min"] for s in zone_stats if s.get("temp_min") is not None]
+        all_maxs = [s["temp_max"] for s in zone_stats if s.get("temp_max") is not None]
+        if all_mins and all_maxs:
+            print(f"  {city:<16}: {min(all_mins):.1f} - {max(all_maxs):.1f} C")
+    if issues:
+        print(f"\n  ISSUES ({len(issues)}):")
+        for issue in issues:
+            print(f"    - {issue}")
+    else:
+        print("\n  No data quality issues found.")
+    zones_with_data = sum(1 for s in stats.values() if s.get("days", 0) > 0)
+    assert zones_with_data == len(ZONES), f"Only {zones_with_data}/{len(ZONES)} zones have data"
+    print(f"\n  All {zones_with_data} zones have data.\n")
+    return stats
+# ======================================================================
+# Step 3: Retrain XGBoost heat predictor on real data
+# ======================================================================
+def retrain_xgboost(data: dict[str, list[DailyReading]]):
+    log.info("=" * 60)
+    log.info("STEP 3: Retraining XGBoost heat predictor on real ERA5 data")
+    log.info("=" * 60)
+    from src.prediction.heat_forecast import HeatWavePredictor, CITY_THRESHOLDS, CITY_CLIMATE
+    from src.prediction.lstm_model import CITY_CLIMATE as _  # ensure import works
+    import xgboost as xgb
+    # We replicate the training logic from HeatWavePredictor.train() but
+    # use real ERA5 temps/humidity instead of synthetic series.
+    all_X = []
+    all_y = []
+    for zone in ZONES:
+        zid = zone.zone_id
+        readings = data.get(zid, [])
+        if len(readings) < 40:
+            log.warning("Zone %s has only %d readings, skipping for XGBoost training", zid, len(readings))
+            continue
+        city = zone.city
+        threshold = CITY_THRESHOLDS.get(city, 33.0)
+        # Extract time series from real data
+        temps = []
+        humidity = []
+        for r in readings:
+            t = r.temp_max_c
+            h = r.humidity_pct
+            if t is None:
+                continue
+            temps.append(t)
+            humidity.append(h if h is not None else 65.0)
+        n_days = len(temps)
+        if n_days < 40:
+            log.warning("Zone %s has only %d valid temp readings, skipping", zid, n_days)
+            continue
+        # Compute WBGT series
+        wbgt_series = [calculate_wbgt(t, h) for t, h in zip(temps, humidity)]
+        # Labels: trigger within next 7 days (2+ consecutive above threshold)
+        labels = [0] * n_days
+        for day in range(n_days - 7):
+            window = temps[day + 1:day + 8]
+            consec = 0
+            triggered = False
+            for t in window:
+                if t > threshold:
+                    consec += 1
+                    if consec >= 2:
+                        triggered = True
+                        break
+                else:
+                    consec = 0
+            labels[day] = 1 if triggered else 0
+        # Vulnerability encoding
+        vuln_map = {"high": 1.0, "moderate": 0.5, "low": 0.0}
+        zone_vuln = vuln_map.get(zone.heat_vulnerability, 0.5)
+        rng = np.random.default_rng(42)
+        # Build features (need 30-day lookback)
+        for day in range(30, n_days - 7):
+            t_window = temps[day - 30:day + 1]
+            h_window = humidity[day - 30:day + 1]
+            w_window = wbgt_series[day - 30:day + 1]
+            current_temp = t_window[-1]
+            current_wbgt = w_window[-1]
+            current_humidity = h_window[-1]
+            # Trend: slope of last 7 days
+            x7 = np.arange(7, dtype=np.float64)
+            y7 = np.array(t_window[-7:], dtype=np.float64)
+            temp_trend = float(np.polyfit(x7, y7, 1)[0])
+            # Anomaly: current vs 30-day mean
+            temp_anomaly = current_temp - float(np.mean(t_window))
+            # Soil moisture proxy
+            soil_proxy = float(np.clip(1.0 - (temp_anomaly + 2.0) / 4.0, 0.0, 1.0))
+            # Rolling error (use neutral prior for training data)
+            rolling_err = rng.uniform(0.1, 0.5)
+            # Day-of-year encoding (use day index within 365-day cycle)
+            doy = day % 365
+            doy_sin = np.sin(2 * np.pi * doy / 365.0)
+            doy_cos = np.cos(2 * np.pi * doy / 365.0)
+            # Random hour for variety
+            hour = rng.integers(6, 19)
+            hour_sin = np.sin(2 * np.pi * hour / 24.0)
+            hour_cos = np.cos(2 * np.pi * hour / 24.0)
+            row = [
+                current_temp,
+                current_wbgt,
+                current_humidity,
+                temp_trend,
+                temp_anomaly,
+                soil_proxy,
+                rolling_err,
+                doy_sin,
+                doy_cos,
+                hour_sin,
+                hour_cos,
+                zone_vuln,
+            ]
+            all_X.append(row)
+            all_y.append(labels[day])
+    X = np.array(all_X, dtype=np.float32)
+    y = np.array(all_y, dtype=np.int32)
+    pos_rate = y.sum() / len(y) if len(y) > 0 else 0
+    log.info(
+        "XGBoost training data: %d samples, %.1f%% positive rate",
+        len(X), pos_rate * 100,
+    )
+    # Create a fresh predictor to get the model object, then retrain
+    predictor = HeatWavePredictor.__new__(HeatWavePredictor)
+    predictor.model_path = HeatWavePredictor.__init__.__defaults__[0]  # fallback
+    from pathlib import Path
+    predictor.model_path = Path(__file__).resolve().parents[1] / "models" / "heat_predictor_xgb.json"
+    predictor._rolling_errors = []
+    model = xgb.XGBClassifier(
+        n_estimators=150,
+        max_depth=5,
+        learning_rate=0.1,
+        eval_metric="logloss",
+        random_state=42,
+    )
+    # Train/validation split (temporal: first 75% train, last 25% val)
+    split = int(len(X) * 0.75)
+    X_train, X_val = X[:split], X[split:]
+    y_train, y_val = y[:split], y[split:]
+    model.fit(
+        X_train, y_train,
+        eval_set=[(X_val, y_val)],
+        verbose=False,
+    )
+    # Evaluate on validation set
+    from sklearn.metrics import roc_auc_score, precision_score, recall_score
+    val_probs = model.predict_proba(X_val)[:, 1]
+    val_preds = (val_probs > 0.5).astype(int)
+    if len(set(y_val)) > 1:
+        auroc = roc_auc_score(y_val, val_probs)
+        precision = precision_score(y_val, val_preds, zero_division=0)
+        recall = recall_score(y_val, val_preds, zero_division=0)
+    else:
+        auroc, precision, recall = 0.5, 0.0, 0.0
+    print(f"\n--- XGBoost Results (real ERA5 data) ---")
+    print(f"  Training samples:   {len(X_train)}")
+    print(f"  Validation samples: {len(X_val)}")
+    print(f"  Positive rate:      {pos_rate:.1%}")
+    print(f"  Val AUROC:          {auroc:.4f}")
+    print(f"  Val Precision:      {precision:.4f}")
+    print(f"  Val Recall:         {recall:.4f}")
+    # Save model
+    predictor.model_path.parent.mkdir(parents=True, exist_ok=True)
+    model.save_model(str(predictor.model_path))
+    log.info("XGBoost model saved to %s", predictor.model_path)
+    return {
+        "train_samples": len(X_train),
+        "val_samples": len(X_val),
+        "positive_rate": round(pos_rate, 4),
+        "val_auroc": round(auroc, 4),
+        "val_precision": round(precision, 4),
+        "val_recall": round(recall, 4),
+    }
+# ======================================================================
+# Step 4: Retrain LSTM on real data
+# ======================================================================
+def retrain_lstm(data: dict[str, list[DailyReading]]):
+    log.info("=" * 60)
+    log.info("STEP 4: Retraining LSTM on real ERA5 data")
+    log.info("=" * 60)
+    from src.prediction.lstm_model import LSTMTrainer
+    # Convert ERA5 DailyReading objects into the format the LSTM trainer expects:
+    # dict of zone_id -> list of dicts with keys: temp_max_c, humidity_pct, wind_speed_ms, city
+    zone_readings = {}
+    for zone in ZONES:
+        zid = zone.zone_id
+        readings = data.get(zid, [])
+        days = []
+        for r in readings:
+            if r.temp_max_c is None:
+                continue
+            days.append({
+                "temp_max_c": r.temp_max_c,
+                "humidity_pct": r.humidity_pct if r.humidity_pct is not None else 65.0,
+                "wind_speed_ms": r.wind_speed_ms if r.wind_speed_ms is not None else 3.0,
+                "city": zone.city,
+            })
+        if len(days) > 30:
+            zone_readings[zid] = days
+            log.info("Zone %s: %d valid readings for LSTM", zid, len(days))
+        else:
+            log.warning("Zone %s: only %d valid readings, skipping LSTM", zid, len(days))
+    log.info("Training LSTM on %d zones", len(zone_readings))
+    trainer = LSTMTrainer(epochs=50, patience=5)
+    metrics = trainer.train(zone_readings)
+    print(f"\n--- LSTM Results (real ERA5 data) ---")
+    for k, v in metrics.items():
+        print(f"  {k}: {v}")
+    return metrics
+# ======================================================================
+# Step 5: Verify UHI model with real ERA5 temps
+# ======================================================================
+def verify_uhi(data: dict[str, list[DailyReading]]):
+    log.info("=" * 60)
+    log.info("STEP 5: Verifying UHI model with real ERA5 temperatures")
+    log.info("=" * 60)
+    from src.downscaling.uhi_model import UHICorrector
+    corrector = UHICorrector()
+    results = {}
+    for zone in ZONES:
+        zid = zone.zone_id
+        readings = data.get(zid, [])
+        if not readings:
+            continue
+        # Use real ERA5 temps as grid baseline
+        real_temps = [r.temp_max_c for r in readings if r.temp_max_c is not None]
+        if not real_temps:
+            continue
+        # Sample a few real temps and apply UHI correction
+        sample_indices = np.linspace(0, len(real_temps) - 1, min(20, len(real_temps)), dtype=int)
+        deltas = []
+        corrected_temps = []
+        for idx in sample_indices:
+            grid_temp = real_temps[idx]
+            corrected, delta, conf = corrector.correct_temperature(zone, grid_temp, hour=14, month=1)
+            deltas.append(delta)
+            corrected_temps.append(corrected)
+        results[zid] = {
+            "city": zone.city,
+            "settlement": zone.settlement_type,
+            "mean_grid_temp": round(sum(real_temps) / len(real_temps), 1),
+            "mean_uhi_delta": round(sum(deltas) / len(deltas), 2),
+            "mean_corrected": round(sum(corrected_temps) / len(corrected_temps), 1),
+        }
+    print(f"\n--- UHI Verification with Real ERA5 Temps ---")
+    print(f"{'Zone':<12} {'City':<16} {'Type':<12} {'Grid T':>7} {'UHI +':>7} {'Corrected':>10}")
+    print("-" * 70)
+    for zid, r in results.items():
+        print(
+            f"{zid:<12} {r['city']:<16} {r['settlement']:<12} "
+            f"{r['mean_grid_temp']:>6.1f}C {r['mean_uhi_delta']:>+6.2f}C {r['mean_corrected']:>9.1f}C"
+        )
+    return results
+# ======================================================================
+# Main
+# ======================================================================
+def main():
+    t_start = time.time()
+    # Step 1: Fetch
+    data = fetch_data()
+    # Step 2: Validate
+    data_stats = validate_data(data)
+    # Step 3: XGBoost
+    xgb_metrics = retrain_xgboost(data)
+    # Step 4: LSTM
+    lstm_metrics = retrain_lstm(data)
+    # Step 5: UHI verification
+    uhi_results = verify_uhi(data)
+    total_time = time.time() - t_start
+    print("\n" + "=" * 60)
+    print("TRAINING COMPLETE")
+    print("=" * 60)
+    total_days = sum(
+        len([r for r in data.get(z.zone_id, []) if r.temp_max_c is not None])
+        for z in ZONES
+    )
+    print(f"  Total real data points:  {total_days} zone-days across {len(ZONES)} zones")
+    print(f"  XGBoost val AUROC:       {xgb_metrics['val_auroc']:.4f}")
+    print(f"  LSTM val AUROC:          {lstm_metrics.get('val_auroc', 'N/A')}")
+    print(f"  LSTM epochs trained:     {lstm_metrics.get('epochs_trained', 'N/A')}")
+    print(f"  LSTM final val loss:     {lstm_metrics.get('val_loss', 'N/A')}")
+    print(f"  Total time:              {total_time:.1f}s")
+    print()
+if __name__ == "__main__":
+    main()