Spaces:

Syntrex
/

2026_MLB_Model

Running

2026_MLB_Model

File size: 71,141 Bytes

"""
analytics/props_mapper.py

Maps sportsbook HR prop rows to the shared HR probability engine and computes
edge for the Props page.
"""

from __future__ import annotations

import math
from typing import Any, Callable

import pandas as pd

from analytics.model_voice import build_hr_model_voice, build_strikeout_model_voice
from analytics.no_vig_props import american_to_implied_prob, compute_bet_ev, compute_edge
from data.mlb_starters import lookup_batter_current_team, lookup_pitchers_for_game
from data.odds_name_map import map_odds_name_to_model_name
from models.hr_probability_engine import build_hr_probability_result
from models.pitcher_adjustment import build_pitcher_feature_row
from visualization.cards.player_identity import normalize_for_matching, to_canonical_name


def build_strikeout_probability_result_v2(*args, **kwargs):
    """Forward a call to the v2 strikeout probability engine.

    The engine is imported when this wrapper is called rather than when this
    module is imported (presumably to defer import cost or avoid a circular
    import -- TODO confirm). All positional and keyword arguments are passed
    through unchanged and the engine's return value is returned as-is.
    """
    from models.strikeout_probability_engine_v2 import (
        build_strikeout_probability_result_v2 as engine_entry_point,
    )

    engine_result = engine_entry_point(*args, **kwargs)
    return engine_result


def _build_statcast_name_index(statcast_df: pd.DataFrame) -> dict[str, str]:
    """Build a lookup from normalized name keys to Statcast ``player_name`` values.

    For every distinct ``player_name`` (stringified) up to three keys are
    registered, all pointing back at the name exactly as it appears in the
    frame:

    * the odds-to-model mapping of the name itself;
    * the odds-to-model mapping of its canonical form, when that form differs;
    * the ``normalize_for_matching`` form of the canonical name, when non-empty.

    The first name to claim a key keeps it. Returns an empty dict when the
    frame is empty or has no ``player_name`` column.
    """
    lookup: dict[str, str] = {}
    if statcast_df.empty or "player_name" not in statcast_df.columns:
        return lookup

    for raw_name in statcast_df["player_name"].astype(str).unique():
        lookup.setdefault(map_odds_name_to_model_name(raw_name), raw_name)

        canonical_name = to_canonical_name(raw_name)
        if canonical_name == raw_name:
            # Already canonical: the extra keys below would add nothing new.
            continue

        lookup.setdefault(map_odds_name_to_model_name(canonical_name), raw_name)

        stripped_key = normalize_for_matching(canonical_name)
        if stripped_key:
            lookup.setdefault(stripped_key, raw_name)

    return lookup


def _build_game_context_from_row(row: Any) -> dict[str, Any]:
    """Collect the game-level fields of a prop row into a plain dict.

    Text fields are taken from the first truthy value among their candidate
    keys, stringified and stripped, with "" when none is set. The lineup slot
    and team total (and their ``*_source`` companions) are copied verbatim via
    ``row.get``.

    Args:
        row: Any mapping-like object exposing ``.get(key)``.
    """

    def _first_text(*keys: str) -> str:
        # First truthy value among ``keys`` as stripped text, else "".
        for key in keys:
            candidate = row.get(key)
            if candidate:
                return str(candidate).strip()
        return ""

    context: dict[str, Any] = {
        "away_team": _first_text("away_team"),
        "home_team": _first_text("home_team"),
        "venue": _first_text("venue", "stadium", "venue_name", "park"),
        "game_datetime_utc": _first_text("game_datetime_utc", "commence_time"),
        "game_date": _first_text("game_date"),
    }
    for passthrough_key in (
        "lineup_slot",
        "lineup_slot_source",
        "team_total",
        "team_total_source",
    ):
        context[passthrough_key] = row.get(passthrough_key)
    return context


def _normalize_team_name(value: Any) -> str:
    """Return ``value`` as lower-case text with whitespace trimmed and collapsed.

    Falsy input (``None``, ``""``, ``0``) yields ``""``.
    """
    trimmed = str(value or "").strip()
    tokens = trimmed.lower().split()
    return " ".join(tokens)


def _to_display_name(value: Any) -> str:
    """Return ``value`` as stripped text, or ``""`` when it is falsy."""
    if not value:
        return ""
    return str(value).strip()


def _normalize_person_name(value: Any) -> str:
    """Return the matching key for a person name.

    The value is stringified ("" when falsy) and stripped, passed through
    ``to_canonical_name`` and then through ``normalize_for_matching``.
    """
    raw_text = str(value or "").strip()
    canonical = to_canonical_name(raw_text)
    return normalize_for_matching(canonical)


def _names_match(left: Any, right: Any) -> bool:
    """Return True when both names normalize to the same non-empty key."""
    left_key = _normalize_person_name(left)
    right_key = _normalize_person_name(right)
    if not left_key or not right_key:
        # A blank name never matches anything, not even another blank name.
        return False
    return bool(left_key == right_key)


def _compute_verdict(
    bet_ev: float | None,
    edge: float | None,
    confidence_score: float | None,
    is_modeled: bool,
) -> str:
    """Classify a prop as ``"tracked"``, ``"bet"``, ``"watch"`` or ``"pass"``.

    Unmodeled props are always ``"tracked"``. For modeled props a missing EV
    or edge counts as -9.0 and a missing confidence as 0.0; any value that
    cannot be converted to ``float`` produces ``"pass"``.

    Tiers, checked strictest first:
        bet:   EV >= 0.05,  edge >= 0.01,  confidence >= 62
        watch: EV >= -0.03, edge >= -0.01, confidence >= 45
    """
    if not is_modeled:
        return "tracked"

    try:
        ev_value = float(-9.0 if bet_ev is None else bet_ev)
        edge_value = float(-9.0 if edge is None else edge)
        confidence = float(0.0 if confidence_score is None else confidence_score)
    except Exception:
        return "pass"

    # (verdict, minimum EV, minimum edge, minimum confidence)
    tiers = (
        ("bet", 0.05, 0.01, 62),
        ("watch", -0.03, -0.01, 45),
    )
    for verdict, min_ev, min_edge, min_confidence in tiers:
        if ev_value >= min_ev and edge_value >= min_edge and confidence >= min_confidence:
            return verdict
    return "pass"


def _confidence_display_remap(raw_score: float | None) -> float | None:
    """Map a raw confidence score onto the 1-100 display scale.

    Scores at or below 40 are shown unchanged; the portion above 40 is
    stretched by a factor of 1.45. The result is clamped to ``[1.0, 100.0]``.

    Args:
        raw_score: Raw confidence score, or anything ``float()`` accepts.

    Returns:
        The display score, or ``None`` when ``raw_score`` is ``None``, cannot
        be converted to a float, or is NaN.
    """
    try:
        raw = float(raw_score)
    except (TypeError, ValueError, OverflowError):
        return None

    # NaN must be rejected explicitly: every comparison with NaN is False, so
    # min(100.0, nan) returns 100.0 and a missing score would otherwise be
    # displayed as maximum confidence.
    if math.isnan(raw):
        return None

    if raw <= 40.0:
        return max(1.0, min(100.0, raw))
    return max(1.0, min(100.0, 40.0 + ((raw - 40.0) * 1.45)))


def _normalize_confidence_components(value: Any) -> list[dict[str, Any]]:
    """Clean a list of confidence components into a uniform shape.

    Anything that is not a list yields ``[]``. Entries that are not dicts, or
    whose label is blank, are dropped. Each surviving entry becomes
    ``{"label", "value", "direction"}`` where ``value`` is rounded to one
    decimal (0.0 when missing or non-numeric) and ``direction`` is a
    lower-case string or ``None`` when blank.
    """
    if not isinstance(value, list):
        return []

    def _clean(entry: Any) -> dict[str, Any] | None:
        # Normalized component, or None when the entry must be dropped.
        if not isinstance(entry, dict):
            return None
        label = str(entry.get("label") or "").strip()
        if not label:
            return None
        try:
            magnitude = float(entry.get("value") or 0.0)
        except Exception:
            magnitude = 0.0
        direction = str(entry.get("direction") or "").strip().lower()
        return {
            "label": label,
            "value": round(magnitude, 1),
            "direction": direction or None,
        }

    cleaned_entries = (_clean(entry) for entry in value)
    return [component for component in cleaned_entries if component is not None]


def _select_confidence_primary_driver(
    penalties: list[dict[str, Any]],
    bonuses: list[dict[str, Any]],
) -> dict[str, Any] | None:
    """Pick the single component that best explains the confidence score.

    The largest positive penalty wins; if no penalty has a positive value the
    largest positive bonus is used. Returns ``None`` when neither list has a
    component with a value above zero.
    """

    def _magnitude(component: dict[str, Any]) -> float:
        return float(component.get("value") or 0.0)

    positive_penalties = [entry for entry in penalties if _magnitude(entry) > 0.0]
    positive_bonuses = [entry for entry in bonuses if _magnitude(entry) > 0.0]

    # Penalties take precedence over bonuses.
    for pool in (positive_penalties, positive_bonuses):
        if pool:
            return max(pool, key=_magnitude)
    return None


def _build_strikeout_confidence_payload(
    probability_result: dict[str, Any],
) -> dict[str, Any]:
    """Assemble the confidence fields for a strikeout prop.

    Reads the ``confidence_*`` keys of ``probability_result`` and returns a
    dict holding the raw and display scores (rounded to one decimal), the raw
    and display buckets, the normalized bonus/penalty components, the primary
    driver with its label, the source (default ``"strikeout_v2_live"``) and at
    most five reasons.

    The raw score comes from ``confidence_score_raw``, falling back to
    ``confidence_score`` only when the former key is absent. A score that is
    missing, not numeric, or NaN is reported as ``None`` for both the raw and
    display scores, and the display bucket is then ``None`` as well.

    Display buckets: ``"high"`` at 75 and above, ``"medium"`` at 55 and above,
    otherwise ``"low"``.
    """
    source = str(probability_result.get("confidence_source") or "strikeout_v2_live")
    raw_score = probability_result.get(
        "confidence_score_raw",
        probability_result.get("confidence_score"),
    )
    raw_bucket = probability_result.get("confidence_bucket")
    reasons = list(probability_result.get("confidence_reasons") or [])
    bonuses = _normalize_confidence_components(
        probability_result.get("confidence_component_bonuses")
    )
    penalties = _normalize_confidence_components(
        probability_result.get("confidence_component_penalties")
    )

    # A malformed score must not take the whole payload down, and NaN must not
    # reach the remap/bucket logic where it would compare as neither high nor
    # low; both are treated as "no score".
    try:
        raw_score_float = float(raw_score) if raw_score is not None else None
    except (TypeError, ValueError, OverflowError):
        raw_score_float = None
    if raw_score_float is not None and math.isnan(raw_score_float):
        raw_score_float = None

    display_score = _confidence_display_remap(raw_score_float)
    if display_score is None:
        display_bucket = None
    elif display_score >= 75:
        display_bucket = "high"
    elif display_score >= 55:
        display_bucket = "medium"
    else:
        display_bucket = "low"

    primary_driver = _select_confidence_primary_driver(penalties, bonuses)
    summary_label = str((primary_driver or {}).get("label") or "").strip() or None

    return {
        "confidence_score_raw": round(raw_score_float, 1) if raw_score_float is not None else None,
        "confidence_score_display": round(display_score, 1) if display_score is not None else None,
        "confidence_source": source,
        "confidence_component_bonuses": bonuses,
        "confidence_component_penalties": penalties,
        "confidence_primary_driver": primary_driver,
        "confidence_summary_label": summary_label,
        "confidence_bucket_raw": raw_bucket,
        "confidence_bucket_display": display_bucket,
        "confidence_reasons": reasons[:5],
    }


def _classify_strikeout_probability_status(
    *,
    fair_prob: float | None,
    implied: float | None,
    pitcher_name: str,
    probability_result: dict[str, Any],
) -> str:
    """Return a status code describing the outcome of modeling a strikeout prop.

    With a fair probability the status is ``"modeled_ok"``, or
    ``"missing_implied_prob"`` when no implied probability exists. Without
    one, the first matching cause is reported:

    * ``"missing_pitcher_context"`` - blank pitcher name, or the result's
      ``pitcher_resolution_status`` is ``"unresolved"``;
    * ``"projected_starter_mismatch"`` - the result's
      ``projected_starter_match_status`` is ``"resolved_pitcher_mismatch"``;
    * ``"empty_probability_result"`` - none of the above.
    """

    def _flag(key: str) -> str:
        # Case- and whitespace-insensitive view of a status field.
        return str(probability_result.get(key) or "").strip().lower()

    if fair_prob is not None:
        if implied is None:
            return "missing_implied_prob"
        return "modeled_ok"

    has_pitcher = bool(str(pitcher_name or "").strip())
    if not has_pitcher or _flag("pitcher_resolution_status") == "unresolved":
        return "missing_pitcher_context"
    if _flag("projected_starter_match_status") == "resolved_pitcher_mismatch":
        return "projected_starter_mismatch"
    return "empty_probability_result"


def _classify_hr_probability_status(
    *,
    threshold_int: int,
    is_modeled: bool,
    model_prob: float | None,
    implied: float | None,
    probability_result: dict[str, Any],
    statcast_df: pd.DataFrame | None,
    pitcher_name: str,
) -> str:
    """Return a status code describing the outcome of modeling an HR prop.

    Checks run in this order and the first match wins:

    1. ``"unmodeled_ladder"`` - threshold is not 1, or the row is not modeled.
    2. With a model probability: ``"modeled_ok"``, or
       ``"missing_implied_prob"`` when no implied probability exists.
    3. ``"missing_baseline"`` - no Statcast frame, an empty one, or the result
       has no ``baseline_hr_prob``.
    4. ``"missing_implied_prob"`` - no implied probability.
    5. ``"missing_pitcher_context"`` - blank pitcher name, a
       ``pitcher_resolution_status`` of ``pitcher_missing`` / ``unresolved`` /
       ``matchup_incomplete``, or ``skipped_layers`` mentioning
       ``pitcher_missing`` or ``matchup_incomplete``.
    6. ``"empty_probability_result"`` - a baseline exists but no final
       probability was produced and none of the causes above applies.
    """
    if threshold_int != 1 or not is_modeled:
        return "unmodeled_ladder"
    if model_prob is not None:
        return "modeled_ok" if implied is not None else "missing_implied_prob"

    if statcast_df is None or statcast_df.empty:
        return "missing_baseline"
    if probability_result.get("baseline_hr_prob") is None:
        return "missing_baseline"

    if implied is None:
        return "missing_implied_prob"
    if not str(pitcher_name or "").strip():
        return "missing_pitcher_context"

    pitcher_status = str(probability_result.get("pitcher_resolution_status") or "").strip().lower()
    if pitcher_status in {"pitcher_missing", "unresolved", "matchup_incomplete"}:
        return "missing_pitcher_context"

    # skipped_layers is stringified before the substring test, so both a
    # delimited string and a list of layer names are handled.
    skipped_layers = str(probability_result.get("skipped_layers") or "").strip().lower()
    if "pitcher_missing" in skipped_layers or "matchup_incomplete" in skipped_layers:
        return "missing_pitcher_context"

    # The baseline is known to be present here, so this is the only remaining
    # outcome.
    return "empty_probability_result"


def _infer_batter_team(
    batter_name: str,
    batter_statcast_df: pd.DataFrame,
) -> str:
    """Infer a batter's team from the rows recorded for them in a Statcast frame.

    Rows are selected by normalized ``player_name``. Team observations are
    gathered from two places: the ``away_team`` value of rows whose
    ``inning_topbot`` contains "top" and the ``home_team`` value of rows whose
    ``inning_topbot`` matches "bot|bottom" (only when all three columns
    exist), plus any ``team`` / ``batter_team`` / ``team_name`` columns.

    Returns:
        The most frequent normalized team name (the first of
        ``Series.mode()`` on a tie), or ``""`` when the frame is missing or
        empty, the name is blank, the ``player_name`` column is absent, or
        nothing was observed.
    """
    if batter_statcast_df is None or batter_statcast_df.empty:
        return ""
    if not batter_name or "player_name" not in batter_statcast_df.columns:
        return ""

    target_key = _normalize_person_name(batter_name)
    name_keys = batter_statcast_df["player_name"].astype(str).map(_normalize_person_name)
    matches = batter_statcast_df[name_keys == target_key].copy()
    if matches.empty:
        return ""

    observed: list[str] = []

    if {"inning_topbot", "home_team", "away_team"}.issubset(matches.columns):
        inning_half = matches["inning_topbot"].fillna("").astype(str).str.lower()
        # (pattern for the inning half, column credited to the batter)
        half_to_column = (("top", "away_team"), ("bot|bottom", "home_team"))
        for pattern, team_column in half_to_column:
            half_mask = inning_half.str.contains(pattern)
            if half_mask.any():
                observed.extend(
                    matches.loc[half_mask, team_column].dropna().astype(str).tolist()
                )

    for team_column in ("team", "batter_team", "team_name"):
        if team_column in matches.columns:
            observed.extend(matches[team_column].dropna().astype(str).tolist())

    cleaned = [_normalize_team_name(entry) for entry in observed if str(entry).strip()]
    if not cleaned:
        return ""
    return pd.Series(cleaned).mode().iloc[0]


def _resolve_batter_team(
    row: Any,
    batter_name: str,
    batter_statcast_df: pd.DataFrame,
) -> tuple[str, str]:
    """Work out which of the two teams in the game the batter plays for.

    Sources are tried in order and the first hit wins:

    1. a team column on the prop row itself (source ``row_<key>``);
    2. the team inferred from the batter's 2026 Statcast rows
       (``current_season_statcast``), when a ``source_season`` column exists;
    3. the team inferred from all of the batter's Statcast rows
       (``historical_statcast``);
    4. ``lookup_batter_current_team`` (``mlb_roster_lookup``).

    Statcast-inferred teams are accepted only when they equal the row's away
    or home team after normalization; anything else falls through to the
    roster lookup rather than returning a team that is not in this game.

    Returns:
        ``(team, source)``; ``("", "unresolved")`` when every source fails.
    """
    team_from_row, row_source = _resolve_batter_team_from_row_context(
        row=row,
        batter_name=batter_name,
    )
    if team_from_row:
        return (team_from_row, row_source)

    away_team = _to_display_name(row.get("away_team"))
    home_team = _to_display_name(row.get("home_team"))
    away_norm = _normalize_team_name(away_team)
    home_norm = _normalize_team_name(home_team)

    def _game_side(team_norm: str) -> str:
        # Display name of the game side matching ``team_norm``, else "".
        if team_norm == away_norm and away_team:
            return away_team
        if team_norm == home_norm and home_team:
            return home_team
        return ""

    if (
        batter_statcast_df is not None
        and not batter_statcast_df.empty
        and batter_name
        and "player_name" in batter_statcast_df.columns
    ):
        target_key = _normalize_person_name(batter_name)
        name_keys = batter_statcast_df["player_name"].astype(str).map(_normalize_person_name)
        player_rows = batter_statcast_df[name_keys == target_key].copy()

        if not player_rows.empty:
            # (frame to infer from, source label), most trustworthy first.
            attempts: list[tuple[pd.DataFrame, str]] = []
            if "source_season" in player_rows.columns:
                seasons = pd.to_numeric(player_rows["source_season"], errors="coerce")
                attempts.append((player_rows[seasons == 2026].copy(), "current_season_statcast"))
            attempts.append((player_rows, "historical_statcast"))

            for frame, source_label in attempts:
                inferred_team = _infer_batter_team(
                    batter_name=batter_name,
                    batter_statcast_df=frame,
                )
                if not inferred_team:
                    continue
                matched_side = _game_side(inferred_team)
                if matched_side:
                    return (matched_side, source_label)
                # The inferred team is in neither dugout (the player has
                # presumably changed teams); keep looking instead of
                # returning a stale team name.

    # Last resort: roster lookup restricted to the two teams in this game.
    if batter_name:
        roster_team = lookup_batter_current_team(batter_name, away_team or "", home_team or "")
        if roster_team:
            return (roster_team, "mlb_roster_lookup")

    return ("", "unresolved")


def _resolve_batter_team_from_row_context(
    row: Any,
    batter_name: str,
) -> tuple[str, str]:
    """Resolve the batter's team from team columns carried on the prop row.

    The ``batter_team``, ``player_team``, ``team`` and ``team_name`` keys are
    checked in that order. A value is accepted only when, after
    normalization, it equals the row's away or home team (away is tested
    first) and that team name is non-empty.

    ``batter_name`` is accepted for signature compatibility but is not used.

    Returns:
        ``(team display name, "row_<key>")`` on a hit, else ``("", "unknown")``.
    """
    away_team = _to_display_name(row.get("away_team"))
    home_team = _to_display_name(row.get("home_team"))
    game_sides = (
        (_normalize_team_name(away_team), away_team),
        (_normalize_team_name(home_team), home_team),
    )

    for key in ("batter_team", "player_team", "team", "team_name"):
        candidate_norm = _normalize_team_name(_to_display_name(row.get(key)))
        for side_norm, side_display in game_sides:
            if candidate_norm == side_norm and side_display:
                return (side_display, f"row_{key}")

    return ("", "unknown")


def _infer_lineup_slot(
    batter_name: str,
    batter_statcast_df: pd.DataFrame,
) -> tuple[int | None, str]:
    """Infer a batter's lineup slot from batting-order columns in a frame.

    Rows are selected by a case-insensitive exact match on ``player_name``.
    The ``lineup_slot``, ``lineup_position``, ``batting_order`` and
    ``bat_order`` columns are tried in that order; the first one holding at
    least one numeric value between 1 and 9 supplies the answer, which is the
    most frequent value after rounding.

    Returns:
        ``(slot, "projected")`` on success, otherwise ``(None, "unknown")``.
    """
    unknown: tuple[int | None, str] = (None, "unknown")

    if batter_statcast_df is None or batter_statcast_df.empty:
        return unknown
    if not batter_name or "player_name" not in batter_statcast_df.columns:
        return unknown

    folded_names = batter_statcast_df["player_name"].astype(str).str.casefold()
    player_rows = batter_statcast_df[folded_names == batter_name.casefold()].copy()
    if player_rows.empty:
        return unknown

    for column in ("lineup_slot", "lineup_position", "batting_order", "bat_order"):
        if column not in player_rows.columns:
            continue
        slots = pd.to_numeric(player_rows[column], errors="coerce").dropna()
        in_range = (slots >= 1) & (slots <= 9)
        slots = slots[in_range]
        if slots.empty:
            continue
        most_common = slots.round().astype(int).mode()
        if not most_common.empty:
            return (int(most_common.iloc[0]), "projected")

    return unknown


def _resolve_pitcher_hand(
    pitcher_name: str,
    pitcher_statcast_df: pd.DataFrame | None,
) -> tuple[str, str]:
    """Look up a pitcher's throwing hand.

    Two sources are tried in order:

    1. the ``p_throws`` value of the first row whose normalized
       ``player_name`` equals the pitcher's (source ``"statcast_direct"``);
    2. the ``p_throws`` field of ``build_pitcher_feature_row`` (source
       ``"pitcher_feature_row"``). Any exception raised while building the
       feature row is treated as "no hand available".

    Missing values (``None``, NaN/NA, blank, or the stringified sentinels
    "nan"/"None") are never returned as a hand.

    Returns:
        ``(hand, source)`` with ``hand`` upper-cased, or
        ``("", "unavailable")`` when no hand could be determined.
    """

    def _clean_hand(value: Any) -> str:
        # Upper-cased hand, or "" for any representation of "missing".
        if value is None:
            return ""
        # NaN is truthy, so ``value or ""`` alone would let it through and it
        # would be stringified to "NAN".
        if not isinstance(value, str) and pd.isna(value):
            return ""
        hand = str(value or "").strip().upper()
        return "" if hand in {"NAN", "NONE"} else hand

    if not pitcher_name or pitcher_statcast_df is None or pitcher_statcast_df.empty:
        return ("", "unavailable")

    if {"player_name", "p_throws"}.issubset(pitcher_statcast_df.columns):
        target_key = _normalize_person_name(pitcher_name)
        name_keys = pitcher_statcast_df["player_name"].astype(str).map(_normalize_person_name)
        direct_rows = pitcher_statcast_df[name_keys == target_key]
        if not direct_rows.empty:
            direct_hand = _clean_hand(direct_rows.iloc[0].get("p_throws"))
            if direct_hand:
                return (direct_hand, "statcast_direct")

    try:
        pitcher_row = build_pitcher_feature_row(
            statcast_df=pitcher_statcast_df,
            pitcher_name=pitcher_name,
        )
        hand = _clean_hand(pitcher_row.get("p_throws"))
    except Exception:
        # Best effort: the hand is optional context, so a failing feature
        # build degrades to "unavailable" instead of propagating.
        return ("", "unavailable")
    return (hand, "pitcher_feature_row" if hand else "unavailable")


def _resolve_team_total(
    row: Any,
    batter_team: str,
) -> tuple[float | None, str]:
    """Find the implied team total for the batter's team on a prop row.

    Lookup order:

    1. ``team_total``, ``implied_team_total``, ``batter_team_total``;
    2. ``away_team_total`` / ``away_implied_total`` when ``batter_team``
       matches the row's away team after normalization;
    3. ``home_team_total`` / ``home_implied_total`` when it matches the home
       team.

    A candidate is accepted only when it converts to a finite float, so
    ``None``, blanks, non-numeric text, NaN (in any spelling) and infinities
    are all skipped.

    Returns:
        ``(total, "projected")`` for the first usable value, otherwise
        ``(None, "unknown")``.
    """

    def _first_valid_total(keys: tuple[str, ...]) -> float | None:
        # First value among ``keys`` that parses to a finite float.
        for key in keys:
            value = row.get(key)
            if value is None:
                continue
            try:
                total = float(value)
            except (TypeError, ValueError, OverflowError):
                continue
            if math.isfinite(total):
                return total
        return None

    total = _first_valid_total(("team_total", "implied_team_total", "batter_team_total"))
    if total is not None:
        return (total, "projected")

    batter_team_norm = _normalize_team_name(batter_team)
    if batter_team_norm:
        side_keys = (
            (_normalize_team_name(row.get("away_team")), ("away_team_total", "away_implied_total")),
            (_normalize_team_name(row.get("home_team")), ("home_team_total", "home_implied_total")),
        )
        for side_norm, keys in side_keys:
            if batter_team_norm != side_norm:
                continue
            total = _first_valid_total(keys)
            if total is not None:
                return (total, "projected")

    return (None, "unknown")


def _resolve_pitcher_name(
    row: Any,
    batter_team: str,
    probable_starters: dict | None,
) -> tuple[str, str, str]:
    """Determine the opposing pitcher for a batter prop row.

    Returns:
        ``(pitcher name, source, status)`` where status is ``"resolved"`` or
        ``"unresolved"``. Sources, in the order they are considered:

        * ``row_explicit`` - the row names a pitcher and there is no starters
          map or the matchup is incomplete, so nothing can be cross-checked;
        * ``probable_starters_unavailable`` / ``matchup_incomplete`` /
          ``matchup_not_found`` - unresolved, with the reason;
        * ``row_explicit_validated`` - the row's pitcher matches one of the
          game's probable starters;
        * ``probable_starters_matchup`` - the starter of the team opposing
          ``batter_team``;
        * ``probable_starters_single_side`` - only one starter is known;
        * ``row_explicit_unvalidated`` - the row's pitcher, unconfirmed;
        * ``batter_team_unresolved`` - nothing worked.
    """
    explicit_pitcher = ""
    for key in ("pitcher_name", "pitcher", "opposing_pitcher"):
        candidate = row.get(key)
        if candidate:
            explicit_pitcher = str(candidate).strip()
            break

    away_team = str(row.get("away_team") or "").strip()
    home_team = str(row.get("home_team") or "").strip()
    matchup_known = bool(away_team and home_team)

    if explicit_pitcher and (not matchup_known or not probable_starters):
        return (explicit_pitcher, "row_explicit", "resolved")
    if not probable_starters:
        return ("", "probable_starters_unavailable", "unresolved")
    if not matchup_known:
        return ("", "matchup_incomplete", "unresolved")

    starters = lookup_pitchers_for_game(
        away_team=away_team,
        home_team=home_team,
        starters_map=probable_starters,
    )
    if not starters:
        return ("", "matchup_not_found", "unresolved")

    away_norm = _normalize_team_name(away_team)
    home_norm = _normalize_team_name(home_team)
    batter_team_norm = _normalize_team_name(batter_team)
    home_pitcher = str(starters.get("home_pitcher") or "").strip()
    away_pitcher = str(starters.get("away_pitcher") or "").strip()

    if explicit_pitcher and (
        _names_match(home_pitcher, explicit_pitcher)
        or _names_match(away_pitcher, explicit_pitcher)
    ):
        return (explicit_pitcher, "row_explicit_validated", "resolved")

    if batter_team_norm:
        # The batter faces the other side's starter.
        # NOTE(review): the starter returned here may be "" while the status
        # still says "resolved" -- confirm callers handle a blank name.
        if batter_team_norm == away_norm:
            return (home_pitcher, "probable_starters_matchup", "resolved")
        if batter_team_norm == home_norm:
            return (away_pitcher, "probable_starters_matchup", "resolved")

    if bool(home_pitcher) != bool(away_pitcher):
        # Exactly one starter is known; use it.
        return (home_pitcher or away_pitcher, "probable_starters_single_side", "resolved")
    if explicit_pitcher:
        return (explicit_pitcher, "row_explicit_unvalidated", "resolved")
    return ("", "batter_team_unresolved", "unresolved")


def _lookup_projected_starter_context(
    row: Any,
    probable_starters: dict | None,
) -> dict[str, Any]:
    """Describe the projected starters for the game on a prop row.

    Always returns a dict with the same eight keys: the projected home/away
    pitcher names and their sources, ``projected_starter_available``,
    ``projected_starter_source``, ``starter_cache_source`` and
    ``fallback_used``.

    When no starters map is given both source fields read
    ``"probable_starters_unavailable"``; when a team name is missing they read
    ``"matchup_incomplete"``. When the game is not in the map,
    ``projected_starter_source`` becomes ``"matchup_not_found"``. Otherwise
    the fields are filled from the entry returned by
    ``lookup_pitchers_for_game``, with both source fields defaulting to
    ``"probable_starters_matchup"``.
    """
    away_team = str(row.get("away_team") or "").strip()
    home_team = str(row.get("home_team") or "").strip()

    initial_source = (
        "matchup_incomplete" if probable_starters else "probable_starters_unavailable"
    )
    context: dict[str, Any] = {
        "projected_home_pitcher": "",
        "projected_away_pitcher": "",
        "projected_starter_available": False,
        "projected_starter_source": initial_source,
        "projected_home_pitcher_source": "",
        "projected_away_pitcher_source": "",
        "starter_cache_source": initial_source,
        "fallback_used": False,
    }
    if not (probable_starters and away_team and home_team):
        return context

    starters = lookup_pitchers_for_game(
        away_team=away_team,
        home_team=home_team,
        starters_map=probable_starters,
    )
    if not starters:
        # NOTE(review): starter_cache_source keeps its initial
        # "matchup_incomplete" value on this path -- confirm that is intended.
        context["projected_starter_source"] = "matchup_not_found"
        return context

    home_name = str(starters.get("home_pitcher") or "").strip()
    away_name = str(starters.get("away_pitcher") or "").strip()

    context["projected_home_pitcher"] = home_name
    context["projected_away_pitcher"] = away_name
    context["projected_starter_available"] = bool(home_name or away_name)
    context["projected_starter_source"] = str(
        starters.get("starter_cache_source") or "probable_starters_matchup"
    )
    context["projected_home_pitcher_source"] = str(starters.get("home_pitcher_source") or "")
    context["projected_away_pitcher_source"] = str(starters.get("away_pitcher_source") or "")
    context["starter_cache_source"] = str(
        starters.get("starter_cache_source") or "probable_starters_matchup"
    )
    context["fallback_used"] = bool(starters.get("fallback_used"))
    return context


def _projected_starter_match_status(
    resolved_pitcher_name: str,
    projected_home_pitcher: str,
    projected_away_pitcher: str,
) -> str:
    """Compare the resolved pitcher with the game's projected starters.

    Returns one of:
        ``"projected_starter_unavailable"`` - neither starter is known;
        ``"projected_starter_available_but_unresolved"`` - no pitcher resolved;
        ``"matched_projected_home"`` / ``"matched_projected_away"`` - the
        resolved pitcher is that side's starter (home is checked first);
        ``"resolved_pitcher_mismatch"`` - the resolved pitcher is neither.
    """
    resolved = str(resolved_pitcher_name or "").strip()

    if not (projected_home_pitcher or projected_away_pitcher):
        return "projected_starter_unavailable"
    if not resolved:
        return "projected_starter_available_but_unresolved"

    candidates = (
        (projected_home_pitcher, "matched_projected_home"),
        (projected_away_pitcher, "matched_projected_away"),
    )
    for projected_name, status in candidates:
        if _names_match(projected_name, resolved):
            return status
    return "resolved_pitcher_mismatch"


def _resolve_pitcher_team_and_opponent(
    row: Any,
    pitcher_name: str,
    probable_starters: dict | None,
) -> tuple[str, str]:
    """Return ``(pitcher's team, opposing team)`` for a pitcher in the row's game.

    The pitcher is matched against the game's probable starters, away side
    first. ``("", "")`` is returned when a team name, the pitcher name or the
    starters map is missing, when the game is not in the map, or when the
    pitcher is neither starter.
    """
    unresolved = ("", "")

    away_team = str(row.get("away_team") or "").strip()
    home_team = str(row.get("home_team") or "").strip()
    if not (away_team and home_team and pitcher_name and probable_starters):
        return unresolved

    starters = lookup_pitchers_for_game(
        away_team=away_team,
        home_team=home_team,
        starters_map=probable_starters,
    )
    if not starters:
        return unresolved

    # (key of the starter in the map, that starter's team, the opponent)
    sides = (
        ("away_pitcher", away_team, home_team),
        ("home_pitcher", home_team, away_team),
    )
    for starter_key, team, opponent in sides:
        starter_name = str(starters.get(starter_key) or "").strip()
        if _names_match(starter_name, pitcher_name):
            return (team, opponent)
    return unresolved


def _resolve_strikeout_pitcher_name(
    row: Any,
    probable_starters: dict | None,
) -> tuple[str, str, str]:
    """Determine the pitcher a strikeout prop row refers to.

    The row's own pitcher is ``player_name_raw`` (falling back to
    ``player_name``). When the game's probable starters are available the name
    is cross-checked against them.

    Returns:
        ``(pitcher name, source, status)`` where status is ``"resolved"`` or
        ``"unresolved"``. Sources:

        * ``missing_pitcher_name`` - no name on the row and no starters map;
        * ``row_explicit`` - the row's name, used as-is because nothing could
          be cross-checked (resolved only when the name is non-empty);
        * ``row_explicit_validated`` - the row's name matches a probable
          starter;
        * ``probable_starters_single_side`` - the only known starter;
        * ``row_explicit_mismatch`` - both starters are known and neither
          matches the row's name.
    """
    explicit_pitcher = _to_display_name(row.get("player_name_raw") or row.get("player_name"))
    away_team = str(row.get("away_team") or "").strip()
    home_team = str(row.get("home_team") or "").strip()

    if not explicit_pitcher and not probable_starters:
        return ("", "missing_pitcher_name", "unresolved")

    # Outcome used whenever the row's own name cannot be cross-checked.
    row_fallback = (
        explicit_pitcher,
        "row_explicit",
        "resolved" if explicit_pitcher else "unresolved",
    )
    if not (probable_starters and away_team and home_team):
        return row_fallback

    starters = lookup_pitchers_for_game(
        away_team=away_team,
        home_team=home_team,
        starters_map=probable_starters,
    )
    if not starters:
        return row_fallback

    projected_home = str(starters.get("home_pitcher") or "").strip()
    projected_away = str(starters.get("away_pitcher") or "").strip()

    if explicit_pitcher and (
        _names_match(projected_home, explicit_pitcher)
        or _names_match(projected_away, explicit_pitcher)
    ):
        return (explicit_pitcher, "row_explicit_validated", "resolved")

    if bool(projected_home) != bool(projected_away):
        # NOTE(review): with exactly one known starter, that starter replaces
        # the row's own (non-matching) name -- confirm this substitution is
        # intended for a prop that is keyed on the pitcher.
        return (projected_home or projected_away, "probable_starters_single_side", "resolved")
    if projected_home:
        # Both starters are known and neither matched the row's name.
        return ("", "row_explicit_mismatch", "unresolved")
    return row_fallback


def _extract_team_batters_from_statcast(
    team_name: str,
    batter_statcast_df: pd.DataFrame | None,
    max_players: int = 9,
) -> list[str]:
    """List batters whose inferred team is ``team_name``.

    When the frame has a ``source_season`` column and contains 2026 rows, only
    those rows are considered; otherwise the whole frame is used. Players are
    visited in order of first appearance and each distinct (normalized) player
    is evaluated once with ``_infer_batter_team``.

    Args:
        team_name: Team to collect batters for.
        batter_statcast_df: Frame with at least a ``player_name`` column.
        max_players: Collection stops once this many players are found.

    Returns:
        Player names as spelled at their first appearance; ``[]`` when the
        team name is blank or the frame is missing, empty, or has no
        ``player_name`` column.
    """
    if (
        not team_name
        or batter_statcast_df is None
        or batter_statcast_df.empty
        or "player_name" not in batter_statcast_df.columns
    ):
        return []

    team_norm = _normalize_team_name(team_name)
    if not team_norm:
        return []

    # The frame is only read, never modified, so no defensive copy is needed.
    working = batter_statcast_df
    if "source_season" in working.columns:
        seasons = pd.to_numeric(working["source_season"], errors="coerce")
        current_rows = working[seasons == 2026]
        if not current_rows.empty:
            working = current_rows

    matched_names: list[str] = []
    evaluated_norms: set[str] = set()

    # dict.fromkeys de-duplicates while keeping first-seen order. Team
    # inference scans the whole frame, so it must run once per distinct
    # player rather than once per row.
    for player_name in dict.fromkeys(working["player_name"].dropna().astype(str)):
        player_norm = _normalize_person_name(player_name)
        if not player_norm or player_norm in evaluated_norms:
            continue
        # Inference matches on the normalized name, so every spelling of the
        # same player yields the same team; one evaluation is enough.
        evaluated_norms.add(player_norm)

        if _infer_batter_team(player_name, working) != team_norm:
            continue
        matched_names.append(player_name)
        if len(matched_names) >= max_players:
            break

    return matched_names


def _lookup_baseline_metadata(
    statcast_df: pd.DataFrame | None,
    player_name: str,
) -> dict[str, Any]:
    """Read the baseline-blend metadata stored on a player's first Statcast row.

    The player is located by normalized ``player_name``; the values are taken
    from the first matching row via ``.get`` (so an absent column yields
    ``None``).

    Returns:
        A dict with the keys ``baseline_mode``, ``prior_sample_size``,
        ``season_2026_sample_size``, ``prior_weight``, ``season_2026_weight``,
        ``baseline_driver`` and ``rolling_overlay_active``. Every value is
        ``None`` when the frame is missing or empty, the name is blank or
        normalizes to "", the ``player_name`` column is absent, or no row
        matches.
    """
    fields = (
        "baseline_mode",
        "prior_sample_size",
        "season_2026_sample_size",
        "prior_weight",
        "season_2026_weight",
        "baseline_driver",
        "rolling_overlay_active",
    )
    empty_meta: dict[str, Any] = dict.fromkeys(fields)

    if statcast_df is None or statcast_df.empty:
        return empty_meta
    if not player_name or "player_name" not in statcast_df.columns:
        return empty_meta

    target_key = _normalize_person_name(player_name)
    if not target_key:
        return empty_meta

    name_keys = statcast_df["player_name"].astype(str).map(_normalize_person_name)
    matches = statcast_df[name_keys == target_key].copy()
    if matches.empty:
        return empty_meta

    first_match = matches.iloc[0]
    return {field: first_match.get(field) for field in fields}


def get_player_hr_prob(
    player_name_normalized: str,
    statcast_df: pd.DataFrame,
    _name_index: dict[str, str] | None = None,
) -> tuple[float | None, str]:
    """Return ``(probability, source)`` for a player's pregame HR probability.

    Backward-compatible wrapper for callers expecting a two-tuple. The
    normalized name is translated to its Statcast spelling through
    ``_name_index`` (built from ``statcast_df`` when not supplied; names not
    in the index are used unchanged) and handed to the shared engine in
    ``"pregame"`` mode.

    Returns:
        ``(calibrated_hr_prob as float, "shared_pregame_engine")``, or
        ``(None, "unavailable")`` when the engine reports no calibrated
        probability.
    """
    if _name_index is None:
        lookup = _build_statcast_name_index(statcast_df)
    else:
        lookup = _name_index

    engine_result = build_hr_probability_result(
        batter_statcast_df=statcast_df,
        batter_name=lookup.get(player_name_normalized, player_name_normalized),
        mode="pregame",
    )

    calibrated = engine_result.get("calibrated_hr_prob")
    if calibrated is not None:
        return (float(calibrated), "shared_pregame_engine")
    return (None, "unavailable")


def map_hr_props_to_model(
    props_df: pd.DataFrame,
    statcast_df: pd.DataFrame,
    prob_fn: Callable[..., Any] | None = None,
    pitcher_stats_df: pd.DataFrame | None = None,
    pitcher_statcast_df: pd.DataFrame | None = None,
    probable_starters: dict | None = None,
) -> pd.DataFrame:
    """
    Join HR prop rows to shared-engine HR probabilities and compute edge.

    Only rows whose ``market`` equals ``"hr"`` are processed. For every such
    row the batter team, opposing pitcher, pitcher hand, lineup slot and team
    total are resolved (each memoized for the duration of the call), and, when
    the row is modeled, the shared engine is run in ``"pregame"`` mode.

    Args:
        props_df: Sportsbook prop rows; must contain a ``market`` column.
        statcast_df: Batter statcast frame passed to the engine and used for
            name, team, lineup-slot and baseline-metadata lookups.
        prob_fn: Accepted for backward compatibility and discarded.
        pitcher_stats_df: Pitcher frame used when ``pitcher_statcast_df`` is
            not given.
        pitcher_statcast_df: Preferred pitcher frame. When both pitcher frames
            are ``None`` the batter ``statcast_df`` is used instead.
        probable_starters: Probable-starter mapping forwarded to the starter
            and pitcher resolution helpers.

    Returns:
        An empty DataFrame when ``props_df`` is empty or has no ``"hr"`` rows.
        Otherwise one row per HR prop containing the original columns plus

          implied_prob, model_hr_prob, model_hr_prob_source, edge

        and shared-engine diagnostics:

          baseline_hr_prob, pregame_hr_prob, probability_mode,
          component adjustment columns, applied_layers, skipped_layers

        Rows with an edge come first, sorted by edge descending; rows without
        an edge follow. The frame is passed through
        ``enrich_with_execution_layer`` when that import and call succeed, and
        returned un-enriched otherwise.
    """
    # The parameter only exists so legacy call sites keep working.
    del prob_fn
    if props_df.empty:
        return pd.DataFrame()

    hr_df = props_df[props_df["market"] == "hr"].copy()
    if hr_df.empty:
        return pd.DataFrame()

    # Pitcher data precedence: statcast frame, then stats frame, then the
    # batter frame as a last resort.
    pitcher_df = (
        pitcher_statcast_df
        if pitcher_statcast_df is not None
        else pitcher_stats_df
        if pitcher_stats_df is not None
        else statcast_df
    )
    name_index = _build_statcast_name_index(statcast_df)
    runtime_cache: dict[str, Any] = {"name_index": name_index}

    # Per-call memo tables so each helper runs once per distinct key instead
    # of once per prop row.
    projected_starter_cache: dict[tuple[str, str, str], dict[str, Any]] = {}
    batter_team_cache: dict[tuple[str, str, str, str], tuple[str, str]] = {}
    pitcher_resolution_cache: dict[tuple[str, str, str, str, str], tuple[str, str, str]] = {}
    pitcher_hand_cache: dict[str, tuple[Any, Any]] = {}
    baseline_meta_cache: dict[tuple[int, str], dict[str, Any]] = {}
    lineup_slot_cache: dict[tuple[str, str, str], tuple[Any, Any]] = {}
    team_total_cache: dict[tuple[str, str, str, str, str, str], tuple[Any, Any]] = {}

    mapped_rows: list[dict[str, Any]] = []

    for _, row in hr_df.iterrows():
        odds = row.get("odds_american")
        batter_name_normalized = str(row.get("player_name") or "").strip()
        # Fall back to the sportsbook spelling when the index has no entry.
        batter_name = name_index.get(batter_name_normalized, batter_name_normalized)
        threshold = row.get("threshold")
        # Missing or unparseable thresholds default to 1.
        try:
            threshold_int = int(threshold) if threshold is not None and str(threshold).strip() not in {"", "nan", "None"} else 1
        except Exception:
            threshold_int = 1
        # An explicit is_modeled flag on the row wins; otherwise only
        # threshold-1 rows are modeled.
        is_modeled = bool(row.get("is_modeled")) if pd.notna(row.get("is_modeled")) else threshold_int == 1
        batter_team_key = (
            str(row.get("away_team") or "").strip().lower(),
            str(row.get("home_team") or "").strip().lower(),
            str(batter_name or "").strip().lower(),
            str(row.get("event_id") or "").strip(),
        )
        if batter_team_key not in batter_team_cache:
            batter_team_cache[batter_team_key] = _resolve_batter_team(
                row=row,
                batter_name=batter_name,
                batter_statcast_df=statcast_df,
            )
        batter_team, batter_team_source = batter_team_cache[batter_team_key]

        starter_key = (
            str(row.get("away_team") or "").strip().lower(),
            str(row.get("home_team") or "").strip().lower(),
            str(row.get("event_id") or "").strip(),
        )
        if starter_key not in projected_starter_cache:
            projected_starter_cache[starter_key] = _lookup_projected_starter_context(
                row=row,
                probable_starters=probable_starters,
            )
        projected_starter_context = projected_starter_cache[starter_key]
        # The event id is part of the key so two events between the same teams
        # (e.g. a doubleheader) never share a cached pitcher resolution; the
        # resolver receives the whole row and may depend on event fields.
        pitcher_resolution_key = (
            starter_key[0],
            starter_key[1],
            starter_key[2],
            str(batter_team or "").strip().lower(),
            str(row.get("pitcher_name") or row.get("pitcher") or "").strip().lower(),
        )
        if pitcher_resolution_key not in pitcher_resolution_cache:
            pitcher_resolution_cache[pitcher_resolution_key] = _resolve_pitcher_name(
                row=row,
                batter_team=batter_team,
                probable_starters=probable_starters,
            )
        pitcher_name, resolved_pitcher_source, pitcher_resolution_status = pitcher_resolution_cache[pitcher_resolution_key]
        projected_starter_match_status = _projected_starter_match_status(
            resolved_pitcher_name=pitcher_name,
            projected_home_pitcher=str(projected_starter_context.get("projected_home_pitcher") or ""),
            projected_away_pitcher=str(projected_starter_context.get("projected_away_pitcher") or ""),
        )
        pitcher_hand_key = str(pitcher_name or "").strip().lower()
        if pitcher_hand_key not in pitcher_hand_cache:
            pitcher_hand_cache[pitcher_hand_key] = _resolve_pitcher_hand(
                pitcher_name=pitcher_name,
                pitcher_statcast_df=pitcher_df,
            )
        pitcher_hand, pitcher_hand_source = pitcher_hand_cache[pitcher_hand_key]
        # Baseline metadata is cached per (frame identity, name) so batter and
        # pitcher lookups can share one table.
        batter_meta_key = (id(statcast_df), str(batter_name or "").strip().lower())
        if batter_meta_key not in baseline_meta_cache:
            baseline_meta_cache[batter_meta_key] = _lookup_baseline_metadata(statcast_df, batter_name)
        batter_baseline_meta = baseline_meta_cache[batter_meta_key]
        pitcher_meta_key = (id(pitcher_df), str(pitcher_name or "").strip().lower())
        if pitcher_meta_key not in baseline_meta_cache:
            baseline_meta_cache[pitcher_meta_key] = _lookup_baseline_metadata(pitcher_df, pitcher_name)
        pitcher_baseline_meta = baseline_meta_cache[pitcher_meta_key]
        lineup_slot_key = (
            str(batter_team or "").strip().lower(),
            str(batter_name or "").strip().lower(),
            str(pitcher_hand or "").strip().upper(),
        )
        if lineup_slot_key not in lineup_slot_cache:
            lineup_slot, lineup_slot_source = _infer_lineup_slot(
                batter_name=batter_name,
                batter_statcast_df=statcast_df,
            )
            lineup_slot_cache[lineup_slot_key] = (lineup_slot, lineup_slot_source)
        lineup_slot, lineup_slot_source = lineup_slot_cache[lineup_slot_key]
        team_total_key = (
            str(row.get("away_team") or "").strip().lower(),
            str(row.get("home_team") or "").strip().lower(),
            str(batter_team or "").strip().lower(),
            str(row.get("event_id") or "").strip(),
            str(row.get("sportsbook") or "").strip().lower(),
            str(row.get("team_total") or row.get("away_team_total") or row.get("home_team_total") or "").strip(),
        )
        if team_total_key not in team_total_cache:
            team_total_cache[team_total_key] = _resolve_team_total(row=row, batter_team=batter_team)
        team_total, team_total_source = team_total_cache[team_total_key]

        # Unparseable odds leave the row without an implied probability
        # rather than aborting the whole mapping.
        try:
            implied = american_to_implied_prob(odds) if odds is not None else None
        except Exception:
            implied = None

        if is_modeled:
            probability_result = build_hr_probability_result(
                batter_statcast_df=statcast_df,
                batter_name=batter_name,
                pitcher_statcast_df=pitcher_df,
                pitcher_name=pitcher_name,
                game_row={
                    **_build_game_context_from_row(row),
                    "lineup_slot": lineup_slot,
                    "lineup_slot_source": lineup_slot_source,
                    "team_total": team_total,
                    "team_total_source": team_total_source,
                    "projected_home_pitcher": projected_starter_context.get("projected_home_pitcher"),
                    "projected_away_pitcher": projected_starter_context.get("projected_away_pitcher"),
                    "projected_starter_available": projected_starter_context.get("projected_starter_available"),
                    "projected_starter_match_status": projected_starter_match_status,
                },
                weather_row=None,
                mode="pregame",
                runtime_cache=runtime_cache,
            )

            model_prob = probability_result.get("calibrated_hr_prob")
            # Edge and EV need both a model probability and a market price.
            if model_prob is not None and implied is not None:
                edge = compute_edge(model_prob, implied)
                bet_ev = compute_bet_ev(model_prob, odds) if odds is not None else None
                source = "shared_pregame_engine"
            else:
                edge = None
                bet_ev = None
                source = "unavailable"
        else:
            # Placeholder result for rows the engine does not model, so the
            # output keeps the same columns as modeled rows.
            probability_result = {
                "baseline_hr_prob": None,
                "raw_hr_prob": None,
                "calibrated_hr_prob": None,
                "pregame_hr_prob": None,
                "mode": "pregame",
                "applied_layers": "",
                "skipped_layers": "unmodeled_hr_ladder",
                "confidence_score": None,
                "confidence_bucket": None,
                "confidence_reasons": [],
                "opportunity_hr_adjustment": None,
                "expected_pa": None,
                "pa_multiplier": None,
                "lineup_slot_used": lineup_slot,
                "lineup_slot_source": lineup_slot_source,
                "team_total_used": team_total,
                "team_total_source": team_total_source,
                "opportunity_mode": None,
                "opportunity_reason": None,
                "pregame_pitcher_context_adj": None,
                "pregame_park_context_adj": None,
                "pregame_weather_context_adj": None,
                "pregame_context_applied": False,
                "pitcher_hr_adjustment": None,
                "trend_hr_adjustment": None,
                "zone_hr_adjustment": None,
                "family_zone_hr_adjustment": None,
                "arsenal_hr_adjustment": None,
                "pulled_contact_hr_adjustment": None,
                "env_hr_adjustment": None,
                "park_hr_adjustment": None,
                "weather_hr_adjustment": None,
                "platoon_hr_adjustment": None,
                "trajectory_hr_adjustment": None,
                "rolling_hr_adjustment": None,
                "pitcher_reliability": None,
                "trend_reliability": None,
                "zone_reliability": None,
                "family_zone_reliability": None,
                "arsenal_reliability": None,
                "pulled_contact_reliability": None,
                "environment_reliability": None,
                "trajectory_reliability": None,
                "rolling_reliability": None,
                "opportunity_reliability": None,
                "matchup_platoon_multiplier": None,
                "matchup_platoon_reason": "unmodeled_hr_ladder",
                "pitcher_resolution_status": "unmodeled_hr_ladder",
                "zone_status": "unmodeled_hr_ladder",
                "family_zone_status": "unmodeled_hr_ladder",
                "arsenal_status": "unmodeled_hr_ladder",
                "reason_candidate_count": 0,
                "zone_store_sample_size": None,
                "family_zone_batter_sample_size": None,
                "family_zone_pitcher_sample_size": None,
                "arsenal_batter_sample_size": None,
                "arsenal_pitcher_sample_size": None,
                "model_voice_reason_candidates": [],
                "model_voice_tags": [],
            }
            model_prob = None
            edge = None
            bet_ev = None
            source = "unmodeled_hr_ladder"

        probability_status = _classify_hr_probability_status(
            threshold_int=threshold_int,
            is_modeled=is_modeled,
            model_prob=model_prob,
            implied=implied,
            probability_result=probability_result,
            statcast_df=statcast_df,
            pitcher_name=pitcher_name,
        )

        # Start from the sportsbook row, then overlay model outputs; keys that
        # already exist on the row are overwritten.
        row_dict = row.to_dict()
        row_dict.update(
            {
                "implied_prob": implied,
                "model_hr_prob": model_prob,
                "fair_prob": model_prob,
                "model_hr_prob_source": source,
                "model_hr_prob_source_detail": probability_result.get("applied_layers", ""),
                "edge": edge,
                "bet_ev": bet_ev,
                "baseline_hr_prob": probability_result.get("baseline_hr_prob"),
                "raw_hr_prob": probability_result.get("raw_hr_prob"),
                "calibrated_hr_prob": probability_result.get("calibrated_hr_prob"),
                "pregame_hr_prob": probability_result.get("pregame_hr_prob"),
                "probability_mode": probability_result.get("mode"),
                "formula_version": probability_result.get("formula_version"),
                "is_modeled": is_modeled,
                "threshold": threshold_int,
                "confidence_score": probability_result.get("confidence_score"),
                "confidence_bucket": probability_result.get("confidence_bucket"),
                "confidence_reasons": probability_result.get("confidence_reasons"),
                "opportunity_hr_adjustment": probability_result.get("opportunity_hr_adjustment"),
                "expected_pa": probability_result.get("expected_pa"),
                "pa_multiplier": probability_result.get("pa_multiplier"),
                "lineup_slot_used": probability_result.get("lineup_slot_used", lineup_slot),
                "lineup_slot_source": probability_result.get("lineup_slot_source", lineup_slot_source),
                "team_total_used": probability_result.get("team_total_used", team_total),
                "team_total_source": probability_result.get("team_total_source", team_total_source),
                "opportunity_mode": probability_result.get("opportunity_mode"),
                "opportunity_reason": probability_result.get("opportunity_reason"),
                "pregame_pitcher_context_adj": probability_result.get("pregame_pitcher_context_adj"),
                "pregame_park_context_adj": probability_result.get("pregame_park_context_adj"),
                "pregame_weather_context_adj": probability_result.get("pregame_weather_context_adj"),
                "pregame_context_applied": probability_result.get("pregame_context_applied", False),
                "pitcher_hr_adjustment": probability_result.get("pitcher_hr_adjustment"),
                "trend_hr_adjustment": probability_result.get("trend_hr_adjustment"),
                "zone_hr_adjustment": probability_result.get("zone_hr_adjustment"),
                "family_zone_hr_adjustment": probability_result.get("family_zone_hr_adjustment"),
                "arsenal_hr_adjustment": probability_result.get("arsenal_hr_adjustment"),
                "pulled_contact_hr_adjustment": probability_result.get("pulled_contact_hr_adjustment"),
                "env_hr_adjustment": probability_result.get("env_hr_adjustment"),
                "park_hr_adjustment": probability_result.get("park_hr_adjustment"),
                "weather_hr_adjustment": probability_result.get("weather_hr_adjustment"),
                "platoon_hr_adjustment": probability_result.get("platoon_hr_adjustment"),
                "trajectory_hr_adjustment": probability_result.get("trajectory_hr_adjustment"),
                "rolling_hr_adjustment": probability_result.get("rolling_hr_adjustment"),
                "damage_zone_alignment_subscore": probability_result.get("damage_zone_alignment_subscore"),
                "pitch_mix_exposure_subscore": probability_result.get("pitch_mix_exposure_subscore"),
                "tunnel_damage_subscore": probability_result.get("tunnel_damage_subscore"),
                "count_pattern_damage_subscore": probability_result.get("count_pattern_damage_subscore"),
                "handedness_damage_subscore": probability_result.get("handedness_damage_subscore"),
                "arsenal_fit_subscore": probability_result.get("arsenal_fit_subscore"),
                "environment_amplification_subscore": probability_result.get("environment_amplification_subscore"),
                "hr_opportunity_projection": probability_result.get("hr_opportunity_projection"),
                "matchup_coverage_confidence": probability_result.get("matchup_coverage_confidence"),
                "component_source_map": probability_result.get("component_source_map"),
                "expected_pitch_mix_by_count": probability_result.get("expected_pitch_mix_by_count"),
                "expected_zone_mix_by_count": probability_result.get("expected_zone_mix_by_count"),
                "expected_pitch_zone_mix_by_count": probability_result.get("expected_pitch_zone_mix_by_count"),
                "tunnel_pair_scores": probability_result.get("tunnel_pair_scores"),
                "predicted_attack_regions": probability_result.get("predicted_attack_regions"),
                "predicted_damage_regions": probability_result.get("predicted_damage_regions"),
                "predicted_whiff_regions": probability_result.get("predicted_whiff_regions"),
                "pitcher_reliability": probability_result.get("pitcher_reliability"),
                "trend_reliability": probability_result.get("trend_reliability"),
                "zone_reliability": probability_result.get("zone_reliability"),
                "family_zone_reliability": probability_result.get("family_zone_reliability"),
                "arsenal_reliability": probability_result.get("arsenal_reliability"),
                "pulled_contact_reliability": probability_result.get("pulled_contact_reliability"),
                "environment_reliability": probability_result.get("environment_reliability"),
                "trajectory_reliability": probability_result.get("trajectory_reliability"),
                "rolling_reliability": probability_result.get("rolling_reliability"),
                "opportunity_reliability": probability_result.get("opportunity_reliability"),
                "applied_layers": probability_result.get("applied_layers"),
                "skipped_layers": probability_result.get("skipped_layers"),
                "matchup_platoon_multiplier": probability_result.get("matchup_platoon_multiplier"),
                "matchup_platoon_reason": probability_result.get("matchup_platoon_reason"),
                "resolved_pitcher_name": pitcher_name,
                "projected_home_pitcher": projected_starter_context.get("projected_home_pitcher"),
                "projected_away_pitcher": projected_starter_context.get("projected_away_pitcher"),
                "projected_starter_available": projected_starter_context.get("projected_starter_available"),
                "projected_starter_source": projected_starter_context.get("projected_starter_source"),
                "projected_home_pitcher_source": projected_starter_context.get("projected_home_pitcher_source"),
                "projected_away_pitcher_source": projected_starter_context.get("projected_away_pitcher_source"),
                "starter_cache_source": projected_starter_context.get("starter_cache_source"),
                "fallback_used": projected_starter_context.get("fallback_used"),
                "projected_starter_match_status": projected_starter_match_status,
                "batter_team": batter_team,
                "batter_team_source": batter_team_source,
                "resolved_pitcher_source": resolved_pitcher_source,
                # The engine's own status wins when it reports one.
                "pitcher_resolution_status": probability_result.get("pitcher_resolution_status", pitcher_resolution_status),
                "pitcher_hand": pitcher_hand,
                "pitcher_hand_source": pitcher_hand_source,
                "zone_status": probability_result.get("zone_status"),
                "family_zone_status": probability_result.get("family_zone_status"),
                "arsenal_status": probability_result.get("arsenal_status"),
                "reason_candidate_count": probability_result.get("reason_candidate_count"),
                "zone_store_sample_size": probability_result.get("zone_store_sample_size"),
                "family_zone_batter_sample_size": probability_result.get("family_zone_batter_sample_size"),
                "family_zone_pitcher_sample_size": probability_result.get("family_zone_pitcher_sample_size"),
                "arsenal_batter_sample_size": probability_result.get("arsenal_batter_sample_size"),
                "arsenal_pitcher_sample_size": probability_result.get("arsenal_pitcher_sample_size"),
                "model_voice_reason_candidates": probability_result.get("model_voice_reason_candidates", []),
                "model_voice_tags": probability_result.get("model_voice_tags", []),
                "selection_scope": row.get("selection_scope") or "player",
                "expected_modeled_hr_row": bool(threshold_int == 1 and str(row.get("market_family") or row.get("market") or "").strip().lower() == "hr"),
                "has_model_probability": model_prob is not None,
                "has_modeled_edge": edge is not None,
                "model_probability_status": probability_status,
                "modeled_row_available": model_prob is not None,
                "modeled_row_missing_reason": None if model_prob is not None else probability_status,
                "baseline_mode": batter_baseline_meta.get("baseline_mode"),
                "prior_sample_size": batter_baseline_meta.get("prior_sample_size"),
                "season_2026_sample_size": batter_baseline_meta.get("season_2026_sample_size"),
                "prior_weight": batter_baseline_meta.get("prior_weight"),
                "season_2026_weight": batter_baseline_meta.get("season_2026_weight"),
                "baseline_driver": batter_baseline_meta.get("baseline_driver"),
                "rolling_overlay_active": batter_baseline_meta.get("rolling_overlay_active"),
                "pitcher_baseline_mode": pitcher_baseline_meta.get("baseline_mode"),
                "pitcher_prior_sample_size": pitcher_baseline_meta.get("prior_sample_size"),
                "pitcher_season_2026_sample_size": pitcher_baseline_meta.get("season_2026_sample_size"),
                "pitcher_prior_weight": pitcher_baseline_meta.get("prior_weight"),
                "pitcher_season_2026_weight": pitcher_baseline_meta.get("season_2026_weight"),
                "pitcher_baseline_driver": pitcher_baseline_meta.get("baseline_driver"),
                "pitcher_rolling_overlay_active": pitcher_baseline_meta.get("rolling_overlay_active"),
            }
        )
        row_dict["verdict"] = _compute_verdict(
            bet_ev=bet_ev,
            edge=edge,
            confidence_score=row_dict.get("confidence_score"),
            is_modeled=is_modeled,
        )
        # The voice builder reads the fully populated row, so it runs last.
        row_dict.update(build_hr_model_voice(row_dict))
        mapped_rows.append(row_dict)

    result = pd.DataFrame(mapped_rows)
    if result.empty:
        return result

    # Rows with an edge first (largest edge on top), edge-less rows after.
    has_edge = result["edge"].notna()
    with_edge = result[has_edge].sort_values("edge", ascending=False)
    without_edge = result[~has_edge]
    ordered = pd.concat([with_edge, without_edge], ignore_index=True)

    # Execution-layer enrichment is best-effort: any failure importing or
    # running it falls back to the un-enriched frame.
    try:
        from analytics.execution_layer import enrich_with_execution_layer

        return enrich_with_execution_layer(ordered)
    except Exception:
        return ordered


def map_strikeout_props_to_model(
    props_df: pd.DataFrame,
    batter_statcast_df: pd.DataFrame,
    pitcher_statcast_df: pd.DataFrame | None = None,
    probable_starters: dict | None = None,
) -> pd.DataFrame:
    if props_df.empty:
        return pd.DataFrame()

    k_df = props_df[props_df["market"].astype(str).str.lower() == "k"].copy()
    if k_df.empty:
        return pd.DataFrame()

    pitcher_df = pitcher_statcast_df if pitcher_statcast_df is not None else batter_statcast_df
    runtime_cache: dict[str, Any] = {}
    projected_starter_cache: dict[tuple[str, str, str], dict[str, Any]] = {}
    pitcher_resolution_cache: dict[tuple[str, str, str], tuple[str, str, str]] = {}
    team_context_cache: dict[tuple[str, str, str], tuple[str, str]] = {}
    pitcher_hand_cache: dict[str, tuple[Any, Any]] = {}
    baseline_meta_cache: dict[tuple[int, str], dict[str, Any]] = {}
    lineup_cache: dict[str, list[str]] = {}
    strikeout_probability_cache: dict[tuple[Any, ...], dict[str, Any]] = {}
    mapped_rows: list[dict[str, Any]] = []

    for _, row in k_df.iterrows():
        line = row.get("line")
        selection_side = str(row.get("selection_side") or "").strip().lower()
        try:
            implied = american_to_implied_prob(row.get("odds_american")) if row.get("odds_american") is not None else None
        except Exception:
            implied = None

        starter_key = (
            str(row.get("away_team") or "").strip().lower(),
            str(row.get("home_team") or "").strip().lower(),
            str(row.get("event_id") or "").strip(),
        )
        if starter_key not in projected_starter_cache:
            projected_starter_cache[starter_key] = _lookup_projected_starter_context(
                row=row,
                probable_starters=probable_starters,
            )
        projected_starter_context = projected_starter_cache[starter_key]
        pitcher_resolution_key = (
            starter_key[0],
            starter_key[1],
            str(row.get("pitcher_name") or row.get("pitcher") or row.get("player_name") or "").strip().lower(),
        )
        if pitcher_resolution_key not in pitcher_resolution_cache:
            pitcher_resolution_cache[pitcher_resolution_key] = _resolve_strikeout_pitcher_name(
                row=row,
                probable_starters=probable_starters,
            )
        pitcher_name, resolved_pitcher_source, pitcher_resolution_status = pitcher_resolution_cache[pitcher_resolution_key]
        if pitcher_resolution_key not in team_context_cache:
            team_context_cache[pitcher_resolution_key] = _resolve_pitcher_team_and_opponent(
                row=row,
                pitcher_name=pitcher_name,
                probable_starters=probable_starters,
            )
        pitcher_team, opponent_team = team_context_cache[pitcher_resolution_key]
        projected_starter_match_status = _projected_starter_match_status(
            resolved_pitcher_name=pitcher_name,
            projected_home_pitcher=str(projected_starter_context.get("projected_home_pitcher") or ""),
            projected_away_pitcher=str(projected_starter_context.get("projected_away_pitcher") or ""),
        )
        pitcher_hand_key = str(pitcher_name or "").strip().lower()
        if pitcher_hand_key not in pitcher_hand_cache:
            pitcher_hand_cache[pitcher_hand_key] = _resolve_pitcher_hand(pitcher_name=pitcher_name, pitcher_statcast_df=pitcher_df)
        pitcher_hand, _ = pitcher_hand_cache[pitcher_hand_key]
        pitcher_meta_key = (id(pitcher_df), str(pitcher_name or "").strip().lower())
        if pitcher_meta_key not in baseline_meta_cache:
            baseline_meta_cache[pitcher_meta_key] = _lookup_baseline_metadata(pitcher_df, pitcher_name)
        pitcher_baseline_meta = baseline_meta_cache[pitcher_meta_key]
        lineup_key = str(opponent_team or "").strip().lower()
        if lineup_key not in lineup_cache:
            lineup_cache[lineup_key] = _extract_team_batters_from_statcast(
                team_name=opponent_team,
                batter_statcast_df=batter_statcast_df,
            )
        opponent_batters = lineup_cache[lineup_key]
        canonical_game_row = _build_game_context_from_row(row)
        canonical_game_row.update(
            {
                "projected_home_pitcher": projected_starter_context.get("projected_home_pitcher"),
                "projected_away_pitcher": projected_starter_context.get("projected_away_pitcher"),
                "projected_starter_available": projected_starter_context.get("projected_starter_available"),
                "projected_starter_source": projected_starter_context.get("projected_starter_source"),
                "projected_home_pitcher_source": projected_starter_context.get("projected_home_pitcher_source"),
                "projected_away_pitcher_source": projected_starter_context.get("projected_away_pitcher_source"),
                "starter_cache_source": projected_starter_context.get("starter_cache_source"),
                "fallback_used": projected_starter_context.get("fallback_used"),
                "projected_starter_match_status": projected_starter_match_status,
                "resolved_pitcher_name": pitcher_name,
                "resolved_pitcher_source": resolved_pitcher_source,
                "pitcher_resolution_status": pitcher_resolution_status,
                "pitcher_team": pitcher_team,
                "opponent_team": opponent_team,
            }
        )
        line_value = float(line) if line is not None and str(line).strip() not in {"", "nan", "None"} else None
        probability_cache_key = (
            str(pitcher_name or "").strip().lower(),
            tuple(str(name or "").strip().lower() for name in opponent_batters),
            str(opponent_team or "").strip().lower(),
            line_value,
            str(selection_side or "").strip().lower(),
            str(canonical_game_row.get("away_team") or "").strip().lower(),
            str(canonical_game_row.get("home_team") or "").strip().lower(),
            str(canonical_game_row.get("projected_starter_match_status") or "").strip().lower(),
        )
        if probability_cache_key not in strikeout_probability_cache:
            strikeout_probability_cache[probability_cache_key] = build_strikeout_probability_result_v2(
                pitcher_statcast_df=pitcher_df,
                pitcher_name=pitcher_name,
                batter_statcast_df=batter_statcast_df,
                opponent_batters=opponent_batters,
                opponent_team=opponent_team,
                line=line_value,
                selection_side=selection_side,
                game_row=canonical_game_row,
                runtime_cache=runtime_cache,
            )
        probability_result_v2 = strikeout_probability_cache[probability_cache_key]
        confidence_payload = _build_strikeout_confidence_payload(
            probability_result=probability_result_v2,
        )

        fair_prob = probability_result_v2.get("fair_prob")
        probability_status = _classify_strikeout_probability_status(
            fair_prob=fair_prob,
            implied=implied,
            pitcher_name=pitcher_name,
            probability_result={
                **probability_result_v2,
                "pitcher_resolution_status": pitcher_resolution_status,
                "projected_starter_match_status": projected_starter_match_status,
            },
        )
        if fair_prob is not None and implied is not None:
            edge = compute_edge(fair_prob, implied)
            bet_ev = compute_bet_ev(fair_prob, row.get("odds_american")) if row.get("odds_american") is not None else None
            source = "shared_strikeout_engine_v2"
            is_modeled = True
        else:
            edge = None
            bet_ev = None
            source = "unavailable"
            is_modeled = False

        row_dict = row.to_dict()
        row_dict.update(
            {
                "selection_scope": row.get("selection_scope") or "pitcher",
                "is_modeled": is_modeled,
                "implied_prob": implied,
                "fair_prob": fair_prob,
                "model_k_prob": fair_prob,
                "bet_ev": bet_ev,
                "edge": edge,
                "confidence_score": confidence_payload.get("confidence_score_display"),
                "confidence_bucket": confidence_payload.get("confidence_bucket_display"),
                "confidence_reasons": confidence_payload.get("confidence_reasons"),
                "confidence_score_raw": confidence_payload.get("confidence_score_raw"),
                "confidence_score_display": confidence_payload.get("confidence_score_display"),
                "confidence_source": confidence_payload.get("confidence_source"),
                "confidence_component_bonuses": confidence_payload.get("confidence_component_bonuses"),
                "confidence_component_penalties": confidence_payload.get("confidence_component_penalties"),
                "confidence_primary_driver": confidence_payload.get("confidence_primary_driver"),
                "confidence_summary_label": confidence_payload.get("confidence_summary_label"),
                "confidence_bucket_raw": confidence_payload.get("confidence_bucket_raw"),
                "confidence_bucket_display": confidence_payload.get("confidence_bucket_display"),
                "expected_strikeouts": probability_result_v2.get("expected_strikeouts"),
                "expected_strikeouts_v2": probability_result_v2.get("expected_strikeouts_v2"),
                "projected_pitch_count": probability_result_v2.get("projected_pitch_count"),
                "projected_batters_faced": probability_result_v2.get("projected_batters_faced"),
                "projected_innings": probability_result_v2.get("projected_innings"),
                "pitches_per_bf": probability_result_v2.get("pitches_per_bf"),
                "opportunity_confidence": probability_result_v2.get("opportunity_confidence"),
                "opportunity_reasons": probability_result_v2.get("opportunity_reasons"),
                "projected_k_rate": probability_result_v2.get("projected_k_rate"),
                "fair_prob_v2": probability_result_v2.get("fair_prob_v2"),
                "raw_k_prob_v2": probability_result_v2.get("raw_k_prob_v2"),
                "calibrated_k_prob_v2": probability_result_v2.get("calibrated_k_prob_v2"),
                "confidence_score_v2": probability_result_v2.get("confidence_score_v2"),
                "confidence_score_raw_v2": probability_result_v2.get("confidence_score_raw_v2"),
                "confidence_score_display_v2": probability_result_v2.get("confidence_score_display_v2"),
                "confidence_source_v2": probability_result_v2.get("confidence_source_v2"),
                "confidence_bucket_v2": probability_result_v2.get("confidence_bucket_v2"),
                "confidence_reasons_v2": probability_result_v2.get("confidence_reasons_v2"),
                "confidence_component_bonuses_v2": probability_result_v2.get("confidence_component_bonuses_v2"),
                "confidence_component_penalties_v2": probability_result_v2.get("confidence_component_penalties_v2"),
                "confidence_primary_driver_v2": probability_result_v2.get("confidence_primary_driver_v2"),
                "confidence_summary_label_v2": probability_result_v2.get("confidence_summary_label_v2"),
                "k_rate_pitch_signal": probability_result_v2.get("k_rate_pitch_signal"),
                "k_rate_anchor": probability_result_v2.get("k_rate_anchor"),
                "bb_rate_anchor": probability_result_v2.get("bb_rate_anchor"),
                "command_efficiency_signal": probability_result_v2.get("command_efficiency_signal"),
                "swing_miss_subscore": probability_result_v2.get("swing_miss_subscore"),
                "called_strike_subscore": probability_result_v2.get("called_strike_subscore"),
                "command_efficiency_subscore": probability_result_v2.get("command_efficiency_subscore"),
                "lineup_whiff_subscore": probability_result_v2.get("lineup_whiff_subscore"),
                "zone_matchup_subscore": probability_result_v2.get("zone_matchup_subscore"),
                "family_zone_matchup_subscore": probability_result_v2.get("family_zone_matchup_subscore"),
                "arsenal_fit_subscore": probability_result_v2.get("arsenal_fit_subscore"),
                "tunneling_subscore": probability_result_v2.get("tunneling_subscore"),
                "release_consistency_subscore": probability_result_v2.get("release_consistency_subscore"),
                "sequencing_subscore": probability_result_v2.get("sequencing_subscore"),
                "count_leverage_subscore": probability_result_v2.get("count_leverage_subscore"),
                "leash_risk_subscore": probability_result_v2.get("leash_risk_subscore"),
                "role_certainty_score": probability_result_v2.get("role_certainty_score"),
                "times_through_order_penalty": probability_result_v2.get("times_through_order_penalty"),
                "telemetry_path_status": probability_result_v2.get("telemetry_path_status"),
                "model_tier": probability_result_v2.get("model_tier"),
                "variance_band_low": probability_result_v2.get("variance_band_low"),
                "variance_band_high": probability_result_v2.get("variance_band_high"),
                "matchup_coverage_confidence": probability_result_v2.get("matchup_coverage_confidence"),
                "component_source_map": probability_result_v2.get("component_source_map"),
                "predicted_whiff_regions": probability_result_v2.get("predicted_whiff_regions"),
                "predicted_attack_regions": probability_result_v2.get("predicted_attack_regions"),
                "predicted_damage_regions": probability_result_v2.get("predicted_damage_regions"),
                "tunnel_pair_scores": probability_result_v2.get("tunnel_pair_scores"),
                "formula_version": probability_result_v2.get("formula_version"),
                "pitcher_swstr_rate": probability_result_v2.get("pitcher_swstr_rate"),
                "pitcher_csw_rate": probability_result_v2.get("pitcher_csw_rate"),
                "pitcher_ball_rate": probability_result_v2.get("pitcher_ball_rate"),
                "arsenal_whiff_risk": probability_result_v2.get("arsenal_fit_subscore"),
                "family_zone_whiff_risk": probability_result_v2.get("family_zone_matchup_subscore"),
                "zone_whiff_risk": probability_result_v2.get("zone_matchup_subscore"),
                "trajectory_tunnel_score": probability_result_v2.get("tunneling_subscore"),
                "trajectory_release_consistency_score": probability_result_v2.get("release_consistency_subscore"),
                "sequencing_score": probability_result_v2.get("sequencing_subscore"),
                "applied_layers": probability_result_v2.get("applied_layers"),
                "skipped_layers": probability_result_v2.get("skipped_layers"),
                "model_k_prob_source": source,
                "model_k_prob_source_detail": probability_result_v2.get("applied_layers", ""),
                "resolved_pitcher_name": pitcher_name,
                "resolved_pitcher_source": resolved_pitcher_source,
                "projected_home_pitcher": projected_starter_context.get("projected_home_pitcher"),
                "projected_away_pitcher": projected_starter_context.get("projected_away_pitcher"),
                "projected_starter_available": projected_starter_context.get("projected_starter_available"),
                "projected_starter_source": projected_starter_context.get("projected_starter_source"),
                "projected_home_pitcher_source": projected_starter_context.get("projected_home_pitcher_source"),
                "projected_away_pitcher_source": projected_starter_context.get("projected_away_pitcher_source"),
                "starter_cache_source": projected_starter_context.get("starter_cache_source"),
                "fallback_used": projected_starter_context.get("fallback_used"),
                "projected_starter_match_status": projected_starter_match_status,
                "pitcher_resolution_status": pitcher_resolution_status,
                "pitcher_team": pitcher_team,
                "opponent_team": opponent_team,
                "has_model_probability": fair_prob is not None,
                "has_modeled_edge": edge is not None,
                "model_probability_status": probability_status,
                "modeled_row_available": fair_prob is not None,
                "modeled_row_missing_reason": None if fair_prob is not None else probability_status,
                "baseline_mode": pitcher_baseline_meta.get("baseline_mode"),
                "prior_sample_size": pitcher_baseline_meta.get("prior_sample_size"),
                "season_2026_sample_size": pitcher_baseline_meta.get("season_2026_sample_size"),
                "prior_weight": pitcher_baseline_meta.get("prior_weight"),
                "season_2026_weight": pitcher_baseline_meta.get("season_2026_weight"),
                "baseline_driver": pitcher_baseline_meta.get("baseline_driver"),
                "rolling_overlay_active": pitcher_baseline_meta.get("rolling_overlay_active"),
            }
        )
        row_dict["verdict"] = _compute_verdict(
            bet_ev=bet_ev,
            edge=edge,
            confidence_score=row_dict.get("confidence_score"),
            is_modeled=is_modeled,
        )
        row_dict.update(build_strikeout_model_voice(row_dict))
        mapped_rows.append(row_dict)

    return pd.DataFrame(mapped_rows)


def map_no_home_run_props(
    props_df: pd.DataFrame,
) -> pd.DataFrame:
    """Return the no-HR prop rows annotated as tracked-but-unmodeled markets.

    Rows whose ``market_family`` equals ``"no_hr"`` (case-insensitive) are
    copied out of ``props_df``. Each copied row gets the market-implied
    probability derived from ``odds_american`` (``None`` when the odds are
    absent), while every model-derived field is set to ``None`` and the
    verdict is fixed to ``"tracked"``.

    Args:
        props_df: Sportsbook prop rows. Expected to carry a ``market_family``
            column; ``odds_american`` is optional.

    Returns:
        A new DataFrame holding only the annotated no-HR rows, or an empty
        DataFrame when ``props_df`` is empty, has no ``market_family``
        column, or contains no no-HR rows. ``props_df`` is not modified.
    """
    # A frame without the classifying column cannot contain no-HR rows;
    # treat it like the empty-input case instead of raising KeyError.
    if props_df.empty or "market_family" not in props_df.columns:
        return pd.DataFrame()

    is_no_hr = props_df["market_family"].astype(str).str.lower() == "no_hr"
    no_hr_df = props_df[is_no_hr].copy()
    if no_hr_df.empty:
        return pd.DataFrame()

    row_count = len(no_hr_df)
    if "odds_american" in no_hr_df.columns:
        implied_probs = [
            american_to_implied_prob(odds) if odds is not None else None
            for odds in no_hr_df["odds_american"].tolist()
        ]
    else:
        implied_probs = [None] * row_count

    # Whole-column assignment is used instead of per-cell `.at` writes:
    # it is positional, so duplicate index labels cannot cross-contaminate
    # rows, and a list stored in a cell is never unpacked as a sequence of
    # values when the target column does not exist yet.
    no_hr_df["selection_scope"] = "game"
    no_hr_df["implied_prob"] = implied_probs
    for unmodeled_column in (
        "fair_prob",
        "edge",
        "bet_ev",
        "confidence_score",
        "confidence_bucket",
    ):
        no_hr_df[unmodeled_column] = None
    # One fresh list per row so later in-place edits of a cell stay local.
    no_hr_df["confidence_reasons"] = [
        ["No-HR fair probability model not active yet"] for _ in range(row_count)
    ]
    no_hr_df["verdict"] = "tracked"
    no_hr_df["model_voice_for"] = "Market is tracked for future release"
    no_hr_df["model_voice_against"] = "No-HR fair probability model is not active yet"
    return no_hr_df


def map_props_to_models(
    props_df: pd.DataFrame,
    statcast_df: pd.DataFrame,
    pitcher_statcast_df: pd.DataFrame | None = None,
    probable_starters: dict | None = None,
) -> pd.DataFrame:
    """Run every prop mapper over ``props_df`` and stack the results.

    The HR, strikeout, and no-HR mappers are invoked in that order. Mapper
    outputs that come back empty are dropped; the rest are concatenated
    with a fresh index and without column sorting.

    Args:
        props_df: Sportsbook prop rows handed to each mapper.
        statcast_df: Forwarded to the HR mapper positionally and to the
            strikeout mapper as ``batter_statcast_df``.
        pitcher_statcast_df: Optional frame forwarded to the HR and
            strikeout mappers.
        probable_starters: Optional mapping forwarded to the HR and
            strikeout mappers.

    Returns:
        The concatenated mapper output, or an empty DataFrame when every
        mapper returned an empty frame.
    """
    # Tuple elements are evaluated left to right, preserving mapper order.
    mapper_outputs = (
        map_hr_props_to_model(
            props_df,
            statcast_df,
            pitcher_statcast_df=pitcher_statcast_df,
            probable_starters=probable_starters,
        ),
        map_strikeout_props_to_model(
            props_df,
            batter_statcast_df=statcast_df,
            pitcher_statcast_df=pitcher_statcast_df,
            probable_starters=probable_starters,
        ),
        map_no_home_run_props(props_df),
    )

    populated: list[pd.DataFrame] = [
        mapped for mapped in mapper_outputs if not mapped.empty
    ]
    if populated:
        return pd.concat(populated, ignore_index=True, sort=False)
    return pd.DataFrame()