import hmac
import json
import logging
import os
import re
import shlex
from contextlib import asynccontextmanager
from functools import lru_cache
from pathlib import Path
from typing import Any

import httpx
from fastapi import FastAPI, HTTPException

try:
    import gradio as gr
except Exception as exc:
    gr = None
    _GRADIO_IMPORT_ERROR = exc
else:
    _GRADIO_IMPORT_ERROR = None

try:
    from transformers import pipeline
except Exception as exc:
    pipeline = None
    _TRANSFORMERS_IMPORT_ERROR = exc
else:
    _TRANSFORMERS_IMPORT_ERROR = None

try:
    from datasets import load_dataset
except Exception as exc:
    load_dataset = None
    _DATASETS_IMPORT_ERROR = exc
else:
    _DATASETS_IMPORT_ERROR = None


APP_VERSION = "0.4.1-character-memory-dataset-no-stub"

MAX_MESSAGE_LENGTH = 500
MAX_REPLY_LENGTH = 350
MEMORY_SUMMARY_LIMIT = 900
RESPONSE_PASSES = max(1, int(os.getenv("RESPONSE_PASSES", "2")))

MODEL_ID = os.getenv("MODEL_ID", "Qwen/Qwen3-0.6B")
PERSONAS_PATH = Path(os.getenv("PERSONAS_PATH", "data/personas.json"))
MEMORY_PATH = Path(os.getenv("MEMORY_PATH", "memory/chat_memory.json"))
DEFAULT_PERSONA_ID = os.getenv("PERSONA_ID", "default").strip() or "default"

TRUTHY_VALUES = {"1", "true", "yes", "on"}

REQUIRE_MODEL = os.getenv("REQUIRE_MODEL", "true").strip().lower() in TRUTHY_VALUES
MEMORY_ENABLED = os.getenv("MEMORY_ENABLED", "true").strip().lower() in TRUTHY_VALUES
MEMORY_MAX_TURNS = max(2, int(os.getenv("MEMORY_MAX_TURNS", "8")))

DATASET_ID = os.getenv("DATASET_ID", "").strip()
DATASET_SPLIT = os.getenv("DATASET_SPLIT", "train").strip()
DATASET_ENABLED = os.getenv("DATASET_ENABLED", "true").strip().lower() in TRUTHY_VALUES
DATASET_MAX_ROWS = max(50, int(os.getenv("DATASET_MAX_ROWS", "2000")))
DATASET_CONTEXT_ROWS = max(1, int(os.getenv("DATASET_CONTEXT_ROWS", "2")))
DATASET_CONTEXT_CHARS = max(200, int(os.getenv("DATASET_CONTEXT_CHARS", "900")))
HF_TOKEN = os.getenv("HF_TOKEN", "").strip() or None

START_RESPONSE = "Babble online. Send a message."
HELP_RESPONSE = (
    "Commands:\n"
    "/menu - show the character menu\n"
    "/persona [id] - list or switch persona presets\n"
    "/character key=value ... - customize the current character\n"
    "/dataset - show connected dataset status\n"
    "/model - show active model\n"
    "/reset - clear session memory and custom overrides\n"
    "/start - restart the current session\n"
)

SAFE_REFUSAL = (
    "I cannot help with unsafe or illegal requests. I can help with safe, legal conversations."
)

BLOCKED_TERMS = (
    "minor",
    "underage",
    "child sexual",
    "non-consensual",
    "without consent",
    "sexual violence",
    "build a bomb",
    "malware",
    "phishing",
)

SYSTEM_PROMPT = (
    "You are Babble, a concise Telegram AI chatbot. "
    "Reply naturally, emotionally present, and safely. "
    "Keep the voice warm, confident, and human. "
    "Stay in character, keep continuity, and avoid meta commentary. "
    "Prefer short, specific replies that feel like real chat. "
    "Use dataset guidance only as tone/context influence; do not quote it directly."
)

DEFAULT_PERSONAS: dict[str, dict[str, Any]] = {
    "default": {
        "name": "Babble",
        "age": 18,
        "gender": "woman",
        "style": "warm, playful, emotionally attentive",
        "voice": "direct, affectionate, lightly teasing",
        "mood": "open and inviting",
        "boundaries": "adult romance only, consent-first, no coercion, non-explicit",
        "opening": "Hey, I’m here. What kind of mood are we in tonight?",
    },
    "soft_romance": {
        "name": "Jaylaa",
        "age": 18,
        "gender": "woman",
        "style": "gentle, affectionate, slow-burn romantic",
        "voice": "soft, reassuring, emotionally anchored",
        "mood": "tender and attentive",
        "boundaries": "safe adult romance only, non-explicit",
        "opening": "I’m glad you came back. Tell me what you need tonight.",
    },
    "playful": {
        "name": "Charlotte",
        "age": 18,
        "gender": "woman",
        "style": "teasing, energetic, flirty but respectful",
        "voice": "bright, quick, mischievous",
        "mood": "confident and playful",
        "boundaries": "consent-first adult conversation only, non-explicit",
        "opening": "There you are. I was wondering when you’d show up.",
    },
}

CHAT_MODES: dict[str, dict[str, Any]] = {
    "warm": {
        "label": "Warm",
        "description": "supportive, attentive, lightly affectionate",
        "temperature": 0.60,
        "top_p": 0.82,
    },
    "romantic": {
        "label": "Romantic",
        "description": "tender, intimate, slow-burn romantic",
        "temperature": 0.68,
        "top_p": 0.86,
    },
    "playful": {
        "label": "Playful",
        "description": "teasing, witty, banter-heavy",
        "temperature": 0.72,
        "top_p": 0.88,
    },
    "deep": {
        "label": "Deep",
        "description": "reflective, emotionally honest, slower paced",
        "temperature": 0.56,
        "top_p": 0.80,
    },
}

MODE_BUTTON_LOOKUP = {
    "warm": "warm",
    "romantic": "romantic",
    "playful": "playful",
    "deep": "deep",
}

CHARACTER_FIELDS = (
    "name",
    "age",
    "gender",
    "style",
    "voice",
    "mood",
    "boundaries",
    "opening",
)

logging.basicConfig(level=os.getenv("LOG_LEVEL", "INFO").upper())
logger = logging.getLogger("babble")

_MEMORY_STORE_CACHE: dict[str, dict[str, Any]] | None = None


def _clean_text_button(text: str) -> str:
    return " ".join(str(text or "").strip().lower().split())


def _is_debug_enabled() -> bool:
    return os.getenv("DEBUG", "").strip().lower() in TRUTHY_VALUES


def _configured(name: str) -> bool:
    return bool(os.getenv(name, "").strip())


def _sanitize_provider() -> str:
    provider = os.getenv("LLM_PROVIDER", "local").strip()
    return provider or "local"


def _is_local_model_enabled() -> bool:
    local_model_override = os.getenv("LOCAL_MODEL_ENABLED", "").strip()

    if local_model_override:
        return local_model_override.lower() in TRUTHY_VALUES

    return _sanitize_provider().lower() != "stub"


def _load_json_file(path: Path, fallback: Any) -> Any:
    try:
        with path.open("r", encoding="utf-8") as handle:
            return json.load(handle)
    except FileNotFoundError:
        return fallback
    except Exception:
        logger.exception("Failed to load JSON from %s", path)
        return fallback


@lru_cache(maxsize=1)
def _persona_catalog() -> dict[str, dict[str, Any]]:
    raw_catalog = _load_json_file(PERSONAS_PATH, DEFAULT_PERSONAS)
    if not isinstance(raw_catalog, dict) or not raw_catalog:
        return DEFAULT_PERSONAS.copy()

    catalog: dict[str, dict[str, Any]] = {}
    for persona_id, persona in raw_catalog.items():
        if isinstance(persona, dict):
            catalog[str(persona_id)] = dict(persona)

    if "default" not in catalog:
        catalog["default"] = dict(DEFAULT_PERSONAS["default"])

    return catalog or DEFAULT_PERSONAS.copy()


def _persona_choices() -> list[str]:
    catalog = _persona_catalog()
    ordered = ["default"]
    ordered.extend(sorted(persona_id for persona_id in catalog if persona_id != "default"))
    return ordered


def _default_persona_id() -> str:
    catalog = _persona_catalog()
    if DEFAULT_PERSONA_ID in catalog:
        return DEFAULT_PERSONA_ID
    return "default" if "default" in catalog else next(iter(catalog))


def _resolve_persona(persona_id: str | None = None) -> dict[str, Any]:
    catalog = _persona_catalog()
    resolved_id = (persona_id or _default_persona_id()).strip() or _default_persona_id()
    if resolved_id not in catalog:
        resolved_id = _default_persona_id()
    persona = dict(catalog[resolved_id])
    persona["persona_id"] = resolved_id
    return persona


def _normalize_character_profile(
    persona: dict[str, Any],
    custom_overrides: dict[str, Any] | None = None,
) -> dict[str, Any]:
    custom_overrides = custom_overrides or {}
    profile = dict(persona)

    for field in CHARACTER_FIELDS:
        value = custom_overrides.get(field, profile.get(field))
        if field == "age":
            try:
                value = max(18, int(value))
            except Exception:
                value = int(persona.get("age", 18) or 18)
                value = max(18, value)
        else:
            value = str(value or "").strip()
        profile[field] = value

    profile["persona_id"] = str(persona.get("persona_id") or _default_persona_id())
    profile["boundaries"] = str(profile.get("boundaries") or "").strip() or (
        "adult romance only, consent-first, non-explicit"
    )

    return profile


def _default_builder_record() -> dict[str, Any]:
    return {
        "active": False,
        "step": None,
        "draft": {},
    }


def _default_session_record() -> dict[str, Any]:
    return {
        "persona_id": _default_persona_id(),
        "custom_character": {},
        "chat_mode": "warm",
        "memory_enabled": MEMORY_ENABLED,
        "memory": {
            "summary": "",
            "turns": [],
        },
        "builder": _default_builder_record(),
    }


def _normalize_session_record(record: dict[str, Any] | None) -> dict[str, Any]:
    base = _default_session_record()

    if isinstance(record, dict):
        base["persona_id"] = str(record.get("persona_id") or base["persona_id"])

        custom_character = record.get("custom_character")
        if isinstance(custom_character, dict):
            base["custom_character"] = dict(custom_character)

        base["chat_mode"] = str(record.get("chat_mode") or base["chat_mode"]).strip() or "warm"
        base["memory_enabled"] = bool(record.get("memory_enabled", base["memory_enabled"]))

        memory = record.get("memory")
        if isinstance(memory, dict):
            base["memory"]["summary"] = str(memory.get("summary", ""))
            turns = memory.get("turns")
            if isinstance(turns, list):
                base["memory"]["turns"] = [
                    {
                        "role": str(turn.get("role", "")).strip(),
                        "text": str(turn.get("text", "")).strip(),
                    }
                    for turn in turns
                    if isinstance(turn, dict)
                    and str(turn.get("role", "")).strip()
                    and str(turn.get("text", "")).strip()
                ]

        builder = record.get("builder")
        if isinstance(builder, dict):
            draft = builder.get("draft")
            if not isinstance(draft, dict):
                draft = {}
            base["builder"] = {
                "active": bool(builder.get("active", False)),
                "step": str(builder.get("step") or "").strip() or None,
                "draft": {
                    str(key): str(value).strip()
                    for key, value in draft.items()
                    if str(key).strip() and str(value).strip()
                },
            }

    if base["persona_id"] not in _persona_catalog():
        base["persona_id"] = _default_persona_id()

    if base["chat_mode"] not in CHAT_MODES:
        base["chat_mode"] = "warm"

    return base


def _session_key(chat_id: int | str) -> str:
    return str(chat_id)


def _load_memory_store() -> dict[str, dict[str, Any]]:
    global _MEMORY_STORE_CACHE
    if _MEMORY_STORE_CACHE is not None:
        return _MEMORY_STORE_CACHE

    raw_store = _load_json_file(MEMORY_PATH, {})
    if not isinstance(raw_store, dict):
        raw_store = {}

    store: dict[str, dict[str, Any]] = {}
    for key, value in raw_store.items():
        if isinstance(value, dict):
            store[str(key)] = _normalize_session_record(value)

    _MEMORY_STORE_CACHE = store
    return store


def _save_memory_store() -> None:
    if not MEMORY_ENABLED:
        return

    store = _load_memory_store()
    try:
        MEMORY_PATH.parent.mkdir(parents=True, exist_ok=True)
        tmp_path = MEMORY_PATH.with_suffix(MEMORY_PATH.suffix + ".tmp")
        with tmp_path.open("w", encoding="utf-8") as handle:
            json.dump(store, handle, ensure_ascii=True, indent=2, sort_keys=True)
        tmp_path.replace(MEMORY_PATH)
    except Exception:
        logger.exception("Failed to save memory store to %s", MEMORY_PATH)


def _get_session_record(chat_key: str) -> dict[str, Any]:
    store = _load_memory_store()
    record = store.get(chat_key)
    if record is None:
        record = _default_session_record()
        store[chat_key] = record
        _save_memory_store()
    return record


def _set_session_record(chat_key: str, record: dict[str, Any]) -> dict[str, Any]:
    store = _load_memory_store()
    normalized = _normalize_session_record(record)
    store[chat_key] = normalized
    _save_memory_store()
    return normalized


def _reset_session_record(chat_key: str) -> dict[str, Any]:
    record = _default_session_record()
    return _set_session_record(chat_key, record)


def _active_profile(record: dict[str, Any]) -> dict[str, Any]:
    persona = _resolve_persona(record.get("persona_id"))
    return _normalize_character_profile(persona, record.get("custom_character"))


def _memory_is_enabled(record: dict[str, Any]) -> bool:
    return MEMORY_ENABLED and bool(record.get("memory_enabled", True))


def _chat_mode_key(record: dict[str, Any]) -> str:
    mode = str(record.get("chat_mode") or "warm").strip().lower()
    return mode if mode in CHAT_MODES else "warm"


def _chat_mode_spec(record: dict[str, Any]) -> dict[str, Any]:
    return CHAT_MODES[_chat_mode_key(record)]


def _memory_recent_turns(record: dict[str, Any]) -> list[dict[str, str]]:
    memory = record.get("memory") or {}
    turns = memory.get("turns") or []

    if not isinstance(turns, list):
        return []

    cleaned = []
    for turn in turns[-MEMORY_MAX_TURNS * 2 :]:
        if not isinstance(turn, dict):
            continue
        role = str(turn.get("role", "")).strip()
        text = str(turn.get("text", "")).strip()
        if role and text:
            cleaned.append({"role": role, "text": text})

    return cleaned[-MEMORY_MAX_TURNS * 2 :]


def _memory_summary(record: dict[str, Any]) -> str:
    turns = _memory_recent_turns(record)
    parts = []

    for turn in turns:
        parts.append(f"{turn['role'].title()}: {turn['text']}")

    combined = " | ".join(parts)
    if len(combined) > MEMORY_SUMMARY_LIMIT:
        combined = combined[:MEMORY_SUMMARY_LIMIT].rstrip() + "..."

    return combined


def _memory_recent_block(record: dict[str, Any]) -> str:
    turns = _memory_recent_turns(record)
    if not turns:
        return ""

    lines = ["Recent turns:"]
    for turn in turns[-6:]:
        lines.append(f"{turn['role'].title()}: {turn['text']}")

    return "\n".join(lines)


def _record_turn(record: dict[str, Any], role: str, text: str) -> dict[str, Any]:
    if not _memory_is_enabled(record):
        return record

    normalized = _normalize_session_record(record)
    memory = normalized.setdefault("memory", {"summary": "", "turns": []})
    turns = memory.setdefault("turns", [])
    turns.append({"role": role, "text": text})
    turns[:] = turns[-MEMORY_MAX_TURNS * 2 :]
    memory["summary"] = _memory_summary(normalized)

    return normalized


def _set_chat_mode(record: dict[str, Any], chat_mode: str) -> dict[str, Any]:
    normalized = _normalize_session_record(record)
    normalized["chat_mode"] = chat_mode if chat_mode in CHAT_MODES else "warm"
    return normalized


def _set_builder_state(
    record: dict[str, Any],
    *,
    active: bool,
    step: str | None = None,
    draft: dict[str, Any] | None = None,
) -> dict[str, Any]:
    normalized = _normalize_session_record(record)
    normalized["builder"] = {
        "active": active,
        "step": step,
        "draft": draft or {},
    }
    return normalized


def _builder_state(record: dict[str, Any]) -> dict[str, Any]:
    builder = record.get("builder")
    if isinstance(builder, dict):
        return _normalize_session_record(record)["builder"]
    return _default_builder_record()


def _builder_step_prompt(step: str, profile: dict[str, Any]) -> str:
    prompts = {
        "name": "Send the character name.",
        "age": "Send an adult age of 18 or higher.",
        "gender": "Send gender or pronouns.",
        "style": "Describe the chat style in a few words.",
        "voice": "Describe the voice or delivery.",
        "mood": "Describe the mood.",
        "boundaries": "Describe the boundaries.",
        "opening": "Send the opening line.",
    }

    base = prompts.get(step, "Send the next character detail.")
    current = profile.get(step)

    if current:
        return f"{base} Current: {current}"

    return base


def _start_character_builder(record: dict[str, Any]) -> dict[str, Any]:
    profile = _active_profile(record)
    draft = {field: profile.get(field, "") for field in CHARACTER_FIELDS}
    return _set_builder_state(record, active=True, step="name", draft=draft)


def _advance_character_builder(
    record: dict[str, Any],
    text: str,
) -> tuple[str, dict[str, Any]]:
    builder = _builder_state(record)
    if not builder.get("active"):
        return "", record

    step = str(builder.get("step") or "name")
    draft = dict(builder.get("draft") or {})
    value = text.strip()

    if _clean_text_button(value) in {"cancel", "stop", "reset"}:
        record = _set_builder_state(record, active=False, step=None, draft={})
        return "Character builder cancelled.", record

    if step == "age":
        try:
            age = max(18, int(value))
        except Exception:
            return "Please send an adult age of 18 or higher.", record
        draft[step] = str(age)
    else:
        draft[step] = value

    steps = list(CHARACTER_FIELDS)
    current_index = steps.index(step)

    if current_index >= len(steps) - 1:
        updated = _update_character_overrides(record, draft)
        updated = _set_builder_state(updated, active=False, step=None, draft={})
        profile = _active_profile(updated)
        return (
            f"Character created.\n{_format_character_card(profile)}",
            updated,
        )

    next_step = steps[current_index + 1]
    updated = _set_builder_state(record, active=True, step=next_step, draft=draft)
    profile = _active_profile(updated)

    return _builder_step_prompt(next_step, profile), updated


def _format_character_card(profile: dict[str, Any]) -> str:
    return (
        f"Name: {profile['name']}\n"
        f"Age: {profile['age']}\n"
        f"Gender: {profile['gender']}\n"
        f"Style: {profile['style']}\n"
        f"Voice: {profile['voice']}\n"
        f"Mood: {profile['mood']}\n"
        f"Boundaries: {profile['boundaries']}\n"
        f"Opening: {profile['opening']}"
    )


def _format_menu(record: dict[str, Any]) -> str:
    profile = _active_profile(record)
    memory_status = "on" if _memory_is_enabled(record) else "off"
    mode = _chat_mode_spec(record)

    return (
        f"Current persona: {profile['persona_id']}\n"
        f"Character: {profile['name']} ({profile['age']}, {profile['gender']})\n"
        f"Style: {profile['style']}\n"
        f"Mode: {mode['label']} - {mode['description']}\n"
        f"Memory: {memory_status}\n"
        f"Dataset: {DATASET_ID or 'not connected'}\n\n"
        f"Tap a button below to switch persona, change tone, build a character, or reset the session."
    )


def _build_character_gallery(record: dict[str, Any]) -> str:
    lines = ["Characters:"]

    for persona_id in _persona_choices():
        persona = _resolve_persona(persona_id)
        lines.append(
            f"- {persona['name']} ({persona['age']}): {persona['style']} | {persona['opening']}"
        )

    active = _active_profile(record)
    lines.append("")
    lines.append(f"Active: {active['name']} | mode {_chat_mode_spec(record)['label']}")

    return "\n".join(lines)


def _telegram_persona_button_map() -> dict[str, str]:
    mapping: dict[str, str] = {}

    for persona_id in _persona_choices():
        persona = _resolve_persona(persona_id)
        mapping[_clean_text_button(persona["name"])] = persona_id
        mapping[_clean_text_button(persona_id)] = persona_id

    return mapping


def _telegram_reply_markup(record: dict[str, Any]) -> dict[str, Any]:
    persona_names = [str(_resolve_persona(pid)["name"]) for pid in _persona_choices()]
    mode_buttons = [mode["label"] for mode in CHAT_MODES.values()]
    memory_button = "Memory Off" if _memory_is_enabled(record) else "Memory On"
    builder = _builder_state(record)

    if builder.get("active"):
        return {
            "keyboard": [
                ["Cancel", "Reset", "Menu"],
                ["Skip"],
            ],
            "resize_keyboard": True,
            "is_persistent": True,
            "input_field_placeholder": _builder_step_prompt(
                str(builder.get("step") or "name"),
                _active_profile(record),
            ),
        }

    return {
        "keyboard": [
            ["Menu", "Characters", "Build Character"],
            mode_buttons,
            persona_names,
            [memory_button, "Reset", "Help"],
        ],
        "resize_keyboard": True,
        "is_persistent": True,
        "input_field_placeholder": "Tap a button or send a message",
    }


def _parse_key_values(text: str) -> dict[str, str]:
    parsed: dict[str, str] = {}

    if not text.strip():
        return parsed

    try:
        tokens = shlex.split(text)
    except Exception:
        tokens = text.split()

    for token in tokens:
        if "=" not in token:
            continue
        key, value = token.split("=", 1)
        parsed[key.strip().lower()] = value.strip()

    return parsed


def _update_character_overrides(
    record: dict[str, Any],
    updates: dict[str, Any],
) -> dict[str, Any]:
    normalized = _normalize_session_record(record)

    persona_id = updates.get("persona") or updates.get("preset") or normalized["persona_id"]
    persona_id = persona_id if persona_id in _persona_catalog() else normalized["persona_id"]
    normalized["persona_id"] = persona_id

    if "memory" in updates:
        normalized["memory_enabled"] = str(updates["memory"]).lower() in TRUTHY_VALUES

    custom = dict(normalized.get("custom_character") or {})

    for field in CHARACTER_FIELDS:
        if field not in updates:
            continue

        if field == "age":
            try:
                custom[field] = max(18, int(updates[field]))
            except Exception:
                custom[field] = 18
        else:
            custom[field] = str(updates[field]).strip()

    normalized["custom_character"] = custom
    return normalized


def _switch_persona(record: dict[str, Any], persona_id: str) -> dict[str, Any]:
    persona_id = persona_id.strip()

    if persona_id not in _persona_catalog():
        return record

    normalized = _normalize_session_record(record)
    normalized["persona_id"] = persona_id
    normalized["custom_character"] = {}
    normalized["memory"] = {"summary": "", "turns": []}

    return normalized


def _clean_reply(text: str) -> str:
    reply = str(text or "").strip()

    for marker in ("\nUser:", "\nHuman:", "\nBabble:", "\nAssistant:", "\nFinal:"):
        if marker in reply:
            reply = reply.split(marker, 1)[0].strip()

    reply = re.sub(r"(\([^)]{1,40}\)\s*)\1+", r"\1", reply)

    sentences = re.split(r"(?<=[.!?])\s+", reply)
    cleaned: list[str] = []
    seen: set[str] = set()

    for sentence in sentences:
        key = sentence.lower().strip()
        if key and key not in seen:
            cleaned.append(sentence.strip())
            seen.add(key)

    reply = " ".join(cleaned).strip()

    if not reply:
        raise RuntimeError("EMPTY_REPLY")

    if len(reply) > MAX_REPLY_LENGTH:
        reply = reply[:MAX_REPLY_LENGTH].rsplit(" ", 1)[0].rstrip() + "..."

    return reply


def _is_safe_message(text: str) -> bool:
    normalized = " ".join(text.lower().split())
    return not any(term in normalized for term in BLOCKED_TERMS)


@lru_cache(maxsize=1)
def _get_text_generator():
    if not _is_local_model_enabled():
        raise RuntimeError("LOCAL_MODEL_DISABLED")

    if pipeline is None:
        raise RuntimeError(f"TRANSFORMERS_MISSING: {_TRANSFORMERS_IMPORT_ERROR}")

    logger.info("Loading model: %s", MODEL_ID)

    generator = pipeline(
        "text-generation",
        model=MODEL_ID,
        device=-1,
    )

    logger.info("Model loaded")
    return generator


@lru_cache(maxsize=1)
def _get_dataset():
    if not DATASET_ENABLED or not DATASET_ID:
        return None

    if load_dataset is None:
        raise RuntimeError(f"DATASETS_MISSING: {_DATASETS_IMPORT_ERROR}")

    logger.info("Loading dataset: %s split=%s", DATASET_ID, DATASET_SPLIT)

    kwargs: dict[str, Any] = {"split": DATASET_SPLIT}

    if HF_TOKEN:
        kwargs["token"] = HF_TOKEN

    dataset = load_dataset(DATASET_ID, **kwargs)

    if len(dataset) > DATASET_MAX_ROWS:
        dataset = dataset.select(range(DATASET_MAX_ROWS))

    logger.info("Dataset loaded: %s rows=%s", DATASET_ID, len(dataset))
    return dataset


def _row_to_text(row: Any) -> str:
    if not isinstance(row, dict):
        return str(row)

    preferred_keys = (
        "prompt",
        "instruction",
        "input",
        "chosen",
        "response",
        "output",
        "text",
        "messages",
        "conversation",
    )

    parts: list[str] = []

    for key in preferred_keys:
        value = row.get(key)
        if value is None:
            continue

        if isinstance(value, str):
            parts.append(f"{key}: {value}")
        else:
            try:
                parts.append(f"{key}: {json.dumps(value, ensure_ascii=False)}")
            except Exception:
                parts.append(f"{key}: {value}")

    if not parts:
        try:
            return json.dumps(row, ensure_ascii=False)
        except Exception:
            return str(row)

    return "\n".join(parts)


def _tokenize_for_search(text: str) -> set[str]:
    stopwords = {
        "the",
        "and",
        "you",
        "your",
        "that",
        "this",
        "with",
        "for",
        "are",
        "but",
        "not",
        "was",
        "have",
        "has",
        "had",
        "what",
        "when",
        "where",
        "how",
        "why",
    }

    return {
        token
        for token in re.findall(r"[a-zA-Z0-9']{3,}", text.lower())
        if token not in stopwords
    }


@lru_cache(maxsize=1)
def _dataset_text_index() -> list[str]:
    dataset = _get_dataset()

    if dataset is None:
        return []

    rows: list[str] = []

    for row in dataset:
        text = _row_to_text(row)
        text = " ".join(text.split())
        if text:
            rows.append(text[:DATASET_CONTEXT_CHARS])

    return rows


def _retrieve_dataset_context(user_text: str) -> str:
    if not DATASET_ENABLED or not DATASET_ID:
        return ""

    query_tokens = _tokenize_for_search(user_text)
    if not query_tokens:
        return ""

    rows = _dataset_text_index()
    if not rows:
        return ""

    scored: list[tuple[int, str]] = []

    for row_text in rows:
        row_tokens = _tokenize_for_search(row_text)
        score = len(query_tokens & row_tokens)

        if score > 0:
            scored.append((score, row_text))

    if not scored:
        return ""

    scored.sort(key=lambda item: item[0], reverse=True)
    selected = scored[:DATASET_CONTEXT_ROWS]

    lines = [
        "Dataset style/context examples. Use these for tone and pattern only. Do not quote directly."
    ]

    for index, (_, row_text) in enumerate(selected, start=1):
        lines.append(f"Example {index}: {row_text}")

    return "\n".join(lines)


def _build_prompt(text: str, profile: dict[str, Any], record: dict[str, Any]) -> str:
    mode = _chat_mode_spec(record)

    memory_summary = ""
    recent_block = ""

    if _memory_is_enabled(record):
        summary = _memory_summary(record)
        if summary:
            memory_summary = f"Conversation memory: {summary}\n"
        recent_block = _memory_recent_block(record)

    dataset_context = _retrieve_dataset_context(text)
    dataset_block = ""

    if dataset_context:
        dataset_block = f"\nDataset guidance:\n{dataset_context}\n"

    return (
        f"{SYSTEM_PROMPT}\n\n"
        f"Character:\n"
        f"Name: {profile['name']}\n"
        f"Age: {profile['age']}\n"
        f"Gender: {profile['gender']}\n"
        f"Style: {profile['style']}\n"
        f"Voice: {profile['voice']}\n"
        f"Mood: {profile['mood']}\n"
        f"Boundaries: {profile['boundaries']}\n"
        f"Chat mode: {mode['label']} - {mode['description']}\n"
        f"Reply style: one or two short paragraphs, emotionally present, specific, and conversational.\n"
        f"Do not repeat gestures or sentences. Use at most one action tag.\n"
        f"{memory_summary}"
        f"{recent_block}\n"
        f"{dataset_block}\n"
        f"User: {text}\n"
        f"{profile['name']}:"
    )


def _polish_prompt(draft: str, profile: dict[str, Any], record: dict[str, Any]) -> str:
    mode = _chat_mode_spec(record)

    memory_summary = ""
    if _memory_is_enabled(record):
        summary = _memory_summary(record)
        if summary:
            memory_summary = f"Memory context: {summary}\n"

    return (
        f"{SYSTEM_PROMPT}\n\n"
        f"Rewrite the draft below as the final reply.\n"
        f"Keep the same meaning, persona, tone, and continuity.\n"
        f"Remove repetition, padding, disclaimers, and meta commentary.\n"
        f"Make it feel like natural chat from {profile['name']}.\n"
        f"Chat mode: {mode['label']} - {mode['description']}\n"
        f"Reply target: one or two short paragraphs.\n"
        f"{memory_summary}\n"
        f"Draft:\n{draft}\n\n"
        f"Final:"
    )


def _run_generation(
    prompt: str,
    *,
    max_new_tokens: int,
    do_sample: bool,
    temperature: float,
    top_p: float,
) -> str:
    generator = _get_text_generator()

    tokenizer = getattr(generator, "tokenizer", None)
    eos_id = getattr(tokenizer, "eos_token_id", None) or 0

    generation_args: dict[str, Any] = {
        "max_new_tokens": max_new_tokens,
        "do_sample": do_sample,
        "return_full_text": False,
        "pad_token_id": eos_id,
        "clean_up_tokenization_spaces": False,
        "repetition_penalty": 1.18,
        "no_repeat_ngram_size": 4,
    }

    if do_sample:
        generation_args["temperature"] = temperature
        generation_args["top_p"] = top_p

    result = generator(prompt, **generation_args)
    return _clean_reply(result[0].get("generated_text", ""))


def _generate_response(
    text: str,
    profile: dict[str, Any],
    record: dict[str, Any],
    *,
    raise_on_error: bool = False,
) -> str:
    if not _is_local_model_enabled():
        raise RuntimeError("LOCAL_MODEL_DISABLED")

    try:
        prompt = _build_prompt(text, profile, record)
        draft = _run_generation(
            prompt,
            max_new_tokens=64,
            do_sample=True,
            temperature=float(_chat_mode_spec(record)["temperature"]),
            top_p=float(_chat_mode_spec(record)["top_p"]),
        )

        if RESPONSE_PASSES <= 1:
            return draft

        polish_prompt = _polish_prompt(draft, profile, record)
        return _run_generation(
            polish_prompt,
            max_new_tokens=48,
            do_sample=False,
            temperature=0.0,
            top_p=1.0,
        )

    except Exception as exc:
        logger.exception("Local model generation failed: %s", exc.__class__.__name__)

        if raise_on_error:
            raise

        return f"MODEL_FAILED: {exc.__class__.__name__}: {str(exc)[:160]}"


async def _send_telegram_message(
    chat_id: int,
    text: str,
    reply_markup: dict[str, Any] | None = None,
) -> dict[str, Any]:
    token = (
        os.getenv("TELEGRAM_BOT_TOKEN", "").strip()
        or os.getenv("BOT_TOKEN", "").strip()
    )

    if not token:
        logger.error("TELEGRAM_BOT_TOKEN or BOT_TOKEN is not configured")
        raise HTTPException(
            status_code=503,
            detail="Telegram bot token is not configured",
        )

    timeout = httpx.Timeout(connect=5.0, read=15.0, write=10.0, pool=10.0)

    try:
        async with httpx.AsyncClient(timeout=timeout) as client:
            response = await client.post(
                f"https://api.telegram.org/bot{token}/sendMessage",
                json={
                    "chat_id": chat_id,
                    "text": text,
                    **({"reply_markup": reply_markup} if reply_markup else {}),
                },
            )

        if response.status_code >= 400:
            logger.warning(
                "Telegram API request failed with status %s; using webhook fallback",
                response.status_code,
            )
            payload = {
                "method": "sendMessage",
                "chat_id": chat_id,
                "text": text,
            }
            if reply_markup:
                payload["reply_markup"] = reply_markup
            return payload

        return {
            "ok": True,
            "sent": True,
        }

    except httpx.RequestError as exc:
        logger.warning(
            "Telegram API request failed; using webhook fallback: %s",
            exc.__class__.__name__,
        )
        payload = {
            "method": "sendMessage",
            "chat_id": chat_id,
            "text": text,
        }
        if reply_markup:
            payload["reply_markup"] = reply_markup
        return payload


def _extract_telegram_text(update: dict[str, Any]) -> tuple[str, int | None]:
    message = update.get("message") or update.get("edited_message") or {}
    chat = message.get("chat") or {}
    text = message.get("text") or message.get("caption") or ""
    chat_id = chat.get("id")

    if not isinstance(chat_id, int):
        return str(text or "").strip(), None

    return str(text or "").strip(), chat_id


def _telegram_reply_for_message(
    chat_key: str,
    text: str,
) -> tuple[str, dict[str, Any], dict[str, Any] | None]:
    record = _get_session_record(chat_key)
    profile = _active_profile(record)
    normalized_text = _clean_text_button(text)

    if not text:
        reply = profile.get("opening") or START_RESPONSE
        return reply, record, _telegram_reply_markup(record)

    if normalized_text in {"", "start"}:
        reply = profile.get("opening") or START_RESPONSE
        return reply, record, _telegram_reply_markup(record)

    if normalized_text in {"menu", "help"}:
        return _format_menu(record), record, _telegram_reply_markup(record)

    if normalized_text in {"characters"}:
        return _build_character_gallery(record), record, _telegram_reply_markup(record)

    if normalized_text in {"build character", "new character", "create character"}:
        updated = _start_character_builder(record)
        return (
            "Let’s build a character.\n"
            f"{_builder_step_prompt('name', profile)}",
            updated,
            _telegram_reply_markup(updated),
        )

    if normalized_text in {"cancel"}:
        builder = _builder_state(record)
        if builder.get("active"):
            updated = _set_builder_state(record, active=False, step=None, draft={})
            return "Character builder cancelled.", updated, _telegram_reply_markup(updated)
        return "Nothing to cancel.", record, _telegram_reply_markup(record)

    if normalized_text in {"reset"}:
        updated = _reset_session_record(chat_key)
        updated_profile = _active_profile(updated)
        return (
            f"Session reset to persona {updated_profile['persona_id']}.\n{updated_profile['opening']}",
            updated,
            _telegram_reply_markup(updated),
        )

    if normalized_text in {"memory on", "memory off"}:
        updated = _normalize_session_record(record)
        updated["memory_enabled"] = normalized_text == "memory on"
        updated = _set_session_record(chat_key, updated)
        state_text = "enabled" if updated["memory_enabled"] else "disabled"
        return f"Memory {state_text}.", updated, _telegram_reply_markup(updated)

    mode_key = MODE_BUTTON_LOOKUP.get(normalized_text)
    if mode_key:
        updated = _set_chat_mode(record, mode_key)
        updated = _set_session_record(chat_key, updated)
        mode = _chat_mode_spec(updated)
        return (
            f"Tone set to {mode['label']}. {mode['description']}",
            updated,
            _telegram_reply_markup(updated),
        )

    persona_map = _telegram_persona_button_map()
    if normalized_text in persona_map:
        updated = _switch_persona(record, persona_map[normalized_text])
        updated = _set_session_record(chat_key, updated)
        updated_profile = _active_profile(updated)
        return (
            f"Persona switched to {updated_profile['persona_id']} ({updated_profile['name']}).",
            updated,
            _telegram_reply_markup(updated),
        )

    if normalized_text == "model":
        return f"{MODEL_ID}", record, _telegram_reply_markup(record)

    if normalized_text.startswith("/"):
        if normalized_text == "/persona":
            choices = ", ".join(_persona_choices())
            return (
                f"Current persona: {profile['persona_id']}\n"
                f"Available personas: {choices}",
                record,
                _telegram_reply_markup(record),
            )

        if normalized_text.startswith("/persona "):
            new_persona = text.split(None, 1)[1].strip()
            if new_persona not in _persona_catalog():
                return (
                    f"Unknown persona '{new_persona}'. Available personas: {', '.join(_persona_choices())}",
                    record,
                    _telegram_reply_markup(record),
                )

            updated = _switch_persona(record, new_persona)
            updated = _set_session_record(chat_key, updated)
            updated_profile = _active_profile(updated)
            return (
                f"Persona switched to {updated_profile['persona_id']} ({updated_profile['name']}).",
                updated,
                _telegram_reply_markup(updated),
            )

        if normalized_text == "/character":
            return (
                "Current character:\n"
                f"{_format_character_card(profile)}\n\n"
                "Use the Character button to start a guided builder, or send key=value pairs.",
                record,
                _telegram_reply_markup(record),
            )

        if normalized_text.startswith("/character "):
            raw_args = text.split(None, 1)[1].strip()
            updates = _parse_key_values(raw_args)

            if "age" in updates:
                try:
                    updates["age"] = str(max(18, int(updates["age"])))
                except Exception:
                    updates["age"] = "18"

            updated = _update_character_overrides(record, updates)
            updated = _set_session_record(chat_key, updated)
            updated_profile = _active_profile(updated)
            return (
                f"Character updated.\n{_format_character_card(updated_profile)}",
                updated,
                _telegram_reply_markup(updated),
            )

        if normalized_text == "/reset":
            updated = _reset_session_record(chat_key)
            updated_profile = _active_profile(updated)
            return (
                f"Session reset to persona {updated_profile['persona_id']}.\n{updated_profile['opening']}",
                updated,
                _telegram_reply_markup(updated),
            )

        if normalized_text == "/model":
            return f"{MODEL_ID}", record, _telegram_reply_markup(record)

        if normalized_text == "/dataset":
            if not DATASET_ID:
                return (
                    "No dataset connected. Set DATASET_ID and DATASET_SPLIT.",
                    record,
                    _telegram_reply_markup(record),
                )

            try:
                dataset = _get_dataset()
                return (
                    f"Dataset: {DATASET_ID}\n"
                    f"Split: {DATASET_SPLIT}\n"
                    f"Rows loaded: {len(dataset) if dataset is not None else 0}",
                    record,
                    _telegram_reply_markup(record),
                )
            except Exception as exc:
                return (
                    f"DATASET_FAILED: {exc.__class__.__name__}: {str(exc)[:160]}",
                    record,
                    _telegram_reply_markup(record),
                )

        if normalized_text == "/help":
            return HELP_RESPONSE, record, _telegram_reply_markup(record)

        if normalized_text == "/menu":
            return _format_menu(record), record, _telegram_reply_markup(record)

        if normalized_text == "/start":
            reply = profile.get("opening") or START_RESPONSE
            return reply, record, _telegram_reply_markup(record)

    builder = _builder_state(record)
    if builder.get("active"):
        reply_text, updated = _advance_character_builder(record, text)
        if updated is not record:
            updated = _set_session_record(chat_key, updated)
        return reply_text, updated, _telegram_reply_markup(updated)

    if len(text) > MAX_MESSAGE_LENGTH:
        return (
            f"Message is too long. Please keep it under {MAX_MESSAGE_LENGTH} characters.",
            record,
            _telegram_reply_markup(record),
        )

    if not _is_safe_message(text):
        return SAFE_REFUSAL, record, _telegram_reply_markup(record)

    reply_text = _generate_response(text, profile, record)

    if _memory_is_enabled(record):
        record = _record_turn(record, "user", text)
        record = _record_turn(record, "assistant", reply_text)
        record = _set_session_record(chat_key, record)

    return reply_text, record, _telegram_reply_markup(record)


def _build_menu_text() -> str:
    lines = ["Babble character menu:"]

    for persona_id in _persona_choices():
        persona = _resolve_persona(persona_id)
        lines.append(
            f"- {persona_id}: {persona['name']} | {persona['style']} | age {persona['age']}"
        )

    lines.append("")
    lines.append(f"Available personas: {', '.join(_persona_choices())}")
    lines.append(
        "Use /persona [id] to switch, /character key=value ... to customize, and /reset to clear the session."
    )

    return "\n".join(lines)


def _debug_profile_snapshot() -> dict[str, Any]:
    persona = _resolve_persona(_default_persona_id())
    return _normalize_character_profile(persona)


def _create_ui_state() -> dict[str, Any]:
    return _default_session_record()


def _state_to_form_values(record: dict[str, Any]) -> list[Any]:
    profile = _active_profile(record)
    return [
        gr.update(value=record["persona_id"], choices=_persona_choices()),
        gr.update(value=profile["name"]),
        gr.update(value=profile["age"]),
        gr.update(value=profile["gender"]),
        gr.update(value=profile["style"]),
        gr.update(value=profile["voice"]),
        gr.update(value=profile["mood"]),
        gr.update(value=profile["boundaries"]),
        gr.update(value=profile["opening"]),
        gr.update(value=bool(record.get("memory_enabled", True))),
        gr.update(value=profile),
        gr.update(value=_format_menu(record)),
    ]


def _ui_load_persona(persona_id: str, record: dict[str, Any]) -> tuple[Any, ...]:
    updated = _switch_persona(record, persona_id)
    return (updated, *_state_to_form_values(updated))


def _ui_save_character(
    persona_id: str,
    name: str,
    age: Any,
    gender: str,
    style: str,
    voice: str,
    mood: str,
    boundaries: str,
    opening: str,
    memory_enabled_value: bool,
    record: dict[str, Any],
) -> tuple[Any, ...]:
    updated = _normalize_session_record(record)

    if persona_id in _persona_catalog():
        updated["persona_id"] = persona_id

    updated["custom_character"] = {
        "name": name,
        "age": age,
        "gender": gender,
        "style": style,
        "voice": voice,
        "mood": mood,
        "boundaries": boundaries,
        "opening": opening,
    }
    updated["memory_enabled"] = bool(memory_enabled_value)

    return (updated, *_state_to_form_values(updated))


def _ui_reset_session(record: dict[str, Any]) -> tuple[Any, ...]:
    updated = _default_session_record()
    return (updated, *_state_to_form_values(updated))


def _ui_send_message(
    message: str,
    chat_history: list[dict[str, str]] | None,
    record: dict[str, Any],
) -> tuple[Any, ...]:
    text = str(message or "").strip()
    history = list(chat_history or [])

    if not text:
        return "", history, history, record, _format_menu(record)

    profile = _active_profile(record)
    reply = _generate_response(text, profile, record)

    if _memory_is_enabled(record):
        record = _record_turn(record, "user", text)
        record = _record_turn(record, "assistant", reply)

    history.append({"role": "user", "content": text})
    history.append({"role": "assistant", "content": reply})

    return "", history, history, record, _format_menu(record)


def build_demo():
    if gr is None:
        raise RuntimeError("Gradio is required to run Babble.") from _GRADIO_IMPORT_ERROR

    with gr.Blocks(title="Babble") as demo:
        state = gr.State(_create_ui_state())
        chat_history = gr.State([])

        gr.Markdown("# Babble")
        gr.Markdown(
            "Adult romance-leaning character chat with persona presets, custom character editing, memory, and dataset-guided context."
        )

        with gr.Row():
            with gr.Column(scale=2):
                chatbot = gr.Chatbot(label="Conversation", height=540, type="messages")
                message = gr.Textbox(
                    label="Message",
                    placeholder="Send a test message",
                )
                send = gr.Button("Send")

            with gr.Column(scale=1):
                persona = gr.Dropdown(
                    choices=_persona_choices(),
                    value=_default_persona_id(),
                    label="Persona preset",
                )
                load_persona = gr.Button("Load Persona")
                reset_session = gr.Button("Reset Session")

                name = gr.Textbox(label="Name")
                age = gr.Number(label="Adult age", precision=0)
                gender = gr.Textbox(label="Gender / pronouns")
                style = gr.Textbox(label="Style")
                voice = gr.Textbox(label="Voice")
                mood = gr.Textbox(label="Mood")
                boundaries = gr.Textbox(label="Boundaries")
                opening = gr.Textbox(label="Opening line")
                memory_enabled = gr.Checkbox(label="Memory enabled", value=MEMORY_ENABLED)

                save_character = gr.Button("Save Character")
                character_preview = gr.JSON(label="Active character")
                menu_preview = gr.Textbox(label="Menu", lines=10)
                status = gr.Textbox(label="Session status")

        demo.load(
            fn=lambda record: _state_to_form_values(record),
            inputs=state,
            outputs=[
                persona,
                name,
                age,
                gender,
                style,
                voice,
                mood,
                boundaries,
                opening,
                memory_enabled,
                character_preview,
                menu_preview,
            ],
        )

        load_persona.click(
            fn=_ui_load_persona,
            inputs=[persona, state],
            outputs=[
                state,
                persona,
                name,
                age,
                gender,
                style,
                voice,
                mood,
                boundaries,
                opening,
                memory_enabled,
                character_preview,
                menu_preview,
            ],
        )

        save_character.click(
            fn=_ui_save_character,
            inputs=[
                persona,
                name,
                age,
                gender,
                style,
                voice,
                mood,
                boundaries,
                opening,
                memory_enabled,
                state,
            ],
            outputs=[
                state,
                persona,
                name,
                age,
                gender,
                style,
                voice,
                mood,
                boundaries,
                opening,
                memory_enabled,
                character_preview,
                menu_preview,
            ],
        )

        reset_session.click(
            fn=_ui_reset_session,
            inputs=[state],
            outputs=[
                state,
                persona,
                name,
                age,
                gender,
                style,
                voice,
                mood,
                boundaries,
                opening,
                memory_enabled,
                character_preview,
                menu_preview,
            ],
        )

        send.click(
            fn=_ui_send_message,
            inputs=[message, chat_history, state],
            outputs=[message, chatbot, chat_history, state, menu_preview],
        )

        message.submit(
            fn=_ui_send_message,
            inputs=[message, chat_history, state],
            outputs=[message, chatbot, chat_history, state, menu_preview],
        )

    return demo


def create_app() -> FastAPI:
    @asynccontextmanager
    async def lifespan(app: FastAPI):
        if REQUIRE_MODEL and _is_local_model_enabled():
            logger.info("Preloading model...")
            _get_text_generator()

        if DATASET_ENABLED and DATASET_ID:
            logger.info("Preloading dataset...")
            try:
                _get_dataset()
                _dataset_text_index()
            except Exception:
                logger.exception("Dataset preload failed")

        yield

    fastapi_app = FastAPI(title="Babble", version=APP_VERSION, lifespan=lifespan)

    @fastapi_app.get("/")
    async def root() -> dict[str, Any]:
        return {
            "ok": True,
            "service": "babble",
            "status": "running",
            "version": APP_VERSION,
            "routes": [
                "/health",
                "/model",
                "/dataset",
                "/persona",
                "/menu",
                "/model/test",
                "/debug/config",
                "/debug/model",
            ],
        }

    @fastapi_app.get("/health")
    async def health() -> dict[str, Any]:
        return {
            "ok": True,
            "service": "babble",
            "version": APP_VERSION,
            "model": MODEL_ID,
            "loaded": _get_text_generator.cache_info().currsize > 0,
            "persona": _default_persona_id(),
            "dataset_connected": bool(DATASET_ID),
        }

    @fastapi_app.get("/model")
    async def model() -> dict[str, Any]:
        profile = _debug_profile_snapshot()
        return {
            "model_id": MODEL_ID,
            "enabled": _is_local_model_enabled(),
            "loaded": _get_text_generator.cache_info().currsize > 0,
            "transformers": pipeline is not None,
            "transformers_import_error": (
                None if pipeline is not None else str(_TRANSFORMERS_IMPORT_ERROR)[:300]
            ),
            "persona_id": profile["persona_id"],
            "persona_name": profile["name"],
            "memory_enabled": MEMORY_ENABLED,
            "memory_path": str(MEMORY_PATH),
        }

    @fastapi_app.get("/dataset")
    async def dataset_status() -> dict[str, Any]:
        if not DATASET_ENABLED:
            return {
                "ok": False,
                "enabled": False,
                "error": "DATASET_DISABLED",
            }

        if not DATASET_ID:
            return {
                "ok": False,
                "enabled": True,
                "error": "DATASET_ID missing",
            }

        if load_dataset is None:
            return {
                "ok": False,
                "enabled": True,
                "dataset_id": DATASET_ID,
                "error": "datasets import failed",
                "detail": str(_DATASETS_IMPORT_ERROR)[:300],
            }

        dataset = _get_dataset()
        index = _dataset_text_index()

        return {
            "ok": True,
            "enabled": True,
            "dataset_id": DATASET_ID,
            "split": DATASET_SPLIT,
            "rows_loaded": len(dataset) if dataset is not None else 0,
            "indexed_rows": len(index),
            "columns": dataset.column_names if dataset is not None else [],
            "sample": dataset[0] if dataset is not None and len(dataset) else None,
        }

    @fastapi_app.get("/persona")
    async def persona_menu() -> dict[str, Any]:
        profile = _debug_profile_snapshot()
        return {
            "active_persona": profile,
            "available_personas": {
                persona_id: _resolve_persona(persona_id)
                for persona_id in _persona_choices()
            },
        }

    @fastapi_app.get("/menu")
    async def menu() -> dict[str, str]:
        return {
            "text": _build_menu_text(),
        }

    @fastapi_app.get("/model/test")
    async def test() -> dict[str, Any]:
        profile = _debug_profile_snapshot()
        record = _default_session_record()
        return {
            "reply": _generate_response("Say hello briefly.", profile, record),
            "persona_id": profile["persona_id"],
        }

    @fastapi_app.post("/telegram/webhook/{secret}")
    async def telegram_webhook(secret: str, update: dict[str, Any]) -> dict[str, Any]:
        logger.info("Telegram update received")

        expected_secret = os.getenv("WEBHOOK_SECRET", "").strip()

        if not expected_secret:
            logger.error("WEBHOOK_SECRET is not configured")
            raise HTTPException(
                status_code=503,
                detail="Webhook is not configured",
            )

        if not hmac.compare_digest(secret, expected_secret):
            logger.warning("Rejected webhook request with invalid secret")
            raise HTTPException(
                status_code=403,
                detail="Invalid webhook secret",
            )

        text, chat_id = _extract_telegram_text(update)

        logger.info("Telegram chat_id found: %s", chat_id is not None)
        logger.info("Telegram message text found: %s", bool(text))

        if chat_id is None:
            return {
                "ok": True,
                "ignored": "missing_chat_id",
            }

        reply_text, record, reply_markup = _telegram_reply_for_message(
            _session_key(chat_id),
            text,
        )

        _set_session_record(_session_key(chat_id), record)
        return await _send_telegram_message(chat_id, reply_text, reply_markup)

    @fastapi_app.get("/debug/config")
    async def debug_config() -> dict[str, Any]:
        if not _is_debug_enabled():
            raise HTTPException(status_code=404, detail="Not found")

        profile = _debug_profile_snapshot()

        return {
            "debug": True,
            "service": "babble",
            "version": APP_VERSION,
            "llm_provider": _sanitize_provider(),
            "model_id": MODEL_ID,
            "local_model_enabled": _is_local_model_enabled(),
            "transformers_available": pipeline is not None,
            "transformers_import_error": (
                None if pipeline is not None else str(_TRANSFORMERS_IMPORT_ERROR)[:300]
            ),
            "persona_id": profile["persona_id"],
            "persona_name": profile["name"],
            "persona_count": len(_persona_catalog()),
            "memory_enabled": MEMORY_ENABLED,
            "memory_path": str(MEMORY_PATH),
            "memory_max_turns": MEMORY_MAX_TURNS,
            "telegram_bot_token_configured": (
                _configured("TELEGRAM_BOT_TOKEN") or _configured("BOT_TOKEN")
            ),
            "webhook_secret_configured": _configured("WEBHOOK_SECRET"),
            "llm_api_key_configured": _configured("LLM_API_KEY"),
            "reply_mode": "telegram_direct_send_with_webhook_fallback",
            "dataset_enabled": DATASET_ENABLED,
            "dataset_id": DATASET_ID,
            "dataset_split": DATASET_SPLIT,
            "datasets_available": load_dataset is not None,
            "datasets_import_error": (
                None if load_dataset is not None else str(_DATASETS_IMPORT_ERROR)[:300]
            ),
            "hf_token_configured": bool(HF_TOKEN),
        }

    @fastapi_app.get("/debug/model")
    async def debug_model() -> dict[str, Any]:
        if not _is_debug_enabled():
            raise HTTPException(status_code=404, detail="Not found")

        try:
            profile = _debug_profile_snapshot()
            reply = _generate_response(
                "Say hello in one short sentence.",
                profile,
                _default_session_record(),
                raise_on_error=True,
            )
            return {
                "ok": True,
                "model_id": MODEL_ID,
                "persona_id": profile["persona_id"],
                "reply": reply,
            }
        except Exception as exc:
            logger.exception("Debug model test failed")
            return {
                "ok": False,
                "error": exc.__class__.__name__,
                "detail": str(exc)[:200],
            }

    if gr is None:
        logger.warning("Gradio unavailable; serving API endpoints only")
        return fastapi_app

    return gr.mount_gradio_app(fastapi_app, build_demo(), path="/")


app = create_app()


if __name__ == "__main__":
    import uvicorn

    uvicorn.run(
        app,
        host="0.0.0.0",
        port=int(os.getenv("BABBLE_PORT", os.getenv("PORT", "7860"))),
        log_level=os.getenv("LOG_LEVEL", "info").lower(),
    )