"""
Longshot
========
A writing game played inside a language model's predictions. You build a sentence one
word at a time. At each step you see the model's real top candidate next-words with
their actual probabilities, and you pick one. Your score is the total SURPRISE you
create, measured in bits (-log2 of the probability you chose). Pick what the model
expects and you score nothing; pick its longshots and the sentence turns strange.

Track 2 toy for the "Small Models Big Adventures" hackathon.
Model: openbmb/MiniCPM5-1B (1B, on-device, well under the 32B ceiling).

Why a SMALL model is the point: the game IS the next-token distribution, so it needs
the model's real logits, and a 1B model is fast enough to predict after every single
word AND quirky enough to make fighting its expectations genuinely fun. One forward
pass per word, no GPU required.

Modes: model (real logits) / keeper (a mock distribution, so it always demos).
"""

import os
import math
import html
import inspect
import random

import gradio as gr

_BLOCKS_HAS_CSS = "css" in inspect.signature(gr.Blocks.__init__).parameters
_LAUNCH_HAS_SSR = "ssr_mode" in inspect.signature(gr.Blocks.launch).parameters
_TB_HAS_COPY = "show_copy_button" in inspect.signature(gr.Textbox.__init__).parameters
_COPY = {"show_copy_button": True} if _TB_HAS_COPY else {}

MODEL_ID = os.environ.get("LONGSHOT_MODEL", "openbmb/MiniCPM5-1B")
DEBUG = os.environ.get("LONGSHOT_DEBUG", "").strip().lower() in {"1", "true", "yes"}
MAX_STEPS = int(os.environ.get("LONGSHOT_MAX_STEPS", "24"))
K = 6                                            # candidate words shown per step

SEEDS = ["The old lighthouse keeper", "On the third day of the voyage",
         "Nobody expected the cheese to", "She opened the box and found"]

_PUNCT = set(".,;:!?\u2014\u2026\"')(-")


def _bits(p):
    return -math.log2(max(p, 1e-9))


def label(bits):
    if bits < 18:
        return "Predictable"
    if bits < 42:
        return "Curious"
    if bits < 80:
        return "Eccentric"
    if bits < 140:
        return "Unhinged"
    return "Beyond comprehension"


# ----------------------------------------------------------------- model -------
def _noop_gpu(*a, **k):
    def wrap(fn):
        return fn
    return wrap(a[0]) if a and callable(a[0]) else wrap

if os.environ.get("SPACES_ZERO_GPU", "").lower() in {"true", "1"}:
    try:
        import spaces
        GPU = spaces.GPU
    except Exception:                          # noqa: BLE001
        GPU = _noop_gpu
else:
    GPU = _noop_gpu

_tokenizer = None
_model = None
MODE = "keeper"


def load_model():
    global _tokenizer, _model, MODE
    try:
        import torch
        from transformers import AutoModelForCausalLM, AutoTokenizer
        _tokenizer = AutoTokenizer.from_pretrained(MODEL_ID, trust_remote_code=True)
        _model = AutoModelForCausalLM.from_pretrained(
            MODEL_ID, torch_dtype=torch.float32, trust_remote_code=True)
        _model.eval()
        MODE = "model"
        print(f"[Longshot] Loaded {MODEL_ID} -- model mode (real logits).")
    except Exception as exc:                    # noqa: BLE001
        MODE = "keeper"
        print(f"[Longshot] Could not load {MODEL_ID} ({exc}). Keeper mode active.")


load_model()


@GPU(duration=30)
def _predict_model(text, k=K):
    import torch
    if torch.cuda.is_available() and next(_model.parameters()).device.type != "cuda":
        _model.to("cuda", dtype=torch.bfloat16)
    enc = _tokenizer(text if text else _tokenizer.bos_token or " ",
                     return_tensors="pt").to(_model.device)
    with torch.no_grad():
        logits = _model(**enc).logits[0, -1].float()
    probs = torch.softmax(logits, dim=-1)
    topv, topi = probs.topk(60)
    cands, fallback = [], []
    for p, tid in zip(topv.tolist(), topi.tolist()):
        piece = _tokenizer.decode([int(tid)])
        if not piece or "\ufffd" in piece:
            continue
        st = piece.strip()
        if not st:
            continue
        fallback.append((piece, st, p))
        if piece[:1] == " " or st[0] in _PUNCT or not text:
            cands.append({"piece": piece, "word": st, "p": p})
        if len(cands) >= k:
            break
    if len(cands) < 3:                            # tokenizer gave mostly sub-words
        cands = [{"piece": pc if pc[:1] == " " else " " + s, "word": s, "p": p}
                 for pc, s, p in fallback[:k]]
    return cands


_BANK = ["the", "a", "and", "then", "slowly", "suddenly", "quietly", "because",
         "moon", "door", "whispered", "forgot", "umbrella", "sea", "clockwork",
         "nobody", "almost", "perhaps", "velvet", "thunder", "sang", "river",
         "glass", "remembered", "blue", "forever", "maybe", "stone", "feather", "drifted"]
_KP = [0.30, 0.20, 0.14, 0.10, 0.07, 0.05]


def _keeper_candidates(text, k=K):
    rng = random.Random((text[-40:] or "seed"))
    words = rng.sample(_BANK, min(k, len(_BANK)))
    return [{"piece": " " + w, "word": w, "p": _KP[i % len(_KP)]} for i, w in enumerate(words)]


def next_candidates(text):
    if MODE == "model":
        try:
            cands = _predict_model(text)
            if cands:
                return cands
        except Exception as exc:                # noqa: BLE001
            print(f"[Longshot] predict error: {exc}")
    return _keeper_candidates(text)


# --------------------------------------------------------------- rendering -----
def esc(s):
    return html.escape(str(s))


def base_state():
    return {"text": "", "score": 0.0, "steps": 0, "history": [],
            "started": False, "finished": False, "candidates": []}


def share_text(state):
    return (f'{state["score"]:.0f} bits of surprise ({label(state["score"])}) - '
            f'"{state["text"].strip()}"  · played in Longshot')


def render_stage(state):
    if not state.get("started"):
        return ('<div class="stage empty">Pick an opening below to begin, then build a '
                'sentence the model never saw coming.</div>')
    text = state.get("text", "")
    cursor = "" if state.get("finished") else '<span class="cursor">\u258c</span>'
    story = f'<div class="story">{esc(text)}{cursor}</div>'
    lab = label(state["score"])
    score = (f'<div class="score">Surprise <b>{state["score"]:.1f} bits</b>'
             f'<span class="lab lab-{lab.split()[0].lower()}">{lab}</span></div>')
    if state.get("finished"):
        body = (f'<div class="final">The oracle is <b>{lab.lower()}</b>. '
                f'{state["steps"]} words, {state["score"]:.1f} bits of surprise.</div>')
        return f'<div class="stage">{story}{score}{body}</div>'
    rows = ""
    for idx, c in enumerate(state.get("candidates") or []):
        p = c["p"]
        pct = p * 100
        w = max(3, min(100, round((p ** 0.5) * 100)))
        exp = ' <span class="exp">expected</span>' if idx == 0 else ''
        rows += (f'<div class="cand"><span class="cw">{esc(c["word"])}</span>'
                 f'<span class="bar"><span style="width:{w}%"></span></span>'
                 f'<span class="cp">{pct:.1f}%</span>{exp}</div>')
    ask = ('<div class="ask">Choose the next word below. The longer the bar, the more '
           'the model expects it. The bolder your longshot, the more surprise you score.</div>')
    return f'<div class="stage">{story}{score}{ask}<div class="cands">{rows}</div></div>'


def view(state):
    finished = state.get("finished")
    cands = state.get("candidates") or []
    btns = []
    for i in range(K):
        if not finished and state.get("started") and i < len(cands):
            btns.append(gr.update(value=(cands[i]["word"][:24] or "\u00b7"), visible=True))
        else:
            btns.append(gr.update(visible=False))
    share = (gr.update(value=share_text(state), visible=True) if finished
             else gr.update(value="", visible=False))
    return [render_stage(state)] + btns + [share, state]


# --------------------------------------------------------------- the game ------
def _commit(state, c):
    state["text"] += c["piece"]
    state["score"] += _bits(c["p"])
    state["steps"] += 1
    state["history"].append((c["word"], c["p"]))
    if state["steps"] >= MAX_STEPS:
        state["finished"] = True
        state["candidates"] = []
    else:
        state["candidates"] = next_candidates(state["text"])
    return state


def on_begin(seed):
    seed = (seed or "").strip()
    if not seed:
        return view(base_state())
    state = {"text": seed[:200], "score": 0.0, "steps": 0, "history": [],
             "started": True, "finished": False, "candidates": []}
    state["candidates"] = next_candidates(state["text"])
    return view(state)


def on_pick(i, state):
    state = state or base_state()
    if not state.get("started") or state.get("finished"):
        return view(state)
    cands = state.get("candidates") or []
    if not isinstance(i, int) or i < 0 or i >= len(cands):
        return view(state)
    return view(_commit(state, cands[i]))


def on_longshot(state):
    state = state or base_state()
    cands = state.get("candidates") or []
    if not state.get("started") or state.get("finished") or not cands:
        return view(state)
    least = min(range(len(cands)), key=lambda j: cands[j]["p"])
    return view(_commit(state, cands[least]))


def on_oracle(state):
    state = state or base_state()
    cands = state.get("candidates") or []
    if not state.get("started") or state.get("finished") or not cands:
        return view(state)
    most = max(range(len(cands)), key=lambda j: cands[j]["p"])
    return view(_commit(state, cands[most]))


def on_finish(state):
    state = state or base_state()
    if state.get("started"):
        state["finished"] = True
        state["candidates"] = []
    return view(state)


def on_new():
    return view(base_state())


CSS = """
@import url('https://fonts.googleapis.com/css2?family=Fraunces:ital,opsz,wght@0,9..144,400;0,9..144,600;1,9..144,400&family=Spectral:ital,wght@0,400;0,500;1,400&display=swap');
:root{--paper:#f4eee0;--paper-2:#ece3cf;--ink:#2b2a2e;--ink-soft:#6a6470;
  --violet:#5b4b8a;--rose:#a8456b;--line:#cdbfa6;--gold:#b4892f;}
.gradio-container,.gradio-container.dark,.dark{
  --body-background-fill:transparent;--background-fill-primary:#fffcf4;--background-fill-secondary:#f3ecda;
  --block-background-fill:#fffcf4;--block-border-color:var(--line);--border-color-primary:var(--line);
  --body-text-color:var(--ink);--body-text-color-subdued:var(--ink-soft);
  --block-label-text-color:var(--violet);--block-title-text-color:var(--ink);
  --block-label-background-fill:#ece3cf;--block-title-background-fill:transparent;
  --input-background-fill:#fffcf4;--input-border-color:var(--line);--input-placeholder-color:var(--ink-soft);
  --button-primary-background-fill:var(--violet);--button-primary-background-fill-hover:#493b70;
  --button-primary-text-color:#fbf7ec;--button-primary-border-color:#493b70;
  --button-secondary-background-fill:#ece3cf;--button-secondary-background-fill-hover:#e2d4b6;
  --button-secondary-text-color:var(--ink);--button-secondary-border-color:var(--line);
  --color-accent:var(--rose);--color-accent-soft:#f3dbe4;}
.gradio-container{background:radial-gradient(120% 80% at 80% -10%,#fbf5e6,var(--paper) 55%,var(--paper-2));
  font-family:'Spectral',Georgia,serif !important;color:var(--ink) !important;max-width:880px !important;}
.gradio-container textarea,.gradio-container input[type="text"],.gradio-container input:not([type]){
  background:#fffcf4 !important;color:var(--ink) !important;-webkit-text-fill-color:var(--ink) !important;border-color:var(--line) !important;}
.gradio-container textarea::placeholder,.gradio-container input::placeholder{color:var(--ink-soft) !important;-webkit-text-fill-color:var(--ink-soft) !important;opacity:1;}
.ls-title{font-family:'Fraunces',serif;font-weight:600;font-size:2.6rem;line-height:1;margin:.2rem 0 0;}
.ls-title em{font-style:italic;color:var(--violet);}
.ls-sub{font-style:italic;color:var(--ink-soft);margin:.35rem 0 1rem;font-size:1.05rem;}
.ls-mode{display:inline-block;font-size:.72rem;letter-spacing:.12em;text-transform:uppercase;color:var(--violet);border:1px solid var(--line);border-radius:999px;padding:.15rem .6rem;}
.stage{background:#fffcf4;border:1px solid var(--line);border-radius:16px;padding:20px 22px;box-shadow:0 16px 40px -26px rgba(43,42,46,.7);}
.stage.empty{color:var(--ink-soft);font-style:italic;text-align:center;border-style:dashed;}
.story{font-family:'Fraunces',serif;font-size:1.5rem;line-height:1.5;color:var(--ink);}
.cursor{color:var(--rose);animation:blink 1s steps(2) infinite;font-weight:600;}
@keyframes blink{50%{opacity:0;}}
.score{margin:14px 0 4px;color:var(--ink-soft);}
.score b{color:var(--ink);font-family:'Fraunces',serif;}
.lab{margin-left:10px;font-size:.75rem;letter-spacing:.1em;text-transform:uppercase;border:1px solid var(--line);border-radius:999px;padding:.12rem .55rem;color:var(--violet);}
.lab-eccentric,.lab-unhinged,.lab-beyond{color:var(--rose);border-color:var(--rose);}
.ask{color:var(--ink-soft);font-size:.92rem;margin:10px 0 12px;}
.cands{display:flex;flex-direction:column;gap:7px;}
.cand{display:flex;align-items:center;gap:10px;}
.cand .cw{font-family:'Fraunces',serif;font-weight:600;min-width:120px;color:var(--ink);}
.cand .bar{flex:1;height:12px;background:#efe6d2;border-radius:999px;overflow:hidden;}
.cand .bar span{display:block;height:100%;background:linear-gradient(90deg,var(--violet),var(--rose));}
.cand .cp{min-width:54px;text-align:right;color:var(--ink-soft);font-size:.9rem;}
.cand .exp{font-size:.68rem;letter-spacing:.08em;text-transform:uppercase;color:var(--gold);}
.final{margin-top:10px;font-family:'Fraunces',serif;font-size:1.15rem;color:var(--ink);}
.ls-foot{color:var(--ink-soft);font-size:.82rem;font-style:italic;text-align:center;margin-top:12px;}
footer{display:none !important;}
"""

_bk = {"title": "Longshot"}
if _BLOCKS_HAS_CSS:
    _bk["css"] = CSS
    _bk["theme"] = gr.themes.Soft()

with gr.Blocks(**_bk) as demo:
    state = gr.State(base_state())
    public = "MiniCPM5-1B · real logits" if MODE == "model" else "Longshot"
    mode_label = f"{public}  ·  [{MODE}]" if DEBUG else public
    gr.HTML(f"""
      <div><div class="ls-title">Long<em>shot</em></div>
      <div class="ls-sub">Build a sentence from a model's own predictions. The stranger your path, the higher your score.</div>
      <span class="ls-mode">{mode_label}</span></div>""")

    with gr.Row():
        seed = gr.Textbox(placeholder="an opening line... (The old lighthouse keeper)",
                          show_label=False, scale=8, autofocus=True)
        begin = gr.Button("Begin", variant="primary", scale=2)
    with gr.Row():
        seed_btns = [gr.Button(s, size="sm") for s in SEEDS]

    stage = gr.HTML(render_stage(base_state()))

    with gr.Row():
        pick_btns = [gr.Button("\u00b7", visible=False) for _ in range(K)]
    with gr.Row():
        longshot = gr.Button("🎲 Take the longshot", size="sm")
        oracle = gr.Button("✨ Oracle's pick", size="sm")
        finish = gr.Button("Finish the sentence", size="sm")
        newgame = gr.Button("New game", size="sm")

    share = gr.Textbox(label="Share your sentence", visible=False, interactive=True, **_COPY)
    gr.HTML('<div class="ls-foot">Surprise is measured in bits: choosing a word the model gave a 1-in-4 chance scores 2 bits; a 1-in-100 longshot scores about 6.6.</div>')

    OUT = [stage] + pick_btns + [share, state]
    begin.click(on_begin, seed, OUT)
    seed.submit(on_begin, seed, OUT)
    for sb, s in zip(seed_btns, SEEDS):
        sb.click(on_begin, gr.State(s), OUT)
    for idx, pb in enumerate(pick_btns):
        pb.click(on_pick, [gr.State(idx), state], OUT)
    longshot.click(on_longshot, state, OUT)
    oracle.click(on_oracle, state, OUT)
    finish.click(on_finish, state, OUT)
    newgame.click(on_new, None, OUT)

if __name__ == "__main__":
    _lk = {}
    if not _BLOCKS_HAS_CSS:
        _lk["css"] = CSS
        _lk["theme"] = gr.themes.Soft()
    if _LAUNCH_HAS_SSR:
        _lk["ssr_mode"] = False
    demo.queue(max_size=24).launch(**_lk)