"""The Void -- Buleyean RL.

PyTorch vs Aether. Same model. Different engines. Let the speed speak.
"""

import json
import os
import select
import subprocess
import time
import urllib.error
import urllib.request
from concurrent.futures import ThreadPoolExecutor, as_completed

import gradio as gr
import torch
from transformers import AutoModelForCausalLM, AutoTokenizer

# ─── Start Aether sidecar ────────────────────────────────────────────────────
print("[Void] Starting Aether inference server...", flush=True)
aether_proc = subprocess.Popen(
    ["node", "aether-server.mjs"],
    env={**os.environ, "AETHER_PORT": "7861"},
    stdout=subprocess.PIPE,
    stderr=subprocess.STDOUT,
)

# ─── Load PyTorch model ──────────────────────────────────────────────────────
print("[Void] Loading PyTorch base model...", flush=True)
base_tokenizer = AutoTokenizer.from_pretrained("HuggingFaceTB/SmolLM2-360M-Instruct")
base_model = AutoModelForCausalLM.from_pretrained(
    "HuggingFaceTB/SmolLM2-360M-Instruct",
    torch_dtype=torch.float32,
    device_map="cpu",
)
print("[Void] PyTorch model ready.", flush=True)

# Wait for Aether: poll /health once per second for up to 180s, echoing any
# sidecar log output while we wait so startup problems are visible.
print("[Void] Waiting for Aether...", flush=True)
for attempt in range(180):
    try:
        req = urllib.request.Request("http://127.0.0.1:7861/health")
        resp = urllib.request.urlopen(req, timeout=2)
        health = json.loads(resp.read())
        if health.get("status") == "ok" and health.get("model") == "loaded":
            print(
                f"[Void] Aether ready (loaded in {health.get('loadTime')}ms, "
                f"SIMD: {health.get('simd')})",
                flush=True,
            )
            break
    except Exception:
        # Server not up yet (connection refused / timeout) — keep polling.
        pass
    # Drain pending sidecar stdout without blocking (select with 0 timeout).
    if aether_proc.stdout and select.select([aether_proc.stdout], [], [], 0)[0]:
        line = aether_proc.stdout.readline()
        if line:
            print(f" {line.decode().strip()}", flush=True)
    time.sleep(1)
else:
    # for/else: only reached if the loop never hit `break`.
    print("[Void] WARNING: Aether not ready after 180s", flush=True)


def gen_pytorch(prompt):
    """Generate a completion with the PyTorch baseline model.

    Returns ``(text, elapsed_seconds, new_tokens, ms_per_token)``;
    ``ms_per_token`` is 0 when no tokens were generated.
    """
    messages = [{"role": "user", "content": prompt}]
    chat_text = base_tokenizer.apply_chat_template(
        messages, tokenize=False, add_generation_prompt=True
    )
    inputs = base_tokenizer(chat_text, return_tensors="pt")
    t0 = time.perf_counter()
    with torch.no_grad():
        outputs = base_model.generate(
            **inputs,
            max_new_tokens=256,
            temperature=0.7,
            top_p=0.9,
            do_sample=True,
            pad_token_id=base_tokenizer.eos_token_id,
        )
    elapsed = time.perf_counter() - t0
    prompt_len = inputs["input_ids"].shape[1]
    n = outputs.shape[1] - prompt_len
    # Decode only the newly generated portion of the sequence.
    completion = base_tokenizer.decode(
        outputs[0][prompt_len:], skip_special_tokens=True
    ).strip()
    return completion, elapsed, n, (elapsed * 1000 / n) if n > 0 else 0


def gen_aether(prompt):
    """Generate a completion via the Aether HTTP sidecar.

    Returns ``(text, elapsed_seconds, tokens, ms_per_token)``. On failure the
    text carries a bracketed error message and the numeric fields are zeroed,
    so callers never see an exception.
    """
    try:
        data = json.dumps({"prompt": prompt, "max_tokens": 256}).encode()
        req = urllib.request.Request(
            "http://127.0.0.1:7861/generate",
            data=data,
            headers={"Content-Type": "application/json"},
        )
        resp = urllib.request.urlopen(req, timeout=300)
        r = json.loads(resp.read())
        return r["text"], r["totalTimeMs"] / 1000, r["tokens"], r["avgTokenMs"]
    except urllib.error.HTTPError as e:
        body = e.read().decode() if e.fp else str(e)
        try:
            # The server reports errors as JSON {"error": ...} when it can.
            detail = json.loads(body).get("error", body[:300])
        except Exception:
            detail = body[:300]
        return f"[Aether error: {detail}]", 0, 0, 0
    except Exception as e:
        return f"[Aether error: {e}]", 0, 0, 0


def _fmt_stats(result):
    """Format one (text, seconds, tokens, ms/token) result as a stats line."""
    _, tm, tk, ms = result
    return f"{tk} tokens in {tm:.1f}s ({ms:.0f}ms/tok)"


def compare(prompt):
    """Run both engines concurrently and stream results as each finishes.

    Yields ``(base_text, aether_text, base_stats, aether_stats)`` tuples:
    one partial update per engine completion, then a final combined tuple.
    """
    if not prompt or not prompt.strip():
        yield "", "", "", ""
        return

    # Single-element lists act as mutable cells the worker threads write into.
    base_result = [None]
    aether_result = [None]

    def run_base():
        base_result[0] = gen_pytorch(prompt)

    def run_aether():
        aether_result[0] = gen_aether(prompt)

    with ThreadPoolExecutor(max_workers=2) as pool:
        futures = {pool.submit(run_base): "base", pool.submit(run_aether): "aether"}
        for future in as_completed(futures):
            name = futures[future]
            future.result()  # re-raise any worker exception here
            if name == "base" and base_result[0]:
                at = aether_result[0][0] if aether_result[0] else "generating..."
                ast = _fmt_stats(aether_result[0]) if aether_result[0] else "running..."
                yield base_result[0][0], at, _fmt_stats(base_result[0]), ast
            elif name == "aether" and aether_result[0]:
                bt = base_result[0][0] if base_result[0] else "generating..."
                bst = _fmt_stats(base_result[0]) if base_result[0] else "running..."
                yield bt, aether_result[0][0], bst, _fmt_stats(aether_result[0])

    # Final update with both results once the pool has drained.
    if base_result[0] and aether_result[0]:
        yield (
            base_result[0][0],
            aether_result[0][0],
            _fmt_stats(base_result[0]),
            _fmt_stats(aether_result[0]),
        )


CSS = """
.gradio-container { max-width: 1060px !important; margin: 0 auto !important; }
.gradio-container, .dark { background: #09090b !important; }
#hero { text-align: center; padding: 2rem 0 1rem; }
#hero h1 { font-size: 2.5rem; font-weight: 300; letter-spacing: -0.02em; color: #fafafa; margin: 0; }
#hero .subtitle { color: #71717a; font-size: 0.95rem; margin-top: 0.5rem; }
#hero .accent { color: #3b82f6; }
.response-card { background: #0c0c0f !important; border: 1px solid #1f1f23 !important; border-radius: 8px !important; }
.response-card textarea { background: #0c0c0f !important; border: none !important; color: #e4e4e7 !important; font-size: 0.95rem !important; line-height: 1.6 !important; }
.base-label { color: #71717a !important; font-size: 0.8rem !important; text-transform: uppercase !important; letter-spacing: 0.05em !important; font-weight: 500 !important; }
.void-label { color: #3b82f6 !important; font-size: 0.8rem !important; text-transform: uppercase !important; letter-spacing: 0.05em !important; font-weight: 500 !important; }
.stats-text { font-family: 'SF Mono', 'Fira Code', monospace !important; font-size: 0.8rem !important; color: #52525b !important; }
#prompt-input > label > span { display: none !important; }
#prompt-input textarea { background: #111114 !important; border: 1px solid #1f1f23 !important; border-radius: 8px !important; color: #fafafa !important; font-size: 1rem !important; padding: 1rem !important; }
#prompt-input textarea:focus { border-color: #3b82f6 !important; box-shadow: 0 0 0 2px rgba(59,130,246,0.1) !important; }
#gen-btn { background: #3b82f6 !important; border: none !important; border-radius: 8px !important; font-weight: 500 !important; font-size: 0.9rem !important; padding: 0.75rem 2rem !important; }
#gen-btn:hover { background: #2563eb !important; }
.prompt-chip { background: #111114 !important; border: 1px solid #1f1f23 !important; border-radius: 6px !important; color: #a1a1aa !important; font-size: 0.85rem !important; }
.prompt-chip:hover { border-color: #3b82f6 !important; color: #fafafa !important; }
#footer { text-align: center; padding: 2rem 0; border-top: 1px solid #1f1f23; margin-top: 2rem; }
#footer p { color: #52525b; font-size: 0.8rem; }
#footer a { color: #3b82f6; text-decoration: none; }
footer.svelte-1ax1toq { display: none !important; }
.built-with { display: none !important; }
"""

with gr.Blocks(
    css=CSS,
    theme=gr.themes.Base(primary_hue="blue", neutral_hue="zinc"),
    title="The Void",
) as demo:
    # NOTE(review): the HTML tags inside every gr.HTML() literal were lost in
    # extraction; the markup below is reconstructed from the CSS selectors and
    # the surviving text content — confirm against the deployed page.
    gr.HTML(
        """
        <div id="hero">
            <h1>The <span class="accent">Void</span></h1>
            <p class="subtitle">PyTorch vs Aether. Same prompt. Different engines. Live inference.</p>
            <p class="subtitle">Left: standard PyTorch CPU. Right: Aether -- pure JS + 14KB WASM SIMD, zero ML dependencies.</p>
        </div>
        """
    )

    prompt = gr.Textbox(
        elem_id="prompt-input",
        placeholder="What would you like to ask?",
        lines=2,
        label="Prompt",
        show_label=False,
        interactive=True,
    )
    btn = gr.Button("Generate", elem_id="gen-btn", variant="primary")

    with gr.Row(equal_height=True):
        with gr.Column():
            gr.HTML('<div class="base-label">PyTorch (standard)</div>')
            base_out = gr.Textbox(
                lines=10,
                show_label=False,
                interactive=False,
                elem_classes=["response-card"],
            )
            base_stats = gr.HTML('<div class="stats-text">--</div>')
        with gr.Column(min_width=30):
            gr.HTML('<div class="base-label">VS</div>')
        with gr.Column():
            gr.HTML('<div class="void-label">Aether (our engine)</div>')
            aether_out = gr.Textbox(
                lines=10,
                show_label=False,
                interactive=False,
                elem_classes=["response-card"],
            )
            aether_stats = gr.HTML('<div class="stats-text">--</div>')

    def run_compare(prompt_text):
        """Stream compare() tuples, wrapping stats strings in styled HTML."""
        for bt, at, bs, ast in compare(prompt_text):
            yield (
                bt,
                at,
                f'<div class="stats-text">{bs}</div>',
                f'<div class="stats-text">{ast}</div>',
            )

    btn.click(run_compare, [prompt], [base_out, aether_out, base_stats, aether_stats])
    prompt.submit(
        run_compare, [prompt], [base_out, aether_out, base_stats, aether_stats]
    )

    gr.HTML('<div class="base-label">Try these:</div>')
    with gr.Row():
        for p in [
            "hello",
            "How are you feeling?",
            "I've been anxious lately.",
            "Write a haiku about failure.",
            "What is the meaning of life?",
        ]:
            # `x=p` binds the chip text at definition time (avoids the
            # late-binding-closure pitfall in this loop).
            gr.Button(p, size="sm", elem_classes=["prompt-chip"]).click(
                fn=lambda x=p: x, outputs=[prompt]
            ).then(
                fn=run_compare,
                inputs=[prompt],
                outputs=[base_out, aether_out, base_stats, aether_stats],
            )

    # NOTE(review): the footer HTML content was lost in extraction; this
    # placeholder keeps the #footer styles wired up — restore original copy.
    gr.HTML('<div id="footer"></div>')

if __name__ == "__main__":
    demo.launch(server_name="0.0.0.0", server_port=7860)