Spaces:

angkit007
/

hackathon

Sleeping

App Files Files Community

hackathon / app_single.py

angkit007

renamed

f0a208d 12 days ago

Raw

History Blame Contribute Delete

48.9 kB

	"""
	app_single.py — MiniCPM-V 4.6 · An Adventure in Thousand Token Wood
	=====================================================================
	A storybook playground: MiniCPM-V reads an uploaded image like a page
	from an adventure, then a woodland cat performs its mood in a forest
	clearing — complete with a tiny generative tune.

	Pipeline:
	1. Upload image → MiniCPM-V streams a description
	2. Model returns a JSON dance spec (mood + 6 numeric animation params)
	3. The cat performs in the clearing using those exact params — every
	move is model-determined, not hardcoded.
	4. A free, generative melody (Web Audio API, no audio files) plays
	along — tempo and register also derived from the model's params.

	Dance params returned by model:
	mood : one of 10 mood words
	speed : animation cycle seconds (0.3 fast … 3.0 slow)
	jump : vertical bounce px (0 … 60)
	sway : body rotation degrees (0 … 20)
	tail_speed : tail cycle seconds (0.2 … 3.0)
	tail_range : tail swing degrees (5 … 200)
	ear_tilt : ear rotation degrees (0 … 25)

	Two backends — switchable in the UI:
	• API (default) — calls the hosted MiniCPM-V 4.6 API. Needs internet.
	• Local (offline) — downloads openbmb/MiniCPM-V-4 (4.1B, Apache-2.0) once,
	caches it to ./model_cache/, then runs fully offline.
	Requires: pip install torch transformers accelerate

	Run locally:
	pip install -r requirements.txt
	python app_single.py
	→ open http://localhost:7860

	Optional: set your own API key so you're not on the shared public quota
	Windows (PowerShell): $env:MINICPM_API_KEY="sk-..."
	macOS / Linux: export MINICPM_API_KEY="sk-..."
	"""

	import base64, io, os, json, re
	import gradio as gr
	from openai import OpenAI, APIStatusError, APIConnectionError
	from PIL import Image

	# ── Config ────────────────────────────────────────────────────────────────────
	# Base URL handed to the OpenAI client in _client().
	API_BASE_URL = "https://api.modelbest.cn/v1"
	# NOTE(review): fallback credential committed in source. _resolve_key() only
	# uses it when neither MINICPM_API_KEY nor the UI field supplies a key.
	PUBLIC_API_KEY = "sk-pQ8L2zF3XmR5kY9wV4jB7hN1tC6vM0xG3aD5sH2bJ9lK4cZ8"

	# UI label -> model name sent in the chat-completions request.
	MODELS = {
	    "⚡ Instruct (fast, direct)": "MiniCPM-V-4.6-Instruct",
	    "🧠 Thinking (reasons first)": "MiniCPM-V-4.6-Thinking",
	}

	# Defaults for the description request.
	DEFAULT_PROMPT = "Describe this image in detail."
	DEFAULT_MAX_TOKENS = 512
	DEFAULT_TEMPERATURE = 0.7
	# JPEG quality used by pil_to_data_url() when encoding the upload.
	IMAGE_QUALITY = 90

	# Moods offered to the model and accepted back from it. Every label here has
	# a MOOD_PALETTE entry and a DEFAULT_DANCE entry; "depressed" is not listed
	# because it has neither and would be drawn with the "neutral" palette.
	MOOD_LABELS = [
	    "happy", "sad", "calm", "energetic", "mysterious",
	    "romantic", "tense", "nostalgic", "angry", "neutral",
	]

	# Example prompts as one-column rows: each inner list holds a single string.
	PROMPT_EXAMPLES = [
	    [example_prompt]
	    for example_prompt in (
	        "Describe this image in detail.",
	        "List every object you can see.",
	        "What is the mood or atmosphere of this image?",
	        "What text, if any, appears in this image?",
	        "Explain this image to someone who cannot see it.",
	    )
	]

	# ── Mood palettes — each mood is a "firefly color" in the wood ────────────────
	# scale: semitone offsets from root (a small mode/scale per mood)
	# root : MIDI-ish base note number (we map to Hz with 440 * 2^((n-69)/12))
	# Per-mood look and sound. Colour keys feed the cat's CSS, "particle" is the
	# glyph scattered around the cat, "label"/"caption" are shown on the stage,
	# and "scale"/"root" drive the generated tune.
	MOOD_PALETTE = {
	    "happy": {"bg":"#1a1605","body":"#FFD166","detail":"#E8A23A","eye":"#2D1B00","nose":"#FF8A3D","pcol":"#FFE08A","particle":"✦","label":"Happy","caption":"Bouncing with joy", "scale":[0,2,4,7,9,12], "root":72},
	    "sad": {"bg":"#0c1116","body":"#8AA0B2","detail":"#5D7A8E","eye":"#1A2530","nose":"#B7C7D2","pcol":"#A9C8E0","particle":"·","label":"Sad","caption":"Slow, heavy steps", "scale":[0,3,5,7,10,12], "root":60},
	    "calm": {"bg":"#0a1614","body":"#6FBFB3","detail":"#4A9C8F","eye":"#0A2018","nose":"#A8E0D6","pcol":"#BFEDE4","particle":"○","label":"Calm","caption":"Drifting at ease", "scale":[0,2,5,7,9,12], "root":64},
	    "energetic": {"bg":"#1a0e05","body":"#FF8A5B","detail":"#E8623A","eye":"#1a0500","nose":"#FFD1BC","pcol":"#FFCB6B","particle":"★","label":"Energetic","caption":"Can't sit still", "scale":[0,2,4,5,7,9,11,12],"root":71},
	    "mysterious": {"bg":"#120c1a","body":"#A98BD6","detail":"#6D4FA8","eye":"#F0B8FF","nose":"#D9C2EE","pcol":"#C7B3F0","particle":"✧","label":"Mysterious","caption":"Slipping through shadow", "scale":[0,1,4,5,7,8,11,12],"root":62},
	    "romantic": {"bg":"#1a0c12","body":"#F2A0BD","detail":"#D9648D","eye":"#1a0010","nose":"#FBE0EA","pcol":"#F7B8CE","particle":"♥","label":"Romantic","caption":"A slow, dreamy waltz", "scale":[0,2,4,7,9,12], "root":67},
	    # The particle was written as "\|" (an invalid escape that keeps the
	    # backslash); the intended glyph is a plain vertical bar.
	    "tense": {"bg":"#100808","body":"#F0726E","detail":"#C03C38","eye":"#FFB3AE","nose":"#F7C7C4","pcol":"#F2A6A2","particle":"|","label":"Tense","caption":"Coiled and alert", "scale":[0,1,3,6,7,10,12], "root":61},
	    "nostalgic": {"bg":"#160f06","body":"#F2C083","detail":"#D98A3D","eye":"#160f06","nose":"#FBE3C7","pcol":"#F7DDB5","particle":"◦","label":"Nostalgic","caption":"Rocking to old memories", "scale":[0,2,3,7,9,12], "root":65},
	    "angry": {"bg":"#160505","body":"#F0635E","detail":"#A8201C","eye":"#FF6961","nose":"#F7B0AC","pcol":"#F58F8A","particle":"✸","label":"Angry","caption":"Stomping, full of fire", "scale":[0,1,3,5,6,8,10,12],"root":59},
	    "neutral": {"bg":"#0e0f13","body":"#A6ADB8","detail":"#727A86","eye":"#0d0d18","nose":"#D8DDE3","pcol":"#C7CDD6","particle":"·","label":"Neutral","caption":"Steady and unhurried", "scale":[0,2,4,7,9,12], "root":64},
	}

	# ── Default dance specs (fallback if model call fails) ────────────────────────
	# Column order for the rows below; also the key order of every dance dict.
	_DANCE_FIELDS = ("speed", "jump", "sway", "tail_speed", "tail_range", "ear_tilt")

	# One hand-tuned row per mood, used when no model-chosen spec is available.
	DEFAULT_DANCE = {
	    mood_name: dict(zip(_DANCE_FIELDS, row))
	    for mood_name, row in (
	        ("happy",      (0.7,  50, 6,  0.4,  200, 8)),
	        ("sad",        (2.4,  2,  8,  2.5,  30,  15)),
	        ("calm",       (2.8,  10, 2,  3.2,  35,  3)),
	        ("energetic",  (0.3,  30, 15, 0.28, 180, 15)),
	        ("mysterious", (2.0,  15, 5,  1.8,  100, 5)),
	        ("romantic",   (1.6,  12, 5,  1.6,  65,  3)),
	        ("tense",      (0.4,  3,  3,  0.4,  10,  12)),
	        ("nostalgic",  (2.2,  6,  6,  2.0,  65,  5)),
	        ("angry",      (0.38, 18, 5,  0.32, 160, 20)),
	        ("neutral",    (2.0,  8,  1,  2.2,  30,  2)),
	    )
	}

	# ── Helpers ───────────────────────────────────────────────────────────────────
	def pil_to_data_url(image):
	    """Encode an image as a base64 JPEG ``data:`` URL.

	    The image is converted to RGB, saved as JPEG at ``IMAGE_QUALITY`` into an
	    in-memory buffer, and the bytes are base64-encoded into the URL.
	    """
	    jpeg_buffer = io.BytesIO()
	    image.convert("RGB").save(jpeg_buffer, format="JPEG", quality=IMAGE_QUALITY)
	    encoded = base64.b64encode(jpeg_buffer.getvalue()).decode()
	    return f"data:image/jpeg;base64,{encoded}"

	def _resolve_key(ui_key):
	    """Choose the API key to use.

	    Priority: the MINICPM_API_KEY environment variable, then the key typed
	    into the UI, then PUBLIC_API_KEY. Blank or whitespace-only values are
	    treated as missing.
	    """
	    env_key = os.environ.get("MINICPM_API_KEY", "").strip()
	    if env_key:
	        return env_key
	    typed_key = (ui_key or "").strip()
	    if typed_key:
	        return typed_key
	    return PUBLIC_API_KEY

	def _client(ui_key):
	    """Build an OpenAI client for API_BASE_URL using the resolved API key."""
	    resolved_key = _resolve_key(ui_key)
	    return OpenAI(base_url=API_BASE_URL, api_key=resolved_key)

	# ── Description (streaming) ───────────────────────────────────────────────────
	def stream_description(image, prompt, model_label, max_tokens, temperature, api_key):
	    """Stream the hosted model's answer about ``image``.

	    Yields the accumulated reply text each time a new piece arrives, so every
	    yielded value is the full text so far.

	    Nothing is raised to the caller: a missing image yields one "⚠️" notice,
	    and any API or other failure yields one message starting with "❌".

	    Args:
	        image: uploaded image (passed to pil_to_data_url), or None.
	        prompt: user question sent alongside the image.
	        model_label: key into MODELS selecting the model name.
	        max_tokens: completion token limit forwarded to the API.
	        temperature: sampling temperature forwarded to the API.
	        api_key: key typed in the UI; see _resolve_key for precedence.
	    """
	    if image is None:
	        yield "⚠️ Please upload an image first."
	        return
	    try:
	        stream = _client(api_key).chat.completions.create(
	            model=MODELS[model_label],
	            messages=[{"role": "user", "content": [
	                {"type": "image_url", "image_url": {"url": pil_to_data_url(image)}},
	                {"type": "text", "text": prompt},
	            ]}],
	            max_tokens=max_tokens, temperature=temperature, stream=True,
	        )
	        result = ""
	        for chunk in stream:
	            # A chunk may arrive with an empty `choices` list (for example a
	            # usage-only chunk). Indexing it would raise IndexError and the
	            # handler below would overwrite the streamed text with an error.
	            if not chunk.choices:
	                continue
	            delta = chunk.choices[0].delta.content or ""
	            if delta:
	                result += delta
	                yield result
	    except APIStatusError as e:
	        yield f"❌ API error {e.status_code}: {e.message}"
	    except APIConnectionError:
	        yield "❌ Cannot reach api.modelbest.cn"
	    except Exception as e:
	        # UI boundary: surface anything unexpected as text instead of crashing.
	        yield f"❌ {e}"

	# ── Model-driven dance spec ───────────────────────────────────────────────────
	# Instruction text for the choreography request: asks the model for a bare
	# JSON object holding a mood (the MOOD_LABELS list is interpolated below) and
	# six numeric animation parameters. Doubled braces are literal braces in the
	# f-string, not placeholders.
	DANCE_SYSTEM_PROMPT = f"""You are a cat dance choreographer AI.
	Given a scene description, return ONLY a valid JSON object — no prose, no markdown, no code fences.

	JSON schema (all fields required):
	{{
	"mood": one of {MOOD_LABELS},
	"speed": float 0.3–3.0 (animation cycle seconds; lower = faster),
	"jump": int 0–60 (vertical bounce in pixels),
	"sway": int 0–20 (body rotation degrees),
	"tail_speed": float 0.2–3.0 (tail cycle seconds),
	"tail_range": int 5–200 (tail swing degrees),
	"ear_tilt": int 0–25 (ear tilt degrees)
	}}

	Choose values that physically match the scene mood. An energetic scene should have
	low speed (fast), high jump, high sway. A calm scene should have high speed (slow),
	low jump, low sway. Be creative — the cat's whole body expresses the image's emotion."""

	# (mood, keyword stems) in priority order — the first mood with a hit wins.
	_MOOD_KEYWORDS = [
	    ("happy", ["happy", "joy", "celebrate", "laugh", "smile", "bright", "sunny"]),
	    ("sad", ["sad", "lonely", "rain", "sorrow", "grief", "cry", "gloom"]),
	    ("energetic", ["energetic", "vibrant", "excited", "dynamic", "rush", "active"]),
	    ("calm", ["calm", "peaceful", "quiet", "gentle", "serene", "still"]),
	    ("mysterious", ["mysterious", "dark", "eerie", "shadow", "mystic", "fog"]),
	    ("romantic", ["romantic", "love", "tender", "intimate", "warm", "soft"]),
	    ("tense", ["tense", "anxious", "fear", "alarm", "nervous", "danger"]),
	    ("nostalgic", ["nostalgic", "memory", "vintage", "old", "past", "retro"]),
	    ("angry", ["angry", "furious", "rage", "fierce", "storm"]),
	]

	# A stem must start a word: "rainy" and "laughing" still match, but "gold"
	# is no longer read as "old" nor "unhappy" as "happy".
	_MOOD_PATTERNS = [
	    (mood, re.compile(r"\b(?:" + "|".join(map(re.escape, stems)) + ")"))
	    for mood, stems in _MOOD_KEYWORDS
	]


	def _keyword_mood(description: str) -> str:
	    """Guess a mood from keywords in ``description``.

	    Used as the fallback when the model's JSON dance spec is unavailable.
	    Matching is case-insensitive and anchored at word starts. Returns the
	    first mood in priority order with a matching stem, or "neutral" when
	    nothing matches (including empty or None input).
	    """
	    text = (description or "").lower()
	    for mood, pattern in _MOOD_PATTERNS:
	        if pattern.search(text):
	            return mood
	    return "neutral"

	def _parse_dance_reply(raw, allowed_moods):
	    """Convert a model reply into ``(mood, dance_params)``.

	    Tolerates prose or code fences around the JSON by parsing only the text
	    between the first "{" and the last "}". A mood outside ``allowed_moods``
	    becomes "neutral". Each numeric field is clamped to its range; a missing
	    or non-numeric field falls back to that field's default rather than
	    discarding the whole spec.

	    Raises:
	        ValueError: when the reply holds no decodable JSON object
	            (json.JSONDecodeError is a ValueError subclass).
	    """
	    start, end = raw.find("{"), raw.rfind("}")
	    if start == -1 or end < start:
	        raise ValueError("no JSON object in model reply")
	    spec = json.loads(raw[start:end + 1])

	    mood = str(spec.get("mood", "neutral")).strip().lower()
	    if mood not in allowed_moods:
	        mood = "neutral"

	    def clamp(key, low, high, default, cast):
	        # Strings such as "fast" and JSON null fall back to the default.
	        try:
	            value = float(spec.get(key, default))
	        except (TypeError, ValueError):
	            value = float(default)
	        return cast(max(low, min(high, value)))

	    dance = {
	        "speed": clamp("speed", 0.3, 3.0, 1.5, float),
	        "jump": clamp("jump", 0, 60, 10, int),
	        "sway": clamp("sway", 0, 20, 5, int),
	        "tail_speed": clamp("tail_speed", 0.2, 3.0, 1.5, float),
	        "tail_range": clamp("tail_range", 5, 200, 40, int),
	        "ear_tilt": clamp("ear_tilt", 0, 25, 5, int),
	    }
	    return mood, dance


	def get_dance_spec(description: str, api_key: str) -> tuple[str, dict]:
	    """Ask the hosted model for a dance spec matching ``description``.

	    Returns ``(mood, dance_params)``. An empty description, or one that is
	    itself a "⚠️"/"❌" status message, gets the neutral default without an
	    API call. If the request or the parsing fails for any reason, the mood
	    is guessed from keywords and that mood's DEFAULT_DANCE row is returned.
	    """
	    if not description or description.startswith(("⚠️", "❌")):
	        return "neutral", DEFAULT_DANCE["neutral"]
	    try:
	        resp = _client(api_key).chat.completions.create(
	            model="MiniCPM-V-4.6-Instruct",
	            messages=[
	                {"role": "system", "content": DANCE_SYSTEM_PROMPT},
	                {"role": "user", "content": f"Scene description:\n{description[:800]}"},
	            ],
	            max_tokens=120, temperature=0.3,
	        )
	        # `content` may be None; treat that as an empty reply.
	        reply = resp.choices[0].message.content or ""
	        return _parse_dance_reply(reply, MOOD_LABELS)
	    except Exception:
	        # Deliberate best-effort: the cat should always get some dance.
	        mood = _keyword_mood(description)
	        return mood, DEFAULT_DANCE[mood]


	# ━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━
	# OFFLINE / LOCAL BACKEND
	# ━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━
	# Runs entirely on this machine, no internet required after first download.
	# Model : openbmb/MiniCPM-V-4 (4.1B params, Apache-2.0, fully public)
	# Cache : ./model_cache/ (weights) + .download_complete (sentinel)
	#
	# Heavy deps (torch, transformers) are imported lazily — only when the
	# user actually selects the Local backend — so API-only users don't need
	# them installed.

	from pathlib import Path

	# Model identifier passed to from_pretrained() by the local backend.
	LOCAL_MODEL_ID = "openbmb/MiniCPM-V-4"
	# Weights are cached in a folder beside this file; the sentinel file inside
	# it marks a completed download.
	LOCAL_CACHE_DIR = Path(__file__).parent.joinpath("model_cache")
	LOCAL_SENTINEL = LOCAL_CACHE_DIR.joinpath(".download_complete")

	# Filled in by _load_local_model() on first use; None until then.
	_local_model = _local_tokenizer = None

	def local_is_cached() -> bool:
	    """Return True when the download-complete sentinel file exists."""
	    sentinel_present = LOCAL_SENTINEL.exists()
	    return sentinel_present

	def local_cache_size_gb() -> float:
	    """Return the combined size of all files under the cache directory.

	    The result is in units of 1e9 bytes; 0.0 when the directory is missing.
	    """
	    if not LOCAL_CACHE_DIR.exists():
	        return 0.0
	    total_bytes = 0
	    for entry in LOCAL_CACHE_DIR.rglob("*"):
	        if entry.is_file():
	            total_bytes += entry.stat().st_size
	    return total_bytes / 1e9

	def local_status_md() -> str:
	    """Return a one-line Markdown status for the local model cache.

	    Reports the cached size once the sentinel exists; otherwise explains
	    that the model will be downloaded on first use.
	    """
	    if not local_is_cached():
	        return (f"⬇️ Not downloaded yet — `{LOCAL_MODEL_ID}` (~8 GB) will be "
	                f"fetched on first use and cached in `model_cache/`. "
	                f"Requires internet for this one-time download.")
	    size_gb = local_cache_size_gb()
	    return (f"✅ Model cached — `{LOCAL_MODEL_ID}` "
	            f"({size_gb:.1f} GB) ready to run offline.")

	def _load_local_model():
	"""
	Load the local model and tokenizer once and cache them in module globals.

	torch and transformers are imported inside this function, so they are only
	needed when the local backend is actually used. Files are read from
	LOCAL_CACHE_DIR; when the download sentinel is absent, from_pretrained is
	allowed to fetch them, and the sentinel is written after a successful load.

	Returns:
	(model, tokenizer) — the same objects on every later call.

	Raises:
	RuntimeError: if torch or transformers cannot be imported.
	"""
	global _local_model, _local_tokenizer
	# Already loaded in this process — reuse the cached pair.
	if _local_model is not None:
	return _local_model, _local_tokenizer

	try:
	import torch
	import transformers
	from transformers import AutoModel, AutoTokenizer
	except ImportError as e:
	# Re-raise with an install hint; callers show the message in the UI.
	raise RuntimeError(
	"Local backend requires extra packages.\n"
	"Install with:\n"
	" pip install torch transformers accelerate\n"
	f"(original error: {e})"
	)

	# transformers v5 broke MiniCPM-V-4's custom code (all_tied_weights_keys)
	# Only the major/minor parts of the version string are compared.
	_tv = tuple(int(x) for x in transformers.__version__.split(".")[:2])
	if _tv >= (5, 0):
	from transformers import modeling_utils as _mu
	_orig_getattr = getattr(_mu.PreTrainedModel, "__getattr__", None)
	# Replacement __getattr__: answers `all_tied_weights_keys` with an empty
	# dict and defers every other name to the original hook, if there was one.
	def _safe_getattr(self, name):
	if name == "all_tied_weights_keys":
	return {}
	if _orig_getattr is not None:
	return _orig_getattr(self, name)
	raise AttributeError(name)
	# NOTE(review): this patches the class for the whole process, and would
	# be applied again if a previous load attempt failed after this point.
	_mu.PreTrainedModel.__getattr__ = _safe_getattr

	LOCAL_CACHE_DIR.mkdir(parents=True, exist_ok=True)
	# With the sentinel present, load strictly from disk.
	local_only = local_is_cached()

	# Keyword arguments shared by the tokenizer and model loads.
	common = dict(
	trust_remote_code=True,
	cache_dir=str(LOCAL_CACHE_DIR),
	local_files_only=local_only,
	)

	_local_tokenizer = AutoTokenizer.from_pretrained(LOCAL_MODEL_ID, **common)

	# float16 on CUDA, float32 on CPU.
	device = "cuda" if torch.cuda.is_available() else "cpu"
	dtype = torch.float16 if device == "cuda" else torch.float32

	_local_model = AutoModel.from_pretrained(
	LOCAL_MODEL_ID,
	torch_dtype=dtype,
	attn_implementation="sdpa",
	device_map="auto" if device == "cuda" else None,
	low_cpu_mem_usage=True,
	**common,
	)
	# No device_map was given on CPU, so place the model explicitly.
	if device == "cpu":
	_local_model = _local_model.to(device)
	_local_model.eval()

	# Mark the download as complete only after both loads succeeded.
	if not local_only:
	LOCAL_SENTINEL.write_text(f"{LOCAL_MODEL_ID} downloaded.\nDelete to re-download.\n")

	return _local_model, _local_tokenizer

	def stream_description_local(image, prompt, max_tokens, temperature):
	    """Describe ``image`` with the local model; the counterpart of stream_description.

	    Despite being a generator, it yields exactly once: the complete reply,
	    a "⚠️" notice when no image was given, or a "❌" message on failure.
	    """
	    if image is None:
	        yield "⚠️ Please upload an image first."
	        return
	    try:
	        model, tokenizer = _load_local_model()
	        conversation = [{"role": "user", "content": [image.convert("RGB"), prompt]}]
	        chat_kwargs = dict(
	            image=image.convert("RGB"),
	            msgs=conversation,
	            tokenizer=tokenizer,
	            # Temperature 0 means greedy decoding; the floor keeps the
	            # temperature argument strictly positive either way.
	            sampling=(temperature > 0),
	            temperature=max(temperature, 0.01),
	            max_new_tokens=max_tokens,
	        )
	        yield model.chat(**chat_kwargs)
	    except RuntimeError as err:
	        # Includes the "extra packages" error raised by _load_local_model.
	        yield f"❌ {err}"
	    except Exception as err:
	        yield f"❌ Local inference error: {err}"

	def get_dance_spec_local(description: str) -> tuple[str, dict]:
	    """Ask the local model for a dance spec matching ``description``.

	    Returns ``(mood, dance_params)``. An empty description, or one that is
	    itself a "⚠️"/"❌" status message, gets the neutral default without
	    running the model. If loading, inference or parsing fails, the mood is
	    guessed from keywords and that mood's DEFAULT_DANCE row is returned.
	    """
	    if not description or description.startswith(("⚠️", "❌")):
	        return "neutral", DEFAULT_DANCE["neutral"]
	    try:
	        model, tokenizer = _load_local_model()
	        msgs = [{"role": "user", "content": [
	            DANCE_SYSTEM_PROMPT + f"\n\nScene description:\n{description[:800]}"
	        ]}]
	        raw = model.chat(
	            image=None, msgs=msgs, tokenizer=tokenizer,
	            sampling=False, max_new_tokens=150,
	        )

	        # The reply may wrap the JSON in prose or code fences; parse only the
	        # text between the first "{" and the last "}".
	        raw = raw or ""
	        start, end = raw.find("{"), raw.rfind("}")
	        if start == -1 or end < start:
	            raise ValueError("no JSON object in model reply")
	        spec = json.loads(raw[start:end + 1])

	        mood = str(spec.get("mood", "neutral")).strip().lower()
	        if mood not in MOOD_LABELS:
	            mood = "neutral"

	        def clamp(key, low, high, default, cast):
	            # A missing or non-numeric field keeps its default instead of
	            # throwing away the rest of the spec.
	            try:
	                value = float(spec.get(key, default))
	            except (TypeError, ValueError):
	                value = float(default)
	            return cast(max(low, min(high, value)))

	        dance = {
	            "speed": clamp("speed", 0.3, 3.0, 1.5, float),
	            "jump": clamp("jump", 0, 60, 10, int),
	            "sway": clamp("sway", 0, 20, 5, int),
	            "tail_speed": clamp("tail_speed", 0.2, 3.0, 1.5, float),
	            "tail_range": clamp("tail_range", 5, 200, 40, int),
	            "ear_tilt": clamp("ear_tilt", 0, 25, 5, int),
	        }
	        return mood, dance
	    except Exception:
	        # Deliberate best-effort: the cat should always get some dance.
	        mood = _keyword_mood(description)
	        return mood, DEFAULT_DANCE[mood]


	# ── Keyword dance for text-only tab (no API needed) ───────────────────────────
	def generate_animation(text: str) -> str:
	    """Render the cat stage for free text using keyword matching only.

	    No model call is made. The first mood whose keyword starts a word in
	    ``text`` wins, and that mood's DEFAULT_DANCE row drives the animation.
	    Empty, None or unmatched text renders the neutral cat.
	    """
	    lowered = (text or "").lower()
	    keyword_table = [
	        ("happy", ["happy", "celebrate", "party", "joy", "cheerful"]),
	        ("sad", ["sad", "lonely", "rain", "grief", "sorrow"]),
	        ("energetic", ["energy", "dance", "excited", "lively"]),
	        ("calm", ["calm", "peace", "serene", "gentle", "quiet"]),
	        ("mysterious", ["mysterious", "eerie", "dark", "shadow"]),
	        ("romantic", ["romantic", "love", "tender", "warm"]),
	        ("tense", ["tense", "nervous", "anxiety", "fear"]),
	        ("nostalgic", ["nostalgic", "memory", "vintage", "old"]),
	        ("angry", ["angry", "furious", "rage", "fierce"]),
	    ]
	    # Anchor stems at word starts so "gold" is not read as "old" nor
	    # "unhappy" as "happy"; inflections such as "dancing" still match.
	    mood = next(
	        (
	            candidate
	            for candidate, stems in keyword_table
	            if re.search(r"\b(?:" + "|".join(map(re.escape, stems)) + ")", lowered)
	        ),
	        "neutral",
	    )
	    return cat_html(mood, DEFAULT_DANCE[mood])

	# ── Stage chrome — shared studio frame ────────────────────────────────────────
	# CSS font-family stacks interpolated into the stage markup.
	STAGE_FONT = "'Space Grotesk', 'Inter', system-ui, sans-serif"  # headings, captions
	LABEL_FONT = "'Inter', system-ui, sans-serif"  # body copy
	MONO_FONT = "'JetBrains Mono', 'SFMono-Regular', Consolas, monospace"  # cue text, chips

	def _stage_open(spotlight_color: str, breathe_speed: float = 4.0) -> str:
	"""
	Return the opening markup of a stage card: the `<div class="stage">` tag
	followed by a `<style>` element with the shared stage CSS.

	The div is left open; callers append their content and then the closing
	tag from _stage_close().

	Args:
	spotlight_color: CSS colour stored in the `--spot` custom property, which
	the stage gradients and the cue dot read.
	breathe_speed: duration in seconds of the `spot_breathe` animation.

	The stylesheet defines .stage, .stage-cue, .stage-caption, .cue-sheet,
	.cue-chip and .music-toggle.
	"""
	return f"""<div class="stage" style="--spot:{spotlight_color};">
	<style>
	@import url('https://fonts.googleapis.com/css2?family=Space+Grotesk:wght@500;700&family=Inter:wght@400;500;600&family=JetBrains+Mono:wght@400;500&display=swap');

	.stage {{
	position:relative; height:440px; border-radius:12px;
	overflow:hidden; isolation:isolate;
	background:
	radial-gradient(ellipse 70% 50% at 50% 22%, color-mix(in srgb, var(--spot) 14%, transparent), transparent 70%),
	#F8F9FA;
	border:1px solid #E5E7EB;
	display:flex; flex-direction:column; align-items:center; justify-content:center;
	font-family:{STAGE_FONT};
	}}
	@keyframes spot_breathe {{
	0%,100% {{ opacity:.7; }}
	50% {{ opacity:1; }}
	}}
	.stage::before {{
	content:''; position:absolute; inset:0; pointer-events:none;
	background: radial-gradient(ellipse 45% 36% at 50% 18%, color-mix(in srgb, var(--spot) 18%, transparent), transparent 72%);
	animation: spot_breathe {breathe_speed}s ease-in-out infinite;
	}}
	/* faint dot-grid texture, HF-card style */
	.stage::after {{
	content:''; position:absolute; inset:0; pointer-events:none; opacity:.5;
	background-image: radial-gradient(circle, #E5E7EB 1px, transparent 1px);
	background-size: 22px 22px;
	}}

	.stage-cue {{
	position:absolute; top:16px; left:0; right:0;
	display:flex; align-items:center; justify-content:center; gap:8px;
	font-family:{MONO_FONT};
	font-size:.68rem; letter-spacing:.16em; text-transform:uppercase;
	color:#6B7280; font-weight:500; z-index:3;
	}}
	.stage-cue .dot {{
	width:8px; height:8px; border-radius:50%;
	background:var(--spot); box-shadow:0 0 0 3px color-mix(in srgb, var(--spot) 25%, transparent);
	}}
	.stage-cue .mood-name {{
	color:#111827; font-weight:700; letter-spacing:.1em;
	font-family:{MONO_FONT};
	background:#FFFFFF; border:1px solid #E5E7EB;
	border-radius:999px; padding:2px 10px;
	}}

	.stage-caption {{
	position:absolute; bottom:62px; left:0; right:0; text-align:center; z-index:3;
	color:#4B5563; font-size:.92rem; letter-spacing:.01em; font-style:italic;
	font-family:{STAGE_FONT}; font-weight:500;
	}}

	.cue-sheet {{
	position:absolute; bottom:14px; left:0; right:0; z-index:3;
	display:flex; justify-content:center; gap:8px; flex-wrap:wrap;
	padding:0 20px;
	}}
	.cue-chip {{
	font-family:{MONO_FONT}; font-size:.64rem; letter-spacing:.03em;
	color:#374151; background:#FFFFFF; border:1px solid #E5E7EB;
	border-radius:999px; padding:3px 10px; white-space:nowrap;
	box-shadow: 0 1px 2px rgba(0,0,0,.03);
	}}
	.cue-chip b {{ color:#92660C; font-weight:600; }}

	/* ── music toggle button ── */
	.music-toggle {{
	position:absolute; top:14px; right:14px; z-index:4;
	width:36px; height:36px; border-radius:50%;
	background:#FFFFFF; border:1px solid #E5E7EB;
	display:flex; align-items:center; justify-content:center;
	cursor:pointer; font-size:1rem; color:#374151;
	box-shadow: 0 1px 2px rgba(0,0,0,.04);
	transition: transform .15s ease, background .15s ease, box-shadow .15s ease;
	}}
	.music-toggle:hover {{
	transform: scale(1.06);
	box-shadow: 0 2px 8px rgba(0,0,0,.08);
	}}
	.music-toggle.playing {{
	background: #FFD21E;
	border-color: #FFD21E;
	color:#111827;
	}}
	.music-toggle .icon-play {{ display:inline; }}
	.music-toggle .icon-pause {{ display:none; }}
	.music-toggle.playing .icon-play {{ display:none; }}
	.music-toggle.playing .icon-pause {{ display:inline; }}
	</style>
	"""

	def _stage_close() -> str:
	    """Return the closing tag for the stage div opened by _stage_open()."""
	    closing_tag = "</div>"
	    return closing_tag

	# ── Cat stage — all parts stay inside the stage, nothing can overflow ─────────
	def cat_html(mood: str, dance: dict) -> str:
	    """Render the animated cat stage for ``mood`` as an HTML string.

	    The markup contains the stage chrome, CSS keyframes built from the dance
	    numbers, the cat's DOM, and a script that scatters particles and plays a
	    generated tune through the Web Audio API when the music button is clicked.

	    Args:
	        mood: key into MOOD_PALETTE; unknown moods use the "neutral" palette.
	        dance: dict with the keys "speed", "jump", "sway", "tail_speed",
	            "tail_range" and "ear_tilt" (all required).

	    Returns:
	        The complete stage markup, from the opening div to its closing tag.
	    """
	    p = MOOD_PALETTE.get(mood, MOOD_PALETTE["neutral"])
	    B = p["body"]
	    D = p["detail"]
	    E = p["eye"]
	    N = p["nose"]
	    sp = dance["speed"]
	    jp = dance["jump"]
	    sw = dance["sway"]
	    tsp = dance["tail_speed"]
	    tr = dance["tail_range"]
	    et = dance["ear_tilt"]

	    # The tail swings between t0 and t1, roughly centred on upright.
	    t0 = -tr // 2
	    t1 = tr // 2
	    # Spotlight breathing follows the dance speed, kept within 2–6 seconds.
	    breathe = max(2.0, min(6.0, sp * 2))
	    # NOTE(review): this id depends only on the mood and the wrapper id "cw"
	    # is fixed, so two stages on one page can share ids — confirm whether
	    # more than one stage is ever rendered at once.
	    stage_id = f"stage_{mood}"

	    # ── music params derived from dance spec ──
	    scale = p["scale"]
	    root = p["root"]
	    # tempo: faster dance (low sp) -> faster notes. Map sp [0.3,3.0] -> note interval [140,520]ms
	    note_ms = int(140 + (sp - 0.3) / (3.0 - 0.3) * (520 - 140))
	    # register: higher jump -> notes climb higher (octave shift 0,1,2)
	    octave_shift = 12 * min(2, jp // 25)
	    note_root = root + octave_shift

	    cue_chips = (
	        f'<span class="cue-chip">speed <b>{sp}s</b></span>'
	        f'<span class="cue-chip">jump <b>{jp}px</b></span>'
	        f'<span class="cue-chip">sway <b>{sw}°</b></span>'
	        f'<span class="cue-chip">tail <b>{tsp}s / {tr}°</b></span>'
	        f'<span class="cue-chip">ears <b>{et}°</b></span>'
	    )

	    # In the script below, the angle expression and the logical-OR operators
	    # must be real JavaScript: a missing `*` or an escaped `\|` is a syntax
	    # error that stops the particles and the music button from working.
	    return _stage_open(B, breathe) + f"""
	<style>
	@keyframes K_body {{
	0%,100% {{ transform: translateY(0px) rotate(-{sw}deg); }}
	50% {{ transform: translateY(-{jp}px) rotate({sw}deg); }}
	}}
	@keyframes K_tail {{
	0%,100% {{ transform: rotate({t0}deg); }}
	50% {{ transform: rotate({t1}deg); }}
	}}
	@keyframes K_ear {{
	0%,100% {{ transform: rotate(-{et}deg); }}
	50% {{ transform: rotate({et}deg); }}
	}}
	@keyframes K_blink {{
	0%,88%,100% {{ transform: scaleY(1); }}
	93% {{ transform: scaleY(0.08); }}
	}}
	@keyframes K_shadow {{
	0%,100% {{ transform: translateX(-50%) scaleX(1); opacity:.45; }}
	50% {{ transform: translateX(-50%) scaleX({max(0.4, 1 - jp/80):.2f}); opacity:.15; }}
	}}
	@keyframes K_part {{
	0% {{ opacity:0; transform:translate(0,0) scale(.5); }}
	20% {{ opacity:.9; }}
	80% {{ opacity:.4; }}
	100% {{ opacity:0; transform:translate(var(--px),var(--py)) scale(1.5); }}
	}}

	.cat-wrap {{ position:relative; width:160px; height:200px; z-index:2; }}

	.cat-shadow {{
	position:absolute; bottom:-4px; left:50%;
	width:72px; height:11px; border-radius:50%;
	background:rgba(0,0,0,.55);
	animation: K_shadow {sp}s ease-in-out infinite;
	}}

	.cat-unit {{
	position:absolute; bottom:0; left:50%;
	transform-origin: center bottom;
	animation: K_body {sp}s ease-in-out infinite;
	}}

	.c-body {{
	position:absolute; bottom:0; left:-36px;
	width:72px; height:62px;
	border-radius:52% 52% 46% 46%;
	background:{B};
	box-shadow:inset -6px -5px 0 {D};
	}}
	.c-belly {{
	position:absolute; bottom:5px; left:50%; transform:translateX(-50%);
	width:40px; height:30px; border-radius:50%;
	background:{D}28;
	}}

	.c-tail {{
	position:absolute; bottom:4px; left:22px;
	width:16px; height:52px;
	border-radius:38% 62% 55% 45% / 28% 28% 72% 72%;
	background:{B};
	box-shadow:inset 3px 0 0 {D};
	transform-origin:bottom center;
	animation:K_tail {tsp}s ease-in-out infinite;
	}}
	.c-tail::after {{
	content:'';
	position:absolute; top:-9px; left:-5px;
	width:26px; height:18px; border-radius:50%;
	background:{B};
	box-shadow:inset 2px -2px 0 {D};
	}}

	.c-paw-l,.c-paw-r {{
	position:absolute; bottom:0;
	width:22px; height:13px;
	border-radius:50% 50% 42% 42%;
	background:{B};
	box-shadow:inset -2px -2px 0 {D};
	}}
	.c-paw-l {{ left:-34px; }}
	.c-paw-r {{ left:12px; }}

	.c-head {{
	position:absolute; bottom:56px; left:-32px;
	width:64px; height:58px; border-radius:50%;
	background:{B};
	box-shadow:inset -4px -3px 0 {D};
	overflow:visible;
	}}

	.c-ear-l,.c-ear-r {{
	position:absolute;
	width:0; height:0;
	border-left:11px solid transparent;
	border-right:11px solid transparent;
	border-bottom:21px solid {B};
	animation:K_ear {sp}s ease-in-out infinite;
	}}
	.c-ear-l {{ top:-16px; left:2px; transform-origin:bottom left; }}
	.c-ear-r {{ top:-16px; left:40px; transform-origin:bottom right; }}
	.c-ear-l::after,.c-ear-r::after {{
	content:'';position:absolute;top:5px;left:-6px;
	width:0;height:0;
	border-left:6px solid transparent;
	border-right:6px solid transparent;
	border-bottom:13px solid {D};
	}}

	.c-eye-l,.c-eye-r {{
	position:absolute;
	width:12px; height:12px; border-radius:50%;
	background:{E};
	animation:K_blink 3.5s ease-in-out infinite;
	}}
	.c-eye-l {{ top:18px; left:8px; }}
	.c-eye-r {{ top:18px; left:44px; animation-delay:.2s; }}
	.c-eye-l::after,.c-eye-r::after {{
	content:'';position:absolute;top:2px;left:2px;
	width:5px;height:5px;border-radius:50%;
	background:rgba(255,255,255,.32);
	}}

	.c-nose {{
	position:absolute; top:32px; left:27px;
	width:10px; height:7px;
	border-radius:50% 50% 40% 40%;
	background:{N};
	transform:translateX(-50%);
	}}

	.c-mouth-l,.c-mouth-r {{
	position:absolute;
	width:8px; height:5px;
	border:0 solid {N};
	border-bottom-width:1.5px;
	border-radius:0 0 50% 50%;
	top:38px;
	}}
	.c-mouth-l {{ left:21px; border-left-width:1.5px; transform:rotate(10deg); }}
	.c-mouth-r {{ left:30px; border-right-width:1.5px; transform:rotate(-10deg); }}

	.c-wl1,.c-wl2,.c-wr1,.c-wr2 {{
	position:absolute; height:1.5px;
	background:rgba(255,255,255,.5); border-radius:1px;
	width:28px;
	}}
	.c-wl1 {{ top:29px; right:37px; transform:rotate(-10deg); transform-origin:right; }}
	.c-wl2 {{ top:35px; right:37px; transform:rotate( 10deg); transform-origin:right; }}
	.c-wr1 {{ top:29px; left:37px; transform:rotate( 10deg); transform-origin:left; }}
	.c-wr2 {{ top:35px; left:37px; transform:rotate(-10deg); transform-origin:left; }}

	.c-particle {{
	position:absolute; pointer-events:none;
	color:{D}; font-size:.9rem;
	opacity:0;
	animation:K_part var(--pd) var(--pde) ease-out infinite;
	}}
	</style>

	<div class="stage-cue">
	<span class="dot"></span>
	<span class="mood-name">{p['label']}</span>
	<span> · live emotion</span>
	</div>

	<button class="music-toggle" id="music_{stage_id}" title="Play the generated tune" aria-label="Toggle music">
	<span class="icon-play">♪</span><span class="icon-pause">⏸</span>
	</button>

	<div class="cat-wrap" id="cw">
	<div class="cat-shadow"></div>
	<div class="cat-unit">
	<div class="c-tail"></div>
	<div class="c-body"><div class="c-belly"></div></div>
	<div class="c-paw-l"></div>
	<div class="c-paw-r"></div>
	<div class="c-head">
	<div class="c-ear-l"></div>
	<div class="c-ear-r"></div>
	<div class="c-eye-l"></div>
	<div class="c-eye-r"></div>
	<div class="c-nose"></div>
	<div class="c-mouth-l"></div>
	<div class="c-mouth-r"></div>
	<div class="c-wl1"></div>
	<div class="c-wl2"></div>
	<div class="c-wr1"></div>
	<div class="c-wr2"></div>
	</div>
	</div>
	</div>

	<div class="stage-caption">{p['caption']}</div>
	<div class="cue-sheet">{cue_chips}</div>

	<script>
	(function(){{
	const wrap = document.getElementById('cw');
	const chars = '{p['particle']}'.split('');
	for(let i=0;i<22;i++){{
	const el = document.createElement('div');
	el.className = 'c-particle';
	el.textContent = chars[i % chars.length];
	const a = Math.random()*Math.PI*2, d = 50+Math.random()*75;
	el.style.setProperty('--px', (Math.cos(a)*d)+'px');
	el.style.setProperty('--py', (Math.sin(a)*d-20)+'px');
	el.style.setProperty('--pd', (.9+Math.random()*2).toFixed(2)+'s');
	el.style.setProperty('--pde',(Math.random()*2.5).toFixed(2)+'s');
	el.style.left = (55+Math.random()*50)+'px';
	el.style.top = (40+Math.random()*80)+'px';
	el.style.fontSize = (.55+Math.random()*.65).toFixed(2)+'rem';
	wrap.appendChild(el);
	}}

	// ── Generative tune — Web Audio, no files ──
	const scale = {scale};
	const noteRoot= {note_root};
	const noteMs = {note_ms};
	const mood = "{mood}";

	let ctx = null, timer = null, step = 0, master = null;

	function midiToFreq(n) {{ return 440 * Math.pow(2, (n - 69) / 12); }}

	function pattern(stepIdx) {{
	// simple per-mood arpeggio shapes over the scale degrees
	const len = scale.length;
	let degree;
	if (mood === 'energetic' || mood === 'angry') {{
	degree = scale[stepIdx % len]; // straight run, bright
	}} else if (mood === 'sad' || mood === 'nostalgic') {{
	degree = scale[[0,2,1,3][stepIdx % 4] % len]; // gentle up-down
	}} else if (mood === 'mysterious' || mood === 'tense') {{
	degree = scale[[0,3,1,5][stepIdx % 4] % len]; // wider, uneasy leaps
	}} else {{
	degree = scale[[0,1,2,1][stepIdx % 4] % len]; // calm/happy/romantic/calm lilt
	}}
	return noteRoot + degree;
	}}

	function playNote() {{
	if (!ctx) return;
	const midi = pattern(step);
	const freq = midiToFreq(midi);
	const t0 = ctx.currentTime;

	const osc = ctx.createOscillator();
	const gain = ctx.createGain();
	osc.type = (mood === 'angry' || mood === 'energetic') ? 'sawtooth'
	: (mood === 'mysterious' || mood === 'tense') ? 'triangle'
	: 'sine';
	osc.frequency.setValueAtTime(freq, t0);

	const dur = noteMs / 1000 * 0.9;
	gain.gain.setValueAtTime(0.0001, t0);
	gain.gain.exponentialRampToValueAtTime(0.18, t0 + 0.02);
	gain.gain.exponentialRampToValueAtTime(0.0001, t0 + dur);

	osc.connect(gain).connect(master);
	osc.start(t0);
	osc.stop(t0 + dur + 0.02);

	step = (step + 1) % 16;
	}}

	const btn = document.getElementById('music_{stage_id}');
	btn.addEventListener('click', function(){{
	if (!ctx) {{
	ctx = new (window.AudioContext || window.webkitAudioContext)();
	master = ctx.createGain();
	master.gain.value = 0.5;
	master.connect(ctx.destination);
	}}
	if (timer) {{
	clearInterval(timer); timer = null;
	ctx.suspend();
	btn.classList.remove('playing');
	}} else {{
	ctx.resume();
	playNote();
	timer = setInterval(playNote, {note_ms});
	btn.classList.add('playing');
	}}
	}});
	}})();
	</script>""" + _stage_close()

	def placeholder_html():
	    """Return the idle stage shown before any image has been analysed."""
	    message = f"""
	<div style="text-align:center; z-index:2; color:#6B7280; font-family:{STAGE_FONT};">
	<div style="font-size:2.4rem; margin-bottom:14px; opacity:.6;">🐱</div>
	<div style="font-size:1.05rem; font-weight:700; letter-spacing:.01em; color:#111827; margin-bottom:8px;">
	No emotion yet
	</div>
	<div style="font-size:.82rem; color:#6B7280; max-width:280px; margin:0 auto; line-height:1.7; font-family:{LABEL_FONT};">
	Upload an image — the model reads its mood and the cat performs it,
	tune and all.
	</div>
	</div>"""
	    return _stage_open("#FFD21E", 6.0) + message + _stage_close()

	def loading_html(local: bool = False) -> str:
	    """Return the spinner stage shown while a request is in flight.

	    ``local`` switches the title and caption to the on-device wording.
	    """
	    if local:
	        title = "Running locally…"
	        caption = "on-device inference — first run may take a while"
	    else:
	        title = "Analyzing image…"
	        caption = "choreographing the emotion"
	    spinner = f"""
	<div style="text-align:center; z-index:2; color:#6B7280; font-family:{STAGE_FONT};">
	<div class="loading-spinner" style="
	width:32px; height:32px; margin:0 auto 16px;
	border:3px solid #E5E7EB; border-top-color:#FFD21E;
	border-radius:50%; animation: spin 0.9s linear infinite;"></div>
	<div style="font-size:.92rem; letter-spacing:.01em; color:#111827; font-weight:700;">
	{title}
	</div>
	<div style="font-size:.78rem; color:#6B7280; margin-top:4px; font-family:{LABEL_FONT};">
	{caption}
	</div>
	</div>
	<style>@keyframes spin {{ to {{ transform: rotate(360deg); }} }}</style>"""
	    return _stage_open("#FFD21E", 2.0) + spinner + _stage_close()

	# ── Main pipeline ─────────────────────────────────────────────────────────────
	def run_image_pipeline(image, prompt, model_label, max_tokens, temperature, api_key, backend):
	    """Run describe-then-choreograph for one image, yielding UI updates.

	    Every yield is a ``(description_text, stage_html)`` pair. The loading
	    stage is shown from the first yield until the description is complete;
	    the last yield carries the final description and the dancing cat.

	    ``backend`` equal to "Local (offline)" selects the on-device functions;
	    any other value uses the hosted API with ``model_label`` and ``api_key``.
	    """
	    use_local = backend == "Local (offline)"
	    waiting_stage = loading_html(local=use_local)

	    # Show the spinner straight away for both backends; previously only the
	    # local branch did this and the API branch waited for the first token.
	    yield "", waiting_stage

	    if use_local:
	        partials = stream_description_local(image, prompt, max_tokens, temperature)
	    else:
	        partials = stream_description(
	            image, prompt, model_label, max_tokens, temperature, api_key
	        )

	    final_desc = ""
	    for partial in partials:
	        final_desc = partial
	        yield final_desc, waiting_stage

	    # Model determines the full dance spec
	    if use_local:
	        mood, dance = get_dance_spec_local(final_desc)
	    else:
	        mood, dance = get_dance_spec(final_desc, api_key)
	    yield final_desc, cat_html(mood, dance)

	# ━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━
	# UI — Cat Dance Studio
	# ━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━

	# Stylesheet handed to gr.Blocks(css=...). It imports the Space Grotesk,
	# Inter and JetBrains Mono web fonts, declares the colour tokens under
	# :root, and styles the elements addressed by id in the layout
	# (#studio-header, #submit-img, #submit-txt, #desc-output, #run-locally).
	CSS = """
	@import url('https://fonts.googleapis.com/css2?family=Space+Grotesk:wght@500;600;700&family=Inter:wght@400;500;600;700&family=JetBrains+Mono:wght@400;500&display=swap');

	:root {
	--bg: #FFFFFF;
	--surface: #F8F9FA;
	--raised: #E5E7EB;
	--text: #111827;
	--text-dim: #4B5563;
	--text-faint:#6B7280;
	--accent: #FFD21E;
	--accent-ink:#111827;
	}

	.gradio-container {
	background: var(--bg) !important;
	font-family: 'Inter', system-ui, sans-serif !important;
	}

	/* ── Header ────────────────────────────────────────────────────────────── */
	#studio-header {
	text-align:center; padding: 18px 20px 22px;
	border:1px solid var(--raised); border-radius:12px;
	background: var(--surface);
	margin-bottom:8px;
	}
	#studio-header h1 {
	font-family:'Space Grotesk', sans-serif !important;
	font-weight:700 !important; letter-spacing:.01em;
	font-size:1.9rem !important; color:var(--text) !important;
	margin-bottom:6px !important;
	}
	#studio-header p {
	color:var(--text-dim) !important; font-size:.92rem !important;
	margin:0 !important;
	}
	#studio-header .eyebrow {
	display:inline-flex; align-items:center; gap:8px;
	font-family:'JetBrains Mono', monospace; font-size:.7rem;
	letter-spacing:.18em; text-transform:uppercase;
	color:var(--text-faint); margin-bottom:10px;
	}
	#studio-header .eyebrow .badge {
	display:inline-flex; align-items:center; gap:5px;
	background: var(--accent); color: var(--accent-ink);
	border-radius:999px; padding:2px 10px;
	font-weight:700; letter-spacing:.1em;
	}
	#studio-header .eyebrow .badge .dot {
	width:6px; height:6px; border-radius:50%;
	background: var(--accent-ink); opacity:.7;
	}

	/* ── Panels ────────────────────────────────────────────────────────────── */
	.gr-form, .gr-box, .gr-panel, .gr-block.gr-box {
	background: var(--bg) !important;
	border: 1px solid var(--raised) !important;
	border-radius: 10px !important;
	}

	/* Section labels */
	.gradio-container label span {
	font-family:'Inter', sans-serif !important;
	font-size:.78rem !important; font-weight:600 !important;
	letter-spacing:.02em !important; color:var(--text-dim) !important;
	}

	/* ── Buttons ───────────────────────────────────────────────────────────── */
	#submit-img, #submit-txt {
	background: var(--accent) !important;
	color: var(--accent-ink) !important;
	border: 1px solid #E8BD00 !important;
	font-weight:700 !important;
	letter-spacing:.02em !important;
	font-family:'Space Grotesk', sans-serif !important;
	box-shadow: 0 1px 2px rgba(0,0,0,.04) !important;
	transition: transform .12s ease, box-shadow .12s ease !important;
	}
	#submit-img:hover, #submit-txt:hover {
	transform: translateY(-1px);
	box-shadow: 0 4px 12px rgba(255,210,30,.35) !important;
	}
	#submit-img:active, #submit-txt:active { transform: translateY(0); }

	/* ── Description output ───────────────────────────────────────────────── */
	#desc-output textarea {
	font-family:'Inter', sans-serif !important;
	font-size:.88rem !important; line-height:1.6 !important;
	color:var(--text) !important;
	background:var(--surface) !important;
	}

	/* ── Run-locally panel ─────────────────────────────────────────────────── */
	#run-locally {
	border:1px solid var(--raised) !important;
	background: var(--surface) !important;
	}
	#run-locally code {
	font-family:'JetBrains Mono', monospace !important;
	font-size:.78rem !important;
	background:var(--bg) !important;
	border:1px solid var(--raised) !important;
	border-radius:6px !important;
	color:#92660C !important;
	}
	#run-locally pre {
	background:var(--bg) !important;
	border:1px solid var(--raised) !important;
	border-radius:8px !important;
	padding:10px 14px !important;
	}

	/* ── Tabs ──────────────────────────────────────────────────────────────── */
	.tab-nav button {
	font-family:'Space Grotesk', sans-serif !important;
	font-weight:600 !important; letter-spacing:.01em !important;
	color: var(--text-dim) !important;
	}
	.tab-nav button.selected {
	color: var(--text) !important;
	border-bottom-color: var(--accent) !important;
	}

	/* ── Misc ──────────────────────────────────────────────────────────────── */
	footer { display:none !important; }
	.gr-accordion { border-color: var(--raised) !important; }
	"""

	# Markdown rendered inside the collapsed "Run locally" accordion, which is
	# placed after the tabs. The text therefore refers to the API key field by
	# the tab it lives on rather than by a position relative to this panel.
	LOCAL_RUN_MD = """
	Run this studio on your own machine — no install beyond Python.

	```bash
	pip install gradio openai pillow
	python app_single.py
	```

	Then open http://localhost:7860

	By default the app uses a shared public API key (rate-limited). To use your
	own [modelbest.cn](https://modelbest.cn) key without typing it every time,
	set an environment variable before launching:

	```bash
	# macOS / Linux
	export MINICPM_API_KEY="sk-your-key-here"

	# Windows (PowerShell)
	$env:MINICPM_API_KEY="sk-your-key-here"
	```

	The app checks `MINICPM_API_KEY` first, then the "API key" field on the
	Image tab, then falls back to the shared public key.

	---

	### 🔌 Fully offline mode

	Select Local (offline) as the Backend on the Image tab to run everything
	on-device — no internet needed after the first download.

	```bash
	pip install torch transformers accelerate
	python app_single.py
	```

	The first time you use the Local backend, it downloads `openbmb/MiniCPM-V-4`
	(4.1B params, Apache-2.0, ~8 GB) into `model_cache/` next to this file. Every
	run after that loads from disk only — no network calls.

	To force a fresh download, delete the `model_cache/` folder.

	A GPU is recommended but not required; the app automatically uses CUDA if
	available and falls back to CPU otherwise.
	"""

	# Assemble the Gradio app as `demo`: a header banner, two tabs (the image
	# pipeline and a text-only mood input), and a collapsible "Run locally"
	# help panel. The CSS string above is applied through the css= argument.
	with gr.Blocks(title="An Adventure in Thousand Token Wood · MiniCPM-V 4.6", theme=gr.themes.Soft(), css=CSS) as demo:

	gr.HTML(
	"""<div id="studio-header">
	<div class="eyebrow">
	<span class="badge"><span class="dot"></span>MiniCPM-V 4.6</span>
	<span>An Adventure in Thousand Token Wood</span>
	</div>
	<h1>Emberglade - An emotion identifier that makes you HAPPY !!!</h1>
	<p>Upload an image. The model reads its mood — then a cat performs it, live, with its own tune.</p>
	</div>"""
	)

	with gr.Tabs():
	# ── Tab 1: Image pipeline ─────────────────────────────────────────────
	with gr.TabItem("📷 Image → emotion"):
	with gr.Row():
	with gr.Column(scale=1):
	image_input = gr.Image(type="pil", label="Upload image", height=240)
	prompt_input = gr.Textbox(value=DEFAULT_PROMPT, label="Prompt", lines=2)

	# The "Local (offline)" choice string is the exact value that
	# run_image_pipeline compares against to pick the local path.
	backend_sel = gr.Radio(
	choices=["API (online)", "Local (offline)"],
	value="API (online)",
	label="Backend",
	)

	model_sel = gr.Radio(choices=list(MODELS.keys()),
	value=list(MODELS.keys())[0], label="Model",
	info="Used only for the API backend")

	with gr.Accordion("Generation settings", open=False):
	max_tok = gr.Slider(64, 2048, value=DEFAULT_MAX_TOKENS, step=64, label="Max tokens")
	temp = gr.Slider(0.0, 1.5, value=DEFAULT_TEMPERATURE, step=0.05, label="Temperature")

	with gr.Accordion("API key", open=False):
	api_key = gr.Textbox(label="Your key (optional)", type="password",
	placeholder="sk-… leave blank to use the shared key")
	gr.Markdown("Get your own at [modelbest.cn](https://modelbest.cn) — see Run locally below for setup.")

	with gr.Accordion("Local model (offline)", open=False, elem_id="local-model"):
	# Initial status text comes from one call to local_status_md() at build time.
	local_status = gr.Markdown(local_status_md())
	gr.Markdown(
	f"Model: `{LOCAL_MODEL_ID}` · 4.1B params · Apache-2.0\n\n"
	"Selecting Local (offline) above will download this model "
	"the first time it's used (~8 GB, one-time, needs internet), "
	"then cache it in `model_cache/` for fully offline use afterward.\n\n"
	"Requires: `pip install torch transformers accelerate`"
	)
	refresh_local_btn = gr.Button("Refresh status", size="sm")

	img_btn = gr.Button("Start emotion", variant="primary", elem_id="submit-img")
	gr.Examples(examples=PROMPT_EXAMPLES, inputs=[prompt_input], label="Prompt ideas")

	with gr.Column(scale=1):
	cat_out = gr.HTML(value=placeholder_html(), label="Stage")
	desc_out = gr.Textbox(label="Description (model output, streaming)", lines=7,
	placeholder="The model's description will stream in here…",
	elem_id="desc-output")

	# Listed in the same order as run_image_pipeline's parameters.
	pipeline_inputs = [image_input, prompt_input, model_sel, max_tok, temp, api_key, backend_sel]

	# The button and submitting the prompt box both run the same pipeline;
	# each pair it yields goes to the description box and the stage.
	img_btn.click(
	fn=run_image_pipeline,
	inputs=pipeline_inputs,
	outputs=[desc_out, cat_out],
	)
	prompt_input.submit(
	fn=run_image_pipeline,
	inputs=pipeline_inputs,
	outputs=[desc_out, cat_out],
	)
	# Recompute the local-model status text on demand.
	refresh_local_btn.click(fn=local_status_md, outputs=[local_status])

	# ── Tab 2: Text-only (keyword dance, no API) ──────────────────────────
	with gr.TabItem("✍️ Text → emotion"):
	gr.Markdown("Type mood words for an instant emotion — no API key needed.")
	with gr.Row():
	with gr.Column(scale=1):
	txt_input = gr.Textbox(
	label="Describe a mood",
	placeholder='"happy party" · "sad rain" · "energetic dance"',
	lines=3,
	)
	txt_btn = gr.Button("Start emotion", variant="primary", elem_id="submit-txt")
	gr.Examples(
	examples=[["happy celebrate joy"],["sad lonely rain"],
	["energetic dance excited"],["calm peaceful"],
	["mysterious dark shadow"],["romantic love"],
	["tense nervous fear"],["nostalgic memory"],["angry rage"]],
	inputs=[txt_input], label="Quick examples",
	)
	with gr.Column(scale=1):
	txt_cat = gr.HTML(value=placeholder_html(), label="Stage")

	# generate_animation receives the typed text; its result replaces the
	# stage HTML of this tab, for both the button and the submit event.
	txt_btn.click(fn=generate_animation, inputs=[txt_input], outputs=[txt_cat])
	txt_input.submit(fn=generate_animation, inputs=[txt_input], outputs=[txt_cat])

	# ── Run locally ──────────────────────────────────────────────────────────
	with gr.Accordion("⚙ Run locally", open=False, elem_id="run-locally"):
	gr.Markdown(LOCAL_RUN_MD)

	if __name__ == "__main__":
	    # Start the server only when this file is run as a script: listen on
	    # every interface at port 7860, with Gradio's show_error flag enabled.
	    demo.launch(
	        server_name="0.0.0.0",
	        server_port=7860,
	        show_error=True,
	    )