Spaces:

build-small-hackathon
/

lightloom

Running on Zero

App Files Files Community

lightloom / frontend /js /api.js

Efradeca's picture

chore: deploy private lightloom build

318f094 verified 18 days ago

History Blame Contribute Delete

13.6 kB

	// frontend/js/api.js — Lightloom "La Sala" · backend transport (LL.api)
	//
	// The ONLY sanctioned way to reach the GPU pipeline is @gradio/client. Raw
	// fetch() against /api/recital BREAKS ZeroGPU quota attribution (the client
	// injects the session/quota auth headers fetch cannot), so we never do that
	// here. We connect once, submit "/recital", and fan each streamed message out
	// to onEvent. See app.py @app.api(name="recital", ...) for the validated shape.
	//
	// Public surface (per the shared contract):
	// LL.api.connect() -> Promise<Client> (memoized)
	// LL.api.streamRecital(text, lang, onEvent) -> Promise<{session,done}>
	// LL.api.cancel() -> void (aborts the live job)
	//
	// No frameworks, no build step — vanilla ES module.

	// PINNED to the exact version currently resolving (2.2.2) and the real dist/index.js entry. The old
	// unpinned @latest import meant a future @gradio/client publish could 404/restructure and fail to
	// parse at load time -> window.LL.api never assigned -> the world is dead-on-stage with NO error.
	// Re-pin deliberately when the Space's gradio SDK is bumped (keep client major in step with gradio).
	import { Client } from "https://cdn.jsdelivr.net/npm/@gradio/client@2.2.2/dist/index.js";

	const LL = (window.LL = window.LL \|\| {});

	// msg.data may arrive as the event object itself OR a 1-element array [event]
	// (Gradio wraps single outputs either way depending on version). Normalize so
	// the controller always receives a plain event object.
	const asEvent = (d) => (Array.isArray(d) ? d[0] : d);

	const api = {
	_clientPromise: null, // memoized Client.connect() so we connect at most once
	_job: null, // the live submit() job handle (has .cancel())
	_cancelled: false, // guards against late events after an explicit cancel()

	/**
	* Connect (once) to the gr.Server that serves this page. Memoized: repeated
	* calls return the same in-flight/resolved promise. A failed connect clears
	* the memo so a later call can retry.
	* @returns {Promise<import("@gradio/client").Client>}
	*/
	async connect() {
	if (!this._clientPromise) {
	// window.location.origin => same Space that served index.html. This is
	// what carries the ZeroGPU quota identity; do not hardcode a URL.
	this._clientPromise = Client.connect(window.location.origin).catch((err) => {
	this._clientPromise = null; // allow a retry on the next call
	throw err;
	});
	}
	return this._clientPromise;
	},

	// Removed obsolete one-shot endpoints (streamRecital / streamPanorama / streamWorld / streamScroll) —
	// all superseded by streamScrollLive (the continuous-panorama path). The typed path now feeds
	// /scroll_live per sentence, identical Director/painter/continuity to voice.

	/**
	* LIVE narration — the world builds AS YOU SPEAK. Submit ONE spoken phrase segment
	* (base64 WAV); the server transcribes it AND paints a few strips that CONTINUE this
	* `session`'s panorama, streaming transcript/section/depth events. Call it once per
	* VAD-cut phrase; continuity is keyed server-side by `session`. Short-lived per call
	* (it does NOT touch the long-stream _job handle), so phrases can pipeline in order.
	* Pass an empty `audioB64` once on mic-tap to WARM the models ahead of the first word.
	* @returns {Promise<{session:string, done:boolean}>}
	*/
	async streamScrollLive(session, audioB64 = "", lang = "en", onEvent, text = "") {
	const emit = typeof onEvent === "function" ? onEvent : () => {};
	let client;
	try {
	client = await this.connect();
	} catch (err) {
	emit({ stage: "error", error: `connect_failed: ${shortErr(err)}` });
	return { session, done: false };
	}
	let timedOut = false;
	try {
	const job = client.submit("/scroll_live", {
	session: session \|\| "",
	text: text \|\| "",
	audio_b64: audioB64 \|\| "",
	lang: lang \|\| "en",
	});
	// IDLE WATCHDOG: a `for await` over the job NEVER resolves if the server closes the socket cleanly
	// mid-job without the iterator signalling done -> the live drain wedges forever on one scene. If no
	// message arrives for 25 s, cancel the job so the loop ends and the drain can continue.
	let watchdog = null;
	const arm = () => { if (watchdog) clearTimeout(watchdog); watchdog = setTimeout(() => { timedOut = true; try { job.cancel(); } catch (_) {} }, 25000); };
	arm();
	try {
	for await (const msg of job) {
	arm();
	if (!msg \|\| msg.type !== "data") continue;
	const ev = asEvent(msg.data);
	if (!ev \|\| typeof ev !== "object") continue;
	if (ev.session) session = ev.session;
	try { emit(ev); } catch (e) { console.error("[LL.api] live onEvent threw", e); }
	}
	} finally {
	if (watchdog) clearTimeout(watchdog);
	}
	} catch (err) {
	if (!timedOut) emit({ stage: "error", error: `stream_failed: ${shortErr(err)}` });
	}
	if (timedOut) emit({ stage: "section_error", error: "phrase_timeout" }); // surfaced as a transient status, not a silent stall
	return { session, done: true };
	},

	/**
	* DIRECTOR'S CUT keepsake. Over the FINISHED session panorama (already on disk under `session`), run the
	* post-process: the MiniCPM-V-4.6 Art Director names it from the pixels, then a depth-parallax fly-through
	* is rendered to world.mp4. Streams {stitched,titled,rendering,encoding,ready} (ready carries .video + the
	* .title). Short-lived per call; does NOT touch the live _job handle. Independent of the live painter.
	* @returns {Promise<{session:string, done:boolean}>}
	*/
	async streamPostprocess(session, lang = "en", onEvent) {
	const emit = typeof onEvent === "function" ? onEvent : () => {};
	let client;
	try {
	client = await this.connect();
	} catch (err) {
	emit({ stage: "postprocess_error", error: `connect_failed: ${shortErr(err)}` });
	return { session, done: false };
	}
	let timedOut = false;
	let sawTerminal = false;
	const isTerminal = (s) => s === "ready" \|\| s === "postprocess_error" \|\| s === "quota_exceeded" \|\| s === "render_timeout" \|\| s === "error";
	try {
	const job = client.submit("/postprocess", { session: session \|\| "", lang: lang \|\| "en" });
	// IDLE WATCHDOG (mirrors streamScrollLive): a clean mid-stream socket close would otherwise leave the
	// keepsake stuck forever on the sticky "Crafting…" status. 45s — renders have longer legitimate gaps
	// (cold model load, a long encode) than a live phrase, so the live 25s budget would false-cancel.
	let watchdog = null;
	const arm = () => { if (watchdog) clearTimeout(watchdog); watchdog = setTimeout(() => { timedOut = true; try { job.cancel(); } catch (_) {} }, 45000); };
	arm();
	try {
	for await (const msg of job) {
	arm();
	if (!msg \|\| msg.type !== "data") continue;
	const ev = asEvent(msg.data);
	if (!ev \|\| typeof ev !== "object") continue;
	if (ev.session) session = ev.session;
	if (isTerminal(ev.stage)) sawTerminal = true;
	try { emit(ev); } catch (e) { console.error("[LL.api] postprocess onEvent threw", e); }
	}
	} finally {
	if (watchdog) clearTimeout(watchdog);
	}
	} catch (err) {
	if (!timedOut) { emit({ stage: "postprocess_error", error: `stream_failed: ${shortErr(err)}` }); sawTerminal = true; }
	}
	// Never strand the UI on the sticky "Crafting…" status: if the stream ended (clean close or a watchdog
	// cancel) without a terminal event, synthesize one so the controller clears the status and toasts.
	if (!sawTerminal) emit({ stage: "postprocess_error", error: timedOut ? "postprocess_timeout" : "stream_ended" });
	return { session, done: true };
	},

	/**
	* "Ask Your World" — MiniCPM-V-4.6 answers a free-form question about the FINISHED world from its pixels.
	* Short (one VLM call); resolves with { answer, error? }. Independent of live image creation.
	*/
	async ask(session, question, lang = "en") {
	let client;
	try { client = await this.connect(); } catch (err) { return { answer: "", error: `connect_failed: ${shortErr(err)}` }; }
	try {
	const job = client.submit("/ask", { session: session \|\| "", question: question \|\| "", lang: lang \|\| "en" });
	let res = { answer: "" };
	for await (const msg of job) {
	if (!msg \|\| msg.type !== "data") continue;
	const ev = asEvent(msg.data);
	if (ev && typeof ev === "object") res = ev;
	}
	return res;
	} catch (err) { return { answer: "", error: `stream_failed: ${shortErr(err)}` }; }
	},

	/**
	* Transcribe a base64 WAV (the narrator's mic audio) via Cohere Transcribe.
	* Resolves with {text, error}. Used by LL.recorder; the transcript then drives
	* streamPanorama just like a typed recital.
	*
	* @param {string} audioB64 data:audio/wav;base64,... (or bare base64)
	* @param {string} lang ISO code ("en"/"es"/...); default "en"
	* @param {(event:object)=>void} [onEvent] optional per-stage callback
	* @returns {Promise<{text:string, error:?string}>}
	*/
	async transcribe(audioB64, lang = "en", onEvent) {
	const emit = typeof onEvent === "function" ? onEvent : () => {};
	let client;
	try {
	client = await this.connect();
	} catch (err) {
	return { text: "", error: `connect_failed: ${shortErr(err)}` };
	}
	let text = "";
	let error = null;
	try {
	const job = client.submit("/transcribe", { audio_b64: audioB64, lang: lang \|\| "en" });
	for await (const msg of job) {
	if (!msg \|\| msg.type !== "data") continue;
	const ev = asEvent(msg.data);
	if (!ev \|\| typeof ev !== "object") continue;
	emit(ev);
	if (ev.stage === "transcript") text = ev.text \|\| "";
	if (ev.stage === "error" \|\| ev.stage === "quota_exceeded") error = ev.error \|\| ev.stage;
	}
	} catch (err) {
	error = `stream_failed: ${shortErr(err)}`;
	}
	return { text, error };
	},

	/** Shared streaming core for the @app.api endpoints (recital + panorama). */
	async _streamEndpoint(endpoint, text, lang = "en", onEvent) {
	const emit = typeof onEvent === "function" ? onEvent : () => {};

	// Guard empty input before spending a GPU connect: surface a soft error
	// event the controller can render as a toast, then resolve cleanly.
	const poem = (text \|\| "").trim();
	if (!poem) {
	emit({ stage: "error", error: "empty_text" });
	return { session: null, done: false, cancelled: false };
	}

	// A fresh stream supersedes any previous one.
	this.cancel();
	this._cancelled = false;

	let client;
	try {
	client = await this.connect();
	} catch (err) {
	// Connection failure is terminal for this attempt — report and stop.
	emit({ stage: "error", error: `connect_failed: ${shortErr(err)}` });
	return { session: null, done: false, cancelled: false };
	}

	let session = null;
	let done = false;
	let job = null;

	try {
	// Payload keys MUST be text+lang (the @app.api signatures take text, lang).
	job = client.submit(endpoint, { text: poem, lang: lang \|\| "en" });
	this._job = job;

	// The job is an async iterable of status/data messages. We only act on
	// "data" messages; "status" carries queue/progress info we ignore here.
	for await (const msg of job) {
	if (this._cancelled) break;
	if (!msg \|\| msg.type !== "data") continue;

	const event = asEvent(msg.data);
	if (!event \|\| typeof event !== "object") continue;

	if (event.session) session = event.session;
	if (event.stage === "done") done = true;

	try {
	emit(event);
	} catch (handlerErr) {
	// A throwing handler must not tear down the whole stream — one bad
	// beat render shouldn't end the film. Log and keep streaming.
	console.error("[LL.api] onEvent handler threw", handlerErr);
	}
	}
	} catch (err) {
	if (!this._cancelled) {
	emit({ stage: "error", error: `stream_failed: ${shortErr(err)}` });
	}
	} finally {
	// Only clear the handle if a newer submit() hasn't already replaced it.
	if (this._job === job) this._job = null;
	}

	return { session, done, cancelled: this._cancelled };
	},

	/**
	* Abort the in-flight recital job (if any). Idempotent and safe to call when
	* nothing is running. Marks the stream cancelled so any already-queued events
	* are dropped by the loop guard above.
	*/
	cancel() {
	this._cancelled = true;
	const job = this._job;
	this._job = null;
	if (job && typeof job.cancel === "function") {
	try {
	job.cancel();
	} catch (err) {
	console.warn("[LL.api] job.cancel() failed", err);
	}
	}
	},
	};

	// Tiny helper kept local (no extra globals).
	function shortErr(err) {
	const m = err && (err.message \|\| err.toString());
	return String(m \|\| "unknown").slice(0, 160);
	}

	LL.api = api;

	export default api;