Spaces:

build-small-hackathon
/

small-cuts

Running

App Files Files Community

small-cuts / src /small_cuts /engine /library.py

macayaven

Upload folder using huggingface_hub

24e5b39 verified 17 days ago

Raw

History Blame Contribute Delete

15 kB

	"""Engine-side scene library: filesystem media + sqlite index (D6).

	The real `SceneSink`. Every successful narration is persisted — frame JPEG,
	title card, voice WAV, one sqlite row — and fanned out to live SSE
	subscribers (D7). Blocking writes run in a worker thread via
	`asyncio.to_thread`; the publish happens back on the event loop. Stored
	entries and live events share the same NarratedScene shape, per
	docs/contracts/narrated-scene.schema.json.
	"""

	from __future__ import annotations

	import asyncio
	import contextlib
	import json
	import os
	import sqlite3
	import sys
	import threading
	from datetime import datetime, timezone
	from pathlib import Path
	from typing import Any

	from PIL import Image

	from small_cuts import narrator, tts
	from small_cuts.frames import pick_key_frame
	from small_cuts.title_card import TITLE_MAX_LEN, derive_title, render_title_card

	from .session import CONTRACT_VERSION, _wav_bytes

	# Library root used when neither the SceneLibrary constructor argument nor
	# $SMALL_CUTS_LIBRARY_DIR is set; "~" is expanded in SceneLibrary.__init__.
	DEFAULT_ROOT = "~/.small-cuts/library"
	# Owner recorded on each stored row unless $SMALL_CUTS_ENGINE_OWNER is set
	# (see _owner).
	OWNER = "carlos" # v1 engines are single-user; the field is reserved for multi-user
	# The only values SceneLibrary.set_visibility accepts.
	VISIBILITIES = ("private", "shared", "public")
	# The only filenames SceneLibrary.media_path will resolve.
	MEDIA_FILES = ("frame.jpg", "card.webp", "voice.wav", "clip.mp4")
	# Seconds the sink waits for one blocking store() call before reporting failure.
	STORAGE_TIMEOUT_S = 30.0
	# Capacity of each subscriber queue; publish_event drops a subscriber whose
	# queue is full.
	SUBSCRIBER_QUEUE_MAX = 256
	# Defaults for _write_clip_mp4: stream frame rate, and the number of
	# cross-dissolve frames inserted between each pair of sampled frames.
	CLIP_MP4_FPS = 12
	CLIP_BLEND_STEPS = 1
	# Floor applied to clip width/height after rounding down to an even value.
	H264_MIN_DIMENSION = 2
	# JPEG quality used when saving the poster frame (frame.jpg).
	POSTER_JPEG_QUALITY = 90
	# Pillow mode frames are converted to before being saved or encoded.
	RGB_MODE = "RGB"
	# Pixel format assigned to the clip's video stream.
	VIDEO_PIXEL_FORMAT = "yuv420p"
	# Codec name tried first, and the one used if adding the first stream raises.
	PRIMARY_VIDEO_CODEC = "libx264"
	FALLBACK_VIDEO_CODEC = "h264"

	# DDL for the single index table, executed once in SceneLibrary.__init__.
	# `seq` is UNIQUE and allocated as MAX(seq)+1 in SceneLibrary.store; `engine`
	# holds the JSON text produced by json.dumps in store and decoded again in
	# to_narrated_scene.
	_SCHEMA = """\
	CREATE TABLE IF NOT EXISTS scenes (
	scene_id TEXT PRIMARY KEY,
	seq INTEGER NOT NULL UNIQUE,
	moment_id TEXT NOT NULL,
	session_id TEXT NOT NULL,
	captured_at TEXT NOT NULL,
	created_at TEXT NOT NULL,
	style_key TEXT NOT NULL,
	title TEXT NOT NULL,
	narration TEXT NOT NULL,
	visibility TEXT NOT NULL DEFAULT 'private',
	owner TEXT NOT NULL,
	engine TEXT NOT NULL
	)"""

	# Parameterized insert; the twelve placeholders follow the column list order
	# and are bound positionally in SceneLibrary.store.
	_INSERT = """\
	INSERT INTO scenes (scene_id, seq, moment_id, session_id, captured_at, created_at,
	style_key, title, narration, visibility, owner, engine)
	VALUES (?, ?, ?, ?, ?, ?, ?, ?, ?, ?, ?, ?)"""


	class SceneLibrary:
	    """Scene store + in-process pub/sub. The instance itself is the async SceneSink.

	    Layout: `<root>/library.sqlite3` + `<root>/media/<scene_id>/{frame.jpg,
	    card.webp, voice.wav}` (plus `clip.mp4` when a clip was rendered). One
	    sqlite connection, guarded by a lock: the sink writes from worker
	    threads, queries come from request handlers.
	    """

	    def __init__(self, root: str | Path | None = None) -> None:
	        """Open the library, creating the media directory and table if needed.

	        `root` falls back to `$SMALL_CUTS_LIBRARY_DIR`, then `DEFAULT_ROOT`.
	        """
	        base = root or os.environ.get("SMALL_CUTS_LIBRARY_DIR") or DEFAULT_ROOT
	        self.root = Path(base).expanduser().resolve()
	        self.media_dir = self.root / "media"
	        self.media_dir.mkdir(parents=True, exist_ok=True)
	        self._lock = threading.Lock()  # guards the connection and seq allocation
	        self._db = sqlite3.connect(self.root / "library.sqlite3", check_same_thread=False)
	        self._db.row_factory = sqlite3.Row
	        with self._lock, self._db:
	            # WAL + busy_timeout: viewer reads don't block sink writes, and a
	            # briefly locked database waits instead of raising immediately.
	            self._db.execute("PRAGMA journal_mode=WAL")
	            self._db.execute("PRAGMA busy_timeout=5000")
	            self._db.execute(_SCHEMA)
	        self._subscribers: list[asyncio.Queue[dict[str, Any]]] = []

	    # -- the sink -----------------------------------------------------------------

	    async def __call__(self, scene: dict[str, Any]) -> None:
	        """SceneSink entry point: persist off the event loop, then publish.

	        A failed store (disk full, sqlite error, timeout) must not be silent
	        data loss: the mobile client already received its SceneAudio, so log to
	        stderr and fan an error ControlFrame to the viewer stream — the timeline
	        stays honest. `_hand_to_sink`'s suppression remains the last-resort
	        backstop.
	        """
	        try:
	            narrated = await asyncio.wait_for(
	                asyncio.to_thread(self.store, scene), timeout=STORAGE_TIMEOUT_S
	            )
	        except Exception as exc:
	            # `Exception` already covers asyncio.TimeoutError; cancellation is a
	            # BaseException and keeps propagating.
	            print(
	                f"small_cuts.engine: library write failed for scene {scene['scene_id']}: {exc!r}",
	                file=sys.stderr,
	            )
	            self.publish_event(
	                {
	                    "contract_version": CONTRACT_VERSION,
	                    "kind": "error",
	                    "moment_id": scene["moment_id"],
	                    "error": {
	                        "stage": "storage",
	                        "code": "library_write_failed",
	                        "message": self._error_message(exc),
	                        "retryable": False,
	                    },
	                }
	            )
	            return
	        self.publish_event(narrated)

	    @staticmethod
	    def _error_message(exc: BaseException) -> str:
	        """Bounded, never-empty text for an error ControlFrame.

	        Exceptions raised without arguments (a timeout, for instance) have an
	        empty `str()`, so fall back to `repr()` rather than emit a blank message.
	        """
	        return (str(exc) or repr(exc))[:300]

	    def publish_event(self, payload: dict[str, Any]) -> None:
	        """Fan any event (stored scene or ControlFrame error) to live subscribers.

	        Events without a seq (errors) are EPHEMERAL: not persisted, not in
	        Last-Event-ID replay. A subscriber whose queue is full is dropped.
	        """
	        # Iterate a snapshot: unsubscribe() mutates the list while we loop.
	        for queue in list(self._subscribers):
	            try:
	                queue.put_nowait(payload)
	            except asyncio.QueueFull:
	                self.unsubscribe(queue)

	    def store(self, scene: dict[str, Any]) -> dict[str, Any]:
	        """Persist media + index row (blocking); returns the stored NarratedScene.

	        Raises whatever the media writers or sqlite raise; a failed clip render
	        alone is logged to stderr and does not fail the store.
	        """
	        scene_id: str = scene["scene_id"]
	        narration: str = scene["narration"]
	        style_key: str = scene["style_key"]
	        title = _stored_title(scene.get("title"), narration)

	        scene_dir = self.media_dir / scene_id
	        scene_dir.mkdir(parents=True, exist_ok=True)
	        clip_frames = scene.get("clip_frames") or []
	        poster = pick_key_frame(clip_frames) if clip_frames else scene["image"]
	        poster.convert(RGB_MODE).save(scene_dir / "frame.jpg", "JPEG", quality=POSTER_JPEG_QUALITY)
	        if len(clip_frames) >= 2:
	            # The clip is best-effort: the scene is still stored without it.
	            try:
	                _write_clip_mp4(scene_dir / "clip.mp4", clip_frames)
	            except Exception as exc:
	                print(
	                    f"small_cuts.engine: clip write failed for scene {scene_id}: {exc!r}",
	                    file=sys.stderr,
	                )
	        render_title_card(title, style_key).save(scene_dir / "card.webp", "WEBP")
	        (scene_dir / "voice.wav").write_bytes(_wav_bytes(scene["audio"], scene["sample_rate"]))

	        narrator_backend = narrator.get_backend()
	        tts_backend = tts.get_tts_backend()
	        engine = {
	            "narrator_model": narrator_backend.model_id,
	            "narrator_backend": narrator_backend.name,
	            "tts_model": tts_backend.model_id,
	            "latency_ms": scene["latency_ms"],
	        }
	        with self._lock, self._db:
	            # max+1 under the lock: monotonic across the process AND across restarts.
	            seq = self._db.execute("SELECT COALESCE(MAX(seq), -1) + 1 FROM scenes").fetchone()[0]
	            self._db.execute(
	                _INSERT,
	                (
	                    scene_id,
	                    seq,
	                    scene["moment_id"],
	                    scene["session_id"],
	                    _normalize_datetime(scene["captured_at"]),
	                    _normalize_datetime(scene["created_at"]),
	                    style_key,
	                    title,
	                    narration,
	                    "private",
	                    _owner(),
	                    json.dumps(engine),
	                ),
	            )
	        # Read back outside the `with`: get() takes the same non-reentrant lock.
	        stored = self.get(scene_id)
	        if stored is None:
	            raise RuntimeError(f"scene {scene_id} missing immediately after insert")
	        return stored

	    # -- queries ---------------------------------------------------------------------

	    def to_narrated_scene(self, row: sqlite3.Row) -> dict[str, Any]:
	        """Contract-valid NarratedScene (1.1.0) for one stored row.

	        `media.clip_url` is included only when `clip.mp4` exists on disk.
	        """
	        scene_id = row["scene_id"]
	        media = {
	            "frame_url": f"/media/{scene_id}/frame.jpg",
	            "card_url": f"/media/{scene_id}/card.webp",
	            "audio_url": f"/media/{scene_id}/voice.wav",
	        }
	        if (self.media_dir / scene_id / "clip.mp4").is_file():
	            media["clip_url"] = f"/media/{scene_id}/clip.mp4"
	        return {
	            "contract_version": CONTRACT_VERSION,
	            "scene_id": scene_id,
	            "moment_id": row["moment_id"],
	            "session_id": row["session_id"],
	            "captured_at": row["captured_at"],
	            "created_at": row["created_at"],
	            "style_key": row["style_key"],
	            "title": row["title"],
	            "narration": row["narration"],
	            "visibility": row["visibility"],
	            "seq": row["seq"],
	            "owner": row["owner"],
	            "media": media,
	            "engine": json.loads(row["engine"]),
	        }

	    def list_scenes(
	        self,
	        session_id: str | None = None,
	        visibility: str | None = None,
	        limit: int = 100,
	    ) -> list[dict[str, Any]]:
	        """Newest bounded window, returned in scene chronology for the viewer.

	        Optional `session_id` / `visibility` filters are ANDed together.
	        """
	        clauses: list[str] = []
	        params: list[Any] = []
	        if session_id is not None:
	            clauses.append("session_id = ?")
	            params.append(session_id)
	        if visibility is not None:
	            clauses.append("visibility = ?")
	            params.append(visibility)
	        where = f" WHERE {' AND '.join(clauses)}" if clauses else ""
	        # Inner query picks the newest `limit` rows; outer query re-sorts them
	        # into chronological order.
	        query = (
	            "SELECT * FROM ("
	            f"SELECT * FROM scenes{where} ORDER BY seq DESC LIMIT ?"
	            ") ORDER BY captured_at, seq"
	        )
	        with self._lock:
	            rows = self._db.execute(query, (*params, limit)).fetchall()
	        return [self.to_narrated_scene(row) for row in rows]

	    def get(self, scene_id: str) -> dict[str, Any] | None:
	        """Return the stored scene with this id, or None if there is no such row."""
	        with self._lock:
	            row = self._db.execute(
	                "SELECT * FROM scenes WHERE scene_id = ?", (scene_id,)
	            ).fetchone()
	        return self.to_narrated_scene(row) if row is not None else None

	    def set_visibility(self, scene_id: str, visibility: str) -> dict[str, Any] | None:
	        """The viewer's only write (D7). Returns the updated scene, or None if unknown.

	        Raises ValueError when `visibility` is not one of VISIBILITIES.
	        """
	        if visibility not in VISIBILITIES:
	            raise ValueError(f"Unknown visibility {visibility!r}; expected one of {VISIBILITIES}")
	        with self._lock, self._db:
	            updated = self._db.execute(
	                "UPDATE scenes SET visibility = ? WHERE scene_id = ?", (visibility, scene_id)
	            ).rowcount
	        # get() re-acquires the lock, so it must run after the `with` exits.
	        return self.get(scene_id) if updated else None

	    def scenes_since(self, seq: int) -> list[dict[str, Any]]:
	        """Scenes with seq > `seq`, ordered by seq — the SSE Last-Event-ID replay."""
	        with self._lock:
	            rows = self._db.execute(
	                "SELECT * FROM scenes WHERE seq > ? ORDER BY seq", (seq,)
	            ).fetchall()
	        return [self.to_narrated_scene(row) for row in rows]

	    def media_path(self, scene_id: str, filename: str) -> Path | None:
	        """Resolve a media file, or None: unknown name, traversal, or missing file."""
	        if filename not in MEDIA_FILES:
	            return None
	        path = (self.media_dir / scene_id / filename).resolve()
	        if not path.is_relative_to(self.media_dir):  # traversal via scene_id
	            return None
	        return path if path.is_file() else None

	    # -- pub/sub ----------------------------------------------------------------------

	    def subscribe(self) -> asyncio.Queue[dict[str, Any]]:
	        """New-scene feed for one SSE connection; pair with `unsubscribe`."""
	        queue: asyncio.Queue[dict[str, Any]] = asyncio.Queue(maxsize=SUBSCRIBER_QUEUE_MAX)
	        self._subscribers.append(queue)
	        return queue

	    def unsubscribe(self, queue: asyncio.Queue[dict[str, Any]]) -> None:
	        """Stop delivering events to `queue`; a no-op if it is not subscribed."""
	        with contextlib.suppress(ValueError):
	            self._subscribers.remove(queue)

	    def close(self) -> None:
	        """Close the sqlite connection, waiting for any in-flight query to finish."""
	        with self._lock:
	            self._db.close()


	def _write_clip_mp4(
	    path: Path,
	    frames: list[Image.Image],
	    fps: int = CLIP_MP4_FPS,
	    blend_steps: int = CLIP_BLEND_STEPS,
	) -> None:
	    """Render a small browser-playable MP4 from sampled POV frames.

	    Args:
	        path: Destination file; overwritten if it exists.
	        frames: Source images, in playback order. Must not be empty.
	        fps: Frame rate given to the video stream.
	        blend_steps: Cross-dissolve frames inserted between consecutive sources.

	    Raises:
	        ValueError: If `frames` is empty.
	        Exception: Anything the encoder raises. The partially written file is
	            removed first, so a failed render never leaves a truncated clip that
	            a later `is_file()` check would treat as a valid one.
	    """
	    if not frames:
	        raise ValueError("cannot render a clip from zero frames")

	    import av

	    rgb_frames = [frame.convert(RGB_MODE) for frame in frames]
	    width, height = rgb_frames[0].size
	    # H.264/yuv420p expects even dimensions. Preserve portrait aspect and only
	    # shave one pixel if needed; capture frames are already downscaled upstream.
	    width = max(H264_MIN_DIMENSION, width - (width % 2))
	    height = max(H264_MIN_DIMENSION, height - (height % 2))
	    encode_frames = _smooth_clip_frames(rgb_frames, blend_steps=blend_steps, size=(width, height))

	    try:
	        container = av.open(str(path), "w")
	        try:
	            try:
	                stream = container.add_stream(PRIMARY_VIDEO_CODEC, rate=fps)
	            except Exception:
	                # Preferred encoder unavailable in this build: use the fallback name.
	                stream = container.add_stream(FALLBACK_VIDEO_CODEC, rate=fps)
	            stream.width = width
	            stream.height = height
	            stream.pix_fmt = VIDEO_PIXEL_FORMAT

	            for image in encode_frames:
	                frame = av.VideoFrame.from_image(image)
	                for packet in stream.encode(frame):
	                    container.mux(packet)
	            # Calling encode() with no frame flushes packets still buffered.
	            for packet in stream.encode():
	                container.mux(packet)
	        finally:
	            container.close()
	    except Exception:
	        # Do not leave a half-written clip behind for readers to pick up.
	        path.unlink(missing_ok=True)
	        raise


	def _smooth_clip_frames(
	    frames: list[Image.Image],
	    blend_steps: int = CLIP_BLEND_STEPS,
	    size: tuple[int, int] | None = None,
	) -> list[Image.Image]:
	    """Insert tiny cross-dissolve frames so sampled POV clips do not hard-cut.

	    Args:
	        frames: Source images in playback order.
	        blend_steps: Number of blended frames placed between each consecutive
	            pair; zero or negative disables blending.
	        size: Optional `(width, height)` every frame is resized to. When it is
	            None the frames are blended as-is, so they must already share one
	            size (`Image.blend` rejects mismatched images).

	    Returns:
	        RGB copies of the inputs with the blended frames interleaved; an empty
	        list for empty input.
	    """
	    if not frames:
	        return []

	    prepared: list[Image.Image] = []
	    for source in frames:
	        image = source.convert(RGB_MODE)
	        if size is not None and image.size != size:
	            image = image.resize(size, Image.Resampling.LANCZOS)
	        prepared.append(image)
	    if blend_steps <= 0 or len(prepared) < 2:
	        return prepared

	    # Evenly spaced interior weights, strictly between 0 and 1; identical for
	    # every pair, so compute them once.
	    alphas = [step / (blend_steps + 1) for step in range(1, blend_steps + 1)]
	    smoothed = [prepared[0]]
	    for previous, current in zip(prepared, prepared[1:]):
	        smoothed.extend(Image.blend(previous, current, alpha) for alpha in alphas)
	        smoothed.append(current)
	    return smoothed


	def _stored_title(raw_title: object, narration: str) -> str:
	    """Derive the stored title from `raw_title`, or from `narration` when the
	    title is not a string or is blank."""
	    has_title = isinstance(raw_title, str) and bool(raw_title.strip())
	    source = raw_title if has_title else narration
	    return derive_title(source, max_len=TITLE_MAX_LEN)


	def _owner() -> str:
	    """Owner recorded on new rows: $SMALL_CUTS_ENGINE_OWNER if set, else OWNER."""
	    fallback = OWNER
	    try:
	        return os.environ["SMALL_CUTS_ENGINE_OWNER"]
	    except KeyError:
	        return fallback


	def _normalize_datetime(value: str) -> str:
	raw = value.replace("Z", "+00:00")
	parsed = datetime.fromisoformat(raw)
	if parsed.tzinfo is None:
	raise ValueError(f"timestamp must include timezone: {value}")
	return parsed.astimezone(timezone.utc).isoformat()