Spaces:

azan888
/

3d_model

Sleeping

3d_model / ylff /utils /capture_bundle.py

Azan

Clean deployment build (Squashed)

7a87926 7 days ago

22.6 kB

	"""
	Capture bundle reader/validator (SPECIFICATIONS.md Appendix C).

	This module provides a single entry point (`CaptureBundle`) that:
	- loads a bundle manifest,
	- validates referenced files exist,
	- offers typed accessors to common assets.
	"""

	from __future__ import annotations

	import json
	from dataclasses import dataclass
	from pathlib import Path
	from typing import Any, Dict, List, Optional, Tuple, Union
	import numpy as np

	from ..models.capture_models import CaptureManifest, DetailedAnnotation
	from .dataset_layout import CaptureBundleLayout, validate_paths_exist


	class CaptureBundleError(ValueError):
	pass


	@dataclass(frozen=True)
	class _CalibrationCompat:
	rig_extrinsics_path: Optional[str] = None
	sync_offsets_path: Optional[str] = None


	@dataclass(frozen=True)
	class _AnnotationsCompat:
	quick_annotation_path: Optional[str] = None
	detailed_annotation_path: Optional[str] = None


	@dataclass(frozen=True)
	class _DeviceCompat:
	device_id: str
	video_path: Optional[str] = None
	intrinsics_path: Optional[str] = None
	timestamps_path: Optional[str] = None
	arkit_poses_path: Optional[str] = None
	lidar_depth_dir: Optional[str] = None
	# Optional forward-compat passthrough (mirrors pydantic extra)
	model_extra: Dict[str, Any] = None # type: ignore[assignment]


	@dataclass(frozen=True)
	class _ManifestCompat:
	schema_version: str
	capture_id: str
	devices: List[_DeviceCompat]
	calibration: Optional[_CalibrationCompat] = None
	annotations: Optional[_AnnotationsCompat] = None
	teacher_outputs: Optional[Any] = None
	metadata: Dict[str, Any] = None # type: ignore[assignment]


	@dataclass(frozen=True)
	class CaptureBundle:
	root: Path
	# Backward-compatible view of the manifest. For v1 this is derived from
	# the pydantic model; for v2 this is synthesized from the stream registry.
	manifest: Union[CaptureManifest, _ManifestCompat]
	manifest_obj: Dict[str, Any]
	schema_version: str
	_v2_stream_index: Dict[Tuple[str, str], str]

	@classmethod
	def load(cls, root: Path) -> CaptureBundle:
	root = Path(root)
	layout = CaptureBundleLayout(root=root)
	if not root.exists():
	raise CaptureBundleError(f"Capture bundle root does not exist: {root}")
	if not layout.manifest_path.exists():
	raise CaptureBundleError(f"Missing manifest.json at: {layout.manifest_path}")

	try:
	manifest_obj = json.loads(layout.manifest_path.read_text())
	except Exception as e:
	raise CaptureBundleError(f"Failed to parse manifest.json: {e}") from e

	schema_version = str(manifest_obj.get("schema_version", "1.0") or "1.0")

	# v1: strict pydantic schema
	if schema_version.startswith("1"):
	try:
	manifest = CaptureManifest.model_validate(manifest_obj)
	except Exception as e:
	raise CaptureBundleError(f"Invalid manifest schema: {e}") from e
	bundle = cls(
	root=root,
	manifest=manifest,
	manifest_obj=manifest_obj,
	schema_version=schema_version,
	_v2_stream_index={},
	)
	bundle.validate(repairable_ok=False)
	return bundle

	# v2: stream-centric schema. Synthesize a backward-compatible manifest view.
	if not schema_version.startswith("2"):
	raise CaptureBundleError(f"Unsupported manifest schema_version: {schema_version}")

	devices = manifest_obj.get("devices", []) or []
	if not isinstance(devices, list) or not devices:
	raise CaptureBundleError("v2 manifest has no devices[] pointers")

	# Build stream index: (device_id, kind) -> stream.json path
	v2_stream_index: Dict[Tuple[str, str], str] = {}
	for s in manifest_obj.get("streams", []) or []:
	if not isinstance(s, dict):
	continue
	did = s.get("device_id")
	kind = s.get("kind")
	path = s.get("path")
	if (
	isinstance(did, str)
	and isinstance(kind, str)
	and isinstance(path, str)
	and did
	and kind
	and path
	):
	v2_stream_index[(did, kind)] = path

	def _resolve_stream_data_rel(did: str, kind: str) -> Optional[str]:
	sp = v2_stream_index.get((did, kind))
	if not sp:
	return None
	sj_path = (root / sp).resolve()
	if not sj_path.exists():
	return None
	try:
	sj = json.loads(sj_path.read_text())
	except Exception:
	return None
	data = sj.get("data") if isinstance(sj, dict) else None
	if isinstance(data, dict) and isinstance(data.get("path"), str) and data["path"]:
	# Convert to bundle-root-relative path
	rel = (sj_path.parent / data["path"]).resolve()
	try:
	return str(rel.relative_to(root))
	except Exception:
	return str(rel)
	return None

	compat_devices: List[_DeviceCompat] = []
	for dref in devices:
	if not isinstance(dref, dict):
	continue
	did = dref.get("device_id")
	p = dref.get("path")
	if not (isinstance(did, str) and did and isinstance(p, str) and p):
	continue

	# Prefer stream registry for primary assets.
	video_rel = _resolve_stream_data_rel(did, "video.rgb")
	# Intrinsics: v2 prefers per-device calibration/intrinsics.json;
	# fall back to v1 intrinsics.json.
	intr_v2 = root / "devices" / did / "calibration" / "intrinsics.json"
	intr_v1 = root / "devices" / did / "intrinsics.json"
	intr_rel = None
	if intr_v2.exists():
	intr_rel = str(intr_v2.relative_to(root))
	elif intr_v1.exists():
	intr_rel = str(intr_v1.relative_to(root))

	ts_v1 = root / "devices" / did / "timestamps.json"
	ts_rel = str(ts_v1.relative_to(root)) if ts_v1.exists() else None

	poses_v1 = root / "devices" / did / "arkit_poses.json"
	poses_rel = str(poses_v1.relative_to(root)) if poses_v1.exists() else None

	depth_dir_v1 = root / "devices" / did / "depth"
	depth_dir_rel = str(depth_dir_v1.relative_to(root)) if depth_dir_v1.exists() else None

	extra_streams: Dict[str, Any] = {}
	if depth_dir_rel:
	extra_streams["depth"] = {"directory": depth_dir_rel}

	compat_devices.append(
	_DeviceCompat(
	device_id=did,
	video_path=video_rel,
	intrinsics_path=intr_rel,
	timestamps_path=ts_rel,
	arkit_poses_path=poses_rel,
	lidar_depth_dir=None,
	model_extra={"streams": extra_streams} if extra_streams else {},
	)
	)

	if not compat_devices:
	raise CaptureBundleError("v2 manifest has no usable device entries")

	# Calibration + annotations compat: map well-known files when present.
	calib_files = []
	calib = (
	manifest_obj.get("calibration")
	if isinstance(manifest_obj.get("calibration"), dict)
	else {}
	)
	if isinstance(calib, dict) and isinstance(calib.get("files"), list):
	calib_files = [str(x) for x in calib.get("files") if isinstance(x, str)]
	cal = _CalibrationCompat(
	rig_extrinsics_path=(
	"calibration/rig_extrinsics.json"
	if "calibration/rig_extrinsics.json" in calib_files
	else None
	),
	sync_offsets_path=(
	"calibration/sync_offsets.json"
	if "calibration/sync_offsets.json" in calib_files
	else None
	),
	)

	ann_files = []
	anns = (
	manifest_obj.get("annotations")
	if isinstance(manifest_obj.get("annotations"), dict)
	else {}
	)
	if isinstance(anns, dict) and isinstance(anns.get("files"), list):
	ann_files = [str(x) for x in anns.get("files") if isinstance(x, str)]
	ann = _AnnotationsCompat(
	quick_annotation_path=(
	"annotations/quick_annotation.json"
	if "annotations/quick_annotation.json" in ann_files
	else None
	),
	detailed_annotation_path=(
	"annotations/detailed_annotation.json"
	if "annotations/detailed_annotation.json" in ann_files
	else None
	),
	)

	compat_manifest = _ManifestCompat(
	schema_version=schema_version,
	capture_id=str(manifest_obj.get("capture_id") or ""),
	devices=compat_devices,
	calibration=cal,
	annotations=ann,
	metadata={},
	)

	bundle = cls(
	root=root,
	manifest=compat_manifest,
	manifest_obj=manifest_obj,
	schema_version=schema_version,
	_v2_stream_index=v2_stream_index,
	)
	bundle.validate(repairable_ok=False)
	return bundle

	@property
	def layout(self) -> CaptureBundleLayout:
	return CaptureBundleLayout(root=self.root)

	def validate(self, repairable_ok: bool = True) -> None:
	"""
	Validate that referenced paths exist.

	If `repairable_ok` is True, missing optional assets do not fail validation.
	"""
	rels: List[Optional[str]] = []
	devices = getattr(self.manifest, "devices", []) or []
	for d in devices:
	rels.extend(
	[
	getattr(d, "video_path", None),
	getattr(d, "intrinsics_path", None),
	getattr(d, "timestamps_path", None),
	getattr(d, "arkit_poses_path", None),
	]
	)
	rels.append(getattr(d, "lidar_depth_dir", None))
	# WaveformMobile forward-compat: some manifests store depth under
	# device.extra.streams.depth.
	# Prefer lidar_depth_dir, but validate stream directory when present.
	extra = getattr(d, "model_extra", None) or {}
	streams = extra.get("streams") if isinstance(extra, dict) else None
	if isinstance(streams, dict):
	depth = streams.get("depth")
	if isinstance(depth, dict):
	rel = depth.get("directory")
	if isinstance(rel, str) and rel:
	rels.append(rel)

	if getattr(self.manifest, "calibration", None):
	cal = self.manifest.calibration # type: ignore[union-attr]
	rels.extend(
	[
	getattr(cal, "rig_extrinsics_path", None),
	getattr(cal, "sync_offsets_path", None),
	]
	)
	if getattr(self.manifest, "annotations", None):
	ann = self.manifest.annotations # type: ignore[union-attr]
	rels.extend(
	[
	getattr(ann, "quick_annotation_path", None),
	getattr(ann, "detailed_annotation_path", None),
	]
	)
	if getattr(self.manifest, "teacher_outputs", None):
	tout = self.manifest.teacher_outputs # type: ignore[union-attr]
	rels.extend(
	[
	getattr(tout, "depth_dir", None),
	getattr(tout, "uncertainty_dir", None),
	getattr(tout, "reconstruction_path", None),
	]
	)

	errors = validate_paths_exist(self.root, rels)
	if errors and not repairable_ok:
	raise CaptureBundleError("Capture bundle validation failed:\n- " + "\n- ".join(errors))

	# ---- Convenience accessors -------------------------------------------------

	def list_devices(self) -> List[str]:
	devices = getattr(self.manifest, "devices", []) or []
	return [str(getattr(d, "device_id")) for d in devices]

	def get_device(self, device_id: str):
	devices = getattr(self.manifest, "devices", []) or []
	for d in devices:
	if str(getattr(d, "device_id")) == device_id:
	return d
	raise CaptureBundleError(f"Unknown device_id: {device_id}")

	def device_video_path(self, device_id: str) -> Path:
	d = self.get_device(device_id)
	if not getattr(d, "video_path", None):
	raise CaptureBundleError(
	f"No video_path for device_id={device_id} (schema_version={self.schema_version})"
	)
	return (self.root / str(getattr(d, "video_path"))).resolve()

	def device_intrinsics_path(self, device_id: str) -> Path:
	d = self.get_device(device_id)
	if not getattr(d, "intrinsics_path", None):
	raise CaptureBundleError(
	f"No intrinsics_path for device_id={device_id} "
	f"(schema_version={self.schema_version})"
	)
	return (self.root / str(getattr(d, "intrinsics_path"))).resolve()

	def device_timestamps_path(self, device_id: str) -> Path:
	d = self.get_device(device_id)
	if not getattr(d, "timestamps_path", None):
	raise CaptureBundleError(
	f"No timestamps_path for device_id={device_id} "
	f"(schema_version={self.schema_version}). "
	"Use the timeline.frames stream (v2) instead."
	)
	return (self.root / str(getattr(d, "timestamps_path"))).resolve()

	def device_arkit_poses_path(self, device_id: str) -> Optional[Path]:
	d = self.get_device(device_id)
	if not getattr(d, "arkit_poses_path", None):
	return None
	return (self.root / str(getattr(d, "arkit_poses_path"))).resolve()

	def device_lidar_depth_dir(self, device_id: str) -> Optional[Path]:
	d = self.get_device(device_id)
	if not getattr(d, "lidar_depth_dir", None):
	return None
	return (self.root / str(getattr(d, "lidar_depth_dir"))).resolve()

	def device_depth_dir_best_effort(self, device_id: str) -> Optional[Path]:
	"""
	Prefer canonical `lidar_depth_dir`, but fall back to WaveformMobile packed stream directory
	stored under `device.streams.depth.directory` if present.
	"""
	d = self.get_device(device_id)
	if getattr(d, "lidar_depth_dir", None):
	p = (self.root / str(getattr(d, "lidar_depth_dir"))).resolve()
	return p
	extra = getattr(d, "model_extra", None) or {}
	if not isinstance(extra, dict):
	return None
	streams = extra.get("streams")
	if not isinstance(streams, dict):
	return None
	depth = streams.get("depth")
	if not isinstance(depth, dict):
	return None
	rel = depth.get("directory")
	if not isinstance(rel, str) or not rel:
	return None
	return (self.root / rel).resolve()

	# ---- v2 stream-centric helpers --------------------------------------------

	def v2_has_streams(self) -> bool:
	return bool(self.schema_version.startswith("2") and self._v2_stream_index)

	def v2_stream_ref(self, *, device_id: str, kind: str) -> Optional[Path]:
	"""
	Return the path to `stream.json` for (device_id, kind) when present in v2.
	"""
	if not self.schema_version.startswith("2"):
	return None
	rel = self._v2_stream_index.get((device_id, kind))
	return (self.root / rel).resolve() if rel else None

	def v2_stream_json(self, *, device_id: str, kind: str) -> Optional[Dict[str, Any]]:
	p = self.v2_stream_ref(device_id=device_id, kind=kind)
	if not p or not p.exists():
	return None
	try:
	obj = json.loads(p.read_text())
	return obj if isinstance(obj, dict) else None
	except Exception:
	return None

	def v2_stream_data_path(self, *, device_id: str, kind: str) -> Optional[Path]:
	sj = self.v2_stream_json(device_id=device_id, kind=kind)
	if not sj:
	return None
	sp = self.v2_stream_ref(device_id=device_id, kind=kind)
	if not sp:
	return None
	data = sj.get("data") if isinstance(sj.get("data"), dict) else None
	if not isinstance(data, dict):
	return None
	rel = data.get("path")
	if not isinstance(rel, str) or not rel:
	return None
	return (sp.parent / rel).resolve()

	# ---- WaveformMobile optional sensor streams -----------------------------------------

	def _device_streams_extra(self, device_id: str) -> Dict[str, Any]:
	d = self.get_device(device_id)
	extra = getattr(d, "model_extra", None) or {}
	if not isinstance(extra, dict):
	return {}
	streams = extra.get("streams")
	return streams if isinstance(streams, dict) else {}

	def device_imu_paths(
	self, device_id: str
	) -> tuple[Optional[Path], Optional[Path], Optional[Path]]:
	"""
	Return (imu_stream.bin, imu_frames.bin, imu_index.json) paths when present
	in device.streams.imu.
	"""
	streams = self._device_streams_extra(device_id)
	imu = streams.get("imu")
	if not isinstance(imu, dict):
	return (None, None, None)
	stream = imu.get("stream")
	frames = imu.get("frames")
	index = imu.get("index")
	sp = (self.root / str(stream)).resolve() if isinstance(stream, str) and stream else None
	fp = (self.root / str(frames)).resolve() if isinstance(frames, str) and frames else None
	ip = (self.root / str(index)).resolve() if isinstance(index, str) and index else None
	return (sp, fp, ip)

	def device_barometer_paths(self, device_id: str) -> tuple[Optional[Path], Optional[Path]]:
	"""
	Return (barometer_stream.bin, barometer/index.json) paths when present in
	device.streams.barometer.
	"""
	streams = self._device_streams_extra(device_id)
	bar = streams.get("barometer")
	if not isinstance(bar, dict):
	return (None, None)
	stream = bar.get("stream")
	index = bar.get("index")
	sp = (self.root / str(stream)).resolve() if isinstance(stream, str) and stream else None
	ip = (self.root / str(index)).resolve() if isinstance(index, str) and index else None
	return (sp, ip)

	def load_detailed_annotation(self) -> Optional[DetailedAnnotation]:
	if not self.manifest.annotations or not self.manifest.annotations.detailed_annotation_path:
	return None
	p = (self.root / self.manifest.annotations.detailed_annotation_path).resolve()
	if not p.exists():
	return None
	try:
	obj = json.loads(p.read_text())
	return DetailedAnnotation.model_validate(obj)
	except Exception as e:
	raise CaptureBundleError(f"Failed to parse detailed annotation: {p}: {e}") from e

	def load_intrinsics_matrix(self, device_id: str) -> np.ndarray:
	"""
	Load intrinsics from JSON as a (3, 3) float32 matrix.

	The exact intrinsics JSON schema is intentionally flexible; we accept:
	- {"K": [[...],[...],[...]]} or
	- {"intrinsics": [[...],[...],[...]]} or
	- {"fx":..., "fy":..., "cx":..., "cy":...}
	"""
	p = self.device_intrinsics_path(device_id)
	obj = json.loads(p.read_text())
	if "K" in obj:
	K = np.asarray(obj["K"], dtype=np.float32)
	elif "intrinsics" in obj:
	K = np.asarray(obj["intrinsics"], dtype=np.float32)
	elif all(k in obj for k in ("fx", "fy", "cx", "cy")):
	fx, fy, cx, cy = float(obj["fx"]), float(obj["fy"]), float(obj["cx"]), float(obj["cy"])
	K = np.array([[fx, 0.0, cx], [0.0, fy, cy], [0.0, 0.0, 1.0]], dtype=np.float32)
	else:
	raise CaptureBundleError(f"Unsupported intrinsics JSON schema: {p}")
	if K.shape != (3, 3):
	raise CaptureBundleError(f"Intrinsics must be 3x3, got {K.shape} in {p}")
	return K

	def load_intrinsics_and_distortion(
	self, device_id: str
	) -> tuple[np.ndarray, Optional[np.ndarray]]:
	"""
	Load intrinsics matrix K and (optional) distortion coefficients.

	Distortion support is best-effort and forward-compatible. Accepted keys:
	- {"distortion": [...]} (OpenCV-style coeffs)
	- {"dist": [...]} or {"dist_coeffs": [...]}
	- {"k": [...]} (legacy)
	"""
	p = self.device_intrinsics_path(device_id)
	obj = json.loads(p.read_text())
	K = self.load_intrinsics_matrix(device_id)
	dist = None
	for key in ("distortion", "dist", "dist_coeffs", "k"):
	if key in obj and isinstance(obj[key], list):
	try:
	dist = np.asarray(obj[key], dtype=np.float64).reshape(-1)
	except Exception:
	dist = None
	break
	return K.astype(np.float32, copy=False), dist

	def load_sync_offsets(self) -> Optional[Dict[str, float]]:
	"""
	Load per-device sync offsets (seconds) if available.
	"""
	if not self.manifest.calibration or not self.manifest.calibration.sync_offsets_path:
	return None
	p = (self.root / self.manifest.calibration.sync_offsets_path).resolve()
	if not p.exists():
	return None
	obj = json.loads(p.read_text())
	# Expected {device_id: offset_seconds}
	return {str(k): float(v) for k, v in obj.items()}

	def load_rig_extrinsics(self) -> Optional[Dict[str, Any]]:
	"""
	Load rig extrinsics if available.

	The exact schema is not locked yet; we return raw JSON for now.
	"""
	if not self.manifest.calibration or not self.manifest.calibration.rig_extrinsics_path:
	return None
	p = (self.root / self.manifest.calibration.rig_extrinsics_path).resolve()
	if not p.exists():
	return None
	return json.loads(p.read_text())