Spaces:

bing-yan
/

trace

Sleeping

trace / inference.py

bingyan user

Rebrand TRACE -> SPARK

8619a66 about 1 month ago

68.8 kB

	"""
	SPARK inference engine.

	Loads trained EC and TPD models and runs end-to-end inference
	from preprocessed arrays (dimensionless for CV, physical for TPD).
	"""

	import json
	import sys
	import os
	from pathlib import Path

	import numpy as np
	import torch



	import flow_model as _fm_module
	import multi_mechanism_model as _mm_module
	import tpd_model as _tpd_mod
	import generate_tpd_data as _tpd_gen
	from multi_mechanism_model import MultiMechanismFlow
	from tpd_model import MultiMechanismFlowTPD
	from flow_model import MECHANISM_PARAMS, ActNorm
	from generate_tpd_data import TPD_MECHANISM_PARAMS


	def _fix_actnorm_initialized(model):
	"""Mark all ActNorm layers as initialized after loading a checkpoint.

	Old checkpoints lack the ``_initialized`` buffer, so ``load_state_dict``
	leaves it at ``False``. The first forward pass would then overwrite the
	trained ``log_scale``/``bias`` with data-dependent statistics.
	"""
	for module in model.modules():
	if isinstance(module, ActNorm) and not module.initialized:
	module.initialized = True


	class SPARKPredictor:
	"""Unified predictor for both EC (cyclic voltammetry) and TPD domains."""

	def __init__(self, ec_checkpoint=None, tpd_checkpoint=None, device=None,
	ec_image_checkpoint=None, tpd_image_checkpoint=None,
	ec_joint_checkpoint=None, tpd_joint_checkpoint=None):
	if device is None:
	device = "cuda" if torch.cuda.is_available() else "cpu"
	self.device = device

	self.ec_model = None
	self.ec_norm_stats = None
	self.tpd_model = None
	self.tpd_norm_stats = None

	# Optional image-input variants; loaded only if checkpoint paths
	# are supplied. Each is a separate model with its own encoder.
	self.ec_image_model = None
	self.ec_image_mech_list = None
	self.tpd_image_model = None
	self.tpd_image_mech_list = None

	# Optional Phase-2 joint (image + waveform) variants.
	self.ec_joint_model = None
	self.ec_joint_mech_list = None
	self.tpd_joint_model = None
	self.tpd_joint_mech_list = None

	if ec_checkpoint is not None:
	self._load_ec(ec_checkpoint)
	if tpd_checkpoint is not None:
	self._load_tpd(tpd_checkpoint)
	if ec_image_checkpoint is not None:
	self._load_ec_image(ec_image_checkpoint)
	if tpd_image_checkpoint is not None:
	self._load_tpd_image(tpd_image_checkpoint)
	if ec_joint_checkpoint is not None:
	self._load_ec_joint(ec_joint_checkpoint)
	if tpd_joint_checkpoint is not None:
	self._load_tpd_joint(tpd_joint_checkpoint)

	@property
	def has_ec_image_model(self) -> bool:
	return self.ec_image_model is not None

	@property
	def has_tpd_image_model(self) -> bool:
	return self.tpd_image_model is not None

	@property
	def has_ec_joint_model(self) -> bool:
	return self.ec_joint_model is not None

	@property
	def has_tpd_joint_model(self) -> bool:
	return self.tpd_joint_model is not None

	def _load_ec(self, ckpt_path):
	    """Load the waveform EC model and any JSON statistics stored near it.

	    Steps, in order: read the checkpoint, align the module-level
	    ``MECHANISM_LIST`` globals with the checkpoint's ``mechanism_list``
	    (if it has one), build ``MultiMechanismFlow`` from the stored
	    hyper-parameters, restore the weights non-strictly, and finally look
	    for ``*norm_stats.json`` / ``*theta_stats.json`` in the checkpoint's
	    directory and its parent.

	    Args:
	        ckpt_path: path (str or Path) of the checkpoint file.
	    """
	    ckpt_path = Path(ckpt_path)
	    # NOTE(review): weights_only=False lets torch.load unpickle arbitrary
	    # objects, so only trusted checkpoint files should be passed here.
	    checkpoint = torch.load(ckpt_path, map_location="cpu", weights_only=False)
	    hparams = checkpoint["args"]

	    # A checkpoint trained on a custom mechanism subset (e.g. v14_9mech)
	    # records it in its args. Patch the globals in flow_model and
	    # multi_mechanism_model BEFORE building the model so the classifier
	    # and flow_heads sizes match the checkpoint; otherwise the
	    # strict=False load below would silently drop classifier weights.
	    ckpt_mechs = hparams.get("mechanism_list")
	    if ckpt_mechs is not None:
	        patched = list(ckpt_mechs)
	        _fm_module.MECHANISM_LIST = patched
	        _mm_module.MECHANISM_LIST = patched
	    self.ec_mechanism_list = list(_fm_module.MECHANISM_LIST)

	    hparam_defaults = (
	        ("d_context", 128),
	        ("d_model", 128),
	        ("n_coupling_layers", 6),
	        ("hidden_dim", 96),
	        ("coupling_type", "spline"),
	        ("n_bins", 8),
	        ("tail_bound", 5.0),
	        ("aggregation", "set_transformer"),
	        ("use_summary_features", False),
	    )
	    self.ec_model = MultiMechanismFlow(
	        **{key: hparams.get(key, fallback) for key, fallback in hparam_defaults}
	    )

	    # A trained OOD head must exist on the model before its weights can
	    # be restored, so create it first when the state dict contains one.
	    weights = checkpoint["model_state_dict"]
	    if any(key.startswith("ood_head.") for key in weights):
	        ood_meta = checkpoint.get("ood_head_meta", {})
	        self.ec_model.init_ood_head(
	            hidden_dim=ood_meta.get("hidden_dim", 64),
	            extra_input_dim=ood_meta.get("extra_input_dim", 0),
	            use_nll=ood_meta.get("use_nll", False),
	            use_posterior_width=ood_meta.get("use_posterior_width", False),
	        )

	    missing, unexpected = self.ec_model.load_state_dict(weights, strict=False)
	    # Only buffers such as ActNorm._initialized may be missing or extra.
	    bad_missing = [k for k in missing if not k.endswith("_initialized")]
	    bad_unexpected = [k for k in unexpected if not k.endswith("_initialized")]
	    if bad_missing or bad_unexpected:
	        print(f"[SPARKPredictor] WARNING: state_dict mismatch on EC ckpt.")
	        if bad_missing:
	            tail = " ..." if len(bad_missing) > 6 else ""
	            print(f" missing ({len(bad_missing)}): {bad_missing[:6]}{tail}")
	        if bad_unexpected:
	            tail = " ..." if len(bad_unexpected) > 6 else ""
	            print(f" unexpected({len(bad_unexpected)}): {bad_unexpected[:6]}{tail}")
	    _fix_actnorm_initialized(self.ec_model)
	    self.ec_model.to(self.device).eval()

	    # Statistics files: try the checkpoint directory first, then its
	    # parent; within a directory the first existing candidate name wins.
	    ckpt_dir = ckpt_path.parent
	    stem = ckpt_path.stem.replace("best", "").rstrip("_")
	    prefix = f"{stem}_" if stem else ""
	    search_dirs = (ckpt_dir, ckpt_dir.parent)

	    norm_names = (f"{prefix}norm_stats.json", "ec_norm_stats.json", "norm_stats.json")
	    for folder in search_dirs:
	        hit = next((folder / nm for nm in norm_names if (folder / nm).exists()), None)
	        if hit is not None:
	            with open(hit) as fh:
	                self.ec_norm_stats = json.load(fh)
	        if self.ec_norm_stats is not None:
	            break

	    theta_names = (f"{prefix}theta_stats.json", "ec_theta_stats.json", "theta_stats.json")
	    for folder in search_dirs:
	        hit = next((folder / nm for nm in theta_names if (folder / nm).exists()), None)
	        if hit is not None:
	            with open(hit) as fh:
	                self.ec_theta_stats = json.load(fh)
	        if getattr(self, "ec_theta_stats", None) is not None:
	            break

	def _load_tpd(self, ckpt_path):
	    """Load the waveform TPD model and any JSON statistics stored near it.

	    Mirrors the EC loader: read the checkpoint, align the TPD mechanism
	    globals with the checkpoint's ``mechanism_list`` (if present), build
	    ``MultiMechanismFlowTPD``, restore weights non-strictly, then look
	    for ``*norm_stats.json`` / ``*theta_stats.json`` in the checkpoint's
	    directory and its parent.

	    Args:
	        ckpt_path: path (str or Path) of the checkpoint file.
	    """
	    ckpt_path = Path(ckpt_path)
	    # NOTE(review): weights_only=False lets torch.load unpickle arbitrary
	    # objects, so only trusted checkpoint files should be passed here.
	    checkpoint = torch.load(ckpt_path, map_location="cpu", weights_only=False)
	    hparams = checkpoint["args"]

	    self.tpd_use_summary = hparams.get("use_summary_features", False)

	    # Align the module globals AND pass mechanism_list explicitly so the
	    # classifier/flow_heads match the checkpoint shape (e.g.
	    # tpd_11mech_v1 has 11 mechs, not the default 13).
	    ckpt_mechs = hparams.get("mechanism_list")
	    if ckpt_mechs is not None:
	        patched = list(ckpt_mechs)
	        _tpd_gen.TPD_MECHANISM_LIST = patched
	        _tpd_gen.TPD_MECHANISM_TO_ID = {
	            name: idx for idx, name in enumerate(patched)
	        }
	        _tpd_mod.TPD_MECHANISM_LIST = patched
	        # dataset_tpd is optional; patch it only when it can be imported.
	        try:
	            import dataset_tpd as _ds_tpd
	        except ImportError:
	            pass
	        else:
	            _ds_tpd.TPD_MECHANISM_LIST = patched
	    self.tpd_mechanism_list = list(_tpd_gen.TPD_MECHANISM_LIST)

	    hparam_defaults = (
	        ("d_context", 128),
	        ("d_model", 128),
	        ("n_coupling_layers", 6),
	        ("hidden_dim", 96),
	        ("coupling_type", "spline"),
	        ("n_bins", 8),
	        ("tail_bound", 5.0),
	    )
	    self.tpd_model = MultiMechanismFlowTPD(
	        **{key: hparams.get(key, fallback) for key, fallback in hparam_defaults},
	        use_summary_features=self.tpd_use_summary,
	        use_bounded_flow=hparams.get("use_bounded_flow", False),
	        mechanism_list=self.tpd_mechanism_list,
	    )

	    # Create the OOD head first when the state dict carries weights for it.
	    weights = checkpoint["model_state_dict"]
	    if any(key.startswith("ood_head.") for key in weights):
	        ood_meta = checkpoint.get("ood_head_meta", {})
	        self.tpd_model.init_ood_head(
	            hidden_dim=ood_meta.get("hidden_dim", 64),
	            extra_input_dim=ood_meta.get("extra_input_dim", 0),
	        )

	    missing, unexpected = self.tpd_model.load_state_dict(weights, strict=False)
	    # Only ``_initialized`` buffers may be missing or extra.
	    bad_missing = [k for k in missing if not k.endswith("_initialized")]
	    bad_unexpected = [k for k in unexpected if not k.endswith("_initialized")]
	    if bad_missing or bad_unexpected:
	        print(f"[SPARKPredictor] WARNING: state_dict mismatch on TPD ckpt.")
	        if bad_missing:
	            tail = " ..." if len(bad_missing) > 6 else ""
	            print(f" missing ({len(bad_missing)}): {bad_missing[:6]}{tail}")
	        if bad_unexpected:
	            tail = " ..." if len(bad_unexpected) > 6 else ""
	            print(f" unexpected({len(bad_unexpected)}): {bad_unexpected[:6]}{tail}")
	    _fix_actnorm_initialized(self.tpd_model)
	    self.tpd_model.to(self.device).eval()

	    # Statistics files: try the checkpoint directory first, then its
	    # parent; within a directory the first existing candidate name wins.
	    ckpt_dir = ckpt_path.parent
	    stem = ckpt_path.stem.replace("best", "").rstrip("_")
	    prefix = f"{stem}_" if stem else ""
	    search_dirs = (ckpt_dir, ckpt_dir.parent)

	    norm_names = (f"{prefix}norm_stats.json", "tpd_norm_stats.json", "norm_stats.json")
	    for folder in search_dirs:
	        hit = next((folder / nm for nm in norm_names if (folder / nm).exists()), None)
	        if hit is not None:
	            with open(hit) as fh:
	                self.tpd_norm_stats = json.load(fh)
	        if self.tpd_norm_stats is not None:
	            break

	    theta_names = (f"{prefix}theta_stats.json", "tpd_theta_stats.json", "theta_stats.json")
	    for folder in search_dirs:
	        hit = next((folder / nm for nm in theta_names if (folder / nm).exists()), None)
	        if hit is not None:
	            with open(hit) as fh:
	                self.tpd_theta_stats = json.load(fh)
	        if getattr(self, "tpd_theta_stats", None) is not None:
	            break

	# =====================================================================
	# Image-input variants (parallel to the waveform models above)
	# =====================================================================

	@staticmethod
	def _detect_input_mode(state_dict) -> str:
	"""Detect input_mode from a checkpoint's state_dict keys.

	Phase-1 image -> encoder.per_cv_encoder.stem.*
	Phase-1 wave -> encoder.per_cv_encoder.conv.*
	Phase-2 joint -> encoder.image_encoder.* + encoder.waveform_encoder.*
	"""
	if any(k.startswith("encoder.image_encoder.") for k in state_dict) and \
	any(k.startswith("encoder.waveform_encoder.") for k in state_dict):
	return "image+waveform"
	if any(k.startswith("encoder.per_cv_encoder.stem.") for k in state_dict):
	return "image"
	return "waveform"

	def _build_image_model_state(self, ckpt_path, builder_cls,
	is_tpd=False, expected_input_mode="image"):
	ckpt_path = Path(ckpt_path)
	ckpt = torch.load(ckpt_path, map_location="cpu", weights_only=False)
	args = ckpt["args"] if isinstance(ckpt, dict) and "args" in ckpt else {}
	# Older image-mode trainers didn't store input_mode in args; sniff
	# the state_dict to disambiguate.
	actual = (args.get("input_mode")
	or self._detect_input_mode(ckpt["model_state_dict"]))
	if actual != expected_input_mode:
	raise ValueError(
	f"{expected_input_mode!r} checkpoint expected; got input_mode="
	f"{actual!r} for {ckpt_path}"
	)
	return ckpt_path, ckpt, args

	def _load_ec_image(self, ckpt_path):
	    """Load the image-input EC model from ``ckpt_path``.

	    The checkpoint must be an "image" checkpoint (checked by
	    ``_build_image_model_state``). The model is built with
	    ``input_mode="image"`` and summary features disabled, its weights are
	    restored non-strictly, and it is moved to ``self.device`` in eval mode.
	    """
	    ckpt_path, ckpt, hparams = self._build_image_model_state(
	        ckpt_path, MultiMechanismFlow,
	    )

	    # Patch the module-level mechanism lists before building the model so
	    # its head sizes follow the checkpoint's mechanism subset.
	    ckpt_mechs = hparams.get("mechanism_list")
	    if ckpt_mechs is not None:
	        patched = list(ckpt_mechs)
	        _fm_module.MECHANISM_LIST = patched
	        _mm_module.MECHANISM_LIST = patched
	    self.ec_image_mech_list = list(_fm_module.MECHANISM_LIST)

	    hparam_defaults = (
	        ("d_context", 128),
	        ("d_model", 128),
	        ("n_coupling_layers", 6),
	        ("hidden_dim", 96),
	        ("coupling_type", "spline"),
	        ("n_bins", 8),
	        ("tail_bound", 5.0),
	        ("aggregation", "set_transformer"),
	    )
	    self.ec_image_model = MultiMechanismFlow(
	        **{key: hparams.get(key, fallback) for key, fallback in hparam_defaults},
	        use_summary_features=False,
	        input_mode="image",
	        image_in_channels=hparams.get("image_in_channels", 1),
	    )

	    # Create the OOD head first when the state dict carries weights for it.
	    weights = ckpt["model_state_dict"]
	    if any(key.startswith("ood_head.") for key in weights):
	        ood_meta = ckpt.get("ood_head_meta", {})
	        self.ec_image_model.init_ood_head(
	            hidden_dim=ood_meta.get("hidden_dim", 64),
	            extra_input_dim=ood_meta.get("extra_input_dim", 0),
	            use_nll=ood_meta.get("use_nll", False),
	            use_posterior_width=ood_meta.get("use_posterior_width", False),
	        )

	    missing, unexpected = self.ec_image_model.load_state_dict(
	        weights, strict=False)
	    # Only ``_initialized`` buffers may be missing or extra.
	    bad_missing = [k for k in missing if not k.endswith("_initialized")]
	    bad_unexpected = [k for k in unexpected if not k.endswith("_initialized")]
	    if bad_missing or bad_unexpected:
	        print("[SPARKPredictor] WARNING: state_dict mismatch on EC image ckpt.")
	        if bad_missing:
	            tail = " ..." if len(bad_missing) > 6 else ""
	            print(f" missing ({len(bad_missing)}): {bad_missing[:6]}{tail}")
	        if bad_unexpected:
	            tail = " ..." if len(bad_unexpected) > 6 else ""
	            print(f" unexpected({len(bad_unexpected)}): {bad_unexpected[:6]}{tail}")
	    _fix_actnorm_initialized(self.ec_image_model)
	    self.ec_image_model.to(self.device).eval()

	def _load_tpd_image(self, ckpt_path):
	    """Load the image-input TPD model from ``ckpt_path``.

	    The checkpoint must be an "image" checkpoint (checked by
	    ``_build_image_model_state``). The model is built with
	    ``input_mode="image"`` and summary features disabled, its weights are
	    restored non-strictly, and it is moved to ``self.device`` in eval mode.
	    """
	    ckpt_path, ckpt, hparams = self._build_image_model_state(
	        ckpt_path, MultiMechanismFlowTPD, is_tpd=True,
	    )

	    # Align the TPD mechanism globals with the checkpoint before building.
	    ckpt_mechs = hparams.get("mechanism_list")
	    if ckpt_mechs is not None:
	        patched = list(ckpt_mechs)
	        _tpd_gen.TPD_MECHANISM_LIST = patched
	        _tpd_gen.TPD_MECHANISM_TO_ID = {
	            name: idx for idx, name in enumerate(patched)
	        }
	        _tpd_mod.TPD_MECHANISM_LIST = patched
	        # dataset_tpd is optional; patch it only when it can be imported.
	        try:
	            import dataset_tpd as _ds_tpd
	        except ImportError:
	            pass
	        else:
	            _ds_tpd.TPD_MECHANISM_LIST = patched
	    self.tpd_image_mech_list = list(_tpd_gen.TPD_MECHANISM_LIST)

	    hparam_defaults = (
	        ("d_context", 128),
	        ("d_model", 128),
	        ("n_coupling_layers", 6),
	        ("hidden_dim", 96),
	        ("coupling_type", "spline"),
	        ("n_bins", 8),
	        ("tail_bound", 5.0),
	    )
	    self.tpd_image_model = MultiMechanismFlowTPD(
	        **{key: hparams.get(key, fallback) for key, fallback in hparam_defaults},
	        use_summary_features=False,
	        use_bounded_flow=hparams.get("use_bounded_flow", False),
	        mechanism_list=self.tpd_image_mech_list,
	        input_mode="image",
	        image_in_channels=hparams.get("image_in_channels", 1),
	    )

	    # Create the OOD head first when the state dict carries weights for it.
	    weights = ckpt["model_state_dict"]
	    if any(key.startswith("ood_head.") for key in weights):
	        ood_meta = ckpt.get("ood_head_meta", {})
	        self.tpd_image_model.init_ood_head(
	            hidden_dim=ood_meta.get("hidden_dim", 64),
	            extra_input_dim=ood_meta.get("extra_input_dim", 0),
	        )

	    missing, unexpected = self.tpd_image_model.load_state_dict(
	        weights, strict=False)
	    # Only ``_initialized`` buffers may be missing or extra.
	    bad_missing = [k for k in missing if not k.endswith("_initialized")]
	    bad_unexpected = [k for k in unexpected if not k.endswith("_initialized")]
	    if bad_missing or bad_unexpected:
	        print("[SPARKPredictor] WARNING: state_dict mismatch on TPD image ckpt.")
	        if bad_missing:
	            tail = " ..." if len(bad_missing) > 6 else ""
	            print(f" missing ({len(bad_missing)}): {bad_missing[:6]}{tail}")
	        if bad_unexpected:
	            tail = " ..." if len(bad_unexpected) > 6 else ""
	            print(f" unexpected({len(bad_unexpected)}): {bad_unexpected[:6]}{tail}")
	    _fix_actnorm_initialized(self.tpd_image_model)
	    self.tpd_image_model.to(self.device).eval()

	# =====================================================================
	# Phase-2 joint (image + waveform) loaders
	# =====================================================================

	def _load_ec_joint(self, ckpt_path):
	    """Load the Phase-2 joint (image + waveform) EC model from ``ckpt_path``.

	    The checkpoint must be an "image+waveform" checkpoint (checked by
	    ``_build_image_model_state``). The model is built with
	    ``input_mode="image+waveform"`` and summary features disabled, its
	    weights are restored non-strictly, and it is moved to ``self.device``
	    in eval mode.
	    """
	    ckpt_path, ckpt, hparams = self._build_image_model_state(
	        ckpt_path, MultiMechanismFlow,
	        expected_input_mode="image+waveform",
	    )

	    # Patch the module-level mechanism lists before building the model so
	    # its head sizes follow the checkpoint's mechanism subset.
	    ckpt_mechs = hparams.get("mechanism_list")
	    if ckpt_mechs is not None:
	        patched = list(ckpt_mechs)
	        _fm_module.MECHANISM_LIST = patched
	        _mm_module.MECHANISM_LIST = patched
	    self.ec_joint_mech_list = list(_fm_module.MECHANISM_LIST)

	    hparam_defaults = (
	        ("d_context", 128),
	        ("d_model", 128),
	        ("n_coupling_layers", 6),
	        ("hidden_dim", 96),
	        ("coupling_type", "spline"),
	        ("n_bins", 8),
	        ("tail_bound", 5.0),
	        ("aggregation", "set_transformer"),
	    )
	    self.ec_joint_model = MultiMechanismFlow(
	        **{key: hparams.get(key, fallback) for key, fallback in hparam_defaults},
	        use_summary_features=False,
	        input_mode="image+waveform",
	        image_in_channels=hparams.get("image_in_channels", 1),
	    )

	    # Create the OOD head first when the state dict carries weights for it.
	    weights = ckpt["model_state_dict"]
	    if any(key.startswith("ood_head.") for key in weights):
	        ood_meta = ckpt.get("ood_head_meta", {})
	        self.ec_joint_model.init_ood_head(
	            hidden_dim=ood_meta.get("hidden_dim", 64),
	            extra_input_dim=ood_meta.get("extra_input_dim", 0),
	            use_nll=ood_meta.get("use_nll", False),
	            use_posterior_width=ood_meta.get("use_posterior_width", False),
	        )

	    missing, unexpected = self.ec_joint_model.load_state_dict(
	        weights, strict=False)
	    # Only ``_initialized`` buffers may be missing or extra.
	    bad_missing = [k for k in missing if not k.endswith("_initialized")]
	    bad_unexpected = [k for k in unexpected if not k.endswith("_initialized")]
	    if bad_missing or bad_unexpected:
	        print("[SPARKPredictor] WARNING: state_dict mismatch on EC joint ckpt.")
	        if bad_missing:
	            tail = " ..." if len(bad_missing) > 6 else ""
	            print(f" missing ({len(bad_missing)}): {bad_missing[:6]}{tail}")
	        if bad_unexpected:
	            tail = " ..." if len(bad_unexpected) > 6 else ""
	            print(f" unexpected({len(bad_unexpected)}): {bad_unexpected[:6]}{tail}")
	    _fix_actnorm_initialized(self.ec_joint_model)
	    self.ec_joint_model.to(self.device).eval()

	def _load_tpd_joint(self, ckpt_path):
	    """Load the Phase-2 joint (image + waveform) TPD model from ``ckpt_path``.

	    The checkpoint must be an "image+waveform" checkpoint (checked by
	    ``_build_image_model_state``). The model is built with
	    ``input_mode="image+waveform"`` and summary features disabled, its
	    weights are restored non-strictly, and it is moved to ``self.device``
	    in eval mode.
	    """
	    ckpt_path, ckpt, hparams = self._build_image_model_state(
	        ckpt_path, MultiMechanismFlowTPD, is_tpd=True,
	        expected_input_mode="image+waveform",
	    )

	    # Align the TPD mechanism globals with the checkpoint before building.
	    ckpt_mechs = hparams.get("mechanism_list")
	    if ckpt_mechs is not None:
	        patched = list(ckpt_mechs)
	        _tpd_gen.TPD_MECHANISM_LIST = patched
	        _tpd_gen.TPD_MECHANISM_TO_ID = {
	            name: idx for idx, name in enumerate(patched)
	        }
	        _tpd_mod.TPD_MECHANISM_LIST = patched
	        # dataset_tpd is optional; patch it only when it can be imported.
	        try:
	            import dataset_tpd as _ds_tpd
	        except ImportError:
	            pass
	        else:
	            _ds_tpd.TPD_MECHANISM_LIST = patched
	    self.tpd_joint_mech_list = list(_tpd_gen.TPD_MECHANISM_LIST)

	    hparam_defaults = (
	        ("d_context", 128),
	        ("d_model", 128),
	        ("n_coupling_layers", 6),
	        ("hidden_dim", 96),
	        ("coupling_type", "spline"),
	        ("n_bins", 8),
	        ("tail_bound", 5.0),
	    )
	    self.tpd_joint_model = MultiMechanismFlowTPD(
	        **{key: hparams.get(key, fallback) for key, fallback in hparam_defaults},
	        use_summary_features=False,
	        use_bounded_flow=hparams.get("use_bounded_flow", False),
	        mechanism_list=self.tpd_joint_mech_list,
	        input_mode="image+waveform",
	        image_in_channels=hparams.get("image_in_channels", 1),
	    )

	    # Create the OOD head first when the state dict carries weights for it.
	    weights = ckpt["model_state_dict"]
	    if any(key.startswith("ood_head.") for key in weights):
	        ood_meta = ckpt.get("ood_head_meta", {})
	        self.tpd_joint_model.init_ood_head(
	            hidden_dim=ood_meta.get("hidden_dim", 64),
	            extra_input_dim=ood_meta.get("extra_input_dim", 0),
	        )

	    missing, unexpected = self.tpd_joint_model.load_state_dict(
	        weights, strict=False)
	    # Only ``_initialized`` buffers may be missing or extra.
	    bad_missing = [k for k in missing if not k.endswith("_initialized")]
	    bad_unexpected = [k for k in unexpected if not k.endswith("_initialized")]
	    if bad_missing or bad_unexpected:
	        print("[SPARKPredictor] WARNING: state_dict mismatch on TPD joint ckpt.")
	        if bad_missing:
	            tail = " ..." if len(bad_missing) > 6 else ""
	            print(f" missing ({len(bad_missing)}): {bad_missing[:6]}{tail}")
	        if bad_unexpected:
	            tail = " ..." if len(bad_unexpected) > 6 else ""
	            print(f" unexpected({len(bad_unexpected)}): {bad_unexpected[:6]}{tail}")
	    _fix_actnorm_initialized(self.tpd_joint_model)
	    self.tpd_joint_model.to(self.device).eval()

	@staticmethod
	def _pil_to_grayscale_tensor(pil_image, target_size=224):
	    """Turn a PIL image into a ``[1, target_size, target_size]`` float32
	    tensor with values in [0, 1].

	    The image is converted to 8-bit grayscale and, unless it already has
	    the requested square size, resized with bilinear interpolation.
	    """
	    from PIL import Image as PILImage

	    wanted_size = (target_size, target_size)
	    gray = pil_image.convert("L")
	    if gray.size != wanted_size:
	        gray = gray.resize(wanted_size, PILImage.BILINEAR)
	    pixels = np.asarray(gray, dtype=np.float32) / 255.0
	    tensor = torch.from_numpy(pixels)
	    return tensor.unsqueeze(0)  # [1, H, W]

	def _build_image_input(self, pil_images, sigmas, flux_scales,
	                       target_size=224):
	    """Build image-mode model input from a list of PIL images.

	    Args:
	        pil_images: list of PIL.Image objects (one per scan rate /
	            heating rate).
	        sigmas: 1-D array of raw scan rates (V/s) or heating rates (K/s).
	            Values are clipped to at least 1e-10 and converted to log10.
	        flux_scales: 1-D array of log10(peak |signal|) per scan/curve.
	            If None, zeros are used (per the original author's note the
	            model still works, since flux_scales is additive conditioning
	            that the network learned to handle).
	        target_size: image edge length expected by the encoder.

	    Returns:
	        dict of tensors on ``self.device``:
	        "input" ``[1, N, 1, H, W]`` grayscale images,
	        "scan_mask" ``[1, N]`` all-True bool mask,
	        "sigmas" log10 rates with a leading batch axis,
	        "flux_scales" float32 scales with a leading batch axis.
	    """
	    n = len(pil_images)
	    imgs = torch.stack(
	        [self._pil_to_grayscale_tensor(p, target_size) for p in pil_images]
	    )  # [N, 1, H, W]
	    x = imgs.unsqueeze(0).to(self.device)  # [1, N, 1, H, W]
	    scan_mask = torch.ones(1, n, dtype=torch.bool, device=self.device)

	    # Clip before the log so zero or negative rates cannot produce
	    # -inf / NaN.
	    sigmas_log = np.log10(
	        np.clip(np.asarray(sigmas, dtype=np.float32), 1e-10, None)
	    )
	    sigmas_t = torch.from_numpy(sigmas_log).unsqueeze(0).to(self.device)

	    if flux_scales is None:
	        fs_t = torch.zeros(1, n, dtype=torch.float32, device=self.device)
	    else:
	        fs_t = torch.from_numpy(
	            np.asarray(flux_scales, dtype=np.float32)
	        ).unsqueeze(0).to(self.device)

	    return {
	        "input": x, "scan_mask": scan_mask,
	        "sigmas": sigmas_t, "flux_scales": fs_t,
	    }

	@torch.no_grad()
	def predict_ec_image(self, pil_images, sigmas, flux_scales=None,
	n_samples=500, temperature=1.0):
	"""Run image-mode CV inference. `pil_images` length should match `sigmas`.

	Returns the same dict shape as `predict_ec`.
	"""
	if self.ec_image_model is None:
	raise RuntimeError("EC image model not loaded")
	if len(pil_images) != len(sigmas):
	raise ValueError(
	f"#images ({len(pil_images)}) must match #sigmas ({len(sigmas)})"
	)
	tensors = self._build_image_input(pil_images, sigmas, flux_scales)
	pred = self.ec_image_model.predict(
	tensors["input"],
	scan_mask=tensors["scan_mask"],
	sigmas=tensors["sigmas"],
	flux_scales=tensors["flux_scales"],
	n_samples=n_samples,
	temperature=temperature,
	)
	return self._format_ec_pred(pred, self.ec_image_mech_list)

	def _build_joint_input_ec(self, pil_images, sigmas,
	potentials, fluxes, times):
	"""Build the joint encoder's input dict for CV.

	Combines `_build_image_input` (image branch) with the same
	normalization/resampling pipeline `_prepare_ec_tensor` uses for the
	waveform branch, then fuses them into the dict shape the joint
	encoder expects.
	"""
	n_scans = len(pil_images)
	if len(sigmas) != n_scans or len(potentials) != n_scans \
	or len(fluxes) != n_scans:
	raise ValueError(
	"predict_ec_joint: pil_images, sigmas, potentials, fluxes "
	"must all have the same length"
	)

	# Image branch: [1, N, 1, H, W]
	imgs = torch.stack(
	[self._pil_to_grayscale_tensor(p, target_size=224)
	for p in pil_images]
	).unsqueeze(0).to(self.device)
	scan_mask_image = torch.ones(1, n_scans, dtype=torch.bool,
	device=self.device)

	# Waveform branch: re-use the existing tensor builder.
	wf_tensors = self._prepare_ec_tensor(potentials, fluxes, times, sigmas)
	x = {
	"image": imgs,
	"waveform": wf_tensors["input"],
	"scan_mask_image": scan_mask_image,
	"scan_mask_waveform": wf_tensors["scan_mask"],
	}
	return x, wf_tensors["sigmas"], wf_tensors["flux_scales"]

	def _build_joint_input_tpd(self, pil_images, betas, temperatures, rates):
	n_rates = len(pil_images)
	if len(betas) != n_rates or len(temperatures) != n_rates \
	or len(rates) != n_rates:
	raise ValueError(
	"predict_tpd_joint: pil_images, betas, temperatures, rates "
	"must all have the same length"
	)
	imgs = torch.stack(
	[self._pil_to_grayscale_tensor(p, target_size=224)
	for p in pil_images]
	).unsqueeze(0).to(self.device)
	scan_mask_image = torch.ones(1, n_rates, dtype=torch.bool,
	device=self.device)
	wf_tensors = self._prepare_tpd_tensor(temperatures, rates, betas)
	x = {
	"image": imgs,
	"waveform": wf_tensors["input"],
	"scan_mask_image": scan_mask_image,
	"scan_mask_waveform": wf_tensors["scan_mask"],
	}
	return x, wf_tensors["sigmas"], wf_tensors["flux_scales"]

	@torch.no_grad()
	def predict_ec_joint(self, pil_images, sigmas, potentials, fluxes,
	times=None, n_samples=500, temperature=1.0):
	"""Run Phase-2 joint CV inference: image + waveform together."""
	if self.ec_joint_model is None:
	raise RuntimeError("EC joint model not loaded")
	x, sigmas_t, flux_scales_t = self._build_joint_input_ec(
	pil_images, sigmas, potentials, fluxes, times,
	)
	pred = self.ec_joint_model.predict(
	x, scan_mask=None, sigmas=sigmas_t, flux_scales=flux_scales_t,
	n_samples=n_samples, temperature=temperature,
	)
	return self._format_ec_pred(pred, self.ec_joint_mech_list)

	@torch.no_grad()
	def predict_tpd_joint(self, pil_images, betas, temperatures, rates,
	n_samples=500, temperature=1.0):
	"""Run Phase-2 joint TPD inference: image + waveform together."""
	if self.tpd_joint_model is None:
	raise RuntimeError("TPD joint model not loaded")
	x, sigmas_t, flux_scales_t = self._build_joint_input_tpd(
	pil_images, betas, temperatures, rates,
	)
	pred = self.tpd_joint_model.predict(
	x, scan_mask=None, sigmas=sigmas_t, flux_scales=flux_scales_t,
	n_samples=n_samples, temperature=temperature,
	)
	return self._format_tpd_pred(pred, self.tpd_joint_mech_list)

	@torch.no_grad()
	def predict_tpd_image(self, pil_images, betas, flux_scales=None,
	n_samples=500, temperature=1.0):
	"""Run image-mode TPD inference. Returns the same shape as predict_tpd."""
	if self.tpd_image_model is None:
	raise RuntimeError("TPD image model not loaded")
	if len(pil_images) != len(betas):
	raise ValueError(
	f"#images ({len(pil_images)}) must match #betas ({len(betas)})"
	)
	tensors = self._build_image_input(pil_images, betas, flux_scales)
	pred = self.tpd_image_model.predict(
	tensors["input"],
	scan_mask=tensors["scan_mask"],
	sigmas=tensors["sigmas"],
	flux_scales=tensors["flux_scales"],
	n_samples=n_samples,
	temperature=temperature,
	)
	return self._format_tpd_pred(pred, self.tpd_image_mech_list)

	def _format_ec_pred(self, pred, mech_list):
	probs = pred["mechanism_probs"][0].cpu().numpy()
	pred_idx = int(pred["mechanism_pred"][0].cpu().item())
	pred_mech = mech_list[pred_idx]
	param_stats = {}
	samples_dict = {}
	for mech in mech_list:
	if pred["samples"][mech] is not None:
	s = pred["samples"][mech][0].cpu().numpy()
	samples_dict[mech] = s
	param_stats[mech] = {
	"names": MECHANISM_PARAMS[mech]["names"],
	"mean": s.mean(axis=0).tolist(),
	"std": s.std(axis=0).tolist(),
	"median": np.median(s, axis=0).tolist(),
	"q05": np.quantile(s, 0.05, axis=0).tolist(),
	"q95": np.quantile(s, 0.95, axis=0).tolist(),
	}
	ood_score = pred.get("ood_score")
	ood_score_val = (float(ood_score[0].cpu().item())
	if ood_score is not None else None)
	return {
	"domain": "ec",
	"mechanism_probs": {m: float(probs[i]) for i, m in enumerate(mech_list)},
	"mechanism_names": mech_list,
	"predicted_mechanism": pred_mech,
	"predicted_mechanism_idx": pred_idx,
	"parameter_stats": param_stats,
	"posterior_samples": samples_dict,
	"ood_score": ood_score_val,
	}

	def _format_tpd_pred(self, pred, mech_list):
	probs = pred["mechanism_probs"][0].cpu().numpy()
	pred_idx = int(pred["mechanism_pred"][0].cpu().item())
	pred_mech = mech_list[pred_idx]
	param_stats = {}
	samples_dict = {}
	for mech in mech_list:
	if pred["samples"][mech] is not None:
	s = pred["samples"][mech][0].cpu().numpy()
	samples_dict[mech] = s
	param_stats[mech] = {
	"names": TPD_MECHANISM_PARAMS[mech]["names"],
	"mean": s.mean(axis=0).tolist(),
	"std": s.std(axis=0).tolist(),
	"median": np.median(s, axis=0).tolist(),
	"q05": np.quantile(s, 0.05, axis=0).tolist(),
	"q95": np.quantile(s, 0.95, axis=0).tolist(),
	}
	ood_score = pred.get("ood_score")
	ood_score_val = (float(ood_score[0].cpu().item())
	if ood_score is not None else None)
	return {
	"domain": "tpd",
	"mechanism_probs": {m: float(probs[i]) for i, m in enumerate(mech_list)},
	"mechanism_names": mech_list,
	"predicted_mechanism": pred_mech,
	"predicted_mechanism_idx": pred_idx,
	"parameter_stats": param_stats,
	"posterior_samples": samples_dict,
	"ood_score": ood_score_val,
	}

	# =====================================================================
	# Hybrid predictors: run image-mode + waveform-mode in parallel and
	# combine, with selectable strategies.
	# =====================================================================

	@staticmethod
	def _ensemble_results(image_result, waveform_result, param_names_lookup):
	"""Combine image-mode + waveform-mode predictions.

	- mechanism_probs: arithmetic mean of the two per-mech dicts.
	- predicted_mechanism: argmax of the ensembled probs.
	- posterior_samples: per-mech, concatenate the samples from each
	model (when both produced samples), then recompute parameter_stats.
	- ood_score: max of the two scores (more conservative; image-mode's
	OOD means P(ID), so 'higher' is safer; we take min instead — see
	below). We surface the IMAGE-mode OOD score as the headline OOD,
	but if the waveform model also has one we take the lower of the
	two so the banner is shown when either is concerned.

	`param_names_lookup` is a dict mech -> list of parameter names; it
	provides 'names' for the recomputed parameter_stats.
	"""
	if image_result is None:
	return waveform_result
	if waveform_result is None:
	return image_result

	mech_list = image_result["mechanism_names"]
	probs_a = image_result["mechanism_probs"]
	probs_b = waveform_result["mechanism_probs"]

	ensemble_probs = {
	m: 0.5 * (probs_a.get(m, 0.0) + probs_b.get(m, 0.0))
	for m in mech_list
	}
	s = sum(ensemble_probs.values())
	if s > 0:
	ensemble_probs = {m: v / s for m, v in ensemble_probs.items()}
	sorted_probs = sorted(ensemble_probs.items(), key=lambda kv: -kv[1])
	top_mech, _ = sorted_probs[0]
	top_idx = mech_list.index(top_mech)

	samples_dict = {}
	param_stats = {}
	for mech in mech_list:
	sa = image_result["posterior_samples"].get(mech)
	sb = waveform_result["posterior_samples"].get(mech)
	if sa is not None and sb is not None:
	combined = np.concatenate([sa, sb], axis=0)
	elif sa is not None:
	combined = sa
	elif sb is not None:
	combined = sb
	else:
	combined = None
	if combined is None:
	continue
	samples_dict[mech] = combined
	names = param_names_lookup.get(mech, [f"p{i}" for i in range(combined.shape[-1])])
	param_stats[mech] = {
	"names": names,
	"mean": combined.mean(axis=0).tolist(),
	"std": combined.std(axis=0).tolist(),
	"median": np.median(combined, axis=0).tolist(),
	"q05": np.quantile(combined, 0.05, axis=0).tolist(),
	"q95": np.quantile(combined, 0.95, axis=0).tolist(),
	}

	ood_a = image_result.get("ood_score")
	ood_b = waveform_result.get("ood_score")
	ood_vals = [v for v in (ood_a, ood_b) if v is not None]
	ood_ensemble = min(ood_vals) if ood_vals else None # P(ID); lower=more concerning

	return {
	"domain": image_result["domain"],
	"mechanism_probs": ensemble_probs,
	"mechanism_names": mech_list,
	"predicted_mechanism": top_mech,
	"predicted_mechanism_idx": top_idx,
	"parameter_stats": param_stats,
	"posterior_samples": samples_dict,
	"ood_score": ood_ensemble,
	"_ensemble": True,
	}

	@staticmethod
	def _agreement_stats(image_result, waveform_result):
	if image_result is None or waveform_result is None:
	return {
	"available": False,
	"top_mech_match": None,
	"top_prob_image": None,
	"top_prob_waveform": None,
	}
	return {
	"available": True,
	"top_mech_match": (
	image_result["predicted_mechanism"]
	== waveform_result["predicted_mechanism"]
	),
	"top_prob_image": float(max(image_result["mechanism_probs"].values())),
	"top_prob_waveform": float(max(waveform_result["mechanism_probs"].values())),
	"image_mech": image_result["predicted_mechanism"],
	"waveform_mech": waveform_result["predicted_mechanism"],
	}

	def _predict_ec_two_paths(
	self, pil_images, sigmas, potentials, fluxes, times=None,
	n_samples=500, temperature=1.0, do_preprocess=True,
	):
	"""Run image-mode + waveform-mode + joint CV inference (whichever are
	available). Returns (image_result, waveform_result, joint_result,
	preprocessing_meta). Any result may be None if the corresponding
	model is missing or the input arrays were not provided.
	"""
	image_result = None
	waveform_result = None
	joint_result = None
	preproc_meta = []

	# Preprocess images once; both image-only and joint paths reuse them.
	preprocessed = None
	if pil_images and (self.has_ec_image_model or self.has_ec_joint_model):
	if do_preprocess:
	from image_preprocessing import prepare_for_image_mode
	preprocessed = []
	for p in pil_images:
	out, meta = prepare_for_image_mode(p)
	preprocessed.append(out)
	preproc_meta.append(meta)
	else:
	preprocessed = list(pil_images)
	preproc_meta = [{} for _ in pil_images]

	if self.has_ec_image_model and preprocessed is not None:
	flux_scales = None
	if fluxes is not None:
	flux_scales = [
	float(np.log10(np.max(np.abs(np.asarray(f))) + 1e-30))
	for f in fluxes
	]
	try:
	image_result = self.predict_ec_image(
	preprocessed, sigmas, flux_scales=flux_scales,
	n_samples=n_samples, temperature=temperature,
	)
	except Exception as exc:
	print(f"[SPARKPredictor] image-mode CV failed: {exc}")

	if self.ec_model is not None and potentials is not None and fluxes is not None:
	try:
	waveform_result = self.predict_ec(
	potentials, fluxes, sigmas, times=times,
	n_samples=n_samples, temperature=temperature,
	)
	except Exception as exc:
	print(f"[SPARKPredictor] waveform CV failed: {exc}")

	if (self.has_ec_joint_model and preprocessed is not None
	and potentials is not None and fluxes is not None):
	try:
	joint_result = self.predict_ec_joint(
	preprocessed, sigmas, potentials, fluxes, times=times,
	n_samples=n_samples, temperature=temperature,
	)
	except Exception as exc:
	print(f"[SPARKPredictor] joint CV failed: {exc}")

	return image_result, waveform_result, joint_result, preproc_meta

	def predict_ec_hybrid(
	    self, pil_images, sigmas, potentials=None, fluxes=None, times=None,
	    n_samples=500, temperature=1.0, mode="ensemble",
	    do_preprocess=True, ood_fallback_threshold=0.3,
	):
	    """Hybrid CV inference over the image, waveform and joint paths.

	    Every path whose model and inputs are available is run, then one
	    result is chosen as the headline according to ``mode``.

	    Args:
	        pil_images: list of PIL.Image (one per scan rate). Needed by the
	            image and joint paths; those are skipped when it is missing.
	        sigmas: list of dimensionless scan rates.
	        potentials, fluxes: dimensionless waveforms (one array per scan
	            rate). Needed by the waveform and joint paths; those are
	            skipped when either is missing.
	        times: optional dimensionless time arrays.
	        n_samples: posterior samples to draw in each path.
	        temperature: sampling temperature forwarded to each path.
	        mode: one of 'ensemble', 'image_only', 'digitize_only',
	            'auto_fallback', 'joint'.
	        do_preprocess: whether to run prepare_for_image_mode on the
	            images before they are used (default True).
	        ood_fallback_threshold: with mode='auto_fallback', an image-mode
	            OOD score (P(ID)) below this value triggers fallback to the
	            waveform result.

	    Returns dict with:
	        headline: result dict to display (same shape as predict_ec).
	        image_mode: image-mode result or None.
	        waveform_mode: waveform result or None.
	        joint_mode: joint image+waveform result or None.
	        preprocessing_meta: per-image preprocessing metadata list.
	        agreement: agreement_stats(image, waveform) dict.
	        method_used: human-readable string naming the method that
	            produced 'headline'.
	    """
	    path_outputs = self._predict_ec_two_paths(
	        pil_images, sigmas, potentials, fluxes, times,
	        n_samples=n_samples,
	        temperature=temperature,
	        do_preprocess=do_preprocess,
	    )
	    image_out, wave_out, joint_out, meta = path_outputs

	    agreement = self._agreement_stats(image_out, wave_out)

	    # Parameter names per mechanism, used when results are ensembled.
	    names_by_mech = {
	        mech: spec["names"] for mech, spec in MECHANISM_PARAMS.items()
	    }
	    headline, method_used = self._select_headline(
	        mode, image_out, wave_out,
	        names_by_mech, ood_fallback_threshold,
	        joint_result=joint_out,
	    )

	    report = {"headline": headline}
	    report["image_mode"] = image_out
	    report["waveform_mode"] = wave_out
	    report["joint_mode"] = joint_out
	    report["preprocessing_meta"] = meta
	    report["agreement"] = agreement
	    report["method_used"] = method_used
	    return report

	def _predict_tpd_two_paths(
	self, pil_images, betas, temperatures, rates,
	n_samples=500, temperature=1.0, do_preprocess=True,
	):
	image_result = None
	waveform_result = None
	joint_result = None
	preproc_meta = []

	preprocessed = None
	if pil_images and (self.has_tpd_image_model or self.has_tpd_joint_model):
	if do_preprocess:
	from image_preprocessing import prepare_for_image_mode
	preprocessed = []
	for p in pil_images:
	out, meta = prepare_for_image_mode(p)
	preprocessed.append(out)
	preproc_meta.append(meta)
	else:
	preprocessed = list(pil_images)
	preproc_meta = [{} for _ in pil_images]

	if self.has_tpd_image_model and preprocessed is not None:
	flux_scales = None
	if rates is not None:
	flux_scales = [
	float(np.log10(np.max(np.abs(np.asarray(r))) + 1e-30))
	for r in rates
	]
	try:
	image_result = self.predict_tpd_image(
	preprocessed, betas, flux_scales=flux_scales,
	n_samples=n_samples, temperature=temperature,
	)
	except Exception as exc:
	print(f"[SPARKPredictor] image-mode TPD failed: {exc}")

	if self.tpd_model is not None and temperatures is not None and rates is not None:
	try:
	waveform_result = self.predict_tpd(
	temperatures, rates, betas,
	n_samples=n_samples, temperature=temperature,
	)
	except Exception as exc:
	print(f"[SPARKPredictor] waveform TPD failed: {exc}")

	if (self.has_tpd_joint_model and preprocessed is not None
	and temperatures is not None and rates is not None):
	try:
	joint_result = self.predict_tpd_joint(
	preprocessed, betas, temperatures, rates,
	n_samples=n_samples, temperature=temperature,
	)
	except Exception as exc:
	print(f"[SPARKPredictor] joint TPD failed: {exc}")

	return image_result, waveform_result, joint_result, preproc_meta

	def predict_tpd_hybrid(
	    self, pil_images, betas, temperatures=None, rates=None,
	    n_samples=500, temperature=1.0, mode="ensemble",
	    do_preprocess=True, ood_fallback_threshold=0.3,
	):
	    """Hybrid TPD inference over the image, waveform and joint paths.

	    Runs every path whose model and inputs are available, then picks the
	    headline result according to ``mode``. The returned dict has the keys
	    ``headline``, ``image_mode``, ``waveform_mode``, ``joint_mode``,
	    ``preprocessing_meta``, ``agreement`` and ``method_used``.
	    """
	    path_outputs = self._predict_tpd_two_paths(
	        pil_images, betas, temperatures, rates,
	        n_samples=n_samples,
	        temperature=temperature,
	        do_preprocess=do_preprocess,
	    )
	    image_out, wave_out, joint_out, meta = path_outputs

	    agreement = self._agreement_stats(image_out, wave_out)

	    # Parameter names per mechanism, used when results are ensembled.
	    names_by_mech = {
	        mech: spec["names"] for mech, spec in TPD_MECHANISM_PARAMS.items()
	    }
	    headline, method_used = self._select_headline(
	        mode, image_out, wave_out,
	        names_by_mech, ood_fallback_threshold,
	        joint_result=joint_out,
	    )

	    report = {"headline": headline}
	    report["image_mode"] = image_out
	    report["waveform_mode"] = wave_out
	    report["joint_mode"] = joint_out
	    report["preprocessing_meta"] = meta
	    report["agreement"] = agreement
	    report["method_used"] = method_used
	    return report

	def _select_headline(self, mode, image_result, waveform_result,
	param_names_lookup, ood_fallback_threshold,
	joint_result=None):
	"""Pick the headline result based on `mode`. Falls back gracefully
	when one of the available paths is unavailable.

	Supported modes: ``ensemble``, ``image_only``, ``digitize_only``,
	``auto_fallback``, ``joint``.
	"""
	if (image_result is None and waveform_result is None
	and joint_result is None):
	raise RuntimeError(
	"Hybrid inference: image, waveform, and joint paths all "
	"failed or were unavailable."
	)

	if mode == "joint":
	if joint_result is not None:
	return joint_result, "joint image+waveform (Phase 2)"
	if image_result is not None and waveform_result is not None:
	return (
	self._ensemble_results(
	image_result, waveform_result, param_names_lookup),
	"ensemble (joint unavailable)",
	)
	if image_result is not None:
	return image_result, "image-direct (joint unavailable)"
	return waveform_result, "digitize-then-infer (joint unavailable)"

	if mode == "image_only":
	if image_result is not None:
	return image_result, "image-direct"
	return waveform_result, "digitize-then-infer (image fallback)"

	if mode == "digitize_only":
	if waveform_result is not None:
	return waveform_result, "digitize-then-infer"
	return image_result, "image-direct (waveform fallback)"

	if mode == "auto_fallback":
	if image_result is None:
	return waveform_result, "digitize-then-infer (no image model)"
	ood = image_result.get("ood_score")
	if (ood is not None and ood < ood_fallback_threshold
	and waveform_result is not None):
	return waveform_result, (
	f"digitize-then-infer (image OOD score "
	f"{ood:.2f} < {ood_fallback_threshold:.2f})"
	)
	return image_result, "image-direct"

	# ensemble (default): prefer joint when present, else mix image+wave
	if joint_result is not None:
	return joint_result, "joint image+waveform (Phase 2)"
	if image_result is not None and waveform_result is not None:
	return (
	self._ensemble_results(
	image_result, waveform_result, param_names_lookup),
	"ensemble (image + digitize)",
	)
	if image_result is not None:
	return image_result, "image-direct (waveform unavailable)"
	return waveform_result, "digitize-then-infer (image unavailable)"

	def _prepare_ec_tensor(self, potentials, fluxes, times, sigmas):
	"""
	Build model input tensor from preprocessed dimensionless CV data.

	Args:
	potentials: list of 1-D arrays (dimensionless theta)
	fluxes: list of 1-D arrays (dimensionless flux)
	times: list of 1-D arrays (dimensionless time) or None
	sigmas: 1-D array of dimensionless scan rates

	Returns:
	dict of tensors ready for model.predict()
	"""
	from scipy.interpolate import interp1d

	n_scans = len(potentials)
	T_target = 672

	pot_resampled = []
	flux_resampled = []
	time_resampled = []
	flux_scales = []

	for i in range(n_scans):
	pot = np.asarray(potentials[i], dtype=np.float32)
	flx = np.asarray(fluxes[i], dtype=np.float32)

	if times is not None and times[i] is not None:
	tim = np.asarray(times[i], dtype=np.float32)
	else:
	theta_range = pot.max() - pot.min()
	sigma = sigmas[i]
	total_time = 2.0 * theta_range / sigma
	tim = np.linspace(0, total_time, len(pot), dtype=np.float32)

	peak = np.max(np.abs(flx)) + 1e-30
	flux_scales.append(np.log10(peak))
	flx = flx / peak

	t_uniform = np.linspace(tim[0], tim[-1], T_target)
	pot_resampled.append(
	interp1d(tim, pot, kind="linear", fill_value="extrapolate")(t_uniform)
	)
	flux_resampled.append(
	interp1d(tim, flx, kind="linear", fill_value="extrapolate")(t_uniform)
	)
	time_resampled.append(t_uniform)

	pot_arr = np.stack(pot_resampled).astype(np.float32)
	flx_arr = np.stack(flux_resampled).astype(np.float32)
	tim_arr = np.stack(time_resampled).astype(np.float32)

	ns = self.ec_norm_stats
	if ns:
	pot_arr = (pot_arr - ns["potential"][0]) / ns["potential"][1]
	flx_arr = (flx_arr - ns["flux"][0]) / ns["flux"][1]
	tim_arr = (tim_arr - ns["time"][0]) / ns["time"][1]

	# [1, N, 3, T]
	waveforms = np.stack([pot_arr, flx_arr, tim_arr], axis=1)
	x = torch.from_numpy(waveforms).unsqueeze(0).to(self.device)
	scan_mask = torch.ones(1, n_scans, T_target, dtype=torch.bool, device=self.device)
	sigmas_t = torch.from_numpy(
	np.log10(np.asarray(sigmas, dtype=np.float32))
	).unsqueeze(0).to(self.device)
	flux_scales_t = torch.from_numpy(
	np.asarray(flux_scales, dtype=np.float32)
	).unsqueeze(0).to(self.device)

	return {
	"input": x,
	"scan_mask": scan_mask,
	"sigmas": sigmas_t,
	"flux_scales": flux_scales_t,
	}

	def _prepare_tpd_tensor(self, temperatures, rates, betas):
	"""
	Build model input tensor from TPD data.

	Args:
	temperatures: list of 1-D arrays (K)
	rates: list of 1-D arrays (arb. units)
	betas: 1-D array of heating rates (K/s)

	Returns:
	dict of tensors ready for model.predict()
	"""
	from scipy.interpolate import interp1d

	n_rates = len(temperatures)
	T_target = 500

	temp_resampled = []
	rate_resampled = []

	for i in range(n_rates):
	temp = np.asarray(temperatures[i], dtype=np.float32)
	rate = np.asarray(rates[i], dtype=np.float32)

	t_uniform = np.linspace(temp[0], temp[-1], T_target)
	temp_resampled.append(t_uniform)
	rate_resampled.append(
	interp1d(temp, rate, kind="linear", fill_value="extrapolate")(t_uniform)
	)

	temp_arr = np.stack(temp_resampled).astype(np.float32)
	rate_arr = np.stack(rate_resampled).astype(np.float32)

	summary_t = None
	if getattr(self, 'tpd_use_summary', False):
	from preprocessing import extract_tpd_summary_stats
	hr_arr = np.asarray(betas, dtype=np.float32)
	lengths = np.full(n_rates, T_target, dtype=np.int32)
	summary = extract_tpd_summary_stats(
	temp_arr, rate_arr, lengths, hr_arr, n_rates)
	summary_t = torch.from_numpy(summary).unsqueeze(0).to(self.device)

	rate_scales = []
	for i in range(n_rates):
	peak = np.max(np.abs(rate_arr[i])) + 1e-30
	rate_scales.append(np.log10(peak))
	rate_arr[i] /= peak

	ns = self.tpd_norm_stats
	if ns:
	temp_arr = (temp_arr - ns["temperature"][0]) / ns["temperature"][1]
	rate_arr = (rate_arr - ns["rate"][0]) / ns["rate"][1]

	# [1, N, 2, T]
	waveforms = np.stack([temp_arr, rate_arr], axis=1)
	x = torch.from_numpy(waveforms).unsqueeze(0).to(self.device)
	scan_mask = torch.ones(1, n_rates, T_target, dtype=torch.bool, device=self.device)
	sigmas_t = torch.from_numpy(
	np.log10(np.asarray(betas, dtype=np.float32))
	).unsqueeze(0).to(self.device)
	rate_scales_t = torch.from_numpy(
	np.asarray(rate_scales, dtype=np.float32)
	).unsqueeze(0).to(self.device)

	result = {
	"input": x,
	"scan_mask": scan_mask,
	"sigmas": sigmas_t,
	"flux_scales": rate_scales_t,
	}
	if summary_t is not None:
	result["summary"] = summary_t
	return result

	@torch.no_grad()
	def predict_ec(self, potentials, fluxes, sigmas, times=None, n_samples=500, temperature=1.0):
	"""
	Run EC inference on dimensionless CV data.

	Args:
	potentials: list of 1-D arrays (dimensionless theta per scan rate)
	fluxes: list of 1-D arrays (dimensionless flux per scan rate)
	sigmas: list/array of dimensionless scan rates
	times: optional list of 1-D time arrays
	n_samples: posterior samples to draw
	temperature: sampling temperature (>1 broadens posteriors)

	Returns:
	dict with mechanism_probs, mechanism_names, predicted_mechanism,
	parameter_stats (per mechanism), posterior_samples (per mechanism)
	"""
	if self.ec_model is None:
	raise RuntimeError("EC model not loaded")

	tensors = self._prepare_ec_tensor(potentials, fluxes, times, sigmas)
	pred = self.ec_model.predict(
	tensors["input"],
	scan_mask=tensors["scan_mask"],
	sigmas=tensors["sigmas"],
	flux_scales=tensors["flux_scales"],
	n_samples=n_samples,
	temperature=temperature,
	)

	mech_list = self.ec_mechanism_list
	probs = pred["mechanism_probs"][0].cpu().numpy()
	pred_idx = int(pred["mechanism_pred"][0].cpu().item())
	pred_mech = mech_list[pred_idx]

	param_stats = {}
	samples_dict = {}
	for mech in mech_list:
	if pred["samples"][mech] is not None:
	s = pred["samples"][mech][0].cpu().numpy() # [n_samples, D]
	samples_dict[mech] = s
	param_stats[mech] = {
	"names": MECHANISM_PARAMS[mech]["names"],
	"mean": s.mean(axis=0).tolist(),
	"std": s.std(axis=0).tolist(),
	"median": np.median(s, axis=0).tolist(),
	"q05": np.quantile(s, 0.05, axis=0).tolist(),
	"q95": np.quantile(s, 0.95, axis=0).tolist(),
	}

	ood_score = pred.get("ood_score")
	ood_score_val = (float(ood_score[0].cpu().item())
	if ood_score is not None else None)

	return {
	"domain": "ec",
	"mechanism_probs": {m: float(probs[i]) for i, m in enumerate(mech_list)},
	"mechanism_names": mech_list,
	"predicted_mechanism": pred_mech,
	"predicted_mechanism_idx": pred_idx,
	"parameter_stats": param_stats,
	"posterior_samples": samples_dict,
	"ood_score": ood_score_val,
	}

	@torch.no_grad()
	def predict_tpd(self, temperatures, rates, betas, n_samples=500, temperature=1.0):
	"""
	Run TPD inference.

	Args:
	temperatures: list of 1-D arrays (K per heating rate)
	rates: list of 1-D arrays (signal per heating rate)
	betas: list/array of heating rates (K/s)
	n_samples: posterior samples to draw
	temperature: sampling temperature

	Returns:
	dict with mechanism_probs, parameter_stats, posterior_samples
	"""
	if self.tpd_model is None:
	raise RuntimeError("TPD model not loaded")

	tensors = self._prepare_tpd_tensor(temperatures, rates, betas)
	pred = self.tpd_model.predict(
	tensors["input"],
	scan_mask=tensors["scan_mask"],
	sigmas=tensors["sigmas"],
	flux_scales=tensors["flux_scales"],
	n_samples=n_samples,
	temperature=temperature,
	summary=tensors.get("summary"),
	)

	mech_list = self.tpd_mechanism_list
	probs = pred["mechanism_probs"][0].cpu().numpy()
	pred_idx = int(pred["mechanism_pred"][0].cpu().item())
	pred_mech = mech_list[pred_idx]

	param_stats = {}
	samples_dict = {}
	for mech in mech_list:
	if pred["samples"][mech] is not None:
	s = pred["samples"][mech][0].cpu().numpy()
	samples_dict[mech] = s
	param_stats[mech] = {
	"names": TPD_MECHANISM_PARAMS[mech]["names"],
	"mean": s.mean(axis=0).tolist(),
	"std": s.std(axis=0).tolist(),
	"median": np.median(s, axis=0).tolist(),
	"q05": np.quantile(s, 0.05, axis=0).tolist(),
	"q95": np.quantile(s, 0.95, axis=0).tolist(),
	}

	ood_score = pred.get("ood_score")
	ood_score_val = (float(ood_score[0].cpu().item())
	if ood_score is not None else None)

	return {
	"domain": "tpd",
	"mechanism_probs": {m: float(probs[i]) for i, m in enumerate(mech_list)},
	"mechanism_names": mech_list,
	"predicted_mechanism": pred_mech,
	"predicted_mechanism_idx": pred_idx,
	"parameter_stats": param_stats,
	"posterior_samples": samples_dict,
	"ood_score": ood_score_val,
	}

	# =====================================================================
	# Signal Reconstruction
	# =====================================================================

	def reconstruct_ec(self, result, potentials, fluxes, sigmas,
	base_params=None, mechanism=None):
	"""
	Reconstruct CV signals from inferred posterior median and compute metrics.

	Args:
	result: output dict from predict_ec()
	potentials: list of 1-D arrays (original dimensionless theta)
	fluxes: list of 1-D arrays (original dimensionless flux)
	sigmas: list of dimensionless scan rates
	base_params: dict of fixed simulation params; defaults used if None
	mechanism: which mechanism to reconstruct (default: predicted)

	Returns:
	dict with 'observed', 'reconstructed' curve lists,
	'nrmse', 'r2' per scan rate, and 'mean_nrmse', 'mean_r2'
	"""
	from evaluate_reconstruction import (
	reconstruct_ec_signal, signal_nrmse, signal_r2,
	)

	mech = mechanism or result["predicted_mechanism"]
	stats = result["parameter_stats"].get(mech)
	if stats is None:
	return None

	theta_point = np.array(stats["median"])

	if base_params is None:
	pot0 = np.asarray(potentials[0])
	base_params = {
	"theta_i": float(pot0.max()),
	"theta_v": float(pot0.min()),
	"dA": 1.0,
	"C_A_bulk": 1.0,
	"C_B_bulk": 0.0,
	"kinetics": mech,
	}

	try:
	recon_results = reconstruct_ec_signal(
	theta_point, mech, base_params, sigmas, n_spatial=64
	)
	except Exception:
	return None

	observed_curves = []
	recon_curves = []
	conc_curves = []
	nrmses = []
	r2s = []

	for i, (pot, flx, sigma) in enumerate(zip(potentials, fluxes, sigmas)):
	pot = np.asarray(pot)
	flx = np.asarray(flx)
	observed_curves.append({"x": pot, "y": flx})

	if i < len(recon_results) and recon_results[i].get("success", False):
	rec = recon_results[i]
	rec_pot = np.asarray(rec["potential"])
	rec_flx = np.asarray(rec["flux"])

	n_obs = len(pot)
	n_rec = len(rec_pot)
	t_obs = np.linspace(0, 1, n_obs)
	t_rec = np.linspace(0, 1, n_rec)
	rec_flx_interp = np.interp(t_obs, t_rec, rec_flx)
	recon_curves.append({"x": pot, "y": rec_flx_interp})
	nrmse_val = signal_nrmse(flx, rec_flx_interp)
	r2_val = signal_r2(flx, rec_flx_interp)
	nrmses.append(nrmse_val)
	r2s.append(r2_val)

	if "c_ox_surface" in rec and "c_red_surface" in rec:
	c_ox_interp = np.interp(t_obs, t_rec, np.asarray(rec["c_ox_surface"]))
	c_red_interp = np.interp(t_obs, t_rec, np.asarray(rec["c_red_surface"]))
	conc_curves.append({
	"x": pot,
	"c_ox": c_ox_interp,
	"c_red": c_red_interp,
	})
	else:
	conc_curves.append(None)
	else:
	recon_curves.append({"x": pot, "y": np.zeros_like(flx)})
	nrmses.append(float("nan"))
	r2s.append(float("nan"))
	conc_curves.append(None)

	valid_nrmse = [v for v in nrmses if np.isfinite(v)]
	valid_r2 = [v for v in r2s if np.isfinite(v)]

	return {
	"observed": observed_curves,
	"reconstructed": recon_curves,
	"concentrations": conc_curves,
	"nrmse": nrmses,
	"r2": r2s,
	"mean_nrmse": float(np.mean(valid_nrmse)) if valid_nrmse else float("nan"),
	"mean_r2": float(np.mean(valid_r2)) if valid_r2 else float("nan"),
	}

	def reconstruct_tpd(self, result, temperatures, rates, betas,
	base_params=None, mechanism=None):
	"""
	Reconstruct TPD signals from inferred posterior median and compute metrics.

	Args:
	result: output dict from predict_tpd()
	temperatures: list of 1-D arrays (K)
	rates: list of 1-D arrays (signal)
	betas: list of heating rates (K/s)
	base_params: dict of fixed simulation params; defaults used if None
	mechanism: which mechanism to reconstruct (default: predicted)

	Returns:
	dict with 'observed', 'reconstructed' curve lists,
	'nrmse', 'r2' per heating rate, and 'mean_nrmse', 'mean_r2'
	"""
	from evaluate_reconstruction import (
	reconstruct_tpd_signal, signal_nrmse, signal_r2,
	)

	mech = mechanism or result["predicted_mechanism"]
	stats = result["parameter_stats"].get(mech)
	if stats is None:
	return None

	theta_point = np.array(stats["median"])

	if base_params is None:
	temp0 = np.asarray(temperatures[0])
	base_params = {
	"mechanism": mech,
	"T_start": float(temp0.min()),
	"T_end": float(temp0.max()),
	"n_points": 500,
	}

	try:
	recon_results = reconstruct_tpd_signal(
	theta_point, mech, base_params, betas
	)
	except Exception:
	return None

	observed_curves = []
	recon_curves = []
	nrmses = []
	r2s = []

	for i, (temp, rate, beta) in enumerate(zip(temperatures, rates, betas)):
	temp = np.asarray(temp)
	rate = np.asarray(rate)
	observed_curves.append({"x": temp, "y": rate})

	if i < len(recon_results) and recon_results[i].get("success", False):
	rec = recon_results[i]
	rec_temp = np.asarray(rec["temperature"])
	rec_rate = np.asarray(rec["rate"])

	rec_rate_interp = np.interp(temp, rec_temp, rec_rate)
	recon_curves.append({"x": temp, "y": rec_rate_interp})
	nrmse_val = signal_nrmse(rate, rec_rate_interp)
	r2_val = signal_r2(rate, rec_rate_interp)

	nrmses.append(nrmse_val)
	r2s.append(r2_val)
	else:
	recon_curves.append({"x": temp, "y": np.zeros_like(rate)})
	nrmses.append(float("nan"))
	r2s.append(float("nan"))

	valid_nrmse = [v for v in nrmses if np.isfinite(v)]
	valid_r2 = [v for v in r2s if np.isfinite(v)]

	return {
	"observed": observed_curves,
	"reconstructed": recon_curves,
	"nrmse": nrmses,
	"r2": r2s,
	"mean_nrmse": float(np.mean(valid_nrmse)) if valid_nrmse else float("nan"),
	"mean_r2": float(np.mean(valid_r2)) if valid_r2 else float("nan"),
	}