Spaces:

hugging-science
/

SciMLx_Production

Runtime error

Moatasim Farooque

Remove problematic files

54fa103 25 days ago

7.71 kB

	"""Declarative experiment registry for autonomous SciML research.

	This module now loads experiment configurations from 'experiments.yaml'.
	To add a new experiment, append it to 'experiments.yaml'.
	"""

	import yaml
	from pathlib import Path
	from dataclasses import dataclass, field
	from typing import List, Optional

	# ── Config dataclass ──────────────────────────────────────────────────────────

	@dataclass
	class ExperimentConfig:
	name: str # unique key (used for dedup against results.json)
	benchmark: str # "burgers_1d" \| "darcy_2d" \| "kdv_1d" \| "wave_1d"
	model: str # "FNO" \| "RFNO" \| "AFNO" \| "FFNO" \| "UNO" \| "WNO" \| "DeepONet" \| "PODDeepONet"
	hidden_dim: int # channel width
	n_layers: int # depth (FNO blocks per level for UNO)
	n_modes: int = 16 # Fourier modes (FNO / UNO / RFNO / AFNO)
	n_levels: int = 3 # Haar levels (WNO)
	n_head: int = 4 # Attention heads (Transolver / GNOT / Transformer)
	slice_num: int = 32 # Physics slices (Transolver)
	lr: float = 1e-3 # learning rate
	batch_size: int = 64 # training batch size
	grad_clip: float = 1.0 # gradient clipping (0 = disabled)
	pino_lambda: float = 0.0 # PINO physics-loss weight
	loss_type: str = "l2_rel" # loss function
	h1_alpha: float = 0.1 # H1 loss derivative weight
	augment: bool = False # spatial-shift augmentation
	curriculum: bool = False # training curriculum
	curriculum_epochs: int = 0 # Phase 12: Curriculum ramp epochs
	save_ckpt: bool = False # save model checkpoint after training
	resume: bool = False # resume from best checkpoint if exists
	resume_from: str = "" # resume from specific checkpoint name/path
	budget_s: int = 1200 # training time budget in seconds
	parent_name: str = "" # name of parent experiment
	priority: int = 5 # 1 = highest
	rationale: str = "" # why this experiment?
	expected: str = "" # expected val_l2_rel range
	paper_ref: str = "" # paper ID from papers/*.yaml
	refine_grid: bool = False # Phase 11: Adaptive grid refinement
	cheb_degree: int = 5 # Phase 11: Degree for Chebyshev KAN
	seed: int = 42 # Global RNG seed for reproducibility
	lr_schedule: str = "warmup_cosine" # LR schedule: warmup_cosine\|cosine\|onecycle\|none
	ema_decay: float = 0.0 # EMA decay for model weights (0=disabled, 0.999 recommended)
	patience: int = 5 # early-stop patience: halt after this many consecutive non-improving evals (0=off)
	snapshot_ensemble: int = 0 # Phase 12: Snapshot ensembling (number of snapshots to average)
	n_iterations: int = 10 # Phase 14: Iterations for Neural Iterative Solver (Brandstetter et al.)

	def to_cli_args(self) -> List[str]:
	args = [
	"--benchmark", self.benchmark,
	"--model", self.model,
	"--name", self.name,
	"--hidden", str(self.hidden_dim),
	"--layers", str(self.n_layers),
	"--modes", str(self.n_modes),
	"--levels", str(self.n_levels),
	"--lr", str(self.lr),
	"--batch_size", str(self.batch_size),
	"--grad_clip", str(self.grad_clip),
	"--pino_lambda", str(self.pino_lambda),
	"--loss", self.loss_type,
	]
	if self.loss_type.startswith("h1"):
	args += ["--h1_alpha", str(self.h1_alpha)]
	if self.augment:
	args += ["--augment"]
	if self.curriculum:
	args += ["--curriculum"]
	if self.curriculum_epochs > 0:
	args += ["--curriculum_epochs", str(self.curriculum_epochs)]
	if self.model in ("Transolver", "Transolver2D", "Transolver2d", "GNOT", "GNOT_Axial2d"):
	args += ["--n_head", str(self.n_head)]
	args += ["--slice_num", str(self.slice_num)]
	if self.save_ckpt:
	args += ["--save_ckpt"]
	if self.resume:
	args += ["--resume"]
	if self.resume_from:
	args += ["--resume_from", self.resume_from]
	if self.refine_grid:
	args += ["--refine_grid"]
	if self.model == "cPIKAN_FNO":
	args += ["--degree", str(self.cheb_degree)]
	if self.model in ("IterativeFNO2D", "IterativeFNO2d"):
	args += ["--n_iterations", str(self.n_iterations)]
	args += ["--budget", str(self.budget_s)]
	args += ["--seed", str(self.seed)]
	if self.lr_schedule != "warmup_cosine":
	args += ["--lr_schedule", self.lr_schedule]
	if self.ema_decay > 0:
	args += ["--ema_decay", str(self.ema_decay)]
	if self.patience != 5:
	args += ["--patience", str(self.patience)]
	if self.snapshot_ensemble > 0:
	args += ["--snapshot_ensemble", str(self.snapshot_ensemble)]
	return args

	def short(self) -> str:
	"""One-line summary for logging."""
	parts = [f"{self.model}", f"h={self.hidden_dim}", f"l={self.n_layers}"]
	if self.model in ("FNO", "RFNO", "AFNO", "FFNO", "UNO", "UNO2d", "WNO2d", "Transolver", "Transolver2D"):
	parts.append(f"m={self.n_modes}")
	if self.model in ("Transolver", "Transolver2D", "GNOT", "GNOT_Axial2d"):
	parts.append(f"h={self.n_head}")
	parts.append(f"s={self.slice_num}")
	if self.model in ("WNO", "WNO2d"):
	parts.append(f"lvl={self.n_levels}")
	if self.pino_lambda > 0:
	parts.append(f"pino={self.pino_lambda}")
	if self.lr != 1e-3:
	parts.append(f"lr={self.lr:.0e}")
	if self.grad_clip != 1.0:
	parts.append(f"clip={self.grad_clip}")
	if self.loss_type != "l2_rel":
	parts.append(f"loss={self.loss_type}")
	if self.curriculum:
	parts.append("curric")
	if self.curriculum_epochs > 0:
	parts.append(f"cur_ep={self.curriculum_epochs}")
	return " ".join(parts)

	# ── Loader Logic ─────────────────────────────────────────────────────────────

	def load_experiments(yaml_path: Path) -> List[ExperimentConfig]:
	if not yaml_path.exists():
	return []

	with open(yaml_path, "r") as f:
	data = yaml.safe_load(f)

	if not data:
	return []

	return [ExperimentConfig(**d) for d in data]

	# Load default set
	REPO_ROOT = Path(__file__).parent.parent
	YAML_PATH = REPO_ROOT / "experiments.yaml"
	EXPERIMENTS = load_experiments(YAML_PATH)

	def get_experiments(benchmark: Optional[str] = None, model: Optional[str] = None, priority: Optional[int] = None) -> List[ExperimentConfig]:
	"""Return the experiments list, optionally filtered by benchmark, model, or priority."""
	queue = EXPERIMENTS
	if benchmark:
	queue = [e for e in queue if e.benchmark == benchmark]
	if model:
	queue = [e for e in queue if e.model == model]
	if priority:
	queue = [e for e in queue if e.priority <= priority]
	return queue

	if __name__ == "__main__":
	# Smoke test
	print(f"Loaded {len(EXPERIMENTS)} experiments.")
	if EXPERIMENTS:
	print(f"First experiment: {EXPERIMENTS[0].name} ({EXPERIMENTS[0].benchmark})")