Fixed code: vocab mismatch fix for cross-arch merging (Llama/Falcon)

5d61448 verified 3 months ago

36.9 kB

	"""
	TD Lang Grammar — Lark parser for .td files.

	Defines the syntax for Phase 1 commands (load, merge, heal, eval, commit)
	plus gate/budget blocks. Phase 2 commands are parsed into stub nodes so the
	compiler can reject them with a clear error until implemented.
	"""

	from lark import Lark, Token, Transformer, UnexpectedInput, v_args

	from .ast_nodes import (
	AbsorbCmd,
	BudgetBlock,
	CommitCmd,
	DataContractBlock,
	DebateCmd,
	DiagnoseCmd,
	DistillCmd,
	EditCmd,
	EvalCmd,
	FuseCmd,
	ForkCmd,
	GateBlock,
	HealCmd,
	IfBlock,
	LoadCmd,
	MergeCmd,
	NotifyCmd,
	OnErrorBlock,
	PromptBlock,
	PruneCmd,
	RepeatBlock,
	ReportCmd,
	ResetCmd,
	RewardContractBlock,
	RollbackCmd,
	CurriculumCmd,
	StarCmd,
	BestOfCmd,
	ExploitCmd,
	ArenaCmd,
	ResearchArenaCmd,
	SaveCmd,
	ScheduleCmd,
	DownloadCmd,
	LogBlock,
	CompareCmd,
	VerifyCmd,
	VoteCmd,
	SetupBlock,
	SnapshotCmd,
	SynthCmd,
	TDProgram,
	TrainCmd,
	)
	from .errors import TDSyntaxError


	# ============================================================================
	# LARK GRAMMAR DEFINITION
	# ============================================================================

	TD_GRAMMAR = r"""
	// TD Lang Grammar v0.1.0
	// One command per line, blocks with curly braces, comments with #

	start: (_NL* statement _NL) _NL*

	?statement: load_cmd
	\| merge_cmd
	\| heal_cmd
	\| eval_cmd
	\| commit_cmd
	\| synth_cmd
	\| train_cmd
	\| debate_cmd
	\| diagnose_cmd
	\| fork_cmd
	\| reset_cmd
	\| prune_cmd
	\| edit_cmd
	\| fuse_cmd
	\| absorb_cmd
	\| repeat_block_cmd
	\| if_block_cmd
	\| snapshot_cmd
	\| report_cmd
	\| notify_cmd
	\| save_cmd
	\| gate_block
	\| budget_block
	\| data_contract_block
	\| reward_contract_block
	\| setup_block
	\| on_error_block
	\| schedule_cmd
	\| download_cmd
	\| log_block
	\| compare_cmd
	\| verify_cmd
	\| vote_cmd
	\| prompt_cmd
	\| distill_cmd
	\| rollback_cmd
	\| curriculum_cmd
	\| star_cmd
	\| best_of_cmd
	\| exploit_cmd
	\| arena_cmd
	\| research_arena_cmd

	// ======================== PHASE 1 COMMANDS ========================

	// load "model/path" as alias
	load_cmd: "load" string "as" IDENT

	// merge "source" into target using method [strength 0.5]
	merge_cmd: "merge" string "into" IDENT "using" IDENT (merge_strength)?
	merge_strength: "strength" NUMBER

	// heal target [lora_r 32] [epochs 2]
	heal_cmd: "heal" IDENT (heal_opt)*
	heal_opt: "lora_r" INT -> heal_lora_r
	\| "epochs" INT -> heal_epochs

	// eval target [on "dataset"] [-> output.json]
	eval_cmd: "eval" IDENT (eval_on)? (eval_output)?
	eval_on: "on" string
	eval_output: "->" FILEPATH

	// commit target [if [gate1, gate2, gate3]]
	commit_cmd: "commit" IDENT (commit_gates)?
	commit_gates: "if" name_list

	// ======================== PHASE 2 COMMANDS ========================
	// (parsed but not compiled yet — will show "not implemented" message)

	// synth target from source [filter cherry_llm] [-> output.jsonl]
	synth_cmd: "synth" IDENT "from" IDENT (synth_filter)? (synth_output)?
	synth_filter: "filter" IDENT
	synth_output: "->" FILEPATH

	// train target on "dataset" using method [steps 100] [lr 0.0001]
	train_cmd: "train" IDENT "on" string "using" IDENT (train_opt)*
	train_opt: "steps" INT -> train_steps
	\| "lr" NUMBER -> train_lr

	// debate target rounds 3 candidates 8 [-> output.jsonl]
	debate_cmd: "debate" IDENT "rounds" INT "candidates" INT (debate_output)?
	debate_output: "->" FILEPATH

	// diagnose target [-> weaknesses.json]
	diagnose_cmd: "diagnose" IDENT (diagnose_output)?
	diagnose_output: "->" FILEPATH

	// fork source as alias
	fork_cmd: "fork" IDENT "as" IDENT

	// reset target to checkpoint_name
	reset_cmd: "reset" IDENT "to" (string \| IDENT)

	// prune target using method [aggressiveness 0.1]
	prune_cmd: "prune" IDENT "using" IDENT (prune_aggr)?
	prune_aggr: "aggressiveness" NUMBER

	// edit target layers 16-28 using lora [lr 0.0001]
	edit_cmd: "edit" IDENT "layers" LAYER_SPEC "using" IDENT (edit_lr)?
	edit_lr: "lr" NUMBER

	// ======================== PHASE 7 — LOOP CONTROL ========================

	// repeat N { commands... }
	repeat_block_cmd: "repeat" INT "{" _NL* body_cmd+ _NL* "}"
	// if condition target { commands... } [else { commands... }]
	if_block_cmd: "if" IDENT IDENT "{" _NL* body_cmd+ _NL* "}" (else_clause)?
	else_clause: "else" "{" _NL* body_cmd+ _NL* "}"

	// Commands allowed inside blocks (same as top-level minus config blocks)
	?body_cmd: (load_cmd \| merge_cmd \| heal_cmd \| eval_cmd \| commit_cmd
	\| synth_cmd \| train_cmd \| debate_cmd \| diagnose_cmd
	\| fork_cmd \| reset_cmd \| prune_cmd \| edit_cmd
	\| fuse_cmd \| absorb_cmd \| snapshot_cmd \| report_cmd
	\| notify_cmd \| save_cmd
	\| repeat_block_cmd \| if_block_cmd \| schedule_cmd
	\| download_cmd \| compare_cmd \| verify_cmd
	\| vote_cmd \| prompt_cmd \| distill_cmd \| rollback_cmd
	\| curriculum_cmd \| star_cmd \| best_of_cmd \| exploit_cmd
	\| arena_cmd \| research_arena_cmd) _NL*

	// ======================== PHASE 6 — EASY MERGE COMMANDS ========================

	// fuse [model1, model2, model3] into target [using method] [strategy equal\|weighted\|sequential]
	fuse_cmd: "fuse" model_list "into" IDENT (fuse_method)? (fuse_strategy)?
	model_list: "[" string ("," string)* "]"
	fuse_method: "using" IDENT
	fuse_strategy: "strategy" IDENT

	// absorb "model" into target [strength 0.5]
	absorb_cmd: "absorb" string "into" IDENT (absorb_strength)?
	absorb_strength: "strength" NUMBER

	// ======================== PHASE 4 COMMANDS ========================

	// snapshot target [-> output_dir]
	snapshot_cmd: "snapshot" IDENT (snapshot_output)?
	snapshot_output: "->" FILEPATH

	// report [-> economics.json]
	report_cmd: "report" (report_output)?
	report_output: "->" FILEPATH

	// ======================== BLOCKS ========================

	// gate { must_pass = [canary, perplexity, thinking_mode] }
	gate_block: "gate" "{" _NL* gate_field+ _NL* "}"
	gate_field: "must_pass" "=" name_list _NL*

	// budget { max_gpu_hours = 8 \n max_cost = 50.00 }
	budget_block: "budget" "{" _NL* budget_field+ _NL* "}"
	budget_field: (budget_gpu \| budget_cost \| budget_tokens \| budget_experiments) _NL*
	budget_gpu: "max_gpu_hours" "=" NUMBER
	budget_cost: "max_cost" "=" NUMBER
	budget_tokens: "max_tokens" "=" INT
	budget_experiments: "max_experiments" "=" INT

	// data_contract { required_fields = [prompt, response] \n min_samples = 100 \n max_perplexity = 50.0 }
	data_contract_block: "data_contract" "{" _NL* dc_field+ _NL* "}"
	dc_field: (dc_required \| dc_min_samples \| dc_max_ppl) _NL*
	dc_required: "required_fields" "=" name_list
	dc_min_samples: "min_samples" "=" INT
	dc_max_ppl: "max_perplexity" "=" NUMBER

	// reward_contract { verifiers = [code_compiles, math_correct] \n min_reward = 0.3 }
	reward_contract_block: "reward_contract" "{" _NL* rc_field+ _NL* "}"
	rc_field: (rc_verifiers \| rc_min_reward) _NL*
	rc_verifiers: "verifiers" "=" name_list
	rc_min_reward: "min_reward" "=" NUMBER

	// ======================== PHASE 8 — AUTOPILOT ========================

	// notify "Training complete!"
	notify_cmd: "notify" string

	// save target to "gdrive:TD/models/v1"
	save_cmd: "save" IDENT "to" string

	// setup { pip = [torch, transformers] hf_token = env notify = "ntfy.sh/my_ai" }
	setup_block: "setup" "{" _NL* setup_field+ _NL* "}"
	setup_field: (setup_pip \| setup_hf \| setup_notify) _NL*
	setup_pip: "pip" "=" name_list
	setup_hf: "hf_token" "=" IDENT
	setup_notify: "notify" "=" string

	// on_error { retry = 3 fallback = reduce_batch notify = true }
	on_error_block: "on_error" "{" _NL* on_error_field+ _NL* "}"
	on_error_field: (onerr_retry \| onerr_fallback \| onerr_notify) _NL*
	onerr_retry: "retry" "=" INT
	onerr_fallback: "fallback" "=" IDENT
	onerr_notify: "notify" "=" IDENT

	// ======================== PHASE 9 — SCHEDULE ========================

	// schedule "every 6h" { commands... }
	// schedule "at 02:00" { commands... }
	// schedule "after 30m" { commands... }
	schedule_cmd: "schedule" string "{" _NL* body_cmd+ _NL* "}"

	// ======================== PHASE 10 - TOOLBOX ========================

	// download "gsm8k" as math_data [split train]
	download_cmd: "download" string "as" IDENT (download_split)?
	download_split: "split" IDENT

	// log "training_log.txt"
	log_block: "log" string

	// compare target vs "source_model" [questions 50] [-> output.json]
	compare_cmd: "compare" IDENT "vs" string (compare_questions)? (compare_output)?
	compare_questions: "questions" INT
	compare_output: "->" FILEPATH

	// verify target on "dataset" [questions 100] [-> results.json]
	verify_cmd: "verify" IDENT "on" string (verify_questions)? (verify_output)?
	verify_questions: "questions" INT
	verify_output: "->" FILEPATH

	// ======================== PHASE 11 - INTELLIGENCE ========================

	// vote target "question" [samples 5] [-> output.json]
	vote_cmd: "vote" IDENT string (vote_samples)? (vote_output)?
	vote_samples: "samples" INT
	vote_output: "->" FILEPATH

	// prompt target "system prompt text"
	prompt_cmd: "prompt" IDENT string

	// distill target into "small_model" [steps 200] [-> output_dir]
	distill_cmd: "distill" IDENT "into" string (distill_steps)? (distill_output)?
	distill_steps: "steps" INT
	distill_output: "->" FILEPATH

	// rollback target
	rollback_cmd: "rollback" IDENT

	// ======================== PHASE 12 - RL & FINE-TUNING ========================

	// curriculum target on "dataset" using method [levels 3] [steps 64]
	curriculum_cmd: "curriculum" IDENT "on" string "using" IDENT (curriculum_opt)*
	curriculum_opt: "levels" INT -> curriculum_levels
	\| "steps" INT -> curriculum_steps

	// star target on "dataset" [rounds 3] [samples 8]
	star_cmd: "star" IDENT "on" string (star_opt)*
	star_opt: "rounds" INT -> star_rounds
	\| "samples" INT -> star_samples

	// best_of target on "dataset" [n 8] [steps 32]
	best_of_cmd: "best_of" IDENT "on" string (best_of_opt)*
	best_of_opt: "n" INT -> best_of_n
	\| "steps" INT -> best_of_steps

	// exploit target on "dataset" [samples 16] [steps 32] [-> output.jsonl]
	exploit_cmd: "exploit" IDENT "on" string (exploit_opt)*
	exploit_opt: "samples" INT -> exploit_samples
	\| "steps" INT -> exploit_steps
	\| "->" FILEPATH -> exploit_output

	// ======================== PHASE 13 - REAL RL (ARENA) ========================

	// arena target on "dataset" [rounds 5] [episodes 50] [steps 64] [curiosity 0.3] [-> log.json]
	arena_cmd: "arena" IDENT "on" string (arena_opt)*
	arena_opt: "rounds" INT -> arena_rounds
	\| "episodes" INT -> arena_episodes
	\| "steps" INT -> arena_steps
	\| "curiosity" NUMBER -> arena_curiosity
	\| "->" FILEPATH -> arena_output

	// research_arena target topic "subject" [sources "web"\|"pubmed"\|"arxiv"\|path]
	// [rounds 5] [episodes 30] [steps 64] [curiosity 0.3] [difficulty_scale 0.25] [-> log.json]
	research_arena_cmd: "research_arena" IDENT "topic" string (ra_opt)*
	ra_opt: "sources" string -> ra_sources
	\| "rounds" INT -> ra_rounds
	\| "episodes" INT -> ra_episodes
	\| "steps" INT -> ra_steps
	\| "curiosity" NUMBER -> ra_curiosity
	\| "difficulty_scale" NUMBER -> ra_difficulty
	\| "->" FILEPATH -> ra_output

	// ======================== SHARED RULES ========================

	// List of names: [name1, name2, name3]
	name_list: "[" IDENT ("," IDENT)* "]"

	// String: double-quoted
	string: ESCAPED_STRING

	// Layer spec: "all", single number, or range like "16-28"
	LAYER_SPEC: /all\|[0-9]+-[0-9]+\|[0-9]+/

	// Filepath: word with dots, slashes, underscores (no spaces)
	FILEPATH: /[a-zA-Z0-9_.\-\/]+/

	// Identifier: letters, numbers, underscores, hyphens (but starts with letter/underscore)
	IDENT: /[a-zA-Z_][a-zA-Z0-9_\-]*/

	// Numbers
	NUMBER: /\d+\.?\d*([eE][+-]?\d+)?/
	INT: /\d+/

	// Whitespace and comments
	_NL: /\s/ NEWLINE /\s/
	COMMENT: /#[^\n]*/
	%import common.ESCAPED_STRING
	%import common.NEWLINE
	%import common.WS_INLINE
	%ignore WS_INLINE
	%ignore COMMENT
	"""


	# ============================================================================
	# LARK TRANSFORMER — Parse Tree → AST Nodes
	# ============================================================================

	@v_args(inline=True)
	class TDTransformer(Transformer):
	"""Transforms Lark parse tree into td_lang AST nodes.

	Each method matches a grammar rule name and returns the corresponding
	dataclass from ast_nodes.py.
	"""

	# --- Helpers ---

	def string(self, s: Token) -> str:
	"""Strip quotes from a string token."""
	return str(s)[1:-1]

	def name_list(self, *names: Token) -> list[str]:
	"""Convert name list tokens to Python list of strings."""
	return [str(n) for n in names]

	def IDENT(self, token: Token) -> str:
	return str(token)

	def INT(self, token: Token) -> int:
	return int(token)

	def NUMBER(self, token: Token) -> float:
	return float(token)

	def FILEPATH(self, token: Token) -> str:
	return str(token)

	def LAYER_SPEC(self, token: Token) -> str:
	return str(token)

	# --- Phase 1 Commands ---

	def load_cmd(self, model_ref: str, alias: str) -> LoadCmd:
	return LoadCmd(model_ref=model_ref, alias=alias)

	def merge_cmd(self, source: str, target: str, method: str,
	strength: float \| None = None) -> MergeCmd:
	return MergeCmd(
	source=source,
	target=target,
	method=method,
	strength=strength if strength is not None else 0.5,
	)

	def merge_strength(self, value: float) -> float:
	return value

	def heal_cmd(self, target: str, *opts) -> HealCmd:
	cmd = HealCmd(target=target)
	for opt in opts:
	if isinstance(opt, tuple):
	key, val = opt
	if key == "lora_r":
	cmd.lora_r = val
	elif key == "epochs":
	cmd.epochs = val
	return cmd

	def heal_lora_r(self, value: int) -> tuple:
	return ("lora_r", value)

	def heal_epochs(self, value: int) -> tuple:
	return ("epochs", value)

	def eval_cmd(self, target: str, *opts) -> EvalCmd:
	cmd = EvalCmd(target=target)
	for opt in opts:
	if isinstance(opt, tuple):
	key, val = opt
	if key == "on":
	cmd.dataset = val
	elif key == "output":
	cmd.output = val
	return cmd

	def eval_on(self, dataset: str) -> tuple:
	return ("on", dataset)

	def eval_output(self, filepath: str) -> tuple:
	return ("output", filepath)

	def commit_cmd(self, target: str, gates: list[str] \| None = None) -> CommitCmd:
	return CommitCmd(target=target, gates=gates)

	def commit_gates(self, gates: list[str]) -> list[str]:
	return gates

	# --- Phase 2 Commands ---

	def synth_cmd(self, target: str, source: str, *opts) -> SynthCmd:
	cmd = SynthCmd(target=target, source=source)
	for opt in opts:
	if isinstance(opt, tuple):
	key, val = opt
	if key == "filter":
	cmd.filter_method = val
	elif key == "output":
	cmd.output = val
	return cmd

	def synth_filter(self, method: str) -> tuple:
	return ("filter", method)

	def synth_output(self, filepath: str) -> tuple:
	return ("output", filepath)

	def train_cmd(self, target: str, dataset: str, method: str, *opts) -> TrainCmd:
	cmd = TrainCmd(target=target, dataset=dataset, method=method)
	for opt in opts:
	if isinstance(opt, tuple):
	key, val = opt
	if key == "steps":
	cmd.steps = val
	elif key == "lr":
	cmd.learning_rate = val
	return cmd

	def train_steps(self, value: int) -> tuple:
	return ("steps", value)

	def train_lr(self, value: float) -> tuple:
	return ("lr", value)

	def debate_cmd(self, target: str, rounds: int, candidates: int,
	output: tuple \| None = None) -> DebateCmd:
	cmd = DebateCmd(target=target, rounds=rounds, candidates=candidates)
	if isinstance(output, tuple) and output[0] == "output":
	cmd.output = output[1]
	return cmd

	def debate_output(self, filepath: str) -> tuple:
	return ("output", filepath)

	def diagnose_cmd(self, target: str, output: tuple \| None = None) -> DiagnoseCmd:
	cmd = DiagnoseCmd(target=target)
	if isinstance(output, tuple) and output[0] == "output":
	cmd.output = output[1]
	return cmd

	def diagnose_output(self, filepath: str) -> tuple:
	return ("output", filepath)

	def fork_cmd(self, source: str, alias: str) -> ForkCmd:
	return ForkCmd(source=source, alias=alias)

	def reset_cmd(self, target: str, checkpoint) -> ResetCmd:
	return ResetCmd(target=target, checkpoint=str(checkpoint))

	def prune_cmd(self, target: str, method: str,
	aggressiveness: float \| None = None) -> PruneCmd:
	return PruneCmd(
	target=target,
	method=method,
	aggressiveness=aggressiveness if aggressiveness is not None else 0.1,
	)

	def prune_aggr(self, value: float) -> float:
	return value

	def edit_cmd(self, target: str, layers: str, method: str,
	lr: float \| None = None) -> EditCmd:
	return EditCmd(
	target=target,
	layers=layers,
	method=method,
	learning_rate=lr,
	)

	def edit_lr(self, value: float) -> float:
	return value

	# --- Phase 7: Loop Control ---

	def repeat_block_cmd(self, count: int, *body_cmds) -> RepeatBlock:
	return RepeatBlock(count=count, body=list(body_cmds))

	def if_block_cmd(self, condition: str, target: str, *rest) -> IfBlock:
	"""Parse if condition target { then... } [else { else... }]"""
	block = IfBlock(condition=condition, target=target)
	# rest contains then_body commands + possibly an else list
	for item in rest:
	if isinstance(item, list) and item and hasattr(item, '__iter__'):
	# This is the else body (passed from else_clause)
	block.else_body = item
	else:
	block.then_body.append(item)
	return block

	def else_clause(self, *body_cmds) -> list:
	return list(body_cmds)

	# --- Phase 9: Schedule ---

	def schedule_cmd(self, timing: str, *body_cmds) -> ScheduleCmd:
	return ScheduleCmd(timing=timing, body=list(body_cmds))

	# --- Phase 10: Toolbox ---

	def download_cmd(self, dataset: str, alias: str, split: str \| None = None) -> DownloadCmd:
	cmd = DownloadCmd(dataset=dataset, alias=alias)
	if isinstance(split, tuple) and split[0] == "split":
	cmd.split = split[1]
	elif isinstance(split, str):
	cmd.split = split
	return cmd

	def download_split(self, value: str) -> tuple:
	return ("split", value)

	def log_block(self, filepath: str) -> LogBlock:
	return LogBlock(filepath=filepath)

	def compare_cmd(self, target: str, source: str, *opts) -> CompareCmd:
	cmd = CompareCmd(target=target, source=source)
	for opt in opts:
	if isinstance(opt, tuple):
	key, val = opt
	if key == "questions":
	cmd.questions = val
	elif key == "output":
	cmd.output = val
	return cmd

	def compare_questions(self, value: int) -> tuple:
	return ("questions", value)

	def compare_output(self, filepath: str) -> tuple:
	return ("output", filepath)

	def verify_cmd(self, target: str, dataset: str, *opts) -> VerifyCmd:
	cmd = VerifyCmd(target=target, dataset=dataset)
	for opt in opts:
	if isinstance(opt, tuple):
	key, val = opt
	if key == "questions":
	cmd.questions = val
	elif key == "output":
	cmd.output = val
	return cmd

	def verify_questions(self, value: int) -> tuple:
	return ("questions", value)

	def verify_output(self, filepath: str) -> tuple:
	return ("output", filepath)

	# --- Phase 11: Intelligence Commands ---

	def vote_cmd(self, target: str, question: str, *opts) -> VoteCmd:
	cmd = VoteCmd(target=target, question=question)
	for opt in opts:
	if isinstance(opt, tuple):
	key, val = opt
	if key == "samples":
	cmd.samples = val
	elif key == "output":
	cmd.output = val
	return cmd

	def vote_samples(self, value: int) -> tuple:
	return ("samples", value)

	def vote_output(self, filepath: str) -> tuple:
	return ("output", filepath)

	def prompt_cmd(self, target: str, text: str) -> PromptBlock:
	return PromptBlock(target=target, text=text)

	def distill_cmd(self, teacher: str, student: str, *opts) -> DistillCmd:
	cmd = DistillCmd(teacher=teacher, student=student)
	for opt in opts:
	if isinstance(opt, tuple):
	key, val = opt
	if key == "steps":
	cmd.steps = val
	elif key == "output":
	cmd.output = val
	return cmd

	def distill_steps(self, value: int) -> tuple:
	return ("steps", value)

	def distill_output(self, filepath: str) -> tuple:
	return ("output", filepath)

	def rollback_cmd(self, target: str) -> RollbackCmd:
	return RollbackCmd(target=target)

	# --- Phase 12: RL & Fine-Tuning Commands ---

	def curriculum_cmd(self, target: str, dataset: str, method: str, *opts) -> CurriculumCmd:
	cmd = CurriculumCmd(target=target, dataset=dataset, method=method)
	for opt in opts:
	if isinstance(opt, tuple):
	key, val = opt
	if key == "levels":
	cmd.levels = val
	elif key == "steps":
	cmd.steps = val
	return cmd

	def curriculum_levels(self, value: int) -> tuple:
	return ("levels", value)

	def curriculum_steps(self, value: int) -> tuple:
	return ("steps", value)

	def star_cmd(self, target: str, dataset: str, *opts) -> StarCmd:
	cmd = StarCmd(target=target, dataset=dataset)
	for opt in opts:
	if isinstance(opt, tuple):
	key, val = opt
	if key == "rounds":
	cmd.rounds = val
	elif key == "samples":
	cmd.samples = val
	return cmd

	def star_rounds(self, value: int) -> tuple:
	return ("rounds", value)

	def star_samples(self, value: int) -> tuple:
	return ("samples", value)

	def best_of_cmd(self, target: str, dataset: str, *opts) -> BestOfCmd:
	cmd = BestOfCmd(target=target, dataset=dataset)
	for opt in opts:
	if isinstance(opt, tuple):
	key, val = opt
	if key == "n":
	cmd.n = val
	elif key == "steps":
	cmd.steps = val
	return cmd

	def best_of_n(self, value: int) -> tuple:
	return ("n", value)

	def best_of_steps(self, value: int) -> tuple:
	return ("steps", value)

	def exploit_cmd(self, target: str, dataset: str, *opts) -> ExploitCmd:
	cmd = ExploitCmd(target=target, dataset=dataset)
	for opt in opts:
	if isinstance(opt, tuple):
	key, val = opt
	if key == "samples":
	cmd.samples = val
	elif key == "steps":
	cmd.steps = val
	elif key == "output":
	cmd.output = val
	return cmd

	def exploit_samples(self, value: int) -> tuple:
	return ("samples", value)

	def exploit_steps(self, value: int) -> tuple:
	return ("steps", value)

	def exploit_output(self, filepath: str) -> tuple:
	return ("output", filepath)

	# --- Phase 13: Real RL (Arena) ---

	def arena_cmd(self, target: str, dataset: str, *opts) -> ArenaCmd:
	cmd = ArenaCmd(target=target, dataset=dataset)
	for opt in opts:
	if isinstance(opt, tuple):
	key, val = opt
	if key == "rounds":
	cmd.rounds = val
	elif key == "episodes":
	cmd.episodes = val
	elif key == "steps":
	cmd.steps = val
	elif key == "curiosity":
	cmd.curiosity = val
	elif key == "output":
	cmd.output = val
	return cmd

	def arena_rounds(self, value: int) -> tuple:
	return ("rounds", value)

	def arena_episodes(self, value: int) -> tuple:
	return ("episodes", value)

	def arena_steps(self, value: int) -> tuple:
	return ("steps", value)

	def arena_curiosity(self, value: float) -> tuple:
	return ("curiosity", value)

	def arena_output(self, filepath: str) -> tuple:
	return ("output", filepath)

	# --- Phase 13: Research Arena ---

	def research_arena_cmd(self, target: str, topic: str, *opts) -> ResearchArenaCmd:
	cmd = ResearchArenaCmd(target=target, topic=topic)
	for opt in opts:
	if isinstance(opt, tuple):
	key, val = opt
	if key == "sources":
	cmd.sources = val
	elif key == "rounds":
	cmd.rounds = val
	elif key == "episodes":
	cmd.episodes = val
	elif key == "steps":
	cmd.steps = val
	elif key == "curiosity":
	cmd.curiosity = val
	elif key == "difficulty_scale":
	cmd.difficulty_scale = val
	elif key == "output":
	cmd.output = val
	return cmd

	def ra_sources(self, value: str) -> tuple:
	return ("sources", value)

	def ra_rounds(self, value: int) -> tuple:
	return ("rounds", value)

	def ra_episodes(self, value: int) -> tuple:
	return ("episodes", value)

	def ra_steps(self, value: int) -> tuple:
	return ("steps", value)

	def ra_curiosity(self, value: float) -> tuple:
	return ("curiosity", value)

	def ra_difficulty(self, value: float) -> tuple:
	return ("difficulty_scale", value)

	def ra_output(self, filepath: str) -> tuple:
	return ("output", filepath)

	# --- Phase 6: Easy Merge Commands ---

	def fuse_cmd(self, sources: list[str], target: str, *opts) -> FuseCmd:
	cmd = FuseCmd(sources=sources, target=target)
	for opt in opts:
	if isinstance(opt, tuple):
	key, val = opt
	if key == "method":
	cmd.method = val
	elif key == "strategy":
	cmd.strategy = val
	return cmd

	def model_list(self, *models: str) -> list[str]:
	return [str(m) for m in models]

	def fuse_method(self, method: str) -> tuple:
	return ("method", method)

	def fuse_strategy(self, strategy: str) -> tuple:
	return ("strategy", strategy)

	def absorb_cmd(self, source: str, target: str,
	strength: float \| None = None) -> AbsorbCmd:
	return AbsorbCmd(
	source=source,
	target=target,
	strength=strength if strength is not None else 0.5,
	)

	def absorb_strength(self, value: float) -> float:
	return value

	# --- Phase 4 Commands ---

	def snapshot_cmd(self, target: str, output: tuple \| None = None) -> SnapshotCmd:
	cmd = SnapshotCmd(target=target)
	if isinstance(output, tuple) and output[0] == "output":
	cmd.output = output[1]
	return cmd

	def snapshot_output(self, filepath: str) -> tuple:
	return ("output", filepath)

	def report_cmd(self, output: tuple \| None = None) -> ReportCmd:
	cmd = ReportCmd()
	if isinstance(output, tuple) and output[0] == "output":
	cmd.output = output[1]
	return cmd

	def report_output(self, filepath: str) -> tuple:
	return ("output", filepath)

	# --- Blocks ---

	def gate_block(self, *fields) -> GateBlock:
	gate = GateBlock()
	for f in fields:
	if isinstance(f, list):
	gate.must_pass = f
	return gate

	def gate_field(self, names: list[str]) -> list[str]:
	return names

	def budget_block(self, *fields) -> BudgetBlock:
	budget = BudgetBlock()
	for f in fields:
	if isinstance(f, tuple):
	key, val = f
	if key == "max_gpu_hours":
	budget.max_gpu_hours = val
	elif key == "max_cost":
	budget.max_cost = val
	elif key == "max_tokens":
	budget.max_tokens = int(val)
	elif key == "max_experiments":
	budget.max_experiments = int(val)
	return budget

	def budget_field(self, field_data) -> tuple:
	return field_data

	def budget_gpu(self, value: float) -> tuple:
	return ("max_gpu_hours", value)

	def budget_cost(self, value: float) -> tuple:
	return ("max_cost", value)

	def budget_tokens(self, value: int) -> tuple:
	return ("max_tokens", value)

	def budget_experiments(self, value: int) -> tuple:
	return ("max_experiments", value)

	# --- Phase 8: Autopilot Commands ---

	def notify_cmd(self, message: str) -> NotifyCmd:
	return NotifyCmd(message=message)

	def save_cmd(self, target: str, destination: str) -> SaveCmd:
	return SaveCmd(target=target, destination=destination)

	def setup_block(self, *fields) -> SetupBlock:
	sb = SetupBlock()
	for f in fields:
	if isinstance(f, tuple):
	key, val = f
	if key == "pip":
	sb.pip_packages = val
	elif key == "hf_token":
	sb.hf_token = val
	elif key == "notify":
	sb.notify_url = val
	return sb

	def setup_field(self, field_data) -> tuple:
	return field_data

	def setup_pip(self, packages: list[str]) -> tuple:
	return ("pip", packages)

	def setup_hf(self, mode: str) -> tuple:
	return ("hf_token", mode)

	def setup_notify(self, url: str) -> tuple:
	return ("notify", url)

	def on_error_block(self, *fields) -> OnErrorBlock:
	oe = OnErrorBlock()
	for f in fields:
	if isinstance(f, tuple):
	key, val = f
	if key == "retry":
	oe.retry = int(val)
	elif key == "fallback":
	oe.fallback = val
	elif key == "notify":
	oe.notify = str(val).lower() == "true"
	return oe

	def on_error_field(self, field_data) -> tuple:
	return field_data

	def onerr_retry(self, value: int) -> tuple:
	return ("retry", value)

	def onerr_fallback(self, value: str) -> tuple:
	return ("fallback", value)

	def onerr_notify(self, value: str) -> tuple:
	return ("notify", value)

	# --- Contract Blocks (Phase 4) ---

	def data_contract_block(self, *fields) -> DataContractBlock:
	dc = DataContractBlock()
	for f in fields:
	if isinstance(f, tuple):
	key, val = f
	if key == "required_fields":
	dc.required_fields = val
	elif key == "min_samples":
	dc.min_samples = int(val)
	elif key == "max_perplexity":
	dc.max_perplexity = val
	return dc

	def dc_field(self, field_data) -> tuple:
	return field_data

	def dc_required(self, names: list[str]) -> tuple:
	return ("required_fields", names)

	def dc_min_samples(self, value: int) -> tuple:
	return ("min_samples", value)

	def dc_max_ppl(self, value: float) -> tuple:
	return ("max_perplexity", value)

	def reward_contract_block(self, *fields) -> RewardContractBlock:
	rc = RewardContractBlock()
	for f in fields:
	if isinstance(f, tuple):
	key, val = f
	if key == "verifiers":
	rc.verifiers = val
	elif key == "min_reward":
	rc.min_reward = val
	return rc

	def rc_field(self, field_data) -> tuple:
	return field_data

	def rc_verifiers(self, names: list[str]) -> tuple:
	return ("verifiers", names)

	def rc_min_reward(self, value: float) -> tuple:
	return ("min_reward", value)

	# --- Top Level ---

	def start(self, *items) -> TDProgram:
	"""Collect all parsed commands and blocks into a TDProgram."""
	program = TDProgram()
	for item in items:
	if item is None:
	continue
	if isinstance(item, GateBlock):
	program.gates = item
	elif isinstance(item, BudgetBlock):
	program.budget = item
	elif isinstance(item, DataContractBlock):
	program.data_contract = item
	elif isinstance(item, RewardContractBlock):
	program.reward_contract = item
	elif isinstance(item, SetupBlock):
	program.setup = item
	elif isinstance(item, OnErrorBlock):
	program.on_error = item
	elif isinstance(item, LogBlock):
	program.log = item
	else:
	program.commands.append(item)
	return program


	# ============================================================================
	# PUBLIC API
	# ============================================================================

	# Create the parser once — reuse for all files
	_parser = Lark(
	TD_GRAMMAR,
	parser="earley",
	propagate_positions=True,
	)

	_transformer = TDTransformer()


	def parse_td_string(source: str) -> TDProgram:
	"""Parse a .td source string into a TDProgram AST.

	Args:
	source: The .td file content as a string.

	Returns:
	TDProgram with all commands and blocks.

	Raises:
	TDSyntaxError: If the source has invalid syntax.
	"""
	try:
	tree = _parser.parse(source)
	return _transformer.transform(tree)
	except UnexpectedInput as e:
	raise TDSyntaxError(
	message=f"Unexpected {e.token!r}" if hasattr(e, "token") else str(e),
	line=getattr(e, "line", None),
	hint="Check for typos or missing quotes around model paths.",
	) from e


	def parse_td_file(filepath: str) -> TDProgram:
	"""Parse a .td file into a TDProgram AST.

	Args:
	filepath: Path to the .td file.

	Returns:
	TDProgram with all commands and blocks.

	Raises:
	TDSyntaxError: If the file has invalid syntax.
	FileNotFoundError: If the file doesn't exist.
	"""
	with open(filepath, "r") as f:
	source = f.read()
	program = parse_td_string(source)
	program.source_file = filepath
	return program