# bit-vector-tensor-control-policy / scripts / compile_user_governance.py
# Uploaded by J94 — initial Space upload (commit 3436bdd, verified)
#!/usr/bin/env python3
from __future__ import annotations

import json
import os
import re
from datetime import datetime, timezone
from pathlib import Path
from typing import Any
# Repository root: two levels up from this script (scripts/ -> repo root).
ROOT = Path(__file__).resolve().parents[1]
# Stage directory holding the operator artifacts consumed below.  The original
# default is a machine-specific absolute path; allow overriding it via the
# DATA_PREP_STAGE environment variable so the script is portable.  The default
# is unchanged, so existing setups keep working.
DATA_PREP = Path(os.environ.get("DATA_PREP_STAGE", "/Users/jobs/Desktop/data_prep_stage"))
# Compiled output location inside the repository.
OUTPUT_DIR = ROOT / "build" / "system"
OUTPUT_PATH = OUTPUT_DIR / "user_governance.json"
# Input artifacts: one JSON brain summary plus several markdown reductions.
BRAIN_SUMMARY_PATH = DATA_PREP / "artifacts" / "operator_brain" / "brain_summary.json"
MOTIF_LEDGER_PATH = DATA_PREP / "artifacts" / "operator_delta" / "motif_family_ledger.md"
TRIGGER_MAP_PATH = DATA_PREP / "artifacts" / "operator_delta" / "primitive_trigger_map.md"
PRIMITIVE_CATALOG_PATH = DATA_PREP / "artifacts" / "operator_delta" / "interaction_primitives_catalog.md"
FLOW_REDUCTION_PATH = DATA_PREP / "artifacts" / "operator_delta" / "flow_and_shell_reduction.md"
HISTORY_REDUCTION_PATH = DATA_PREP / "artifacts" / "operator_delta" / "history_to_knowledge_reduction.md"
REUSE_REDUCTION_PATH = DATA_PREP / "artifacts" / "operator_delta" / "continuity_and_reuse_reduction.md"
FEATURE_LEDGER_PATH = DATA_PREP / "artifacts" / "operator_delta" / "llm_interaction_feature_ledger.md"
def _utc_now() -> str:
return datetime.now(timezone.utc).strftime("%Y-%m-%dT%H:%M:%SZ")
def _load_json(path: Path) -> dict[str, Any]:
return json.loads(path.read_text(encoding="utf-8"))
def _load_text(path: Path) -> str:
return path.read_text(encoding="utf-8")
def _extract_numbered_split(markdown: str) -> list[str]:
matches = re.findall(r"^\d+\.\s+`([^`]+)`", markdown, flags=re.MULTILINE)
seen: set[str] = set()
ordered: list[str] = []
for item in matches:
if item in seen:
continue
seen.add(item)
ordered.append(item)
return ordered
def _extract_markdown_table(markdown: str, heading: str) -> list[dict[str, str]]:
marker = f"## {heading}"
if marker not in markdown:
return []
chunk = markdown.split(marker, 1)[1]
lines = chunk.splitlines()
table_lines: list[str] = []
in_table = False
for line in lines:
if line.startswith("## ") and in_table:
break
if line.strip().startswith("|"):
in_table = True
table_lines.append(line.rstrip())
elif in_table and not line.strip():
break
if len(table_lines) < 3:
return []
headers = [cell.strip() for cell in table_lines[0].strip("|").split("|")]
rows: list[dict[str, str]] = []
for line in table_lines[2:]:
cells = [cell.strip() for cell in line.strip("|").split("|")]
if len(cells) != len(headers):
continue
rows.append(dict(zip(headers, cells)))
return rows
def _extract_highest_value_primitives(markdown: str) -> list[str]:
    """Primitive names (backticks removed) from the
    '## Highest-Value Primitives' table."""
    table = _extract_markdown_table(markdown, "Highest-Value Primitives")
    return [entry["Primitive"].strip("`") for entry in table if entry.get("Primitive")]
def _extract_primitive_matrix(markdown: str) -> list[dict[str, str]]:
    """Rows of the '## Primitive Matrix' table from the primitives catalog."""
    matrix = _extract_markdown_table(markdown, "Primitive Matrix")
    return matrix
def _extract_trigger_map(markdown: str) -> list[dict[str, str]]:
    """Rows of the '## Trigger Map' table from the trigger-map document."""
    trigger_rows = _extract_markdown_table(markdown, "Trigger Map")
    return trigger_rows
def _extract_next_promotion_target(markdown: str) -> list[str]:
marker = "## Next Promotion Target"
if marker not in markdown:
return []
chunk = markdown.split(marker, 1)[1]
results: list[str] = []
for line in chunk.splitlines():
stripped = line.strip()
if stripped.startswith("## "):
break
if re.match(r"^\d+\.\s+", stripped):
results.append(re.sub(r"^\d+\.\s+", "", stripped))
return results
def _primitive_status_map(rows: list[dict[str, str]]) -> dict[str, dict[str, str]]:
result: dict[str, dict[str, str]] = {}
for row in rows:
primitive = row.get("Primitive", "").strip("`")
if not primitive:
continue
result[primitive] = {
"trigger": row.get("Typical trigger phrasing", ""),
"meaning": row.get("What the user means", ""),
"state_effect": row.get("State effect", ""),
"evidence_effect": row.get("Evidence effect", ""),
"status": row.get("Current status", ""),
}
return result
def _build_next_moves(
*,
stable_rules: list[dict[str, Any]],
next_tasks: list[dict[str, Any]],
highest_value: list[str],
primitive_status: dict[str, dict[str, str]],
trigger_rows: list[dict[str, str]],
next_promotion_target: list[str],
) -> list[dict[str, Any]]:
trigger_by_primitive = {
row.get("Primitive", "").strip("`"): row for row in trigger_rows if row.get("Primitive")
}
move_ids = [
"thin_intent_shell",
"history_navigation_surface",
"auto_reuse_prior_tools",
"intent_to_packet",
"route_by_purpose",
]
results: list[dict[str, Any]] = []
stable_rule_labels = [rule["label"] for rule in stable_rules]
task_labels = [task["label"] for task in next_tasks]
for primitive in move_ids:
primitive_info = primitive_status.get(primitive, {})
trigger_info = trigger_by_primitive.get(primitive, {})
score = 0
if primitive in highest_value:
score += 3
if primitive in next_promotion_target:
score += 2
if primitive_info.get("status") == "`partial`" or primitive_info.get("status") == "partial":
score += 2
if primitive_info.get("status") == "`requested`" or primitive_info.get("status") == "requested":
score += 1
if primitive == "thin_intent_shell" and any("route by purpose" in label for label in stable_rule_labels):
score += 2
if primitive == "history_navigation_surface" and any("cluster repeated packets" in label for label in task_labels):
score += 2
if primitive == "auto_reuse_prior_tools" and any("reuse" in label.lower() for label in task_labels):
score += 1
results.append(
{
"primitive": primitive,
"score": score,
"status": primitive_info.get("status", "unknown").strip("`"),
"why": primitive_info.get("meaning", ""),
"trigger": trigger_info.get("Example trigger phrasing", "") or primitive_info.get("trigger", ""),
"first_surface": trigger_info.get("First surface to check", ""),
"expected_artifact": trigger_info.get("Expected artifact or receipt", ""),
}
)
return sorted(results, key=lambda item: (-item["score"], item["primitive"]))
def build_governance() -> dict[str, Any]:
    """Assemble the compiled governance document from data-prep artifacts.

    Reads the operator brain summary (JSON) plus the delta-reduction markdown
    files, extracts their tables/lists, and composes the JSON-serializable
    payload written by main().
    """
    brain = _load_json(BRAIN_SUMMARY_PATH)
    # Read but otherwise unused beyond the path listed under "sources";
    # presumably loaded so a missing ledger fails loudly — TODO confirm.
    _load_text(MOTIF_LEDGER_PATH)
    trigger_text = _load_text(TRIGGER_MAP_PATH)
    catalog_text = _load_text(PRIMITIVE_CATALOG_PATH)
    feature_text = _load_text(FEATURE_LEDGER_PATH)

    stable_rules = brain.get("stable_rules", [])
    next_tasks = brain.get("next_tasks", [])
    highest_value = _extract_highest_value_primitives(catalog_text)
    status_map = _primitive_status_map(_extract_primitive_matrix(catalog_text))
    trigger_rows = _extract_trigger_map(trigger_text)
    promotion_targets = _extract_next_promotion_target(feature_text)

    reductions = {
        "flow_and_shell_simplification": _extract_numbered_split(_load_text(FLOW_REDUCTION_PATH)),
        "history_to_knowledge": _extract_numbered_split(_load_text(HISTORY_REDUCTION_PATH)),
        "continuity_and_reuse": _extract_numbered_split(_load_text(REUSE_REDUCTION_PATH)),
    }
    return {
        "compiled_at": _utc_now(),
        "source_root": str(DATA_PREP),
        "governing_rules": stable_rules,
        "operator_next_tasks": next_tasks,
        "motif_rule": "packet -> motif family -> primitive -> trigger map",
        "reduced_families": reductions,
        "highest_value_primitives": highest_value,
        "next_moves": _build_next_moves(
            stable_rules=stable_rules,
            next_tasks=next_tasks,
            highest_value=highest_value,
            primitive_status=status_map,
            trigger_rows=trigger_rows,
            next_promotion_target=promotion_targets,
        ),
        "sources": {
            "brain_summary": str(BRAIN_SUMMARY_PATH),
            "motif_family_ledger": str(MOTIF_LEDGER_PATH),
            "primitive_trigger_map": str(TRIGGER_MAP_PATH),
            "interaction_primitives_catalog": str(PRIMITIVE_CATALOG_PATH),
            "flow_and_shell_reduction": str(FLOW_REDUCTION_PATH),
            "history_to_knowledge_reduction": str(HISTORY_REDUCTION_PATH),
            "continuity_and_reuse_reduction": str(REUSE_REDUCTION_PATH),
            "llm_interaction_feature_ledger": str(FEATURE_LEDGER_PATH),
        },
    }
def main() -> int:
    """Compile the governance payload and write it to build/system.

    Prints the output path and returns 0 for use as a process exit code.
    """
    OUTPUT_DIR.mkdir(parents=True, exist_ok=True)
    payload = json.dumps(build_governance(), indent=2, sort_keys=True)
    OUTPUT_PATH.write_text(payload + "\n", encoding="utf-8")
    print(OUTPUT_PATH)
    return 0
if __name__ == "__main__":
    # Exit with main()'s return value as the process status code.
    raise SystemExit(main())