Spaces:

Flamehaven
/

stem-bio-ai

Sleeping

stem-bio-ai / scripts / provider_packet_benchmark.py

Codex

sync hf space snapshot

6a1cba7 18 days ago

6.16 kB

	from __future__ import annotations

	import argparse
	import json
	import sys
	from datetime import date
	from pathlib import Path
	from typing import Any

	# Put the parent of this script's directory at the front of sys.path.
	# Presumably this lets the `stem_ai` imports below resolve when the script
	# is run directly from a checkout -- confirm against the repository layout.
	sys.path.insert(0, str(Path(__file__).resolve().parents[1]))

	from stem_ai import __version__
	from stem_ai.provider_benchmark import (
	PROVIDER_BENCHMARK_SCHEMA_VERSION,
	packet_stats_record,
	packet_summary,
	response_validation_record,
	)
	from stem_ai.render import _safe_name
	from stem_ai.scanner import audit_repository


	def main() -> int:
	    """Export advisory packets for every repo in the manifest and write benchmark artifacts.

	    For each manifest entry whose ``local_path`` exists, the repository is
	    audited in packet mode and the resulting advisory input is written to
	    ``<out>/packets/``. When ``--responses`` is given and a matching provider
	    response file is found, the repository is audited again with that
	    response and a validation record is collected.

	    Entries that cannot be processed (no ``local_path`` configured, or the
	    path does not exist) are listed in ``provider_failure_notes.md`` instead
	    of aborting the run.

	    Returns:
	        Always ``0``; skipped repositories are reported in the notes file,
	        not through the exit status.

	    Raises:
	        OSError: if the manifest cannot be read or an output cannot be written.
	        json.JSONDecodeError: if the manifest is not valid JSON.
	    """
	    args = _parser().parse_args()
	    manifest_path = Path(args.manifest).expanduser().resolve()
	    out_dir = Path(args.out).expanduser().resolve()
	    response_dir = Path(args.responses).expanduser().resolve() if args.responses else None
	    manifest = json.loads(manifest_path.read_text(encoding="utf-8"))
	    out_dir.mkdir(parents=True, exist_ok=True)
	    packet_dir = out_dir / "packets"
	    packet_dir.mkdir(parents=True, exist_ok=True)

	    packet_records: list[dict[str, Any]] = []
	    response_records: list[dict[str, Any]] = []
	    failures: list[str] = []
	    # `or []` also covers a manifest that carries an explicit `"repos": null`.
	    for repo in manifest.get("repos") or []:
	        raw_path = repo.get("local_path")
	        if not raw_path:
	            # A missing or empty path must not crash the run, and must not
	            # fall through to Path(""), which would audit the current directory.
	            failures.append(f"- {repo.get('repo')}: local_path not set in manifest")
	            continue
	        local_path = Path(raw_path)
	        if not local_path.exists():
	            failures.append(f"- {repo.get('repo')}: local path missing: {local_path}")
	            continue

	        result = audit_repository(local_path, advisory="packet")
	        packet = result["ai_advisory_input"]
	        packet_name = _safe_name(repo.get("local_name") or repo.get("repo"))
	        packet_path = packet_dir / f"{packet_name}_advisory_input.json"
	        _write_json(packet_path, packet)
	        # The packet file is recorded relative to the output directory.
	        packet_records.append(packet_stats_record(repo, result, packet, packet_path.relative_to(out_dir)))

	        # _response_path returns None when no directory was given or when
	        # none of the candidate files exists, so no extra checks are needed.
	        response_path = _response_path(response_dir, repo)
	        if response_path is not None:
	            validated = audit_repository(local_path, advisory_response_path=response_path)
	            response_records.append(response_validation_record(repo, validated["ai_advisory"], response_path))

	    _write_json(
	        out_dir / "benchmark_manifest.json",
	        _output_manifest(manifest_path, manifest, packet_records, response_records),
	    )
	    _write_jsonl(out_dir / "packet_stats.jsonl", packet_records)
	    _write_json(out_dir / "packet_summary.json", packet_summary(packet_records))
	    _write_jsonl(out_dir / "provider_response_validation.jsonl", response_records)
	    _write_notes(out_dir / "provider_failure_notes.md", failures, response_dir, response_records)
	    print(f"provider benchmark records: packets={len(packet_records)} responses={len(response_records)}")
	    print(out_dir)
	    return 0


	def _parser() -> argparse.ArgumentParser:
	    """Build the command-line parser for the benchmark script.

	    All three options are optional:

	    * ``--manifest``: benchmark manifest to read (has a default path).
	    * ``--out``: directory that receives the generated artifacts (has a default path).
	    * ``--responses``: directory holding provider advisory JSON files; defaults to ``None``.

	    Returns:
	        The configured ``argparse.ArgumentParser``.
	    """
	    parser = argparse.ArgumentParser(description="Build provider-packet benchmark artifacts without API calls.")
	    parser.add_argument(
	        "--manifest",
	        default="audits/benchmark-v1.3/local-10/benchmark_manifest.json",
	        help="Benchmark manifest containing repos with local_path fields",
	    )
	    parser.add_argument(
	        "--out",
	        default="audits/benchmark-v1.4/provider-response-local-10",
	        help="Output directory for v1.4 provider benchmark artifacts",
	    )
	    parser.add_argument(
	        "--responses",
	        default=None,
	        # List the exact filenames that are looked up, in lookup order.
	        help=(
	            "Optional directory of provider advisory JSON files named "
	            "'<local_name>_provider_advisory.json', '<local_name>.json', "
	            "or '<repo safe name>_provider_advisory.json'"
	        ),
	    )
	    return parser


	def _output_manifest(
	    source_manifest: Path,
	    source: dict[str, Any],
	    packet_records: list[dict[str, Any]],
	    response_records: list[dict[str, Any]],
	) -> dict[str, Any]:
	    """Assemble the manifest dictionary that describes this benchmark run.

	    Args:
	        source_manifest: Path of the manifest the run was driven by; stored as a string.
	        source: Parsed content of that manifest; only its ``schema_version`` is copied.
	        packet_records: One record per exported packet. ``repo_count`` is the
	            length of this list, and a reduced copy of each record is listed
	            under ``repos``.
	        response_records: Validation records; only their count is stored.

	    Returns:
	        A dictionary holding run metadata and the per-repo entries.
	    """
	    # Fields copied from each packet record into the manifest, in output order.
	    copied_fields = (
	        "repo",
	        "local_name",
	        "local_path",
	        "expected_commit",
	        "scan_commit",
	        "packet_file",
	    )
	    repo_entries = [
	        {field: entry.get(field) for field in copied_fields}
	        for entry in packet_records
	    ]
	    return {
	        "schema_version": PROVIDER_BENCHMARK_SCHEMA_VERSION,
	        "generated_at": date.today().isoformat(),
	        "stem_ai_version": __version__,
	        "benchmark_type": "provider_packet_readiness",
	        "source_manifest": str(source_manifest),
	        "source_schema_version": source.get("schema_version"),
	        "repo_count": len(packet_records),
	        "response_validation_count": len(response_records),
	        "packet_profile": "provider_budgeted",
	        "api_calls_made_by_script": False,
	        "repos": repo_entries,
	    }


	def _response_path(response_dir: Path | None, repo: dict[str, Any]) -> Path | None:
	    """Locate the provider response file for ``repo`` inside ``response_dir``.

	    Candidate filenames are tried in this order and the first existing one wins:

	    1. ``<local_name>_provider_advisory.json``
	    2. ``<local_name>.json``
	    3. ``<safe name of repo>_provider_advisory.json``

	    Candidates whose source field (``local_name`` or ``repo``) is missing or
	    empty are skipped, so the lookup never probes for names such as
	    ``None.json``.

	    Args:
	        response_dir: Directory to search, or ``None`` when no responses were supplied.
	        repo: Manifest entry; the ``local_name`` and ``repo`` keys are read.

	    Returns:
	        The path of the first existing candidate, or ``None`` if
	        ``response_dir`` is ``None`` or nothing matches.
	    """
	    if response_dir is None:
	        return None

	    candidates: list[str] = []
	    local_name = repo.get("local_name")
	    if local_name:
	        candidates.append(f"{local_name}_provider_advisory.json")
	        candidates.append(f"{local_name}.json")
	    repo_id = repo.get("repo")
	    if repo_id:
	        candidates.append(f"{_safe_name(repo_id)}_provider_advisory.json")

	    for name in candidates:
	        candidate = response_dir / name
	        if candidate.exists():
	            return candidate
	    return None


	def _write_json(path: Path, value: Any) -> None:
	    """Serialize ``value`` as 2-space-indented JSON and write it to ``path`` as UTF-8."""
	    serialized = json.dumps(value, indent=2)
	    path.write_text(serialized, encoding="utf-8")


	def _write_jsonl(path: Path, records: list[dict[str, Any]]) -> None:
	    """Write ``records`` to ``path`` as JSON Lines encoded in UTF-8.

	    Each record is dumped with sorted keys on its own newline-terminated
	    line; an empty ``records`` list yields an empty file.
	    """
	    encoded_rows = [json.dumps(row, sort_keys=True) for row in records]
	    payload = "".join(f"{encoded}\n" for encoded in encoded_rows)
	    path.write_text(payload, encoding="utf-8")


	def _write_notes(
	    path: Path,
	    failures: list[str],
	    response_dir: Path | None,
	    response_records: list[dict[str, Any]],
	) -> None:
	    """Write the Markdown notes file that summarizes the benchmark run.

	    Args:
	        path: Destination file; written as UTF-8 and overwritten if present.
	        failures: Pre-formatted Markdown lines, one per failure. When empty,
	            the "Failures" section contains the single line ``None``.
	        response_dir: Directory responses were read from, or ``None`` when
	            no directory was provided.
	        response_records: Validation records; only their count is reported.
	    """
	    # Compare against None explicitly; Path objects are always truthy.
	    if response_dir is not None:
	        response_line = f"Response directory: `{response_dir}`"
	    else:
	        response_line = "Response directory: not provided"

	    lines = [
	        "# Provider Response Benchmark Notes",
	        "",
	        "This benchmark script makes no provider API calls.",
	        "It exports provider-budgeted packets and optionally validates existing provider response JSON files.",
	        "",
	        response_line,
	        f"Response validations: {len(response_records)}",
	        "",
	        "## Failures",
	        "",
	    ]
	    lines.extend(failures or ["None"])
	    # The trailing empty element makes the joined text end with a newline.
	    lines.append("")
	    path.write_text("\n".join(lines), encoding="utf-8")


	# Run the benchmark only when executed as a script; main()'s return value
	# becomes the process exit status.
	if __name__ == "__main__":
	    sys.exit(main())