File size: 2,353 Bytes
951f760
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
#!/usr/bin/env python3
from __future__ import annotations

import json
from pathlib import Path
from typing import Any


def _require_path(payload: dict[str, Any], path: str) -> None:
    current: Any = payload
    for part in path.split('.'):
        if not isinstance(current, dict) or part not in current:
            raise ValueError(f"missing required field: {path}")
        current = current[part]


def validate_benchmark_contract(payload: dict[str, Any]) -> None:
    """Check that *payload* satisfies the benchmark contract.

    The checks run in this order and stop at the first failure:

    1. every required (dotted) field path is present;
    2. each of the four benchmark sections is a dict containing ``name``,
       ``primary_metric`` and ``decode``;
    3. ``seeds`` is a list with at least three entries;
    4. the ``hydra_full`` and ``baseline_mamba_matched`` variants both have
       ``status`` equal to ``"runnable_now"``.

    Args:
        payload: Decoded contract document.

    Raises:
        ValueError: If any check fails. A section or variant that is not a
            dict (for example ``None`` or a string) is also reported as
            ``ValueError`` rather than leaking ``TypeError`` or
            ``AttributeError`` from the lookups below.
    """
    required_fields = (
        "cycle_id",
        "hardware_class",
        "seeds",
        "budget_modes",
        "coding_benchmarks.fast_iteration",
        "coding_benchmarks.milestone",
        "reasoning_benchmarks.fast_iteration",
        "reasoning_benchmarks.milestone",
        "variants.hydra_full",
        "variants.baseline_mamba_matched",
    )
    for field in required_fields:
        _require_path(payload, field)

    # The path check above only proves the keys exist; the values may still
    # be null, strings or lists, so the type is verified before any key test.
    section_keys = ("name", "primary_metric", "decode")
    for group in ("coding_benchmarks", "reasoning_benchmarks"):
        for tier in ("fast_iteration", "milestone"):
            section = payload[group][tier]
            if not isinstance(section, dict) or any(
                key not in section for key in section_keys
            ):
                raise ValueError(
                    "benchmark sections require name, primary_metric, and decode"
                )

    seeds = payload["seeds"]
    if not isinstance(seeds, list) or len(seeds) < 3:
        raise ValueError("seeds must contain at least three values")

    for variant_name in ("hydra_full", "baseline_mamba_matched"):
        variant = payload["variants"][variant_name]
        # A non-dict variant has no status, so it cannot be runnable_now.
        status = variant.get("status") if isinstance(variant, dict) else None
        if status != "runnable_now":
            raise ValueError(f"{variant_name} must be runnable_now")


def load_benchmark_contract(path: Path) -> dict[str, Any]:
    """Read, parse and validate the benchmark contract stored at *path*.

    The file is read as UTF-8 text and decoded as JSON. Errors raised while
    reading or parsing the file propagate unchanged.

    Args:
        path: Location of the JSON contract file.

    Returns:
        The decoded contract, after it has passed
        ``validate_benchmark_contract``.

    Raises:
        ValueError: If the top-level JSON value is not an object, or if
            validation rejects the contract.
    """
    raw_text = path.read_text(encoding="utf-8")
    contract = json.loads(raw_text)
    if isinstance(contract, dict):
        validate_benchmark_contract(contract)
        return contract
    raise ValueError("benchmark contract must be a JSON object")


def main() -> int:
    """Load the cycle-1 execution-freeze contract and print it as JSON.

    The contract is read from ``artifacts/cycle_1_execution_freeze.json``,
    resolved relative to the current working directory, and written to
    stdout with two-space indentation and sorted keys.

    Returns:
        ``0`` once the contract has been printed. Any failure surfaces as
        an exception from the loader.
    """
    contract = load_benchmark_contract(
        Path("artifacts/cycle_1_execution_freeze.json")
    )
    rendered = json.dumps(contract, indent=2, sort_keys=True)
    print(rendered)
    return 0


# Script entry point: run main() and use its return value as the exit status.
if __name__ == "__main__":
    exit_code = main()
    raise SystemExit(exit_code)