laguna-martini / scripts /eval_swebench.py
nikgeo's picture
Publish Laguna Martini grouped-pruning model card and reproducibility artifacts
6f11713 verified
Raw
History Blame Contribute Delete
635 Bytes
#!/usr/bin/env python3
"""Record and run an explicit SWE-bench command."""
from __future__ import annotations
import argparse
import sys
from pathlib import Path
sys.path.insert(0, str(Path(__file__).resolve().parents[1]))
from heapr.eval.swe_bench import run_swebench_command
def parse_args(argv: list[str] | None = None) -> argparse.Namespace:
    """Parse the command-line arguments for this script.

    Args:
        argv: Argument strings to parse. When ``None`` (the default),
            argparse reads ``sys.argv[1:]``, which matches the previous
            zero-argument behavior.

    Returns:
        A namespace with ``output_dir`` (str) and ``cmd`` (a non-empty list
        of str holding the command and its arguments).
    """
    parser = argparse.ArgumentParser(
        description="Record and run an explicit SWE-bench command.",
    )
    parser.add_argument(
        "--output-dir",
        required=True,
        help="Output location forwarded as output_dir to the runner.",
    )
    # nargs="+" requires at least one token. Tokens that start with "-" are
    # treated as options of this script unless they follow a "--" separator.
    parser.add_argument(
        "cmd",
        nargs="+",
        help=(
            "Command to run, followed by its arguments. Put '--' before the "
            "command if any of its arguments start with '-'."
        ),
    )
    return parser.parse_args(argv)
def main() -> None:
    """Script entry point: parse the CLI, run the command, then exit.

    The parsed ``cmd`` list and ``output_dir`` value are handed to
    ``run_swebench_command``; whatever that call returns is used as the
    argument to ``SystemExit`` (presumably a process exit status -- confirm
    against ``heapr.eval.swe_bench``).

    Raises:
        SystemExit: Always, carrying the value returned by
            ``run_swebench_command``.
    """
    cli = parse_args()
    exit_status = run_swebench_command(cli.cmd, output_dir=cli.output_dir)
    raise SystemExit(exit_status)
# Run the CLI only when this file is executed as a script, not on import.
if __name__ == "__main__":
    main()