DarshanScripts committed on
Commit
390fdeb
·
verified ·
1 Parent(s): 1acd444

Upload stratego/benchmarking/main_benchmark.py with huggingface_hub

Browse files
stratego/benchmarking/main_benchmark.py ADDED
@@ -0,0 +1,35 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ # stratego/benchmarking/main_benchmark.py
2
+
3
+ import argparse
4
+ from stratego.models.ollama_model import OllamaAgent
5
+ from .run_benchmark import run_benchmark
6
+
7
+
8
def benchmark(argv=None):
    """Run a benchmark between two Ollama-backed agents and print a summary.

    Command-line options:
        --p0, --p1: names handed to ``OllamaAgent`` for the first and second
            agent (presumably Ollama model tags -- confirm against
            ``OllamaAgent``).
        --size: integer forwarded to ``run_benchmark`` as ``size``.
        --games: integer forwarded to ``run_benchmark`` as ``games``.

    Args:
        argv: Optional list of argument strings to parse. When ``None``
            (the default) argparse falls back to ``sys.argv[1:]``, so
            existing zero-argument callers behave as before.
    """
    parser = argparse.ArgumentParser()
    parser.add_argument("--p0", default="llama3.1:70b")
    parser.add_argument("--p1", default="gemma3:1b")
    # type=int lets argparse reject non-numeric input with a usage error
    # before any agent is constructed, instead of a ValueError traceback
    # from a later int() call.
    parser.add_argument("--size", type=int, default=6)
    parser.add_argument("--games", type=int, default=3)
    args = parser.parse_args(argv)

    agent0 = OllamaAgent(args.p0)
    agent1 = OllamaAgent(args.p1)

    summary, csv_path = run_benchmark(
        agent0,
        agent1,
        games=args.games,
        size=args.size,
    )

    print("\n=== BENCHMARK SUMMARY ===")
    print(f"Source CSV: {csv_path}")
    for key, value in summary.items():
        print(f"{key:25s}: {value}")
32
+
33
+
34
def main() -> None:
    """Entry point: delegate to ``benchmark``."""
    benchmark()