wheattoast11 committed on
Commit
bdb8ce4
·
verified ·
1 Parent(s): 20fa6f2

Upload eval_baseline_v6.py with huggingface_hub

Browse files
Files changed (1) hide show
  1. eval_baseline_v6.py +25 -0
eval_baseline_v6.py ADDED
@@ -0,0 +1,25 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
# /// script
# requires-python = ">=3.10"
# dependencies = [
#     "lighteval[accelerate]>=0.6.0",
#     "torch>=2.0.0",
#     "transformers>=4.40.0",
#     "accelerate>=0.30.0",
# ]
# ///

"""Baseline eval: LiquidAI/LFM2.5-1.2B-Instruct on standard benchmarks.

Builds a ``lighteval accelerate`` command line and runs it as a child
process using the current interpreter. When executed as a script, the
process exits with the child's return code.
"""

import shlex
import subprocess
import sys

# Comma-separated key=value model arguments handed to lighteval as one argv item.
model_args = "model_name=LiquidAI/LFM2.5-1.2B-Instruct,trust_remote_code=True,dtype=bfloat16"
# Comma-separated task specs handed to lighteval as one argv item.
tasks = "leaderboard|mmlu|5,leaderboard|arc:challenge|25,leaderboard|truthfulqa:mc|0"

# Argument vector (no shell involved): run lighteval as a module of the
# interpreter that is executing this script.
cmd = [
    sys.executable, "-m", "lighteval", "accelerate",
    model_args, tasks,
    "--output-dir", "./eval_results_baseline",
]


def format_command(argv: list[str]) -> str:
    """Return *argv* as a single shell-quoted string.

    The task spec contains ``|`` characters, so a plain ``" ".join`` would
    print a line that a shell interprets as a pipeline when pasted back.
    """
    return shlex.join(argv)


def main() -> int:
    """Echo the command, run it, and return the child's return code."""
    # Flush so the banner precedes the child's output even when stdout is
    # redirected to a file or pipe (block-buffered).
    print(f"Running: {format_command(cmd)}", flush=True)
    result = subprocess.run(cmd, check=False)
    return result.returncode


if __name__ == "__main__":
    sys.exit(main())