lthn committed on
Commit
4e3885c
·
verified ·
1 Parent(s): 1a9b96a

data: add benchmark result stock-e2b-bf16-math-nothink-temp1.json

Browse files
results/stock-e2b-bf16-math-nothink-temp1.json ADDED
@@ -0,0 +1,24 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "model": "mlx-community/gemma-4-e2b-it-bf16",
3
+ "benchmark": "MMLU-Pro",
4
+ "method": "rapid-mlx + openai SDK + google parse_response",
5
+ "temperature": 1.0,
6
+ "processor": "google/gemma-4-E2B-it",
7
+ "num_runs": 1,
8
+ "limit_per_subject": 20,
9
+ "runs": [
10
+ {
11
+ "math": {
12
+ "correct": 2,
13
+ "total": 20,
14
+ "accuracy": 0.1
15
+ },
16
+ "_overall": {
17
+ "correct": 2,
18
+ "total": 20,
19
+ "accuracy": 0.1
20
+ },
21
+ "_elapsed_s": 175.0
22
+ }
23
+ ]
24
+ }