lemer-bk / results /stock-e2b-bf16-math-temp0.json
lthn's picture
data: add benchmark result stock-e2b-bf16-math-temp0.json
86673fd verified
{
"model": "mlx-community/gemma-4-e2b-it-bf16",
"benchmark": "MMLU-Pro",
"method": "rapid-mlx + openai SDK + google parse_response",
"temperature": 0.0,
"processor": "google/gemma-4-E2B-it",
"num_runs": 1,
"limit_per_subject": 20,
"runs": [
{
"math": {
"correct": 2,
"total": 20,
"accuracy": 0.1
},
"_overall": {
"correct": 2,
"total": 20,
"accuracy": 0.1
},
"_elapsed_s": 394.3
}
]
}