Upload metadata.json
Browse files
runs/agent1_2026-04-16/metadata.json
CHANGED
|
@@ -5,5 +5,6 @@
|
|
| 5 |
"description": "The first AutoBench run to measure agentic performance of top LLMs",
|
| 6 |
"blog_url": "https://huggingface.co/blog/PeterKruger/autobench-agentic-1",
|
| 7 |
"model_count": 31,
|
| 8 |
-
"is_latest": true
|
|
|
|
| 9 |
}
|
|
|
|
| 5 |
"description": "The first AutoBench run to measure agentic performance of top LLMs",
|
| 6 |
"blog_url": "https://huggingface.co/blog/PeterKruger/autobench-agentic-1",
|
| 7 |
"model_count": 31,
|
| 8 |
+
"is_latest": true,
|
| 9 |
+
"benchmark_comparison_note": "This run targets agentic performance; reference scores are drawn from agentic benchmarks alongside the Artificial Analysis Intelligence Index."
|
| 10 |
}
|