Spaces:
Paused
Paused
CrispStrobe committed on
Commit ·
ac03708
1
Parent(s): db007de
feat: complete full set of Artificial Analysis metrics
Browse files
scripts/fetch-benchmarks.js
CHANGED
|
@@ -399,10 +399,16 @@ async function fetchArtificialAnalysis() {
|
|
| 399 |
aa_id: m.id,
|
| 400 |
aa_name: m.name,
|
| 401 |
aa_slug: m.slug,
|
| 402 |
-
aa_intelligence: ev.artificial_analysis_intelligence_index, //
|
|
|
|
|
|
|
| 403 |
aa_mmlu_pro: ev.mmlu_pro, // 0-1
|
| 404 |
aa_gpqa: ev.gpqa, // 0-1
|
| 405 |
aa_livecodebench: ev.livecodebench, // 0-1
|
|
|
|
|
|
|
|
|
|
|
|
|
| 406 |
aa_tokens_per_s: m.median_output_tokens_per_second,
|
| 407 |
aa_latency_s: m.median_time_to_first_token_seconds,
|
| 408 |
};
|
|
@@ -480,7 +486,7 @@ const SOURCE_FIELDS = {
|
|
| 480 |
livebench: ['lb_name', 'lb_global', 'lb_reasoning', 'lb_coding', 'lb_math', 'lb_language', 'lb_if', 'lb_data_analysis'],
|
| 481 |
arena: ['arena_name', 'arena_org', 'arena_elo', 'arena_rank', 'arena_votes'],
|
| 482 |
aider: ['aider_model', 'aider_pass_rate'],
|
| 483 |
-
aa: ['aa_id', 'aa_intelligence', 'aa_mmlu_pro', 'aa_gpqa', 'aa_livecodebench', 'aa_tokens_per_s', 'aa_latency_s'],
|
| 484 |
};
|
| 485 |
|
| 486 |
const SOURCE_ID_FIELD = {
|
|
|
|
| 399 |
aa_id: m.id,
|
| 400 |
aa_name: m.name,
|
| 401 |
aa_slug: m.slug,
|
| 402 |
+
aa_intelligence: ev.artificial_analysis_intelligence_index, // 0-100
|
| 403 |
+
aa_coding: ev.artificial_analysis_coding_index, // 0-100
|
| 404 |
+
aa_math: ev.artificial_analysis_math_index, // 0-100
|
| 405 |
aa_mmlu_pro: ev.mmlu_pro, // 0-1
|
| 406 |
aa_gpqa: ev.gpqa, // 0-1
|
| 407 |
aa_livecodebench: ev.livecodebench, // 0-1
|
| 408 |
+
aa_hle: ev.hle,
|
| 409 |
+
aa_scicode: ev.scicode,
|
| 410 |
+
aa_math_500: ev.math_500,
|
| 411 |
+
aa_aime: ev.aime,
|
| 412 |
aa_tokens_per_s: m.median_output_tokens_per_second,
|
| 413 |
aa_latency_s: m.median_time_to_first_token_seconds,
|
| 414 |
};
|
|
|
|
| 486 |
livebench: ['lb_name', 'lb_global', 'lb_reasoning', 'lb_coding', 'lb_math', 'lb_language', 'lb_if', 'lb_data_analysis'],
|
| 487 |
arena: ['arena_name', 'arena_org', 'arena_elo', 'arena_rank', 'arena_votes'],
|
| 488 |
aider: ['aider_model', 'aider_pass_rate'],
|
| 489 |
+
aa: ['aa_id', 'aa_intelligence', 'aa_coding', 'aa_math', 'aa_mmlu_pro', 'aa_gpqa', 'aa_livecodebench', 'aa_hle', 'aa_scicode', 'aa_math_500', 'aa_aime', 'aa_tokens_per_s', 'aa_latency_s'],
|
| 490 |
};
|
| 491 |
|
| 492 |
const SOURCE_ID_FIELD = {
|