CrispStrobe committed on
Commit
ac03708
·
1 Parent(s): db007de

feat: complete full set of Artificial Analysis metrics

Browse files
Files changed (1) hide show
  1. scripts/fetch-benchmarks.js +8 -2
scripts/fetch-benchmarks.js CHANGED
@@ -399,10 +399,16 @@ async function fetchArtificialAnalysis() {
399
  aa_id: m.id,
400
  aa_name: m.name,
401
  aa_slug: m.slug,
402
- aa_intelligence: ev.artificial_analysis_intelligence_index, // typically 0-100
 
 
403
  aa_mmlu_pro: ev.mmlu_pro, // 0-1
404
  aa_gpqa: ev.gpqa, // 0-1
405
  aa_livecodebench: ev.livecodebench, // 0-1
 
 
 
 
406
  aa_tokens_per_s: m.median_output_tokens_per_second,
407
  aa_latency_s: m.median_time_to_first_token_seconds,
408
  };
@@ -480,7 +486,7 @@ const SOURCE_FIELDS = {
480
  livebench: ['lb_name', 'lb_global', 'lb_reasoning', 'lb_coding', 'lb_math', 'lb_language', 'lb_if', 'lb_data_analysis'],
481
  arena: ['arena_name', 'arena_org', 'arena_elo', 'arena_rank', 'arena_votes'],
482
  aider: ['aider_model', 'aider_pass_rate'],
483
- aa: ['aa_id', 'aa_intelligence', 'aa_mmlu_pro', 'aa_gpqa', 'aa_livecodebench', 'aa_tokens_per_s', 'aa_latency_s'],
484
  };
485
 
486
  const SOURCE_ID_FIELD = {
 
399
  aa_id: m.id,
400
  aa_name: m.name,
401
  aa_slug: m.slug,
402
+ aa_intelligence: ev.artificial_analysis_intelligence_index, // 0-100
403
+ aa_coding: ev.artificial_analysis_coding_index, // 0-100
404
+ aa_math: ev.artificial_analysis_math_index, // 0-100
405
  aa_mmlu_pro: ev.mmlu_pro, // 0-1
406
  aa_gpqa: ev.gpqa, // 0-1
407
  aa_livecodebench: ev.livecodebench, // 0-1
408
+ aa_hle: ev.hle,
409
+ aa_scicode: ev.scicode,
410
+ aa_math_500: ev.math_500,
411
+ aa_aime: ev.aime,
412
  aa_tokens_per_s: m.median_output_tokens_per_second,
413
  aa_latency_s: m.median_time_to_first_token_seconds,
414
  };
 
486
  livebench: ['lb_name', 'lb_global', 'lb_reasoning', 'lb_coding', 'lb_math', 'lb_language', 'lb_if', 'lb_data_analysis'],
487
  arena: ['arena_name', 'arena_org', 'arena_elo', 'arena_rank', 'arena_votes'],
488
  aider: ['aider_model', 'aider_pass_rate'],
489
+ aa: ['aa_id', 'aa_intelligence', 'aa_coding', 'aa_math', 'aa_mmlu_pro', 'aa_gpqa', 'aa_livecodebench', 'aa_hle', 'aa_scicode', 'aa_math_500', 'aa_aime', 'aa_tokens_per_s', 'aa_latency_s'],
490
  };
491
 
492
  const SOURCE_ID_FIELD = {