File size: 1,343 Bytes
1ac264d
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
{
  "input": "https://arxiv.org/abs/2508.13142",
  "resolved_source_url": "https://arxiv.org/pdf/2508.13142.pdf",
  "analysis": {
    "benchmark_name": "EASI",
    "benchmark_aliases": [
      "EASI-Leaderboard"
    ],
    "source_type": "paper",
    "table_hint": "Table 3",
    "likely_metrics": [
      "MRA",
      "Acc",
      "CAA",
      "F1"
    ],
    "search_terms": [
      "EASI leaderboard",
      "EASI benchmark",
      "Spatial Intelligence benchmark"
    ],
    "notes": "The paper introduces the EASI framework for evaluating Multimodal LLMs on Spatial Intelligence. It includes an accompanying leaderboard. Table 3 presents results for various models on eight key spatial benchmarks under the 'Official Protocol'."
  },
  "seed_work_openalex_id": "https://openalex.org/W2117359358",
  "seed_work_title": "The eczema area and severity index (EASI): assessment of reliability in atopic dermatitis",
  "notes": [
    "Fetched source URL content for extraction planning."
  ],
  "plan_steps": [
    "Extract the seed benchmark leaderboard from the provided source.",
    "Find possible newer benchmark results from citing works.",
    "Screen citations for benchmark-relevant score tables.",
    "Merge, deduplicate, and store leaderboard rows with citations.",
    "Generate Gradio app files for Hugging Face deployment."
  ]
}