File size: 1,240 Bytes
4db0438
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
"""Tests for literature-grounded benchmark utilities."""

from training.literature_benchmark import (
    run_paper_benchmark,
    select_literature_scenario,
)


def test_select_literature_scenario_for_ipf_prompt():
    """Check that an IPF / SPP1 macrophage prompt selects the lung biomarker scenario."""
    prompt = (
        "Validate SPP1-positive macrophage findings in idiopathic pulmonary fibrosis."
    )
    selected = select_literature_scenario(prompt)
    assert selected.name == "biomarker_validation_lung"


def test_select_literature_scenario_for_trajectory_prompt():
    """Check that a branching-lineage prompt selects the hematopoiesis trajectory scenario."""
    prompt = (
        "Recover branching hematopoietic lineages and branch point transcription factors."
    )
    selected = select_literature_scenario(prompt)
    assert selected.name == "hematopoiesis_trajectory"


def test_run_paper_benchmark_matches_curated_findings():
    """Run the lung biomarker benchmark without domain randomisation and check its result.

    The run must take at least one step, report matched papers, reach a
    match ratio of at least two thirds, and include at least one matched
    finding that mentions SPP1.
    """
    statement = (
        "Design a follow-up validation experiment for candidate biomarker "
        "SPP1 in idiopathic pulmonary fibrosis."
    )
    outcome = run_paper_benchmark(
        problem_statement=statement,
        scenario_name="biomarker_validation_lung",
        domain_randomise=False,
    )

    assert outcome.total_steps >= 1
    assert outcome.matched_papers
    assert outcome.match_ratio >= (2 / 3)
    # Generator (not a list) so the scan stops at the first SPP1 hit.
    assert any("SPP1" in text for text in outcome.matched_findings)