File size: 923 Bytes
38c9982
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
from src.executive_assistant.agent import BaselineAgent
from src.executive_assistant.runner import run_policy_suite


def test_run_policy_suite_returns_all_requested_tasks() -> None:
    """Check that the suite result covers exactly the tasks that were requested.

    Runs ``run_policy_suite`` with a ``BaselineAgent`` policy over two task
    names and asserts that iterating the returned object yields precisely
    those two names (no extras, none missing).
    """
    expected_tasks = ("easy_deadline_extraction", "hard_rag_reply")

    # Hand the runner its own list so the expectation above stays untouched.
    suite_result = run_policy_suite(
        policy=BaselineAgent(),
        task_names=list(expected_tasks),
    )

    returned_names = set(suite_result)
    assert returned_names == set(expected_tasks)


def test_episode_runner_exposes_explicit_workflow_steps() -> None:
    """Drive one initialize/advance cycle on ``EpisodeRunner`` by hand.

    Builds a runner around ``BaselineAgent`` with ``max_steps=12``,
    initializes the ``easy_deadline_extraction`` task, advances once, and
    checks the resulting step record, observation status and reward flag.
    """
    # Imported locally, as in the original test, rather than at module level.
    from src.executive_assistant.runner import EpisodeRunner

    task_name = "easy_deadline_extraction"
    episode_runner = EpisodeRunner(policy=BaselineAgent(), max_steps=12)

    environment, first_observation = episode_runner.initialize(task_name)
    step_result = episode_runner.advance(task_name, environment, first_observation)

    # advance() is expected to hand back four items; the first is unused here.
    _, second_observation, step_reward, step_record = step_result

    assert step_record.step_index == 1
    assert second_observation.last_action_status == "email read"
    assert step_reward.is_done is False