File size: 2,181 Bytes
9ea9f15
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
{
  "domain": "game",
  "scenario_id": "wikiwiper",
  "reset_payload": {
    "seed": 42,
    "scenario_id": "wikiwiper",
    "mission_id": "wikiwiper_game_sample",
    "options": {
      "env_id": "omnibench_aegis_env:game.wikiwiper",
      "max_steps": 8,
      "target_score": 1
    }
  },
  "action_examples": {
    "canonical": [
      {
        "name": "inspect_objective",
        "args": {}
      },
      {
        "name": "scan_zone",
        "args": {}
      },
      {
        "name": "select_tool",
        "args": {
          "tool_slot": "hotbar.2"
        }
      },
      {
        "name": "navigate_route",
        "args": {
          "route": "lower_corridor"
        }
      },
      {
        "name": "engage_threat",
        "args": {
          "aggressive": false
        }
      },
      {
        "name": "wipe_target",
        "args": {
          "target_id": "target-archive-core"
        }
      },
      {
        "name": "verify_cleanup",
        "args": {}
      },
      {
        "name": "submit_run",
        "args": {}
      }
    ],
    "shorthand": [
      {
        "action": "inspect_objective"
      },
      {
        "action": "scan_zone"
      },
      {
        "action": "select_tool",
        "tool_slot": "hotbar.2"
      },
      {
        "action": "navigate_route",
        "route": "lower_corridor"
      },
      {
        "action": "engage_threat",
        "aggressive": false
      },
      {
        "action": "wipe_target",
        "target_id": "target-archive-core"
      },
      {
        "action": "verify_cleanup"
      },
      {
        "action": "submit_run"
      }
    ]
  },
  "expected_good_trajectory": [
    "inspect_objective",
    "scan_zone",
    "select_tool",
    "navigate_route",
    "engage_threat",
    "wipe_target",
    "verify_cleanup",
    "submit_run"
  ],
  "expected_flow": [
    "health",
    "reset",
    "step",
    "state"
  ],
  "notes": [
    "Aligned fixture for the real wikiwiper domain.",
    "Uses domain-level semantic actions instead of raw control vectors.",
    "The selected tool slot and target_id match the default seeded wikiwiper variant used in local smoke/eval runs."
  ]
}