OpenRA-Bench / r_amc_medium.json
yxc20098's picture
prompt_v2: sanitize confusing 'Buildings: ? ()' briefing line
5a3c04b
Raw
History Blame Contribute Delete
1.57 kB
{
"run_id": "20260519-060529",
"model": "qwen/qwen3.6-flash",
"truncated": false,
"resumed": 0,
"cost": {
"calls": 13,
"prompt_tokens": 60915,
"completion_tokens": 7157,
"usd": 0.0,
"max_usd": 0.0
},
"summary": {
"action-multiunit-coordination:medium": {
"n": 1,
"win_rate": 1.0,
"composite_mean": 0.8044,
"composite_std": 0.0,
"perception_mean": 0.7405,
"reasoning_mean": 0.9414,
"action_mean": 1.0,
"objective_mean": 1.0,
"weakest_link_hist": {
"perception": 1
}
}
},
"overall": {
"n": 1,
"win_rate": 1.0,
"composite_mean": 0.8044,
"composite_std": 0.0,
"perception_mean": 0.7405,
"reasoning_mean": 0.9414,
"action_mean": 1.0,
"objective_mean": 1.0,
"weakest_link_hist": {
"perception": 1
}
},
"reward_vector_mean": {
"economy": 0.5,
"military": 0.1,
"territory": 0.6293,
"scouting": 0.5,
"objective": 1.0
},
"episodes": [
{
"cell": "action-multiunit-coordination:medium",
"capability": "action",
"split": "public",
"seed": 1,
"outcome": "win",
"composite": 0.8044,
"perception": 0.7405,
"reasoning": 0.9414,
"action": 1.0,
"weakest_link": "perception",
"objective_progress": 1.0,
"reward_vector": {
"economy": 0.5,
"military": 0.1,
"territory": 0.6293,
"scouting": 0.5,
"objective": 1.0
},
"turns": 13,
"notes": []
}
],
"skipped": []
}