visual_memory / scenarios /cascading_deduction_11x11.json
kdemon1011's picture
Upload folder using huggingface_hub
15503f9 verified
{
"scenario_id": "cascading_deduction_11x11",
"type": "hidden_grid",
"seed": 8401,
"board_width": 11,
"board_height": 11,
"hazard_count": 25,
"decoy_count": 5,
"max_steps": 38,
"max_hazard_reveals": 2,
"signal_mode": "partial",
"flags_count": 28,
"difficulty": "hard",
"description": "11x11 grid, 25 hazards, 5 decoys. Partial signals reveal only a subset of hazard directions plus a total hint. With 121 cells and 25 hazards, over 20% of the board is dangerous. The agent must chain partial deductions: signal A reveals 'N,E' out of 3 total → signal B at the inferred position reveals 'S,W' out of 2 → confirming hazard at intersection. Single-step reasoning sees incomplete clues. Models must track partial constraint sets across many reveals.",
"how_to_play": "Signals show partial directions like 'N,E' with a hint '3 total' — meaning 3 hazards nearby but only 2 directions shown. Chain deductions across signals: if cell A points East and cell B points West, a hazard sits between them. Flag all 25 hazards and submit.",
"tags": ["partial_observability", "multi_stage_solution", "unsafe_guess_penalty"],
"win_condition": {
"type": "flag_all_hazards"
}
}