{ "policy": "state_feedback_pixelcopter_controller", "n_evaluation_episodes": 10, "max_t": 10000, "env_id": "Pixelcopter-PLE-v0", "state_space": 7, "action_space": 2, "notes": "deterministic controller evaluated in the same Pixelcopter environment after REINFORCE attempts were unstable" }