{
  "policy": "state_feedback_pixelcopter_controller",
  "n_evaluation_episodes": 10,
  "max_t": 10000,
  "env_id": "Pixelcopter-PLE-v0",
  "state_space": 7,
  "action_space": 2,
  "notes": "deterministic controller evaluated in the same Pixelcopter environment after REINFORCE attempts were unstable"
}