{ "timesteps": 200000, "model_class": "PPO", "eval_idx": 5 }