{"mean_reward": 266.2081387, "std_reward": 21.719479219772705, "is_deterministic": true, "n_eval_episodes": 10, "eval_datetime": "2026-04-07T12:49:57.692002"}