{"mean_reward": 679.0, "std_reward": 144.80676779764127, "is_deterministic": false, "n_eval_episodes": 10, "eval_datetime": "2025-12-09T06:21:38.017298"}