{"mean_reward": 256.12838847355147, "std_reward": 16.05784264176309, "is_deterministic": true, "n_eval_episodes": 10, "eval_datetime": "2026-02-04T20:42:50.421437"}