{ "mean_reward": 500.0, "std_reward": 0.0, "datetime": "2025-07-29T12:27:37.503071+00:00", "train_duration_min": "1.06" }