{
  "model_name": "PPO Pyramids Agent",
  "algorithm": "PPO",
  "environment": "ML-Agents-Pyramids",
  "performance": {
    "mean_reward": 5.1,
    "std_reward": 0.85,
    "pyramids_completed": 5.0
  },
  "training": {
    "episodes": 3000,
    "framework": "PyTorch",
    "course": "Hugging Face Deep RL Course Unit 5"
  },
  "tags": [
    "ML-Agents-Pyramids",
    "ppo",
    "deep-reinforcement-learning",
    "reinforcement-learning",
    "ml-agents"
  ]
}