---
library_name: ml-agents
tags:
- ML-Agents-Pyramids
- deep-rl-course
- reinforcement-learning
- reinforcement-learning-leaderboard
model-index:
- name: ppo-Pyramids
  results:
  - task:
      type: reinforcement-learning
      name: reinforcement-learning
    dataset:
      name: ML-Agents-Pyramids
      type: ML-Agents-Pyramids
    metrics:
    - type: mean_reward
      value: 2.0
      name: mean_reward
---
# ppo-Pyramids

Surgical fix for Unit 5.