Update README.md
Browse files
README.md
CHANGED
|
@@ -13,8 +13,8 @@ model-index:
|
|
| 13 |
type: reinforcement-learning
|
| 14 |
name: reinforcement-learning
|
| 15 |
dataset:
|
| 16 |
-
name: LunarLander-v3
|
| 17 |
-
type: LunarLander-v3
|
| 18 |
metrics:
|
| 19 |
- type: mean_reward
|
| 20 |
value: -133.10 +/- 53.34
|
|
@@ -24,7 +24,7 @@ model-index:
|
|
| 24 |
|
| 25 |
# PPO Agent Playing LunarLander-v3
|
| 26 |
|
| 27 |
-
This is a trained model of a PPO agent playing LunarLander-v3.
|
| 28 |
|
| 29 |
# Hyperparameters
|
| 30 |
```python
|
|
@@ -36,7 +36,7 @@ model-index:
|
|
| 36 |
'wandb_project_name': 'cleanRL'
|
| 37 |
'wandb_entity': None
|
| 38 |
'capture_video': False
|
| 39 |
-
'env_id': 'LunarLander-v3'
|
| 40 |
'total_timesteps': 50000
|
| 41 |
'learning_rate': 0.00025
|
| 42 |
'num_envs': 4
|
|
|
|
| 13 |
type: reinforcement-learning
|
| 14 |
name: reinforcement-learning
|
| 15 |
dataset:
|
| 16 |
+
name: LunarLander-v2
|
| 17 |
+
type: LunarLander-v2
|
| 18 |
metrics:
|
| 19 |
- type: mean_reward
|
| 20 |
value: -133.10 +/- 53.34
|
|
|
|
| 24 |
|
| 25 |
# PPO Agent Playing LunarLander-v3
|
| 26 |
|
| 27 |
+
This is a trained model of a PPO agent playing LunarLander-v2.
|
| 28 |
|
| 29 |
# Hyperparameters
|
| 30 |
```python
|
|
|
|
| 36 |
'wandb_project_name': 'cleanRL'
|
| 37 |
'wandb_entity': None
|
| 38 |
'capture_video': False
|
| 39 |
+
'env_id': 'LunarLander-v2'
|
| 40 |
'total_timesteps': 50000
|
| 41 |
'learning_rate': 0.00025
|
| 42 |
'num_envs': 4
|