Akchunks committed on
Commit
d39f8b2
·
verified ·
1 Parent(s): ba8901f

Upload PPO agent

Browse files
Files changed (3) hide show
  1. README.md +6 -47
  2. model.pt +2 -2
  3. replay.mp4 +0 -0
README.md CHANGED
@@ -1,59 +1,18 @@
1
  ---
2
- tags:
3
- - LunarLander-v3
4
- - ppo
5
- - reinforcement-learning
6
- - cleanrl
7
- - colab
8
  model-index:
9
- - name: PPO
10
  results:
11
  - task:
12
  type: reinforcement-learning
13
  name: reinforcement-learning
14
  dataset:
15
- name: LunarLander-v3
16
- type: LunarLander-v3
17
  metrics:
18
  - type: mean_reward
19
- value: -200.82 +/- 95.02
20
  name: mean_reward
21
  verified: false
22
  ---
23
- # PPO Agent for LunarLander-v3
24
-
25
- Mean reward: -200.82 ± 95.02
26
-
27
- ```python
28
- {
29
- "exp_name": "ppo_colab",
30
- "seed": 1,
31
- "torch_deterministic": true,
32
- "cuda": true,
33
- "track": false,
34
- "wandb_project_name": "cleanRL",
35
- "wandb_entity": null,
36
- "capture_video": true,
37
- "env_id": "LunarLander-v3",
38
- "total_timesteps": 10,
39
- "learning_rate": 0.00025,
40
- "num_envs": 1,
41
- "num_steps": 128,
42
- "anneal_lr": true,
43
- "gae": true,
44
- "gamma": 0.99,
45
- "gae_lambda": 0.95,
46
- "num_minibatches": 1,
47
- "update_epochs": 4,
48
- "norm_adv": true,
49
- "clip_coef": 0.2,
50
- "clip_vloss": true,
51
- "ent_coef": 0.01,
52
- "vf_coef": 0.5,
53
- "max_grad_norm": 0.5,
54
- "target_kl": null,
55
- "repo_id": "Akchunks/LunarLander-v2",
56
- "batch_size": 128,
57
- "minibatch_size": 128
58
- }
59
- ```
 
1
  ---
 
 
 
 
 
 
2
  model-index:
3
+ - name: PPO LunarLander-v2
4
  results:
5
  - task:
6
  type: reinforcement-learning
7
  name: reinforcement-learning
8
  dataset:
9
+ name: LunarLander-v2
10
+ type: LunarLander-v2
11
  metrics:
12
  - type: mean_reward
13
+ value: -203.00 +/- 131.58
14
  name: mean_reward
15
  verified: false
16
  ---
17
+ # PPO Agent for LunarLander-v2
18
+ Mean reward: -203.00 ± 131.58
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
model.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:701d954461323cfbc3d99b1b5933e746fe6c44ac2196732d35fbc3e401205b23
3
- size 42898
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b50b2efda5140d2b81aa36a60540e4d33765745d06096cf453ca892556280ac3
3
+ size 43291
replay.mp4 CHANGED
Binary files a/replay.mp4 and b/replay.mp4 differ