Upload 5 files
Browse files- .gitattributes +1 -0
- PPO_PongNoFrameskip-v4_performance.png +0 -0
- best_model.zip +2 -2
- best_model_atari_pong_ppo-step-0-to-step-10000.mp4 +3 -0
- evaluations.npz +2 -2
- parameters.json +1 -1
.gitattributes
CHANGED
|
@@ -35,3 +35,4 @@ saved_model/**/* filter=lfs diff=lfs merge=lfs -text
|
|
| 35 |
*tfevents* filter=lfs diff=lfs merge=lfs -text
|
| 36 |
best_model_atari_pong_ppo-step-0-to-step-5000.mp4 filter=lfs diff=lfs merge=lfs -text
|
| 37 |
replay.mp4 filter=lfs diff=lfs merge=lfs -text
|
|
|
|
|
|
| 35 |
*tfevents* filter=lfs diff=lfs merge=lfs -text
|
| 36 |
best_model_atari_pong_ppo-step-0-to-step-5000.mp4 filter=lfs diff=lfs merge=lfs -text
|
| 37 |
replay.mp4 filter=lfs diff=lfs merge=lfs -text
|
| 38 |
+
best_model_atari_pong_ppo-step-0-to-step-10000.mp4 filter=lfs diff=lfs merge=lfs -text
|
PPO_PongNoFrameskip-v4_performance.png
ADDED
|
best_model.zip
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
-
size
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:2460a602bfb33cf624792eb24d761855943ab98a7b13746568ed881727baa27f
|
| 3 |
+
size 20742060
|
best_model_atari_pong_ppo-step-0-to-step-10000.mp4
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:d20b31810dec61a38586377f90e73d00a8918e470e532ed5d5654f588ee08ab8
|
| 3 |
+
size 205820
|
evaluations.npz
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
-
size
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:ff1cfa6312513bdadf508289098c29cc3013574c9e3798586819eb7b20a28f6c
|
| 3 |
+
size 1650
|
parameters.json
CHANGED
|
@@ -3,7 +3,7 @@
|
|
| 3 |
"env_str": "PongNoFrameskip-v4",
|
| 4 |
"rl_type": "PPO",
|
| 5 |
"eval_freq": 50000,
|
| 6 |
-
"total_timesteps":
|
| 7 |
"clip_range": 0.1,
|
| 8 |
"learning_rate": 0.00025,
|
| 9 |
"n_steps": 128,
|
|
|
|
| 3 |
"env_str": "PongNoFrameskip-v4",
|
| 4 |
"rl_type": "PPO",
|
| 5 |
"eval_freq": 50000,
|
| 6 |
+
"total_timesteps": 4000000,
|
| 7 |
"clip_range": 0.1,
|
| 8 |
"learning_rate": 0.00025,
|
| 9 |
"n_steps": 128,
|