Commit
·
4e15a01
1
Parent(s):
d7ef094
improved agent
Browse files
- config.json +1 -1
- model.safetensors +1 -1
- model.zip +2 -2
- record.py +2 -1
- replay.mp4 +2 -2
- results.json +2 -2
config.json
CHANGED
|
@@ -6,7 +6,7 @@
|
|
| 6 |
"activation_fn" : "nn.ReLU",
|
| 7 |
"net_arch" : "dict(vf=[512, 256], pi=[256, 128])"
|
| 8 |
},
|
| 9 |
-
"learning_rate" :
|
| 10 |
"n_steps" : 256,
|
| 11 |
"batch_size" : 1024,
|
| 12 |
"n_epochs" : 4,
|
|
|
|
| 6 |
"activation_fn" : "nn.ReLU",
|
| 7 |
"net_arch" : "dict(vf=[512, 256], pi=[256, 128])"
|
| 8 |
},
|
| 9 |
+
"learning_rate" : "linear_schedule(3e-4,1e-6)",
|
| 10 |
"n_steps" : 256,
|
| 11 |
"batch_size" : 1024,
|
| 12 |
"n_epochs" : 4,
|
model.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 8978048
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:6dabad1bd1cf1028acb2f714cb7f5abb7ac8cae118a7261340b19204af34ee6d
|
| 3 |
size 8978048
|
model.zip
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
-
size
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:4e242c0ca3b0fdc713582ed1489f9177bcee8b7da1820d40bfd78efb4134c144
|
| 3 |
+
size 27429328
|
record.py
CHANGED
|
@@ -23,7 +23,8 @@ if __name__ == "__main__":
|
|
| 23 |
frames = []
|
| 24 |
|
| 25 |
obs = env.reset()
|
| 26 |
-
|
|
|
|
| 27 |
action, _ = agent.predict(obs)
|
| 28 |
obs, _, done, _ = env.step(action)
|
| 29 |
frame = env.render()
|
|
|
|
| 23 |
frames = []
|
| 24 |
|
| 25 |
obs = env.reset()
|
| 26 |
+
|
| 27 |
+
for _ in range(1500):
|
| 28 |
action, _ = agent.predict(obs)
|
| 29 |
obs, _, done, _ = env.step(action)
|
| 30 |
frame = env.render()
|
replay.mp4
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
-
size
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:150c0d07ea35a2d682a5f927e542d878cb7c200eaaf3645b94e78b82aa201e0f
|
| 3 |
+
size 412218
|
results.json
CHANGED
|
@@ -1,6 +1,6 @@
|
|
| 1 |
{
|
| 2 |
-
"mean_reward":
|
| 3 |
-
"std_reward":
|
| 4 |
"episodes": 100,
|
| 5 |
"is_deterministic": true
|
| 6 |
}
|
|
|
|
| 1 |
{
|
| 2 |
+
"mean_reward": 599.54,
|
| 3 |
+
"std_reward": 131.49809276183439,
|
| 4 |
"episodes": 100,
|
| 5 |
"is_deterministic": true
|
| 6 |
}
|