lucasschott committed on
Commit
4e15a01
·
1 Parent(s): d7ef094

improved agent

Browse files
Files changed (6) hide show
  1. config.json +1 -1
  2. model.safetensors +1 -1
  3. model.zip +2 -2
  4. record.py +2 -1
  5. replay.mp4 +2 -2
  6. results.json +2 -2
config.json CHANGED
@@ -6,7 +6,7 @@
6
  "activation_fn" : "nn.ReLU",
7
  "net_arch" : "dict(vf=[512, 256], pi=[256, 128])"
8
  },
9
- "learning_rate" : 2.5e-4,
10
  "n_steps" : 256,
11
  "batch_size" : 1024,
12
  "n_epochs" : 4,
 
6
  "activation_fn" : "nn.ReLU",
7
  "net_arch" : "dict(vf=[512, 256], pi=[256, 128])"
8
  },
9
+ "learning_rate" : "linear_schedule(3e-4,1e-6)",
10
  "n_steps" : 256,
11
  "batch_size" : 1024,
12
  "n_epochs" : 4,
model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:79b3e4e51bfe3236e98c6ab08e1d19809b6879d64c561e426e0c7b2db7902db3
3
  size 8978048
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:6dabad1bd1cf1028acb2f714cb7f5abb7ac8cae118a7261340b19204af34ee6d
3
  size 8978048
model.zip CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:a68839cbf79160dcbcc9a431f98060e5b1a96c43fa9f6ba250288c1f9ed115af
3
- size 27426366
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:4e242c0ca3b0fdc713582ed1489f9177bcee8b7da1820d40bfd78efb4134c144
3
+ size 27429328
record.py CHANGED
@@ -23,7 +23,8 @@ if __name__ == "__main__":
23
  frames = []
24
 
25
  obs = env.reset()
26
- for _ in range(1000):
 
27
  action, _ = agent.predict(obs)
28
  obs, _, done, _ = env.step(action)
29
  frame = env.render()
 
23
  frames = []
24
 
25
  obs = env.reset()
26
+
27
+ for _ in range(1500):
28
  action, _ = agent.predict(obs)
29
  obs, _, done, _ = env.step(action)
30
  frame = env.render()
replay.mp4 CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:d492ac5e9dcd83531d247c79c8b51ea09f1472ebd943db2b93d5c6d10662da25
3
- size 295344
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:150c0d07ea35a2d682a5f927e542d878cb7c200eaaf3645b94e78b82aa201e0f
3
+ size 412218
results.json CHANGED
@@ -1,6 +1,6 @@
1
  {
2
- "mean_reward": 454.12,
3
- "std_reward": 36.65,
4
  "episodes": 100,
5
  "is_deterministic": true
6
  }
 
1
  {
2
+ "mean_reward": 599.54,
3
+ "std_reward": 131.49809276183439,
4
  "episodes": 100,
5
  "is_deterministic": true
6
  }