benjipeng committed on
Commit
d2cbd1f
·
1 Parent(s): e60b26c

Initial commit

Browse files
README.md CHANGED
@@ -16,7 +16,7 @@ model-index:
16
  type: SpaceInvadersNoFrameskip-v4
17
  metrics:
18
  - type: mean_reward
19
- value: 29.00 +/- 64.30
20
  name: mean_reward
21
  verified: false
22
  ---
@@ -70,9 +70,9 @@ OrderedDict([('batch_size', 32),
70
  ('exploration_fraction', 0.1),
71
  ('frame_stack', 4),
72
  ('gradient_steps', 1),
73
- ('learning_rate', 0.0005),
74
  ('learning_starts', 100000),
75
- ('n_timesteps', 100000.0),
76
  ('optimize_memory_usage', False),
77
  ('policy', 'CnnPolicy'),
78
  ('target_update_interval', 1000),
 
16
  type: SpaceInvadersNoFrameskip-v4
17
  metrics:
18
  - type: mean_reward
19
+ value: 711.00 +/- 224.01
20
  name: mean_reward
21
  verified: false
22
  ---
 
70
  ('exploration_fraction', 0.1),
71
  ('frame_stack', 4),
72
  ('gradient_steps', 1),
73
+ ('learning_rate', 0.0002),
74
  ('learning_starts', 100000),
75
+ ('n_timesteps', 1000000.0),
76
  ('optimize_memory_usage', False),
77
  ('policy', 'CnnPolicy'),
78
  ('target_update_interval', 1000),
args.yml CHANGED
@@ -54,7 +54,7 @@
54
  - - save_replay_buffer
55
  - false
56
  - - seed
57
- - 114831432
58
  - - storage
59
  - null
60
  - - study_name
 
54
  - - save_replay_buffer
55
  - false
56
  - - seed
57
+ - 4580660
58
  - - storage
59
  - null
60
  - - study_name
config.yml CHANGED
@@ -14,11 +14,11 @@
14
  - - gradient_steps
15
  - 1
16
  - - learning_rate
17
- - 0.0005
18
  - - learning_starts
19
  - 100000
20
  - - n_timesteps
21
- - 100000.0
22
  - - optimize_memory_usage
23
  - false
24
  - - policy
 
14
  - - gradient_steps
15
  - 1
16
  - - learning_rate
17
+ - 0.0002
18
  - - learning_starts
19
  - 100000
20
  - - n_timesteps
21
+ - 1000000.0
22
  - - optimize_memory_usage
23
  - false
24
  - - policy
dqn-SpaceInvadersNoFrameskip-v4.zip CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:8b4a637547e2320949a74768539426f3bea68fadd0ee69b7e3a425fdfc48e25a
3
- size 13714997
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:63f61fd87f083bb3f212979931cb384ab68677ea4005a461cb56d49a5cde8c11
3
+ size 27220122
dqn-SpaceInvadersNoFrameskip-v4/data CHANGED
The diff for this file is too large to render. See raw diff
 
dqn-SpaceInvadersNoFrameskip-v4/policy.optimizer.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:5abe8db2e07b1bf0a893ef3b3eb2235d6e756cb21498d756ac4bc6d486ecacff
3
- size 1120
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:77e0960d3c9420b6153932060ee1e55acc1ec80e02397820fc4d632b4683433e
3
+ size 13506236
dqn-SpaceInvadersNoFrameskip-v4/policy.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:1eb1a7caf01747d9f3561eef03e548ec52bb0a12918c0da397db6f7ee7e70cff
3
  size 13505370
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e87e628c816cf40afa986c84a53f41fe1a9bf5f3b0fa30ad1712b898c4fc37bc
3
  size 13505370
replay.mp4 CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:cae3de750f432875df42a4011aeedbc220ba38b313576b27b5dbc3ebf8a98d59
3
- size 294896
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:75329840b7dce42a56fba4f40c60b99535d5a2a92b371d3b6114485f6ee2549c
3
+ size 206158
results.json CHANGED
@@ -1 +1 @@
1
- {"mean_reward": 29.0, "std_reward": 64.29618962271404, "is_deterministic": false, "n_eval_episodes": 10, "eval_datetime": "2023-10-28T18:35:50.789835"}
 
1
+ {"mean_reward": 711.0, "std_reward": 224.00669632848033, "is_deterministic": false, "n_eval_episodes": 10, "eval_datetime": "2023-10-29T16:12:28.012089"}
train_eval_metrics.zip CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:fe79765c43033ff44853e414f534eaeb529e5a3b0884f24679a4f6e5c707fea9
3
- size 5795
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:eb08933ce857d85f59ea0fa7a5be67da80f56eb208a4e9952df0fba13abb0896
3
+ size 34415