cyeet commited on
Commit
aaf1e14
·
1 Parent(s): cbb8603

Initial commit

Browse files
README.md CHANGED
@@ -16,7 +16,7 @@ model-index:
16
  type: SpaceInvadersNoFrameskip-v4
17
  metrics:
18
  - type: mean_reward
19
- value: 721.00 +/- 279.52
20
  name: mean_reward
21
  verified: false
22
  ---
@@ -62,12 +62,12 @@ OrderedDict([('batch_size', 32),
62
  ('env_wrapper',
63
  ['stable_baselines3.common.atari_wrappers.AtariWrapper']),
64
  ('exploration_final_eps', 0.01),
65
- ('exploration_fraction', 0.025),
66
  ('frame_stack', 4),
67
  ('gradient_steps', 1),
68
  ('learning_rate', 5e-05),
69
  ('learning_starts', 10000),
70
- ('n_timesteps', 50000),
71
  ('optimize_memory_usage', False),
72
  ('policy', 'CnnPolicy'),
73
  ('target_update_interval', 1000),
 
16
  type: SpaceInvadersNoFrameskip-v4
17
  metrics:
18
  - type: mean_reward
19
+ value: 606.00 +/- 173.94
20
  name: mean_reward
21
  verified: false
22
  ---
 
62
  ('env_wrapper',
63
  ['stable_baselines3.common.atari_wrappers.AtariWrapper']),
64
  ('exploration_final_eps', 0.01),
65
+ ('exploration_fraction', 0.1),
66
  ('frame_stack', 4),
67
  ('gradient_steps', 1),
68
  ('learning_rate', 5e-05),
69
  ('learning_starts', 10000),
70
+ ('n_timesteps', 100000),
71
  ('optimize_memory_usage', False),
72
  ('policy', 'CnnPolicy'),
73
  ('target_update_interval', 1000),
args.yml CHANGED
@@ -17,10 +17,9 @@
17
  - []
18
  - - hyperparams
19
  - buffer_size: 10000
20
- exploration_fraction: 0.025
21
  learning_rate: 5.0e-05
22
  learning_starts: 10000
23
- n_timesteps: 50000
24
  - - log_folder
25
  - logs/
26
  - - log_interval
@@ -58,7 +57,7 @@
58
  - - save_replay_buffer
59
  - false
60
  - - seed
61
- - 763537670
62
  - - storage
63
  - null
64
  - - study_name
@@ -68,7 +67,7 @@
68
  - - track
69
  - false
70
  - - trained_agent
71
- - logs/dqn/SpaceInvadersNoFrameskip-v4_3/SpaceInvadersNoFrameskip-v4.zip
72
  - - truncate_last_trajectory
73
  - true
74
  - - uuid
 
17
  - []
18
  - - hyperparams
19
  - buffer_size: 10000
 
20
  learning_rate: 5.0e-05
21
  learning_starts: 10000
22
+ n_timesteps: 100000
23
  - - log_folder
24
  - logs/
25
  - - log_interval
 
57
  - - save_replay_buffer
58
  - false
59
  - - seed
60
+ - 618051608
61
  - - storage
62
  - null
63
  - - study_name
 
67
  - - track
68
  - false
69
  - - trained_agent
70
+ - logs/dqn/SpaceInvadersNoFrameskip-v4_1/SpaceInvadersNoFrameskip-v4.zip
71
  - - truncate_last_trajectory
72
  - true
73
  - - uuid
config.yml CHANGED
@@ -8,7 +8,7 @@
8
  - - exploration_final_eps
9
  - 0.01
10
  - - exploration_fraction
11
- - 0.025
12
  - - frame_stack
13
  - 4
14
  - - gradient_steps
@@ -18,7 +18,7 @@
18
  - - learning_starts
19
  - 10000
20
  - - n_timesteps
21
- - 50000
22
  - - optimize_memory_usage
23
  - false
24
  - - policy
 
8
  - - exploration_final_eps
9
  - 0.01
10
  - - exploration_fraction
11
+ - 0.1
12
  - - frame_stack
13
  - 4
14
  - - gradient_steps
 
18
  - - learning_starts
19
  - 10000
20
  - - n_timesteps
21
+ - 100000
22
  - - optimize_memory_usage
23
  - false
24
  - - policy
dqn-SpaceInvadersNoFrameskip-v4.zip CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:ba1c4dd88eff51ad7cd05961c011204fc47bf12cfd237e2a5099e15f292d6798
3
- size 27223010
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5f6fedb48663a92f1201abec12d987cd52b305560c2c444ee02b789a99c70ed4
3
+ size 27224805
dqn-SpaceInvadersNoFrameskip-v4/_stable_baselines3_version CHANGED
@@ -1 +1 @@
1
- 1.7.0a10
 
1
+ 1.7.0a11
dqn-SpaceInvadersNoFrameskip-v4/data CHANGED
The diff for this file is too large to render. See raw diff
 
dqn-SpaceInvadersNoFrameskip-v4/policy.optimizer.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:e1ce68de8cc18c45ea333f2a62e483e61bce35c87e877d6005a1d532f92f7131
3
  size 13505739
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:89952653d9b716cd0e2198427e0c2437a090f54014f4e4f3600dc44eded7806b
3
  size 13505739
dqn-SpaceInvadersNoFrameskip-v4/policy.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:e1bc0f66c6fe26752c24113184c52d4af24b4b5e2b36cb4b43c4aff03a510734
3
  size 13504937
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:4bc0712228020c5de3d5b5cd1ab6483abb419dfdcbe97581452ec8ac30ee4ee6
3
  size 13504937
dqn-SpaceInvadersNoFrameskip-v4/system_info.txt CHANGED
@@ -1,7 +1,7 @@
1
- OS: Linux-5.10.133+-x86_64-with-glibc2.27 #1 SMP Fri Aug 26 08:44:51 UTC 2022
2
- Python: 3.8.16
3
- Stable-Baselines3: 1.7.0a10
4
- PyTorch: 1.13.0+cu116
5
- GPU Enabled: True
6
- Numpy: 1.21.6
7
- Gym: 0.21.0
 
1
+ - OS: Linux-5.10.133+-x86_64-with-glibc2.27 # 1 SMP Fri Aug 26 08:44:51 UTC 2022
2
+ - Python: 3.8.16
3
+ - Stable-Baselines3: 1.7.0a11
4
+ - PyTorch: 1.13.0+cu116
5
+ - GPU Enabled: True
6
+ - Numpy: 1.21.6
7
+ - Gym: 0.21.0
replay.mp4 CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:01b3dcbe0dd6c07e2bb5417ef12ab82309d4b6d090cdacb180022c09a4a2e866
3
- size 204442
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:364707a91a214ec6b53baa185e3fb254b537cebdb8d78a2c92902e92a0f7fb48
3
+ size 210882
results.json CHANGED
@@ -1 +1 @@
1
- {"mean_reward": 721.0, "std_reward": 279.5156525134147, "is_deterministic": false, "n_eval_episodes": 10, "eval_datetime": "2023-01-02T09:49:10.015614"}
 
1
+ {"mean_reward": 606.0, "std_reward": 173.93677012063895, "is_deterministic": false, "n_eval_episodes": 10, "eval_datetime": "2023-01-02T16:11:31.288097"}
train_eval_metrics.zip CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:82799ebe989320f9ed2746b2a2358ce89972b5fdbe872dc62d7155b2722b4eff
3
- size 2511
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f9541176513617ac8b6630003c0b779ed1b7fb43f5378c27025750fe4f895fe7
3
+ size 3838