Malgesw committed on
Commit
b565ea0
·
verified ·
1 Parent(s): d746598

Initial commit

Browse files
README.md CHANGED
@@ -16,7 +16,7 @@ model-index:
16
  type: SpaceInvadersNoFrameskip-v4
17
  metrics:
18
  - type: mean_reward
19
- value: 244.00 +/- 135.66
20
  name: mean_reward
21
  verified: false
22
  ---
@@ -63,22 +63,22 @@ python -m rl_zoo3.push_to_hub --algo dqn --env SpaceInvadersNoFrameskip-v4 -f lo
63
 
64
  ## Hyperparameters
65
  ```python
66
- OrderedDict([('batch_size', 64),
67
- ('buffer_size', 200000),
68
  ('env_wrapper',
69
  ['stable_baselines3.common.atari_wrappers.AtariWrapper']),
70
- ('exploration_final_eps', 0.0944),
71
- ('exploration_fraction', 0.137),
72
- ('exploration_initial_eps', 0.749),
73
  ('frame_stack', 4),
74
- ('gamma', 0.969),
75
  ('gradient_steps', 1),
76
- ('learning_rate', 4.53e-06),
77
- ('learning_starts', 100),
78
  ('n_timesteps', 1000000.0),
79
  ('optimize_memory_usage', False),
80
  ('policy', 'CnnPolicy'),
81
- ('target_update_interval', 11000),
82
  ('train_freq', 4),
83
  ('normalize', False)])
84
  ```
 
16
  type: SpaceInvadersNoFrameskip-v4
17
  metrics:
18
  - type: mean_reward
19
+ value: 373.00 +/- 91.14
20
  name: mean_reward
21
  verified: false
22
  ---
 
63
 
64
  ## Hyperparameters
65
  ```python
66
+ OrderedDict([('batch_size', 16),
67
+ ('buffer_size', 100000),
68
  ('env_wrapper',
69
  ['stable_baselines3.common.atari_wrappers.AtariWrapper']),
70
+ ('exploration_final_eps', 0.0316),
71
+ ('exploration_fraction', 0.159),
72
+ ('exploration_initial_eps', 0.85),
73
  ('frame_stack', 4),
74
+ ('gamma', 0.914),
75
  ('gradient_steps', 1),
76
+ ('learning_rate', 1.95e-06),
77
+ ('learning_starts', 1000),
78
  ('n_timesteps', 1000000.0),
79
  ('optimize_memory_usage', False),
80
  ('policy', 'CnnPolicy'),
81
+ ('target_update_interval', 8000),
82
  ('train_freq', 4),
83
  ('normalize', False)])
84
  ```
args.yml CHANGED
@@ -56,7 +56,7 @@
56
  - - save_replay_buffer
57
  - false
58
  - - seed
59
- - 3722634297
60
  - - storage
61
  - null
62
  - - study_name
 
56
  - - save_replay_buffer
57
  - false
58
  - - seed
59
+ - 2600369761
60
  - - storage
61
  - null
62
  - - study_name
config.yml CHANGED
@@ -1,26 +1,26 @@
1
  !!python/object/apply:collections.OrderedDict
2
  - - - batch_size
3
- - 64
4
  - - buffer_size
5
- - 200000
6
  - - env_wrapper
7
  - - stable_baselines3.common.atari_wrappers.AtariWrapper
8
  - - exploration_final_eps
9
- - 0.0944
10
  - - exploration_fraction
11
- - 0.137
12
  - - exploration_initial_eps
13
- - 0.749
14
  - - frame_stack
15
  - 4
16
  - - gamma
17
- - 0.969
18
  - - gradient_steps
19
  - 1
20
  - - learning_rate
21
- - 4.53e-06
22
  - - learning_starts
23
- - 100
24
  - - n_timesteps
25
  - 1000000.0
26
  - - optimize_memory_usage
@@ -28,6 +28,6 @@
28
  - - policy
29
  - CnnPolicy
30
  - - target_update_interval
31
- - 11000
32
  - - train_freq
33
  - 4
 
1
  !!python/object/apply:collections.OrderedDict
2
  - - - batch_size
3
+ - 16
4
  - - buffer_size
5
+ - 100000
6
  - - env_wrapper
7
  - - stable_baselines3.common.atari_wrappers.AtariWrapper
8
  - - exploration_final_eps
9
+ - 0.0316
10
  - - exploration_fraction
11
+ - 0.159
12
  - - exploration_initial_eps
13
+ - 0.85
14
  - - frame_stack
15
  - 4
16
  - - gamma
17
+ - 0.914
18
  - - gradient_steps
19
  - 1
20
  - - learning_rate
21
+ - 1.95e-06
22
  - - learning_starts
23
+ - 1000
24
  - - n_timesteps
25
  - 1000000.0
26
  - - optimize_memory_usage
 
28
  - - policy
29
  - CnnPolicy
30
  - - target_update_interval
31
+ - 8000
32
  - - train_freq
33
  - 4
dqn-SpaceInvadersNoFrameskip-v4.zip CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:a4bd97e1b878818ab80543560d39b07ee5e12cf134a9001ef96f63b8e0353527
3
- size 27219628
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c61c3667160b30cd1a78c93f42f2615822aa8ec543137712de86841eb4d2f8c7
3
+ size 27219626
dqn-SpaceInvadersNoFrameskip-v4/data CHANGED
The diff for this file is too large to render. See raw diff
 
dqn-SpaceInvadersNoFrameskip-v4/policy.optimizer.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:33c16f81428a1c8f1ccdd6bb89b23810dc6060372296deb2dd4c5c04fedf9dac
3
  size 13506569
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:3fc4f69dd17396b0384a06b50e71859359fae8ade75e8ed400cea4031cfdecf0
3
  size 13506569
dqn-SpaceInvadersNoFrameskip-v4/policy.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:2f7837ddb07fe00003e55b5b52f4bc465bf2338ff1eda2f90d60b66d85ab1166
3
  size 13505767
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c712be936d1364d714b27be4383f89857077d2ce7143ccc318273dd03f377cb6
3
  size 13505767
results.json CHANGED
@@ -1 +1 @@
1
- {"mean_reward": 244.0, "std_reward": 135.66134305689297, "is_deterministic": false, "n_eval_episodes": 10, "eval_datetime": "2026-01-18T15:13:47.914739"}
 
1
+ {"mean_reward": 373.0, "std_reward": 91.13725912051558, "is_deterministic": false, "n_eval_episodes": 10, "eval_datetime": "2026-01-18T18:51:29.067018"}
train_eval_metrics.zip CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:cbeecb2f9351bc7a9654efcc6a2891ebca0804107f69e2adfa4a1236f98dd6a9
3
- size 44777
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:869622cb3086aba58d119f629ea2502d855115e83c522e61a8105a038621f3f3
3
+ size 40800