jfelgate committed on
Commit
10ff922
·
1 Parent(s): dae810a

Initial commit

Browse files
README.md CHANGED
@@ -16,7 +16,7 @@ model-index:
16
  type: SpaceInvadersNoFrameskip-v4
17
  metrics:
18
  - type: mean_reward
19
- value: 191.50 +/- 74.87
20
  name: mean_reward
21
  verified: false
22
  ---
@@ -62,21 +62,20 @@ python -m rl_zoo3.push_to_hub --algo dqn --env SpaceInvadersNoFrameskip-v4 -f lo
62
 
63
  ## Hyperparameters
64
  ```python
65
- OrderedDict([('batch_size', 32),
66
- ('buffer_size', 100000),
67
  ('env_wrapper',
68
  ['stable_baselines3.common.atari_wrappers.AtariWrapper']),
69
  ('exploration_final_eps', 0.1),
70
- ('exploration_fraction', 1),
71
- ('frame_stack', 4),
72
  ('gamma', 0.99),
73
- ('gradient_steps', 1),
74
- ('learning_rate', 0.00025),
75
- ('learning_starts', 10000),
76
- ('n_timesteps', 10000000.0),
77
- ('optimize_memory_usage', False),
78
- ('policy', 'CnnPolicy'),
79
- ('target_update_interval', 10000),
80
  ('train_freq', 4),
81
  ('normalize', False)])
82
  ```
 
16
  type: SpaceInvadersNoFrameskip-v4
17
  metrics:
18
  - type: mean_reward
19
+ value: 113.00 +/- 46.59
20
  name: mean_reward
21
  verified: false
22
  ---
 
62
 
63
  ## Hyperparameters
64
  ```python
65
+ OrderedDict([('batch_size', 128),
66
+ ('buffer_size', 50000),
67
  ('env_wrapper',
68
  ['stable_baselines3.common.atari_wrappers.AtariWrapper']),
69
  ('exploration_final_eps', 0.1),
70
+ ('exploration_fraction', 0.12),
 
71
  ('gamma', 0.99),
72
+ ('gradient_steps', -1),
73
+ ('learning_rate', 0.00063),
74
+ ('learning_starts', 0),
75
+ ('n_timesteps', 100000.0),
76
+ ('policy', 'MlpPolicy'),
77
+ ('policy_kwargs', 'dict(net_arch=[256, 256])'),
78
+ ('target_update_interval', 250),
79
  ('train_freq', 4),
80
  ('normalize', False)])
81
  ```
args.yml CHANGED
@@ -54,7 +54,7 @@
54
  - - save_replay_buffer
55
  - false
56
  - - seed
57
- - 125510940
58
  - - storage
59
  - null
60
  - - study_name
 
54
  - - save_replay_buffer
55
  - false
56
  - - seed
57
+ - 226175671
58
  - - storage
59
  - null
60
  - - study_name
config.yml CHANGED
@@ -1,31 +1,29 @@
1
  !!python/object/apply:collections.OrderedDict
2
  - - - batch_size
3
- - 32
4
  - - buffer_size
5
- - 100000
6
  - - env_wrapper
7
  - - stable_baselines3.common.atari_wrappers.AtariWrapper
8
  - - exploration_final_eps
9
  - 0.1
10
  - - exploration_fraction
11
- - 1
12
- - - frame_stack
13
- - 4
14
  - - gamma
15
  - 0.99
16
  - - gradient_steps
17
- - 1
18
  - - learning_rate
19
- - 0.00025
20
  - - learning_starts
21
- - 10000
22
  - - n_timesteps
23
- - 10000000.0
24
- - - optimize_memory_usage
25
- - false
26
  - - policy
27
- - CnnPolicy
 
 
28
  - - target_update_interval
29
- - 10000
30
  - - train_freq
31
  - 4
 
1
  !!python/object/apply:collections.OrderedDict
2
  - - - batch_size
3
+ - 128
4
  - - buffer_size
5
+ - 50000
6
  - - env_wrapper
7
  - - stable_baselines3.common.atari_wrappers.AtariWrapper
8
  - - exploration_final_eps
9
  - 0.1
10
  - - exploration_fraction
11
+ - 0.12
 
 
12
  - - gamma
13
  - 0.99
14
  - - gradient_steps
15
+ - -1
16
  - - learning_rate
17
+ - 0.00063
18
  - - learning_starts
19
+ - 0
20
  - - n_timesteps
21
+ - 100000.0
 
 
22
  - - policy
23
+ - MlpPolicy
24
+ - - policy_kwargs
25
+ - dict(net_arch=[256, 256])
26
  - - target_update_interval
27
+ - 250
28
  - - train_freq
29
  - 4
dqn-SpaceInvadersNoFrameskip-v4.zip CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:fbfbd0560c768ff659e1f45d4fea44967c2b860cad079c6bdd61345b580c3f39
3
- size 27219543
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ee1c4148b97a8844ec9b42e540a7e2c982f860e0da6bb3af90559e8094bf0a0d
3
+ size 30057641
dqn-SpaceInvadersNoFrameskip-v4/_stable_baselines3_version CHANGED
@@ -1 +1 @@
1
- 2.2.0a8
 
1
+ 2.2.0a9
dqn-SpaceInvadersNoFrameskip-v4/data CHANGED
The diff for this file is too large to render. See raw diff
 
dqn-SpaceInvadersNoFrameskip-v4/policy.optimizer.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:65d44e628b34c4dbf615cd3837e8c82b900a4de1286dedc4a9c3993cf46bae12
3
- size 13505852
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d5ef147093360095b6e2df012a5142d73afb394b89279f0cd1c3eb604d03b4dd
3
+ size 14996640
dqn-SpaceInvadersNoFrameskip-v4/policy.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:47c58793ca377bcb93b07a6cab7fe98012ffbe8cff718f718277b594e052be6e
3
- size 13505178
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ebac17fa66dabb65fd91207960dac03d9234fac13ff1cd3fc139fdc3a0aafdf2
3
+ size 14995762
dqn-SpaceInvadersNoFrameskip-v4/system_info.txt CHANGED
@@ -1,6 +1,6 @@
1
  - OS: Linux-5.15.120+-x86_64-with-glibc2.35 # 1 SMP Wed Aug 30 11:19:59 UTC 2023
2
  - Python: 3.10.12
3
- - Stable-Baselines3: 2.2.0a8
4
  - PyTorch: 2.1.0+cu118
5
  - GPU Enabled: False
6
  - Numpy: 1.23.5
 
1
  - OS: Linux-5.15.120+-x86_64-with-glibc2.35 # 1 SMP Wed Aug 30 11:19:59 UTC 2023
2
  - Python: 3.10.12
3
+ - Stable-Baselines3: 2.2.0a9
4
  - PyTorch: 2.1.0+cu118
5
  - GPU Enabled: False
6
  - Numpy: 1.23.5
replay.mp4 CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:41acc1f1ad783e994942eca11fbc921a10de14675e412dbc1167580a2740bc0a
3
- size 273434
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:25d8d1c6f1271a484d5bf42a9b51aa5ee826f8117566c9da2d8ec04205fa2cb4
3
+ size 270829
results.json CHANGED
@@ -1 +1 @@
1
- {"mean_reward": 191.5, "std_reward": 74.8682175559162, "is_deterministic": false, "n_eval_episodes": 10, "eval_datetime": "2023-10-27T00:22:52.139923"}
 
1
+ {"mean_reward": 113.0, "std_reward": 46.593991028886975, "is_deterministic": false, "n_eval_episodes": 10, "eval_datetime": "2023-10-27T20:28:41.102187"}
train_eval_metrics.zip CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:d543838815a0e5b184008577e9882815cbe08b6bbe32b52c38918beda1295d69
3
- size 40932
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b56cabe9d758f0493d68e97d2854d2ed9a78df318b0c8545b8917dc1ff4215c9
3
+ size 5651