khaled5321 committed on
Commit
897807b
·
1 Parent(s): 2487d06

Initial commit

Browse files
README.md CHANGED
@@ -16,7 +16,7 @@ model-index:
16
  type: SpaceInvadersNoFrameskip-v4
17
  metrics:
18
  - type: mean_reward
19
- value: 544.00 +/- 108.42
20
  name: mean_reward
21
  verified: false
22
  ---
@@ -67,7 +67,7 @@ OrderedDict([('batch_size', 32),
67
  ('gradient_steps', 1),
68
  ('learning_rate', 0.0001),
69
  ('learning_starts', 100000),
70
- ('n_timesteps', 2000000.0),
71
  ('optimize_memory_usage', False),
72
  ('policy', 'CnnPolicy'),
73
  ('target_update_interval', 1000),
 
16
  type: SpaceInvadersNoFrameskip-v4
17
  metrics:
18
  - type: mean_reward
19
+ value: 572.50 +/- 81.83
20
  name: mean_reward
21
  verified: false
22
  ---
 
67
  ('gradient_steps', 1),
68
  ('learning_rate', 0.0001),
69
  ('learning_starts', 100000),
70
+ ('n_timesteps', 5000000.0),
71
  ('optimize_memory_usage', False),
72
  ('policy', 'CnnPolicy'),
73
  ('target_update_interval', 1000),
args.yml CHANGED
@@ -18,7 +18,7 @@
18
  - - hyperparams
19
  - null
20
  - - log_folder
21
- - logs/
22
  - - log_interval
23
  - -1
24
  - - max_total_trials
@@ -32,7 +32,7 @@
32
  - - n_startup_trials
33
  - 10
34
  - - n_timesteps
35
- - -1
36
  - - n_trials
37
  - 500
38
  - - no_optim_plots
@@ -44,7 +44,7 @@
44
  - - optimize_hyperparameters
45
  - false
46
  - - progress
47
- - true
48
  - - pruner
49
  - median
50
  - - sampler
@@ -54,7 +54,7 @@
54
  - - save_replay_buffer
55
  - false
56
  - - seed
57
- - 2839956984
58
  - - storage
59
  - null
60
  - - study_name
@@ -64,7 +64,7 @@
64
  - - track
65
  - false
66
  - - trained_agent
67
- - ''
68
  - - truncate_last_trajectory
69
  - true
70
  - - uuid
 
18
  - - hyperparams
19
  - null
20
  - - log_folder
21
+ - logs
22
  - - log_interval
23
  - -1
24
  - - max_total_trials
 
32
  - - n_startup_trials
33
  - 10
34
  - - n_timesteps
35
+ - 5000
36
  - - n_trials
37
  - 500
38
  - - no_optim_plots
 
44
  - - optimize_hyperparameters
45
  - false
46
  - - progress
47
+ - false
48
  - - pruner
49
  - median
50
  - - sampler
 
54
  - - save_replay_buffer
55
  - false
56
  - - seed
57
+ - 2673070937
58
  - - storage
59
  - null
60
  - - study_name
 
64
  - - track
65
  - false
66
  - - trained_agent
67
+ - rl_trained/dqn/SpaceInvadersNoFrameskip-v4_1/SpaceInvadersNoFrameskip-v4.zip
68
  - - truncate_last_trajectory
69
  - true
70
  - - uuid
config.yml CHANGED
@@ -18,7 +18,7 @@
18
  - - learning_starts
19
  - 100000
20
  - - n_timesteps
21
- - 2000000.0
22
  - - optimize_memory_usage
23
  - false
24
  - - policy
 
18
  - - learning_starts
19
  - 100000
20
  - - n_timesteps
21
+ - 5000000.0
22
  - - optimize_memory_usage
23
  - false
24
  - - policy
dqn-SpaceInvadersNoFrameskip-v4.zip CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:9f96ff3cb6461c7153b26aeb8d143c62ca6244b16ac78eab4c3f45cf54d541c0
3
- size 27224794
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b88b0e0b8b8121d67bf145fc10f15cd42e0cbaaa85be1a4be8d4ca02605c2b4a
3
+ size 27221388
dqn-SpaceInvadersNoFrameskip-v4/data CHANGED
The diff for this file is too large to render. See raw diff
 
dqn-SpaceInvadersNoFrameskip-v4/policy.optimizer.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:5d8e8e26742a7917de7e166e6048ad3cd97593bdd65be71699816e0bc8b9a61f
3
  size 13505739
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ea0100e5071db36b7eac131161705fb63cfd1e4d93ec87947f7166bd4ebc268c
3
  size 13505739
dqn-SpaceInvadersNoFrameskip-v4/policy.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:aad9edb91d62bf8f6d37dddaaae2011ab55fe96b41fdfa79e3d04cfcbf7482b5
3
  size 13504937
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:6f5a03fed7a610a091e2f7e7918e2ddf9304aa536bea1aa3b20dbc2cb8d9c3a2
3
  size 13504937
replay.mp4 CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:f0cb502beeae5819dc644e8d27f82b87392f9cbda5b8cf6b13e8499f4efbef3f
3
- size 208520
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:060c77efbc48f4cc190f824f193cd3d3f0938e5ec30a004d06d86a6fb52e9756
3
+ size 203440
results.json CHANGED
@@ -1 +1 @@
1
- {"mean_reward": 544.0, "std_reward": 108.41586599755591, "is_deterministic": false, "n_eval_episodes": 10, "eval_datetime": "2022-12-29T13:38:13.221363"}
 
1
+ {"mean_reward": 572.5, "std_reward": 81.83061774177193, "is_deterministic": false, "n_eval_episodes": 10, "eval_datetime": "2022-12-31T10:15:25.456318"}
train_eval_metrics.zip CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:d8a6ee093af08b4958d164a224a1890855cf5cf7b6aad1ed0ee790d92148f67f
3
- size 63085
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:64393816b7a9f0f72ff670cecd3c9c3dd656d55087ebd4da91edd3c407a9bcf7
3
+ size 417