charmquark committed on
Commit
00015dc
·
1 Parent(s): 1a1f76f

Initial commit

Browse files
README.md CHANGED
@@ -16,7 +16,7 @@ model-index:
16
  type: SpaceInvadersNoFrameskip-v4
17
  metrics:
18
  - type: mean_reward
19
- value: 242.00 +/- 126.59
20
  name: mean_reward
21
  verified: false
22
  ---
@@ -72,7 +72,7 @@ OrderedDict([('batch_size', 32),
72
  ('gradient_steps', 1),
73
  ('learning_rate', 0.0001),
74
  ('learning_starts', 100000),
75
- ('n_timesteps', 10000000.0),
76
  ('optimize_memory_usage', False),
77
  ('policy', 'CnnPolicy'),
78
  ('target_update_interval', 1000),
 
16
  type: SpaceInvadersNoFrameskip-v4
17
  metrics:
18
  - type: mean_reward
19
+ value: 722.00 +/- 268.96
20
  name: mean_reward
21
  verified: false
22
  ---
 
72
  ('gradient_steps', 1),
73
  ('learning_rate', 0.0001),
74
  ('learning_starts', 100000),
75
+ ('n_timesteps', 1000000.0),
76
  ('optimize_memory_usage', False),
77
  ('policy', 'CnnPolicy'),
78
  ('target_update_interval', 1000),
args.yml CHANGED
@@ -54,7 +54,7 @@
54
  - - save_replay_buffer
55
  - false
56
  - - seed
57
- - 937313208
58
  - - storage
59
  - null
60
  - - study_name
 
54
  - - save_replay_buffer
55
  - false
56
  - - seed
57
+ - 2597681427
58
  - - storage
59
  - null
60
  - - study_name
config.yml CHANGED
@@ -18,7 +18,7 @@
18
  - - learning_starts
19
  - 100000
20
  - - n_timesteps
21
- - 10000000.0
22
  - - optimize_memory_usage
23
  - false
24
  - - policy
 
18
  - - learning_starts
19
  - 100000
20
  - - n_timesteps
21
+ - 1000000.0
22
  - - optimize_memory_usage
23
  - false
24
  - - policy
dqn-SpaceInvadersNoFrameskip-v4.zip CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:55fd290bbae48419327997b77d66b13ccc5d4ac96628ec36daf39cffc404136a
3
- size 27224834
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:951f6cfbb61954b82e5762a81a49a31244332c61686937b73fd1f3bf55182e02
3
+ size 27224817
dqn-SpaceInvadersNoFrameskip-v4/data CHANGED
The diff for this file is too large to render. See raw diff
 
dqn-SpaceInvadersNoFrameskip-v4/policy.optimizer.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:9c5ce14bc0647f01a428c964db06c4ef5188c060b6b1404655e5738e02352448
3
  size 13505739
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:05fb4a4dc9bf7467e12b7852f6e82b4e518d8ceb78d1d61869b89a63c2cecad3
3
  size 13505739
dqn-SpaceInvadersNoFrameskip-v4/policy.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:8d5010b06f4f2e7467f94bf473e9d93775a38ad9ce87cfde060f2d1c7197ae5c
3
  size 13504937
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:fa5c99e383c738fed0398f2ff1ba4253d41436f9aceba486255de7e1a17c147a
3
  size 13504937
replay.mp4 CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:ca6070ebf1c9f09f595ade6ca18e1273255f39af7e78f71ac5e50afc4ca3af6c
3
- size 269096
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:3266ad6cd447d1ab4c9d75a65e38991bc419932141a47d0a89ea79ff6226b7c3
3
+ size 200639
results.json CHANGED
@@ -1 +1 @@
1
- {"mean_reward": 242.0, "std_reward": 126.59383871263246, "is_deterministic": false, "n_eval_episodes": 10, "eval_datetime": "2023-03-09T07:30:43.009581"}
 
1
+ {"mean_reward": 722.0, "std_reward": 268.96282270975667, "is_deterministic": false, "n_eval_episodes": 10, "eval_datetime": "2023-03-09T08:51:50.787127"}
train_eval_metrics.zip CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:11a226ce895237da200b31b157c1efa19cea37d357d0099ea690d00f738bd922
3
- size 20302
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a8d14a229ac8cf2ef7eb3b682c50677df31684f341e1248e223067c56c5b6ca9
3
+ size 36928