giansimone commited on
Commit
5b07a48
·
verified ·
1 Parent(s): e9ee4d5

Upload folder using huggingface_hub

Browse files
Files changed (6) hide show
  1. .gitattributes +1 -0
  2. README.md +63 -0
  3. config.json +1 -0
  4. model.pt +3 -0
  5. replay.mp4 +3 -0
  6. results.json +1 -0
.gitattributes CHANGED
@@ -33,3 +33,4 @@ saved_model/**/* filter=lfs diff=lfs merge=lfs -text
33
  *.zip filter=lfs diff=lfs merge=lfs -text
34
  *.zst filter=lfs diff=lfs merge=lfs -text
35
  *tfevents* filter=lfs diff=lfs merge=lfs -text
 
 
33
  *.zip filter=lfs diff=lfs merge=lfs -text
34
  *.zst filter=lfs diff=lfs merge=lfs -text
35
  *tfevents* filter=lfs diff=lfs merge=lfs -text
36
+ replay.mp4 filter=lfs diff=lfs merge=lfs -text
README.md ADDED
@@ -0,0 +1,63 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ ---
2
+ tags:
3
+ - ALE/SpaceInvaders-v5
4
+ - reinforcement-learning
5
+ - dqn
6
+ - atari
7
+ - gymnasium
8
+ - pytorch
9
+ model-index:
10
+ - name: DQN-ALE-SpaceInvaders
11
+ results:
12
+ - task:
13
+ type: reinforcement-learning
14
+ name: reinforcement-learning
15
+ dataset:
16
+ name: ALE/SpaceInvaders-v5
17
+ type: ALE/SpaceInvaders-v5
18
+ metrics:
19
+ - type: mean_reward
20
+ value: 528.25 +/- 111.13
21
+ name: mean_reward
22
+ verified: false
23
+ ---
24
+
25
+ # Deep Q-Network (DQN) Agent playing ALE/SpaceInvaders-v5
26
+
27
+ This is a trained Deep Q-Network (DQN) agent for the Atari game ALE/SpaceInvaders-v5.
28
+
29
+ The model was trained using the code available [here](https://github.com/giansimone/dqn-ale-spaceinvaders/).
30
+
31
+ ## Usage
32
+ To load and use this model for inference:
33
+
34
+ ```python
35
+ import torch
36
+ import json
37
+
38
+ from model import DQN
39
+ from agent import Agent
40
+ from environment import make_env, get_env_dims
41
+
42
+ #Load the configuration
43
+ with open("config.json", "r") as f:
44
+ config = json.load(f)
45
+
46
+ # Create environment. Get action and space dimensions
47
+ env = make_env(config)
48
+ state_size, action_size = get_env_dims(env)
49
+
50
+ # Instantiate the agent and load the trained policy network
51
+ agent = Agent(state_size, action_size, config)
52
+ agent.policy_net.load_state_dict(torch.load("model.pt"))
53
+ agent.policy_net.eval()
54
+
55
+ # Enjoy the agent!
56
+ state, _ = env.reset()
57
+ done = False
58
+ while not done:
59
+ action = agent.act(state, epsilon=0.0) # Act greedily
60
+ state, reward, terminated, truncated, _ = env.step(action)
61
+ done = terminated or truncated
62
+ env.render()
63
+ ```
config.json ADDED
@@ -0,0 +1 @@
 
 
1
+ {"env_id": "ALE/SpaceInvaders-v5", "frame_skip": 1, "frame_stack": 4, "resized_frame": 84, "training_steps": 10000000, "n_eval_episodes": 20, "epsilon_start": 1.0, "epsilon_end": 0.1, "anneal_steps": 1000000, "buffer_size": 100000, "batch_size": 32, "gamma": 0.99, "lr": 0.00025, "update_every": 4, "target_update_every": 10000, "max_len_window": 100, "eval_every": 50, "log_dir": "runs/", "double_dqn": false, "dueling": false, "clip_rewards": true, "seed": 42}
model.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5b600efd52c7b3293370043a2c993b93f87aba3342e16936e225c66cd71f4dd9
3
+ size 6752421
replay.mp4 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:93641bbaf37f345cf911d2460101fa6c4dc6f62c59affe708e307b8ff97d24d2
3
+ size 524222
results.json ADDED
@@ -0,0 +1 @@
 
 
1
+ {"env_id": "ALE/SpaceInvaders-v5", "mean_reward": 528.25, "n_eval_episodes": 20, "eval_datetime": "2025-10-22T17:42:37.136035"}