winkin119 committed on
Commit
86065f5
·
verified ·
1 Parent(s): 8090332

upload via upload_folder 2025-07-27T10:15:35.880859+00:00

Browse files
.gitattributes CHANGED
@@ -33,3 +33,4 @@ saved_model/**/* filter=lfs diff=lfs merge=lfs -text
33
  *.zip filter=lfs diff=lfs merge=lfs -text
34
  *.zst filter=lfs diff=lfs merge=lfs -text
35
  *tfevents* filter=lfs diff=lfs merge=lfs -text
 
 
33
  *.zip filter=lfs diff=lfs merge=lfs -text
34
  *.zst filter=lfs diff=lfs merge=lfs -text
35
  *tfevents* filter=lfs diff=lfs merge=lfs -text
36
+ replay.mp4 filter=lfs diff=lfs merge=lfs -text
README.md ADDED
@@ -0,0 +1,34 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ ---
2
+ env_name: Walker2d-v5
3
+ tags:
4
+ - Walker2d-v5
5
+ - sac
6
+ - reinforcement-learning
7
+ - custom-implementation
8
+ - Walker2d
9
+ model-index:
10
+ - name: SAC-Walker2dV5
11
+ results:
12
+ - task:
13
+ type: reinforcement-learning
14
+ name: reinforcement-learning
15
+ dataset:
16
+ name: Walker2d-v5
17
+ type: Walker2d-v5
18
+ metrics:
19
+ - type: mean_reward
20
+ value: 4150.91 +/- 823.47
21
+ name: mean_reward
22
+ verified: false
23
+ ---
24
+
25
+ # **SAC** Agent playing **Walker2d-v5**
26
+ This is a trained model of a **SAC** agent playing **Walker2d-v5**.
27
+
28
+ ## Usage
29
+
30
+ model = load_from_hub(repo_id="winkin119/SAC-Walker2dV5", filename="sac_walker.pth")
31
+
32
+
33
+ env = gym.make("Walker2d-v5")
34
+ ...
eval_result.json ADDED
@@ -0,0 +1,6 @@
 
 
 
 
 
 
 
1
+ {
2
+ "mean_reward": 4150.910494947614,
3
+ "std_reward": 823.4738749463849,
4
+ "datetime": "2025-07-26T21:01:59.365966+00:00",
5
+ "train_duration_min": "54.76"
6
+ }
params.json ADDED
@@ -0,0 +1,42 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "env_config": {
3
+ "env_id": "Walker2d-v5",
4
+ "env_kwargs": {},
5
+ "max_steps": null,
6
+ "use_image": false,
7
+ "vector_env_num": 6,
8
+ "use_multi_processing": true,
9
+ "image_shape": null,
10
+ "frame_stack": 1,
11
+ "frame_skip": 1,
12
+ "training_render_mode": null
13
+ },
14
+ "device": "cpu",
15
+ "learning_rate": 0.0003,
16
+ "gamma": 0.995,
17
+ "checkpoint_pathname": "",
18
+ "max_grad_norm": 0.5,
19
+ "log_interval": 100,
20
+ "eval_episodes": 50,
21
+ "eval_random_seed": 42,
22
+ "eval_video_num": 10,
23
+ "total_steps": 1200000,
24
+ "hidden_sizes": [
25
+ 256,
26
+ 256,
27
+ 256
28
+ ],
29
+ "use_layer_norm": true,
30
+ "critic_lr": 0.0003,
31
+ "replay_buffer_capacity": 960000,
32
+ "batch_size": 256,
33
+ "update_start_step": 10000,
34
+ "alpha": 0.2,
35
+ "auto_tune_alpha": true,
36
+ "alpha_lr": 0.0003,
37
+ "target_entropy": -6.0,
38
+ "tau": 0.005,
39
+ "max_action": 1.0,
40
+ "log_std_min": -20,
41
+ "log_std_max": 2
42
+ }
replay.mp4 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:7626e2ced6ddc0bb19c00948ac2594a044556cc3168b3f22aceb53bf190fc653
3
+ size 1238845
sac_walker.pth ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:35b4ec498e9814cf6a03cbf35b91030e1c2dc6c11a0e2399f050d7fe5b4a46d4
3
+ size 570421
tensorboard/events.out.tfevents.1753560365.winkindeMacBook-Air.local.4586.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:84204083aaf1dba6bcd4250304ba735ecdf32edd209bbd220b41b66bc6fc051c
3
+ size 1622991