Upload PPO LunarLander-v2 LunarLander-v2_PPO_ne16_ns1024_b64_e4_cpu_TotalStep25000K.zip
Browse files- LunarLander-v2_PPO_ne16_ns1024_b64_e4_cpu_TotalStep25000K.zip +1 -1
- LunarLander-v2_PPO_ne16_ns1024_b64_e4_cpu_TotalStep25000K/data +16 -16
- LunarLander-v2_PPO_ne16_ns1024_b64_e4_cpu_TotalStep25000K/policy.optimizer.pth +1 -1
- LunarLander-v2_PPO_ne16_ns1024_b64_e4_cpu_TotalStep25000K/policy.pth +1 -1
- README.md +1 -1
- config.json +1 -1
- replay.mp4 +2 -2
- results.json +1 -1
LunarLander-v2_PPO_ne16_ns1024_b64_e4_cpu_TotalStep25000K.zip
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 147519
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:e7a8eed0c194b0fbd3ec5e5fe53a66efc2dba02128d61de81cb60c2a1e473c77
|
| 3 |
size 147519
|
LunarLander-v2_PPO_ne16_ns1024_b64_e4_cpu_TotalStep25000K/data
CHANGED
|
@@ -4,20 +4,20 @@
|
|
| 4 |
":serialized:": "gAWVOwAAAAAAAACMIXN0YWJsZV9iYXNlbGluZXMzLmNvbW1vbi5wb2xpY2llc5SMEUFjdG9yQ3JpdGljUG9saWN5lJOULg==",
|
| 5 |
"__module__": "stable_baselines3.common.policies",
|
| 6 |
"__doc__": "\n Policy class for actor-critic algorithms (has both policy and value prediction).\n Used by A2C, PPO and the likes.\n\n :param observation_space: Observation space\n :param action_space: Action space\n :param lr_schedule: Learning rate schedule (could be constant)\n :param net_arch: The specification of the policy and value networks.\n :param activation_fn: Activation function\n :param ortho_init: Whether to use or not orthogonal initialization\n :param use_sde: Whether to use State Dependent Exploration or not\n :param log_std_init: Initial value for the log standard deviation\n :param full_std: Whether to use (n_features x n_actions) parameters\n for the std instead of only (n_features,) when using gSDE\n :param use_expln: Use ``expln()`` function instead of ``exp()`` to ensure\n a positive standard deviation (cf paper). It allows to keep variance\n above zero and prevent it from growing too fast. In practice, ``exp()`` is usually enough.\n :param squash_output: Whether to squash the output using a tanh function,\n this allows to ensure boundaries when using gSDE.\n :param features_extractor_class: Features extractor to use.\n :param features_extractor_kwargs: Keyword arguments\n to pass to the features extractor.\n :param share_features_extractor: If True, the features extractor is shared between the policy and value networks.\n :param normalize_images: Whether to normalize images or not,\n dividing by 255.0 (True by default)\n :param optimizer_class: The optimizer to use,\n ``th.optim.Adam`` by default\n :param optimizer_kwargs: Additional keyword arguments,\n excluding the learning rate, to pass to the optimizer\n ",
|
| 7 |
-
"__init__": "<function ActorCriticPolicy.__init__ at
|
| 8 |
-
"_get_constructor_parameters": "<function ActorCriticPolicy._get_constructor_parameters at
|
| 9 |
-
"reset_noise": "<function ActorCriticPolicy.reset_noise at
|
| 10 |
-
"_build_mlp_extractor": "<function ActorCriticPolicy._build_mlp_extractor at
|
| 11 |
-
"_build": "<function ActorCriticPolicy._build at
|
| 12 |
-
"forward": "<function ActorCriticPolicy.forward at
|
| 13 |
-
"extract_features": "<function ActorCriticPolicy.extract_features at
|
| 14 |
-
"_get_action_dist_from_latent": "<function ActorCriticPolicy._get_action_dist_from_latent at
|
| 15 |
-
"_predict": "<function ActorCriticPolicy._predict at
|
| 16 |
-
"evaluate_actions": "<function ActorCriticPolicy.evaluate_actions at
|
| 17 |
-
"get_distribution": "<function ActorCriticPolicy.get_distribution at
|
| 18 |
-
"predict_values": "<function ActorCriticPolicy.predict_values at
|
| 19 |
"__abstractmethods__": "frozenset()",
|
| 20 |
-
"_abc_impl": "<_abc_data object at
|
| 21 |
},
|
| 22 |
"verbose": 0,
|
| 23 |
"policy_kwargs": {},
|
|
@@ -26,12 +26,12 @@
|
|
| 26 |
"_num_timesteps_at_start": 0,
|
| 27 |
"seed": null,
|
| 28 |
"action_noise": null,
|
| 29 |
-
"start_time":
|
| 30 |
"learning_rate": 0.0003,
|
| 31 |
"tensorboard_log": null,
|
| 32 |
"_last_obs": {
|
| 33 |
":type:": "<class 'numpy.ndarray'>",
|
| 34 |
-
":serialized:": "
|
| 35 |
},
|
| 36 |
"_last_episode_starts": {
|
| 37 |
":type:": "<class 'numpy.ndarray'>",
|
|
@@ -45,7 +45,7 @@
|
|
| 45 |
"_stats_window_size": 100,
|
| 46 |
"ep_info_buffer": {
|
| 47 |
":type:": "<class 'collections.deque'>",
|
| 48 |
-
":serialized:": "
|
| 49 |
},
|
| 50 |
"ep_success_buffer": {
|
| 51 |
":type:": "<class 'collections.deque'>",
|
|
|
|
| 4 |
":serialized:": "gAWVOwAAAAAAAACMIXN0YWJsZV9iYXNlbGluZXMzLmNvbW1vbi5wb2xpY2llc5SMEUFjdG9yQ3JpdGljUG9saWN5lJOULg==",
|
| 5 |
"__module__": "stable_baselines3.common.policies",
|
| 6 |
"__doc__": "\n Policy class for actor-critic algorithms (has both policy and value prediction).\n Used by A2C, PPO and the likes.\n\n :param observation_space: Observation space\n :param action_space: Action space\n :param lr_schedule: Learning rate schedule (could be constant)\n :param net_arch: The specification of the policy and value networks.\n :param activation_fn: Activation function\n :param ortho_init: Whether to use or not orthogonal initialization\n :param use_sde: Whether to use State Dependent Exploration or not\n :param log_std_init: Initial value for the log standard deviation\n :param full_std: Whether to use (n_features x n_actions) parameters\n for the std instead of only (n_features,) when using gSDE\n :param use_expln: Use ``expln()`` function instead of ``exp()`` to ensure\n a positive standard deviation (cf paper). It allows to keep variance\n above zero and prevent it from growing too fast. In practice, ``exp()`` is usually enough.\n :param squash_output: Whether to squash the output using a tanh function,\n this allows to ensure boundaries when using gSDE.\n :param features_extractor_class: Features extractor to use.\n :param features_extractor_kwargs: Keyword arguments\n to pass to the features extractor.\n :param share_features_extractor: If True, the features extractor is shared between the policy and value networks.\n :param normalize_images: Whether to normalize images or not,\n dividing by 255.0 (True by default)\n :param optimizer_class: The optimizer to use,\n ``th.optim.Adam`` by default\n :param optimizer_kwargs: Additional keyword arguments,\n excluding the learning rate, to pass to the optimizer\n ",
|
| 7 |
+
"__init__": "<function ActorCriticPolicy.__init__ at 0x7f2803f51160>",
|
| 8 |
+
"_get_constructor_parameters": "<function ActorCriticPolicy._get_constructor_parameters at 0x7f2803f511f0>",
|
| 9 |
+
"reset_noise": "<function ActorCriticPolicy.reset_noise at 0x7f2803f51280>",
|
| 10 |
+
"_build_mlp_extractor": "<function ActorCriticPolicy._build_mlp_extractor at 0x7f2803f51310>",
|
| 11 |
+
"_build": "<function ActorCriticPolicy._build at 0x7f2803f513a0>",
|
| 12 |
+
"forward": "<function ActorCriticPolicy.forward at 0x7f2803f51430>",
|
| 13 |
+
"extract_features": "<function ActorCriticPolicy.extract_features at 0x7f2803f514c0>",
|
| 14 |
+
"_get_action_dist_from_latent": "<function ActorCriticPolicy._get_action_dist_from_latent at 0x7f2803f51550>",
|
| 15 |
+
"_predict": "<function ActorCriticPolicy._predict at 0x7f2803f515e0>",
|
| 16 |
+
"evaluate_actions": "<function ActorCriticPolicy.evaluate_actions at 0x7f2803f51670>",
|
| 17 |
+
"get_distribution": "<function ActorCriticPolicy.get_distribution at 0x7f2803f51700>",
|
| 18 |
+
"predict_values": "<function ActorCriticPolicy.predict_values at 0x7f2803f51790>",
|
| 19 |
"__abstractmethods__": "frozenset()",
|
| 20 |
+
"_abc_impl": "<_abc_data object at 0x7f2803fb2d20>"
|
| 21 |
},
|
| 22 |
"verbose": 0,
|
| 23 |
"policy_kwargs": {},
|
|
|
|
| 26 |
"_num_timesteps_at_start": 0,
|
| 27 |
"seed": null,
|
| 28 |
"action_noise": null,
|
| 29 |
+
"start_time": 1744344722995548300,
|
| 30 |
"learning_rate": 0.0003,
|
| 31 |
"tensorboard_log": null,
|
| 32 |
"_last_obs": {
|
| 33 |
":type:": "<class 'numpy.ndarray'>",
|
| 34 |
+
":serialized:": "gAWVdQIAAAAAAACMEm51bXB5LmNvcmUubnVtZXJpY5SMC19mcm9tYnVmZmVylJOUKJYAAgAAAAAAAE3mer28GW09IuGQPq3m0L53oYA9gsOFPgAAAAAAAAAAgESmPRX9jT9FEVg+FuxWvwSFcD64/yQ+AAAAAAAAAABGbCg+OqmZPxdFED96lA6/uSyRPn235D4AAAAAAAAAAGaGMruqw6k/+Nj6vClHBr++JUs7dpHgOwAAAAAAAAAA5lNdPoB9oT/gP+c+rIMhv+1eHz88Upw+AAAAAAAAAABz+c89ESsFPjwXCb/Li/i+QrsBvgjQ7r4AAAAAAAAAAAAcjjtWvrM/s5tgPSZrBb4LMqG71RlJvAAAAAAAAAAAmqcLPUN5Gj07hQ6+sl3PvgGipru2C+a9AAAAAAAAAACaABs+ZRvYPiD87r0mPlO/muuLPjd3RL4AAAAAAAAAADPHJLz7G3I/Jq9Gu0n3f7+CCY67Zs+PvQAAAAAAAAAABowLvnmPZT7+IKg+f9cQv7I3K75/f4Y+AAAAAAAAAAC+3YW+e7NyP/FuBj5ACSu/rr0lvzv9eD4AAAAAAAAAAJqQSz3hgO66g897vnFFk745e1G++ShJPwAAgD8AAAAAmiEXO+Hwq7rcgCe5c2EctErPqDraGUA4AACAPwAAgD+a2eC74RSOuvhCojvV/JM8K9gnOiubgL0AAIA/AACAP2Zp4T0Mv64/tdGTPvSk9b6KHEk+VcmjPgAAAAAAAAAAlIwFbnVtcHmUjAVkdHlwZZSTlIwCZjSUiYiHlFKUKEsDjAE8lE5OTkr/////Sv////9LAHSUYksQSwiGlIwBQ5R0lFKULg=="
|
| 35 |
},
|
| 36 |
"_last_episode_starts": {
|
| 37 |
":type:": "<class 'numpy.ndarray'>",
|
|
|
|
| 45 |
"_stats_window_size": 100,
|
| 46 |
"ep_info_buffer": {
|
| 47 |
":type:": "<class 'collections.deque'>",
|
| 48 |
+
":serialized:": "gAWV4gsAAAAAAACMC2NvbGxlY3Rpb25zlIwFZGVxdWWUk5QpS2SGlFKUKH2UKIwBcpRHQHLc/lZHNHKMAWyUS6aMAXSUR0EKPC2lIuoQdX2UKGgGR0BwMCEvkBCEaAdLqWgIR0EKPC2oK2KEdX2UKGgGR0Bws1wm3OObaAdLmGgIR0EKPC31X/5tdX2UKGgGR0BypxbVz6rOaAdLrmgIR0EKPC5DgZTAdX2UKGgGR0BzFYWP91loaAdLvGgIR0EKPC6f4yoGdX2UKGgGR0BzVR5ooNNKaAdLrGgIR0EKPC8FWfbsdX2UKGgGR0By4h9/jKgaaAdLvmgIR0EKPEIV3Ux3dX2UKGgGR0BzQ9IZqEeyaAdLy2gIR0EKPENVVPvbdX2UKGgGR0BzXeoLofSyaAdLp2gIR0EKPEOwVbiZdX2UKGgGR0ByxZwn6VMVaAdLn2gIR0EKPEP5hz/7dX2UKGgGR0BxZL7IkqtpaAdLj2gIR0EKPERn4fwJdX2UKGgGR0BxAeOU+s5oaAdLl2gIR0EKPESOjASGdX2UKGgGR0ByqM7QswtbaAdLk2gIR0EKPEX60hNedX2UKGgGR0ByjO3jMmngaAdLo2gIR0EKPEaeWfK7dX2UKGgGR0ByDUNYr8R+aAdLt2gIR0EKPEdTOxB3dX2UKGgGR0BzNwRIz3yqaAdLsWgIR0EKPEeE0zj4dX2UKGgGR0BpE+XmeUY9aAdN6ANoCEdBCjxHonWrfnV9lChoBkdAcYR4ACGN72gHS6RoCEdBCjxHrM9r43V9lChoBkdAcjBaKDTScGgHS5xoCEdBCjxICBkI5nV9lChoBkdAc1j0+1SflWgHS9NoCEdBCjxICcVgyHV9lChoBkdAcqz8c+7lJmgHS79oCEdBCjxIPVoYenV9lChoBkdAc3w0CRwIdGgHS7VoCEdBCjxIeU4aP3V9lChoBkdAcrBVu76HkGgHS6NoCEdBCjxJGIInjXV9lChoBkdAcPl0qYqoZWgHS55oCEdBCjxJgB5ooXV9lChoBkdAcDGTkQwsXmgHS7FoCEdBCjxKChpQDXV9lChoBkdAcHdcgyM1j2gHS6toCEdBCjxK/jp9qnV9lChoBkdAcrAehwl0HWgHS8RoCEdBCjxMMYQ8OnV9lChoBkdAcmwlenhsImgHS39oCEdBCjxNsvCdjHV9lChoBkdAcBiTrE9+w2gHS45oCEdBCjxN0VJti3V9lChoBkdAc+xB6KLsKWgHS6doCEdBCjxNz7CSBHV9lChoBkdAc/7xXGOuJWgHS51oCEdBCjxOPXd0rHV9lChoBkdAcP/Z0Syt3mgHS41oCEdBCjxOvi97GHV9lChoBkdAcAHChvitJWgHS5NoCEdBCjxOvZ00WXV9lChoBkdAcz4N3GGVRmgHS9BoCEdBCjxPKu6mO3V9lChoBkdAcUg3AVO9FmgHS6poCEdBCjxPRF/hEXV9lChoBkdAdJoX9BKL9GgHS8poCEdBCjxQfV9WqHV9lChoBkdAcopRChN/OWgHS5RoCEdBCjxQjKgZj3V9lChoBkdAcgVPmgam42gHS7RoCEdBCjxQ1v863nV9lChoBkdAcYsSnLq2SmgHS5toCEdBCjxRn7SApnV9lChoBkdAcmRKOT7l72gHS6poCEdBCjxRvkq+anV9lChoBkdAcrvYa5wwTWgHS6hoCEdBCjxSswJw9HV9lChoBkdAcWWwK0D2amgHS5doCEdBCjxS2SOinHV9lChoBkdAcYHL9uP3jGgHS45oCEdBCjxTefXf7HV9lChoBkdAcgPP+XJHRWgHS5loCEdBCjxT8MG5c3V9lChoBkdAcUyVf/m1Y2gHS5VoCEdBCjxUIYYR/XV9lChoBkdAcESrd30PH2gHS5toCEdBCjxUEfvF33V9lChoBkdAcWvN7BwdbWgHS5FoCEdBCjxUVByCF3V9lChoBkdAcI4ZpSJj2GgHS55oCEdBCjxVF4RmLHV9lChoBkdAc/wnRb8m8mgHS6loCEdBCjxVjYsd1nV9lChoBkdAcuRJY1YQrmgHS5poCEdBCjxWKt3fRHV9lChoBkdAcmBuf29L6GgHS5loCEdBCjxWZubZvnV9lChoBkdAc+Ve5WilBWgHS89oCEdBCjxWpfjS5XV9lChoBkdAc7zSVnmJWWgHS6hoCEdBCjxWp+6RQ3V9lChoBkdAcbQTYdyT6mgHS5RoCEdBCjxXDOgQH3V9lChoBkdAcFsRGtp22WgHS7FoCEdBCjxYPL1VYXV9lChoBkdAc99yHmA9V2gHS6toCEdBCjxZLb5/LHV9lChoBkdAc+gZ26kIomgHS7FoCEdBCjxZQhfShXV9lChoBkdAcvZXxvvSdGgHS5VoCEdBCjxZkAFPi3V9lChoBkdAcg4XaJyhjGgHS6BoCEdBCjxZ5iAlOXV9lChoBkdAc1UtEofCAWgHS7hoCEdBCjxaSG8Em3V9lChoBkdAci35Ke05VGgHS7hoCEdBCjxa6aG5+nV9lChoBkdAcLORbr1M/WgHS6FoCEdBCjxbC+nIhnV9lChoBkdAcP9QvYe1bGgHS79oCEdBCjxbV+Xqq3V9lChoBkdAcZnEBbOeKGgHS6VoCEdBCjxboElme3V9lChoBkdAcuzJcPe54GgHS59oCEdBCjxb8d/8VHV9lChoBkdAccMyad+Xq2gHS5toCEdBCjxcNpPAPHV9lChoBkdAcswpCa7Va2gHS7doCEdBCjxc8zwc53V9lChoBkdAcWxAtFrmAGgHS6RoCEdBCjxc6EQGwHV9lChoBkdAcZ/IyTINmWgHS7RoCEdBCjxdCVB2OnV9lChoBkdAcRtsp5NXYGgHS4xoCEdBCjxdKM5wO3V9lChoBkdAcbyIjnmq52gHS5toCEdBCjxeXc1wYXV9lChoBkdAdAO/SpiqhmgHS7VoCEdBCjxfKeqaPXV9lChoBkdAcys4nndO7GgHS5hoCEdBCjxfOMfignV9lChoBkdAcrhd2xIJ7mgHS5RoCEdBCjxfsyrPt3V9lChoBkdAcKgDCgsbvWgHS7ZoCEdBCjxf8enyeHV9lChoBkdAc9+Ooo/iYWgHS8NoCEdBCjxgGpsGgXV9lChoBkdAcqzmmce8w2gHS5loCEdBCjxgiiwjdHV9lChoBkdAc0QwiaAnUmgHS69oCEdBCjxgvoV2zXV9lChoBkdAc21v/R3NcGgHS5toCEdBCjxhKCz1LHV9lChoBkdAcg+2/zreImgHS7doCEdBCjxhOv2XcHV9lChoBkdAcgIa6STyKGgHS4poCEdBCjxhQUSIxnV9lChoBkdAcGlt3OfNA2gHS5ZoCEdBCjxhq02LpHV9lChoBkdAcpLtozvZy2gHS7doCEdBCjxhuT1TSHV9lChoBkdAcLhcC5mRNmgHS6NoCEdBCjxiD9n9N3V9lChoBkdAcnSV/c32mGgHS6JoCEdBCjxiJ+lTFXV9lChoBkdAY9jLq2SdOWgHTegDaAhHQQo8Ys8cMmZ1fZQoaAZHQHM4JOnEVFhoB0uiaAhHQQo8Y04MnZ11fZQoaAZHQHD9DZlFtsNoB0ujaAhHQQo8Y/vjwQV1fZQoaAZHQHELCwbEP2BoB0uZaAhHQQo8ZB4L1Ep1fZQoaAZHQHEHOnMt9QZoB0uraAhHQQo8ZDYxL011fZQoaAZHQHI7sLORkmRoB0uLaAhHQQo8ZGGqxTt1fZQoaAZHQHLsurlvIfdoB0unaAhHQQo8ZLDtPYZ1fZQoaAZHQHHsFdcB2fVoB0usaAhHQQo8ZLpxFRZ1fZQoaAZHQHCXF50KZ2JoB0ufaAhHQQo8ZWWmgrZ1fZQoaAZHQHCpDpX6qKhoB0u0aAhHQQo8ZZI7Njd1fZQoaAZHQHDkKWX1J19oB0uSaAhHQQo8ZZUtqYZ1fZQoaAZHQHAu6G5+YtxoB0ujaAhHQQo8ZZsUIs11fZQoaAZHQHKv52pyZKFoB0uvaAhHQQo8ZefdRBN1fZQoaAZHQHJZn2IwdsBoB0uvaAhHQQo8Zj/echF1fZQoaAZHQHLA5YkmhM9oB0ucaAhHQQo8Zj3XZoR1ZS4="
|
| 49 |
},
|
| 50 |
"ep_success_buffer": {
|
| 51 |
":type:": "<class 'collections.deque'>",
|
LunarLander-v2_PPO_ne16_ns1024_b64_e4_cpu_TotalStep25000K/policy.optimizer.pth
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 87978
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:5085babf1acf3a01396282d221ce0408a13a8d6a0bb0e8eaa8e26c8540611984
|
| 3 |
size 87978
|
LunarLander-v2_PPO_ne16_ns1024_b64_e4_cpu_TotalStep25000K/policy.pth
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 43634
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:c40876421dea7ae94c8ca22ec4276c1aebca6e549f30b246729d31f3ff0d06b1
|
| 3 |
size 43634
|
README.md
CHANGED
|
@@ -16,7 +16,7 @@ model-index:
|
|
| 16 |
type: LunarLander-v2
|
| 17 |
metrics:
|
| 18 |
- type: mean_reward
|
| 19 |
-
value:
|
| 20 |
name: mean_reward
|
| 21 |
verified: false
|
| 22 |
---
|
|
|
|
| 16 |
type: LunarLander-v2
|
| 17 |
metrics:
|
| 18 |
- type: mean_reward
|
| 19 |
+
value: 261.75 +/- 67.92
|
| 20 |
name: mean_reward
|
| 21 |
verified: false
|
| 22 |
---
|
config.json
CHANGED
|
@@ -1 +1 @@
|
|
| 1 |
-
{"policy_class": {":type:": "<class 'abc.ABCMeta'>", ":serialized:": "gAWVOwAAAAAAAACMIXN0YWJsZV9iYXNlbGluZXMzLmNvbW1vbi5wb2xpY2llc5SMEUFjdG9yQ3JpdGljUG9saWN5lJOULg==", "__module__": "stable_baselines3.common.policies", "__doc__": "\n Policy class for actor-critic algorithms (has both policy and value prediction).\n Used by A2C, PPO and the likes.\n\n :param observation_space: Observation space\n :param action_space: Action space\n :param lr_schedule: Learning rate schedule (could be constant)\n :param net_arch: The specification of the policy and value networks.\n :param activation_fn: Activation function\n :param ortho_init: Whether to use or not orthogonal initialization\n :param use_sde: Whether to use State Dependent Exploration or not\n :param log_std_init: Initial value for the log standard deviation\n :param full_std: Whether to use (n_features x n_actions) parameters\n for the std instead of only (n_features,) when using gSDE\n :param use_expln: Use ``expln()`` function instead of ``exp()`` to ensure\n a positive standard deviation (cf paper). It allows to keep variance\n above zero and prevent it from growing too fast. In practice, ``exp()`` is usually enough.\n :param squash_output: Whether to squash the output using a tanh function,\n this allows to ensure boundaries when using gSDE.\n :param features_extractor_class: Features extractor to use.\n :param features_extractor_kwargs: Keyword arguments\n to pass to the features extractor.\n :param share_features_extractor: If True, the features extractor is shared between the policy and value networks.\n :param normalize_images: Whether to normalize images or not,\n dividing by 255.0 (True by default)\n :param optimizer_class: The optimizer to use,\n ``th.optim.Adam`` by default\n :param optimizer_kwargs: Additional keyword arguments,\n excluding the learning rate, to pass to the optimizer\n ", "__init__": "<function ActorCriticPolicy.__init__ at 0x7ff7606941f0>", "_get_constructor_parameters": "<function ActorCriticPolicy._get_constructor_parameters at 0x7ff760694280>", "reset_noise": "<function ActorCriticPolicy.reset_noise at 0x7ff760694310>", "_build_mlp_extractor": "<function ActorCriticPolicy._build_mlp_extractor at 0x7ff7606943a0>", "_build": "<function ActorCriticPolicy._build at 0x7ff760694430>", "forward": "<function ActorCriticPolicy.forward at 0x7ff7606944c0>", "extract_features": "<function ActorCriticPolicy.extract_features at 0x7ff760694550>", "_get_action_dist_from_latent": "<function ActorCriticPolicy._get_action_dist_from_latent at 0x7ff7606945e0>", "_predict": "<function ActorCriticPolicy._predict at 0x7ff760694670>", "evaluate_actions": "<function ActorCriticPolicy.evaluate_actions at 0x7ff760694700>", "get_distribution": "<function ActorCriticPolicy.get_distribution at 0x7ff760694790>", "predict_values": "<function ActorCriticPolicy.predict_values at 0x7ff760694820>", "__abstractmethods__": "frozenset()", "_abc_impl": "<_abc_data object at 0x7ff7606f3d20>"}, "verbose": 0, "policy_kwargs": {}, "num_timesteps": 26001408, "_total_timesteps": 26000000, "_num_timesteps_at_start": 0, "seed": null, "action_noise": null, "start_time": 1744342013578088700, "learning_rate": 0.0003, "tensorboard_log": null, "_last_obs": {":type:": "<class 'numpy.ndarray'>", ":serialized:": "gAWVdQIAAAAAAACMEm51bXB5LmNvcmUubnVtZXJpY5SMC19mcm9tYnVmZmVylJOUKJYAAgAAAAAAAAAUpzv2UGG62ZuLtasgkK4Iugy7SsO5NAAAgD8AAIA/89uQvQzOsj5w1FA+t2E8vxJmFb6rq3I+AAAAAAAAAAAzD0W89lRyut68WztR84S1qg8QOqibgLoAAAAAAAAAAM1w/ztsV4u7pYWGvXd6qzxn1788JoGRvQAAgD8AAIA/5ukcPVQmTD6amsy9Vvgev0XSFT2iJqq9AAAAAAAAAABmJKw9Q14VvC0J174g+Fq+jaxHvSvnYz8AAIA/AACAP5o5Irt7zpK6JT8UPC1XK7NUPVw6Er1AswAAgD8AAIA/IK8JvmYMmT/qPRW/5zUnvwJ4Rr4ckQO/AAAAAAAAAAAAWjc84eiAuvq/GbjCqBizhHFeOxqGMzcAAIA/AACAP6bJIj6KmZA/pC2MPveYOL89aOo+mo2APgAAAAAAAAAATWBWPS2NJz+G1jM915Bsv5AiJj5zDa88AAAAAAAAAAAa1UO9j259ulqWgrpETp204a3huThSmDkAAIA/AACAP+aHcj1pmHA9R7mIviyi8b5yBCA8iR8tvgAAAAAAAAAAmhHDPGk2YbzYOIK+hRlpPey/XT37Aoo7AACAPwAAgD/a+YK9snVePuPFXT4liSe/bdmNvZJxZz4AAAAAAAAAAM2Eejtcg2e6fk8qs4pBiCm3Aia6ZrfMMwAAgD8AAIA/lIwFbnVtcHmUjAVkdHlwZZSTlIwCZjSUiYiHlFKUKEsDjAE8lE5OTkr/////Sv////9LAHSUYksQSwiGlIwBQ5R0lFKULg=="}, "_last_episode_starts": {":type:": "<class 'numpy.ndarray'>", ":serialized:": "gAWVgwAAAAAAAACMEm51bXB5LmNvcmUubnVtZXJpY5SMC19mcm9tYnVmZmVylJOUKJYQAAAAAAAAAAAAAAAAAAAAAAAAAAAAAACUjAVudW1weZSMBWR0eXBllJOUjAJiMZSJiIeUUpQoSwOMAXyUTk5OSv////9K/////0sAdJRiSxCFlIwBQ5R0lFKULg=="}, "_last_original_obs": null, "_episode_num": 0, "use_sde": false, "sde_sample_freq": -1, "_current_progress_remaining": -5.415384615381491e-05, "_stats_window_size": 100, "ep_info_buffer": {":type:": "<class 'collections.deque'>", ":serialized:": "gAWV4QsAAAAAAACMC2NvbGxlY3Rpb25zlIwFZGVxdWWUk5QpS2SGlFKUKH2UKIwBcpRHQHHcR51Ng0GMAWyUS6WMAXSUR0EJxFHRRl6JdX2UKGgGR0ByTcxtYSxraAdLrWgIR0EJxFHUTL4fdX2UKGgGR0BxJbktEofCaAdLjmgIR0EJxFJtCZ4OdX2UKGgGR0By3CoUBXCCaAdLqGgIR0EJxFKojW07dX2UKGgGR0BygHwTdtVJaAdLm2gIR0EJxFMcVpK0dX2UKGgGR0BxMx4s3AEdaAdLqGgIR0EJxFNQ9aEBdX2UKGgGR0BzvVDXvphXaAdLsGgIR0EJxFOROclPdX2UKGgGR0BxzorMC9ytaAdLlWgIR0EJxFO6XjU/dX2UKGgGR0BxLT/uLJjlaAdLo2gIR0EJxGcM7lq8dX2UKGgGR0BzrTGp++dtaAdLvGgIR0EJxGcjP4VRdX2UKGgGR0B0mm7xusLfaAdLqmgIR0EJxGdUy57PdX2UKGgGR0BzbIYXO4XoaAdLomgIR0EJxGexaX8gdX2UKGgGR0B0TbVz6rNoaAdLqmgIR0EJxGhgQ6IWdX2UKGgGR0Bxqd0PpY9xaAdLjGgIR0EJxGnlFc6edX2UKGgGR0BzHtc9nscAaAdLmGgIR0EJxGpbWEsbdX2UKGgGR0B0AoKeCkGiaAdLqmgIR0EJxGrVUModdX2UKGgGR0BwTmIqLCN0aAdLl2gIR0EJxGre+VTrdX2UKGgGR0BxUh3Tuv2XaAdLtGgIR0EJxGr5FgDzdX2UKGgGR0BxTttfoicHaAdLlmgIR0EJxGtu9WZJdX2UKGgGR0ByaHUlRgqmaAdLj2gIR0EJxGvKWcBmdX2UKGgGR0BxY1WV/tpmaAdLhmgIR0EJxGwh/iHZdX2UKGgGR0B0O0IkZ75VaAdLxGgIR0EJxGyogV45dX2UKGgGR0B0EUzsQd0aaAdLuWgIR0EJxGzd92HMdX2UKGgGR0Bzn1FAmiQDaAdLtGgIR0EJxGzuZLIxdX2UKGgGR0Byc1MURFqjaAdLqmgIR0EJxG0MuWa+dX2UKGgGR0ByUG4b0e2eaAdLjmgIR0EJxG15c9nsdX2UKGgGR0BzOZzXBguzaAdLtGgIR0EJxG10wSJ1dX2UKGgGR0Bznu//NqxkaAdNTwJoCEdBCcRuYzYVZnV9lChoBkdAc9yA/LTx5WgHS8JoCEdBCcRueSntOXV9lChoBkdAchaagVXV9WgHS7RoCEdBCcRwFOVPe3V9lChoBkdAc4Zy9EkSmWgHS7loCEdBCcRwsaAFxHV9lChoBkdAcgK4jKPn0WgHS5hoCEdBCcRw6cAimnV9lChoBkdAcbiWMju8b2gHS6BoCEdBCcRw2kWRBHV9lChoBkdAczgMy8BdU2gHS7poCEdBCcRxLZvkzXV9lChoBkdAcmtdGy5ZsGgHS7VoCEdBCcRxH1xsEnV9lChoBkdAcndYnfEXL2gHS7loCEdBCcRxKVrylXV9lChoBkdAcUlv4M4LkWgHS6RoCEdBCcRxkdHUdHV9lChoBkdAcK3R51Ng0GgHS59oCEdBCcRyDArQPnV9lChoBkdAco3fZElVtGgHS6xoCEdBCcRyg00m+nV9lChoBkdAc76A1vVEu2gHS7ZoCEdBCcRylyimEXV9lChoBkdAcd8OZb6gumgHS7doCEdBCcRy/Hggo3V9lChoBkdAc8cXPZ7HAGgHS7JoCEdBCcRzOo3rEHV9lChoBkdAcsctZFG5MGgHS8BoCEdBCcRzsWykbnV9lChoBkdAcUwBX0XgtWgHS6NoCEdBCcRzsjHGTHV9lChoBkdAcqUhGYrrgWgHS75oCEdBCcR0knTiKnV9lChoBkdAcP3wVCXyAmgHS4RoCEdBCcR04jhUBHV9lChoBkdAcoGviLl3hWgHS4xoCEdBCcR1aVnmJXV9lChoBkdAclKpm29cr2gHS51oCEdBCcR1iTbFj3V9lChoBkdAb/aHJLdvbWgHS5xoCEdBCcR1tjZtenV9lChoBkdAcTv2cawUxmgHS7NoCEdBCcR1ubXpW3V9lChoBkdAcj/pS75EdGgHS5hoCEdBCcR10uez2XV9lChoBkdAcny6ij+Jg2gHS45oCEdBCcR2W/rSmnV9lChoBkdAdFFdZJTVD2gHS69oCEdBCcR23ai9I3V9lChoBkdAdBSubI91U2gHS8loCEdBCcR3NqveQHV9lChoBkdAcZ49hZyMk2gHS6NoCEdBCcR3eepXIXV9lChoBkdAcu6qy4Wk8GgHS61oCEdBCcR33V/c33V9lChoBkdAc7cLCemNzmgHS6VoCEdBCcR4AqI8AHV9lChoBkdAcSEbj94u9WgHS5NoCEdBCcR4JiLEUHV9lChoBkdAch6yqMm4RWgHS6hoCEdBCcR4UjxCpnV9lChoBkdAcxodgfEGaGgHS6loCEdBCcR4xqynk3V9lChoBkdAcYnBN21Ul2gHS6VoCEdBCcR5l4A0bnV9lChoBkdAciPGzru6VmgHS49oCEdBCcR6RwQ18HV9lChoBkdAct2fmLcbi2gHS6RoCEdBCcR6nWhAW3V9lChoBkdAc9ZQmeDnNmgHS75oCEdBCcR69FrmAHV9lChoBkdAc5bmdRR/E2gHS6toCEdBCcR7CUqx1XV9lChoBkdAcphsGPgeimgHS61oCEdBCcR7TFCLM3V9lChoBkdAc5GKwIMSb2gHS7poCEdBCcR7tuP3jHV9lChoBkdAck0t8/lhgGgHS7BoCEdBCcR8NhkRSXV9lChoBkdAcplOLR8c/GgHS5VoCEdBCcR9GWQfZHV9lChoBkdAcyWctoSL62gHS7poCEdBCcR9J8x9HHV9lChoBkdAc+DMBp5/smgHS7FoCEdBCcR9NxGUfXV9lChoBkdAce6L3K0UoWgHS6toCEdBCcR9TTQVsXV9lChoBkdActQ50KZ2IWgHS6VoCEdBCcR9fdsSCnV9lChoBkdAcn6c2BJ7LWgHS6FoCEdBCcR9pqfvnnV9lChoBkdAcyAe4Cp3o2gHS6FoCEdBCcR901dgOXV9lChoBkdAdFVUwBYFJWgHS71oCEdBCcR/IHVwxXV9lChoBkdAcF62HtWuHWgHS51oCEdBCcR/iYXwb3V9lChoBkdAcuDkpI+W4WgHS45oCEdBCcR/oRwqAnV9lChoBkdAc2c63RXwLGgHS5poCEdBCcR/vrQgLnV9lChoBkdAcWfXiBGx2WgHS6RoCEdBCcSAd67dznV9lChoBkdAcfVxPO6d2GgHS5VoCEdBCcSApZ2ZA3V9lChoBkdAcj0XP7el9GgHS61oCEdBCcSBDDIiknV9lChoBkdAb6N1M/QjU2gHS5poCEdBCcSBTQb++HV9lChoBkdAcj7287IT5GgHS5xoCEdBCcSCWdXkpHV9lChoBkdAc6RHoX9BKWgHS6ZoCEdBCcSCqi22HHV9lChoBkdAcGPzzmOlwmgHS6NoCEdBCcSCtfReC3V9lChoBkdAcNCwFTvRZ2gHS5ZoCEdBCcSC3Z5AyHV9lChoBkdAccr25hBqsWgHS6VoCEdBCcSDAEZBLXV9lChoBkdAc45lSjxkNGgHS7toCEdBCcSDY1+AmXV9lChoBkdAc/MPQv6CUWgHS69oCEdBCcSDh/Aj6nV9lChoBkdAcjswOOKfnWgHS5doCEdBCcSE35aePXV9lChoBkdAcjW2CuloDmgHS5ZoCEdBCcSE7urp7nV9lChoBkdAc/elf7aZhWgHS65oCEdBCcSFQePq93V9lChoBkdAcCmEIPbwjWgHS4poCEdBCcSF717IDHV9lChoBkdAcP0c1O0sv2gHS69oCEdBCcSF8QyylnV9lChoBkdAc4UsUIsyz2gHS6loCEdBCcSGjBj4H3V9lChoBkdAclEEvCdjG2gHS61oCEdBCcSG+df9gnV9lChoBkdAdInzyjHn2mgHS65oCEdBCcSIC4jKPnV9lChoBkdAcaJ7/XGwR2gHS4poCEdBCcSIM1n/UHV9lChoBkdAchmxO+IuXmgHS6hoCEdBCcSJAbuMM3VlLg=="}, "ep_success_buffer": {":type:": "<class 'collections.deque'>", ":serialized:": "gAWVIAAAAAAAAACMC2NvbGxlY3Rpb25zlIwFZGVxdWWUk5QpS2SGlFKULg=="}, "_n_updates": 85748, "observation_space": {":type:": "<class 'gymnasium.spaces.box.Box'>", ":serialized:": "gAWVcAIAAAAAAACMFGd5bW5hc2l1bS5zcGFjZXMuYm94lIwDQm94lJOUKYGUfZQojAVkdHlwZZSMBW51bXB5lGgFk5SMAmY0lImIh5RSlChLA4wBPJROTk5K/////0r/////SwB0lGKMDWJvdW5kZWRfYmVsb3eUjBJudW1weS5jb3JlLm51bWVyaWOUjAtfZnJvbWJ1ZmZlcpSTlCiWCAAAAAAAAAABAQEBAQEBAZRoB4wCYjGUiYiHlFKUKEsDjAF8lE5OTkr/////Sv////9LAHSUYksIhZSMAUOUdJRSlIwNYm91bmRlZF9hYm92ZZRoECiWCAAAAAAAAAABAQEBAQEBAZRoFEsIhZRoGHSUUpSMBl9zaGFwZZRLCIWUjANsb3eUaBAoliAAAAAAAAAAAAC0wgAAtMIAAKDAAACgwNsPScAAAKDAAAAAgAAAAICUaApLCIWUaBh0lFKUjARoaWdolGgQKJYgAAAAAAAAAAAAtEIAALRCAACgQAAAoEDbD0lAAACgQAAAgD8AAIA/lGgKSwiFlGgYdJRSlIwIbG93X3JlcHKUjFtbLTkwLiAgICAgICAgLTkwLiAgICAgICAgIC01LiAgICAgICAgIC01LiAgICAgICAgIC0zLjE0MTU5MjcgIC01LgogIC0wLiAgICAgICAgIC0wLiAgICAgICBdlIwJaGlnaF9yZXBylIxTWzkwLiAgICAgICAgOTAuICAgICAgICAgNS4gICAgICAgICA1LiAgICAgICAgIDMuMTQxNTkyNyAgNS4KICAxLiAgICAgICAgIDEuICAgICAgIF2UjApfbnBfcmFuZG9tlE51Yi4=", "dtype": "float32", "bounded_below": "[ True True True True True True True True]", "bounded_above": "[ True True True True True True True True]", "_shape": [8], "low": "[-90. -90. -5. -5. -3.1415927 -5.\n -0. -0. ]", "high": "[90. 90. 5. 5. 3.1415927 5.\n 1. 1. ]", "low_repr": "[-90. -90. -5. -5. -3.1415927 -5.\n -0. -0. ]", "high_repr": "[90. 90. 5. 5. 3.1415927 5.\n 1. 1. ]", "_np_random": null}, "action_space": {":type:": "<class 'gymnasium.spaces.discrete.Discrete'>", ":serialized:": "gAWV1QAAAAAAAACMGWd5bW5hc2l1bS5zcGFjZXMuZGlzY3JldGWUjAhEaXNjcmV0ZZSTlCmBlH2UKIwBbpSMFW51bXB5LmNvcmUubXVsdGlhcnJheZSMBnNjYWxhcpSTlIwFbnVtcHmUjAVkdHlwZZSTlIwCaTiUiYiHlFKUKEsDjAE8lE5OTkr/////Sv////9LAHSUYkMIBAAAAAAAAACUhpRSlIwFc3RhcnSUaAhoDkMIAAAAAAAAAACUhpRSlIwGX3NoYXBllCloCmgOjApfbnBfcmFuZG9tlE51Yi4=", "n": "4", "start": "0", "_shape": [], "dtype": "int64", "_np_random": null}, "n_envs": 16, "n_steps": 1024, "gamma": 0.999, "gae_lambda": 0.98, "ent_coef": 0.01, "vf_coef": 0.5, "max_grad_norm": 0.5, "batch_size": 64, "n_epochs": 4, "clip_range": {":type:": "<class 'function'>", ":serialized:": "gAWV5QIAAAAAAACMF2Nsb3VkcGlja2xlLmNsb3VkcGlja2xllIwOX21ha2VfZnVuY3Rpb26Uk5QoaACMDV9idWlsdGluX3R5cGWUk5SMCENvZGVUeXBllIWUUpQoSwFLAEsASwFLAUsTQwSIAFMAlE6FlCmMAV+UhZSMZS9ob21lL3NlbmxpLy5jb25kYS9lbnZzL3NlbmxpX1B5dGhvbjMuOC9saWIvcHl0aG9uMy44L3NpdGUtcGFja2FnZXMvc3RhYmxlX2Jhc2VsaW5lczMvY29tbW9uL3V0aWxzLnB5lIwEZnVuY5RLhEMCAAGUjAN2YWyUhZQpdJRSlH2UKIwLX19wYWNrYWdlX1+UjBhzdGFibGVfYmFzZWxpbmVzMy5jb21tb26UjAhfX25hbWVfX5SMHnN0YWJsZV9iYXNlbGluZXMzLmNvbW1vbi51dGlsc5SMCF9fZmlsZV9flIxlL2hvbWUvc2VubGkvLmNvbmRhL2VudnMvc2VubGlfUHl0aG9uMy44L2xpYi9weXRob24zLjgvc2l0ZS1wYWNrYWdlcy9zdGFibGVfYmFzZWxpbmVzMy9jb21tb24vdXRpbHMucHmUdU5OaACMEF9tYWtlX2VtcHR5X2NlbGyUk5QpUpSFlHSUUpRoAIwSX2Z1bmN0aW9uX3NldHN0YXRllJOUaB99lH2UKGgWjARmdW5jlIwMX19xdWFsbmFtZV9flIwZY29uc3RhbnRfZm4uPGxvY2Fscz4uZnVuY5SMD19fYW5ub3RhdGlvbnNfX5R9lIwOX19rd2RlZmF1bHRzX1+UTowMX19kZWZhdWx0c19flE6MCl9fbW9kdWxlX1+UaBeMB19fZG9jX1+UTowLX19jbG9zdXJlX1+UaACMCl9tYWtlX2NlbGyUk5RHP8mZmZmZmZqFlFKUhZSMF19jbG91ZHBpY2tsZV9zdWJtb2R1bGVzlF2UjAtfX2dsb2JhbHNfX5R9lHWGlIZSMC4="}, "clip_range_vf": null, "normalize_advantage": true, "target_kl": null, "lr_schedule": {":type:": "<class 'function'>", ":serialized:": "gAWV5QIAAAAAAACMF2Nsb3VkcGlja2xlLmNsb3VkcGlja2xllIwOX21ha2VfZnVuY3Rpb26Uk5QoaACMDV9idWlsdGluX3R5cGWUk5SMCENvZGVUeXBllIWUUpQoSwFLAEsASwFLAUsTQwSIAFMAlE6FlCmMAV+UhZSMZS9ob21lL3NlbmxpLy5jb25kYS9lbnZzL3NlbmxpX1B5dGhvbjMuOC9saWIvcHl0aG9uMy44L3NpdGUtcGFja2FnZXMvc3RhYmxlX2Jhc2VsaW5lczMvY29tbW9uL3V0aWxzLnB5lIwEZnVuY5RLhEMCAAGUjAN2YWyUhZQpdJRSlH2UKIwLX19wYWNrYWdlX1+UjBhzdGFibGVfYmFzZWxpbmVzMy5jb21tb26UjAhfX25hbWVfX5SMHnN0YWJsZV9iYXNlbGluZXMzLmNvbW1vbi51dGlsc5SMCF9fZmlsZV9flIxlL2hvbWUvc2VubGkvLmNvbmRhL2VudnMvc2VubGlfUHl0aG9uMy44L2xpYi9weXRob24zLjgvc2l0ZS1wYWNrYWdlcy9zdGFibGVfYmFzZWxpbmVzMy9jb21tb24vdXRpbHMucHmUdU5OaACMEF9tYWtlX2VtcHR5X2NlbGyUk5QpUpSFlHSUUpRoAIwSX2Z1bmN0aW9uX3NldHN0YXRllJOUaB99lH2UKGgWjARmdW5jlIwMX19xdWFsbmFtZV9flIwZY29uc3RhbnRfZm4uPGxvY2Fscz4uZnVuY5SMD19fYW5ub3RhdGlvbnNfX5R9lIwOX19rd2RlZmF1bHRzX1+UTowMX19kZWZhdWx0c19flE6MCl9fbW9kdWxlX1+UaBeMB19fZG9jX1+UTowLX19jbG9zdXJlX1+UaACMCl9tYWtlX2NlbGyUk5RHPzOpKjBVMmGFlFKUhZSMF19jbG91ZHBpY2tsZV9zdWJtb2R1bGVzlF2UjAtfX2dsb2JhbHNfX5R9lHWGlIZSMC4="}, "system_info": {"OS": "Linux-5.15.0-134-generic-x86_64-with-glibc2.17 # 145-Ubuntu SMP Wed Feb 12 20:08:39 UTC 2025", "Python": "3.8.20", "Stable-Baselines3": "2.0.0a5", "PyTorch": "2.4.1+cu121", "GPU Enabled": "True", "Numpy": "1.24.4", "Cloudpickle": "3.1.1", "Gymnasium": "0.28.1", "OpenAI Gym": "0.26.2"}}
|
|
|
|
| 1 |
+
{"policy_class": {":type:": "<class 'abc.ABCMeta'>", ":serialized:": "gAWVOwAAAAAAAACMIXN0YWJsZV9iYXNlbGluZXMzLmNvbW1vbi5wb2xpY2llc5SMEUFjdG9yQ3JpdGljUG9saWN5lJOULg==", "__module__": "stable_baselines3.common.policies", "__doc__": "\n Policy class for actor-critic algorithms (has both policy and value prediction).\n Used by A2C, PPO and the likes.\n\n :param observation_space: Observation space\n :param action_space: Action space\n :param lr_schedule: Learning rate schedule (could be constant)\n :param net_arch: The specification of the policy and value networks.\n :param activation_fn: Activation function\n :param ortho_init: Whether to use or not orthogonal initialization\n :param use_sde: Whether to use State Dependent Exploration or not\n :param log_std_init: Initial value for the log standard deviation\n :param full_std: Whether to use (n_features x n_actions) parameters\n for the std instead of only (n_features,) when using gSDE\n :param use_expln: Use ``expln()`` function instead of ``exp()`` to ensure\n a positive standard deviation (cf paper). It allows to keep variance\n above zero and prevent it from growing too fast. In practice, ``exp()`` is usually enough.\n :param squash_output: Whether to squash the output using a tanh function,\n this allows to ensure boundaries when using gSDE.\n :param features_extractor_class: Features extractor to use.\n :param features_extractor_kwargs: Keyword arguments\n to pass to the features extractor.\n :param share_features_extractor: If True, the features extractor is shared between the policy and value networks.\n :param normalize_images: Whether to normalize images or not,\n dividing by 255.0 (True by default)\n :param optimizer_class: The optimizer to use,\n ``th.optim.Adam`` by default\n :param optimizer_kwargs: Additional keyword arguments,\n excluding the learning rate, to pass to the optimizer\n ", "__init__": "<function ActorCriticPolicy.__init__ at 0x7f2803f51160>", "_get_constructor_parameters": "<function ActorCriticPolicy._get_constructor_parameters at 0x7f2803f511f0>", "reset_noise": "<function ActorCriticPolicy.reset_noise at 0x7f2803f51280>", "_build_mlp_extractor": "<function ActorCriticPolicy._build_mlp_extractor at 0x7f2803f51310>", "_build": "<function ActorCriticPolicy._build at 0x7f2803f513a0>", "forward": "<function ActorCriticPolicy.forward at 0x7f2803f51430>", "extract_features": "<function ActorCriticPolicy.extract_features at 0x7f2803f514c0>", "_get_action_dist_from_latent": "<function ActorCriticPolicy._get_action_dist_from_latent at 0x7f2803f51550>", "_predict": "<function ActorCriticPolicy._predict at 0x7f2803f515e0>", "evaluate_actions": "<function ActorCriticPolicy.evaluate_actions at 0x7f2803f51670>", "get_distribution": "<function ActorCriticPolicy.get_distribution at 0x7f2803f51700>", "predict_values": "<function ActorCriticPolicy.predict_values at 0x7f2803f51790>", "__abstractmethods__": "frozenset()", "_abc_impl": "<_abc_data object at 0x7f2803fb2d20>"}, "verbose": 0, "policy_kwargs": {}, "num_timesteps": 25001984, "_total_timesteps": 25000000, "_num_timesteps_at_start": 0, "seed": null, "action_noise": null, "start_time": 1744344722995548300, "learning_rate": 0.0003, "tensorboard_log": null, "_last_obs": {":type:": "<class 'numpy.ndarray'>", ":serialized:": "gAWVdQIAAAAAAACMEm51bXB5LmNvcmUubnVtZXJpY5SMC19mcm9tYnVmZmVylJOUKJYAAgAAAAAAAE3mer28GW09IuGQPq3m0L53oYA9gsOFPgAAAAAAAAAAgESmPRX9jT9FEVg+FuxWvwSFcD64/yQ+AAAAAAAAAABGbCg+OqmZPxdFED96lA6/uSyRPn235D4AAAAAAAAAAGaGMruqw6k/+Nj6vClHBr++JUs7dpHgOwAAAAAAAAAA5lNdPoB9oT/gP+c+rIMhv+1eHz88Upw+AAAAAAAAAABz+c89ESsFPjwXCb/Li/i+QrsBvgjQ7r4AAAAAAAAAAAAcjjtWvrM/s5tgPSZrBb4LMqG71RlJvAAAAAAAAAAAmqcLPUN5Gj07hQ6+sl3PvgGipru2C+a9AAAAAAAAAACaABs+ZRvYPiD87r0mPlO/muuLPjd3RL4AAAAAAAAAADPHJLz7G3I/Jq9Gu0n3f7+CCY67Zs+PvQAAAAAAAAAABowLvnmPZT7+IKg+f9cQv7I3K75/f4Y+AAAAAAAAAAC+3YW+e7NyP/FuBj5ACSu/rr0lvzv9eD4AAAAAAAAAAJqQSz3hgO66g897vnFFk745e1G++ShJPwAAgD8AAAAAmiEXO+Hwq7rcgCe5c2EctErPqDraGUA4AACAPwAAgD+a2eC74RSOuvhCojvV/JM8K9gnOiubgL0AAIA/AACAP2Zp4T0Mv64/tdGTPvSk9b6KHEk+VcmjPgAAAAAAAAAAlIwFbnVtcHmUjAVkdHlwZZSTlIwCZjSUiYiHlFKUKEsDjAE8lE5OTkr/////Sv////9LAHSUYksQSwiGlIwBQ5R0lFKULg=="}, "_last_episode_starts": {":type:": "<class 'numpy.ndarray'>", ":serialized:": "gAWVgwAAAAAAAACMEm51bXB5LmNvcmUubnVtZXJpY5SMC19mcm9tYnVmZmVylJOUKJYQAAAAAAAAAAAAAAAAAAAAAAAAAAAAAACUjAVudW1weZSMBWR0eXBllJOUjAJiMZSJiIeUUpQoSwOMAXyUTk5OSv////9K/////0sAdJRiSxCFlIwBQ5R0lFKULg=="}, "_last_original_obs": null, "_episode_num": 0, "use_sde": false, "sde_sample_freq": -1, "_current_progress_remaining": -7.935999999997279e-05, "_stats_window_size": 100, "ep_info_buffer": {":type:": "<class 'collections.deque'>", ":serialized:": "gAWV4gsAAAAAAACMC2NvbGxlY3Rpb25zlIwFZGVxdWWUk5QpS2SGlFKUKH2UKIwBcpRHQHLc/lZHNHKMAWyUS6aMAXSUR0EKPC2lIuoQdX2UKGgGR0BwMCEvkBCEaAdLqWgIR0EKPC2oK2KEdX2UKGgGR0Bws1wm3OObaAdLmGgIR0EKPC31X/5tdX2UKGgGR0BypxbVz6rOaAdLrmgIR0EKPC5DgZTAdX2UKGgGR0BzFYWP91loaAdLvGgIR0EKPC6f4yoGdX2UKGgGR0BzVR5ooNNKaAdLrGgIR0EKPC8FWfbsdX2UKGgGR0By4h9/jKgaaAdLvmgIR0EKPEIV3Ux3dX2UKGgGR0BzQ9IZqEeyaAdLy2gIR0EKPENVVPvbdX2UKGgGR0BzXeoLofSyaAdLp2gIR0EKPEOwVbiZdX2UKGgGR0ByxZwn6VMVaAdLn2gIR0EKPEP5hz/7dX2UKGgGR0BxZL7IkqtpaAdLj2gIR0EKPERn4fwJdX2UKGgGR0BxAeOU+s5oaAdLl2gIR0EKPESOjASGdX2UKGgGR0ByqM7QswtbaAdLk2gIR0EKPEX60hNedX2UKGgGR0ByjO3jMmngaAdLo2gIR0EKPEaeWfK7dX2UKGgGR0ByDUNYr8R+aAdLt2gIR0EKPEdTOxB3dX2UKGgGR0BzNwRIz3yqaAdLsWgIR0EKPEeE0zj4dX2UKGgGR0BpE+XmeUY9aAdN6ANoCEdBCjxHonWrfnV9lChoBkdAcYR4ACGN72gHS6RoCEdBCjxHrM9r43V9lChoBkdAcjBaKDTScGgHS5xoCEdBCjxICBkI5nV9lChoBkdAc1j0+1SflWgHS9NoCEdBCjxICcVgyHV9lChoBkdAcqz8c+7lJmgHS79oCEdBCjxIPVoYenV9lChoBkdAc3w0CRwIdGgHS7VoCEdBCjxIeU4aP3V9lChoBkdAcrBVu76HkGgHS6NoCEdBCjxJGIInjXV9lChoBkdAcPl0qYqoZWgHS55oCEdBCjxJgB5ooXV9lChoBkdAcDGTkQwsXmgHS7FoCEdBCjxKChpQDXV9lChoBkdAcHdcgyM1j2gHS6toCEdBCjxK/jp9qnV9lChoBkdAcrAehwl0HWgHS8RoCEdBCjxMMYQ8OnV9lChoBkdAcmwlenhsImgHS39oCEdBCjxNsvCdjHV9lChoBkdAcBiTrE9+w2gHS45oCEdBCjxN0VJti3V9lChoBkdAc+xB6KLsKWgHS6doCEdBCjxNz7CSBHV9lChoBkdAc/7xXGOuJWgHS51oCEdBCjxOPXd0rHV9lChoBkdAcP/Z0Syt3mgHS41oCEdBCjxOvi97GHV9lChoBkdAcAHChvitJWgHS5NoCEdBCjxOvZ00WXV9lChoBkdAcz4N3GGVRmgHS9BoCEdBCjxPKu6mO3V9lChoBkdAcUg3AVO9FmgHS6poCEdBCjxPRF/hEXV9lChoBkdAdJoX9BKL9GgHS8poCEdBCjxQfV9WqHV9lChoBkdAcopRChN/OWgHS5RoCEdBCjxQjKgZj3V9lChoBkdAcgVPmgam42gHS7RoCEdBCjxQ1v863nV9lChoBkdAcYsSnLq2SmgHS5toCEdBCjxRn7SApnV9lChoBkdAcmRKOT7l72gHS6poCEdBCjxRvkq+anV9lChoBkdAcrvYa5wwTWgHS6hoCEdBCjxSswJw9HV9lChoBkdAcWWwK0D2amgHS5doCEdBCjxS2SOinHV9lChoBkdAcYHL9uP3jGgHS45oCEdBCjxTefXf7HV9lChoBkdAcgPP+XJHRWgHS5loCEdBCjxT8MG5c3V9lChoBkdAcUyVf/m1Y2gHS5VoCEdBCjxUIYYR/XV9lChoBkdAcESrd30PH2gHS5toCEdBCjxUEfvF33V9lChoBkdAcWvN7BwdbWgHS5FoCEdBCjxUVByCF3V9lChoBkdAcI4ZpSJj2GgHS55oCEdBCjxVF4RmLHV9lChoBkdAc/wnRb8m8mgHS6loCEdBCjxVjYsd1nV9lChoBkdAcuRJY1YQrmgHS5poCEdBCjxWKt3fRHV9lChoBkdAcmBuf29L6GgHS5loCEdBCjxWZubZvnV9lChoBkdAc+Ve5WilBWgHS89oCEdBCjxWpfjS5XV9lChoBkdAc7zSVnmJWWgHS6hoCEdBCjxWp+6RQ3V9lChoBkdAcbQTYdyT6mgHS5RoCEdBCjxXDOgQH3V9lChoBkdAcFsRGtp22WgHS7FoCEdBCjxYPL1VYXV9lChoBkdAc99yHmA9V2gHS6toCEdBCjxZLb5/LHV9lChoBkdAc+gZ26kIomgHS7FoCEdBCjxZQhfShXV9lChoBkdAcvZXxvvSdGgHS5VoCEdBCjxZkAFPi3V9lChoBkdAcg4XaJyhjGgHS6BoCEdBCjxZ5iAlOXV9lChoBkdAc1UtEofCAWgHS7hoCEdBCjxaSG8Em3V9lChoBkdAci35Ke05VGgHS7hoCEdBCjxa6aG5+nV9lChoBkdAcLORbr1M/WgHS6FoCEdBCjxbC+nIhnV9lChoBkdAcP9QvYe1bGgHS79oCEdBCjxbV+Xqq3V9lChoBkdAcZnEBbOeKGgHS6VoCEdBCjxboElme3V9lChoBkdAcuzJcPe54GgHS59oCEdBCjxb8d/8VHV9lChoBkdAccMyad+Xq2gHS5toCEdBCjxcNpPAPHV9lChoBkdAcswpCa7Va2gHS7doCEdBCjxc8zwc53V9lChoBkdAcWxAtFrmAGgHS6RoCEdBCjxc6EQGwHV9lChoBkdAcZ/IyTINmWgHS7RoCEdBCjxdCVB2OnV9lChoBkdAcRtsp5NXYGgHS4xoCEdBCjxdKM5wO3V9lChoBkdAcbyIjnmq52gHS5toCEdBCjxeXc1wYXV9lChoBkdAdAO/SpiqhmgHS7VoCEdBCjxfKeqaPXV9lChoBkdAcys4nndO7GgHS5hoCEdBCjxfOMfignV9lChoBkdAcrhd2xIJ7mgHS5RoCEdBCjxfsyrPt3V9lChoBkdAcKgDCgsbvWgHS7ZoCEdBCjxf8enyeHV9lChoBkdAc9+Ooo/iYWgHS8NoCEdBCjxgGpsGgXV9lChoBkdAcqzmmce8w2gHS5loCEdBCjxgiiwjdHV9lChoBkdAc0QwiaAnUmgHS69oCEdBCjxgvoV2zXV9lChoBkdAc21v/R3NcGgHS5toCEdBCjxhKCz1LHV9lChoBkdAcg+2/zreImgHS7doCEdBCjxhOv2XcHV9lChoBkdAcgIa6STyKGgHS4poCEdBCjxhQUSIxnV9lChoBkdAcGlt3OfNA2gHS5ZoCEdBCjxhq02LpHV9lChoBkdAcpLtozvZy2gHS7doCEdBCjxhuT1TSHV9lChoBkdAcLhcC5mRNmgHS6NoCEdBCjxiD9n9N3V9lChoBkdAcnSV/c32mGgHS6JoCEdBCjxiJ+lTFXV9lChoBkdAY9jLq2SdOWgHTegDaAhHQQo8Ys8cMmZ1fZQoaAZHQHM4JOnEVFhoB0uiaAhHQQo8Y04MnZ11fZQoaAZHQHD9DZlFtsNoB0ujaAhHQQo8Y/vjwQV1fZQoaAZHQHELCwbEP2BoB0uZaAhHQQo8ZB4L1Ep1fZQoaAZHQHEHOnMt9QZoB0uraAhHQQo8ZDYxL011fZQoaAZHQHI7sLORkmRoB0uLaAhHQQo8ZGGqxTt1fZQoaAZHQHLsurlvIfdoB0unaAhHQQo8ZLDtPYZ1fZQoaAZHQHHsFdcB2fVoB0usaAhHQQo8ZLpxFRZ1fZQoaAZHQHCXF50KZ2JoB0ufaAhHQQo8ZWWmgrZ1fZQoaAZHQHCpDpX6qKhoB0u0aAhHQQo8ZZI7Njd1fZQoaAZHQHDkKWX1J19oB0uSaAhHQQo8ZZUtqYZ1fZQoaAZHQHAu6G5+YtxoB0ujaAhHQQo8ZZsUIs11fZQoaAZHQHKv52pyZKFoB0uvaAhHQQo8ZefdRBN1fZQoaAZHQHJZn2IwdsBoB0uvaAhHQQo8Zj/echF1fZQoaAZHQHLA5YkmhM9oB0ucaAhHQQo8Zj3XZoR1ZS4="}, "ep_success_buffer": {":type:": "<class 'collections.deque'>", ":serialized:": "gAWVIAAAAAAAAACMC2NvbGxlY3Rpb25zlIwFZGVxdWWUk5QpS2SGlFKULg=="}, "_n_updates": 79400, "observation_space": {":type:": "<class 'gymnasium.spaces.box.Box'>", ":serialized:": "gAWVcAIAAAAAAACMFGd5bW5hc2l1bS5zcGFjZXMuYm94lIwDQm94lJOUKYGUfZQojAVkdHlwZZSMBW51bXB5lGgFk5SMAmY0lImIh5RSlChLA4wBPJROTk5K/////0r/////SwB0lGKMDWJvdW5kZWRfYmVsb3eUjBJudW1weS5jb3JlLm51bWVyaWOUjAtfZnJvbWJ1ZmZlcpSTlCiWCAAAAAAAAAABAQEBAQEBAZRoB4wCYjGUiYiHlFKUKEsDjAF8lE5OTkr/////Sv////9LAHSUYksIhZSMAUOUdJRSlIwNYm91bmRlZF9hYm92ZZRoECiWCAAAAAAAAAABAQEBAQEBAZRoFEsIhZRoGHSUUpSMBl9zaGFwZZRLCIWUjANsb3eUaBAoliAAAAAAAAAAAAC0wgAAtMIAAKDAAACgwNsPScAAAKDAAAAAgAAAAICUaApLCIWUaBh0lFKUjARoaWdolGgQKJYgAAAAAAAAAAAAtEIAALRCAACgQAAAoEDbD0lAAACgQAAAgD8AAIA/lGgKSwiFlGgYdJRSlIwIbG93X3JlcHKUjFtbLTkwLiAgICAgICAgLTkwLiAgICAgICAgIC01LiAgICAgICAgIC01LiAgICAgICAgIC0zLjE0MTU5MjcgIC01LgogIC0wLiAgICAgICAgIC0wLiAgICAgICBdlIwJaGlnaF9yZXBylIxTWzkwLiAgICAgICAgOTAuICAgICAgICAgNS4gICAgICAgICA1LiAgICAgICAgIDMuMTQxNTkyNyAgNS4KICAxLiAgICAgICAgIDEuICAgICAgIF2UjApfbnBfcmFuZG9tlE51Yi4=", "dtype": "float32", "bounded_below": "[ True True True True True True True True]", "bounded_above": "[ True True True True True True True True]", "_shape": [8], "low": "[-90. -90. -5. -5. -3.1415927 -5.\n -0. -0. ]", "high": "[90. 90. 5. 5. 3.1415927 5.\n 1. 1. ]", "low_repr": "[-90. -90. -5. -5. -3.1415927 -5.\n -0. -0. ]", "high_repr": "[90. 90. 5. 5. 3.1415927 5.\n 1. 1. ]", "_np_random": null}, "action_space": {":type:": "<class 'gymnasium.spaces.discrete.Discrete'>", ":serialized:": "gAWV1QAAAAAAAACMGWd5bW5hc2l1bS5zcGFjZXMuZGlzY3JldGWUjAhEaXNjcmV0ZZSTlCmBlH2UKIwBbpSMFW51bXB5LmNvcmUubXVsdGlhcnJheZSMBnNjYWxhcpSTlIwFbnVtcHmUjAVkdHlwZZSTlIwCaTiUiYiHlFKUKEsDjAE8lE5OTkr/////Sv////9LAHSUYkMIBAAAAAAAAACUhpRSlIwFc3RhcnSUaAhoDkMIAAAAAAAAAACUhpRSlIwGX3NoYXBllCloCmgOjApfbnBfcmFuZG9tlE51Yi4=", "n": "4", "start": "0", "_shape": [], "dtype": "int64", "_np_random": null}, "n_envs": 16, "n_steps": 1024, "gamma": 0.999, "gae_lambda": 0.98, "ent_coef": 0.01, "vf_coef": 0.5, "max_grad_norm": 0.5, "batch_size": 64, "n_epochs": 4, "clip_range": {":type:": "<class 'function'>", ":serialized:": "gAWV5QIAAAAAAACMF2Nsb3VkcGlja2xlLmNsb3VkcGlja2xllIwOX21ha2VfZnVuY3Rpb26Uk5QoaACMDV9idWlsdGluX3R5cGWUk5SMCENvZGVUeXBllIWUUpQoSwFLAEsASwFLAUsTQwSIAFMAlE6FlCmMAV+UhZSMZS9ob21lL3NlbmxpLy5jb25kYS9lbnZzL3NlbmxpX1B5dGhvbjMuOC9saWIvcHl0aG9uMy44L3NpdGUtcGFja2FnZXMvc3RhYmxlX2Jhc2VsaW5lczMvY29tbW9uL3V0aWxzLnB5lIwEZnVuY5RLhEMCAAGUjAN2YWyUhZQpdJRSlH2UKIwLX19wYWNrYWdlX1+UjBhzdGFibGVfYmFzZWxpbmVzMy5jb21tb26UjAhfX25hbWVfX5SMHnN0YWJsZV9iYXNlbGluZXMzLmNvbW1vbi51dGlsc5SMCF9fZmlsZV9flIxlL2hvbWUvc2VubGkvLmNvbmRhL2VudnMvc2VubGlfUHl0aG9uMy44L2xpYi9weXRob24zLjgvc2l0ZS1wYWNrYWdlcy9zdGFibGVfYmFzZWxpbmVzMy9jb21tb24vdXRpbHMucHmUdU5OaACMEF9tYWtlX2VtcHR5X2NlbGyUk5QpUpSFlHSUUpRoAIwSX2Z1bmN0aW9uX3NldHN0YXRllJOUaB99lH2UKGgWjARmdW5jlIwMX19xdWFsbmFtZV9flIwZY29uc3RhbnRfZm4uPGxvY2Fscz4uZnVuY5SMD19fYW5ub3RhdGlvbnNfX5R9lIwOX19rd2RlZmF1bHRzX1+UTowMX19kZWZhdWx0c19flE6MCl9fbW9kdWxlX1+UaBeMB19fZG9jX1+UTowLX19jbG9zdXJlX1+UaACMCl9tYWtlX2NlbGyUk5RHP8mZmZmZmZqFlFKUhZSMF19jbG91ZHBpY2tsZV9zdWJtb2R1bGVzlF2UjAtfX2dsb2JhbHNfX5R9lHWGlIZSMC4="}, "clip_range_vf": null, "normalize_advantage": true, "target_kl": null, "lr_schedule": {":type:": "<class 'function'>", ":serialized:": "gAWV5QIAAAAAAACMF2Nsb3VkcGlja2xlLmNsb3VkcGlja2xllIwOX21ha2VfZnVuY3Rpb26Uk5QoaACMDV9idWlsdGluX3R5cGWUk5SMCENvZGVUeXBllIWUUpQoSwFLAEsASwFLAUsTQwSIAFMAlE6FlCmMAV+UhZSMZS9ob21lL3NlbmxpLy5jb25kYS9lbnZzL3NlbmxpX1B5dGhvbjMuOC9saWIvcHl0aG9uMy44L3NpdGUtcGFja2FnZXMvc3RhYmxlX2Jhc2VsaW5lczMvY29tbW9uL3V0aWxzLnB5lIwEZnVuY5RLhEMCAAGUjAN2YWyUhZQpdJRSlH2UKIwLX19wYWNrYWdlX1+UjBhzdGFibGVfYmFzZWxpbmVzMy5jb21tb26UjAhfX25hbWVfX5SMHnN0YWJsZV9iYXNlbGluZXMzLmNvbW1vbi51dGlsc5SMCF9fZmlsZV9flIxlL2hvbWUvc2VubGkvLmNvbmRhL2VudnMvc2VubGlfUHl0aG9uMy44L2xpYi9weXRob24zLjgvc2l0ZS1wYWNrYWdlcy9zdGFibGVfYmFzZWxpbmVzMy9jb21tb24vdXRpbHMucHmUdU5OaACMEF9tYWtlX2VtcHR5X2NlbGyUk5QpUpSFlHSUUpRoAIwSX2Z1bmN0aW9uX3NldHN0YXRllJOUaB99lH2UKGgWjARmdW5jlIwMX19xdWFsbmFtZV9flIwZY29uc3RhbnRfZm4uPGxvY2Fscz4uZnVuY5SMD19fYW5ub3RhdGlvbnNfX5R9lIwOX19rd2RlZmF1bHRzX1+UTowMX19kZWZhdWx0c19flE6MCl9fbW9kdWxlX1+UaBeMB19fZG9jX1+UTowLX19jbG9zdXJlX1+UaACMCl9tYWtlX2NlbGyUk5RHPzOpKjBVMmGFlFKUhZSMF19jbG91ZHBpY2tsZV9zdWJtb2R1bGVzlF2UjAtfX2dsb2JhbHNfX5R9lHWGlIZSMC4="}, "system_info": {"OS": "Linux-5.15.0-134-generic-x86_64-with-glibc2.17 # 145-Ubuntu SMP Wed Feb 12 20:08:39 UTC 2025", "Python": "3.8.20", "Stable-Baselines3": "2.0.0a5", "PyTorch": "2.4.1+cu121", "GPU Enabled": "True", "Numpy": "1.24.4", "Cloudpickle": "3.1.1", "Gymnasium": "0.28.1", "OpenAI Gym": "0.26.2"}}
|
replay.mp4
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
-
size
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:b57c914a530c74add5e0d5ed61df5e06a1c301aa4627f982d859cd2771471370
|
| 3 |
+
size 159670
|
results.json
CHANGED
|
@@ -1 +1 @@
|
|
| 1 |
-
{"mean_reward":
|
|
|
|
| 1 |
+
{"mean_reward": 261.7525052, "std_reward": 67.91867714355469, "is_deterministic": true, "n_eval_episodes": 10, "eval_datetime": "2025-04-11T08:09:50.649879"}
|