Upload PPO BipedalWalker-v3 trained agent
Browse files- BipedalWalker-v3.zip +2 -2
- BipedalWalker-v3/data +21 -21
- BipedalWalker-v3/policy.optimizer.pth +1 -1
- BipedalWalker-v3/policy.pth +1 -1
- README.md +1 -1
- config.json +1 -1
- replay.mp4 +0 -0
- results.json +1 -1
BipedalWalker-v3.zip
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
-
size
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:7f32267edd904b8cab23930eb85c7f3af605e7a4477e8d9fd2bdce341c41cce4
|
| 3 |
+
size 176431
|
BipedalWalker-v3/data
CHANGED
|
@@ -4,34 +4,34 @@
|
|
| 4 |
":serialized:": "gAWVOwAAAAAAAACMIXN0YWJsZV9iYXNlbGluZXMzLmNvbW1vbi5wb2xpY2llc5SMEUFjdG9yQ3JpdGljUG9saWN5lJOULg==",
|
| 5 |
"__module__": "stable_baselines3.common.policies",
|
| 6 |
"__doc__": "\n Policy class for actor-critic algorithms (has both policy and value prediction).\n Used by A2C, PPO and the likes.\n\n :param observation_space: Observation space\n :param action_space: Action space\n :param lr_schedule: Learning rate schedule (could be constant)\n :param net_arch: The specification of the policy and value networks.\n :param activation_fn: Activation function\n :param ortho_init: Whether to use or not orthogonal initialization\n :param use_sde: Whether to use State Dependent Exploration or not\n :param log_std_init: Initial value for the log standard deviation\n :param full_std: Whether to use (n_features x n_actions) parameters\n for the std instead of only (n_features,) when using gSDE\n :param use_expln: Use ``expln()`` function instead of ``exp()`` to ensure\n a positive standard deviation (cf paper). It allows to keep variance\n above zero and prevent it from growing too fast. In practice, ``exp()`` is usually enough.\n :param squash_output: Whether to squash the output using a tanh function,\n this allows to ensure boundaries when using gSDE.\n :param features_extractor_class: Features extractor to use.\n :param features_extractor_kwargs: Keyword arguments\n to pass to the features extractor.\n :param share_features_extractor: If True, the features extractor is shared between the policy and value networks.\n :param normalize_images: Whether to normalize images or not,\n dividing by 255.0 (True by default)\n :param optimizer_class: The optimizer to use,\n ``th.optim.Adam`` by default\n :param optimizer_kwargs: Additional keyword arguments,\n excluding the learning rate, to pass to the optimizer\n ",
|
| 7 |
-
"__init__": "<function ActorCriticPolicy.__init__ at
|
| 8 |
-
"_get_constructor_parameters": "<function ActorCriticPolicy._get_constructor_parameters at
|
| 9 |
-
"reset_noise": "<function ActorCriticPolicy.reset_noise at
|
| 10 |
-
"_build_mlp_extractor": "<function ActorCriticPolicy._build_mlp_extractor at
|
| 11 |
-
"_build": "<function ActorCriticPolicy._build at
|
| 12 |
-
"forward": "<function ActorCriticPolicy.forward at
|
| 13 |
-
"extract_features": "<function ActorCriticPolicy.extract_features at
|
| 14 |
-
"_get_action_dist_from_latent": "<function ActorCriticPolicy._get_action_dist_from_latent at
|
| 15 |
-
"_predict": "<function ActorCriticPolicy._predict at
|
| 16 |
-
"evaluate_actions": "<function ActorCriticPolicy.evaluate_actions at
|
| 17 |
-
"get_distribution": "<function ActorCriticPolicy.get_distribution at
|
| 18 |
-
"predict_values": "<function ActorCriticPolicy.predict_values at
|
| 19 |
"__abstractmethods__": "frozenset()",
|
| 20 |
-
"_abc_impl": "<_abc._abc_data object at
|
| 21 |
},
|
| 22 |
"verbose": 1,
|
| 23 |
"policy_kwargs": {},
|
| 24 |
-
"num_timesteps":
|
| 25 |
-
"_total_timesteps":
|
| 26 |
"_num_timesteps_at_start": 0,
|
| 27 |
"seed": null,
|
| 28 |
"action_noise": null,
|
| 29 |
-
"start_time":
|
| 30 |
"learning_rate": 0.0003,
|
| 31 |
"tensorboard_log": null,
|
| 32 |
"_last_obs": {
|
| 33 |
":type:": "<class 'numpy.ndarray'>",
|
| 34 |
-
":serialized:": "
|
| 35 |
},
|
| 36 |
"_last_episode_starts": {
|
| 37 |
":type:": "<class 'numpy.ndarray'>",
|
|
@@ -41,17 +41,17 @@
|
|
| 41 |
"_episode_num": 0,
|
| 42 |
"use_sde": false,
|
| 43 |
"sde_sample_freq": -1,
|
| 44 |
-
"_current_progress_remaining": -
|
| 45 |
"_stats_window_size": 100,
|
| 46 |
"ep_info_buffer": {
|
| 47 |
":type:": "<class 'collections.deque'>",
|
| 48 |
-
":serialized:": "
|
| 49 |
},
|
| 50 |
"ep_success_buffer": {
|
| 51 |
":type:": "<class 'collections.deque'>",
|
| 52 |
":serialized:": "gAWVIAAAAAAAAACMC2NvbGxlY3Rpb25zlIwFZGVxdWWUk5QpS2SGlFKULg=="
|
| 53 |
},
|
| 54 |
-
"_n_updates":
|
| 55 |
"observation_space": {
|
| 56 |
":type:": "<class 'gymnasium.spaces.box.Box'>",
|
| 57 |
":serialized:": "gAWVTAQAAAAAAACMFGd5bW5hc2l1bS5zcGFjZXMuYm94lIwDQm94lJOUKYGUfZQojAVkdHlwZZSMBW51bXB5lIwFZHR5cGWUk5SMAmY0lImIh5RSlChLA4wBPJROTk5K/////0r/////SwB0lGKMDWJvdW5kZWRfYmVsb3eUjBJudW1weS5jb3JlLm51bWVyaWOUjAtfZnJvbWJ1ZmZlcpSTlCiWGAAAAAAAAAABAQEBAQEBAQEBAQEBAQEBAQEBAQEBAQGUaAiMAmIxlImIh5RSlChLA4wBfJROTk5K/////0r/////SwB0lGJLGIWUjAFDlHSUUpSMDWJvdW5kZWRfYWJvdmWUaBEolhgAAAAAAAAAAQEBAQEBAQEBAQEBAQEBAQEBAQEBAQEBlGgVSxiFlGgZdJRSlIwGX3NoYXBllEsYhZSMA2xvd5RoESiWYAAAAAAAAADbD0nAAACgwAAAoMAAAKDA2w9JwAAAoMDbD0nAAACgwAAAAIDbD0nAAACgwNsPScAAAKDAAAAAgAAAgL8AAIC/AACAvwAAgL8AAIC/AACAvwAAgL8AAIC/AACAvwAAgL+UaAtLGIWUaBl0lFKUjARoaWdolGgRKJZgAAAAAAAAANsPSUAAAKBAAACgQAAAoEDbD0lAAACgQNsPSUAAAKBAAACgQNsPSUAAAKBA2w9JQAAAoEAAAKBAAACAPwAAgD8AAIA/AACAPwAAgD8AAIA/AACAPwAAgD8AAIA/AACAP5RoC0sYhZRoGXSUUpSMCGxvd19yZXBylIz+Wy0zLjE0MTU5MjcgLTUuICAgICAgICAtNS4gICAgICAgIC01LiAgICAgICAgLTMuMTQxNTkyNyAtNS4KIC0zLjE0MTU5MjcgLTUuICAgICAgICAtMC4gICAgICAgIC0zLjE0MTU5MjcgLTUuICAgICAgICAtMy4xNDE1OTI3CiAtNS4gICAgICAgIC0wLiAgICAgICAgLTEuICAgICAgICAtMS4gICAgICAgIC0xLiAgICAgICAgLTEuCiAtMS4gICAgICAgIC0xLiAgICAgICAgLTEuICAgICAgICAtMS4gICAgICAgIC0xLiAgICAgICAgLTEuICAgICAgIF2UjAloaWdoX3JlcHKUjOZbMy4xNDE1OTI3IDUuICAgICAgICA1LiAgICAgICAgNS4gICAgICAgIDMuMTQxNTkyNyA1LiAgICAgICAgMy4xNDE1OTI3CiA1LiAgICAgICAgNS4gICAgICAgIDMuMTQxNTkyNyA1LiAgICAgICAgMy4xNDE1OTI3IDUuICAgICAgICA1LgogMS4gICAgICAgIDEuICAgICAgICAxLiAgICAgICAgMS4gICAgICAgIDEuICAgICAgICAxLiAgICAgICAgMS4KIDEuICAgICAgICAxLiAgICAgICAgMS4gICAgICAgXZSMCl9ucF9yYW5kb22UTnViLg==",
|
|
@@ -83,7 +83,7 @@
|
|
| 83 |
"_np_random": null
|
| 84 |
},
|
| 85 |
"n_envs": 16,
|
| 86 |
-
"n_steps":
|
| 87 |
"gamma": 0.999,
|
| 88 |
"gae_lambda": 0.98,
|
| 89 |
"ent_coef": 0.01,
|
|
|
|
| 4 |
":serialized:": "gAWVOwAAAAAAAACMIXN0YWJsZV9iYXNlbGluZXMzLmNvbW1vbi5wb2xpY2llc5SMEUFjdG9yQ3JpdGljUG9saWN5lJOULg==",
|
| 5 |
"__module__": "stable_baselines3.common.policies",
|
| 6 |
"__doc__": "\n Policy class for actor-critic algorithms (has both policy and value prediction).\n Used by A2C, PPO and the likes.\n\n :param observation_space: Observation space\n :param action_space: Action space\n :param lr_schedule: Learning rate schedule (could be constant)\n :param net_arch: The specification of the policy and value networks.\n :param activation_fn: Activation function\n :param ortho_init: Whether to use or not orthogonal initialization\n :param use_sde: Whether to use State Dependent Exploration or not\n :param log_std_init: Initial value for the log standard deviation\n :param full_std: Whether to use (n_features x n_actions) parameters\n for the std instead of only (n_features,) when using gSDE\n :param use_expln: Use ``expln()`` function instead of ``exp()`` to ensure\n a positive standard deviation (cf paper). It allows to keep variance\n above zero and prevent it from growing too fast. In practice, ``exp()`` is usually enough.\n :param squash_output: Whether to squash the output using a tanh function,\n this allows to ensure boundaries when using gSDE.\n :param features_extractor_class: Features extractor to use.\n :param features_extractor_kwargs: Keyword arguments\n to pass to the features extractor.\n :param share_features_extractor: If True, the features extractor is shared between the policy and value networks.\n :param normalize_images: Whether to normalize images or not,\n dividing by 255.0 (True by default)\n :param optimizer_class: The optimizer to use,\n ``th.optim.Adam`` by default\n :param optimizer_kwargs: Additional keyword arguments,\n excluding the learning rate, to pass to the optimizer\n ",
|
| 7 |
+
"__init__": "<function ActorCriticPolicy.__init__ at 0x7e38025c36d0>",
|
| 8 |
+
"_get_constructor_parameters": "<function ActorCriticPolicy._get_constructor_parameters at 0x7e38025c3760>",
|
| 9 |
+
"reset_noise": "<function ActorCriticPolicy.reset_noise at 0x7e38025c37f0>",
|
| 10 |
+
"_build_mlp_extractor": "<function ActorCriticPolicy._build_mlp_extractor at 0x7e38025c3880>",
|
| 11 |
+
"_build": "<function ActorCriticPolicy._build at 0x7e38025c3910>",
|
| 12 |
+
"forward": "<function ActorCriticPolicy.forward at 0x7e38025c39a0>",
|
| 13 |
+
"extract_features": "<function ActorCriticPolicy.extract_features at 0x7e38025c3a30>",
|
| 14 |
+
"_get_action_dist_from_latent": "<function ActorCriticPolicy._get_action_dist_from_latent at 0x7e38025c3ac0>",
|
| 15 |
+
"_predict": "<function ActorCriticPolicy._predict at 0x7e38025c3b50>",
|
| 16 |
+
"evaluate_actions": "<function ActorCriticPolicy.evaluate_actions at 0x7e38025c3be0>",
|
| 17 |
+
"get_distribution": "<function ActorCriticPolicy.get_distribution at 0x7e38025c3c70>",
|
| 18 |
+
"predict_values": "<function ActorCriticPolicy.predict_values at 0x7e38025c3d00>",
|
| 19 |
"__abstractmethods__": "frozenset()",
|
| 20 |
+
"_abc_impl": "<_abc._abc_data object at 0x7e380255dec0>"
|
| 21 |
},
|
| 22 |
"verbose": 1,
|
| 23 |
"policy_kwargs": {},
|
| 24 |
+
"num_timesteps": 104000,
|
| 25 |
+
"_total_timesteps": 100000,
|
| 26 |
"_num_timesteps_at_start": 0,
|
| 27 |
"seed": null,
|
| 28 |
"action_noise": null,
|
| 29 |
+
"start_time": 1714106227409224375,
|
| 30 |
"learning_rate": 0.0003,
|
| 31 |
"tensorboard_log": null,
|
| 32 |
"_last_obs": {
|
| 33 |
":type:": "<class 'numpy.ndarray'>",
|
| 34 |
+
":serialized:": "gAWVdQYAAAAAAACMEm51bXB5LmNvcmUubnVtZXJpY5SMC19mcm9tYnVmZmVylJOUKJYABgAAAAAAAMIJBD7QzQA8/lIjPIr3Ozwlf0S/ZFonPyCr0z1ZNBG/AAAAAIDelD///38/dDIuPzXnv78AAIA/X6ltPkHdbz4rsHc+73WDPhLvjz6efqE+iyy8Pm8l6z78Tx8/AACAP+cNzj1Xxws9sPoiPdpdXzyrhJA/9OLwPsRlSj/7/3+/AACAPyBUKr/OdBS+mM/CvjzweL8AAAAAKQKKPimAiz7+/Y8+c7CYPpxKqD6B6L0+DtvePrGeCz9Vazc/AACAPwFr3j06IKk7hADePFKH/Dyq/FK/AAAAM0BfX70FAIA/AAAAAEVzjT8AAAAA/OdaP58z5b0AAIA/8apnPnVMaj6if3I+8aOAPvxYjD5uT54+TVi6PnTM6D4BbCc/AACAP02wXL9IhsC91PaauwWHCb4P5uQ+udGMPiKjKD/9/38/AAAAAMFbET6ADOQ7bH4uPyVWer8AAAAAzbvdPnBA4D6aGeg+lD/2PlFUBj+UhRc/sloyP+fQXj8AAIA/AACAP1FCXz0Nkq485H3nPGFe6Dwg4hq/XCtbvVg4Nr5W0oC/AAAAAB1ekD8ANH85KlxbP9Isgb4AAIA/Z8l/PnDegT7liYY+67SOPptsmj46B6w+/X3KPndk8z7MRho/ErN3P75zTD5loAS9am7ZO2ZovTyfRJE/AGYqOzRcRT+5CIA/AAAAAG8NSr++ZpE+MLz6vnXck74AAIA/BEODPlHxhT6T8Ys+j3yUPin9oT6tuLY+0qDUPjce/z4fjys/AACAP+T92z2vjgG8DkKVPOofAj2DU1W/oI7QuqhGcT6zH+o9AAAAABjijD8AJJo4SEZsP0t0VjsAAIA/qZZsPnxGbz4/pnc+dm6DPnF5jz7zYJ8+NBO3Plqq3z4FtSI/AACAP5Lp1D0bL4A9de3yutODfrxG91K/SDwAPSxbCD4AAIC/AAAAALa2jj8AAAAAvCtOP/gBB78AAIA/Z9ptPueNcD7cwXc+I7KCPq46jz6HOaM+15nAPhHL8T4AEC0/AACAP/6rFj6e/IC8sJELPt+B87xRz1G/YGc8OwBOfL6FbIC/AAAAAKREkT8AEJy3gG9NPw0RgD8AAAAAJvJrPhygbj4M+nY+0POCPiIWjj7kJJ8+JYW5Pk7Z7j5UDSU/AACAP1Wxvj3kamC87DYLPfSuMD0tvVG/ANSeuITBaz7bEzI+AACAP5dMjj8AgF42QlxbP7HS+zwAAIA/KZ1qPj5HbT4dlXU+v0aCPuYhjj7TUqA++La8PkLh7T5h0SY/AACAP4L+gj2d7KI7+D1mvHY8Nj3AbDy/OEsoPkDDcL3dt3+/AAAAAB26jT/M2qm+4jdZPzC6qT4AAIA/lw9sPjfrbj6ShXc+Hn+DPh7Ljz6PZaM+sQXEPtT0/j6Fxi0/AACAP7W/Kj5I7YQ9DJsTPYU44byRuo8/eLYMvvafTz8AAIC/AAAAALl4UL8e5oi/WIm0PcmcIj8AAIA/aUKFPtXFhj5RfYs+Ff6TPnsqoT7wrrU+DNTYPgRbCT/hVTk/AACAP210S74hahy9tmTAvZfGvb2Gd4++L9TRPgtWbz8AAAAAAAAAAG57Jj9HQaQ/qJ1GPwAAgL8AAAAA9pDoPhg16z5pcPM+qyMBP1bkDD+e7B4/UxE7P5mzaT8AAIA/AACAPzEroz07oOq82P3EPHj3Ar2x41K/AABAM+g2dz4CAIA/AAAAAD1wkD8w+Ps+Qo5sPwAAAAAAAIA/qRdtPvPIbz5HLXg+EqeDPkqijz5k76A+r8O5PlC44T6cdyA/AACAP8VD/T3m9fU7w6yYvEHqCLk6OE6/ZnWXPaT9jb4RCxa+AAAAANhRiD/WPTm/CMR8PwAAgD8AAIA/O9BnPjrnaD56O24+fk15Pjkihj6HI5U+lIuuPnfj2T4j0Rg/AACAP8gmvD2j9Xm7OqM7PSmmvb0Q0U6/AADAsuCUkj5QuRS+AACAP4wZkD8AAAAAUhxCP/z/f78AAAAAS4R5PrRZfD5Ol4I+No2KPikplz7mgao+uLPIPnEL+T5Ebiw/AACAP5SMBW51bXB5lIwFZHR5cGWUk5SMAmY0lImIh5RSlChLA4wBPJROTk5K/////0r/////SwB0lGJLEEsYhpSMAUOUdJRSlC4="
|
| 35 |
},
|
| 36 |
"_last_episode_starts": {
|
| 37 |
":type:": "<class 'numpy.ndarray'>",
|
|
|
|
| 41 |
"_episode_num": 0,
|
| 42 |
"use_sde": false,
|
| 43 |
"sde_sample_freq": -1,
|
| 44 |
+
"_current_progress_remaining": -0.040000000000000036,
|
| 45 |
"_stats_window_size": 100,
|
| 46 |
"ep_info_buffer": {
|
| 47 |
":type:": "<class 'collections.deque'>",
|
| 48 |
+
":serialized:": "gAWVAQwAAAAAAACMC2NvbGxlY3Rpb25zlIwFZGVxdWWUk5QpS2SGlFKUKH2UKIwBcpRHwF24MBp5/sqMAWyUS1iMAXSUR0Btyv7+DOC5dX2UKGgGR8BaevKdQO4HaAdLOWgIR0Bt24V/MGHIdX2UKGgGR8Ba06MNtqHoaAdLS2gIR0BuM2gOBlMAdX2UKGgGR8BcJc4T9KmLaAdLR2gIR0BuTNjEvTPTdX2UKGgGR8BhJ5NwiqyXaAdLo2gIR0Buc/lOoHcDdX2UKGgGR8Bcl9L127nQaAdLNGgIR0Bufvcxj8UFdX2UKGgGR8BbUWpVCHARaAdLPmgIR0BujQAEMb3odX2UKGgGR8BdfvRqoIfKaAdLV2gIR0BuoSynk1dgdX2UKGgGR8BZd4TfzjFRaAdNQAZoCEdAbtwzMzMzM3V9lChoBkfAX1hOIqLCN2gHS1ZoCEdAbt3QcghbGHV9lChoBkfAWy3yd4FA3WgHSzhoCEdAbupeVLSNO3V9lChoBkfAWYU5R0lqrWgHS0FoCEdAbusIxgy/K3V9lChoBkfAXBYG+sYEXGgHS0doCEdAbvqBU70WdnV9lChoBkfAXDxZ+x4Y8GgHS1BoCEdAbvwP7N0NjXV9lChoBkfAWcVMURFqjGgHTUAGaAhHQG8CvwEyLyd1fZQoaAZHwFnrKq4pc5doB01ABmgIR0BvApgogFHKdX2UKGgGR8Bb2C+cpb2UaAdNQAZoCEdAbwK2gFotc3V9lChoBkfAWMz7ALy+YmgHTUAGaAhHQG8Cwpe/pMZ1fZQoaAZHwFtQXeWOZLJoB01ABmgIR0BvAtPxhDw6dX2UKGgGR8BaHWsA/9pAaAdLN2gIR0BvCDHyVfNSdX2UKGgGR8BXUlZDArQPaAdNQAZoCEdAbxOSpR4yGnV9lChoBkfAWuNN7BwdbWgHS0doCEdAbxNVIZqEe3V9lChoBkfAWNWOPvKEFmgHTUAGaAhHQG8Teb/ffoB1fZQoaAZHwFlT3RG+bmVoB0tIaAhHQG8Ub961LJ11fZQoaAZHwF5LImw7kn1oB0tJaAhHQG8URe1KGtZ1fZQoaAZHwFn5uMdcSoRoB0tOaAhHQG8V/zJ6po91fZQoaAZHwFv4pY9xIatoB0thaAhHQG8aE6DGtIV1fZQoaAZHwFyR/LDAJsxoB0uOaAhHQG8cFev6j351fZQoaAZHwFromfGuLaVoB0tkaAhHQG8gZc1O0sx1fZQoaAZHwFy3Btk4FRpoB0s3aAhHQG8mGSpzcRF1fZQoaAZHwF4d8eS0Sh9oB0tzaAhHQG8t62WpqAV1fZQoaAZHwFn+KzRhMJxoB01ABmgIR0BvMTbi6xxDdX2UKGgGR8BbctugpSaWaAdNQAZoCEdAbzKenyd4FHV9lChoBkfAWWphDw6QvGgHSz9oCEdAbzVND+irUHV9lChoBkfAW4K3WnTAnGgHS1hoCEdAb0KtUXHim3V9lChoBkfAXCxgWrOqvWgHS05oCEdAb0Pc+qzZ6HV9lChoBkfAWaBkH2RJVmgHTUAGaAhHQG9FqTr3TNN1fZQoaAZHwGHAtQbdadNoB0v0aAhHQG93yXUpd8l1fZQoaAZHwFi9QJ5VwP1oB01ABmgIR0BveBzHS4OMdX2UKGgGR8BcAvsRg7YDaAdLNWgIR0Bvfa5LAYYSdX2UKGgGR8BcknF98Z1naAdLS2gIR0BvgCgZjx0/dX2UKGgGR8BZIBMWXTmXaAdLWGgIR0BvhApjMFEBdX2UKGgGR8BcmP7WNFSbaAdLUmgIR0BviwYLsruqdX2UKGgGR8BcorhvR7Z4aAdLMWgIR0Bvi5YmsvIwdX2UKGgGR8BYzWoJiRW+aAdNQAZoCEdAb5E8EFGG23V9lChoBkfAWUpK02LpA2gHS1loCEdAb5NaIvalDXV9lChoBkfAWfnaTOgQH2gHS0BoCEdAb50jcEeQuHV9lChoBkfAWcCtJWeYlmgHS09oCEdAb6MREF4cFXV9lChoBkfAWNHlp48lomgHTUAGaAhHQG+kTxXnyNJ1fZQoaAZHwFoYRChN/ONoB0t+aAhHQG+o/p2U0N11fZQoaAZHwFsGBi1AqutoB01ABmgIR0Bvsz850bLmdX2UKGgGR8BcWZ8jRlYmaAdLOWgIR0BvxkebNKRMdX2UKGgGR8BeVdUKiO/+aAdLZ2gIR0BvzQRGtp22dX2UKGgGR8Be72g3974SaAdLe2gIR0Bv0CrtE5QxdX2UKGgGR8Bb+USqU/wBaAdLOWgIR0Bv4kZJkGzKdX2UKGgGR8BZS0AggX/HaAdLWGgIR0Bv5zWPLgXNdX2UKGgGR8BbdoiX6ZYxaAdLU2gIR0Bv7acslLOBdX2UKGgGR8BbKbhaTwDvaAdLNmgIR0Bv+atHQQcxdX2UKGgGR8BaYZzLfUF0aAdLUmgIR0BwBM4PwuuidX2UKGgGR8Bb2OLR8c+8aAdNQAZoCEdAcJSvEjxCpnV9lChoBkfAV/n/xUedTmgHTUAGaAhHQHCU8UEgW8B1fZQoaAZHwFiJJF9a2WpoB01ABmgIR0BwlN6AvtdBdX2UKGgGR8BZyZKODJ2daAdNQAZoCEdAcJWmXgLqlnV9lChoBkfAWizJvHcUNGgHTUAGaAhHQHCY1LvkRz11fZQoaAZHwFkaCFsYVItoB01ABmgIR0Bwmy+fywwCdX2UKGgGR8BaSLyUcGTtaAdLRWgIR0BwnQu8K5TZdX2UKGgGR8Bal8kdFOO9aAdLL2gIR0BwnhQsPJ7tdX2UKGgGR8BfY2yHEdeZaAdLU2gIR0BwnwyN4qwydX2UKGgGR8BZQ8PBi1AraAdLLWgIR0BwofZ+QU5/dX2UKGgGR8Bbc0n5SFXaaAdNQAZoCEdAcLtbmEGqxXV9lChoBkfAWidowmE5AGgHSy9oCEdAcLwajN6gNHV9lChoBkfAWGRWJaaCtmgHTUAGaAhHQHC9VHSWqtJ1fZQoaAZHwFmA287IT5BoB0tdaAhHQHC90xASnLt1fZQoaAZHwFlPKkVN5+poB0tWaAhHQHDBSprDZUV1fZQoaAZHwFyuXhfjS5RoB0tIaAhHQHDFTAeq7yx1fZQoaAZHwFlm8scyWRloB0s4aAhHQHDMDch1Tzd1fZQoaAZHwFnZMqz7di5oB0tmaAhHQHDOqqXF98Z1fZQoaAZHwFgRsMRYigVoB01ABmgIR0Bw0DiT+vQodX2UKGgGR8BfNTeTFERbaAdLZWgIR0Bw0KBEroW6dX2UKGgGR8BaaAam4y44aAdLLGgIR0Bw2GafBeoldX2UKGgGR8BW/T101ZTyaAdNQAZoCEdAcOKNlRP423V9lChoBkfAWv2RLbpNbmgHTUAGaAhHQHDkDGYKIBR1fZQoaAZHwF0RCaqjrRloB01ABmgIR0Bw6f8/D+BIdX2UKGgGR8BXqFqagElmaAdNQAZoCEdAcO1PdVNpNHV9lChoBkfAWgIhGH58B2gHSzloCEdAcO7a1Cw8n3V9lChoBkfAXHzXiBGx2WgHSz9oCEdAcPNqqfe1r3V9lChoBkfAWyzbi6xxDWgHSzBoCEdAcPSxYJVsDXV9lChoBkfAXNqdvsJID2gHS0loCEdAcPchUBGQS3V9lChoBkfAWcLD50r9VGgHS1hoCEdAcP98ejmCAnV9lChoBkfAXSUqmTC+DmgHS0xoCEdAcQBFXq7iAHV9lChoBkfAVyVfgJkXlGgHTUAGaAhHQHEDlcY64lR1fZQoaAZHwFanqYJE6T5oB01ABmgIR0BxH1C2MKkVdX2UKGgGR8BfBPmcOLBLaAdLb2gIR0BxI7bJwKjSdX2UKGgGR8BaS91hb4ahaAdNQAZoCEdAcSQvLowEhnV9lChoBkfAXVCF+NLlFWgHS0BoCEdAcSYDGLk0anV9lChoBkfAWjyHvc8DCGgHS0JoCEdAcSrBacI7eXV9lChoBkfAWuFhG6PKdWgHS1toCEdAcTUJu2qkunV9lChoBkfAWzYk8ifQKWgHSy5oCEdAcTqz90ihWnV9lChoBkfAWC825xzaK2gHTUAGaAhHQHGvNWQwK0F1fZQoaAZHwFm8e4kNWlxoB01ABmgIR0Bxr43WFvhqdWUu"
|
| 49 |
},
|
| 50 |
"ep_success_buffer": {
|
| 51 |
":type:": "<class 'collections.deque'>",
|
| 52 |
":serialized:": "gAWVIAAAAAAAAACMC2NvbGxlY3Rpb25zlIwFZGVxdWWUk5QpS2SGlFKULg=="
|
| 53 |
},
|
| 54 |
+
"_n_updates": 52,
|
| 55 |
"observation_space": {
|
| 56 |
":type:": "<class 'gymnasium.spaces.box.Box'>",
|
| 57 |
":serialized:": "gAWVTAQAAAAAAACMFGd5bW5hc2l1bS5zcGFjZXMuYm94lIwDQm94lJOUKYGUfZQojAVkdHlwZZSMBW51bXB5lIwFZHR5cGWUk5SMAmY0lImIh5RSlChLA4wBPJROTk5K/////0r/////SwB0lGKMDWJvdW5kZWRfYmVsb3eUjBJudW1weS5jb3JlLm51bWVyaWOUjAtfZnJvbWJ1ZmZlcpSTlCiWGAAAAAAAAAABAQEBAQEBAQEBAQEBAQEBAQEBAQEBAQGUaAiMAmIxlImIh5RSlChLA4wBfJROTk5K/////0r/////SwB0lGJLGIWUjAFDlHSUUpSMDWJvdW5kZWRfYWJvdmWUaBEolhgAAAAAAAAAAQEBAQEBAQEBAQEBAQEBAQEBAQEBAQEBlGgVSxiFlGgZdJRSlIwGX3NoYXBllEsYhZSMA2xvd5RoESiWYAAAAAAAAADbD0nAAACgwAAAoMAAAKDA2w9JwAAAoMDbD0nAAACgwAAAAIDbD0nAAACgwNsPScAAAKDAAAAAgAAAgL8AAIC/AACAvwAAgL8AAIC/AACAvwAAgL8AAIC/AACAvwAAgL+UaAtLGIWUaBl0lFKUjARoaWdolGgRKJZgAAAAAAAAANsPSUAAAKBAAACgQAAAoEDbD0lAAACgQNsPSUAAAKBAAACgQNsPSUAAAKBA2w9JQAAAoEAAAKBAAACAPwAAgD8AAIA/AACAPwAAgD8AAIA/AACAPwAAgD8AAIA/AACAP5RoC0sYhZRoGXSUUpSMCGxvd19yZXBylIz+Wy0zLjE0MTU5MjcgLTUuICAgICAgICAtNS4gICAgICAgIC01LiAgICAgICAgLTMuMTQxNTkyNyAtNS4KIC0zLjE0MTU5MjcgLTUuICAgICAgICAtMC4gICAgICAgIC0zLjE0MTU5MjcgLTUuICAgICAgICAtMy4xNDE1OTI3CiAtNS4gICAgICAgIC0wLiAgICAgICAgLTEuICAgICAgICAtMS4gICAgICAgIC0xLiAgICAgICAgLTEuCiAtMS4gICAgICAgIC0xLiAgICAgICAgLTEuICAgICAgICAtMS4gICAgICAgIC0xLiAgICAgICAgLTEuICAgICAgIF2UjAloaWdoX3JlcHKUjOZbMy4xNDE1OTI3IDUuICAgICAgICA1LiAgICAgICAgNS4gICAgICAgIDMuMTQxNTkyNyA1LiAgICAgICAgMy4xNDE1OTI3CiA1LiAgICAgICAgNS4gICAgICAgIDMuMTQxNTkyNyA1LiAgICAgICAgMy4xNDE1OTI3IDUuICAgICAgICA1LgogMS4gICAgICAgIDEuICAgICAgICAxLiAgICAgICAgMS4gICAgICAgIDEuICAgICAgICAxLiAgICAgICAgMS4KIDEuICAgICAgICAxLiAgICAgICAgMS4gICAgICAgXZSMCl9ucF9yYW5kb22UTnViLg==",
|
|
|
|
| 83 |
"_np_random": null
|
| 84 |
},
|
| 85 |
"n_envs": 16,
|
| 86 |
+
"n_steps": 500,
|
| 87 |
"gamma": 0.999,
|
| 88 |
"gae_lambda": 0.98,
|
| 89 |
"ent_coef": 0.01,
|
BipedalWalker-v3/policy.optimizer.pth
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 105121
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:fe480b1affd3f12c7bdbfa38d90e0efaa46541ee8bdb46a0ccd1a14548f3760f
|
| 3 |
size 105121
|
BipedalWalker-v3/policy.pth
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 52143
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:2cd9fbe0b5642c693800623b3c04934011be739d37d15f644055770befea5a76
|
| 3 |
size 52143
|
README.md
CHANGED
|
@@ -16,7 +16,7 @@ model-index:
|
|
| 16 |
type: BipedalWalker-v3
|
| 17 |
metrics:
|
| 18 |
- type: mean_reward
|
| 19 |
-
value: -
|
| 20 |
name: mean_reward
|
| 21 |
verified: false
|
| 22 |
---
|
|
|
|
| 16 |
type: BipedalWalker-v3
|
| 17 |
metrics:
|
| 18 |
- type: mean_reward
|
| 19 |
+
value: -56.38 +/- 0.22
|
| 20 |
name: mean_reward
|
| 21 |
verified: false
|
| 22 |
---
|
config.json
CHANGED
|
@@ -1 +1 @@
|
|
| 1 |
-
{"policy_class": {":type:": "<class 'abc.ABCMeta'>", ":serialized:": "gAWVOwAAAAAAAACMIXN0YWJsZV9iYXNlbGluZXMzLmNvbW1vbi5wb2xpY2llc5SMEUFjdG9yQ3JpdGljUG9saWN5lJOULg==", "__module__": "stable_baselines3.common.policies", "__doc__": "\n Policy class for actor-critic algorithms (has both policy and value prediction).\n Used by A2C, PPO and the likes.\n\n :param observation_space: Observation space\n :param action_space: Action space\n :param lr_schedule: Learning rate schedule (could be constant)\n :param net_arch: The specification of the policy and value networks.\n :param activation_fn: Activation function\n :param ortho_init: Whether to use or not orthogonal initialization\n :param use_sde: Whether to use State Dependent Exploration or not\n :param log_std_init: Initial value for the log standard deviation\n :param full_std: Whether to use (n_features x n_actions) parameters\n for the std instead of only (n_features,) when using gSDE\n :param use_expln: Use ``expln()`` function instead of ``exp()`` to ensure\n a positive standard deviation (cf paper). It allows to keep variance\n above zero and prevent it from growing too fast. In practice, ``exp()`` is usually enough.\n :param squash_output: Whether to squash the output using a tanh function,\n this allows to ensure boundaries when using gSDE.\n :param features_extractor_class: Features extractor to use.\n :param features_extractor_kwargs: Keyword arguments\n to pass to the features extractor.\n :param share_features_extractor: If True, the features extractor is shared between the policy and value networks.\n :param normalize_images: Whether to normalize images or not,\n dividing by 255.0 (True by default)\n :param optimizer_class: The optimizer to use,\n ``th.optim.Adam`` by default\n :param optimizer_kwargs: Additional keyword arguments,\n excluding the learning rate, to pass to the optimizer\n ", "__init__": "<function ActorCriticPolicy.__init__ at 0x783b7dbb27a0>", "_get_constructor_parameters": "<function ActorCriticPolicy._get_constructor_parameters at 0x783b7dbb2830>", "reset_noise": "<function ActorCriticPolicy.reset_noise at 0x783b7dbb28c0>", "_build_mlp_extractor": "<function ActorCriticPolicy._build_mlp_extractor at 0x783b7dbb2950>", "_build": "<function ActorCriticPolicy._build at 0x783b7dbb29e0>", "forward": "<function ActorCriticPolicy.forward at 0x783b7dbb2a70>", "extract_features": "<function ActorCriticPolicy.extract_features at 0x783b7dbb2b00>", "_get_action_dist_from_latent": "<function ActorCriticPolicy._get_action_dist_from_latent at 0x783b7dbb2b90>", "_predict": "<function ActorCriticPolicy._predict at 0x783b7dbb2c20>", "evaluate_actions": "<function ActorCriticPolicy.evaluate_actions at 0x783b7dbb2cb0>", "get_distribution": "<function ActorCriticPolicy.get_distribution at 0x783b7dbb2d40>", "predict_values": "<function ActorCriticPolicy.predict_values at 0x783b7dbb2dd0>", "__abstractmethods__": "frozenset()", "_abc_impl": "<_abc._abc_data object at 0x783b7db57600>"}, "verbose": 1, "policy_kwargs": {}, "num_timesteps": 4800, "_total_timesteps": 2000, "_num_timesteps_at_start": 0, "seed": null, "action_noise": null, "start_time": 1714022747756011012, "learning_rate": 0.0003, "tensorboard_log": null, "_last_obs": {":type:": "<class 'numpy.ndarray'>", ":serialized:": "gAWVdQYAAAAAAACMEm51bXB5LmNvcmUubnVtZXJpY5SMC19mcm9tYnVmZmVylJOUKJYABgAAAAAAAJfx1T0yGOw6RPSNvXNMwrztv40/yB5tP6YuTD/9/3+/AACAPyio775VwQ+/LE6svv3/fz8AAAAAuySQPsvHkT7m4ZY+dRSgPvilrj5GAMU+KePnPt7YED+K5UY/AACAP9pWkj6E//i8kj8nPUEONbwRhVa/QDIdOwA1X764fn8/AACAPxpflT88IYA/Ui4yP1XXf78AAAAAOR58PjL7fj7W84M+/f6LPpe8mD73SKw+XsvKPktZ/T5a8S0/AACAP/2niT8WpqC9L8NePRYJ1Dyr42c+HrGnPvB/Cb4A+2W8AACAP5sRSb82WeU+YNgiv8W84rsAAIA/SFybPvUfnT6zn6I+fImsPjk9vD7TVNQ+su75PnAeHD/bX1Y/AACAP+KZij5DS2w9jmmHvKi3KjzfL4U/Hby3vljLLD+UYE+9AACAP+ymV7+cSQO/+m0mvwEAgL8AAAAAmI2DPg4MhT4UtIk++RiSPrpknz41y7M+BKLTPv8xBD8XhjU/AACAPxHApD/Akd492si4PCgoC7od4le+4MLKvSihMr/9/3+/AAAAAL3bV78AAIC/TIkiv5Xjvj4AAAAAox6oPmgHqj7D+q8+97S6PtWyyz71xOU+rzoHP73wKD+pVWg/AACAP4RRwT4Pvow9Vrb9Ozov7jrDxD0+gDVeuzAVOT77/38/AAAAANuAEr9QpVu/HVZvPwAAAAAAAAAAd2DyPh4h9T5Vtf0+QZYGP9jVEj/boCU/fPVCP12Pcz8AAIA/AACAPzs3kD42UZW7lHLpvNvR2jzv0YI/bE47Pdr7OD8BAIC/AAAAAN8MT796YT4+IIaRvp0lWr4AAAAAm4CEPtMBhj5zsoo+2iaTPiuLoD5VF7U+9SjVPjImBT9p1TY/AACAPxBbjz9OXFg9LwSWvX2csDzG8Ls9/P9/vz5DC7+0WOE+AAAAABzo3r7vdrG+zIocv8kW+D0AAIA/E7uqPm+rrD5ztrI+Tpu9Prvczj6DVuk+WlQJP3CQKz9JlWs/AACAP+UlrD521fy6bI+QvEEUj72Cf5A/BOJSP5w5ND8AAIC/AAAAANlmT78AAAAAPOsBv/j/fz8AAAAA9lCGPnTXhz6EmIw+jCqVPsu9oj74kbc++hPYPtH4Bj/mFDY/AACAP2tNKz74gRs8eyEMvQTcNzy9G1e/AAqKOYBlsTuJAIC/AAAAAKTcgD8MHKC90GBvP1UN7DgAAIA/3xhpPou+az6s/nM+I2+BPqs2jT59SZ8+pX67Piw86j7b0SA/AACAP24v9b7XoAW9GvYGPn1+N71JZ+M+AgCAP4Bwyb6P16W/AAAAABbjSD/kfVK+jt0rv/3/f78AAIA/TJ6vPt6csT4s1Lc+3QjDPr/I1D6PBPA+yUINP8V5MD8GIHI/AACAPzXP4D2EuMo9OaMePNvCWjyoCVK/AACAs7DT+T0AAIC/AAAAAAwukT8AAAAAjmFDPxl5ab8AAIA/iT9uPi/0cD78Ynk+XUuEPolVkD6azqI+VKO/PkZp7z6jXyQ/AACAP7z4gD40zne8YZtmPWWflLxShos/zZipvZzJVj+tAIA/AAAAAHKgVb8AABw1APQ6vZS9ej0AAIA/IAqCPi+Egz5+Hog+qmqQPkKPnT6nubE+rzLRPqOsAj9xbzM/AACAP/mGoT4kxgu99x4JvWigmzxi8Y4/AACAsnR6nD77/38/AACAP9YyQr/27fY9gGZfvv3/fz8AAAAAB3GLPmwGjT7s9ZE+rNuaPojzqD4rk74+u1LgPkofDD+caEA/AACAP6sNuD9MZ9g8FIEEPCVUWDujOFy/8Gp1v07QGL8AAAAAAACAPx5igD7Jpz++yIwivwAAgLEAAAAAjjCiPhUIpD61xak+DB+0PnuDxD4xqt0+mHUCPz77Ij83zF8/AACAPxoEQT3xaqu8aYQmPr29GLyjqgq//xKPvnCHm76jDYA/AAAAAIfadL4k9MI8qrEOv4DVf78AAIA/wvKQPimYkj6PuZc+Q/mgPpmfrz7aGcY+mi7pPuenET/UAUg/AACAP5SMBW51bXB5lIwFZHR5cGWUk5SMAmY0lImIh5RSlChLA4wBPJROTk5K/////0r/////SwB0lGJLEEsYhpSMAUOUdJRSlC4="}, "_last_episode_starts": {":type:": "<class 'numpy.ndarray'>", ":serialized:": "gAWVgwAAAAAAAACMEm51bXB5LmNvcmUubnVtZXJpY5SMC19mcm9tYnVmZmVylJOUKJYQAAAAAAAAAAAAAAAAAAAAAAAAAAAAAACUjAVudW1weZSMBWR0eXBllJOUjAJiMZSJiIeUUpQoSwOMAXyUTk5OSv////9K/////0sAdJRiSxCFlIwBQ5R0lFKULg=="}, "_last_original_obs": null, "_episode_num": 0, "use_sde": false, "sde_sample_freq": -1, "_current_progress_remaining": -1.4, "_stats_window_size": 100, "ep_info_buffer": {":type:": "<class 'collections.deque'>", ":serialized:": "gAWV+AIAAAAAAACMC2NvbGxlY3Rpb25zlIwFZGVxdWWUk5QpS2SGlFKUKH2UKIwBcpRHwFtsxpcophGMAWyUSzCMAXSUR0AVHjrAxi5NdX2UKGgGR8BcyqAnUlRhaAdLM2gIR0AVOGetjkMkdX2UKGgGR8BdgXX7Lt/naAdLP2gIR0AVfcIqslsxdX2UKGgGR8BZnbzkIX0oaAdLQWgIR0AVk7fYSQHSdX2UKGgGR8BaxrhegL7XaAdLQ2gIR0AVp5HEuQIVdX2UKGgGR8BdnFO9FnZkaAdLRGgIR0AVqneizsyBdX2UKGgGR8BanrpRoAXEaAdLRmgIR0AVu9g4OtnxdX2UKGgGR8BZtIQSSNfgaAdLVGgIR0AWDZcs189fdX2UKGgGR8BZwIkqtozvaAdLN2gIR0AWfrJKaodddX2UKGgGR8Bb1nFglWwNaAdLPGgIR0AWtBJI1+AmdX2UKGgGR8BbrTv/io87aAdLNGgIR0AWzTkQwsXjdX2UKGgGR8BcvF5WzWwvaAdLemgIR0AW/guRLbpNdX2UKGgGR8Bb4Cr5qM3qaAdLPWgIR0AXLEFW4mTldX2UKGgGR8BbLQc94eLfaAdLQGgIR0AXNg1FYuCgdX2UKGgGR8BfLF5v99+gaAdLYmgIR0AYAre67NB4dX2UKGgGR8BcWyWmgrYoaAdLOGgIR0AYYXVLBbfQdX2UKGgGR8BaszMA3kxRaAdLRmgIR0AYdfLLZBcBdX2UKGgGR8BZn/va11GLaAdLXmgIR0AY2kFfReC1dX2UKGgGR8BfNT7ZWaMKaAdLeGgIR0AZBPVNHpbEdX2UKGgGR8BbjXRkVeruaAdLK2gIR0AZfzbvgFX8dX2UKGgGR8BaJRPj4pMIaAdLSGgIR0AZygSOBDohdX2UKGgGR8BcKyntOVPfaAdLOWgIR0AaMxzq8lHCdX2UKGgGR8Ba8uDe0ojOaAdLOGgIR0AaWasp5NXYdX2UKGgGR8BZG5JwsGxEaAdLQWgIR0AbDl+3H7xedWUu"}, "ep_success_buffer": {":type:": "<class 'collections.deque'>", ":serialized:": "gAWVIAAAAAAAAACMC2NvbGxlY3Rpb25zlIwFZGVxdWWUk5QpS2SGlFKULg=="}, "_n_updates": 4, "observation_space": {":type:": "<class 'gymnasium.spaces.box.Box'>", ":serialized:": "gAWVTAQAAAAAAACMFGd5bW5hc2l1bS5zcGFjZXMuYm94lIwDQm94lJOUKYGUfZQojAVkdHlwZZSMBW51bXB5lIwFZHR5cGWUk5SMAmY0lImIh5RSlChLA4wBPJROTk5K/////0r/////SwB0lGKMDWJvdW5kZWRfYmVsb3eUjBJudW1weS5jb3JlLm51bWVyaWOUjAtfZnJvbWJ1ZmZlcpSTlCiWGAAAAAAAAAABAQEBAQEBAQEBAQEBAQEBAQEBAQEBAQGUaAiMAmIxlImIh5RSlChLA4wBfJROTk5K/////0r/////SwB0lGJLGIWUjAFDlHSUUpSMDWJvdW5kZWRfYWJvdmWUaBEolhgAAAAAAAAAAQEBAQEBAQEBAQEBAQEBAQEBAQEBAQEBlGgVSxiFlGgZdJRSlIwGX3NoYXBllEsYhZSMA2xvd5RoESiWYAAAAAAAAADbD0nAAACgwAAAoMAAAKDA2w9JwAAAoMDbD0nAAACgwAAAAIDbD0nAAACgwNsPScAAAKDAAAAAgAAAgL8AAIC/AACAvwAAgL8AAIC/AACAvwAAgL8AAIC/AACAvwAAgL+UaAtLGIWUaBl0lFKUjARoaWdolGgRKJZgAAAAAAAAANsPSUAAAKBAAACgQAAAoEDbD0lAAACgQNsPSUAAAKBAAACgQNsPSUAAAKBA2w9JQAAAoEAAAKBAAACAPwAAgD8AAIA/AACAPwAAgD8AAIA/AACAPwAAgD8AAIA/AACAP5RoC0sYhZRoGXSUUpSMCGxvd19yZXBylIz+Wy0zLjE0MTU5MjcgLTUuICAgICAgICAtNS4gICAgICAgIC01LiAgICAgICAgLTMuMTQxNTkyNyAtNS4KIC0zLjE0MTU5MjcgLTUuICAgICAgICAtMC4gICAgICAgIC0zLjE0MTU5MjcgLTUuICAgICAgICAtMy4xNDE1OTI3CiAtNS4gICAgICAgIC0wLiAgICAgICAgLTEuICAgICAgICAtMS4gICAgICAgIC0xLiAgICAgICAgLTEuCiAtMS4gICAgICAgIC0xLiAgICAgICAgLTEuICAgICAgICAtMS4gICAgICAgIC0xLiAgICAgICAgLTEuICAgICAgIF2UjAloaWdoX3JlcHKUjOZbMy4xNDE1OTI3IDUuICAgICAgICA1LiAgICAgICAgNS4gICAgICAgIDMuMTQxNTkyNyA1LiAgICAgICAgMy4xNDE1OTI3CiA1LiAgICAgICAgNS4gICAgICAgIDMuMTQxNTkyNyA1LiAgICAgICAgMy4xNDE1OTI3IDUuICAgICAgICA1LgogMS4gICAgICAgIDEuICAgICAgICAxLiAgICAgICAgMS4gICAgICAgIDEuICAgICAgICAxLiAgICAgICAgMS4KIDEuICAgICAgICAxLiAgICAgICAgMS4gICAgICAgXZSMCl9ucF9yYW5kb22UTnViLg==", "dtype": "float32", "bounded_below": "[ True True True True True True True True True True True True\n True True True True True True True True True True True True]", "bounded_above": "[ True True True True True True True True True True True True\n True True True True True True True True True True True True]", "_shape": [24], "low": "[-3.1415927 -5. -5. -5. -3.1415927 -5.\n -3.1415927 -5. -0. -3.1415927 -5. -3.1415927\n -5. -0. -1. -1. -1. -1.\n -1. -1. -1. -1. -1. -1. ]", "high": "[3.1415927 5. 5. 5. 3.1415927 5. 3.1415927\n 5. 5. 3.1415927 5. 3.1415927 5. 5.\n 1. 1. 1. 1. 1. 1. 1.\n 1. 1. 1. ]", "low_repr": "[-3.1415927 -5. -5. -5. -3.1415927 -5.\n -3.1415927 -5. -0. -3.1415927 -5. -3.1415927\n -5. -0. -1. -1. -1. -1.\n -1. -1. -1. -1. -1. -1. ]", "high_repr": "[3.1415927 5. 5. 5. 3.1415927 5. 3.1415927\n 5. 5. 3.1415927 5. 3.1415927 5. 5.\n 1. 1. 1. 1. 1. 1. 1.\n 1. 1. 1. ]", "_np_random": null}, "action_space": {":type:": "<class 'gymnasium.spaces.box.Box'>", ":serialized:": "gAWVpwEAAAAAAACMFGd5bW5hc2l1bS5zcGFjZXMuYm94lIwDQm94lJOUKYGUfZQojAVkdHlwZZSMBW51bXB5lIwFZHR5cGWUk5SMAmY0lImIh5RSlChLA4wBPJROTk5K/////0r/////SwB0lGKMDWJvdW5kZWRfYmVsb3eUjBJudW1weS5jb3JlLm51bWVyaWOUjAtfZnJvbWJ1ZmZlcpSTlCiWBAAAAAAAAAABAQEBlGgIjAJiMZSJiIeUUpQoSwOMAXyUTk5OSv////9K/////0sAdJRiSwSFlIwBQ5R0lFKUjA1ib3VuZGVkX2Fib3ZllGgRKJYEAAAAAAAAAAEBAQGUaBVLBIWUaBl0lFKUjAZfc2hhcGWUSwSFlIwDbG93lGgRKJYQAAAAAAAAAAAAgL8AAIC/AACAvwAAgL+UaAtLBIWUaBl0lFKUjARoaWdolGgRKJYQAAAAAAAAAAAAgD8AAIA/AACAPwAAgD+UaAtLBIWUaBl0lFKUjAhsb3dfcmVwcpSMBC0xLjCUjAloaWdoX3JlcHKUjAMxLjCUjApfbnBfcmFuZG9tlE51Yi4=", "dtype": "float32", "bounded_below": "[ True True True True]", "bounded_above": "[ True True True True]", "_shape": [4], "low": "[-1. -1. -1. -1.]", "high": "[1. 1. 1. 1.]", "low_repr": "-1.0", "high_repr": "1.0", "_np_random": null}, "n_envs": 16, "n_steps": 300, "gamma": 0.999, "gae_lambda": 0.98, "ent_coef": 0.01, "vf_coef": 0.5, "max_grad_norm": 0.5, "batch_size": 128, "n_epochs": 4, "clip_range": {":type:": "<class 'function'>", ":serialized:": "gAWVxQIAAAAAAACMF2Nsb3VkcGlja2xlLmNsb3VkcGlja2xllIwOX21ha2VfZnVuY3Rpb26Uk5QoaACMDV9idWlsdGluX3R5cGWUk5SMCENvZGVUeXBllIWUUpQoSwFLAEsASwFLAUsTQwSIAFMAlE6FlCmMAV+UhZSMSS91c3IvbG9jYWwvbGliL3B5dGhvbjMuMTAvZGlzdC1wYWNrYWdlcy9zdGFibGVfYmFzZWxpbmVzMy9jb21tb24vdXRpbHMucHmUjARmdW5jlEuEQwIEAZSMA3ZhbJSFlCl0lFKUfZQojAtfX3BhY2thZ2VfX5SMGHN0YWJsZV9iYXNlbGluZXMzLmNvbW1vbpSMCF9fbmFtZV9flIwec3RhYmxlX2Jhc2VsaW5lczMuY29tbW9uLnV0aWxzlIwIX19maWxlX1+UjEkvdXNyL2xvY2FsL2xpYi9weXRob24zLjEwL2Rpc3QtcGFja2FnZXMvc3RhYmxlX2Jhc2VsaW5lczMvY29tbW9uL3V0aWxzLnB5lHVOTmgAjBBfbWFrZV9lbXB0eV9jZWxslJOUKVKUhZR0lFKUjBxjbG91ZHBpY2tsZS5jbG91ZHBpY2tsZV9mYXN0lIwSX2Z1bmN0aW9uX3NldHN0YXRllJOUaB99lH2UKGgWaA2MDF9fcXVhbG5hbWVfX5SMGWNvbnN0YW50X2ZuLjxsb2NhbHM+LmZ1bmOUjA9fX2Fubm90YXRpb25zX1+UfZSMDl9fa3dkZWZhdWx0c19flE6MDF9fZGVmYXVsdHNfX5ROjApfX21vZHVsZV9flGgXjAdfX2RvY19flE6MC19fY2xvc3VyZV9flGgAjApfbWFrZV9jZWxslJOURz/JmZmZmZmahZRSlIWUjBdfY2xvdWRwaWNrbGVfc3VibW9kdWxlc5RdlIwLX19nbG9iYWxzX1+UfZR1hpSGUjAu"}, "clip_range_vf": null, "normalize_advantage": true, "target_kl": null, "lr_schedule": {":type:": "<class 'function'>", ":serialized:": "gAWVxQIAAAAAAACMF2Nsb3VkcGlja2xlLmNsb3VkcGlja2xllIwOX21ha2VfZnVuY3Rpb26Uk5QoaACMDV9idWlsdGluX3R5cGWUk5SMCENvZGVUeXBllIWUUpQoSwFLAEsASwFLAUsTQwSIAFMAlE6FlCmMAV+UhZSMSS91c3IvbG9jYWwvbGliL3B5dGhvbjMuMTAvZGlzdC1wYWNrYWdlcy9zdGFibGVfYmFzZWxpbmVzMy9jb21tb24vdXRpbHMucHmUjARmdW5jlEuEQwIEAZSMA3ZhbJSFlCl0lFKUfZQojAtfX3BhY2thZ2VfX5SMGHN0YWJsZV9iYXNlbGluZXMzLmNvbW1vbpSMCF9fbmFtZV9flIwec3RhYmxlX2Jhc2VsaW5lczMuY29tbW9uLnV0aWxzlIwIX19maWxlX1+UjEkvdXNyL2xvY2FsL2xpYi9weXRob24zLjEwL2Rpc3QtcGFja2FnZXMvc3RhYmxlX2Jhc2VsaW5lczMvY29tbW9uL3V0aWxzLnB5lHVOTmgAjBBfbWFrZV9lbXB0eV9jZWxslJOUKVKUhZR0lFKUjBxjbG91ZHBpY2tsZS5jbG91ZHBpY2tsZV9mYXN0lIwSX2Z1bmN0aW9uX3NldHN0YXRllJOUaB99lH2UKGgWaA2MDF9fcXVhbG5hbWVfX5SMGWNvbnN0YW50X2ZuLjxsb2NhbHM+LmZ1bmOUjA9fX2Fubm90YXRpb25zX1+UfZSMDl9fa3dkZWZhdWx0c19flE6MDF9fZGVmYXVsdHNfX5ROjApfX21vZHVsZV9flGgXjAdfX2RvY19flE6MC19fY2xvc3VyZV9flGgAjApfbWFrZV9jZWxslJOURz8zqSowVTJhhZRSlIWUjBdfY2xvdWRwaWNrbGVfc3VibW9kdWxlc5RdlIwLX19nbG9iYWxzX1+UfZR1hpSGUjAu"}, "system_info": {"OS": "Linux-6.1.58+-x86_64-with-glibc2.35 # 1 SMP PREEMPT_DYNAMIC Sat Nov 18 15:31:17 UTC 2023", "Python": "3.10.12", "Stable-Baselines3": "2.0.0a5", "PyTorch": "2.2.1+cu121", "GPU Enabled": "False", "Numpy": "1.25.2", "Cloudpickle": "2.2.1", "Gymnasium": "0.28.1", "OpenAI Gym": "0.25.2"}}
|
|
|
|
| 1 |
+
{"policy_class": {":type:": "<class 'abc.ABCMeta'>", ":serialized:": "gAWVOwAAAAAAAACMIXN0YWJsZV9iYXNlbGluZXMzLmNvbW1vbi5wb2xpY2llc5SMEUFjdG9yQ3JpdGljUG9saWN5lJOULg==", "__module__": "stable_baselines3.common.policies", "__doc__": "\n Policy class for actor-critic algorithms (has both policy and value prediction).\n Used by A2C, PPO and the likes.\n\n :param observation_space: Observation space\n :param action_space: Action space\n :param lr_schedule: Learning rate schedule (could be constant)\n :param net_arch: The specification of the policy and value networks.\n :param activation_fn: Activation function\n :param ortho_init: Whether to use or not orthogonal initialization\n :param use_sde: Whether to use State Dependent Exploration or not\n :param log_std_init: Initial value for the log standard deviation\n :param full_std: Whether to use (n_features x n_actions) parameters\n for the std instead of only (n_features,) when using gSDE\n :param use_expln: Use ``expln()`` function instead of ``exp()`` to ensure\n a positive standard deviation (cf paper). It allows to keep variance\n above zero and prevent it from growing too fast. In practice, ``exp()`` is usually enough.\n :param squash_output: Whether to squash the output using a tanh function,\n this allows to ensure boundaries when using gSDE.\n :param features_extractor_class: Features extractor to use.\n :param features_extractor_kwargs: Keyword arguments\n to pass to the features extractor.\n :param share_features_extractor: If True, the features extractor is shared between the policy and value networks.\n :param normalize_images: Whether to normalize images or not,\n dividing by 255.0 (True by default)\n :param optimizer_class: The optimizer to use,\n ``th.optim.Adam`` by default\n :param optimizer_kwargs: Additional keyword arguments,\n excluding the learning rate, to pass to the optimizer\n ", "__init__": "<function ActorCriticPolicy.__init__ at 0x7e38025c36d0>", "_get_constructor_parameters": "<function ActorCriticPolicy._get_constructor_parameters at 0x7e38025c3760>", "reset_noise": "<function ActorCriticPolicy.reset_noise at 0x7e38025c37f0>", "_build_mlp_extractor": "<function ActorCriticPolicy._build_mlp_extractor at 0x7e38025c3880>", "_build": "<function ActorCriticPolicy._build at 0x7e38025c3910>", "forward": "<function ActorCriticPolicy.forward at 0x7e38025c39a0>", "extract_features": "<function ActorCriticPolicy.extract_features at 0x7e38025c3a30>", "_get_action_dist_from_latent": "<function ActorCriticPolicy._get_action_dist_from_latent at 0x7e38025c3ac0>", "_predict": "<function ActorCriticPolicy._predict at 0x7e38025c3b50>", "evaluate_actions": "<function ActorCriticPolicy.evaluate_actions at 0x7e38025c3be0>", "get_distribution": "<function ActorCriticPolicy.get_distribution at 0x7e38025c3c70>", "predict_values": "<function ActorCriticPolicy.predict_values at 0x7e38025c3d00>", "__abstractmethods__": "frozenset()", "_abc_impl": "<_abc._abc_data object at 0x7e380255dec0>"}, "verbose": 1, "policy_kwargs": {}, "num_timesteps": 104000, "_total_timesteps": 100000, "_num_timesteps_at_start": 0, "seed": null, "action_noise": null, "start_time": 1714106227409224375, "learning_rate": 0.0003, "tensorboard_log": null, "_last_obs": {":type:": "<class 'numpy.ndarray'>", ":serialized:": "gAWVdQYAAAAAAACMEm51bXB5LmNvcmUubnVtZXJpY5SMC19mcm9tYnVmZmVylJOUKJYABgAAAAAAAMIJBD7QzQA8/lIjPIr3Ozwlf0S/ZFonPyCr0z1ZNBG/AAAAAIDelD///38/dDIuPzXnv78AAIA/X6ltPkHdbz4rsHc+73WDPhLvjz6efqE+iyy8Pm8l6z78Tx8/AACAP+cNzj1Xxws9sPoiPdpdXzyrhJA/9OLwPsRlSj/7/3+/AACAPyBUKr/OdBS+mM/CvjzweL8AAAAAKQKKPimAiz7+/Y8+c7CYPpxKqD6B6L0+DtvePrGeCz9Vazc/AACAPwFr3j06IKk7hADePFKH/Dyq/FK/AAAAM0BfX70FAIA/AAAAAEVzjT8AAAAA/OdaP58z5b0AAIA/8apnPnVMaj6if3I+8aOAPvxYjD5uT54+TVi6PnTM6D4BbCc/AACAP02wXL9IhsC91PaauwWHCb4P5uQ+udGMPiKjKD/9/38/AAAAAMFbET6ADOQ7bH4uPyVWer8AAAAAzbvdPnBA4D6aGeg+lD/2PlFUBj+UhRc/sloyP+fQXj8AAIA/AACAP1FCXz0Nkq485H3nPGFe6Dwg4hq/XCtbvVg4Nr5W0oC/AAAAAB1ekD8ANH85KlxbP9Isgb4AAIA/Z8l/PnDegT7liYY+67SOPptsmj46B6w+/X3KPndk8z7MRho/ErN3P75zTD5loAS9am7ZO2ZovTyfRJE/AGYqOzRcRT+5CIA/AAAAAG8NSr++ZpE+MLz6vnXck74AAIA/BEODPlHxhT6T8Ys+j3yUPin9oT6tuLY+0qDUPjce/z4fjys/AACAP+T92z2vjgG8DkKVPOofAj2DU1W/oI7QuqhGcT6zH+o9AAAAABjijD8AJJo4SEZsP0t0VjsAAIA/qZZsPnxGbz4/pnc+dm6DPnF5jz7zYJ8+NBO3Plqq3z4FtSI/AACAP5Lp1D0bL4A9de3yutODfrxG91K/SDwAPSxbCD4AAIC/AAAAALa2jj8AAAAAvCtOP/gBB78AAIA/Z9ptPueNcD7cwXc+I7KCPq46jz6HOaM+15nAPhHL8T4AEC0/AACAP/6rFj6e/IC8sJELPt+B87xRz1G/YGc8OwBOfL6FbIC/AAAAAKREkT8AEJy3gG9NPw0RgD8AAAAAJvJrPhygbj4M+nY+0POCPiIWjj7kJJ8+JYW5Pk7Z7j5UDSU/AACAP1Wxvj3kamC87DYLPfSuMD0tvVG/ANSeuITBaz7bEzI+AACAP5dMjj8AgF42QlxbP7HS+zwAAIA/KZ1qPj5HbT4dlXU+v0aCPuYhjj7TUqA++La8PkLh7T5h0SY/AACAP4L+gj2d7KI7+D1mvHY8Nj3AbDy/OEsoPkDDcL3dt3+/AAAAAB26jT/M2qm+4jdZPzC6qT4AAIA/lw9sPjfrbj6ShXc+Hn+DPh7Ljz6PZaM+sQXEPtT0/j6Fxi0/AACAP7W/Kj5I7YQ9DJsTPYU44byRuo8/eLYMvvafTz8AAIC/AAAAALl4UL8e5oi/WIm0PcmcIj8AAIA/aUKFPtXFhj5RfYs+Ff6TPnsqoT7wrrU+DNTYPgRbCT/hVTk/AACAP210S74hahy9tmTAvZfGvb2Gd4++L9TRPgtWbz8AAAAAAAAAAG57Jj9HQaQ/qJ1GPwAAgL8AAAAA9pDoPhg16z5pcPM+qyMBP1bkDD+e7B4/UxE7P5mzaT8AAIA/AACAPzEroz07oOq82P3EPHj3Ar2x41K/AABAM+g2dz4CAIA/AAAAAD1wkD8w+Ps+Qo5sPwAAAAAAAIA/qRdtPvPIbz5HLXg+EqeDPkqijz5k76A+r8O5PlC44T6cdyA/AACAP8VD/T3m9fU7w6yYvEHqCLk6OE6/ZnWXPaT9jb4RCxa+AAAAANhRiD/WPTm/CMR8PwAAgD8AAIA/O9BnPjrnaD56O24+fk15Pjkihj6HI5U+lIuuPnfj2T4j0Rg/AACAP8gmvD2j9Xm7OqM7PSmmvb0Q0U6/AADAsuCUkj5QuRS+AACAP4wZkD8AAAAAUhxCP/z/f78AAAAAS4R5PrRZfD5Ol4I+No2KPikplz7mgao+uLPIPnEL+T5Ebiw/AACAP5SMBW51bXB5lIwFZHR5cGWUk5SMAmY0lImIh5RSlChLA4wBPJROTk5K/////0r/////SwB0lGJLEEsYhpSMAUOUdJRSlC4="}, "_last_episode_starts": {":type:": "<class 'numpy.ndarray'>", ":serialized:": "gAWVgwAAAAAAAACMEm51bXB5LmNvcmUubnVtZXJpY5SMC19mcm9tYnVmZmVylJOUKJYQAAAAAAAAAAAAAAAAAAAAAAAAAAAAAACUjAVudW1weZSMBWR0eXBllJOUjAJiMZSJiIeUUpQoSwOMAXyUTk5OSv////9K/////0sAdJRiSxCFlIwBQ5R0lFKULg=="}, "_last_original_obs": null, "_episode_num": 0, "use_sde": false, "sde_sample_freq": -1, "_current_progress_remaining": -0.040000000000000036, "_stats_window_size": 100, "ep_info_buffer": {":type:": "<class 'collections.deque'>", ":serialized:": "gAWVAQwAAAAAAACMC2NvbGxlY3Rpb25zlIwFZGVxdWWUk5QpS2SGlFKUKH2UKIwBcpRHwF24MBp5/sqMAWyUS1iMAXSUR0Btyv7+DOC5dX2UKGgGR8BaevKdQO4HaAdLOWgIR0Bt24V/MGHIdX2UKGgGR8Ba06MNtqHoaAdLS2gIR0BuM2gOBlMAdX2UKGgGR8BcJc4T9KmLaAdLR2gIR0BuTNjEvTPTdX2UKGgGR8BhJ5NwiqyXaAdLo2gIR0Buc/lOoHcDdX2UKGgGR8Bcl9L127nQaAdLNGgIR0Bufvcxj8UFdX2UKGgGR8BbUWpVCHARaAdLPmgIR0BujQAEMb3odX2UKGgGR8BdfvRqoIfKaAdLV2gIR0BuoSynk1dgdX2UKGgGR8BZd4TfzjFRaAdNQAZoCEdAbtwzMzMzM3V9lChoBkfAX1hOIqLCN2gHS1ZoCEdAbt3QcghbGHV9lChoBkfAWy3yd4FA3WgHSzhoCEdAbupeVLSNO3V9lChoBkfAWYU5R0lqrWgHS0FoCEdAbusIxgy/K3V9lChoBkfAXBYG+sYEXGgHS0doCEdAbvqBU70WdnV9lChoBkfAXDxZ+x4Y8GgHS1BoCEdAbvwP7N0NjXV9lChoBkfAWcVMURFqjGgHTUAGaAhHQG8CvwEyLyd1fZQoaAZHwFnrKq4pc5doB01ABmgIR0BvApgogFHKdX2UKGgGR8Bb2C+cpb2UaAdNQAZoCEdAbwK2gFotc3V9lChoBkfAWMz7ALy+YmgHTUAGaAhHQG8Cwpe/pMZ1fZQoaAZHwFtQXeWOZLJoB01ABmgIR0BvAtPxhDw6dX2UKGgGR8BaHWsA/9pAaAdLN2gIR0BvCDHyVfNSdX2UKGgGR8BXUlZDArQPaAdNQAZoCEdAbxOSpR4yGnV9lChoBkfAWuNN7BwdbWgHS0doCEdAbxNVIZqEe3V9lChoBkfAWNWOPvKEFmgHTUAGaAhHQG8Teb/ffoB1fZQoaAZHwFlT3RG+bmVoB0tIaAhHQG8Ub961LJ11fZQoaAZHwF5LImw7kn1oB0tJaAhHQG8URe1KGtZ1fZQoaAZHwFn5uMdcSoRoB0tOaAhHQG8V/zJ6po91fZQoaAZHwFv4pY9xIatoB0thaAhHQG8aE6DGtIV1fZQoaAZHwFyR/LDAJsxoB0uOaAhHQG8cFev6j351fZQoaAZHwFromfGuLaVoB0tkaAhHQG8gZc1O0sx1fZQoaAZHwFy3Btk4FRpoB0s3aAhHQG8mGSpzcRF1fZQoaAZHwF4d8eS0Sh9oB0tzaAhHQG8t62WpqAV1fZQoaAZHwFn+KzRhMJxoB01ABmgIR0BvMTbi6xxDdX2UKGgGR8BbctugpSaWaAdNQAZoCEdAbzKenyd4FHV9lChoBkfAWWphDw6QvGgHSz9oCEdAbzVND+irUHV9lChoBkfAW4K3WnTAnGgHS1hoCEdAb0KtUXHim3V9lChoBkfAXCxgWrOqvWgHS05oCEdAb0Pc+qzZ6HV9lChoBkfAWaBkH2RJVmgHTUAGaAhHQG9FqTr3TNN1fZQoaAZHwGHAtQbdadNoB0v0aAhHQG93yXUpd8l1fZQoaAZHwFi9QJ5VwP1oB01ABmgIR0BveBzHS4OMdX2UKGgGR8BcAvsRg7YDaAdLNWgIR0Bvfa5LAYYSdX2UKGgGR8BcknF98Z1naAdLS2gIR0BvgCgZjx0/dX2UKGgGR8BZIBMWXTmXaAdLWGgIR0BvhApjMFEBdX2UKGgGR8BcmP7WNFSbaAdLUmgIR0BviwYLsruqdX2UKGgGR8BcorhvR7Z4aAdLMWgIR0Bvi5YmsvIwdX2UKGgGR8BYzWoJiRW+aAdNQAZoCEdAb5E8EFGG23V9lChoBkfAWUpK02LpA2gHS1loCEdAb5NaIvalDXV9lChoBkfAWfnaTOgQH2gHS0BoCEdAb50jcEeQuHV9lChoBkfAWcCtJWeYlmgHS09oCEdAb6MREF4cFXV9lChoBkfAWNHlp48lomgHTUAGaAhHQG+kTxXnyNJ1fZQoaAZHwFoYRChN/ONoB0t+aAhHQG+o/p2U0N11fZQoaAZHwFsGBi1AqutoB01ABmgIR0Bvsz850bLmdX2UKGgGR8BcWZ8jRlYmaAdLOWgIR0BvxkebNKRMdX2UKGgGR8BeVdUKiO/+aAdLZ2gIR0BvzQRGtp22dX2UKGgGR8Be72g3974SaAdLe2gIR0Bv0CrtE5QxdX2UKGgGR8Bb+USqU/wBaAdLOWgIR0Bv4kZJkGzKdX2UKGgGR8BZS0AggX/HaAdLWGgIR0Bv5zWPLgXNdX2UKGgGR8BbdoiX6ZYxaAdLU2gIR0Bv7acslLOBdX2UKGgGR8BbKbhaTwDvaAdLNmgIR0Bv+atHQQcxdX2UKGgGR8BaYZzLfUF0aAdLUmgIR0BwBM4PwuuidX2UKGgGR8Bb2OLR8c+8aAdNQAZoCEdAcJSvEjxCpnV9lChoBkfAV/n/xUedTmgHTUAGaAhHQHCU8UEgW8B1fZQoaAZHwFiJJF9a2WpoB01ABmgIR0BwlN6AvtdBdX2UKGgGR8BZyZKODJ2daAdNQAZoCEdAcJWmXgLqlnV9lChoBkfAWizJvHcUNGgHTUAGaAhHQHCY1LvkRz11fZQoaAZHwFkaCFsYVItoB01ABmgIR0Bwmy+fywwCdX2UKGgGR8BaSLyUcGTtaAdLRWgIR0BwnQu8K5TZdX2UKGgGR8Bal8kdFOO9aAdLL2gIR0BwnhQsPJ7tdX2UKGgGR8BfY2yHEdeZaAdLU2gIR0BwnwyN4qwydX2UKGgGR8BZQ8PBi1AraAdLLWgIR0BwofZ+QU5/dX2UKGgGR8Bbc0n5SFXaaAdNQAZoCEdAcLtbmEGqxXV9lChoBkfAWidowmE5AGgHSy9oCEdAcLwajN6gNHV9lChoBkfAWGRWJaaCtmgHTUAGaAhHQHC9VHSWqtJ1fZQoaAZHwFmA287IT5BoB0tdaAhHQHC90xASnLt1fZQoaAZHwFlPKkVN5+poB0tWaAhHQHDBSprDZUV1fZQoaAZHwFyuXhfjS5RoB0tIaAhHQHDFTAeq7yx1fZQoaAZHwFlm8scyWRloB0s4aAhHQHDMDch1Tzd1fZQoaAZHwFnZMqz7di5oB0tmaAhHQHDOqqXF98Z1fZQoaAZHwFgRsMRYigVoB01ABmgIR0Bw0DiT+vQodX2UKGgGR8BfNTeTFERbaAdLZWgIR0Bw0KBEroW6dX2UKGgGR8BaaAam4y44aAdLLGgIR0Bw2GafBeoldX2UKGgGR8BW/T101ZTyaAdNQAZoCEdAcOKNlRP423V9lChoBkfAWv2RLbpNbmgHTUAGaAhHQHDkDGYKIBR1fZQoaAZHwF0RCaqjrRloB01ABmgIR0Bw6f8/D+BIdX2UKGgGR8BXqFqagElmaAdNQAZoCEdAcO1PdVNpNHV9lChoBkfAWgIhGH58B2gHSzloCEdAcO7a1Cw8n3V9lChoBkfAXHzXiBGx2WgHSz9oCEdAcPNqqfe1r3V9lChoBkfAWyzbi6xxDWgHSzBoCEdAcPSxYJVsDXV9lChoBkfAXNqdvsJID2gHS0loCEdAcPchUBGQS3V9lChoBkfAWcLD50r9VGgHS1hoCEdAcP98ejmCAnV9lChoBkfAXSUqmTC+DmgHS0xoCEdAcQBFXq7iAHV9lChoBkfAVyVfgJkXlGgHTUAGaAhHQHEDlcY64lR1fZQoaAZHwFanqYJE6T5oB01ABmgIR0BxH1C2MKkVdX2UKGgGR8BfBPmcOLBLaAdLb2gIR0BxI7bJwKjSdX2UKGgGR8BaS91hb4ahaAdNQAZoCEdAcSQvLowEhnV9lChoBkfAXVCF+NLlFWgHS0BoCEdAcSYDGLk0anV9lChoBkfAWjyHvc8DCGgHS0JoCEdAcSrBacI7eXV9lChoBkfAWuFhG6PKdWgHS1toCEdAcTUJu2qkunV9lChoBkfAWzYk8ifQKWgHSy5oCEdAcTqz90ihWnV9lChoBkfAWC825xzaK2gHTUAGaAhHQHGvNWQwK0F1fZQoaAZHwFm8e4kNWlxoB01ABmgIR0Bxr43WFvhqdWUu"}, "ep_success_buffer": {":type:": "<class 'collections.deque'>", ":serialized:": "gAWVIAAAAAAAAACMC2NvbGxlY3Rpb25zlIwFZGVxdWWUk5QpS2SGlFKULg=="}, "_n_updates": 52, "observation_space": {":type:": "<class 'gymnasium.spaces.box.Box'>", ":serialized:": "gAWVTAQAAAAAAACMFGd5bW5hc2l1bS5zcGFjZXMuYm94lIwDQm94lJOUKYGUfZQojAVkdHlwZZSMBW51bXB5lIwFZHR5cGWUk5SMAmY0lImIh5RSlChLA4wBPJROTk5K/////0r/////SwB0lGKMDWJvdW5kZWRfYmVsb3eUjBJudW1weS5jb3JlLm51bWVyaWOUjAtfZnJvbWJ1ZmZlcpSTlCiWGAAAAAAAAAABAQEBAQEBAQEBAQEBAQEBAQEBAQEBAQGUaAiMAmIxlImIh5RSlChLA4wBfJROTk5K/////0r/////SwB0lGJLGIWUjAFDlHSUUpSMDWJvdW5kZWRfYWJvdmWUaBEolhgAAAAAAAAAAQEBAQEBAQEBAQEBAQEBAQEBAQEBAQEBlGgVSxiFlGgZdJRSlIwGX3NoYXBllEsYhZSMA2xvd5RoESiWYAAAAAAAAADbD0nAAACgwAAAoMAAAKDA2w9JwAAAoMDbD0nAAACgwAAAAIDbD0nAAACgwNsPScAAAKDAAAAAgAAAgL8AAIC/AACAvwAAgL8AAIC/AACAvwAAgL8AAIC/AACAvwAAgL+UaAtLGIWUaBl0lFKUjARoaWdolGgRKJZgAAAAAAAAANsPSUAAAKBAAACgQAAAoEDbD0lAAACgQNsPSUAAAKBAAACgQNsPSUAAAKBA2w9JQAAAoEAAAKBAAACAPwAAgD8AAIA/AACAPwAAgD8AAIA/AACAPwAAgD8AAIA/AACAP5RoC0sYhZRoGXSUUpSMCGxvd19yZXBylIz+Wy0zLjE0MTU5MjcgLTUuICAgICAgICAtNS4gICAgICAgIC01LiAgICAgICAgLTMuMTQxNTkyNyAtNS4KIC0zLjE0MTU5MjcgLTUuICAgICAgICAtMC4gICAgICAgIC0zLjE0MTU5MjcgLTUuICAgICAgICAtMy4xNDE1OTI3CiAtNS4gICAgICAgIC0wLiAgICAgICAgLTEuICAgICAgICAtMS4gICAgICAgIC0xLiAgICAgICAgLTEuCiAtMS4gICAgICAgIC0xLiAgICAgICAgLTEuICAgICAgICAtMS4gICAgICAgIC0xLiAgICAgICAgLTEuICAgICAgIF2UjAloaWdoX3JlcHKUjOZbMy4xNDE1OTI3IDUuICAgICAgICA1LiAgICAgICAgNS4gICAgICAgIDMuMTQxNTkyNyA1LiAgICAgICAgMy4xNDE1OTI3CiA1LiAgICAgICAgNS4gICAgICAgIDMuMTQxNTkyNyA1LiAgICAgICAgMy4xNDE1OTI3IDUuICAgICAgICA1LgogMS4gICAgICAgIDEuICAgICAgICAxLiAgICAgICAgMS4gICAgICAgIDEuICAgICAgICAxLiAgICAgICAgMS4KIDEuICAgICAgICAxLiAgICAgICAgMS4gICAgICAgXZSMCl9ucF9yYW5kb22UTnViLg==", "dtype": "float32", "bounded_below": "[ True True True True True True True True True True True True\n True True True True True True True True True True True True]", "bounded_above": "[ True True True True True True True True True True True True\n True True True True True True True True True True True True]", "_shape": [24], "low": "[-3.1415927 -5. -5. -5. -3.1415927 -5.\n -3.1415927 -5. -0. -3.1415927 -5. -3.1415927\n -5. -0. -1. -1. -1. -1.\n -1. -1. -1. -1. -1. -1. ]", "high": "[3.1415927 5. 5. 5. 3.1415927 5. 3.1415927\n 5. 5. 3.1415927 5. 3.1415927 5. 5.\n 1. 1. 1. 1. 1. 1. 1.\n 1. 1. 1. ]", "low_repr": "[-3.1415927 -5. -5. -5. -3.1415927 -5.\n -3.1415927 -5. -0. -3.1415927 -5. -3.1415927\n -5. -0. -1. -1. -1. -1.\n -1. -1. -1. -1. -1. -1. ]", "high_repr": "[3.1415927 5. 5. 5. 3.1415927 5. 3.1415927\n 5. 5. 3.1415927 5. 3.1415927 5. 5.\n 1. 1. 1. 1. 1. 1. 1.\n 1. 1. 1. ]", "_np_random": null}, "action_space": {":type:": "<class 'gymnasium.spaces.box.Box'>", ":serialized:": "gAWVpwEAAAAAAACMFGd5bW5hc2l1bS5zcGFjZXMuYm94lIwDQm94lJOUKYGUfZQojAVkdHlwZZSMBW51bXB5lIwFZHR5cGWUk5SMAmY0lImIh5RSlChLA4wBPJROTk5K/////0r/////SwB0lGKMDWJvdW5kZWRfYmVsb3eUjBJudW1weS5jb3JlLm51bWVyaWOUjAtfZnJvbWJ1ZmZlcpSTlCiWBAAAAAAAAAABAQEBlGgIjAJiMZSJiIeUUpQoSwOMAXyUTk5OSv////9K/////0sAdJRiSwSFlIwBQ5R0lFKUjA1ib3VuZGVkX2Fib3ZllGgRKJYEAAAAAAAAAAEBAQGUaBVLBIWUaBl0lFKUjAZfc2hhcGWUSwSFlIwDbG93lGgRKJYQAAAAAAAAAAAAgL8AAIC/AACAvwAAgL+UaAtLBIWUaBl0lFKUjARoaWdolGgRKJYQAAAAAAAAAAAAgD8AAIA/AACAPwAAgD+UaAtLBIWUaBl0lFKUjAhsb3dfcmVwcpSMBC0xLjCUjAloaWdoX3JlcHKUjAMxLjCUjApfbnBfcmFuZG9tlE51Yi4=", "dtype": "float32", "bounded_below": "[ True True True True]", "bounded_above": "[ True True True True]", "_shape": [4], "low": "[-1. -1. -1. -1.]", "high": "[1. 1. 1. 1.]", "low_repr": "-1.0", "high_repr": "1.0", "_np_random": null}, "n_envs": 16, "n_steps": 500, "gamma": 0.999, "gae_lambda": 0.98, "ent_coef": 0.01, "vf_coef": 0.5, "max_grad_norm": 0.5, "batch_size": 128, "n_epochs": 4, "clip_range": {":type:": "<class 'function'>", ":serialized:": "gAWVxQIAAAAAAACMF2Nsb3VkcGlja2xlLmNsb3VkcGlja2xllIwOX21ha2VfZnVuY3Rpb26Uk5QoaACMDV9idWlsdGluX3R5cGWUk5SMCENvZGVUeXBllIWUUpQoSwFLAEsASwFLAUsTQwSIAFMAlE6FlCmMAV+UhZSMSS91c3IvbG9jYWwvbGliL3B5dGhvbjMuMTAvZGlzdC1wYWNrYWdlcy9zdGFibGVfYmFzZWxpbmVzMy9jb21tb24vdXRpbHMucHmUjARmdW5jlEuEQwIEAZSMA3ZhbJSFlCl0lFKUfZQojAtfX3BhY2thZ2VfX5SMGHN0YWJsZV9iYXNlbGluZXMzLmNvbW1vbpSMCF9fbmFtZV9flIwec3RhYmxlX2Jhc2VsaW5lczMuY29tbW9uLnV0aWxzlIwIX19maWxlX1+UjEkvdXNyL2xvY2FsL2xpYi9weXRob24zLjEwL2Rpc3QtcGFja2FnZXMvc3RhYmxlX2Jhc2VsaW5lczMvY29tbW9uL3V0aWxzLnB5lHVOTmgAjBBfbWFrZV9lbXB0eV9jZWxslJOUKVKUhZR0lFKUjBxjbG91ZHBpY2tsZS5jbG91ZHBpY2tsZV9mYXN0lIwSX2Z1bmN0aW9uX3NldHN0YXRllJOUaB99lH2UKGgWaA2MDF9fcXVhbG5hbWVfX5SMGWNvbnN0YW50X2ZuLjxsb2NhbHM+LmZ1bmOUjA9fX2Fubm90YXRpb25zX1+UfZSMDl9fa3dkZWZhdWx0c19flE6MDF9fZGVmYXVsdHNfX5ROjApfX21vZHVsZV9flGgXjAdfX2RvY19flE6MC19fY2xvc3VyZV9flGgAjApfbWFrZV9jZWxslJOURz/JmZmZmZmahZRSlIWUjBdfY2xvdWRwaWNrbGVfc3VibW9kdWxlc5RdlIwLX19nbG9iYWxzX1+UfZR1hpSGUjAu"}, "clip_range_vf": null, "normalize_advantage": true, "target_kl": null, "lr_schedule": {":type:": "<class 'function'>", ":serialized:": "gAWVxQIAAAAAAACMF2Nsb3VkcGlja2xlLmNsb3VkcGlja2xllIwOX21ha2VfZnVuY3Rpb26Uk5QoaACMDV9idWlsdGluX3R5cGWUk5SMCENvZGVUeXBllIWUUpQoSwFLAEsASwFLAUsTQwSIAFMAlE6FlCmMAV+UhZSMSS91c3IvbG9jYWwvbGliL3B5dGhvbjMuMTAvZGlzdC1wYWNrYWdlcy9zdGFibGVfYmFzZWxpbmVzMy9jb21tb24vdXRpbHMucHmUjARmdW5jlEuEQwIEAZSMA3ZhbJSFlCl0lFKUfZQojAtfX3BhY2thZ2VfX5SMGHN0YWJsZV9iYXNlbGluZXMzLmNvbW1vbpSMCF9fbmFtZV9flIwec3RhYmxlX2Jhc2VsaW5lczMuY29tbW9uLnV0aWxzlIwIX19maWxlX1+UjEkvdXNyL2xvY2FsL2xpYi9weXRob24zLjEwL2Rpc3QtcGFja2FnZXMvc3RhYmxlX2Jhc2VsaW5lczMvY29tbW9uL3V0aWxzLnB5lHVOTmgAjBBfbWFrZV9lbXB0eV9jZWxslJOUKVKUhZR0lFKUjBxjbG91ZHBpY2tsZS5jbG91ZHBpY2tsZV9mYXN0lIwSX2Z1bmN0aW9uX3NldHN0YXRllJOUaB99lH2UKGgWaA2MDF9fcXVhbG5hbWVfX5SMGWNvbnN0YW50X2ZuLjxsb2NhbHM+LmZ1bmOUjA9fX2Fubm90YXRpb25zX1+UfZSMDl9fa3dkZWZhdWx0c19flE6MDF9fZGVmYXVsdHNfX5ROjApfX21vZHVsZV9flGgXjAdfX2RvY19flE6MC19fY2xvc3VyZV9flGgAjApfbWFrZV9jZWxslJOURz8zqSowVTJhhZRSlIWUjBdfY2xvdWRwaWNrbGVfc3VibW9kdWxlc5RdlIwLX19nbG9iYWxzX1+UfZR1hpSGUjAu"}, "system_info": {"OS": "Linux-6.1.58+-x86_64-with-glibc2.35 # 1 SMP PREEMPT_DYNAMIC Sat Nov 18 15:31:17 UTC 2023", "Python": "3.10.12", "Stable-Baselines3": "2.0.0a5", "PyTorch": "2.2.1+cu121", "GPU Enabled": "False", "Numpy": "1.25.2", "Cloudpickle": "2.2.1", "Gymnasium": "0.28.1", "OpenAI Gym": "0.25.2"}}
|
replay.mp4
CHANGED
|
Binary files a/replay.mp4 and b/replay.mp4 differ
|
|
|
results.json
CHANGED
|
@@ -1 +1 @@
|
|
| 1 |
-
{"mean_reward": -
|
|
|
|
| 1 |
+
{"mean_reward": -56.37531610364094, "std_reward": 0.21513498902641692, "is_deterministic": true, "n_eval_episodes": 10, "eval_datetime": "2024-04-26T04:40:03.821594"}
|