Initial commit
Browse files- .gitattributes +1 -0
- README.md +1 -1
- a2c-AntBulletEnv-v0.zip +2 -2
- a2c-AntBulletEnv-v0/data +19 -19
- a2c-AntBulletEnv-v0/policy.optimizer.pth +2 -2
- a2c-AntBulletEnv-v0/policy.pth +2 -2
- a2c-AntBulletEnv-v0/system_info.txt +1 -1
- config.json +1 -1
- replay.mp4 +0 -0
- results.json +1 -1
- vec_normalize.pkl +1 -1
.gitattributes
CHANGED
|
@@ -32,3 +32,4 @@ saved_model/**/* filter=lfs diff=lfs merge=lfs -text
|
|
| 32 |
*.zip filter=lfs diff=lfs merge=lfs -text
|
| 33 |
*.zst filter=lfs diff=lfs merge=lfs -text
|
| 34 |
*tfevents* filter=lfs diff=lfs merge=lfs -text
|
|
|
|
|
|
| 32 |
*.zip filter=lfs diff=lfs merge=lfs -text
|
| 33 |
*.zst filter=lfs diff=lfs merge=lfs -text
|
| 34 |
*tfevents* filter=lfs diff=lfs merge=lfs -text
|
| 35 |
+
replay.mp4 filter=lfs diff=lfs merge=lfs -text
|
README.md
CHANGED
|
@@ -16,7 +16,7 @@ model-index:
|
|
| 16 |
type: AntBulletEnv-v0
|
| 17 |
metrics:
|
| 18 |
- type: mean_reward
|
| 19 |
-
value:
|
| 20 |
name: mean_reward
|
| 21 |
verified: false
|
| 22 |
---
|
|
|
|
| 16 |
type: AntBulletEnv-v0
|
| 17 |
metrics:
|
| 18 |
- type: mean_reward
|
| 19 |
+
value: 1893.63 +/- 99.91
|
| 20 |
name: mean_reward
|
| 21 |
verified: false
|
| 22 |
---
|
a2c-AntBulletEnv-v0.zip
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
-
size
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:950a62b3c82cf4c40fc8bb8f49b92988fd05c199241f30722f436f16fd7c38cb
|
| 3 |
+
size 128975
|
a2c-AntBulletEnv-v0/data
CHANGED
|
@@ -4,20 +4,20 @@
|
|
| 4 |
":serialized:": "gAWVOwAAAAAAAACMIXN0YWJsZV9iYXNlbGluZXMzLmNvbW1vbi5wb2xpY2llc5SMEUFjdG9yQ3JpdGljUG9saWN5lJOULg==",
|
| 5 |
"__module__": "stable_baselines3.common.policies",
|
| 6 |
"__doc__": "\n Policy class for actor-critic algorithms (has both policy and value prediction).\n Used by A2C, PPO and the likes.\n\n :param observation_space: Observation space\n :param action_space: Action space\n :param lr_schedule: Learning rate schedule (could be constant)\n :param net_arch: The specification of the policy and value networks.\n :param activation_fn: Activation function\n :param ortho_init: Whether to use or not orthogonal initialization\n :param use_sde: Whether to use State Dependent Exploration or not\n :param log_std_init: Initial value for the log standard deviation\n :param full_std: Whether to use (n_features x n_actions) parameters\n for the std instead of only (n_features,) when using gSDE\n :param use_expln: Use ``expln()`` function instead of ``exp()`` to ensure\n a positive standard deviation (cf paper). It allows to keep variance\n above zero and prevent it from growing too fast. In practice, ``exp()`` is usually enough.\n :param squash_output: Whether to squash the output using a tanh function,\n this allows to ensure boundaries when using gSDE.\n :param features_extractor_class: Features extractor to use.\n :param features_extractor_kwargs: Keyword arguments\n to pass to the features extractor.\n :param share_features_extractor: If True, the features extractor is shared between the policy and value networks.\n :param normalize_images: Whether to normalize images or not,\n dividing by 255.0 (True by default)\n :param optimizer_class: The optimizer to use,\n ``th.optim.Adam`` by default\n :param optimizer_kwargs: Additional keyword arguments,\n excluding the learning rate, to pass to the optimizer\n ",
|
| 7 |
-
"__init__": "<function ActorCriticPolicy.__init__ at
|
| 8 |
-
"_get_constructor_parameters": "<function ActorCriticPolicy._get_constructor_parameters at
|
| 9 |
-
"reset_noise": "<function ActorCriticPolicy.reset_noise at
|
| 10 |
-
"_build_mlp_extractor": "<function ActorCriticPolicy._build_mlp_extractor at
|
| 11 |
-
"_build": "<function ActorCriticPolicy._build at
|
| 12 |
-
"forward": "<function ActorCriticPolicy.forward at
|
| 13 |
-
"extract_features": "<function ActorCriticPolicy.extract_features at
|
| 14 |
-
"_get_action_dist_from_latent": "<function ActorCriticPolicy._get_action_dist_from_latent at
|
| 15 |
-
"_predict": "<function ActorCriticPolicy._predict at
|
| 16 |
-
"evaluate_actions": "<function ActorCriticPolicy.evaluate_actions at
|
| 17 |
-
"get_distribution": "<function ActorCriticPolicy.get_distribution at
|
| 18 |
-
"predict_values": "<function ActorCriticPolicy.predict_values at
|
| 19 |
"__abstractmethods__": "frozenset()",
|
| 20 |
-
"_abc_impl": "<_abc._abc_data object at
|
| 21 |
},
|
| 22 |
"verbose": 1,
|
| 23 |
"policy_kwargs": {
|
|
@@ -37,16 +37,16 @@
|
|
| 37 |
"_num_timesteps_at_start": 0,
|
| 38 |
"seed": null,
|
| 39 |
"action_noise": null,
|
| 40 |
-
"start_time":
|
| 41 |
-
"learning_rate": 0.
|
| 42 |
"tensorboard_log": null,
|
| 43 |
"lr_schedule": {
|
| 44 |
":type:": "<class 'function'>",
|
| 45 |
-
":serialized:": "gAWVwwIAAAAAAACMF2Nsb3VkcGlja2xlLmNsb3VkcGlja2xllIwOX21ha2VfZnVuY3Rpb26Uk5QoaACMDV9idWlsdGluX3R5cGWUk5SMCENvZGVUeXBllIWUUpQoSwFLAEsASwFLAUsTQwSIAFMAlE6FlCmMAV+UhZSMSC91c3IvbG9jYWwvbGliL3B5dGhvbjMuOS9kaXN0LXBhY2thZ2VzL3N0YWJsZV9iYXNlbGluZXMzL2NvbW1vbi91dGlscy5weZSMBGZ1bmOUS4JDAgABlIwDdmFslIWUKXSUUpR9lCiMC19fcGFja2FnZV9flIwYc3RhYmxlX2Jhc2VsaW5lczMuY29tbW9ulIwIX19uYW1lX1+UjB5zdGFibGVfYmFzZWxpbmVzMy5jb21tb24udXRpbHOUjAhfX2ZpbGVfX5SMSC91c3IvbG9jYWwvbGliL3B5dGhvbjMuOS9kaXN0LXBhY2thZ2VzL3N0YWJsZV9iYXNlbGluZXMzL2NvbW1vbi91dGlscy5weZR1Tk5oAIwQX21ha2VfZW1wdHlfY2VsbJSTlClSlIWUdJRSlIwcY2xvdWRwaWNrbGUuY2xvdWRwaWNrbGVfZmFzdJSMEl9mdW5jdGlvbl9zZXRzdGF0ZZSTlGgffZR9lChoFmgNjAxfX3F1YWxuYW1lX1+UjBljb25zdGFudF9mbi48bG9jYWxzPi5mdW5jlIwPX19hbm5vdGF0aW9uc19flH2UjA5fX2t3ZGVmYXVsdHNfX5ROjAxfX2RlZmF1bHRzX1+UTowKX19tb2R1bGVfX5RoF4wHX19kb2NfX5ROjAtfX2Nsb3N1cmVfX5RoAIwKX21ha2VfY2VsbJSTlEc/
|
| 46 |
},
|
| 47 |
"_last_obs": {
|
| 48 |
":type:": "<class 'numpy.ndarray'>",
|
| 49 |
-
":serialized:": "
|
| 50 |
},
|
| 51 |
"_last_episode_starts": {
|
| 52 |
":type:": "<class 'numpy.ndarray'>",
|
|
@@ -54,7 +54,7 @@
|
|
| 54 |
},
|
| 55 |
"_last_original_obs": {
|
| 56 |
":type:": "<class 'numpy.ndarray'>",
|
| 57 |
-
":serialized:": "
|
| 58 |
},
|
| 59 |
"_episode_num": 0,
|
| 60 |
"use_sde": true,
|
|
@@ -63,7 +63,7 @@
|
|
| 63 |
"_stats_window_size": 100,
|
| 64 |
"ep_info_buffer": {
|
| 65 |
":type:": "<class 'collections.deque'>",
|
| 66 |
-
":serialized:": "
|
| 67 |
},
|
| 68 |
"ep_success_buffer": {
|
| 69 |
":type:": "<class 'collections.deque'>",
|
|
|
|
| 4 |
":serialized:": "gAWVOwAAAAAAAACMIXN0YWJsZV9iYXNlbGluZXMzLmNvbW1vbi5wb2xpY2llc5SMEUFjdG9yQ3JpdGljUG9saWN5lJOULg==",
|
| 5 |
"__module__": "stable_baselines3.common.policies",
|
| 6 |
"__doc__": "\n Policy class for actor-critic algorithms (has both policy and value prediction).\n Used by A2C, PPO and the likes.\n\n :param observation_space: Observation space\n :param action_space: Action space\n :param lr_schedule: Learning rate schedule (could be constant)\n :param net_arch: The specification of the policy and value networks.\n :param activation_fn: Activation function\n :param ortho_init: Whether to use or not orthogonal initialization\n :param use_sde: Whether to use State Dependent Exploration or not\n :param log_std_init: Initial value for the log standard deviation\n :param full_std: Whether to use (n_features x n_actions) parameters\n for the std instead of only (n_features,) when using gSDE\n :param use_expln: Use ``expln()`` function instead of ``exp()`` to ensure\n a positive standard deviation (cf paper). It allows to keep variance\n above zero and prevent it from growing too fast. In practice, ``exp()`` is usually enough.\n :param squash_output: Whether to squash the output using a tanh function,\n this allows to ensure boundaries when using gSDE.\n :param features_extractor_class: Features extractor to use.\n :param features_extractor_kwargs: Keyword arguments\n to pass to the features extractor.\n :param share_features_extractor: If True, the features extractor is shared between the policy and value networks.\n :param normalize_images: Whether to normalize images or not,\n dividing by 255.0 (True by default)\n :param optimizer_class: The optimizer to use,\n ``th.optim.Adam`` by default\n :param optimizer_kwargs: Additional keyword arguments,\n excluding the learning rate, to pass to the optimizer\n ",
|
| 7 |
+
"__init__": "<function ActorCriticPolicy.__init__ at 0x7f51f005b1f0>",
|
| 8 |
+
"_get_constructor_parameters": "<function ActorCriticPolicy._get_constructor_parameters at 0x7f51f005b280>",
|
| 9 |
+
"reset_noise": "<function ActorCriticPolicy.reset_noise at 0x7f51f005b310>",
|
| 10 |
+
"_build_mlp_extractor": "<function ActorCriticPolicy._build_mlp_extractor at 0x7f51f005b3a0>",
|
| 11 |
+
"_build": "<function ActorCriticPolicy._build at 0x7f51f005b430>",
|
| 12 |
+
"forward": "<function ActorCriticPolicy.forward at 0x7f51f005b4c0>",
|
| 13 |
+
"extract_features": "<function ActorCriticPolicy.extract_features at 0x7f51f005b550>",
|
| 14 |
+
"_get_action_dist_from_latent": "<function ActorCriticPolicy._get_action_dist_from_latent at 0x7f51f005b5e0>",
|
| 15 |
+
"_predict": "<function ActorCriticPolicy._predict at 0x7f51f005b670>",
|
| 16 |
+
"evaluate_actions": "<function ActorCriticPolicy.evaluate_actions at 0x7f51f005b700>",
|
| 17 |
+
"get_distribution": "<function ActorCriticPolicy.get_distribution at 0x7f51f005b790>",
|
| 18 |
+
"predict_values": "<function ActorCriticPolicy.predict_values at 0x7f51f005b820>",
|
| 19 |
"__abstractmethods__": "frozenset()",
|
| 20 |
+
"_abc_impl": "<_abc._abc_data object at 0x7f51f0059b00>"
|
| 21 |
},
|
| 22 |
"verbose": 1,
|
| 23 |
"policy_kwargs": {
|
|
|
|
| 37 |
"_num_timesteps_at_start": 0,
|
| 38 |
"seed": null,
|
| 39 |
"action_noise": null,
|
| 40 |
+
"start_time": 1681288652863329946,
|
| 41 |
+
"learning_rate": 0.0001,
|
| 42 |
"tensorboard_log": null,
|
| 43 |
"lr_schedule": {
|
| 44 |
":type:": "<class 'function'>",
|
| 45 |
+
":serialized:": "gAWVwwIAAAAAAACMF2Nsb3VkcGlja2xlLmNsb3VkcGlja2xllIwOX21ha2VfZnVuY3Rpb26Uk5QoaACMDV9idWlsdGluX3R5cGWUk5SMCENvZGVUeXBllIWUUpQoSwFLAEsASwFLAUsTQwSIAFMAlE6FlCmMAV+UhZSMSC91c3IvbG9jYWwvbGliL3B5dGhvbjMuOS9kaXN0LXBhY2thZ2VzL3N0YWJsZV9iYXNlbGluZXMzL2NvbW1vbi91dGlscy5weZSMBGZ1bmOUS4JDAgABlIwDdmFslIWUKXSUUpR9lCiMC19fcGFja2FnZV9flIwYc3RhYmxlX2Jhc2VsaW5lczMuY29tbW9ulIwIX19uYW1lX1+UjB5zdGFibGVfYmFzZWxpbmVzMy5jb21tb24udXRpbHOUjAhfX2ZpbGVfX5SMSC91c3IvbG9jYWwvbGliL3B5dGhvbjMuOS9kaXN0LXBhY2thZ2VzL3N0YWJsZV9iYXNlbGluZXMzL2NvbW1vbi91dGlscy5weZR1Tk5oAIwQX21ha2VfZW1wdHlfY2VsbJSTlClSlIWUdJRSlIwcY2xvdWRwaWNrbGUuY2xvdWRwaWNrbGVfZmFzdJSMEl9mdW5jdGlvbl9zZXRzdGF0ZZSTlGgffZR9lChoFmgNjAxfX3F1YWxuYW1lX1+UjBljb25zdGFudF9mbi48bG9jYWxzPi5mdW5jlIwPX19hbm5vdGF0aW9uc19flH2UjA5fX2t3ZGVmYXVsdHNfX5ROjAxfX2RlZmF1bHRzX1+UTowKX19tb2R1bGVfX5RoF4wHX19kb2NfX5ROjAtfX2Nsb3N1cmVfX5RoAIwKX21ha2VfY2VsbJSTlEc/Gjbi6xxDLYWUUpSFlIwXX2Nsb3VkcGlja2xlX3N1Ym1vZHVsZXOUXZSMC19fZ2xvYmFsc19flH2UdYaUhlIwLg=="
|
| 46 |
},
|
| 47 |
"_last_obs": {
|
| 48 |
":type:": "<class 'numpy.ndarray'>",
|
| 49 |
+
":serialized:": "gAWVNQIAAAAAAACMEm51bXB5LmNvcmUubnVtZXJpY5SMC19mcm9tYnVmZmVylJOUKJbAAQAAAAAAACakjz/Kkc8+UTAqP5bTUz+xgeM/Ryogv5sWpz5YAR8/Q7Z0v9cNiL1rmhs+q3q4v6yaRD+ASsY/YF3bv/1WUT8Ouc6+XZN+vmm9k79wnkjAoRXIvwwywzwI0DM/EiAdPW9XuL+kt8Q+lvP1PjbKXj9RuZI++BBiP7aJBj9CwZg9k7C9P/zmvT7v7JQ/T+xBPv9Nj78gT0A85Q6APutZer8UT+2/1IOEP6RL1b9tk9e9Dce6vTm6Zb2HHBE/KzGGPbVFRb7m55G/kLLxvkp9cz1vV7i/pLfEPpbz9T42yl4/oREPP+YlYr86dAq+1iB4v/nUFz9WsY+6QF3kProGBr1lh4c/5uBuPhHbwz/J4o28gXK0P+sXWj760Ku+jgUSPh0K5T6f4L893q+SPdaf/j2bK8Q/Tb1puv7dbD+p7wW8y8ExP6S3xD6W8/U+NspePxYXfD9+DHg/FonzPgOFwj8pLVc/7C0yPpKqpj+aIYg/slaSvw9/UL/y6kk/QONUP/qJGsAbbSU+1G3Bv8dV7r/joYm/mGQvPk4Zlr9xXKs/WuXCP+MDK7++vES/zIIFQMvBMT/zkibAlvP1Po0Uk7+UjAVudW1weZSMBWR0eXBllJOUjAJmNJSJiIeUUpQoSwOMATyUTk5OSv////9K/////0sAdJRiSwRLHIaUjAFDlHSUUpQu"
|
| 50 |
},
|
| 51 |
"_last_episode_starts": {
|
| 52 |
":type:": "<class 'numpy.ndarray'>",
|
|
|
|
| 54 |
},
|
| 55 |
"_last_original_obs": {
|
| 56 |
":type:": "<class 'numpy.ndarray'>",
|
| 57 |
+
":serialized:": "gAWVNQIAAAAAAACMEm51bXB5LmNvcmUubnVtZXJpY5SMC19mcm9tYnVmZmVylJOUKJbAAQAAAAAAAAAAAACBcsi2AACAPwAAAAAAAAAAAAAAAAAAAAAAAACAv2AIvAAAAACfDNm/AAAAAE/8GL0AAAAAIxH6PwAAAAAlHfm9AAAAAGOQ3z8AAAAApx3kPQAAAAAPkeu/AAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAcQaHtgAAgD8AAAAAAAAAAAAAAAAAAAAAAAAAgKGBwD0AAAAAt5HlvwAAAAC6sq07AAAAANWZ6z8AAAAAaTo2vQAAAABvhQBAAAAAAKeMQD0AAAAAdfb+vwAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAFnP7DQAAIA/AAAAAAAAAAAAAAAAAAAAAAAAAIAMWJS7AAAAAGcu7L8AAAAAvT/lvQAAAACan+w/AAAAAIxUAz4AAAAA9e3pPwAAAABX6Oe6AAAAAKVI/r8AAAAAAAAAAAAAAAAAAAAAAAAAAAAAAADCL/41AACAPwAAAAAAAAAAAAAAAAAAAAAAAACAm0GSvQAAAAA+Oei/AAAAAC613rwAAAAAji/wPwAAAAAmw9Y9AAAAAMHR+D8AAAAAfvx1PQAAAAAu0vO/AAAAAAAAAAAAAAAAAAAAAAAAAACUjAVudW1weZSMBWR0eXBllJOUjAJmNJSJiIeUUpQoSwOMATyUTk5OSv////9K/////0sAdJRiSwRLHIaUjAFDlHSUUpQu"
|
| 58 |
},
|
| 59 |
"_episode_num": 0,
|
| 60 |
"use_sde": true,
|
|
|
|
| 63 |
"_stats_window_size": 100,
|
| 64 |
"ep_info_buffer": {
|
| 65 |
":type:": "<class 'collections.deque'>",
|
| 66 |
+
":serialized:": "gAWVRAwAAAAAAACMC2NvbGxlY3Rpb25zlIwFZGVxdWWUk5QpS2SGlFKUKH2UKIwBcpRHQJidmUs4DLeMAWyUTegDjAF0lEdAwgVsB8QZoHV9lChoBkdAlHO8Rcu8LGgHTegDaAhHQMIG6sJ6Y3N1fZQoaAZHQJfHA/qxC6ZoB03oA2gIR0DCBwzEvTPTdX2UKGgGR0CY9KS5AhStaAdN6ANoCEdAwgcS/M4cWHV9lChoBkdAlcHHPJJXhmgHTegDaAhHQMIJ5N+TeO51fZQoaAZHQJfWdZkkKNRoB03oA2gIR0DCCyL+WGATdX2UKGgGR0CYK/BOYYzjaAdN6ANoCEdAwgtdUjLSu3V9lChoBkdAl3hrVJ+UhWgHTegDaAhHQMILZvGp++d1fZQoaAZHQJV3Qlu3trtoB03oA2gIR0DCD3SnpB5YdX2UKGgGR0CZBhC53C9AaAdN6ANoCEdAwhDA+tbLU3V9lChoBkdAlcLPDxb0OGgHTegDaAhHQMIQ6Sr5qM51fZQoaAZHQJZZbOIInjRoB03oA2gIR0DCEO+mFajfdX2UKGgGR0CbScNVzZHvaAdN6ANoCEdAwhOYLkS26XV9lChoBkdAmAOTJ+2E02gHTegDaAhHQMIVd20zCUJ1fZQoaAZHQJS6gSYgJTloB03oA2gIR0DCFa7XnQpndX2UKGgGR0CWKX8rI5o5aAdN6ANoCEdAwhW46qbSZ3V9lChoBkdAlU9KVD8cdmgHTegDaAhHQMIY8U8NhE11fZQoaAZHQJYtLyrgflpoB03oA2gIR0DCGi18qnWKdX2UKGgGR0CWsKos7MgVaAdN6ANoCEdAwhpNcVxjrnV9lChoBkdAmWsmFzuF6GgHTegDaAhHQMIaU9DhLoR1fZQoaAZHQJe7dnBciW5oB03oA2gIR0DCHW0EJSiudX2UKGgGR0CXmfHP/rB1aAdN6ANoCEdAwh9qQz1scnV9lChoBkdAmFsAk9lmOGgHTegDaAhHQMIflrlmvnt1fZQoaAZHQJiGZlI3BHloB03oA2gIR0DCH51eUpuudX2UKGgGR0CXJF5XU6PsaAdN6ANoCEdAwiJ2lE7W/nV9lChoBkdAlJTgIUrTY2gHTegDaAhHQMIjvYKx9oh1fZQoaAZHQJZE6WjXWe9oB03oA2gIR0DCI+WLzf78dX2UKGgGR0CaUkAn2IweaAdN6ANoCEdAwiPsVzIV/XV9lChoBkdAla9c4o7V8WgHTegDaAhHQMIn3KJl8PZ1fZQoaAZHQJdKVWkrPMVoB03oA2gIR0DCKSBOLzf8dX2UKGgGR0CZW7KiwjdIaAdN6ANoCEdAwik+/zJ6p3V9lChoBkdAlcGvxUedTmgHTegDaAhHQMIpRYcvM8p1fZQoaAZHQJg3bxy4nWtoB03oA2gIR0DCK/17jT8YdX2UKGgGR0CWUQrZrYXgaAdN6ANoCEdAwi12AVfu1HV9lChoBkdAlSlLWmP5pWgHTegDaAhHQMItrEVnEl51fZQoaAZHQJhkDdnCfpVoB03oA2gIR0DCLbXn2ZiNdX2UKGgGR0CY71RkmQbNaAdN6ANoCEdAwjGTZQpF1HV9lChoBkdAm+YKUmlZYGgHTegDaAhHQMIy59/jKgZ1fZQoaAZHQJXNJIsiB5JoB03oA2gIR0DCMwoe3hGZdX2UKGgGR0CZTc/T9bX6aAdN6ANoCEdAwjMQmwaBJHV9lChoBkdAkm3ZQ+EAYGgHTegDaAhHQMI128dxQzl1fZQoaAZHQJhtd+z+m3xoB03oA2gIR0DCN+KobXHzdX2UKGgGR0CWcaq4pc5baAdN6ANoCEdAwjgec2BJ7XV9lChoBkdAmRDK5sj3VWgHTegDaAhHQMI4KNxdY4h1fZQoaAZHQJdY9Gqgh8poB03oA2gIR0DCO0WycCo1dX2UKGgGR0CWQHHVPN3XaAdN6ANoCEdAwjyo5paibnV9lChoBkdAl87JjlPrOmgHTegDaAhHQMI80QJPZZl1fZQoaAZHQJtjAuAZsKtoB03oA2gIR0DCPNeUfPondX2UKGgGR0CXWFRSxZ+yaAdN6ANoCEdAwkBfY+0PYnV9lChoBkdAmckZCngpB2gHTegDaAhHQMJCBrfk3jx1fZQoaAZHQJdlzWvr4WVoB03oA2gIR0DCQioLNOdodX2UKGgGR0CWfFXSjQAuaAdN6ANoCEdAwkIxUWEbpHV9lChoBkdAl/gE2pAD72gHTegDaAhHQMJEw5lvqC91fZQoaAZHQJao+9K28ZloB03oA2gIR0DCRf/gUDdQdX2UKGgGR0CbHnQWepXIaAdN6ANoCEdAwkYnP+n623V9lChoBkdAmN1BwVCXyGgHTegDaAhHQMJGLOkLx7R1fZQoaAZHQJWuaKAJ9iNoB03oA2gIR0DCSk3qTr3TdX2UKGgGR0CYcd4NqgyuaAdN6ANoCEdAwkuY/qxC6nV9lChoBkdAlx6QNwzch2gHTegDaAhHQMJLv1Muez51fZQoaAZHQJjAk2Hck+poB03oA2gIR0DCS8bm6oVEdX2UKGgGR0CZ+sqkdmxuaAdN6ANoCEdAwk6OpWFN+XV9lChoBkdAl4yo5ggHNWgHTegDaAhHQMJQJ2M85jp1fZQoaAZHQJU/t7AtWdVoB03oA2gIR0DCUFmr4nF6dX2UKGgGR0CaZUIkZ75VaAdN6ANoCEdAwlBihL5AQnV9lChoBkdAm3N4tQKrrGgHTegDaAhHQMJT96/h2nt1fZQoaAZHQJW4aDlHSWtoB03oA2gIR0DCVVfxSYPYdX2UKGgGR0CYc96Rhc7haAdN6ANoCEdAwlV8bAk9lnV9lChoBkdAmoRFJYkmhWgHTegDaAhHQMJVhDEvTPV1fZQoaAZHQJl2HwazeGhoB03oA2gIR0DCWNcbJfY0dX2UKGgGR0CXfyoIv8IiaAdN6ANoCEdAwlq8814xDnV9lChoBkdAk5ly5qdpZmgHTegDaAhHQMJa4fsNUfh1fZQoaAZHQJdxQxcmjTNoB03oA2gIR0DCWuiXlbNbdX2UKGgGR0CQ8ohoM8YAaAdN6ANoCEdAwl2OHoHLR3V9lChoBkdAlubBIre67WgHTegDaAhHQMJe434CZF51fZQoaAZHQJjotf1HvttoB03oA2gIR0DCXwh8IAwPdX2UKGgGR0CZsFIsiB5HaAdN6ANoCEdAwl8P5gPVeHV9lChoBkdAmOF20Re1KGgHTegDaAhHQMJi23Vsk6d1fZQoaAZHQJXsmydFvydoB03oA2gIR0DCZCPOObRXdX2UKGgGR0CZmlRg7YChaAdN6ANoCEdAwmRDqKP4mHV9lChoBkdAmE+w1rIo3WgHTegDaAhHQMJkSYKx9oh1fZQoaAZHQJYBi3XqZ+hoB03oA2gIR0DCZxunjyWidX2UKGgGR0CXHO3Ehq0uaAdN6ANoCEdAwmi3wd8zAXV9lChoBkdAl9eXY150KmgHTegDaAhHQMJo7nJ9y951fZQoaAZHQJiEnBj4HopoB03oA2gIR0DCaPeQMhHLdX2UKGgGR0CZVcRGc4HYaAdN6ANoCEdAwmy2r+YMOXV9lChoBkdAl2YcUAT7EmgHTegDaAhHQMJt6pm29ct1fZQoaAZHQJo0Q99tuUFoB03oA2gIR0DCbg6FEiMYdX2UKGgGR0CZgSEGqxTsaAdN6ANoCEdAwm4Vr6ciGHV9lChoBkdAmSVnPE87p2gHTegDaAhHQMJw6Z4W1tx1fZQoaAZHQJmDhLYf4h5oB03oA2gIR0DCcteu9vjwdX2UKGgGR0CXrzYQarFPaAdN6ANoCEdAwnMQRhc7hnV9lChoBkdAlrxx9b5dnmgHTegDaAhHQMJzGtTkyUN1fZQoaAZHQJYc2r8zhxZoB03oA2gIR0DCdiGcSXdCdX2UKGgGR0CYVeCa7VawaAdN6ANoCEdAwneEgIQe3nV9lChoBkdAmNflyeZof2gHTegDaAhHQMJ3pmvfTCt1fZQoaAZHQJkxH6eoUBZoB03oA2gIR0DCd60INVindX2UKGgGR0CZJXBUaQ3haAdN6ANoCEdAwntvYpUgjnV9lChoBkdAmU9/GlyimGgHTegDaAhHQMJ81gPNFBp1fZQoaAZHQJnwINKAavRoB03oA2gIR0DCfPpxBE8adX2UKGgGR0CYmfpobn5jaAdN6ANoCEdAwn0Bz8P4EnVlLg=="
|
| 67 |
},
|
| 68 |
"ep_success_buffer": {
|
| 69 |
":type:": "<class 'collections.deque'>",
|
a2c-AntBulletEnv-v0/policy.optimizer.pth
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
-
size
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:b720c4c505ef920ccdb0804b474d841cf5119f56f904d2246ecba9f599f00f6f
|
| 3 |
+
size 56062
|
a2c-AntBulletEnv-v0/policy.pth
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
-
size
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:7f60fb7bf909dab05e132f8b385afb808076ba13626ddb3138f70efb2fbebd19
|
| 3 |
+
size 56766
|
a2c-AntBulletEnv-v0/system_info.txt
CHANGED
|
@@ -2,6 +2,6 @@
|
|
| 2 |
- Python: 3.9.16
|
| 3 |
- Stable-Baselines3: 1.8.0
|
| 4 |
- PyTorch: 2.0.0+cu118
|
| 5 |
-
- GPU Enabled:
|
| 6 |
- Numpy: 1.22.4
|
| 7 |
- Gym: 0.21.0
|
|
|
|
| 2 |
- Python: 3.9.16
|
| 3 |
- Stable-Baselines3: 1.8.0
|
| 4 |
- PyTorch: 2.0.0+cu118
|
| 5 |
+
- GPU Enabled: False
|
| 6 |
- Numpy: 1.22.4
|
| 7 |
- Gym: 0.21.0
|
config.json
CHANGED
|
@@ -1 +1 @@
|
|
| 1 |
-
{"policy_class": {":type:": "<class 'abc.ABCMeta'>", ":serialized:": "gAWVOwAAAAAAAACMIXN0YWJsZV9iYXNlbGluZXMzLmNvbW1vbi5wb2xpY2llc5SMEUFjdG9yQ3JpdGljUG9saWN5lJOULg==", "__module__": "stable_baselines3.common.policies", "__doc__": "\n Policy class for actor-critic algorithms (has both policy and value prediction).\n Used by A2C, PPO and the likes.\n\n :param observation_space: Observation space\n :param action_space: Action space\n :param lr_schedule: Learning rate schedule (could be constant)\n :param net_arch: The specification of the policy and value networks.\n :param activation_fn: Activation function\n :param ortho_init: Whether to use or not orthogonal initialization\n :param use_sde: Whether to use State Dependent Exploration or not\n :param log_std_init: Initial value for the log standard deviation\n :param full_std: Whether to use (n_features x n_actions) parameters\n for the std instead of only (n_features,) when using gSDE\n :param use_expln: Use ``expln()`` function instead of ``exp()`` to ensure\n a positive standard deviation (cf paper). It allows to keep variance\n above zero and prevent it from growing too fast. In practice, ``exp()`` is usually enough.\n :param squash_output: Whether to squash the output using a tanh function,\n this allows to ensure boundaries when using gSDE.\n :param features_extractor_class: Features extractor to use.\n :param features_extractor_kwargs: Keyword arguments\n to pass to the features extractor.\n :param share_features_extractor: If True, the features extractor is shared between the policy and value networks.\n :param normalize_images: Whether to normalize images or not,\n dividing by 255.0 (True by default)\n :param optimizer_class: The optimizer to use,\n ``th.optim.Adam`` by default\n :param optimizer_kwargs: Additional keyword arguments,\n excluding the learning rate, to pass to the optimizer\n ", "__init__": "<function ActorCriticPolicy.__init__ at 0x7fec6ce7f280>", "_get_constructor_parameters": "<function ActorCriticPolicy._get_constructor_parameters at 0x7fec6ce7f310>", "reset_noise": "<function ActorCriticPolicy.reset_noise at 0x7fec6ce7f3a0>", "_build_mlp_extractor": "<function ActorCriticPolicy._build_mlp_extractor at 0x7fec6ce7f430>", "_build": "<function ActorCriticPolicy._build at 0x7fec6ce7f4c0>", "forward": "<function ActorCriticPolicy.forward at 0x7fec6ce7f550>", "extract_features": "<function ActorCriticPolicy.extract_features at 0x7fec6ce7f5e0>", "_get_action_dist_from_latent": "<function ActorCriticPolicy._get_action_dist_from_latent at 0x7fec6ce7f670>", "_predict": "<function ActorCriticPolicy._predict at 0x7fec6ce7f700>", "evaluate_actions": "<function ActorCriticPolicy.evaluate_actions at 0x7fec6ce7f790>", "get_distribution": "<function ActorCriticPolicy.get_distribution at 0x7fec6ce7f820>", "predict_values": "<function ActorCriticPolicy.predict_values at 0x7fec6ce7f8b0>", "__abstractmethods__": "frozenset()", "_abc_impl": "<_abc._abc_data object at 0x7fec6ce802c0>"}, "verbose": 1, "policy_kwargs": {":type:": "<class 'dict'>", ":serialized:": "gAWVowAAAAAAAAB9lCiMDGxvZ19zdGRfaW5pdJRK/v///4wKb3J0aG9faW5pdJSJjA9vcHRpbWl6ZXJfY2xhc3OUjBN0b3JjaC5vcHRpbS5ybXNwcm9wlIwHUk1TcHJvcJSTlIwQb3B0aW1pemVyX2t3YXJnc5R9lCiMBWFscGhhlEc/764UeuFHrowDZXBzlEc+5Pi1iONo8YwMd2VpZ2h0X2RlY2F5lEsAdXUu", "log_std_init": -2, "ortho_init": false, "optimizer_class": "<class 'torch.optim.rmsprop.RMSprop'>", "optimizer_kwargs": {"alpha": 0.99, "eps": 1e-05, "weight_decay": 0}}, "num_timesteps": 2000000, "_total_timesteps": 2000000, "_num_timesteps_at_start": 0, "seed": null, "action_noise": null, "start_time": 1681226124513463565, "learning_rate": 0.00096, "tensorboard_log": null, "lr_schedule": {":type:": "<class 'function'>", ":serialized:": "gAWVwwIAAAAAAACMF2Nsb3VkcGlja2xlLmNsb3VkcGlja2xllIwOX21ha2VfZnVuY3Rpb26Uk5QoaACMDV9idWlsdGluX3R5cGWUk5SMCENvZGVUeXBllIWUUpQoSwFLAEsASwFLAUsTQwSIAFMAlE6FlCmMAV+UhZSMSC91c3IvbG9jYWwvbGliL3B5dGhvbjMuOS9kaXN0LXBhY2thZ2VzL3N0YWJsZV9iYXNlbGluZXMzL2NvbW1vbi91dGlscy5weZSMBGZ1bmOUS4JDAgABlIwDdmFslIWUKXSUUpR9lCiMC19fcGFja2FnZV9flIwYc3RhYmxlX2Jhc2VsaW5lczMuY29tbW9ulIwIX19uYW1lX1+UjB5zdGFibGVfYmFzZWxpbmVzMy5jb21tb24udXRpbHOUjAhfX2ZpbGVfX5SMSC91c3IvbG9jYWwvbGliL3B5dGhvbjMuOS9kaXN0LXBhY2thZ2VzL3N0YWJsZV9iYXNlbGluZXMzL2NvbW1vbi91dGlscy5weZR1Tk5oAIwQX21ha2VfZW1wdHlfY2VsbJSTlClSlIWUdJRSlIwcY2xvdWRwaWNrbGUuY2xvdWRwaWNrbGVfZmFzdJSMEl9mdW5jdGlvbl9zZXRzdGF0ZZSTlGgffZR9lChoFmgNjAxfX3F1YWxuYW1lX1+UjBljb25zdGFudF9mbi48bG9jYWxzPi5mdW5jlIwPX19hbm5vdGF0aW9uc19flH2UjA5fX2t3ZGVmYXVsdHNfX5ROjAxfX2RlZmF1bHRzX1+UTowKX19tb2R1bGVfX5RoF4wHX19kb2NfX5ROjAtfX2Nsb3N1cmVfX5RoAIwKX21ha2VfY2VsbJSTlEc/T3UQTVUdaYWUUpSFlIwXX2Nsb3VkcGlja2xlX3N1Ym1vZHVsZXOUXZSMC19fZ2xvYmFsc19flH2UdYaUhlIwLg=="}, "_last_obs": {":type:": "<class 'numpy.ndarray'>", ":serialized:": "gAWVNQIAAAAAAACMEm51bXB5LmNvcmUubnVtZXJpY5SMC19mcm9tYnVmZmVylJOUKJbAAQAAAAAAAGt/bj/eCna+Ea7xPolotr8G8Ng/G0EWP4+lA7841T299q1aPlcNA8CttWa/KWM3PH9UfL/46Zo+lKXEvVm2ML9G9Em+gCb4P8T92z4NTipAkxHEPQW6I78+sP0/Tk+5vuU2C8DaoZM+5tcJwImANj+Czpc/eOa+v6slOsBayAI/BfffPYtHwT2sjxo/TrL8vtKghL8mQYBACJIcQH1Pj0AiLEy/EAIjv+jKhb/gLDs/VRzUP/mwTL97IYy+SrPXvub86T/T4MQ9Tge9PwrpoT7lNgvA2qGTPhe47T6JgDY/Ip2BP/tuer9LuYi+/6kkP+O4UL+PKSa/rrNTP0lDc7+DRrI911UuwPhF9T9L51/Aq7pUvxwyuj8PHjy/mjGUv0q9vb/DCXU/lxwZP7/h3T+FBiI/VaZxvsoNpz8q1BI/5TYLwPn0XcAXuO0+iYA2P10C7j7jK7K/cVqcv8RiBL4jhyi+hMpkPUmRvj86/uC+KTHlvxpuID2rF0K/pC3HPzIq9L4QQCBAReqVvzFiFz+CPCQ/8GmBP3IthT9/meW+UDJdPybUAUDn1Yw9fDFpPuU2C8DaoZM+F7jtPomANj+UjAVudW1weZSMBWR0eXBllJOUjAJmNJSJiIeUUpQoSwOMATyUTk5OSv////9K/////0sAdJRiSwRLHIaUjAFDlHSUUpQu"}, "_last_episode_starts": {":type:": "<class 'numpy.ndarray'>", ":serialized:": "gAWVdwAAAAAAAACMEm51bXB5LmNvcmUubnVtZXJpY5SMC19mcm9tYnVmZmVylJOUKJYEAAAAAAAAAAAAAACUjAVudW1weZSMBWR0eXBllJOUjAJiMZSJiIeUUpQoSwOMAXyUTk5OSv////9K/////0sAdJRiSwSFlIwBQ5R0lFKULg=="}, "_last_original_obs": {":type:": "<class 'numpy.ndarray'>", ":serialized:": "gAWVNQIAAAAAAACMEm51bXB5LmNvcmUubnVtZXJpY5SMC19mcm9tYnVmZmVylJOUKJbAAQAAAAAAAAAAAAAjRi62AACAPwAAAAAAAAAAAAAAAAAAAAAAAACA5m9dPQAAAACKDt2/AAAAAJWd1zwAAAAA+ovgPwAAAAB3Rxy8AAAAAIdl+z8AAAAA0kOZPQAAAACf5Om/AAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAzPPrNAAAgD8AAAAAAAAAAAAAAAAAAAAAAAAAgEvevr0AAAAASN3fvwAAAACc9Mq9AAAAAOU+/z8AAAAASfvtPQAAAAAQ+OM/AAAAAExuvD0AAAAAhfjqvwAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAM7MqTYAAIA/AAAAAAAAAAAAAAAAAAAAAAAAAIAq5G29AAAAAK9p/L8AAAAAf2jmPQAAAAAyt+U/AAAAAH/75T0AAAAAqQ3iPwAAAADgBoY9AAAAAF38678AAAAAAAAAAAAAAAAAAAAAAAAAAAAAAACftnO1AACAPwAAAAAAAAAAAAAAAAAAAAAAAACAD/4IPQAAAAAO1/W/AAAAAMQXuD0AAAAAG7zdPwAAAABReb48AAAAAHk//j8AAAAAXurvPQAAAAAzzey/AAAAAAAAAAAAAAAAAAAAAAAAAACUjAVudW1weZSMBWR0eXBllJOUjAJmNJSJiIeUUpQoSwOMATyUTk5OSv////9K/////0sAdJRiSwRLHIaUjAFDlHSUUpQu"}, "_episode_num": 0, "use_sde": true, "sde_sample_freq": -1, "_current_progress_remaining": 0.0, "_stats_window_size": 100, "ep_info_buffer": {":type:": "<class 'collections.deque'>", ":serialized:": "gAWVQwwAAAAAAACMC2NvbGxlY3Rpb25zlIwFZGVxdWWUk5QpS2SGlFKUKH2UKIwBcpRHQJJn9z+3pfSMAWyUTegDjAF0lEdAq06n5N47inV9lChoBkdAkqeQwj+rEWgHTegDaAhHQKtSE72+PBB1fZQoaAZHQJKYLjENvwVoB03oA2gIR0CrWUSJTER8dX2UKGgGR0CQGj0PpY9xaAdN6ANoCEdAq1lxVsDW9XV9lChoBkdAkU2e3Ytg8mgHTegDaAhHQKta/ViF0xN1fZQoaAZHQIvtWIGhVVBoB03oA2gIR0CrXydPk7wKdX2UKGgGR0CSW1D6WPcSaAdN6ANoCEdAq2jxujynUHV9lChoBkdAkwq+k1uR92gHTegDaAhHQKtpHNB4Uvh1fZQoaAZHQJRWC/xlQMxoB03oA2gIR0Crap/i5uqFdX2UKGgGR0CR4bSk0rLAaAdN6ANoCEdAq23/rY5DJHV9lChoBkdAlUa7hrFfiWgHTegDaAhHQKt1DvrGBFx1fZQoaAZHQJZsZUzbeuVoB03oA2gIR0CrdTon0CiidX2UKGgGR0CT6jYzSCvpaAdN6ANoCEdAq3a8Fr2xp3V9lChoBkdAltQlyzXz2GgHTegDaAhHQKt6M3kPtlZ1fZQoaAZHQJX6TiZOSGJoB03oA2gIR0CrhH8TakAQdX2UKGgGR0CTvbA6Mir1aAdN6ANoCEdAq4TFz0Yj0XV9lChoBkdAlzqLmlqJuWgHTegDaAhHQKuGZTrE9+x1fZQoaAZHQJaqeWjXWe9oB03oA2gIR0CrifBbnoxIdX2UKGgGR0CWcB0Yj0L/aAdN6ANoCEdAq5DnSa3I/HV9lChoBkdAlhCKpgkTpWgHTegDaAhHQKuREMRYigV1fZQoaAZHQJV9WvwEyL1oB03oA2gIR0Crkqp2ECeVdX2UKGgGR0CWSf8Sf16FaAdN6ANoCEdAq5ZmALApKHV9lChoBkdAkjT6PKdQPGgHTegDaAhHQKufxBQemvZ1fZQoaAZHQIyOnGwRoRJoB03oA2gIR0CroA4IBzV+dX2UKGgGR0CVMVcG1QZXaAdN6ANoCEdAq6Jt/QSi/XV9lChoBkdAk7U7mMfigmgHTegDaAhHQKumFleWv8t1fZQoaAZHQJCH4qlP8AJoB03oA2gIR0CrrT7TUiIMdX2UKGgGR0CSLz3ueBhAaAdN6ANoCEdAq61rTBqKxnV9lChoBkdAkQeNAX2ugmgHTegDaAhHQKuu+pXIU8F1fZQoaAZHQJL7jsyBTXJoB03oA2gIR0Crsnei8FpxdX2UKGgGR0CR1fPFvQ4TaAdN6ANoCEdAq7qtTFVDKHV9lChoBkdAk+8YBvJiiWgHTegDaAhHQKu68JTl1bJ1fZQoaAZHQJOaPLfUF0RoB03oA2gIR0CrvVmK64DtdX2UKGgGR0CSf7SLZSNwaAdN6ANoCEdAq8IhTZQHiXV9lChoBkdAk5hwLRa5gGgHTegDaAhHQKvJW0CzTnd1fZQoaAZHQJPU0XyiEg5oB03oA2gIR0CryYd+XqqwdX2UKGgGR0CU5GMFlkH2aAdN6ANoCEdAq8sImCyyEHV9lChoBkdAYeQsQNCqqGgHS6poCEdAq8tvDUExI3V9lChoBkdAkVwkdzXBg2gHTegDaAhHQKvOcDsdDIB1fZQoaAZHQJVSmSX+l0poB03oA2gIR0Cr1n2nKnvVdX2UKGgGR0CSqgQxesxPaAdN6ANoCEdAq9ip+OOsDHV9lChoBkdAkifWuX/o7mgHTegDaAhHQKvZOD3/PxB1fZQoaAZHQJaD5VJcxCZoB03oA2gIR0Cr3gKubI91dX2UKGgGR0CUDEYAKfFraAdN6ANoCEdAq+W+ZgG8mXV9lChoBkdAlWld5Y5ksmgHTegDaAhHQKvnQgK4QSV1fZQoaAZHQIwT6qCHymRoB03oA2gIR0Cr56M8gZCOdX2UKGgGR0CVyC+GXXyzaAdN6ANoCEdAq+rBL/S6UnV9lChoBkdAlAzCHM2WIGgHTegDaAhHQKvx/sTFl051fZQoaAZHQJHf4S7GvOhoB03oA2gIR0Cr872BJ7LMdX2UKGgGR0CTDcTnJT2naAdN6ANoCEdAq/RPJPqLTHV9lChoBkdAlPICWeHzpWgHTegDaAhHQKv46aNMoMN1fZQoaAZHQI6HmjASFoNoB03oA2gIR0CsAdlN+LFXdX2UKGgGR0CQvyvB7/n4aAdN6ANoCEdArANi8lHBlHV9lChoBkdAkooJMxoIwGgHTegDaAhHQKwDxF0gbId1fZQoaAZHQJOUJZeRgZ1oB03oA2gIR0CsBtr9MsYmdX2UKGgGR0CBxGT4cm0FaAdN6ANoCEdArA46Ss8xK3V9lChoBkdAhLuOavzOHGgHTegDaAhHQKwPzKSxJNF1fZQoaAZHQI20l+CsfaJoB03oA2gIR0CsEC7zshPkdX2UKGgGR0CRp7JRwZO0aAdN6ANoCEdArBQsLa24NXV9lChoBkdAiKxkG7jDK2gHTegDaAhHQKwd8wWWQfZ1fZQoaAZHQJGUvo/zJ6poB03oA2gIR0CsH3yHM2WIdX2UKGgGR0CSv4B9Cu2aaAdN6ANoCEdArB/Zw++ueXV9lChoBkdAlDozxgAp8WgHTegDaAhHQKwi5pKSPlx1fZQoaAZHQJLvUnmaH9FoB03oA2gIR0CsKjFaKUFCdX2UKGgGR0CTRYOVgQYlaAdN6ANoCEdArCu4ZMtbtHV9lChoBkdAkdXt7SiM52gHTegDaAhHQKwsGX4TK1Z1fZQoaAZHQIIWrzPKMehoB03oA2gIR0CsLzV5jYqYdX2UKGgGR0CSUTqWTot+aAdN6ANoCEdArDoPvnbItHV9lChoBkdAi222vbGm12gHTegDaAhHQKw7kmj0tiB1fZQoaAZHQJLekyeqaPVoB03oA2gIR0CsO/me+VTrdX2UKGgGR0CHduw9JSR9aAdN6ANoCEdArD790A93bHV9lChoBkdAi8FZpi7TUmgHTegDaAhHQKxGGhY/3WZ1fZQoaAZHQJGMG25QP7NoB03oA2gIR0CsR5kQwsXjdX2UKGgGR0COOE0TDfm+aAdN6ANoCEdArEf/E87p3XV9lChoBkdAkHJ9To+wDGgHTegDaAhHQKxLKGHHmzV1fZQoaAZHQJGUdc3VColoB03oA2gIR0CsVQ6ttALRdX2UKGgGR0CQ6SL9MsYmaAdN6ANoCEdArFdZ9b5dnnV9lChoBkdAjqmaya/h2mgHTegDaAhHQKxXvBOYYzl1fZQoaAZHQI5l4llbu+hoB03oA2gIR0CsWs9QO4G2dX2UKGgGR0CLeUDbJwKjaAdN6ANoCEdArGIjKgZjx3V9lChoBkdAkKzjr/sE7mgHTegDaAhHQKxjqh8IAwR1fZQoaAZHQIQIllRP421oB03oA2gIR0CsZAoToMa1dX2UKGgGR0CQ69V/+bVjaAdN6ANoCEdArGcPDm8ujHV9lChoBkdAi1SbAckt3GgHTegDaAhHQKxvrzySV4Z1fZQoaAZHQI0u/5HmRvFoB03oA2gIR0Cscg7TlT3qdX2UKGgGR0CRlkYzSCvpaAdN6ANoCEdArHKpwOvt+nV9lChoBkdAjekEGqxTsWgHTegDaAhHQKx2vgzguRN1fZQoaAZHQIonmDcuandoB03oA2gIR0CsfkDAzpHJdX2UKGgGR0CMYcD9wWFfaAdN6ANoCEdArH/SAavRq3V9lChoBkdAgeiGhufmLmgHTegDaAhHQKyAOdMCcPR1fZQoaAZHQJL7WlchTwVoB03oA2gIR0Csg0ZB1LamdX2UKGgGR0CUDivVVghKaAdN6ANoCEdArIs+lGgBcXV9lChoBkdAkheBvm5lOGgHTegDaAhHQKyNb5ylvZR1fZQoaAZHQJNCHnq3VkNoB03oA2gIR0CsjgN+LFXJdX2UKGgGR0CRGjzsyBTXaAdN6ANoCEdArJLGrIYFaHV9lChoBkdAkv/eotL+P2gHTegDaAhHQKyaN6u4gA91fZQoaAZHQIrLhVp9JBhoB03oA2gIR0Csm8Cr92ovdX2UKGgGR0CL57b5dnkDaAdN6ANoCEdArJwnD3ueBnV9lChoBkdAkcCljZtelmgHTegDaAhHQKyfTyNn5BV1fZQoaAZHQIAQCfjCHh1oB027AmgIR0CsourCemNzdWUu"}, "ep_success_buffer": {":type:": "<class 'collections.deque'>", ":serialized:": "gAWVIAAAAAAAAACMC2NvbGxlY3Rpb25zlIwFZGVxdWWUk5QpS2SGlFKULg=="}, "_n_updates": 62500, "n_steps": 8, "gamma": 0.99, "gae_lambda": 0.9, "ent_coef": 0.0, "vf_coef": 0.4, "max_grad_norm": 0.5, "normalize_advantage": false, "observation_space": {":type:": "<class 'gym.spaces.box.Box'>", ":serialized:": "gAWVZwIAAAAAAACMDmd5bS5zcGFjZXMuYm94lIwDQm94lJOUKYGUfZQojAVkdHlwZZSMBW51bXB5lGgFk5SMAmY0lImIh5RSlChLA4wBPJROTk5K/////0r/////SwB0lGKMBl9zaGFwZZRLHIWUjANsb3eUjBJudW1weS5jb3JlLm51bWVyaWOUjAtfZnJvbWJ1ZmZlcpSTlCiWcAAAAAAAAAAAAID/AACA/wAAgP8AAID/AACA/wAAgP8AAID/AACA/wAAgP8AAID/AACA/wAAgP8AAID/AACA/wAAgP8AAID/AACA/wAAgP8AAID/AACA/wAAgP8AAID/AACA/wAAgP8AAID/AACA/wAAgP8AAID/lGgKSxyFlIwBQ5R0lFKUjARoaWdolGgSKJZwAAAAAAAAAAAAgH8AAIB/AACAfwAAgH8AAIB/AACAfwAAgH8AAIB/AACAfwAAgH8AAIB/AACAfwAAgH8AAIB/AACAfwAAgH8AAIB/AACAfwAAgH8AAIB/AACAfwAAgH8AAIB/AACAfwAAgH8AAIB/AACAfwAAgH+UaApLHIWUaBV0lFKUjA1ib3VuZGVkX2JlbG93lGgSKJYcAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAACUaAeMAmIxlImIh5RSlChLA4wBfJROTk5K/////0r/////SwB0lGJLHIWUaBV0lFKUjA1ib3VuZGVkX2Fib3ZllGgSKJYcAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAACUaCFLHIWUaBV0lFKUjApfbnBfcmFuZG9tlE51Yi4=", "dtype": "float32", "_shape": [28], "low": "[-inf -inf -inf -inf -inf -inf -inf -inf -inf -inf -inf -inf -inf -inf\n -inf -inf -inf -inf -inf -inf -inf -inf -inf -inf -inf -inf -inf -inf]", "high": "[inf inf inf inf inf inf inf inf inf inf inf inf inf inf inf inf inf inf\n inf inf inf inf inf inf inf inf inf inf]", "bounded_below": "[False False False False False False False False False False False False\n False False False False False False False False False False False False\n False False False False]", "bounded_above": "[False False False False False False False False False False False False\n False False False False False False False False False False False False\n False False False False]", "_np_random": null}, "action_space": {":type:": "<class 'gym.spaces.box.Box'>", ":serialized:": "gAWVnwEAAAAAAACMDmd5bS5zcGFjZXMuYm94lIwDQm94lJOUKYGUfZQojAVkdHlwZZSMBW51bXB5lGgFk5SMAmY0lImIh5RSlChLA4wBPJROTk5K/////0r/////SwB0lGKMBl9zaGFwZZRLCIWUjANsb3eUjBJudW1weS5jb3JlLm51bWVyaWOUjAtfZnJvbWJ1ZmZlcpSTlCiWIAAAAAAAAAAAAIC/AACAvwAAgL8AAIC/AACAvwAAgL8AAIC/AACAv5RoCksIhZSMAUOUdJRSlIwEaGlnaJRoEiiWIAAAAAAAAAAAAIA/AACAPwAAgD8AAIA/AACAPwAAgD8AAIA/AACAP5RoCksIhZRoFXSUUpSMDWJvdW5kZWRfYmVsb3eUaBIolggAAAAAAAAAAQEBAQEBAQGUaAeMAmIxlImIh5RSlChLA4wBfJROTk5K/////0r/////SwB0lGJLCIWUaBV0lFKUjA1ib3VuZGVkX2Fib3ZllGgSKJYIAAAAAAAAAAEBAQEBAQEBlGghSwiFlGgVdJRSlIwKX25wX3JhbmRvbZROdWIu", "dtype": "float32", "_shape": [8], "low": "[-1. -1. -1. -1. -1. -1. -1. -1.]", "high": "[1. 1. 1. 1. 1. 1. 1. 1.]", "bounded_below": "[ True True True True True True True True]", "bounded_above": "[ True True True True True True True True]", "_np_random": null}, "n_envs": 4, "system_info": {"OS": "Linux-5.10.147+-x86_64-with-glibc2.31 # 1 SMP Sat Dec 10 16:00:40 UTC 2022", "Python": "3.9.16", "Stable-Baselines3": "1.8.0", "PyTorch": "2.0.0+cu118", "GPU Enabled": "True", "Numpy": "1.22.4", "Gym": "0.21.0"}}
|
|
|
|
| 1 |
+
{"policy_class": {":type:": "<class 'abc.ABCMeta'>", ":serialized:": "gAWVOwAAAAAAAACMIXN0YWJsZV9iYXNlbGluZXMzLmNvbW1vbi5wb2xpY2llc5SMEUFjdG9yQ3JpdGljUG9saWN5lJOULg==", "__module__": "stable_baselines3.common.policies", "__doc__": "\n Policy class for actor-critic algorithms (has both policy and value prediction).\n Used by A2C, PPO and the likes.\n\n :param observation_space: Observation space\n :param action_space: Action space\n :param lr_schedule: Learning rate schedule (could be constant)\n :param net_arch: The specification of the policy and value networks.\n :param activation_fn: Activation function\n :param ortho_init: Whether to use or not orthogonal initialization\n :param use_sde: Whether to use State Dependent Exploration or not\n :param log_std_init: Initial value for the log standard deviation\n :param full_std: Whether to use (n_features x n_actions) parameters\n for the std instead of only (n_features,) when using gSDE\n :param use_expln: Use ``expln()`` function instead of ``exp()`` to ensure\n a positive standard deviation (cf paper). It allows to keep variance\n above zero and prevent it from growing too fast. In practice, ``exp()`` is usually enough.\n :param squash_output: Whether to squash the output using a tanh function,\n this allows to ensure boundaries when using gSDE.\n :param features_extractor_class: Features extractor to use.\n :param features_extractor_kwargs: Keyword arguments\n to pass to the features extractor.\n :param share_features_extractor: If True, the features extractor is shared between the policy and value networks.\n :param normalize_images: Whether to normalize images or not,\n dividing by 255.0 (True by default)\n :param optimizer_class: The optimizer to use,\n ``th.optim.Adam`` by default\n :param optimizer_kwargs: Additional keyword arguments,\n excluding the learning rate, to pass to the optimizer\n ", "__init__": "<function ActorCriticPolicy.__init__ at 0x7f51f005b1f0>", "_get_constructor_parameters": "<function ActorCriticPolicy._get_constructor_parameters at 0x7f51f005b280>", "reset_noise": "<function ActorCriticPolicy.reset_noise at 0x7f51f005b310>", "_build_mlp_extractor": "<function ActorCriticPolicy._build_mlp_extractor at 0x7f51f005b3a0>", "_build": "<function ActorCriticPolicy._build at 0x7f51f005b430>", "forward": "<function ActorCriticPolicy.forward at 0x7f51f005b4c0>", "extract_features": "<function ActorCriticPolicy.extract_features at 0x7f51f005b550>", "_get_action_dist_from_latent": "<function ActorCriticPolicy._get_action_dist_from_latent at 0x7f51f005b5e0>", "_predict": "<function ActorCriticPolicy._predict at 0x7f51f005b670>", "evaluate_actions": "<function ActorCriticPolicy.evaluate_actions at 0x7f51f005b700>", "get_distribution": "<function ActorCriticPolicy.get_distribution at 0x7f51f005b790>", "predict_values": "<function ActorCriticPolicy.predict_values at 0x7f51f005b820>", "__abstractmethods__": "frozenset()", "_abc_impl": "<_abc._abc_data object at 0x7f51f0059b00>"}, "verbose": 1, "policy_kwargs": {":type:": "<class 'dict'>", ":serialized:": "gAWVowAAAAAAAAB9lCiMDGxvZ19zdGRfaW5pdJRK/v///4wKb3J0aG9faW5pdJSJjA9vcHRpbWl6ZXJfY2xhc3OUjBN0b3JjaC5vcHRpbS5ybXNwcm9wlIwHUk1TcHJvcJSTlIwQb3B0aW1pemVyX2t3YXJnc5R9lCiMBWFscGhhlEc/764UeuFHrowDZXBzlEc+5Pi1iONo8YwMd2VpZ2h0X2RlY2F5lEsAdXUu", "log_std_init": -2, "ortho_init": false, "optimizer_class": "<class 'torch.optim.rmsprop.RMSprop'>", "optimizer_kwargs": {"alpha": 0.99, "eps": 1e-05, "weight_decay": 0}}, "num_timesteps": 2000000, "_total_timesteps": 2000000, "_num_timesteps_at_start": 0, "seed": null, "action_noise": null, "start_time": 1681288652863329946, "learning_rate": 0.0001, "tensorboard_log": null, "lr_schedule": {":type:": "<class 'function'>", ":serialized:": "gAWVwwIAAAAAAACMF2Nsb3VkcGlja2xlLmNsb3VkcGlja2xllIwOX21ha2VfZnVuY3Rpb26Uk5QoaACMDV9idWlsdGluX3R5cGWUk5SMCENvZGVUeXBllIWUUpQoSwFLAEsASwFLAUsTQwSIAFMAlE6FlCmMAV+UhZSMSC91c3IvbG9jYWwvbGliL3B5dGhvbjMuOS9kaXN0LXBhY2thZ2VzL3N0YWJsZV9iYXNlbGluZXMzL2NvbW1vbi91dGlscy5weZSMBGZ1bmOUS4JDAgABlIwDdmFslIWUKXSUUpR9lCiMC19fcGFja2FnZV9flIwYc3RhYmxlX2Jhc2VsaW5lczMuY29tbW9ulIwIX19uYW1lX1+UjB5zdGFibGVfYmFzZWxpbmVzMy5jb21tb24udXRpbHOUjAhfX2ZpbGVfX5SMSC91c3IvbG9jYWwvbGliL3B5dGhvbjMuOS9kaXN0LXBhY2thZ2VzL3N0YWJsZV9iYXNlbGluZXMzL2NvbW1vbi91dGlscy5weZR1Tk5oAIwQX21ha2VfZW1wdHlfY2VsbJSTlClSlIWUdJRSlIwcY2xvdWRwaWNrbGUuY2xvdWRwaWNrbGVfZmFzdJSMEl9mdW5jdGlvbl9zZXRzdGF0ZZSTlGgffZR9lChoFmgNjAxfX3F1YWxuYW1lX1+UjBljb25zdGFudF9mbi48bG9jYWxzPi5mdW5jlIwPX19hbm5vdGF0aW9uc19flH2UjA5fX2t3ZGVmYXVsdHNfX5ROjAxfX2RlZmF1bHRzX1+UTowKX19tb2R1bGVfX5RoF4wHX19kb2NfX5ROjAtfX2Nsb3N1cmVfX5RoAIwKX21ha2VfY2VsbJSTlEc/Gjbi6xxDLYWUUpSFlIwXX2Nsb3VkcGlja2xlX3N1Ym1vZHVsZXOUXZSMC19fZ2xvYmFsc19flH2UdYaUhlIwLg=="}, "_last_obs": {":type:": "<class 'numpy.ndarray'>", ":serialized:": "gAWVNQIAAAAAAACMEm51bXB5LmNvcmUubnVtZXJpY5SMC19mcm9tYnVmZmVylJOUKJbAAQAAAAAAACakjz/Kkc8+UTAqP5bTUz+xgeM/Ryogv5sWpz5YAR8/Q7Z0v9cNiL1rmhs+q3q4v6yaRD+ASsY/YF3bv/1WUT8Ouc6+XZN+vmm9k79wnkjAoRXIvwwywzwI0DM/EiAdPW9XuL+kt8Q+lvP1PjbKXj9RuZI++BBiP7aJBj9CwZg9k7C9P/zmvT7v7JQ/T+xBPv9Nj78gT0A85Q6APutZer8UT+2/1IOEP6RL1b9tk9e9Dce6vTm6Zb2HHBE/KzGGPbVFRb7m55G/kLLxvkp9cz1vV7i/pLfEPpbz9T42yl4/oREPP+YlYr86dAq+1iB4v/nUFz9WsY+6QF3kProGBr1lh4c/5uBuPhHbwz/J4o28gXK0P+sXWj760Ku+jgUSPh0K5T6f4L893q+SPdaf/j2bK8Q/Tb1puv7dbD+p7wW8y8ExP6S3xD6W8/U+NspePxYXfD9+DHg/FonzPgOFwj8pLVc/7C0yPpKqpj+aIYg/slaSvw9/UL/y6kk/QONUP/qJGsAbbSU+1G3Bv8dV7r/joYm/mGQvPk4Zlr9xXKs/WuXCP+MDK7++vES/zIIFQMvBMT/zkibAlvP1Po0Uk7+UjAVudW1weZSMBWR0eXBllJOUjAJmNJSJiIeUUpQoSwOMATyUTk5OSv////9K/////0sAdJRiSwRLHIaUjAFDlHSUUpQu"}, "_last_episode_starts": {":type:": "<class 'numpy.ndarray'>", ":serialized:": "gAWVdwAAAAAAAACMEm51bXB5LmNvcmUubnVtZXJpY5SMC19mcm9tYnVmZmVylJOUKJYEAAAAAAAAAAAAAACUjAVudW1weZSMBWR0eXBllJOUjAJiMZSJiIeUUpQoSwOMAXyUTk5OSv////9K/////0sAdJRiSwSFlIwBQ5R0lFKULg=="}, "_last_original_obs": {":type:": "<class 'numpy.ndarray'>", ":serialized:": "gAWVNQIAAAAAAACMEm51bXB5LmNvcmUubnVtZXJpY5SMC19mcm9tYnVmZmVylJOUKJbAAQAAAAAAAAAAAACBcsi2AACAPwAAAAAAAAAAAAAAAAAAAAAAAACAv2AIvAAAAACfDNm/AAAAAE/8GL0AAAAAIxH6PwAAAAAlHfm9AAAAAGOQ3z8AAAAApx3kPQAAAAAPkeu/AAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAcQaHtgAAgD8AAAAAAAAAAAAAAAAAAAAAAAAAgKGBwD0AAAAAt5HlvwAAAAC6sq07AAAAANWZ6z8AAAAAaTo2vQAAAABvhQBAAAAAAKeMQD0AAAAAdfb+vwAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAFnP7DQAAIA/AAAAAAAAAAAAAAAAAAAAAAAAAIAMWJS7AAAAAGcu7L8AAAAAvT/lvQAAAACan+w/AAAAAIxUAz4AAAAA9e3pPwAAAABX6Oe6AAAAAKVI/r8AAAAAAAAAAAAAAAAAAAAAAAAAAAAAAADCL/41AACAPwAAAAAAAAAAAAAAAAAAAAAAAACAm0GSvQAAAAA+Oei/AAAAAC613rwAAAAAji/wPwAAAAAmw9Y9AAAAAMHR+D8AAAAAfvx1PQAAAAAu0vO/AAAAAAAAAAAAAAAAAAAAAAAAAACUjAVudW1weZSMBWR0eXBllJOUjAJmNJSJiIeUUpQoSwOMATyUTk5OSv////9K/////0sAdJRiSwRLHIaUjAFDlHSUUpQu"}, "_episode_num": 0, "use_sde": true, "sde_sample_freq": -1, "_current_progress_remaining": 0.0, "_stats_window_size": 100, "ep_info_buffer": {":type:": "<class 'collections.deque'>", ":serialized:": "gAWVRAwAAAAAAACMC2NvbGxlY3Rpb25zlIwFZGVxdWWUk5QpS2SGlFKUKH2UKIwBcpRHQJidmUs4DLeMAWyUTegDjAF0lEdAwgVsB8QZoHV9lChoBkdAlHO8Rcu8LGgHTegDaAhHQMIG6sJ6Y3N1fZQoaAZHQJfHA/qxC6ZoB03oA2gIR0DCBwzEvTPTdX2UKGgGR0CY9KS5AhStaAdN6ANoCEdAwgcS/M4cWHV9lChoBkdAlcHHPJJXhmgHTegDaAhHQMIJ5N+TeO51fZQoaAZHQJfWdZkkKNRoB03oA2gIR0DCCyL+WGATdX2UKGgGR0CYK/BOYYzjaAdN6ANoCEdAwgtdUjLSu3V9lChoBkdAl3hrVJ+UhWgHTegDaAhHQMILZvGp++d1fZQoaAZHQJV3Qlu3trtoB03oA2gIR0DCD3SnpB5YdX2UKGgGR0CZBhC53C9AaAdN6ANoCEdAwhDA+tbLU3V9lChoBkdAlcLPDxb0OGgHTegDaAhHQMIQ6Sr5qM51fZQoaAZHQJZZbOIInjRoB03oA2gIR0DCEO+mFajfdX2UKGgGR0CbScNVzZHvaAdN6ANoCEdAwhOYLkS26XV9lChoBkdAmAOTJ+2E02gHTegDaAhHQMIVd20zCUJ1fZQoaAZHQJS6gSYgJTloB03oA2gIR0DCFa7XnQpndX2UKGgGR0CWKX8rI5o5aAdN6ANoCEdAwhW46qbSZ3V9lChoBkdAlU9KVD8cdmgHTegDaAhHQMIY8U8NhE11fZQoaAZHQJYtLyrgflpoB03oA2gIR0DCGi18qnWKdX2UKGgGR0CWsKos7MgVaAdN6ANoCEdAwhpNcVxjrnV9lChoBkdAmWsmFzuF6GgHTegDaAhHQMIaU9DhLoR1fZQoaAZHQJe7dnBciW5oB03oA2gIR0DCHW0EJSiudX2UKGgGR0CXmfHP/rB1aAdN6ANoCEdAwh9qQz1scnV9lChoBkdAmFsAk9lmOGgHTegDaAhHQMIflrlmvnt1fZQoaAZHQJiGZlI3BHloB03oA2gIR0DCH51eUpuudX2UKGgGR0CXJF5XU6PsaAdN6ANoCEdAwiJ2lE7W/nV9lChoBkdAlJTgIUrTY2gHTegDaAhHQMIjvYKx9oh1fZQoaAZHQJZE6WjXWe9oB03oA2gIR0DCI+WLzf78dX2UKGgGR0CaUkAn2IweaAdN6ANoCEdAwiPsVzIV/XV9lChoBkdAla9c4o7V8WgHTegDaAhHQMIn3KJl8PZ1fZQoaAZHQJdKVWkrPMVoB03oA2gIR0DCKSBOLzf8dX2UKGgGR0CZW7KiwjdIaAdN6ANoCEdAwik+/zJ6p3V9lChoBkdAlcGvxUedTmgHTegDaAhHQMIpRYcvM8p1fZQoaAZHQJg3bxy4nWtoB03oA2gIR0DCK/17jT8YdX2UKGgGR0CWUQrZrYXgaAdN6ANoCEdAwi12AVfu1HV9lChoBkdAlSlLWmP5pWgHTegDaAhHQMItrEVnEl51fZQoaAZHQJhkDdnCfpVoB03oA2gIR0DCLbXn2ZiNdX2UKGgGR0CY71RkmQbNaAdN6ANoCEdAwjGTZQpF1HV9lChoBkdAm+YKUmlZYGgHTegDaAhHQMIy59/jKgZ1fZQoaAZHQJXNJIsiB5JoB03oA2gIR0DCMwoe3hGZdX2UKGgGR0CZTc/T9bX6aAdN6ANoCEdAwjMQmwaBJHV9lChoBkdAkm3ZQ+EAYGgHTegDaAhHQMI128dxQzl1fZQoaAZHQJhtd+z+m3xoB03oA2gIR0DCN+KobXHzdX2UKGgGR0CWcaq4pc5baAdN6ANoCEdAwjgec2BJ7XV9lChoBkdAmRDK5sj3VWgHTegDaAhHQMI4KNxdY4h1fZQoaAZHQJdY9Gqgh8poB03oA2gIR0DCO0WycCo1dX2UKGgGR0CWQHHVPN3XaAdN6ANoCEdAwjyo5paibnV9lChoBkdAl87JjlPrOmgHTegDaAhHQMI80QJPZZl1fZQoaAZHQJtjAuAZsKtoB03oA2gIR0DCPNeUfPondX2UKGgGR0CXWFRSxZ+yaAdN6ANoCEdAwkBfY+0PYnV9lChoBkdAmckZCngpB2gHTegDaAhHQMJCBrfk3jx1fZQoaAZHQJdlzWvr4WVoB03oA2gIR0DCQioLNOdodX2UKGgGR0CWfFXSjQAuaAdN6ANoCEdAwkIxUWEbpHV9lChoBkdAl/gE2pAD72gHTegDaAhHQMJEw5lvqC91fZQoaAZHQJao+9K28ZloB03oA2gIR0DCRf/gUDdQdX2UKGgGR0CbHnQWepXIaAdN6ANoCEdAwkYnP+n623V9lChoBkdAmN1BwVCXyGgHTegDaAhHQMJGLOkLx7R1fZQoaAZHQJWuaKAJ9iNoB03oA2gIR0DCSk3qTr3TdX2UKGgGR0CYcd4NqgyuaAdN6ANoCEdAwkuY/qxC6nV9lChoBkdAlx6QNwzch2gHTegDaAhHQMJLv1Muez51fZQoaAZHQJjAk2Hck+poB03oA2gIR0DCS8bm6oVEdX2UKGgGR0CZ+sqkdmxuaAdN6ANoCEdAwk6OpWFN+XV9lChoBkdAl4yo5ggHNWgHTegDaAhHQMJQJ2M85jp1fZQoaAZHQJU/t7AtWdVoB03oA2gIR0DCUFmr4nF6dX2UKGgGR0CaZUIkZ75VaAdN6ANoCEdAwlBihL5AQnV9lChoBkdAm3N4tQKrrGgHTegDaAhHQMJT96/h2nt1fZQoaAZHQJW4aDlHSWtoB03oA2gIR0DCVVfxSYPYdX2UKGgGR0CYc96Rhc7haAdN6ANoCEdAwlV8bAk9lnV9lChoBkdAmoRFJYkmhWgHTegDaAhHQMJVhDEvTPV1fZQoaAZHQJl2HwazeGhoB03oA2gIR0DCWNcbJfY0dX2UKGgGR0CXfyoIv8IiaAdN6ANoCEdAwlq8814xDnV9lChoBkdAk5ly5qdpZmgHTegDaAhHQMJa4fsNUfh1fZQoaAZHQJdxQxcmjTNoB03oA2gIR0DCWuiXlbNbdX2UKGgGR0CQ8ohoM8YAaAdN6ANoCEdAwl2OHoHLR3V9lChoBkdAlubBIre67WgHTegDaAhHQMJe434CZF51fZQoaAZHQJjotf1HvttoB03oA2gIR0DCXwh8IAwPdX2UKGgGR0CZsFIsiB5HaAdN6ANoCEdAwl8P5gPVeHV9lChoBkdAmOF20Re1KGgHTegDaAhHQMJi23Vsk6d1fZQoaAZHQJXsmydFvydoB03oA2gIR0DCZCPOObRXdX2UKGgGR0CZmlRg7YChaAdN6ANoCEdAwmRDqKP4mHV9lChoBkdAmE+w1rIo3WgHTegDaAhHQMJkSYKx9oh1fZQoaAZHQJYBi3XqZ+hoB03oA2gIR0DCZxunjyWidX2UKGgGR0CXHO3Ehq0uaAdN6ANoCEdAwmi3wd8zAXV9lChoBkdAl9eXY150KmgHTegDaAhHQMJo7nJ9y951fZQoaAZHQJiEnBj4HopoB03oA2gIR0DCaPeQMhHLdX2UKGgGR0CZVcRGc4HYaAdN6ANoCEdAwmy2r+YMOXV9lChoBkdAl2YcUAT7EmgHTegDaAhHQMJt6pm29ct1fZQoaAZHQJo0Q99tuUFoB03oA2gIR0DCbg6FEiMYdX2UKGgGR0CZgSEGqxTsaAdN6ANoCEdAwm4Vr6ciGHV9lChoBkdAmSVnPE87p2gHTegDaAhHQMJw6Z4W1tx1fZQoaAZHQJmDhLYf4h5oB03oA2gIR0DCcteu9vjwdX2UKGgGR0CXrzYQarFPaAdN6ANoCEdAwnMQRhc7hnV9lChoBkdAlrxx9b5dnmgHTegDaAhHQMJzGtTkyUN1fZQoaAZHQJYc2r8zhxZoB03oA2gIR0DCdiGcSXdCdX2UKGgGR0CYVeCa7VawaAdN6ANoCEdAwneEgIQe3nV9lChoBkdAmNflyeZof2gHTegDaAhHQMJ3pmvfTCt1fZQoaAZHQJkxH6eoUBZoB03oA2gIR0DCd60INVindX2UKGgGR0CZJXBUaQ3haAdN6ANoCEdAwntvYpUgjnV9lChoBkdAmU9/GlyimGgHTegDaAhHQMJ81gPNFBp1fZQoaAZHQJnwINKAavRoB03oA2gIR0DCfPpxBE8adX2UKGgGR0CYmfpobn5jaAdN6ANoCEdAwn0Bz8P4EnVlLg=="}, "ep_success_buffer": {":type:": "<class 'collections.deque'>", ":serialized:": "gAWVIAAAAAAAAACMC2NvbGxlY3Rpb25zlIwFZGVxdWWUk5QpS2SGlFKULg=="}, "_n_updates": 62500, "n_steps": 8, "gamma": 0.99, "gae_lambda": 0.9, "ent_coef": 0.0, "vf_coef": 0.4, "max_grad_norm": 0.5, "normalize_advantage": false, "observation_space": {":type:": "<class 'gym.spaces.box.Box'>", ":serialized:": "gAWVZwIAAAAAAACMDmd5bS5zcGFjZXMuYm94lIwDQm94lJOUKYGUfZQojAVkdHlwZZSMBW51bXB5lGgFk5SMAmY0lImIh5RSlChLA4wBPJROTk5K/////0r/////SwB0lGKMBl9zaGFwZZRLHIWUjANsb3eUjBJudW1weS5jb3JlLm51bWVyaWOUjAtfZnJvbWJ1ZmZlcpSTlCiWcAAAAAAAAAAAAID/AACA/wAAgP8AAID/AACA/wAAgP8AAID/AACA/wAAgP8AAID/AACA/wAAgP8AAID/AACA/wAAgP8AAID/AACA/wAAgP8AAID/AACA/wAAgP8AAID/AACA/wAAgP8AAID/AACA/wAAgP8AAID/lGgKSxyFlIwBQ5R0lFKUjARoaWdolGgSKJZwAAAAAAAAAAAAgH8AAIB/AACAfwAAgH8AAIB/AACAfwAAgH8AAIB/AACAfwAAgH8AAIB/AACAfwAAgH8AAIB/AACAfwAAgH8AAIB/AACAfwAAgH8AAIB/AACAfwAAgH8AAIB/AACAfwAAgH8AAIB/AACAfwAAgH+UaApLHIWUaBV0lFKUjA1ib3VuZGVkX2JlbG93lGgSKJYcAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAACUaAeMAmIxlImIh5RSlChLA4wBfJROTk5K/////0r/////SwB0lGJLHIWUaBV0lFKUjA1ib3VuZGVkX2Fib3ZllGgSKJYcAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAACUaCFLHIWUaBV0lFKUjApfbnBfcmFuZG9tlE51Yi4=", "dtype": "float32", "_shape": [28], "low": "[-inf -inf -inf -inf -inf -inf -inf -inf -inf -inf -inf -inf -inf -inf\n -inf -inf -inf -inf -inf -inf -inf -inf -inf -inf -inf -inf -inf -inf]", "high": "[inf inf inf inf inf inf inf inf inf inf inf inf inf inf inf inf inf inf\n inf inf inf inf inf inf inf inf inf inf]", "bounded_below": "[False False False False False False False False False False False False\n False False False False False False False False False False False False\n False False False False]", "bounded_above": "[False False False False False False False False False False False False\n False False False False False False False False False False False False\n False False False False]", "_np_random": null}, "action_space": {":type:": "<class 'gym.spaces.box.Box'>", ":serialized:": "gAWVnwEAAAAAAACMDmd5bS5zcGFjZXMuYm94lIwDQm94lJOUKYGUfZQojAVkdHlwZZSMBW51bXB5lGgFk5SMAmY0lImIh5RSlChLA4wBPJROTk5K/////0r/////SwB0lGKMBl9zaGFwZZRLCIWUjANsb3eUjBJudW1weS5jb3JlLm51bWVyaWOUjAtfZnJvbWJ1ZmZlcpSTlCiWIAAAAAAAAAAAAIC/AACAvwAAgL8AAIC/AACAvwAAgL8AAIC/AACAv5RoCksIhZSMAUOUdJRSlIwEaGlnaJRoEiiWIAAAAAAAAAAAAIA/AACAPwAAgD8AAIA/AACAPwAAgD8AAIA/AACAP5RoCksIhZRoFXSUUpSMDWJvdW5kZWRfYmVsb3eUaBIolggAAAAAAAAAAQEBAQEBAQGUaAeMAmIxlImIh5RSlChLA4wBfJROTk5K/////0r/////SwB0lGJLCIWUaBV0lFKUjA1ib3VuZGVkX2Fib3ZllGgSKJYIAAAAAAAAAAEBAQEBAQEBlGghSwiFlGgVdJRSlIwKX25wX3JhbmRvbZROdWIu", "dtype": "float32", "_shape": [8], "low": "[-1. -1. -1. -1. -1. -1. -1. -1.]", "high": "[1. 1. 1. 1. 1. 1. 1. 1.]", "bounded_below": "[ True True True True True True True True]", "bounded_above": "[ True True True True True True True True]", "_np_random": null}, "n_envs": 4, "system_info": {"OS": "Linux-5.10.147+-x86_64-with-glibc2.31 # 1 SMP Sat Dec 10 16:00:40 UTC 2022", "Python": "3.9.16", "Stable-Baselines3": "1.8.0", "PyTorch": "2.0.0+cu118", "GPU Enabled": "False", "Numpy": "1.22.4", "Gym": "0.21.0"}}
|
replay.mp4
CHANGED
|
Binary files a/replay.mp4 and b/replay.mp4 differ
|
|
|
results.json
CHANGED
|
@@ -1 +1 @@
|
|
| 1 |
-
{"mean_reward":
|
|
|
|
| 1 |
+
{"mean_reward": 1893.631191460346, "std_reward": 99.9121690982914, "is_deterministic": true, "n_eval_episodes": 10, "eval_datetime": "2023-04-12T09:52:14.240754"}
|
vec_normalize.pkl
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 2170
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:ba461503ff84349f653667005790706b9ff1b5bb8e46499a21c0973424e1d112
|
| 3 |
size 2170
|