Updated PPO agent
Browse files- README.md +1 -1
- config.json +1 -1
- ppo-LunarLander-v2.zip +3 -0
- ppo-LunarLander-v2/_stable_baselines3_version +1 -0
- ppo-LunarLander-v2/data +99 -0
- ppo-LunarLander-v2/policy.optimizer.pth +3 -0
- ppo-LunarLander-v2/policy.pth +3 -0
- ppo-LunarLander-v2/pytorch_variables.pth +3 -0
- ppo-LunarLander-v2/system_info.txt +8 -0
- results.json +1 -1
README.md
CHANGED
|
@@ -16,7 +16,7 @@ model-index:
|
|
| 16 |
type: LunarLander-v2
|
| 17 |
metrics:
|
| 18 |
- type: mean_reward
|
| 19 |
-
value:
|
| 20 |
name: mean_reward
|
| 21 |
verified: false
|
| 22 |
---
|
|
|
|
| 16 |
type: LunarLander-v2
|
| 17 |
metrics:
|
| 18 |
- type: mean_reward
|
| 19 |
+
value: 266.47 +/- 20.50
|
| 20 |
name: mean_reward
|
| 21 |
verified: false
|
| 22 |
---
|
config.json
CHANGED
|
@@ -1 +1 @@
|
|
| 1 |
-
{"policy_class": {":type:": "<class 'abc.ABCMeta'>", ":serialized:": "gAWVOwAAAAAAAACMIXN0YWJsZV9iYXNlbGluZXMzLmNvbW1vbi5wb2xpY2llc5SMEUFjdG9yQ3JpdGljUG9saWN5lJOULg==", "__module__": "stable_baselines3.common.policies", "__doc__": "\n Policy class for actor-critic algorithms (has both policy and value prediction).\n Used by A2C, PPO and the likes.\n\n :param observation_space: Observation space\n :param action_space: Action space\n :param lr_schedule: Learning rate schedule (could be constant)\n :param net_arch: The specification of the policy and value networks.\n :param activation_fn: Activation function\n :param ortho_init: Whether to use or not orthogonal initialization\n :param use_sde: Whether to use State Dependent Exploration or not\n :param log_std_init: Initial value for the log standard deviation\n :param full_std: Whether to use (n_features x n_actions) parameters\n for the std instead of only (n_features,) when using gSDE\n :param use_expln: Use ``expln()`` function instead of ``exp()`` to ensure\n a positive standard deviation (cf paper). It allows to keep variance\n above zero and prevent it from growing too fast. In practice, ``exp()`` is usually enough.\n :param squash_output: Whether to squash the output using a tanh function,\n this allows to ensure boundaries when using gSDE.\n :param features_extractor_class: Features extractor to use.\n :param features_extractor_kwargs: Keyword arguments\n to pass to the features extractor.\n :param share_features_extractor: If True, the features extractor is shared between the policy and value networks.\n :param normalize_images: Whether to normalize images or not,\n dividing by 255.0 (True by default)\n :param optimizer_class: The optimizer to use,\n ``th.optim.Adam`` by default\n :param optimizer_kwargs: Additional keyword arguments,\n excluding the learning rate, to pass to the optimizer\n ", "__init__": "<function ActorCriticPolicy.__init__ at 0x7cb6613363b0>", "_get_constructor_parameters": "<function ActorCriticPolicy._get_constructor_parameters at 0x7cb661336440>", "reset_noise": "<function ActorCriticPolicy.reset_noise at 0x7cb6613364d0>", "_build_mlp_extractor": "<function ActorCriticPolicy._build_mlp_extractor at 0x7cb661336560>", "_build": "<function ActorCriticPolicy._build at 0x7cb6613365f0>", "forward": "<function ActorCriticPolicy.forward at 0x7cb661336680>", "extract_features": "<function ActorCriticPolicy.extract_features at 0x7cb661336710>", "_get_action_dist_from_latent": "<function ActorCriticPolicy._get_action_dist_from_latent at 0x7cb6613367a0>", "_predict": "<function ActorCriticPolicy._predict at 0x7cb661336830>", "evaluate_actions": "<function ActorCriticPolicy.evaluate_actions at 0x7cb6613368c0>", "get_distribution": "<function ActorCriticPolicy.get_distribution at 0x7cb661336950>", "predict_values": "<function ActorCriticPolicy.predict_values at 0x7cb6613369e0>", "__abstractmethods__": "frozenset()", "_abc_impl": "<_abc._abc_data object at 0x7cb661338a00>"}, "verbose": 1, "policy_kwargs": {}, "num_timesteps": 1024000, "_total_timesteps": 1000000, "_num_timesteps_at_start": 0, "seed": null, "action_noise": null, "start_time": 1693148242521917335, "learning_rate": 0.0003, "tensorboard_log": null, "_last_obs": {":type:": "<class 'numpy.ndarray'>", ":serialized:": "gAWV9QIAAAAAAACMEm51bXB5LmNvcmUubnVtZXJpY5SMC19mcm9tYnVmZmVylJOUKJaAAgAAAAAAAA2XQL492Bo8uAiztJGzUDJtl669DG0fNAAAgD8AAIA/M/9APoGzu7xOFL07Q/RLuvwaI77jQR+7AACAPwAAgD/zs5S9FEiMugBsd7npyoe08t+AOgNkjzgAAAAAAACAPyZXLL7t3JM/UuD6vtoNGL8F4UC+uNucvQAAAAAAAAAAzb/cPMTjsT+ZtA0+vRiPvrPe3jxPII49AAAAAAAAAACtsgu+T8NIPubGuD1mOae+SAeFPQ4Ojz0AAAAAAAAAAIAwVz0meak/9VPaPmZD+L7n0yc9XmCHPgAAAAAAAAAATYMsvnSIi7xQXLc4TqjFN3YPAT7Bbhe4AACAPwAAgD8gCBm+dmsmP4uDQL2acOW+KIG9vaUHAT0AAAAAAAAAALNZf70p5DW6wCIXtadgDLBN2iI7jo1mNAAAgD8AAIA/3TFhvrt+jz7lZ9q8RJ6OvnRoPb24YiA9AAAAAAAAAACAHV+9boa8P+N+o76yoOu8AjkxvSK3Ar4AAAAAAAAAAMBdKb6p2km8AJ5Wu27RiLk3UrM9CAaJOgAAgD8AAIA/s6sdPo+AHj+sFsw9CROyvjxR4z0CHZg7AAAAAAAAAACaSTK80i2CPnM0973wepe+W+cmvToMiTwAAAAAAAAAAJNbKr70coq8C8yZOAQ79jUIkfI9fgG6twAAgD8AAIA/42WpvqfSaz5v4DI+5X+NvgzMA722HSg9AAAAAAAAAABzmSe+AZGRvEAbLjvAQ4Y50lgBPnD7aroAAIA/AACAP6Zf5j1cyy66Gr7Otd5jkq8XW6m7Wjz8NAAAAAAAAIA/HXyWPl8xHD9SAIY9+pPVvmYMHT62NeC9AAAAAAAAAACUjAVudW1weZSMBWR0eXBllJOUjAJmNJSJiIeUUpQoSwOMATyUTk5OSv////9K/////0sAdJRiSxRLCIaUjAFDlHSUUpQu"}, "_last_episode_starts": {":type:": "<class 'numpy.ndarray'>", ":serialized:": "gAWVhwAAAAAAAACMEm51bXB5LmNvcmUubnVtZXJpY5SMC19mcm9tYnVmZmVylJOUKJYUAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAlIwFbnVtcHmUjAVkdHlwZZSTlIwCYjGUiYiHlFKUKEsDjAF8lE5OTkr/////Sv////9LAHSUYksUhZSMAUOUdJRSlC4="}, "_last_original_obs": null, "_episode_num": 0, "use_sde": false, "sde_sample_freq": -1, "_current_progress_remaining": -0.02400000000000002, "_stats_window_size": 100, "ep_info_buffer": {":type:": "<class 'collections.deque'>", ":serialized:": "gAWVBQwAAAAAAACMC2NvbGxlY3Rpb25zlIwFZGVxdWWUk5QpS2SGlFKUKH2UKIwBcpRHQHBTNRm9QGiMAWyUS+6MAXSUR0CkthdlEqlQdX2UKGgGR0BxSL1schkiaAdNRAFoCEdApLbN+w1R+HV9lChoBkdAYnXzundfs2gHTegDaAhHQKS5STJyQxN1fZQoaAZHQGIhtXxOLzhoB03oA2gIR0CkuXMzEaVEdX2UKGgGR0ByEE72criEaAdNVQFoCEdApLpRazNUwXV9lChoBkdAX5iCSRr8BWgHTegDaAhHQKS6gy9mHxl1fZQoaAZHQGD3PJq7AcloB03oA2gIR0CkvIQAEMb4dX2UKGgGR0BxY9Ed/8VIaAdNDwFoCEdApL1g6XBxgnV9lChoBkdAcBFoFFDv3WgHS9toCEdApL2Flbu+iHV9lChoBkdAcU3KMefZmWgHTSEBaAhHQKS9l+BH09R1fZQoaAZHQHJ34pH7P6doB0vmaAhHQKS+Puk1uR91fZQoaAZHQHGauCkGiYdoB0vXaAhHQKS+Rfl6qsF1fZQoaAZHQG7hnyNGViZoB0vmaAhHQKS+qnNxEOR1fZQoaAZHQHB82Z7XxvxoB0vvaAhHQKS+qrbQC0Z1fZQoaAZHQGGmgOBlMAZoB03oA2gIR0CkvztLL6k7dX2UKGgGR0Bp56AjIJZ4aAdNZAFoCEdApMAmOdXkpHV9lChoBkdAb7BWjGkvb2gHS99oCEdApMDQeV9nb3V9lChoBkdAbZTNqQA+6mgHS9FoCEdApMESasp5NXV9lChoBkdAYRmImgJ1JWgHTegDaAhHQKTBRGdZq211fZQoaAZHQHGJRbB42TBoB0v5aAhHQKTBc0WuX/p1fZQoaAZHQHGSse8wpONoB0v3aAhHQKTB8uGsV+J1fZQoaAZHQHHZbZSNwR5oB0vRaAhHQKTC9w7T2Fp1fZQoaAZHQG85g5BC2MNoB0vcaAhHQKTDLO58Sf11fZQoaAZHQHBHaR+z+m5oB0vyaAhHQKTDoP07KaJ1fZQoaAZHQGCJKnvUjLVoB03oA2gIR0Ckw6+3pfQbdX2UKGgGR0BhUEyFfzBiaAdN6ANoCEdApMPGg13t8nV9lChoBkdAcivFGG21D2gHTbIBaAhHQKTEDyU9pyp1fZQoaAZHQHBo51vES/VoB0vQaAhHQKTEFNLUTct1fZQoaAZHQG+uq2SdOItoB0vqaAhHQKTEOoG6f8N1fZQoaAZHQG223nZCfHxoB00GAWgIR0CkxIUG3WnTdX2UKGgGR0BxsICyQgcMaAdL2mgIR0CkxbhtDUmVdX2UKGgGR0Bul+o5xR2saAdNCgFoCEdApMcfGn4wiHV9lChoBkdAbau3GXHBDWgHS/9oCEdApMe3QyAQQXV9lChoBkdAb+brylN1yWgHS9VoCEdApMiI6ySmqHV9lChoBkdAb8/hXKbKBGgHS/FoCEdApMjRaxHG0nV9lChoBkdAcKDR/EwWWWgHS/toCEdApMjY7/4qPXV9lChoBkdAbfhKGtZFHGgHS+loCEdApMlGI0qH5HV9lChoBkdAa6CAVfu1GGgHS+FoCEdApMltRHf/FXV9lChoBkdAcELH58BuGmgHS+FoCEdApMl0POIInnV9lChoBkdAYJ/7N0NjLGgHTegDaAhHQKTKXXf642F1fZQoaAZHQHESvyoXKr9oB00DAWgIR0CkyoUcOskqdX2UKGgGR0BuHre40/GEaAdL4GgIR0Cky3xDLKV6dX2UKGgGR0BttBXIU8FIaAdNqgFoCEdApMuJQemvXHV9lChoBkdAbzGS8J2MbWgHS9hoCEdApMyeqJdjXnV9lChoBkdAcM0Hoouwo2gHTQQBaAhHQKTOVe/pMYd1fZQoaAZHQHAy/WlMyrRoB0vtaAhHQKTOiVh1DBx1fZQoaAZHQHHi+h0yP+5oB0vlaAhHQKTOlLZi/fx1fZQoaAZHQHAOLGm1pkBoB0vpaAhHQKTOuY4yXUp1fZQoaAZHQG/NfEXLvCxoB0vzaAhHQKTPn28IzFd1fZQoaAZHQHGkR3NcGC9oB00EAWgIR0Ckz+TMqz7edX2UKGgGR0Blw1weeWfLaAdN6ANoCEdApM/uS6lLvnV9lChoBkdAbRefapPykWgHS9hoCEdApNAHN5dGAnV9lChoBkdAbrDO3UhFE2gHS9VoCEdApNJkCo0hvHV9lChoBkdAcOm9nK4hEGgHTQ4BaAhHQKTSseK8+Rp1fZQoaAZHQHHa7H+6y0NoB01QAWgIR0Ck00ti6QNkdX2UKGgGR0BwifZ13dKvaAdN8QJoCEdApNN+aYu01XV9lChoBkdAcQL1sLv1DmgHS8poCEdApNRShg3Lm3V9lChoBkdAOM+TeO4oZ2gHS8toCEdApNSQNgBtDXV9lChoBkdAbi2mJFb3XmgHS+5oCEdApNVrt1IRRXV9lChoBkdAcNXMXrMTvmgHS/doCEdApNYK7Xg9/3V9lChoBkdAbTZr4WUKRmgHS9NoCEdApNaj7yhBaHV9lChoBkdAbsyhq0tyxWgHS9hoCEdApNcAUxmCiHV9lChoBkdAZBVjQzDXOGgHTegDaAhHQKTXkV1wHZ91fZQoaAZHQHKuUXUH6dloB0v+aAhHQKTX7PhybQV1fZQoaAZHQG+JM6aLGaRoB039AWgIR0Ck2F3Wvr4WdX2UKGgGR0BvT+/N7jT8aAdNCgFoCEdApNjAkX1rZnV9lChoBkdAZBUvkBCD3GgHTegDaAhHQKTZZch1Tzd1fZQoaAZHQGL8qNQ0oBtoB03oA2gIR0Ck2dLFGXoldX2UKGgGR0BxVDF4s3AEaAdL1GgIR0Ck2f4qXnhbdX2UKGgGR0BusYN0/4ZdaAdL42gIR0Ck2skdmxt6dX2UKGgGR0BvpOCROk+HaAdL1GgIR0Ck2vDhDPWydX2UKGgGR0BvhRDzAeq8aAdL1mgIR0Ck2zomgJ1JdX2UKGgGR0Bg7kPJ7sv7aAdN6ANoCEdApNtQNTcZcnV9lChoBkdAcCteZof0VmgHS+loCEdApNzEnNPgvXV9lChoBkdAbo4DM/yGz2gHS9poCEdApN14/xDst3V9lChoBkdAcVnbWEsasWgHTWgCaAhHQKTecwPAfuF1fZQoaAZHQG7lbiqABktoB0vIaAhHQKTe4yJKraN1fZQoaAZHQG6BpvP1L8JoB0vkaAhHQKTff9R77bd1fZQoaAZHQHBVhm03OwBoB0v8aAhHQKTgFpYcNpd1fZQoaAZHQGI4hZyMkyFoB03oA2gIR0Ck4JLiVB2PdX2UKGgGR0BwIfZQHiWFaAdLz2gIR0Ck4LXHq/ucdX2UKGgGR0BxUvWjGkvcaAdL7WgIR0Ck4U33Hq/udX2UKGgGR0BvxyoAGSpzaAdL02gIR0Ck4Wd2HLzPdX2UKGgGR0Boq3k7wKBvaAdNQQFoCEdApOGCSidrf3V9lChoBkdAYspreIl+mWgHTegDaAhHQKThlr30wrV1fZQoaAZHQG8FLcbiqABoB0veaAhHQKTiAFj/dZd1fZQoaAZHQHBRXjyWiURoB00cAWgIR0Ck4g4287IUdX2UKGgGR0BwFJzp5eJIaAdL6GgIR0Ck4ia6J66bdX2UKGgGR0Byg2eSSvC/aAdL8WgIR0Ck4iQdjoZAdX2UKGgGR0BwkiiHqNZNaAdL82gIR0Ck42M4tHx0dX2UKGgGR0Bv2YBRyfcvaAdL6WgIR0Ck46VObiIddX2UKGgGR0ByfFcPe54GaAdL22gIR0Ck5DF2/zredX2UKGgGR0BvEHEjxCpnaAdL7GgIR0Ck5E2ycCo1dX2UKGgGR0Bvke6TW5H3aAdLyWgIR0Ck5NbQLNOedX2UKGgGR0BwJDFAE+xGaAdL22gIR0Ck5OVlf7aadX2UKGgGR0Bwe7Z13dKvaAdL7mgIR0Ck5Pi83++/dX2UKGgGR0BwbVqBVdX1aAdL1mgIR0Ck5eWmHgxbdX2UKGgGR0BwxO2SdOIqaAdL6GgIR0Ck5jgGSpzcdX2UKGgGR0Bwq+XhOxjbaAdL4WgIR0Ck5kKdYnv2dX2UKGgGR0BuDRa5f+juaAdNCAFoCEdApOZfZuhsZnVlLg=="}, "ep_success_buffer": {":type:": "<class 'collections.deque'>", ":serialized:": "gAWVIAAAAAAAAACMC2NvbGxlY3Rpb25zlIwFZGVxdWWUk5QpS2SGlFKULg=="}, "_n_updates": 690, "observation_space": {":type:": "<class 'gymnasium.spaces.box.Box'>", ":serialized:": "gAWVcAIAAAAAAACMFGd5bW5hc2l1bS5zcGFjZXMuYm94lIwDQm94lJOUKYGUfZQojAVkdHlwZZSMBW51bXB5lGgFk5SMAmY0lImIh5RSlChLA4wBPJROTk5K/////0r/////SwB0lGKMDWJvdW5kZWRfYmVsb3eUjBJudW1weS5jb3JlLm51bWVyaWOUjAtfZnJvbWJ1ZmZlcpSTlCiWCAAAAAAAAAABAQEBAQEBAZRoB4wCYjGUiYiHlFKUKEsDjAF8lE5OTkr/////Sv////9LAHSUYksIhZSMAUOUdJRSlIwNYm91bmRlZF9hYm92ZZRoECiWCAAAAAAAAAABAQEBAQEBAZRoFEsIhZRoGHSUUpSMBl9zaGFwZZRLCIWUjANsb3eUaBAoliAAAAAAAAAAAAC0wgAAtMIAAKDAAACgwNsPScAAAKDAAAAAgAAAAICUaApLCIWUaBh0lFKUjARoaWdolGgQKJYgAAAAAAAAAAAAtEIAALRCAACgQAAAoEDbD0lAAACgQAAAgD8AAIA/lGgKSwiFlGgYdJRSlIwIbG93X3JlcHKUjFtbLTkwLiAgICAgICAgLTkwLiAgICAgICAgIC01LiAgICAgICAgIC01LiAgICAgICAgIC0zLjE0MTU5MjcgIC01LgogIC0wLiAgICAgICAgIC0wLiAgICAgICBdlIwJaGlnaF9yZXBylIxTWzkwLiAgICAgICAgOTAuICAgICAgICAgNS4gICAgICAgICA1LiAgICAgICAgIDMuMTQxNTkyNyAgNS4KICAxLiAgICAgICAgIDEuICAgICAgIF2UjApfbnBfcmFuZG9tlE51Yi4=", "dtype": "float32", "bounded_below": "[ True True True True True True True True]", "bounded_above": "[ True True True True True True True True]", "_shape": [8], "low": "[-90. -90. -5. -5. -3.1415927 -5.\n -0. -0. ]", "high": "[90. 90. 5. 5. 3.1415927 5.\n 1. 1. ]", "low_repr": "[-90. -90. -5. -5. -3.1415927 -5.\n -0. -0. ]", "high_repr": "[90. 90. 5. 5. 3.1415927 5.\n 1. 1. ]", "_np_random": null}, "action_space": {":type:": "<class 'gymnasium.spaces.discrete.Discrete'>", ":serialized:": "gAWV1QAAAAAAAACMGWd5bW5hc2l1bS5zcGFjZXMuZGlzY3JldGWUjAhEaXNjcmV0ZZSTlCmBlH2UKIwBbpSMFW51bXB5LmNvcmUubXVsdGlhcnJheZSMBnNjYWxhcpSTlIwFbnVtcHmUjAVkdHlwZZSTlIwCaTiUiYiHlFKUKEsDjAE8lE5OTkr/////Sv////9LAHSUYkMIBAAAAAAAAACUhpRSlIwFc3RhcnSUaAhoDkMIAAAAAAAAAACUhpRSlIwGX3NoYXBllCloCmgOjApfbnBfcmFuZG9tlE51Yi4=", "n": "4", "start": "0", "_shape": [], "dtype": "int64", "_np_random": null}, "n_envs": 20, "n_steps": 2048, "gamma": 0.99, "gae_lambda": 0.95, "ent_coef": 0.0, "vf_coef": 0.5, "max_grad_norm": 0.5, "batch_size": 512, "n_epochs": 23, "clip_range": {":type:": "<class 'function'>", ":serialized:": "gAWVxQIAAAAAAACMF2Nsb3VkcGlja2xlLmNsb3VkcGlja2xllIwOX21ha2VfZnVuY3Rpb26Uk5QoaACMDV9idWlsdGluX3R5cGWUk5SMCENvZGVUeXBllIWUUpQoSwFLAEsASwFLAUsTQwSIAFMAlE6FlCmMAV+UhZSMSS91c3IvbG9jYWwvbGliL3B5dGhvbjMuMTAvZGlzdC1wYWNrYWdlcy9zdGFibGVfYmFzZWxpbmVzMy9jb21tb24vdXRpbHMucHmUjARmdW5jlEuDQwIEAZSMA3ZhbJSFlCl0lFKUfZQojAtfX3BhY2thZ2VfX5SMGHN0YWJsZV9iYXNlbGluZXMzLmNvbW1vbpSMCF9fbmFtZV9flIwec3RhYmxlX2Jhc2VsaW5lczMuY29tbW9uLnV0aWxzlIwIX19maWxlX1+UjEkvdXNyL2xvY2FsL2xpYi9weXRob24zLjEwL2Rpc3QtcGFja2FnZXMvc3RhYmxlX2Jhc2VsaW5lczMvY29tbW9uL3V0aWxzLnB5lHVOTmgAjBBfbWFrZV9lbXB0eV9jZWxslJOUKVKUhZR0lFKUjBxjbG91ZHBpY2tsZS5jbG91ZHBpY2tsZV9mYXN0lIwSX2Z1bmN0aW9uX3NldHN0YXRllJOUaB99lH2UKGgWaA2MDF9fcXVhbG5hbWVfX5SMGWNvbnN0YW50X2ZuLjxsb2NhbHM+LmZ1bmOUjA9fX2Fubm90YXRpb25zX1+UfZSMDl9fa3dkZWZhdWx0c19flE6MDF9fZGVmYXVsdHNfX5ROjApfX21vZHVsZV9flGgXjAdfX2RvY19flE6MC19fY2xvc3VyZV9flGgAjApfbWFrZV9jZWxslJOURz/JmZmZmZmahZRSlIWUjBdfY2xvdWRwaWNrbGVfc3VibW9kdWxlc5RdlIwLX19nbG9iYWxzX1+UfZR1hpSGUjAu"}, "clip_range_vf": null, "normalize_advantage": true, "target_kl": null, "lr_schedule": {":type:": "<class 'function'>", ":serialized:": "gAWVxQIAAAAAAACMF2Nsb3VkcGlja2xlLmNsb3VkcGlja2xllIwOX21ha2VfZnVuY3Rpb26Uk5QoaACMDV9idWlsdGluX3R5cGWUk5SMCENvZGVUeXBllIWUUpQoSwFLAEsASwFLAUsTQwSIAFMAlE6FlCmMAV+UhZSMSS91c3IvbG9jYWwvbGliL3B5dGhvbjMuMTAvZGlzdC1wYWNrYWdlcy9zdGFibGVfYmFzZWxpbmVzMy9jb21tb24vdXRpbHMucHmUjARmdW5jlEuDQwIEAZSMA3ZhbJSFlCl0lFKUfZQojAtfX3BhY2thZ2VfX5SMGHN0YWJsZV9iYXNlbGluZXMzLmNvbW1vbpSMCF9fbmFtZV9flIwec3RhYmxlX2Jhc2VsaW5lczMuY29tbW9uLnV0aWxzlIwIX19maWxlX1+UjEkvdXNyL2xvY2FsL2xpYi9weXRob24zLjEwL2Rpc3QtcGFja2FnZXMvc3RhYmxlX2Jhc2VsaW5lczMvY29tbW9uL3V0aWxzLnB5lHVOTmgAjBBfbWFrZV9lbXB0eV9jZWxslJOUKVKUhZR0lFKUjBxjbG91ZHBpY2tsZS5jbG91ZHBpY2tsZV9mYXN0lIwSX2Z1bmN0aW9uX3NldHN0YXRllJOUaB99lH2UKGgWaA2MDF9fcXVhbG5hbWVfX5SMGWNvbnN0YW50X2ZuLjxsb2NhbHM+LmZ1bmOUjA9fX2Fubm90YXRpb25zX1+UfZSMDl9fa3dkZWZhdWx0c19flE6MDF9fZGVmYXVsdHNfX5ROjApfX21vZHVsZV9flGgXjAdfX2RvY19flE6MC19fY2xvc3VyZV9flGgAjApfbWFrZV9jZWxslJOURz8zqSowVTJhhZRSlIWUjBdfY2xvdWRwaWNrbGVfc3VibW9kdWxlc5RdlIwLX19nbG9iYWxzX1+UfZR1hpSGUjAu"}, "system_info": {"OS": "Linux-5.15.109+-x86_64-with-glibc2.35 # 1 SMP Fri Jun 9 10:57:30 UTC 2023", "Python": "3.10.12", "Stable-Baselines3": "2.1.0", "PyTorch": "2.0.1+cu118", "GPU Enabled": "True", "Numpy": "1.23.5", "Cloudpickle": "2.2.1", "Gymnasium": "0.28.1", "OpenAI Gym": "0.25.2"}}
|
|
|
|
| 1 |
+
{"policy_class": {":type:": "<class 'abc.ABCMeta'>", ":serialized:": "gAWVOwAAAAAAAACMIXN0YWJsZV9iYXNlbGluZXMzLmNvbW1vbi5wb2xpY2llc5SMEUFjdG9yQ3JpdGljUG9saWN5lJOULg==", "__module__": "stable_baselines3.common.policies", "__doc__": "\n Policy class for actor-critic algorithms (has both policy and value prediction).\n Used by A2C, PPO and the likes.\n\n :param observation_space: Observation space\n :param action_space: Action space\n :param lr_schedule: Learning rate schedule (could be constant)\n :param net_arch: The specification of the policy and value networks.\n :param activation_fn: Activation function\n :param ortho_init: Whether to use or not orthogonal initialization\n :param use_sde: Whether to use State Dependent Exploration or not\n :param log_std_init: Initial value for the log standard deviation\n :param full_std: Whether to use (n_features x n_actions) parameters\n for the std instead of only (n_features,) when using gSDE\n :param use_expln: Use ``expln()`` function instead of ``exp()`` to ensure\n a positive standard deviation (cf paper). It allows to keep variance\n above zero and prevent it from growing too fast. In practice, ``exp()`` is usually enough.\n :param squash_output: Whether to squash the output using a tanh function,\n this allows to ensure boundaries when using gSDE.\n :param features_extractor_class: Features extractor to use.\n :param features_extractor_kwargs: Keyword arguments\n to pass to the features extractor.\n :param share_features_extractor: If True, the features extractor is shared between the policy and value networks.\n :param normalize_images: Whether to normalize images or not,\n dividing by 255.0 (True by default)\n :param optimizer_class: The optimizer to use,\n ``th.optim.Adam`` by default\n :param optimizer_kwargs: Additional keyword arguments,\n excluding the learning rate, to pass to the optimizer\n ", "__init__": "<function ActorCriticPolicy.__init__ at 0x000001630D2B2E80>", "_get_constructor_parameters": "<function ActorCriticPolicy._get_constructor_parameters at 0x000001630D2B2F20>", "reset_noise": "<function ActorCriticPolicy.reset_noise at 0x000001630D2B2FC0>", "_build_mlp_extractor": "<function ActorCriticPolicy._build_mlp_extractor at 0x000001630D2B3060>", "_build": "<function ActorCriticPolicy._build at 0x000001630D2B3100>", "forward": "<function ActorCriticPolicy.forward at 0x000001630D2B31A0>", "extract_features": "<function ActorCriticPolicy.extract_features at 0x000001630D2B3240>", "_get_action_dist_from_latent": "<function ActorCriticPolicy._get_action_dist_from_latent at 0x000001630D2B32E0>", "_predict": "<function ActorCriticPolicy._predict at 0x000001630D2B3380>", "evaluate_actions": "<function ActorCriticPolicy.evaluate_actions at 0x000001630D2B3420>", "get_distribution": "<function ActorCriticPolicy.get_distribution at 0x000001630D2B34C0>", "predict_values": "<function ActorCriticPolicy.predict_values at 0x000001630D2B3560>", "__abstractmethods__": "frozenset()", "_abc_impl": "<_abc._abc_data object at 0x000001630D2AA900>"}, "verbose": 1, "policy_kwargs": {}, "num_timesteps": 1015808, "_total_timesteps": 1000000, "_num_timesteps_at_start": 0, "seed": null, "action_noise": null, "start_time": 1693165098167503900, "learning_rate": 0.0003, "tensorboard_log": null, "_last_obs": {":type:": "<class 'numpy.ndarray'>", ":serialized:": "gAWVdQIAAAAAAACMEm51bXB5LmNvcmUubnVtZXJpY5SMC19mcm9tYnVmZmVylJOUKJYAAgAAAAAAAJp56Tu4pN27MFHSPYUb4L1BwYU83n0svgAAgD8AAIA/ZkQVPMMlJzk2VKC7J5Jdu3HhW7tPbDa9AAAAAAAAAADAVeA99kRMutZsvDvAmsm4j41xugGmwbcAAIA/AACAP+aCHL32DEW6VgFkunnp2DwZNCe6AgaruwAAgD8AAIA/zTTjPApbGDoOTr87distPKKo+jnYjAs5AAAAAAAAAACaJbo7PQYmOkXchrutpBY9BshkOi9vATwAAAAAAAAAAI19kr5+2Pc+fsFKPl+qp74RLBK9Gi8iPgAAAAAAAAAAzaYDPLjG1rnyFIo7ZgANvbC4TjsqtPe9AAAAAAAAgD9mlhy99rxzuubCgjm7Jog0P2+ZOi3xlLgAAIA/AACAPwBwxTvh6Ia6KLoYunFhCjZmWdm5bm4sOQAAgD8AAIA/MwD4vMMRGLpKx6G6/MbJtcWZOLutlLw5AACAPwAAgD8NGa69bSNCPt+TCT48I4q+ZyHZPHUeQb0AAAAAAAAAAK0gOL7YBf0+YFlYPsuvn76ugTQ92bsnPAAAAAAAAAAAM5trvDgzq7tZh5E8ZAqBPEUMGr1QMVw9AACAPwAAgD/NiKi7KVxNN0VDC7t6N/K8JBqoO82SVLsAAAAAAAAAAAAsL73sx+Y6ntkPuyKqmj1feA66av+huwAAAAAAAIA/lIwFbnVtcHmUjAVkdHlwZZSTlIwCZjSUiYiHlFKUKEsDjAE8lE5OTkr/////Sv////9LAHSUYksQSwiGlIwBQ5R0lFKULg=="}, "_last_episode_starts": {":type:": "<class 'numpy.ndarray'>", ":serialized:": "gAWVgwAAAAAAAACMEm51bXB5LmNvcmUubnVtZXJpY5SMC19mcm9tYnVmZmVylJOUKJYQAAAAAAAAAAAAAAAAAAAAAAAAAAAAAACUjAVudW1weZSMBWR0eXBllJOUjAJiMZSJiIeUUpQoSwOMAXyUTk5OSv////9K/////0sAdJRiSxCFlIwBQ5R0lFKULg=="}, "_last_original_obs": null, "_episode_num": 0, "use_sde": false, "sde_sample_freq": -1, "_current_progress_remaining": -0.015808000000000044, "_stats_window_size": 100, "ep_info_buffer": {":type:": "<class 'collections.deque'>", ":serialized:": "gAWVQQwAAAAAAACMC2NvbGxlY3Rpb25zlIwFZGVxdWWUk5QpS2SGlFKUKH2UKIwBcpRHQHFXCgf2boeMAWyUTQYBjAF0lEdAkktlJYkmhXV9lChoBkdAcFOiAlOXV2gHTQUBaAhHQJJLpsJpnHx1fZQoaAZHQHLaDBRAKOVoB0v6aAhHQJJLthttQ9B1fZQoaAZHQHGWJ44ZMtdoB01HAWgIR0CSS+XT3IuHdX2UKGgGR0BwaEHE/B3zaAdNBQFoCEdAkk0jtb9qDnV9lChoBkdAcPp3V09yLmgHS/xoCEdAkk0qXBxgiXV9lChoBkdAcqnmLcbiqGgHTT0BaAhHQJJOB6Tnq3V1fZQoaAZHQDwx15jYqXpoB0vgaAhHQJJP73QD3dt1fZQoaAZHQHD0Lz9S/CZoB00ZAWgIR0CSUIdJ8OTadX2UKGgGR0Bx2IoQWepXaAdNAQFoCEdAklIpH/cWTHV9lChoBkdAcI5Hh0hePmgHTRoBaAhHQJJSZawD/2l1fZQoaAZHQHH633YcvM9oB00vAWgIR0CSUp+Yc/+sdX2UKGgGR0BwxeYJE6T4aAdNIwFoCEdAklLYBzV+Z3V9lChoBkdAbKPiobXHzmgHTQ0BaAhHQJJTbsF+uvF1fZQoaAZHQHLZjbeuV5doB00BAWgIR0CSU7JUo8ZDdX2UKGgGR0BxUmT/yXlbaAdNDQFoCEdAklRE8A7xNXV9lChoBkdAbRk1Aqur62gHTQkBaAhHQJJUdKraM751fZQoaAZHQG1OpZW7vohoB00OAWgIR0CSVMyWAwwkdX2UKGgGR0BwD3FwT/Q0aAdNCgFoCEdAklXuI68xsXV9lChoBkdAcC+h9LHuJGgHTV4BaAhHQJJ9clPacqh1fZQoaAZHQG+3qNQ0oBtoB00NAWgIR0CShb1KGtZFdX2UKGgGR0BZR0n9ehPCaAdN6ANoCEdAkphSHARChXV9lChoBkdAUaB8iOearmgHTegDaAhHQJKquYUnG851fZQoaAZHQFu0IKc/dIpoB03oA2gIR0CSrK9DQZ4wdX2UKGgGR0BY7t6gM+eOaAdN6ANoCEdAkrFbQb+98XV9lChoBkdAWGrlq8DjimgHTegDaAhHQJKyuYfGMn91fZQoaAZHQFoYNzKcNH9oB03oA2gIR0CStkfO2RaHdX2UKGgGR0BgLsdJaq0daAdN6ANoCEdAkrbDxG2CunV9lChoBkdAWe6yZ8a4t2gHTegDaAhHQJK3SdlNDdB1fZQoaAZHQF8gMoMKCxxoB03oA2gIR0CSt7+d9UjtdX2UKGgGR0BRVkmhM8HOaAdN6ANoCEdAkrjvva11GXV9lChoBkdAV48yULUkOmgHTegDaAhHQJK5h1GLDQ91fZQoaAZHQF7kpMHryDtoB03oA2gIR0CSuruMdcSodX2UKGgGR0BUz6BI4EOiaAdN6ANoCEdAkrsh6nivPnV9lChoBkdAUGhbmlqJuWgHTegDaAhHQJK9sU9IPLB1fZQoaAZHQFHi55qubI9oB03oA2gIR0CSvvTsIE8rdX2UKGgGR0Beb3rhR64UaAdN6ANoCEdAkuwcbaRISXV9lChoBkdAX9I/1QIldGgHTegDaAhHQJL8y4b0e2d1fZQoaAZHQGDwMlC1JDpoB03oA2gIR0CTDRZOzposdX2UKGgGR0BSh8JUo8ZDaAdN6ANoCEdAkw6v4qPOp3V9lChoBkdAXvgyoGY8dWgHTegDaAhHQJMSoHv+fiB1fZQoaAZHQGF4ZFPSDyxoB03oA2gIR0CTE86Z6UqydX2UKGgGR0BbO/r4WUKRaAdN6ANoCEdAkxc4FA3T/nV9lChoBkdAXkYvsZ5zHWgHTegDaAhHQJMXsvqTr3V1fZQoaAZHQFgVHi3ocJdoB03oA2gIR0CTGCm7aqS6dX2UKGgGR0BeLpfhMrVfaAdN6ANoCEdAkxighwEQoXV9lChoBkdATmY+GGmDUWgHTegDaAhHQJMZ0Ka5PM11fZQoaAZHQGJNoj4YaYNoB03oA2gIR0CTGlfP5YYBdX2UKGgGR0BhUy8FpwjuaAdN6ANoCEdAkxtGcSXdCXV9lChoBkdAXLY/2TPjXGgHTegDaAhHQJMbif7Jnxt1fZQoaAZHQEbrT0g8r7RoB03oA2gIR0CTHUNXHR1HdX2UKGgGR0BVCrOiWVu8aAdN6ANoCEdAkx5+ws5GSnV9lChoBkdAWWB9YwIt2GgHTegDaAhHQJNLuKWLP2R1fZQoaAZHQGJopMpPRAtoB03oA2gIR0CTXIqQiiZfdX2UKGgGR0BcVyR8twrEaAdN6ANoCEdAk2w5soDxLHV9lChoBkdAWGyOOsDGLmgHTegDaAhHQJNtweS0Sh91fZQoaAZHQFazlFMIu5BoB03oA2gIR0CTca9tuUD/dX2UKGgGR0Ba1xUBGQS0aAdN6ANoCEdAk3LflZHNHHV9lChoBkdAWXK4LCvX9WgHTegDaAhHQJN1vcSGrS51fZQoaAZHQF/lV4X40uVoB03oA2gIR0CTdiU34sVddX2UKGgGR0Bi2ITCcf/4aAdN6ANoCEdAk3aGdiDujXV9lChoBkdAYRbJYkmhNGgHTegDaAhHQJN23ojfNzN1fZQoaAZHQFuCNX5nDixoB03oA2gIR0CTd6xcE/0NdX2UKGgGR0BTIsafjCHiaAdN6ANoCEdAk3gRw2l2vHV9lChoBkdAX5tjlPrOaGgHTegDaAhHQJN49AnlXBB1fZQoaAZHQFyzdfb9If9oB03oA2gIR0CTeT/I8yN5dX2UKGgGR0BelHEQ5FPSaAdN6ANoCEdAk3snPE87p3V9lChoBkdAYshtBOYYzmgHTegDaAhHQJN8/UDuBtl1fZQoaAZHQGAlExqO939oB03oA2gIR0CTqXU8FINFdX2UKGgGR0BhMjfxc3VDaAdN6ANoCEdAk7nQX2ugYnV9lChoBkdAYe/B1s+FDmgHTegDaAhHQJPHWptJnQJ1fZQoaAZHQGBO4SpR4yJoB03oA2gIR0CTyOLVnVXndX2UKGgGR0BhG2XgLqlhaAdN6ANoCEdAk8z3QD3dsXV9lChoBkdAYDZpeu3c6GgHTegDaAhHQJPN5/RVp9J1fZQoaAZHQGBdK2BreqJoB03oA2gIR0CT0Dvjfek6dX2UKGgGR0Bg2XRqoIfKaAdN6ANoCEdAk9CR8IAwPHV9lChoBkdAZpGWtU4rBmgHTegDaAhHQJPQ4cYIjW11fZQoaAZHQGF2HYQJ5VxoB03oA2gIR0CT0TCgsbvPdX2UKGgGR0BbnvgJkXk6aAdN6ANoCEdAk9Hq/IsAenV9lChoBkdAVeu9US7GvWgHTegDaAhHQJPSSkDZDiR1fZQoaAZHQGKFOlfqoqFoB03oA2gIR0CT0vdQwblzdX2UKGgGR0Bce+0G/vfCaAdN6ANoCEdAk9Mthy8zynV9lChoBkdAWudGrjo6jmgHTegDaAhHQJPUxhqj8DV1fZQoaAZHQGO/kqc3EQ5oB03oA2gIR0CT1hka/ATJdX2UKGgGR0BX75jYqXnhaAdN6ANoCEdAlANnscABDHV9lChoBkdAWY/2kBS1mmgHTegDaAhHQJQUEbaRISV1fZQoaAZHQGFDo8hcJMRoB03oA2gIR0CUI/cTrVvudX2UKGgGR0BvKFDF6zE8aAdNjQNoCEdAlCSSvX9R8HV9lChoBkdAYQHvYODraGgHTegDaAhHQJQlgExIre91fZQoaAZHQGM2G+sYEW9oB03oA2gIR0CUKXDgqEvkdX2UKGgGR0BU7gHNX5nEaAdN6ANoCEdAlC3lpTMq0HV9lChoBkdAYgOZJkGzKWgHTegDaAhHQJQuTh73PAx1fZQoaAZHQFUPtmL9/BpoB03oA2gIR0CULrJxNqQBdX2UKGgGR0BbQIH5aePJaAdN6ANoCEdAlC8RrJr+HnV9lChoBkdAXslGrjo6jmgHTegDaAhHQJQv9gmZ3LV1fZQoaAZHQFpWRFqi48VoB03oA2gIR0CUMGWluWKNdX2UKGgGR0BkWma4MF2WaAdN6ANoCEdAlDEzf779AHV9lChoBkdAXrodHUc4pGgHTegDaAhHQJQxdw5vLox1fZQoaAZHQFz2WdEsrd5oB03oA2gIR0CUM2SXt0FKdX2UKGgGR0BjucUbkwN9aAdN6ANoCEdAlDUa7NB4U3VlLg=="}, "ep_success_buffer": {":type:": "<class 'collections.deque'>", ":serialized:": "gAWVIAAAAAAAAACMC2NvbGxlY3Rpb25zlIwFZGVxdWWUk5QpS2SGlFKULg=="}, "_n_updates": 372, "observation_space": {":type:": "<class 'gymnasium.spaces.box.Box'>", ":serialized:": "gAWVdgIAAAAAAACMFGd5bW5hc2l1bS5zcGFjZXMuYm94lIwDQm94lJOUKYGUfZQojAVkdHlwZZSMBW51bXB5lIwFZHR5cGWUk5SMAmY0lImIh5RSlChLA4wBPJROTk5K/////0r/////SwB0lGKMDWJvdW5kZWRfYmVsb3eUjBJudW1weS5jb3JlLm51bWVyaWOUjAtfZnJvbWJ1ZmZlcpSTlCiWCAAAAAAAAAABAQEBAQEBAZRoCIwCYjGUiYiHlFKUKEsDjAF8lE5OTkr/////Sv////9LAHSUYksIhZSMAUOUdJRSlIwNYm91bmRlZF9hYm92ZZRoESiWCAAAAAAAAAABAQEBAQEBAZRoFUsIhZRoGXSUUpSMBl9zaGFwZZRLCIWUjANsb3eUaBEoliAAAAAAAAAAAAC0wgAAtMIAAKDAAACgwNsPScAAAKDAAAAAgAAAAICUaAtLCIWUaBl0lFKUjARoaWdolGgRKJYgAAAAAAAAAAAAtEIAALRCAACgQAAAoEDbD0lAAACgQAAAgD8AAIA/lGgLSwiFlGgZdJRSlIwIbG93X3JlcHKUjFtbLTkwLiAgICAgICAgLTkwLiAgICAgICAgIC01LiAgICAgICAgIC01LiAgICAgICAgIC0zLjE0MTU5MjcgIC01LgogIC0wLiAgICAgICAgIC0wLiAgICAgICBdlIwJaGlnaF9yZXBylIxTWzkwLiAgICAgICAgOTAuICAgICAgICAgNS4gICAgICAgICA1LiAgICAgICAgIDMuMTQxNTkyNyAgNS4KICAxLiAgICAgICAgIDEuICAgICAgIF2UjApfbnBfcmFuZG9tlE51Yi4=", "dtype": "float32", "bounded_below": "[ True True True True True True True True]", "bounded_above": "[ True True True True True True True True]", "_shape": [8], "low": "[-90. -90. -5. -5. -3.1415927 -5.\n -0. -0. ]", "high": "[90. 90. 5. 5. 3.1415927 5.\n 1. 1. ]", "low_repr": "[-90. -90. -5. -5. -3.1415927 -5.\n -0. -0. ]", "high_repr": "[90. 90. 5. 5. 3.1415927 5.\n 1. 1. ]", "_np_random": null}, "action_space": {":type:": "<class 'gymnasium.spaces.discrete.Discrete'>", ":serialized:": "gAWVnwEAAAAAAACMGWd5bW5hc2l1bS5zcGFjZXMuZGlzY3JldGWUjAhEaXNjcmV0ZZSTlCmBlH2UKIwBbpSMFW51bXB5LmNvcmUubXVsdGlhcnJheZSMBnNjYWxhcpSTlIwFbnVtcHmUjAVkdHlwZZSTlIwCaTiUiYiHlFKUKEsDjAE8lE5OTkr/////Sv////9LAHSUYkMIBAAAAAAAAACUhpRSlIwFc3RhcnSUaAhoDkMIAAAAAAAAAACUhpRSlIwGX3NoYXBllCmMBWR0eXBllGgOjApfbnBfcmFuZG9tlIwUbnVtcHkucmFuZG9tLl9waWNrbGWUjBBfX2dlbmVyYXRvcl9jdG9ylJOUjAVQQ0c2NJRoG4wUX19iaXRfZ2VuZXJhdG9yX2N0b3KUk5SGlFKUfZQojA1iaXRfZ2VuZXJhdG9ylIwFUENHNjSUjAVzdGF0ZZR9lChoJooQVWit40MD1/+RECJ/K8NKGIwDaW5jlIoRjS1pR1UecEBB1rNOLUJ72AB1jApoYXNfdWludDMylEsAjAh1aW50ZWdlcpRLAHVidWIu", "n": "4", "start": "0", "_shape": [], "dtype": "int64", "_np_random": "Generator(PCG64)"}, "n_envs": 16, "n_steps": 1024, "gamma": 0.999, "gae_lambda": 0.97, "ent_coef": 0.01, "vf_coef": 0.5, "max_grad_norm": 0.5, "batch_size": 64, "n_epochs": 6, "clip_range": {":type:": "<class 'function'>", ":serialized:": "gAWVlgIAAAAAAACMF2Nsb3VkcGlja2xlLmNsb3VkcGlja2xllIwOX21ha2VfZnVuY3Rpb26Uk5QoaACMDV9idWlsdGluX3R5cGWUk5SMCENvZGVUeXBllIWUUpQoSwFLAEsASwFLAUsTQwiVAZcAiQFTAJROhZQpjAFflIWUjFVjOlxVc2Vyc1xhZGl0eVxhbmFjb25kYTNcZW52c1xzYjNcTGliXHNpdGUtcGFja2FnZXNcc3RhYmxlX2Jhc2VsaW5lczNcY29tbW9uXHV0aWxzLnB5lIwEZnVuY5SMGWNvbnN0YW50X2ZuLjxsb2NhbHM+LmZ1bmOUS4NDCPiAANgPEogKlEMAlIwDdmFslIWUKXSUUpR9lCiMC19fcGFja2FnZV9flIwYc3RhYmxlX2Jhc2VsaW5lczMuY29tbW9ulIwIX19uYW1lX1+UjB5zdGFibGVfYmFzZWxpbmVzMy5jb21tb24udXRpbHOUjAhfX2ZpbGVfX5RoDHVOTmgAjBBfbWFrZV9lbXB0eV9jZWxslJOUKVKUhZR0lFKUjBxjbG91ZHBpY2tsZS5jbG91ZHBpY2tsZV9mYXN0lIwSX2Z1bmN0aW9uX3NldHN0YXRllJOUaCB9lH2UKGgYaA2MDF9fcXVhbG5hbWVfX5RoDowPX19hbm5vdGF0aW9uc19flH2UjA5fX2t3ZGVmYXVsdHNfX5ROjAxfX2RlZmF1bHRzX1+UTowKX19tb2R1bGVfX5RoGYwHX19kb2NfX5ROjAtfX2Nsb3N1cmVfX5RoAIwKX21ha2VfY2VsbJSTlEc/yZmZmZmZmoWUUpSFlIwXX2Nsb3VkcGlja2xlX3N1Ym1vZHVsZXOUXZSMC19fZ2xvYmFsc19flH2UdYaUhlIwLg=="}, "clip_range_vf": null, "normalize_advantage": true, "target_kl": null, "lr_schedule": {":type:": "<class 'function'>", ":serialized:": "gAWVlgIAAAAAAACMF2Nsb3VkcGlja2xlLmNsb3VkcGlja2xllIwOX21ha2VfZnVuY3Rpb26Uk5QoaACMDV9idWlsdGluX3R5cGWUk5SMCENvZGVUeXBllIWUUpQoSwFLAEsASwFLAUsTQwiVAZcAiQFTAJROhZQpjAFflIWUjFVjOlxVc2Vyc1xhZGl0eVxhbmFjb25kYTNcZW52c1xzYjNcTGliXHNpdGUtcGFja2FnZXNcc3RhYmxlX2Jhc2VsaW5lczNcY29tbW9uXHV0aWxzLnB5lIwEZnVuY5SMGWNvbnN0YW50X2ZuLjxsb2NhbHM+LmZ1bmOUS4NDCPiAANgPEogKlEMAlIwDdmFslIWUKXSUUpR9lCiMC19fcGFja2FnZV9flIwYc3RhYmxlX2Jhc2VsaW5lczMuY29tbW9ulIwIX19uYW1lX1+UjB5zdGFibGVfYmFzZWxpbmVzMy5jb21tb24udXRpbHOUjAhfX2ZpbGVfX5RoDHVOTmgAjBBfbWFrZV9lbXB0eV9jZWxslJOUKVKUhZR0lFKUjBxjbG91ZHBpY2tsZS5jbG91ZHBpY2tsZV9mYXN0lIwSX2Z1bmN0aW9uX3NldHN0YXRllJOUaCB9lH2UKGgYaA2MDF9fcXVhbG5hbWVfX5RoDowPX19hbm5vdGF0aW9uc19flH2UjA5fX2t3ZGVmYXVsdHNfX5ROjAxfX2RlZmF1bHRzX1+UTowKX19tb2R1bGVfX5RoGYwHX19kb2NfX5ROjAtfX2Nsb3N1cmVfX5RoAIwKX21ha2VfY2VsbJSTlEc/M6kqMFUyYYWUUpSFlIwXX2Nsb3VkcGlja2xlX3N1Ym1vZHVsZXOUXZSMC19fZ2xvYmFsc19flH2UdYaUhlIwLg=="}, "system_info": {"OS": "Windows-10-10.0.22621-SP0 10.0.22621", "Python": "3.11.4", "Stable-Baselines3": "2.1.0", "PyTorch": "2.0.1", "GPU Enabled": "True", "Numpy": "1.25.2", "Cloudpickle": "2.2.1", "Gymnasium": "0.28.1"}}
|
ppo-LunarLander-v2.zip
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:60feb7a67d0dd6fa568fa950d3439f57ba240f93635c0a0c4b5035514ccff908
|
| 3 |
+
size 146907
|
ppo-LunarLander-v2/_stable_baselines3_version
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
2.1.0
|
ppo-LunarLander-v2/data
ADDED
|
@@ -0,0 +1,99 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"policy_class": {
|
| 3 |
+
":type:": "<class 'abc.ABCMeta'>",
|
| 4 |
+
":serialized:": "gAWVOwAAAAAAAACMIXN0YWJsZV9iYXNlbGluZXMzLmNvbW1vbi5wb2xpY2llc5SMEUFjdG9yQ3JpdGljUG9saWN5lJOULg==",
|
| 5 |
+
"__module__": "stable_baselines3.common.policies",
|
| 6 |
+
"__doc__": "\n Policy class for actor-critic algorithms (has both policy and value prediction).\n Used by A2C, PPO and the likes.\n\n :param observation_space: Observation space\n :param action_space: Action space\n :param lr_schedule: Learning rate schedule (could be constant)\n :param net_arch: The specification of the policy and value networks.\n :param activation_fn: Activation function\n :param ortho_init: Whether to use or not orthogonal initialization\n :param use_sde: Whether to use State Dependent Exploration or not\n :param log_std_init: Initial value for the log standard deviation\n :param full_std: Whether to use (n_features x n_actions) parameters\n for the std instead of only (n_features,) when using gSDE\n :param use_expln: Use ``expln()`` function instead of ``exp()`` to ensure\n a positive standard deviation (cf paper). It allows to keep variance\n above zero and prevent it from growing too fast. In practice, ``exp()`` is usually enough.\n :param squash_output: Whether to squash the output using a tanh function,\n this allows to ensure boundaries when using gSDE.\n :param features_extractor_class: Features extractor to use.\n :param features_extractor_kwargs: Keyword arguments\n to pass to the features extractor.\n :param share_features_extractor: If True, the features extractor is shared between the policy and value networks.\n :param normalize_images: Whether to normalize images or not,\n dividing by 255.0 (True by default)\n :param optimizer_class: The optimizer to use,\n ``th.optim.Adam`` by default\n :param optimizer_kwargs: Additional keyword arguments,\n excluding the learning rate, to pass to the optimizer\n ",
|
| 7 |
+
"__init__": "<function ActorCriticPolicy.__init__ at 0x000001630D2B2E80>",
|
| 8 |
+
"_get_constructor_parameters": "<function ActorCriticPolicy._get_constructor_parameters at 0x000001630D2B2F20>",
|
| 9 |
+
"reset_noise": "<function ActorCriticPolicy.reset_noise at 0x000001630D2B2FC0>",
|
| 10 |
+
"_build_mlp_extractor": "<function ActorCriticPolicy._build_mlp_extractor at 0x000001630D2B3060>",
|
| 11 |
+
"_build": "<function ActorCriticPolicy._build at 0x000001630D2B3100>",
|
| 12 |
+
"forward": "<function ActorCriticPolicy.forward at 0x000001630D2B31A0>",
|
| 13 |
+
"extract_features": "<function ActorCriticPolicy.extract_features at 0x000001630D2B3240>",
|
| 14 |
+
"_get_action_dist_from_latent": "<function ActorCriticPolicy._get_action_dist_from_latent at 0x000001630D2B32E0>",
|
| 15 |
+
"_predict": "<function ActorCriticPolicy._predict at 0x000001630D2B3380>",
|
| 16 |
+
"evaluate_actions": "<function ActorCriticPolicy.evaluate_actions at 0x000001630D2B3420>",
|
| 17 |
+
"get_distribution": "<function ActorCriticPolicy.get_distribution at 0x000001630D2B34C0>",
|
| 18 |
+
"predict_values": "<function ActorCriticPolicy.predict_values at 0x000001630D2B3560>",
|
| 19 |
+
"__abstractmethods__": "frozenset()",
|
| 20 |
+
"_abc_impl": "<_abc._abc_data object at 0x000001630D2AA900>"
|
| 21 |
+
},
|
| 22 |
+
"verbose": 1,
|
| 23 |
+
"policy_kwargs": {},
|
| 24 |
+
"num_timesteps": 1015808,
|
| 25 |
+
"_total_timesteps": 1000000,
|
| 26 |
+
"_num_timesteps_at_start": 0,
|
| 27 |
+
"seed": null,
|
| 28 |
+
"action_noise": null,
|
| 29 |
+
"start_time": 1693165098167503900,
|
| 30 |
+
"learning_rate": 0.0003,
|
| 31 |
+
"tensorboard_log": null,
|
| 32 |
+
"_last_obs": {
|
| 33 |
+
":type:": "<class 'numpy.ndarray'>",
|
| 34 |
+
":serialized:": "gAWVdQIAAAAAAACMEm51bXB5LmNvcmUubnVtZXJpY5SMC19mcm9tYnVmZmVylJOUKJYAAgAAAAAAAJp56Tu4pN27MFHSPYUb4L1BwYU83n0svgAAgD8AAIA/ZkQVPMMlJzk2VKC7J5Jdu3HhW7tPbDa9AAAAAAAAAADAVeA99kRMutZsvDvAmsm4j41xugGmwbcAAIA/AACAP+aCHL32DEW6VgFkunnp2DwZNCe6AgaruwAAgD8AAIA/zTTjPApbGDoOTr87distPKKo+jnYjAs5AAAAAAAAAACaJbo7PQYmOkXchrutpBY9BshkOi9vATwAAAAAAAAAAI19kr5+2Pc+fsFKPl+qp74RLBK9Gi8iPgAAAAAAAAAAzaYDPLjG1rnyFIo7ZgANvbC4TjsqtPe9AAAAAAAAgD9mlhy99rxzuubCgjm7Jog0P2+ZOi3xlLgAAIA/AACAPwBwxTvh6Ia6KLoYunFhCjZmWdm5bm4sOQAAgD8AAIA/MwD4vMMRGLpKx6G6/MbJtcWZOLutlLw5AACAPwAAgD8NGa69bSNCPt+TCT48I4q+ZyHZPHUeQb0AAAAAAAAAAK0gOL7YBf0+YFlYPsuvn76ugTQ92bsnPAAAAAAAAAAAM5trvDgzq7tZh5E8ZAqBPEUMGr1QMVw9AACAPwAAgD/NiKi7KVxNN0VDC7t6N/K8JBqoO82SVLsAAAAAAAAAAAAsL73sx+Y6ntkPuyKqmj1feA66av+huwAAAAAAAIA/lIwFbnVtcHmUjAVkdHlwZZSTlIwCZjSUiYiHlFKUKEsDjAE8lE5OTkr/////Sv////9LAHSUYksQSwiGlIwBQ5R0lFKULg=="
|
| 35 |
+
},
|
| 36 |
+
"_last_episode_starts": {
|
| 37 |
+
":type:": "<class 'numpy.ndarray'>",
|
| 38 |
+
":serialized:": "gAWVgwAAAAAAAACMEm51bXB5LmNvcmUubnVtZXJpY5SMC19mcm9tYnVmZmVylJOUKJYQAAAAAAAAAAAAAAAAAAAAAAAAAAAAAACUjAVudW1weZSMBWR0eXBllJOUjAJiMZSJiIeUUpQoSwOMAXyUTk5OSv////9K/////0sAdJRiSxCFlIwBQ5R0lFKULg=="
|
| 39 |
+
},
|
| 40 |
+
"_last_original_obs": null,
|
| 41 |
+
"_episode_num": 0,
|
| 42 |
+
"use_sde": false,
|
| 43 |
+
"sde_sample_freq": -1,
|
| 44 |
+
"_current_progress_remaining": -0.015808000000000044,
|
| 45 |
+
"_stats_window_size": 100,
|
| 46 |
+
"ep_info_buffer": {
|
| 47 |
+
":type:": "<class 'collections.deque'>",
|
| 48 |
+
":serialized:": "gAWVQQwAAAAAAACMC2NvbGxlY3Rpb25zlIwFZGVxdWWUk5QpS2SGlFKUKH2UKIwBcpRHQHFXCgf2boeMAWyUTQYBjAF0lEdAkktlJYkmhXV9lChoBkdAcFOiAlOXV2gHTQUBaAhHQJJLpsJpnHx1fZQoaAZHQHLaDBRAKOVoB0v6aAhHQJJLthttQ9B1fZQoaAZHQHGWJ44ZMtdoB01HAWgIR0CSS+XT3IuHdX2UKGgGR0BwaEHE/B3zaAdNBQFoCEdAkk0jtb9qDnV9lChoBkdAcPp3V09yLmgHS/xoCEdAkk0qXBxgiXV9lChoBkdAcqnmLcbiqGgHTT0BaAhHQJJOB6Tnq3V1fZQoaAZHQDwx15jYqXpoB0vgaAhHQJJP73QD3dt1fZQoaAZHQHD0Lz9S/CZoB00ZAWgIR0CSUIdJ8OTadX2UKGgGR0Bx2IoQWepXaAdNAQFoCEdAklIpH/cWTHV9lChoBkdAcI5Hh0hePmgHTRoBaAhHQJJSZawD/2l1fZQoaAZHQHH633YcvM9oB00vAWgIR0CSUp+Yc/+sdX2UKGgGR0BwxeYJE6T4aAdNIwFoCEdAklLYBzV+Z3V9lChoBkdAbKPiobXHzmgHTQ0BaAhHQJJTbsF+uvF1fZQoaAZHQHLZjbeuV5doB00BAWgIR0CSU7JUo8ZDdX2UKGgGR0BxUmT/yXlbaAdNDQFoCEdAklRE8A7xNXV9lChoBkdAbRk1Aqur62gHTQkBaAhHQJJUdKraM751fZQoaAZHQG1OpZW7vohoB00OAWgIR0CSVMyWAwwkdX2UKGgGR0BwD3FwT/Q0aAdNCgFoCEdAklXuI68xsXV9lChoBkdAcC+h9LHuJGgHTV4BaAhHQJJ9clPacqh1fZQoaAZHQG+3qNQ0oBtoB00NAWgIR0CShb1KGtZFdX2UKGgGR0BZR0n9ehPCaAdN6ANoCEdAkphSHARChXV9lChoBkdAUaB8iOearmgHTegDaAhHQJKquYUnG851fZQoaAZHQFu0IKc/dIpoB03oA2gIR0CSrK9DQZ4wdX2UKGgGR0BY7t6gM+eOaAdN6ANoCEdAkrFbQb+98XV9lChoBkdAWGrlq8DjimgHTegDaAhHQJKyuYfGMn91fZQoaAZHQFoYNzKcNH9oB03oA2gIR0CStkfO2RaHdX2UKGgGR0BgLsdJaq0daAdN6ANoCEdAkrbDxG2CunV9lChoBkdAWe6yZ8a4t2gHTegDaAhHQJK3SdlNDdB1fZQoaAZHQF8gMoMKCxxoB03oA2gIR0CSt7+d9UjtdX2UKGgGR0BRVkmhM8HOaAdN6ANoCEdAkrjvva11GXV9lChoBkdAV48yULUkOmgHTegDaAhHQJK5h1GLDQ91fZQoaAZHQF7kpMHryDtoB03oA2gIR0CSuruMdcSodX2UKGgGR0BUz6BI4EOiaAdN6ANoCEdAkrsh6nivPnV9lChoBkdAUGhbmlqJuWgHTegDaAhHQJK9sU9IPLB1fZQoaAZHQFHi55qubI9oB03oA2gIR0CSvvTsIE8rdX2UKGgGR0Beb3rhR64UaAdN6ANoCEdAkuwcbaRISXV9lChoBkdAX9I/1QIldGgHTegDaAhHQJL8y4b0e2d1fZQoaAZHQGDwMlC1JDpoB03oA2gIR0CTDRZOzposdX2UKGgGR0BSh8JUo8ZDaAdN6ANoCEdAkw6v4qPOp3V9lChoBkdAXvgyoGY8dWgHTegDaAhHQJMSoHv+fiB1fZQoaAZHQGF4ZFPSDyxoB03oA2gIR0CTE86Z6UqydX2UKGgGR0BbO/r4WUKRaAdN6ANoCEdAkxc4FA3T/nV9lChoBkdAXkYvsZ5zHWgHTegDaAhHQJMXsvqTr3V1fZQoaAZHQFgVHi3ocJdoB03oA2gIR0CTGCm7aqS6dX2UKGgGR0BeLpfhMrVfaAdN6ANoCEdAkxighwEQoXV9lChoBkdATmY+GGmDUWgHTegDaAhHQJMZ0Ka5PM11fZQoaAZHQGJNoj4YaYNoB03oA2gIR0CTGlfP5YYBdX2UKGgGR0BhUy8FpwjuaAdN6ANoCEdAkxtGcSXdCXV9lChoBkdAXLY/2TPjXGgHTegDaAhHQJMbif7Jnxt1fZQoaAZHQEbrT0g8r7RoB03oA2gIR0CTHUNXHR1HdX2UKGgGR0BVCrOiWVu8aAdN6ANoCEdAkx5+ws5GSnV9lChoBkdAWWB9YwIt2GgHTegDaAhHQJNLuKWLP2R1fZQoaAZHQGJopMpPRAtoB03oA2gIR0CTXIqQiiZfdX2UKGgGR0BcVyR8twrEaAdN6ANoCEdAk2w5soDxLHV9lChoBkdAWGyOOsDGLmgHTegDaAhHQJNtweS0Sh91fZQoaAZHQFazlFMIu5BoB03oA2gIR0CTca9tuUD/dX2UKGgGR0Ba1xUBGQS0aAdN6ANoCEdAk3LflZHNHHV9lChoBkdAWXK4LCvX9WgHTegDaAhHQJN1vcSGrS51fZQoaAZHQF/lV4X40uVoB03oA2gIR0CTdiU34sVddX2UKGgGR0Bi2ITCcf/4aAdN6ANoCEdAk3aGdiDujXV9lChoBkdAYRbJYkmhNGgHTegDaAhHQJN23ojfNzN1fZQoaAZHQFuCNX5nDixoB03oA2gIR0CTd6xcE/0NdX2UKGgGR0BTIsafjCHiaAdN6ANoCEdAk3gRw2l2vHV9lChoBkdAX5tjlPrOaGgHTegDaAhHQJN49AnlXBB1fZQoaAZHQFyzdfb9If9oB03oA2gIR0CTeT/I8yN5dX2UKGgGR0BelHEQ5FPSaAdN6ANoCEdAk3snPE87p3V9lChoBkdAYshtBOYYzmgHTegDaAhHQJN8/UDuBtl1fZQoaAZHQGAlExqO939oB03oA2gIR0CTqXU8FINFdX2UKGgGR0BhMjfxc3VDaAdN6ANoCEdAk7nQX2ugYnV9lChoBkdAYe/B1s+FDmgHTegDaAhHQJPHWptJnQJ1fZQoaAZHQGBO4SpR4yJoB03oA2gIR0CTyOLVnVXndX2UKGgGR0BhG2XgLqlhaAdN6ANoCEdAk8z3QD3dsXV9lChoBkdAYDZpeu3c6GgHTegDaAhHQJPN5/RVp9J1fZQoaAZHQGBdK2BreqJoB03oA2gIR0CT0Dvjfek6dX2UKGgGR0Bg2XRqoIfKaAdN6ANoCEdAk9CR8IAwPHV9lChoBkdAZpGWtU4rBmgHTegDaAhHQJPQ4cYIjW11fZQoaAZHQGF2HYQJ5VxoB03oA2gIR0CT0TCgsbvPdX2UKGgGR0BbnvgJkXk6aAdN6ANoCEdAk9Hq/IsAenV9lChoBkdAVeu9US7GvWgHTegDaAhHQJPSSkDZDiR1fZQoaAZHQGKFOlfqoqFoB03oA2gIR0CT0vdQwblzdX2UKGgGR0Bce+0G/vfCaAdN6ANoCEdAk9Mthy8zynV9lChoBkdAWudGrjo6jmgHTegDaAhHQJPUxhqj8DV1fZQoaAZHQGO/kqc3EQ5oB03oA2gIR0CT1hka/ATJdX2UKGgGR0BX75jYqXnhaAdN6ANoCEdAlANnscABDHV9lChoBkdAWY/2kBS1mmgHTegDaAhHQJQUEbaRISV1fZQoaAZHQGFDo8hcJMRoB03oA2gIR0CUI/cTrVvudX2UKGgGR0BvKFDF6zE8aAdNjQNoCEdAlCSSvX9R8HV9lChoBkdAYQHvYODraGgHTegDaAhHQJQlgExIre91fZQoaAZHQGM2G+sYEW9oB03oA2gIR0CUKXDgqEvkdX2UKGgGR0BU7gHNX5nEaAdN6ANoCEdAlC3lpTMq0HV9lChoBkdAYgOZJkGzKWgHTegDaAhHQJQuTh73PAx1fZQoaAZHQFUPtmL9/BpoB03oA2gIR0CULrJxNqQBdX2UKGgGR0BbQIH5aePJaAdN6ANoCEdAlC8RrJr+HnV9lChoBkdAXslGrjo6jmgHTegDaAhHQJQv9gmZ3LV1fZQoaAZHQFpWRFqi48VoB03oA2gIR0CUMGWluWKNdX2UKGgGR0BkWma4MF2WaAdN6ANoCEdAlDEzf779AHV9lChoBkdAXrodHUc4pGgHTegDaAhHQJQxdw5vLox1fZQoaAZHQFz2WdEsrd5oB03oA2gIR0CUM2SXt0FKdX2UKGgGR0BjucUbkwN9aAdN6ANoCEdAlDUa7NB4U3VlLg=="
|
| 49 |
+
},
|
| 50 |
+
"ep_success_buffer": {
|
| 51 |
+
":type:": "<class 'collections.deque'>",
|
| 52 |
+
":serialized:": "gAWVIAAAAAAAAACMC2NvbGxlY3Rpb25zlIwFZGVxdWWUk5QpS2SGlFKULg=="
|
| 53 |
+
},
|
| 54 |
+
"_n_updates": 372,
|
| 55 |
+
"observation_space": {
|
| 56 |
+
":type:": "<class 'gymnasium.spaces.box.Box'>",
|
| 57 |
+
":serialized:": "gAWVdgIAAAAAAACMFGd5bW5hc2l1bS5zcGFjZXMuYm94lIwDQm94lJOUKYGUfZQojAVkdHlwZZSMBW51bXB5lIwFZHR5cGWUk5SMAmY0lImIh5RSlChLA4wBPJROTk5K/////0r/////SwB0lGKMDWJvdW5kZWRfYmVsb3eUjBJudW1weS5jb3JlLm51bWVyaWOUjAtfZnJvbWJ1ZmZlcpSTlCiWCAAAAAAAAAABAQEBAQEBAZRoCIwCYjGUiYiHlFKUKEsDjAF8lE5OTkr/////Sv////9LAHSUYksIhZSMAUOUdJRSlIwNYm91bmRlZF9hYm92ZZRoESiWCAAAAAAAAAABAQEBAQEBAZRoFUsIhZRoGXSUUpSMBl9zaGFwZZRLCIWUjANsb3eUaBEoliAAAAAAAAAAAAC0wgAAtMIAAKDAAACgwNsPScAAAKDAAAAAgAAAAICUaAtLCIWUaBl0lFKUjARoaWdolGgRKJYgAAAAAAAAAAAAtEIAALRCAACgQAAAoEDbD0lAAACgQAAAgD8AAIA/lGgLSwiFlGgZdJRSlIwIbG93X3JlcHKUjFtbLTkwLiAgICAgICAgLTkwLiAgICAgICAgIC01LiAgICAgICAgIC01LiAgICAgICAgIC0zLjE0MTU5MjcgIC01LgogIC0wLiAgICAgICAgIC0wLiAgICAgICBdlIwJaGlnaF9yZXBylIxTWzkwLiAgICAgICAgOTAuICAgICAgICAgNS4gICAgICAgICA1LiAgICAgICAgIDMuMTQxNTkyNyAgNS4KICAxLiAgICAgICAgIDEuICAgICAgIF2UjApfbnBfcmFuZG9tlE51Yi4=",
|
| 58 |
+
"dtype": "float32",
|
| 59 |
+
"bounded_below": "[ True True True True True True True True]",
|
| 60 |
+
"bounded_above": "[ True True True True True True True True]",
|
| 61 |
+
"_shape": [
|
| 62 |
+
8
|
| 63 |
+
],
|
| 64 |
+
"low": "[-90. -90. -5. -5. -3.1415927 -5.\n -0. -0. ]",
|
| 65 |
+
"high": "[90. 90. 5. 5. 3.1415927 5.\n 1. 1. ]",
|
| 66 |
+
"low_repr": "[-90. -90. -5. -5. -3.1415927 -5.\n -0. -0. ]",
|
| 67 |
+
"high_repr": "[90. 90. 5. 5. 3.1415927 5.\n 1. 1. ]",
|
| 68 |
+
"_np_random": null
|
| 69 |
+
},
|
| 70 |
+
"action_space": {
|
| 71 |
+
":type:": "<class 'gymnasium.spaces.discrete.Discrete'>",
|
| 72 |
+
":serialized:": "gAWVnwEAAAAAAACMGWd5bW5hc2l1bS5zcGFjZXMuZGlzY3JldGWUjAhEaXNjcmV0ZZSTlCmBlH2UKIwBbpSMFW51bXB5LmNvcmUubXVsdGlhcnJheZSMBnNjYWxhcpSTlIwFbnVtcHmUjAVkdHlwZZSTlIwCaTiUiYiHlFKUKEsDjAE8lE5OTkr/////Sv////9LAHSUYkMIBAAAAAAAAACUhpRSlIwFc3RhcnSUaAhoDkMIAAAAAAAAAACUhpRSlIwGX3NoYXBllCmMBWR0eXBllGgOjApfbnBfcmFuZG9tlIwUbnVtcHkucmFuZG9tLl9waWNrbGWUjBBfX2dlbmVyYXRvcl9jdG9ylJOUjAVQQ0c2NJRoG4wUX19iaXRfZ2VuZXJhdG9yX2N0b3KUk5SGlFKUfZQojA1iaXRfZ2VuZXJhdG9ylIwFUENHNjSUjAVzdGF0ZZR9lChoJooQVWit40MD1/+RECJ/K8NKGIwDaW5jlIoRjS1pR1UecEBB1rNOLUJ72AB1jApoYXNfdWludDMylEsAjAh1aW50ZWdlcpRLAHVidWIu",
|
| 73 |
+
"n": "4",
|
| 74 |
+
"start": "0",
|
| 75 |
+
"_shape": [],
|
| 76 |
+
"dtype": "int64",
|
| 77 |
+
"_np_random": "Generator(PCG64)"
|
| 78 |
+
},
|
| 79 |
+
"n_envs": 16,
|
| 80 |
+
"n_steps": 1024,
|
| 81 |
+
"gamma": 0.999,
|
| 82 |
+
"gae_lambda": 0.97,
|
| 83 |
+
"ent_coef": 0.01,
|
| 84 |
+
"vf_coef": 0.5,
|
| 85 |
+
"max_grad_norm": 0.5,
|
| 86 |
+
"batch_size": 64,
|
| 87 |
+
"n_epochs": 6,
|
| 88 |
+
"clip_range": {
|
| 89 |
+
":type:": "<class 'function'>",
|
| 90 |
+
":serialized:": "gAWVlgIAAAAAAACMF2Nsb3VkcGlja2xlLmNsb3VkcGlja2xllIwOX21ha2VfZnVuY3Rpb26Uk5QoaACMDV9idWlsdGluX3R5cGWUk5SMCENvZGVUeXBllIWUUpQoSwFLAEsASwFLAUsTQwiVAZcAiQFTAJROhZQpjAFflIWUjFVjOlxVc2Vyc1xhZGl0eVxhbmFjb25kYTNcZW52c1xzYjNcTGliXHNpdGUtcGFja2FnZXNcc3RhYmxlX2Jhc2VsaW5lczNcY29tbW9uXHV0aWxzLnB5lIwEZnVuY5SMGWNvbnN0YW50X2ZuLjxsb2NhbHM+LmZ1bmOUS4NDCPiAANgPEogKlEMAlIwDdmFslIWUKXSUUpR9lCiMC19fcGFja2FnZV9flIwYc3RhYmxlX2Jhc2VsaW5lczMuY29tbW9ulIwIX19uYW1lX1+UjB5zdGFibGVfYmFzZWxpbmVzMy5jb21tb24udXRpbHOUjAhfX2ZpbGVfX5RoDHVOTmgAjBBfbWFrZV9lbXB0eV9jZWxslJOUKVKUhZR0lFKUjBxjbG91ZHBpY2tsZS5jbG91ZHBpY2tsZV9mYXN0lIwSX2Z1bmN0aW9uX3NldHN0YXRllJOUaCB9lH2UKGgYaA2MDF9fcXVhbG5hbWVfX5RoDowPX19hbm5vdGF0aW9uc19flH2UjA5fX2t3ZGVmYXVsdHNfX5ROjAxfX2RlZmF1bHRzX1+UTowKX19tb2R1bGVfX5RoGYwHX19kb2NfX5ROjAtfX2Nsb3N1cmVfX5RoAIwKX21ha2VfY2VsbJSTlEc/yZmZmZmZmoWUUpSFlIwXX2Nsb3VkcGlja2xlX3N1Ym1vZHVsZXOUXZSMC19fZ2xvYmFsc19flH2UdYaUhlIwLg=="
|
| 91 |
+
},
|
| 92 |
+
"clip_range_vf": null,
|
| 93 |
+
"normalize_advantage": true,
|
| 94 |
+
"target_kl": null,
|
| 95 |
+
"lr_schedule": {
|
| 96 |
+
":type:": "<class 'function'>",
|
| 97 |
+
":serialized:": "gAWVlgIAAAAAAACMF2Nsb3VkcGlja2xlLmNsb3VkcGlja2xllIwOX21ha2VfZnVuY3Rpb26Uk5QoaACMDV9idWlsdGluX3R5cGWUk5SMCENvZGVUeXBllIWUUpQoSwFLAEsASwFLAUsTQwiVAZcAiQFTAJROhZQpjAFflIWUjFVjOlxVc2Vyc1xhZGl0eVxhbmFjb25kYTNcZW52c1xzYjNcTGliXHNpdGUtcGFja2FnZXNcc3RhYmxlX2Jhc2VsaW5lczNcY29tbW9uXHV0aWxzLnB5lIwEZnVuY5SMGWNvbnN0YW50X2ZuLjxsb2NhbHM+LmZ1bmOUS4NDCPiAANgPEogKlEMAlIwDdmFslIWUKXSUUpR9lCiMC19fcGFja2FnZV9flIwYc3RhYmxlX2Jhc2VsaW5lczMuY29tbW9ulIwIX19uYW1lX1+UjB5zdGFibGVfYmFzZWxpbmVzMy5jb21tb24udXRpbHOUjAhfX2ZpbGVfX5RoDHVOTmgAjBBfbWFrZV9lbXB0eV9jZWxslJOUKVKUhZR0lFKUjBxjbG91ZHBpY2tsZS5jbG91ZHBpY2tsZV9mYXN0lIwSX2Z1bmN0aW9uX3NldHN0YXRllJOUaCB9lH2UKGgYaA2MDF9fcXVhbG5hbWVfX5RoDowPX19hbm5vdGF0aW9uc19flH2UjA5fX2t3ZGVmYXVsdHNfX5ROjAxfX2RlZmF1bHRzX1+UTowKX19tb2R1bGVfX5RoGYwHX19kb2NfX5ROjAtfX2Nsb3N1cmVfX5RoAIwKX21ha2VfY2VsbJSTlEc/M6kqMFUyYYWUUpSFlIwXX2Nsb3VkcGlja2xlX3N1Ym1vZHVsZXOUXZSMC19fZ2xvYmFsc19flH2UdYaUhlIwLg=="
|
| 98 |
+
}
|
| 99 |
+
}
|
ppo-LunarLander-v2/policy.optimizer.pth
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:ee800822a694302fc6a217ef185e231b8286881414b18eebe244c4e435f4a72b
|
| 3 |
+
size 87929
|
ppo-LunarLander-v2/policy.pth
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:434f18f8816f8997936f66dea4c9050235e001ce1bbea9c5b67f87accbbc1bdd
|
| 3 |
+
size 43329
|
ppo-LunarLander-v2/pytorch_variables.pth
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:d030ad8db708280fcae77d87e973102039acd23a11bdecc3db8eb6c0ac940ee1
|
| 3 |
+
size 431
|
ppo-LunarLander-v2/system_info.txt
ADDED
|
@@ -0,0 +1,8 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
- OS: Windows-10-10.0.22621-SP0 10.0.22621
|
| 2 |
+
- Python: 3.11.4
|
| 3 |
+
- Stable-Baselines3: 2.1.0
|
| 4 |
+
- PyTorch: 2.0.1
|
| 5 |
+
- GPU Enabled: True
|
| 6 |
+
- Numpy: 1.25.2
|
| 7 |
+
- Cloudpickle: 2.2.1
|
| 8 |
+
- Gymnasium: 0.28.1
|
results.json
CHANGED
|
@@ -1 +1 @@
|
|
| 1 |
-
{"mean_reward":
|
|
|
|
| 1 |
+
{"mean_reward": 266.46527890000004, "std_reward": 20.495153794780187, "is_deterministic": true, "n_eval_episodes": 10, "eval_datetime": "2023-08-27T16:03:46.620705"}
|