adyprat commited on
Commit
7a3c925
·
1 Parent(s): d0b177f

Updated PPO agent

Browse files
README.md CHANGED
@@ -16,7 +16,7 @@ model-index:
16
  type: LunarLander-v2
17
  metrics:
18
  - type: mean_reward
19
- value: 216.84 +/- 99.53
20
  name: mean_reward
21
  verified: false
22
  ---
 
16
  type: LunarLander-v2
17
  metrics:
18
  - type: mean_reward
19
+ value: 266.47 +/- 20.50
20
  name: mean_reward
21
  verified: false
22
  ---
config.json CHANGED
@@ -1 +1 @@
1
- {"policy_class": {":type:": "<class 'abc.ABCMeta'>", ":serialized:": "gAWVOwAAAAAAAACMIXN0YWJsZV9iYXNlbGluZXMzLmNvbW1vbi5wb2xpY2llc5SMEUFjdG9yQ3JpdGljUG9saWN5lJOULg==", "__module__": "stable_baselines3.common.policies", "__doc__": "\n Policy class for actor-critic algorithms (has both policy and value prediction).\n Used by A2C, PPO and the likes.\n\n :param observation_space: Observation space\n :param action_space: Action space\n :param lr_schedule: Learning rate schedule (could be constant)\n :param net_arch: The specification of the policy and value networks.\n :param activation_fn: Activation function\n :param ortho_init: Whether to use or not orthogonal initialization\n :param use_sde: Whether to use State Dependent Exploration or not\n :param log_std_init: Initial value for the log standard deviation\n :param full_std: Whether to use (n_features x n_actions) parameters\n for the std instead of only (n_features,) when using gSDE\n :param use_expln: Use ``expln()`` function instead of ``exp()`` to ensure\n a positive standard deviation (cf paper). It allows to keep variance\n above zero and prevent it from growing too fast. In practice, ``exp()`` is usually enough.\n :param squash_output: Whether to squash the output using a tanh function,\n this allows to ensure boundaries when using gSDE.\n :param features_extractor_class: Features extractor to use.\n :param features_extractor_kwargs: Keyword arguments\n to pass to the features extractor.\n :param share_features_extractor: If True, the features extractor is shared between the policy and value networks.\n :param normalize_images: Whether to normalize images or not,\n dividing by 255.0 (True by default)\n :param optimizer_class: The optimizer to use,\n ``th.optim.Adam`` by default\n :param optimizer_kwargs: Additional keyword arguments,\n excluding the learning rate, to pass to the optimizer\n ", "__init__": "<function ActorCriticPolicy.__init__ at 0x7cb6613363b0>", "_get_constructor_parameters": "<function ActorCriticPolicy._get_constructor_parameters at 0x7cb661336440>", "reset_noise": "<function ActorCriticPolicy.reset_noise at 0x7cb6613364d0>", "_build_mlp_extractor": "<function ActorCriticPolicy._build_mlp_extractor at 0x7cb661336560>", "_build": "<function ActorCriticPolicy._build at 0x7cb6613365f0>", "forward": "<function ActorCriticPolicy.forward at 0x7cb661336680>", "extract_features": "<function ActorCriticPolicy.extract_features at 0x7cb661336710>", "_get_action_dist_from_latent": "<function ActorCriticPolicy._get_action_dist_from_latent at 0x7cb6613367a0>", "_predict": "<function ActorCriticPolicy._predict at 0x7cb661336830>", "evaluate_actions": "<function ActorCriticPolicy.evaluate_actions at 0x7cb6613368c0>", "get_distribution": "<function ActorCriticPolicy.get_distribution at 0x7cb661336950>", "predict_values": "<function ActorCriticPolicy.predict_values at 0x7cb6613369e0>", "__abstractmethods__": "frozenset()", "_abc_impl": "<_abc._abc_data object at 0x7cb661338a00>"}, "verbose": 1, "policy_kwargs": {}, "num_timesteps": 1024000, "_total_timesteps": 1000000, "_num_timesteps_at_start": 0, "seed": null, "action_noise": null, "start_time": 1693148242521917335, "learning_rate": 0.0003, "tensorboard_log": null, "_last_obs": {":type:": "<class 'numpy.ndarray'>", ":serialized:": "gAWV9QIAAAAAAACMEm51bXB5LmNvcmUubnVtZXJpY5SMC19mcm9tYnVmZmVylJOUKJaAAgAAAAAAAA2XQL492Bo8uAiztJGzUDJtl669DG0fNAAAgD8AAIA/M/9APoGzu7xOFL07Q/RLuvwaI77jQR+7AACAPwAAgD/zs5S9FEiMugBsd7npyoe08t+AOgNkjzgAAAAAAACAPyZXLL7t3JM/UuD6vtoNGL8F4UC+uNucvQAAAAAAAAAAzb/cPMTjsT+ZtA0+vRiPvrPe3jxPII49AAAAAAAAAACtsgu+T8NIPubGuD1mOae+SAeFPQ4Ojz0AAAAAAAAAAIAwVz0meak/9VPaPmZD+L7n0yc9XmCHPgAAAAAAAAAATYMsvnSIi7xQXLc4TqjFN3YPAT7Bbhe4AACAPwAAgD8gCBm+dmsmP4uDQL2acOW+KIG9vaUHAT0AAAAAAAAAALNZf70p5DW6wCIXtadgDLBN2iI7jo1mNAAAgD8AAIA/3TFhvrt+jz7lZ9q8RJ6OvnRoPb24YiA9AAAAAAAAAACAHV+9boa8P+N+o76yoOu8AjkxvSK3Ar4AAAAAAAAAAMBdKb6p2km8AJ5Wu27RiLk3UrM9CAaJOgAAgD8AAIA/s6sdPo+AHj+sFsw9CROyvjxR4z0CHZg7AAAAAAAAAACaSTK80i2CPnM0973wepe+W+cmvToMiTwAAAAAAAAAAJNbKr70coq8C8yZOAQ79jUIkfI9fgG6twAAgD8AAIA/42WpvqfSaz5v4DI+5X+NvgzMA722HSg9AAAAAAAAAABzmSe+AZGRvEAbLjvAQ4Y50lgBPnD7aroAAIA/AACAP6Zf5j1cyy66Gr7Otd5jkq8XW6m7Wjz8NAAAAAAAAIA/HXyWPl8xHD9SAIY9+pPVvmYMHT62NeC9AAAAAAAAAACUjAVudW1weZSMBWR0eXBllJOUjAJmNJSJiIeUUpQoSwOMATyUTk5OSv////9K/////0sAdJRiSxRLCIaUjAFDlHSUUpQu"}, "_last_episode_starts": {":type:": "<class 'numpy.ndarray'>", ":serialized:": "gAWVhwAAAAAAAACMEm51bXB5LmNvcmUubnVtZXJpY5SMC19mcm9tYnVmZmVylJOUKJYUAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAlIwFbnVtcHmUjAVkdHlwZZSTlIwCYjGUiYiHlFKUKEsDjAF8lE5OTkr/////Sv////9LAHSUYksUhZSMAUOUdJRSlC4="}, "_last_original_obs": null, "_episode_num": 0, "use_sde": false, "sde_sample_freq": -1, "_current_progress_remaining": -0.02400000000000002, "_stats_window_size": 100, "ep_info_buffer": {":type:": "<class 'collections.deque'>", ":serialized:": "gAWVBQwAAAAAAACMC2NvbGxlY3Rpb25zlIwFZGVxdWWUk5QpS2SGlFKUKH2UKIwBcpRHQHBTNRm9QGiMAWyUS+6MAXSUR0CkthdlEqlQdX2UKGgGR0BxSL1schkiaAdNRAFoCEdApLbN+w1R+HV9lChoBkdAYnXzundfs2gHTegDaAhHQKS5STJyQxN1fZQoaAZHQGIhtXxOLzhoB03oA2gIR0CkuXMzEaVEdX2UKGgGR0ByEE72criEaAdNVQFoCEdApLpRazNUwXV9lChoBkdAX5iCSRr8BWgHTegDaAhHQKS6gy9mHxl1fZQoaAZHQGD3PJq7AcloB03oA2gIR0CkvIQAEMb4dX2UKGgGR0BxY9Ed/8VIaAdNDwFoCEdApL1g6XBxgnV9lChoBkdAcBFoFFDv3WgHS9toCEdApL2Flbu+iHV9lChoBkdAcU3KMefZmWgHTSEBaAhHQKS9l+BH09R1fZQoaAZHQHJ34pH7P6doB0vmaAhHQKS+Puk1uR91fZQoaAZHQHGauCkGiYdoB0vXaAhHQKS+Rfl6qsF1fZQoaAZHQG7hnyNGViZoB0vmaAhHQKS+qnNxEOR1fZQoaAZHQHB82Z7XxvxoB0vvaAhHQKS+qrbQC0Z1fZQoaAZHQGGmgOBlMAZoB03oA2gIR0CkvztLL6k7dX2UKGgGR0Bp56AjIJZ4aAdNZAFoCEdApMAmOdXkpHV9lChoBkdAb7BWjGkvb2gHS99oCEdApMDQeV9nb3V9lChoBkdAbZTNqQA+6mgHS9FoCEdApMESasp5NXV9lChoBkdAYRmImgJ1JWgHTegDaAhHQKTBRGdZq211fZQoaAZHQHGJRbB42TBoB0v5aAhHQKTBc0WuX/p1fZQoaAZHQHGSse8wpONoB0v3aAhHQKTB8uGsV+J1fZQoaAZHQHHZbZSNwR5oB0vRaAhHQKTC9w7T2Fp1fZQoaAZHQG85g5BC2MNoB0vcaAhHQKTDLO58Sf11fZQoaAZHQHBHaR+z+m5oB0vyaAhHQKTDoP07KaJ1fZQoaAZHQGCJKnvUjLVoB03oA2gIR0Ckw6+3pfQbdX2UKGgGR0BhUEyFfzBiaAdN6ANoCEdApMPGg13t8nV9lChoBkdAcivFGG21D2gHTbIBaAhHQKTEDyU9pyp1fZQoaAZHQHBo51vES/VoB0vQaAhHQKTEFNLUTct1fZQoaAZHQG+uq2SdOItoB0vqaAhHQKTEOoG6f8N1fZQoaAZHQG223nZCfHxoB00GAWgIR0CkxIUG3WnTdX2UKGgGR0BxsICyQgcMaAdL2mgIR0CkxbhtDUmVdX2UKGgGR0Bul+o5xR2saAdNCgFoCEdApMcfGn4wiHV9lChoBkdAbau3GXHBDWgHS/9oCEdApMe3QyAQQXV9lChoBkdAb+brylN1yWgHS9VoCEdApMiI6ySmqHV9lChoBkdAb8/hXKbKBGgHS/FoCEdApMjRaxHG0nV9lChoBkdAcKDR/EwWWWgHS/toCEdApMjY7/4qPXV9lChoBkdAbfhKGtZFHGgHS+loCEdApMlGI0qH5HV9lChoBkdAa6CAVfu1GGgHS+FoCEdApMltRHf/FXV9lChoBkdAcELH58BuGmgHS+FoCEdApMl0POIInnV9lChoBkdAYJ/7N0NjLGgHTegDaAhHQKTKXXf642F1fZQoaAZHQHESvyoXKr9oB00DAWgIR0CkyoUcOskqdX2UKGgGR0BuHre40/GEaAdL4GgIR0Cky3xDLKV6dX2UKGgGR0BttBXIU8FIaAdNqgFoCEdApMuJQemvXHV9lChoBkdAbzGS8J2MbWgHS9hoCEdApMyeqJdjXnV9lChoBkdAcM0Hoouwo2gHTQQBaAhHQKTOVe/pMYd1fZQoaAZHQHAy/WlMyrRoB0vtaAhHQKTOiVh1DBx1fZQoaAZHQHHi+h0yP+5oB0vlaAhHQKTOlLZi/fx1fZQoaAZHQHAOLGm1pkBoB0vpaAhHQKTOuY4yXUp1fZQoaAZHQG/NfEXLvCxoB0vzaAhHQKTPn28IzFd1fZQoaAZHQHGkR3NcGC9oB00EAWgIR0Ckz+TMqz7edX2UKGgGR0Blw1weeWfLaAdN6ANoCEdApM/uS6lLvnV9lChoBkdAbRefapPykWgHS9hoCEdApNAHN5dGAnV9lChoBkdAbrDO3UhFE2gHS9VoCEdApNJkCo0hvHV9lChoBkdAcOm9nK4hEGgHTQ4BaAhHQKTSseK8+Rp1fZQoaAZHQHHa7H+6y0NoB01QAWgIR0Ck00ti6QNkdX2UKGgGR0BwifZ13dKvaAdN8QJoCEdApNN+aYu01XV9lChoBkdAcQL1sLv1DmgHS8poCEdApNRShg3Lm3V9lChoBkdAOM+TeO4oZ2gHS8toCEdApNSQNgBtDXV9lChoBkdAbi2mJFb3XmgHS+5oCEdApNVrt1IRRXV9lChoBkdAcNXMXrMTvmgHS/doCEdApNYK7Xg9/3V9lChoBkdAbTZr4WUKRmgHS9NoCEdApNaj7yhBaHV9lChoBkdAbsyhq0tyxWgHS9hoCEdApNcAUxmCiHV9lChoBkdAZBVjQzDXOGgHTegDaAhHQKTXkV1wHZ91fZQoaAZHQHKuUXUH6dloB0v+aAhHQKTX7PhybQV1fZQoaAZHQG+JM6aLGaRoB039AWgIR0Ck2F3Wvr4WdX2UKGgGR0BvT+/N7jT8aAdNCgFoCEdApNjAkX1rZnV9lChoBkdAZBUvkBCD3GgHTegDaAhHQKTZZch1Tzd1fZQoaAZHQGL8qNQ0oBtoB03oA2gIR0Ck2dLFGXoldX2UKGgGR0BxVDF4s3AEaAdL1GgIR0Ck2f4qXnhbdX2UKGgGR0BusYN0/4ZdaAdL42gIR0Ck2skdmxt6dX2UKGgGR0BvpOCROk+HaAdL1GgIR0Ck2vDhDPWydX2UKGgGR0BvhRDzAeq8aAdL1mgIR0Ck2zomgJ1JdX2UKGgGR0Bg7kPJ7sv7aAdN6ANoCEdApNtQNTcZcnV9lChoBkdAcCteZof0VmgHS+loCEdApNzEnNPgvXV9lChoBkdAbo4DM/yGz2gHS9poCEdApN14/xDst3V9lChoBkdAcVnbWEsasWgHTWgCaAhHQKTecwPAfuF1fZQoaAZHQG7lbiqABktoB0vIaAhHQKTe4yJKraN1fZQoaAZHQG6BpvP1L8JoB0vkaAhHQKTff9R77bd1fZQoaAZHQHBVhm03OwBoB0v8aAhHQKTgFpYcNpd1fZQoaAZHQGI4hZyMkyFoB03oA2gIR0Ck4JLiVB2PdX2UKGgGR0BwIfZQHiWFaAdLz2gIR0Ck4LXHq/ucdX2UKGgGR0BxUvWjGkvcaAdL7WgIR0Ck4U33Hq/udX2UKGgGR0BvxyoAGSpzaAdL02gIR0Ck4Wd2HLzPdX2UKGgGR0Boq3k7wKBvaAdNQQFoCEdApOGCSidrf3V9lChoBkdAYspreIl+mWgHTegDaAhHQKThlr30wrV1fZQoaAZHQG8FLcbiqABoB0veaAhHQKTiAFj/dZd1fZQoaAZHQHBRXjyWiURoB00cAWgIR0Ck4g4287IUdX2UKGgGR0BwFJzp5eJIaAdL6GgIR0Ck4ia6J66bdX2UKGgGR0Byg2eSSvC/aAdL8WgIR0Ck4iQdjoZAdX2UKGgGR0BwkiiHqNZNaAdL82gIR0Ck42M4tHx0dX2UKGgGR0Bv2YBRyfcvaAdL6WgIR0Ck46VObiIddX2UKGgGR0ByfFcPe54GaAdL22gIR0Ck5DF2/zredX2UKGgGR0BvEHEjxCpnaAdL7GgIR0Ck5E2ycCo1dX2UKGgGR0Bvke6TW5H3aAdLyWgIR0Ck5NbQLNOedX2UKGgGR0BwJDFAE+xGaAdL22gIR0Ck5OVlf7aadX2UKGgGR0Bwe7Z13dKvaAdL7mgIR0Ck5Pi83++/dX2UKGgGR0BwbVqBVdX1aAdL1mgIR0Ck5eWmHgxbdX2UKGgGR0BwxO2SdOIqaAdL6GgIR0Ck5jgGSpzcdX2UKGgGR0Bwq+XhOxjbaAdL4WgIR0Ck5kKdYnv2dX2UKGgGR0BuDRa5f+juaAdNCAFoCEdApOZfZuhsZnVlLg=="}, "ep_success_buffer": {":type:": "<class 'collections.deque'>", ":serialized:": "gAWVIAAAAAAAAACMC2NvbGxlY3Rpb25zlIwFZGVxdWWUk5QpS2SGlFKULg=="}, "_n_updates": 690, "observation_space": {":type:": "<class 'gymnasium.spaces.box.Box'>", ":serialized:": "gAWVcAIAAAAAAACMFGd5bW5hc2l1bS5zcGFjZXMuYm94lIwDQm94lJOUKYGUfZQojAVkdHlwZZSMBW51bXB5lGgFk5SMAmY0lImIh5RSlChLA4wBPJROTk5K/////0r/////SwB0lGKMDWJvdW5kZWRfYmVsb3eUjBJudW1weS5jb3JlLm51bWVyaWOUjAtfZnJvbWJ1ZmZlcpSTlCiWCAAAAAAAAAABAQEBAQEBAZRoB4wCYjGUiYiHlFKUKEsDjAF8lE5OTkr/////Sv////9LAHSUYksIhZSMAUOUdJRSlIwNYm91bmRlZF9hYm92ZZRoECiWCAAAAAAAAAABAQEBAQEBAZRoFEsIhZRoGHSUUpSMBl9zaGFwZZRLCIWUjANsb3eUaBAoliAAAAAAAAAAAAC0wgAAtMIAAKDAAACgwNsPScAAAKDAAAAAgAAAAICUaApLCIWUaBh0lFKUjARoaWdolGgQKJYgAAAAAAAAAAAAtEIAALRCAACgQAAAoEDbD0lAAACgQAAAgD8AAIA/lGgKSwiFlGgYdJRSlIwIbG93X3JlcHKUjFtbLTkwLiAgICAgICAgLTkwLiAgICAgICAgIC01LiAgICAgICAgIC01LiAgICAgICAgIC0zLjE0MTU5MjcgIC01LgogIC0wLiAgICAgICAgIC0wLiAgICAgICBdlIwJaGlnaF9yZXBylIxTWzkwLiAgICAgICAgOTAuICAgICAgICAgNS4gICAgICAgICA1LiAgICAgICAgIDMuMTQxNTkyNyAgNS4KICAxLiAgICAgICAgIDEuICAgICAgIF2UjApfbnBfcmFuZG9tlE51Yi4=", "dtype": "float32", "bounded_below": "[ True True True True True True True True]", "bounded_above": "[ True True True True True True True True]", "_shape": [8], "low": "[-90. -90. -5. -5. -3.1415927 -5.\n -0. -0. ]", "high": "[90. 90. 5. 5. 3.1415927 5.\n 1. 1. ]", "low_repr": "[-90. -90. -5. -5. -3.1415927 -5.\n -0. -0. ]", "high_repr": "[90. 90. 5. 5. 3.1415927 5.\n 1. 1. ]", "_np_random": null}, "action_space": {":type:": "<class 'gymnasium.spaces.discrete.Discrete'>", ":serialized:": "gAWV1QAAAAAAAACMGWd5bW5hc2l1bS5zcGFjZXMuZGlzY3JldGWUjAhEaXNjcmV0ZZSTlCmBlH2UKIwBbpSMFW51bXB5LmNvcmUubXVsdGlhcnJheZSMBnNjYWxhcpSTlIwFbnVtcHmUjAVkdHlwZZSTlIwCaTiUiYiHlFKUKEsDjAE8lE5OTkr/////Sv////9LAHSUYkMIBAAAAAAAAACUhpRSlIwFc3RhcnSUaAhoDkMIAAAAAAAAAACUhpRSlIwGX3NoYXBllCloCmgOjApfbnBfcmFuZG9tlE51Yi4=", "n": "4", "start": "0", "_shape": [], "dtype": "int64", "_np_random": null}, "n_envs": 20, "n_steps": 2048, "gamma": 0.99, "gae_lambda": 0.95, "ent_coef": 0.0, "vf_coef": 0.5, "max_grad_norm": 0.5, "batch_size": 512, "n_epochs": 23, "clip_range": {":type:": "<class 'function'>", ":serialized:": "gAWVxQIAAAAAAACMF2Nsb3VkcGlja2xlLmNsb3VkcGlja2xllIwOX21ha2VfZnVuY3Rpb26Uk5QoaACMDV9idWlsdGluX3R5cGWUk5SMCENvZGVUeXBllIWUUpQoSwFLAEsASwFLAUsTQwSIAFMAlE6FlCmMAV+UhZSMSS91c3IvbG9jYWwvbGliL3B5dGhvbjMuMTAvZGlzdC1wYWNrYWdlcy9zdGFibGVfYmFzZWxpbmVzMy9jb21tb24vdXRpbHMucHmUjARmdW5jlEuDQwIEAZSMA3ZhbJSFlCl0lFKUfZQojAtfX3BhY2thZ2VfX5SMGHN0YWJsZV9iYXNlbGluZXMzLmNvbW1vbpSMCF9fbmFtZV9flIwec3RhYmxlX2Jhc2VsaW5lczMuY29tbW9uLnV0aWxzlIwIX19maWxlX1+UjEkvdXNyL2xvY2FsL2xpYi9weXRob24zLjEwL2Rpc3QtcGFja2FnZXMvc3RhYmxlX2Jhc2VsaW5lczMvY29tbW9uL3V0aWxzLnB5lHVOTmgAjBBfbWFrZV9lbXB0eV9jZWxslJOUKVKUhZR0lFKUjBxjbG91ZHBpY2tsZS5jbG91ZHBpY2tsZV9mYXN0lIwSX2Z1bmN0aW9uX3NldHN0YXRllJOUaB99lH2UKGgWaA2MDF9fcXVhbG5hbWVfX5SMGWNvbnN0YW50X2ZuLjxsb2NhbHM+LmZ1bmOUjA9fX2Fubm90YXRpb25zX1+UfZSMDl9fa3dkZWZhdWx0c19flE6MDF9fZGVmYXVsdHNfX5ROjApfX21vZHVsZV9flGgXjAdfX2RvY19flE6MC19fY2xvc3VyZV9flGgAjApfbWFrZV9jZWxslJOURz/JmZmZmZmahZRSlIWUjBdfY2xvdWRwaWNrbGVfc3VibW9kdWxlc5RdlIwLX19nbG9iYWxzX1+UfZR1hpSGUjAu"}, "clip_range_vf": null, "normalize_advantage": true, "target_kl": null, "lr_schedule": {":type:": "<class 'function'>", ":serialized:": "gAWVxQIAAAAAAACMF2Nsb3VkcGlja2xlLmNsb3VkcGlja2xllIwOX21ha2VfZnVuY3Rpb26Uk5QoaACMDV9idWlsdGluX3R5cGWUk5SMCENvZGVUeXBllIWUUpQoSwFLAEsASwFLAUsTQwSIAFMAlE6FlCmMAV+UhZSMSS91c3IvbG9jYWwvbGliL3B5dGhvbjMuMTAvZGlzdC1wYWNrYWdlcy9zdGFibGVfYmFzZWxpbmVzMy9jb21tb24vdXRpbHMucHmUjARmdW5jlEuDQwIEAZSMA3ZhbJSFlCl0lFKUfZQojAtfX3BhY2thZ2VfX5SMGHN0YWJsZV9iYXNlbGluZXMzLmNvbW1vbpSMCF9fbmFtZV9flIwec3RhYmxlX2Jhc2VsaW5lczMuY29tbW9uLnV0aWxzlIwIX19maWxlX1+UjEkvdXNyL2xvY2FsL2xpYi9weXRob24zLjEwL2Rpc3QtcGFja2FnZXMvc3RhYmxlX2Jhc2VsaW5lczMvY29tbW9uL3V0aWxzLnB5lHVOTmgAjBBfbWFrZV9lbXB0eV9jZWxslJOUKVKUhZR0lFKUjBxjbG91ZHBpY2tsZS5jbG91ZHBpY2tsZV9mYXN0lIwSX2Z1bmN0aW9uX3NldHN0YXRllJOUaB99lH2UKGgWaA2MDF9fcXVhbG5hbWVfX5SMGWNvbnN0YW50X2ZuLjxsb2NhbHM+LmZ1bmOUjA9fX2Fubm90YXRpb25zX1+UfZSMDl9fa3dkZWZhdWx0c19flE6MDF9fZGVmYXVsdHNfX5ROjApfX21vZHVsZV9flGgXjAdfX2RvY19flE6MC19fY2xvc3VyZV9flGgAjApfbWFrZV9jZWxslJOURz8zqSowVTJhhZRSlIWUjBdfY2xvdWRwaWNrbGVfc3VibW9kdWxlc5RdlIwLX19nbG9iYWxzX1+UfZR1hpSGUjAu"}, "system_info": {"OS": "Linux-5.15.109+-x86_64-with-glibc2.35 # 1 SMP Fri Jun 9 10:57:30 UTC 2023", "Python": "3.10.12", "Stable-Baselines3": "2.1.0", "PyTorch": "2.0.1+cu118", "GPU Enabled": "True", "Numpy": "1.23.5", "Cloudpickle": "2.2.1", "Gymnasium": "0.28.1", "OpenAI Gym": "0.25.2"}}
 
1
+ {"policy_class": {":type:": "<class 'abc.ABCMeta'>", ":serialized:": "gAWVOwAAAAAAAACMIXN0YWJsZV9iYXNlbGluZXMzLmNvbW1vbi5wb2xpY2llc5SMEUFjdG9yQ3JpdGljUG9saWN5lJOULg==", "__module__": "stable_baselines3.common.policies", "__doc__": "\n Policy class for actor-critic algorithms (has both policy and value prediction).\n Used by A2C, PPO and the likes.\n\n :param observation_space: Observation space\n :param action_space: Action space\n :param lr_schedule: Learning rate schedule (could be constant)\n :param net_arch: The specification of the policy and value networks.\n :param activation_fn: Activation function\n :param ortho_init: Whether to use or not orthogonal initialization\n :param use_sde: Whether to use State Dependent Exploration or not\n :param log_std_init: Initial value for the log standard deviation\n :param full_std: Whether to use (n_features x n_actions) parameters\n for the std instead of only (n_features,) when using gSDE\n :param use_expln: Use ``expln()`` function instead of ``exp()`` to ensure\n a positive standard deviation (cf paper). It allows to keep variance\n above zero and prevent it from growing too fast. In practice, ``exp()`` is usually enough.\n :param squash_output: Whether to squash the output using a tanh function,\n this allows to ensure boundaries when using gSDE.\n :param features_extractor_class: Features extractor to use.\n :param features_extractor_kwargs: Keyword arguments\n to pass to the features extractor.\n :param share_features_extractor: If True, the features extractor is shared between the policy and value networks.\n :param normalize_images: Whether to normalize images or not,\n dividing by 255.0 (True by default)\n :param optimizer_class: The optimizer to use,\n ``th.optim.Adam`` by default\n :param optimizer_kwargs: Additional keyword arguments,\n excluding the learning rate, to pass to the optimizer\n ", "__init__": "<function ActorCriticPolicy.__init__ at 0x000001630D2B2E80>", "_get_constructor_parameters": "<function ActorCriticPolicy._get_constructor_parameters at 0x000001630D2B2F20>", "reset_noise": "<function ActorCriticPolicy.reset_noise at 0x000001630D2B2FC0>", "_build_mlp_extractor": "<function ActorCriticPolicy._build_mlp_extractor at 0x000001630D2B3060>", "_build": "<function ActorCriticPolicy._build at 0x000001630D2B3100>", "forward": "<function ActorCriticPolicy.forward at 0x000001630D2B31A0>", "extract_features": "<function ActorCriticPolicy.extract_features at 0x000001630D2B3240>", "_get_action_dist_from_latent": "<function ActorCriticPolicy._get_action_dist_from_latent at 0x000001630D2B32E0>", "_predict": "<function ActorCriticPolicy._predict at 0x000001630D2B3380>", "evaluate_actions": "<function ActorCriticPolicy.evaluate_actions at 0x000001630D2B3420>", "get_distribution": "<function ActorCriticPolicy.get_distribution at 0x000001630D2B34C0>", "predict_values": "<function ActorCriticPolicy.predict_values at 0x000001630D2B3560>", "__abstractmethods__": "frozenset()", "_abc_impl": "<_abc._abc_data object at 0x000001630D2AA900>"}, "verbose": 1, "policy_kwargs": {}, "num_timesteps": 1015808, "_total_timesteps": 1000000, "_num_timesteps_at_start": 0, "seed": null, "action_noise": null, "start_time": 1693165098167503900, "learning_rate": 0.0003, "tensorboard_log": null, "_last_obs": {":type:": "<class 'numpy.ndarray'>", ":serialized:": "gAWVdQIAAAAAAACMEm51bXB5LmNvcmUubnVtZXJpY5SMC19mcm9tYnVmZmVylJOUKJYAAgAAAAAAAJp56Tu4pN27MFHSPYUb4L1BwYU83n0svgAAgD8AAIA/ZkQVPMMlJzk2VKC7J5Jdu3HhW7tPbDa9AAAAAAAAAADAVeA99kRMutZsvDvAmsm4j41xugGmwbcAAIA/AACAP+aCHL32DEW6VgFkunnp2DwZNCe6AgaruwAAgD8AAIA/zTTjPApbGDoOTr87distPKKo+jnYjAs5AAAAAAAAAACaJbo7PQYmOkXchrutpBY9BshkOi9vATwAAAAAAAAAAI19kr5+2Pc+fsFKPl+qp74RLBK9Gi8iPgAAAAAAAAAAzaYDPLjG1rnyFIo7ZgANvbC4TjsqtPe9AAAAAAAAgD9mlhy99rxzuubCgjm7Jog0P2+ZOi3xlLgAAIA/AACAPwBwxTvh6Ia6KLoYunFhCjZmWdm5bm4sOQAAgD8AAIA/MwD4vMMRGLpKx6G6/MbJtcWZOLutlLw5AACAPwAAgD8NGa69bSNCPt+TCT48I4q+ZyHZPHUeQb0AAAAAAAAAAK0gOL7YBf0+YFlYPsuvn76ugTQ92bsnPAAAAAAAAAAAM5trvDgzq7tZh5E8ZAqBPEUMGr1QMVw9AACAPwAAgD/NiKi7KVxNN0VDC7t6N/K8JBqoO82SVLsAAAAAAAAAAAAsL73sx+Y6ntkPuyKqmj1feA66av+huwAAAAAAAIA/lIwFbnVtcHmUjAVkdHlwZZSTlIwCZjSUiYiHlFKUKEsDjAE8lE5OTkr/////Sv////9LAHSUYksQSwiGlIwBQ5R0lFKULg=="}, "_last_episode_starts": {":type:": "<class 'numpy.ndarray'>", ":serialized:": "gAWVgwAAAAAAAACMEm51bXB5LmNvcmUubnVtZXJpY5SMC19mcm9tYnVmZmVylJOUKJYQAAAAAAAAAAAAAAAAAAAAAAAAAAAAAACUjAVudW1weZSMBWR0eXBllJOUjAJiMZSJiIeUUpQoSwOMAXyUTk5OSv////9K/////0sAdJRiSxCFlIwBQ5R0lFKULg=="}, "_last_original_obs": null, "_episode_num": 0, "use_sde": false, "sde_sample_freq": -1, "_current_progress_remaining": -0.015808000000000044, "_stats_window_size": 100, "ep_info_buffer": {":type:": "<class 'collections.deque'>", ":serialized:": "gAWVQQwAAAAAAACMC2NvbGxlY3Rpb25zlIwFZGVxdWWUk5QpS2SGlFKUKH2UKIwBcpRHQHFXCgf2boeMAWyUTQYBjAF0lEdAkktlJYkmhXV9lChoBkdAcFOiAlOXV2gHTQUBaAhHQJJLpsJpnHx1fZQoaAZHQHLaDBRAKOVoB0v6aAhHQJJLthttQ9B1fZQoaAZHQHGWJ44ZMtdoB01HAWgIR0CSS+XT3IuHdX2UKGgGR0BwaEHE/B3zaAdNBQFoCEdAkk0jtb9qDnV9lChoBkdAcPp3V09yLmgHS/xoCEdAkk0qXBxgiXV9lChoBkdAcqnmLcbiqGgHTT0BaAhHQJJOB6Tnq3V1fZQoaAZHQDwx15jYqXpoB0vgaAhHQJJP73QD3dt1fZQoaAZHQHD0Lz9S/CZoB00ZAWgIR0CSUIdJ8OTadX2UKGgGR0Bx2IoQWepXaAdNAQFoCEdAklIpH/cWTHV9lChoBkdAcI5Hh0hePmgHTRoBaAhHQJJSZawD/2l1fZQoaAZHQHH633YcvM9oB00vAWgIR0CSUp+Yc/+sdX2UKGgGR0BwxeYJE6T4aAdNIwFoCEdAklLYBzV+Z3V9lChoBkdAbKPiobXHzmgHTQ0BaAhHQJJTbsF+uvF1fZQoaAZHQHLZjbeuV5doB00BAWgIR0CSU7JUo8ZDdX2UKGgGR0BxUmT/yXlbaAdNDQFoCEdAklRE8A7xNXV9lChoBkdAbRk1Aqur62gHTQkBaAhHQJJUdKraM751fZQoaAZHQG1OpZW7vohoB00OAWgIR0CSVMyWAwwkdX2UKGgGR0BwD3FwT/Q0aAdNCgFoCEdAklXuI68xsXV9lChoBkdAcC+h9LHuJGgHTV4BaAhHQJJ9clPacqh1fZQoaAZHQG+3qNQ0oBtoB00NAWgIR0CShb1KGtZFdX2UKGgGR0BZR0n9ehPCaAdN6ANoCEdAkphSHARChXV9lChoBkdAUaB8iOearmgHTegDaAhHQJKquYUnG851fZQoaAZHQFu0IKc/dIpoB03oA2gIR0CSrK9DQZ4wdX2UKGgGR0BY7t6gM+eOaAdN6ANoCEdAkrFbQb+98XV9lChoBkdAWGrlq8DjimgHTegDaAhHQJKyuYfGMn91fZQoaAZHQFoYNzKcNH9oB03oA2gIR0CStkfO2RaHdX2UKGgGR0BgLsdJaq0daAdN6ANoCEdAkrbDxG2CunV9lChoBkdAWe6yZ8a4t2gHTegDaAhHQJK3SdlNDdB1fZQoaAZHQF8gMoMKCxxoB03oA2gIR0CSt7+d9UjtdX2UKGgGR0BRVkmhM8HOaAdN6ANoCEdAkrjvva11GXV9lChoBkdAV48yULUkOmgHTegDaAhHQJK5h1GLDQ91fZQoaAZHQF7kpMHryDtoB03oA2gIR0CSuruMdcSodX2UKGgGR0BUz6BI4EOiaAdN6ANoCEdAkrsh6nivPnV9lChoBkdAUGhbmlqJuWgHTegDaAhHQJK9sU9IPLB1fZQoaAZHQFHi55qubI9oB03oA2gIR0CSvvTsIE8rdX2UKGgGR0Beb3rhR64UaAdN6ANoCEdAkuwcbaRISXV9lChoBkdAX9I/1QIldGgHTegDaAhHQJL8y4b0e2d1fZQoaAZHQGDwMlC1JDpoB03oA2gIR0CTDRZOzposdX2UKGgGR0BSh8JUo8ZDaAdN6ANoCEdAkw6v4qPOp3V9lChoBkdAXvgyoGY8dWgHTegDaAhHQJMSoHv+fiB1fZQoaAZHQGF4ZFPSDyxoB03oA2gIR0CTE86Z6UqydX2UKGgGR0BbO/r4WUKRaAdN6ANoCEdAkxc4FA3T/nV9lChoBkdAXkYvsZ5zHWgHTegDaAhHQJMXsvqTr3V1fZQoaAZHQFgVHi3ocJdoB03oA2gIR0CTGCm7aqS6dX2UKGgGR0BeLpfhMrVfaAdN6ANoCEdAkxighwEQoXV9lChoBkdATmY+GGmDUWgHTegDaAhHQJMZ0Ka5PM11fZQoaAZHQGJNoj4YaYNoB03oA2gIR0CTGlfP5YYBdX2UKGgGR0BhUy8FpwjuaAdN6ANoCEdAkxtGcSXdCXV9lChoBkdAXLY/2TPjXGgHTegDaAhHQJMbif7Jnxt1fZQoaAZHQEbrT0g8r7RoB03oA2gIR0CTHUNXHR1HdX2UKGgGR0BVCrOiWVu8aAdN6ANoCEdAkx5+ws5GSnV9lChoBkdAWWB9YwIt2GgHTegDaAhHQJNLuKWLP2R1fZQoaAZHQGJopMpPRAtoB03oA2gIR0CTXIqQiiZfdX2UKGgGR0BcVyR8twrEaAdN6ANoCEdAk2w5soDxLHV9lChoBkdAWGyOOsDGLmgHTegDaAhHQJNtweS0Sh91fZQoaAZHQFazlFMIu5BoB03oA2gIR0CTca9tuUD/dX2UKGgGR0Ba1xUBGQS0aAdN6ANoCEdAk3LflZHNHHV9lChoBkdAWXK4LCvX9WgHTegDaAhHQJN1vcSGrS51fZQoaAZHQF/lV4X40uVoB03oA2gIR0CTdiU34sVddX2UKGgGR0Bi2ITCcf/4aAdN6ANoCEdAk3aGdiDujXV9lChoBkdAYRbJYkmhNGgHTegDaAhHQJN23ojfNzN1fZQoaAZHQFuCNX5nDixoB03oA2gIR0CTd6xcE/0NdX2UKGgGR0BTIsafjCHiaAdN6ANoCEdAk3gRw2l2vHV9lChoBkdAX5tjlPrOaGgHTegDaAhHQJN49AnlXBB1fZQoaAZHQFyzdfb9If9oB03oA2gIR0CTeT/I8yN5dX2UKGgGR0BelHEQ5FPSaAdN6ANoCEdAk3snPE87p3V9lChoBkdAYshtBOYYzmgHTegDaAhHQJN8/UDuBtl1fZQoaAZHQGAlExqO939oB03oA2gIR0CTqXU8FINFdX2UKGgGR0BhMjfxc3VDaAdN6ANoCEdAk7nQX2ugYnV9lChoBkdAYe/B1s+FDmgHTegDaAhHQJPHWptJnQJ1fZQoaAZHQGBO4SpR4yJoB03oA2gIR0CTyOLVnVXndX2UKGgGR0BhG2XgLqlhaAdN6ANoCEdAk8z3QD3dsXV9lChoBkdAYDZpeu3c6GgHTegDaAhHQJPN5/RVp9J1fZQoaAZHQGBdK2BreqJoB03oA2gIR0CT0Dvjfek6dX2UKGgGR0Bg2XRqoIfKaAdN6ANoCEdAk9CR8IAwPHV9lChoBkdAZpGWtU4rBmgHTegDaAhHQJPQ4cYIjW11fZQoaAZHQGF2HYQJ5VxoB03oA2gIR0CT0TCgsbvPdX2UKGgGR0BbnvgJkXk6aAdN6ANoCEdAk9Hq/IsAenV9lChoBkdAVeu9US7GvWgHTegDaAhHQJPSSkDZDiR1fZQoaAZHQGKFOlfqoqFoB03oA2gIR0CT0vdQwblzdX2UKGgGR0Bce+0G/vfCaAdN6ANoCEdAk9Mthy8zynV9lChoBkdAWudGrjo6jmgHTegDaAhHQJPUxhqj8DV1fZQoaAZHQGO/kqc3EQ5oB03oA2gIR0CT1hka/ATJdX2UKGgGR0BX75jYqXnhaAdN6ANoCEdAlANnscABDHV9lChoBkdAWY/2kBS1mmgHTegDaAhHQJQUEbaRISV1fZQoaAZHQGFDo8hcJMRoB03oA2gIR0CUI/cTrVvudX2UKGgGR0BvKFDF6zE8aAdNjQNoCEdAlCSSvX9R8HV9lChoBkdAYQHvYODraGgHTegDaAhHQJQlgExIre91fZQoaAZHQGM2G+sYEW9oB03oA2gIR0CUKXDgqEvkdX2UKGgGR0BU7gHNX5nEaAdN6ANoCEdAlC3lpTMq0HV9lChoBkdAYgOZJkGzKWgHTegDaAhHQJQuTh73PAx1fZQoaAZHQFUPtmL9/BpoB03oA2gIR0CULrJxNqQBdX2UKGgGR0BbQIH5aePJaAdN6ANoCEdAlC8RrJr+HnV9lChoBkdAXslGrjo6jmgHTegDaAhHQJQv9gmZ3LV1fZQoaAZHQFpWRFqi48VoB03oA2gIR0CUMGWluWKNdX2UKGgGR0BkWma4MF2WaAdN6ANoCEdAlDEzf779AHV9lChoBkdAXrodHUc4pGgHTegDaAhHQJQxdw5vLox1fZQoaAZHQFz2WdEsrd5oB03oA2gIR0CUM2SXt0FKdX2UKGgGR0BjucUbkwN9aAdN6ANoCEdAlDUa7NB4U3VlLg=="}, "ep_success_buffer": {":type:": "<class 'collections.deque'>", ":serialized:": "gAWVIAAAAAAAAACMC2NvbGxlY3Rpb25zlIwFZGVxdWWUk5QpS2SGlFKULg=="}, "_n_updates": 372, "observation_space": {":type:": "<class 'gymnasium.spaces.box.Box'>", ":serialized:": "gAWVdgIAAAAAAACMFGd5bW5hc2l1bS5zcGFjZXMuYm94lIwDQm94lJOUKYGUfZQojAVkdHlwZZSMBW51bXB5lIwFZHR5cGWUk5SMAmY0lImIh5RSlChLA4wBPJROTk5K/////0r/////SwB0lGKMDWJvdW5kZWRfYmVsb3eUjBJudW1weS5jb3JlLm51bWVyaWOUjAtfZnJvbWJ1ZmZlcpSTlCiWCAAAAAAAAAABAQEBAQEBAZRoCIwCYjGUiYiHlFKUKEsDjAF8lE5OTkr/////Sv////9LAHSUYksIhZSMAUOUdJRSlIwNYm91bmRlZF9hYm92ZZRoESiWCAAAAAAAAAABAQEBAQEBAZRoFUsIhZRoGXSUUpSMBl9zaGFwZZRLCIWUjANsb3eUaBEoliAAAAAAAAAAAAC0wgAAtMIAAKDAAACgwNsPScAAAKDAAAAAgAAAAICUaAtLCIWUaBl0lFKUjARoaWdolGgRKJYgAAAAAAAAAAAAtEIAALRCAACgQAAAoEDbD0lAAACgQAAAgD8AAIA/lGgLSwiFlGgZdJRSlIwIbG93X3JlcHKUjFtbLTkwLiAgICAgICAgLTkwLiAgICAgICAgIC01LiAgICAgICAgIC01LiAgICAgICAgIC0zLjE0MTU5MjcgIC01LgogIC0wLiAgICAgICAgIC0wLiAgICAgICBdlIwJaGlnaF9yZXBylIxTWzkwLiAgICAgICAgOTAuICAgICAgICAgNS4gICAgICAgICA1LiAgICAgICAgIDMuMTQxNTkyNyAgNS4KICAxLiAgICAgICAgIDEuICAgICAgIF2UjApfbnBfcmFuZG9tlE51Yi4=", "dtype": "float32", "bounded_below": "[ True True True True True True True True]", "bounded_above": "[ True True True True True True True True]", "_shape": [8], "low": "[-90. -90. -5. -5. -3.1415927 -5.\n -0. -0. ]", "high": "[90. 90. 5. 5. 3.1415927 5.\n 1. 1. ]", "low_repr": "[-90. -90. -5. -5. -3.1415927 -5.\n -0. -0. ]", "high_repr": "[90. 90. 5. 5. 3.1415927 5.\n 1. 1. ]", "_np_random": null}, "action_space": {":type:": "<class 'gymnasium.spaces.discrete.Discrete'>", ":serialized:": "gAWVnwEAAAAAAACMGWd5bW5hc2l1bS5zcGFjZXMuZGlzY3JldGWUjAhEaXNjcmV0ZZSTlCmBlH2UKIwBbpSMFW51bXB5LmNvcmUubXVsdGlhcnJheZSMBnNjYWxhcpSTlIwFbnVtcHmUjAVkdHlwZZSTlIwCaTiUiYiHlFKUKEsDjAE8lE5OTkr/////Sv////9LAHSUYkMIBAAAAAAAAACUhpRSlIwFc3RhcnSUaAhoDkMIAAAAAAAAAACUhpRSlIwGX3NoYXBllCmMBWR0eXBllGgOjApfbnBfcmFuZG9tlIwUbnVtcHkucmFuZG9tLl9waWNrbGWUjBBfX2dlbmVyYXRvcl9jdG9ylJOUjAVQQ0c2NJRoG4wUX19iaXRfZ2VuZXJhdG9yX2N0b3KUk5SGlFKUfZQojA1iaXRfZ2VuZXJhdG9ylIwFUENHNjSUjAVzdGF0ZZR9lChoJooQVWit40MD1/+RECJ/K8NKGIwDaW5jlIoRjS1pR1UecEBB1rNOLUJ72AB1jApoYXNfdWludDMylEsAjAh1aW50ZWdlcpRLAHVidWIu", "n": "4", "start": "0", "_shape": [], "dtype": "int64", "_np_random": "Generator(PCG64)"}, "n_envs": 16, "n_steps": 1024, "gamma": 0.999, "gae_lambda": 0.97, "ent_coef": 0.01, "vf_coef": 0.5, "max_grad_norm": 0.5, "batch_size": 64, "n_epochs": 6, "clip_range": {":type:": "<class 'function'>", ":serialized:": "gAWVlgIAAAAAAACMF2Nsb3VkcGlja2xlLmNsb3VkcGlja2xllIwOX21ha2VfZnVuY3Rpb26Uk5QoaACMDV9idWlsdGluX3R5cGWUk5SMCENvZGVUeXBllIWUUpQoSwFLAEsASwFLAUsTQwiVAZcAiQFTAJROhZQpjAFflIWUjFVjOlxVc2Vyc1xhZGl0eVxhbmFjb25kYTNcZW52c1xzYjNcTGliXHNpdGUtcGFja2FnZXNcc3RhYmxlX2Jhc2VsaW5lczNcY29tbW9uXHV0aWxzLnB5lIwEZnVuY5SMGWNvbnN0YW50X2ZuLjxsb2NhbHM+LmZ1bmOUS4NDCPiAANgPEogKlEMAlIwDdmFslIWUKXSUUpR9lCiMC19fcGFja2FnZV9flIwYc3RhYmxlX2Jhc2VsaW5lczMuY29tbW9ulIwIX19uYW1lX1+UjB5zdGFibGVfYmFzZWxpbmVzMy5jb21tb24udXRpbHOUjAhfX2ZpbGVfX5RoDHVOTmgAjBBfbWFrZV9lbXB0eV9jZWxslJOUKVKUhZR0lFKUjBxjbG91ZHBpY2tsZS5jbG91ZHBpY2tsZV9mYXN0lIwSX2Z1bmN0aW9uX3NldHN0YXRllJOUaCB9lH2UKGgYaA2MDF9fcXVhbG5hbWVfX5RoDowPX19hbm5vdGF0aW9uc19flH2UjA5fX2t3ZGVmYXVsdHNfX5ROjAxfX2RlZmF1bHRzX1+UTowKX19tb2R1bGVfX5RoGYwHX19kb2NfX5ROjAtfX2Nsb3N1cmVfX5RoAIwKX21ha2VfY2VsbJSTlEc/yZmZmZmZmoWUUpSFlIwXX2Nsb3VkcGlja2xlX3N1Ym1vZHVsZXOUXZSMC19fZ2xvYmFsc19flH2UdYaUhlIwLg=="}, "clip_range_vf": null, "normalize_advantage": true, "target_kl": null, "lr_schedule": {":type:": "<class 'function'>", ":serialized:": "gAWVlgIAAAAAAACMF2Nsb3VkcGlja2xlLmNsb3VkcGlja2xllIwOX21ha2VfZnVuY3Rpb26Uk5QoaACMDV9idWlsdGluX3R5cGWUk5SMCENvZGVUeXBllIWUUpQoSwFLAEsASwFLAUsTQwiVAZcAiQFTAJROhZQpjAFflIWUjFVjOlxVc2Vyc1xhZGl0eVxhbmFjb25kYTNcZW52c1xzYjNcTGliXHNpdGUtcGFja2FnZXNcc3RhYmxlX2Jhc2VsaW5lczNcY29tbW9uXHV0aWxzLnB5lIwEZnVuY5SMGWNvbnN0YW50X2ZuLjxsb2NhbHM+LmZ1bmOUS4NDCPiAANgPEogKlEMAlIwDdmFslIWUKXSUUpR9lCiMC19fcGFja2FnZV9flIwYc3RhYmxlX2Jhc2VsaW5lczMuY29tbW9ulIwIX19uYW1lX1+UjB5zdGFibGVfYmFzZWxpbmVzMy5jb21tb24udXRpbHOUjAhfX2ZpbGVfX5RoDHVOTmgAjBBfbWFrZV9lbXB0eV9jZWxslJOUKVKUhZR0lFKUjBxjbG91ZHBpY2tsZS5jbG91ZHBpY2tsZV9mYXN0lIwSX2Z1bmN0aW9uX3NldHN0YXRllJOUaCB9lH2UKGgYaA2MDF9fcXVhbG5hbWVfX5RoDowPX19hbm5vdGF0aW9uc19flH2UjA5fX2t3ZGVmYXVsdHNfX5ROjAxfX2RlZmF1bHRzX1+UTowKX19tb2R1bGVfX5RoGYwHX19kb2NfX5ROjAtfX2Nsb3N1cmVfX5RoAIwKX21ha2VfY2VsbJSTlEc/M6kqMFUyYYWUUpSFlIwXX2Nsb3VkcGlja2xlX3N1Ym1vZHVsZXOUXZSMC19fZ2xvYmFsc19flH2UdYaUhlIwLg=="}, "system_info": {"OS": "Windows-10-10.0.22621-SP0 10.0.22621", "Python": "3.11.4", "Stable-Baselines3": "2.1.0", "PyTorch": "2.0.1", "GPU Enabled": "True", "Numpy": "1.25.2", "Cloudpickle": "2.2.1", "Gymnasium": "0.28.1"}}
ppo-LunarLander-v2.zip ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:60feb7a67d0dd6fa568fa950d3439f57ba240f93635c0a0c4b5035514ccff908
3
+ size 146907
ppo-LunarLander-v2/_stable_baselines3_version ADDED
@@ -0,0 +1 @@
 
 
1
+ 2.1.0
ppo-LunarLander-v2/data ADDED
@@ -0,0 +1,99 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "policy_class": {
3
+ ":type:": "<class 'abc.ABCMeta'>",
4
+ ":serialized:": "gAWVOwAAAAAAAACMIXN0YWJsZV9iYXNlbGluZXMzLmNvbW1vbi5wb2xpY2llc5SMEUFjdG9yQ3JpdGljUG9saWN5lJOULg==",
5
+ "__module__": "stable_baselines3.common.policies",
6
+ "__doc__": "\n Policy class for actor-critic algorithms (has both policy and value prediction).\n Used by A2C, PPO and the likes.\n\n :param observation_space: Observation space\n :param action_space: Action space\n :param lr_schedule: Learning rate schedule (could be constant)\n :param net_arch: The specification of the policy and value networks.\n :param activation_fn: Activation function\n :param ortho_init: Whether to use or not orthogonal initialization\n :param use_sde: Whether to use State Dependent Exploration or not\n :param log_std_init: Initial value for the log standard deviation\n :param full_std: Whether to use (n_features x n_actions) parameters\n for the std instead of only (n_features,) when using gSDE\n :param use_expln: Use ``expln()`` function instead of ``exp()`` to ensure\n a positive standard deviation (cf paper). It allows to keep variance\n above zero and prevent it from growing too fast. In practice, ``exp()`` is usually enough.\n :param squash_output: Whether to squash the output using a tanh function,\n this allows to ensure boundaries when using gSDE.\n :param features_extractor_class: Features extractor to use.\n :param features_extractor_kwargs: Keyword arguments\n to pass to the features extractor.\n :param share_features_extractor: If True, the features extractor is shared between the policy and value networks.\n :param normalize_images: Whether to normalize images or not,\n dividing by 255.0 (True by default)\n :param optimizer_class: The optimizer to use,\n ``th.optim.Adam`` by default\n :param optimizer_kwargs: Additional keyword arguments,\n excluding the learning rate, to pass to the optimizer\n ",
7
+ "__init__": "<function ActorCriticPolicy.__init__ at 0x000001630D2B2E80>",
8
+ "_get_constructor_parameters": "<function ActorCriticPolicy._get_constructor_parameters at 0x000001630D2B2F20>",
9
+ "reset_noise": "<function ActorCriticPolicy.reset_noise at 0x000001630D2B2FC0>",
10
+ "_build_mlp_extractor": "<function ActorCriticPolicy._build_mlp_extractor at 0x000001630D2B3060>",
11
+ "_build": "<function ActorCriticPolicy._build at 0x000001630D2B3100>",
12
+ "forward": "<function ActorCriticPolicy.forward at 0x000001630D2B31A0>",
13
+ "extract_features": "<function ActorCriticPolicy.extract_features at 0x000001630D2B3240>",
14
+ "_get_action_dist_from_latent": "<function ActorCriticPolicy._get_action_dist_from_latent at 0x000001630D2B32E0>",
15
+ "_predict": "<function ActorCriticPolicy._predict at 0x000001630D2B3380>",
16
+ "evaluate_actions": "<function ActorCriticPolicy.evaluate_actions at 0x000001630D2B3420>",
17
+ "get_distribution": "<function ActorCriticPolicy.get_distribution at 0x000001630D2B34C0>",
18
+ "predict_values": "<function ActorCriticPolicy.predict_values at 0x000001630D2B3560>",
19
+ "__abstractmethods__": "frozenset()",
20
+ "_abc_impl": "<_abc._abc_data object at 0x000001630D2AA900>"
21
+ },
22
+ "verbose": 1,
23
+ "policy_kwargs": {},
24
+ "num_timesteps": 1015808,
25
+ "_total_timesteps": 1000000,
26
+ "_num_timesteps_at_start": 0,
27
+ "seed": null,
28
+ "action_noise": null,
29
+ "start_time": 1693165098167503900,
30
+ "learning_rate": 0.0003,
31
+ "tensorboard_log": null,
32
+ "_last_obs": {
33
+ ":type:": "<class 'numpy.ndarray'>",
34
+ ":serialized:": "gAWVdQIAAAAAAACMEm51bXB5LmNvcmUubnVtZXJpY5SMC19mcm9tYnVmZmVylJOUKJYAAgAAAAAAAJp56Tu4pN27MFHSPYUb4L1BwYU83n0svgAAgD8AAIA/ZkQVPMMlJzk2VKC7J5Jdu3HhW7tPbDa9AAAAAAAAAADAVeA99kRMutZsvDvAmsm4j41xugGmwbcAAIA/AACAP+aCHL32DEW6VgFkunnp2DwZNCe6AgaruwAAgD8AAIA/zTTjPApbGDoOTr87distPKKo+jnYjAs5AAAAAAAAAACaJbo7PQYmOkXchrutpBY9BshkOi9vATwAAAAAAAAAAI19kr5+2Pc+fsFKPl+qp74RLBK9Gi8iPgAAAAAAAAAAzaYDPLjG1rnyFIo7ZgANvbC4TjsqtPe9AAAAAAAAgD9mlhy99rxzuubCgjm7Jog0P2+ZOi3xlLgAAIA/AACAPwBwxTvh6Ia6KLoYunFhCjZmWdm5bm4sOQAAgD8AAIA/MwD4vMMRGLpKx6G6/MbJtcWZOLutlLw5AACAPwAAgD8NGa69bSNCPt+TCT48I4q+ZyHZPHUeQb0AAAAAAAAAAK0gOL7YBf0+YFlYPsuvn76ugTQ92bsnPAAAAAAAAAAAM5trvDgzq7tZh5E8ZAqBPEUMGr1QMVw9AACAPwAAgD/NiKi7KVxNN0VDC7t6N/K8JBqoO82SVLsAAAAAAAAAAAAsL73sx+Y6ntkPuyKqmj1feA66av+huwAAAAAAAIA/lIwFbnVtcHmUjAVkdHlwZZSTlIwCZjSUiYiHlFKUKEsDjAE8lE5OTkr/////Sv////9LAHSUYksQSwiGlIwBQ5R0lFKULg=="
35
+ },
36
+ "_last_episode_starts": {
37
+ ":type:": "<class 'numpy.ndarray'>",
38
+ ":serialized:": "gAWVgwAAAAAAAACMEm51bXB5LmNvcmUubnVtZXJpY5SMC19mcm9tYnVmZmVylJOUKJYQAAAAAAAAAAAAAAAAAAAAAAAAAAAAAACUjAVudW1weZSMBWR0eXBllJOUjAJiMZSJiIeUUpQoSwOMAXyUTk5OSv////9K/////0sAdJRiSxCFlIwBQ5R0lFKULg=="
39
+ },
40
+ "_last_original_obs": null,
41
+ "_episode_num": 0,
42
+ "use_sde": false,
43
+ "sde_sample_freq": -1,
44
+ "_current_progress_remaining": -0.015808000000000044,
45
+ "_stats_window_size": 100,
46
+ "ep_info_buffer": {
47
+ ":type:": "<class 'collections.deque'>",
48
+ ":serialized:": "gAWVQQwAAAAAAACMC2NvbGxlY3Rpb25zlIwFZGVxdWWUk5QpS2SGlFKUKH2UKIwBcpRHQHFXCgf2boeMAWyUTQYBjAF0lEdAkktlJYkmhXV9lChoBkdAcFOiAlOXV2gHTQUBaAhHQJJLpsJpnHx1fZQoaAZHQHLaDBRAKOVoB0v6aAhHQJJLthttQ9B1fZQoaAZHQHGWJ44ZMtdoB01HAWgIR0CSS+XT3IuHdX2UKGgGR0BwaEHE/B3zaAdNBQFoCEdAkk0jtb9qDnV9lChoBkdAcPp3V09yLmgHS/xoCEdAkk0qXBxgiXV9lChoBkdAcqnmLcbiqGgHTT0BaAhHQJJOB6Tnq3V1fZQoaAZHQDwx15jYqXpoB0vgaAhHQJJP73QD3dt1fZQoaAZHQHD0Lz9S/CZoB00ZAWgIR0CSUIdJ8OTadX2UKGgGR0Bx2IoQWepXaAdNAQFoCEdAklIpH/cWTHV9lChoBkdAcI5Hh0hePmgHTRoBaAhHQJJSZawD/2l1fZQoaAZHQHH633YcvM9oB00vAWgIR0CSUp+Yc/+sdX2UKGgGR0BwxeYJE6T4aAdNIwFoCEdAklLYBzV+Z3V9lChoBkdAbKPiobXHzmgHTQ0BaAhHQJJTbsF+uvF1fZQoaAZHQHLZjbeuV5doB00BAWgIR0CSU7JUo8ZDdX2UKGgGR0BxUmT/yXlbaAdNDQFoCEdAklRE8A7xNXV9lChoBkdAbRk1Aqur62gHTQkBaAhHQJJUdKraM751fZQoaAZHQG1OpZW7vohoB00OAWgIR0CSVMyWAwwkdX2UKGgGR0BwD3FwT/Q0aAdNCgFoCEdAklXuI68xsXV9lChoBkdAcC+h9LHuJGgHTV4BaAhHQJJ9clPacqh1fZQoaAZHQG+3qNQ0oBtoB00NAWgIR0CShb1KGtZFdX2UKGgGR0BZR0n9ehPCaAdN6ANoCEdAkphSHARChXV9lChoBkdAUaB8iOearmgHTegDaAhHQJKquYUnG851fZQoaAZHQFu0IKc/dIpoB03oA2gIR0CSrK9DQZ4wdX2UKGgGR0BY7t6gM+eOaAdN6ANoCEdAkrFbQb+98XV9lChoBkdAWGrlq8DjimgHTegDaAhHQJKyuYfGMn91fZQoaAZHQFoYNzKcNH9oB03oA2gIR0CStkfO2RaHdX2UKGgGR0BgLsdJaq0daAdN6ANoCEdAkrbDxG2CunV9lChoBkdAWe6yZ8a4t2gHTegDaAhHQJK3SdlNDdB1fZQoaAZHQF8gMoMKCxxoB03oA2gIR0CSt7+d9UjtdX2UKGgGR0BRVkmhM8HOaAdN6ANoCEdAkrjvva11GXV9lChoBkdAV48yULUkOmgHTegDaAhHQJK5h1GLDQ91fZQoaAZHQF7kpMHryDtoB03oA2gIR0CSuruMdcSodX2UKGgGR0BUz6BI4EOiaAdN6ANoCEdAkrsh6nivPnV9lChoBkdAUGhbmlqJuWgHTegDaAhHQJK9sU9IPLB1fZQoaAZHQFHi55qubI9oB03oA2gIR0CSvvTsIE8rdX2UKGgGR0Beb3rhR64UaAdN6ANoCEdAkuwcbaRISXV9lChoBkdAX9I/1QIldGgHTegDaAhHQJL8y4b0e2d1fZQoaAZHQGDwMlC1JDpoB03oA2gIR0CTDRZOzposdX2UKGgGR0BSh8JUo8ZDaAdN6ANoCEdAkw6v4qPOp3V9lChoBkdAXvgyoGY8dWgHTegDaAhHQJMSoHv+fiB1fZQoaAZHQGF4ZFPSDyxoB03oA2gIR0CTE86Z6UqydX2UKGgGR0BbO/r4WUKRaAdN6ANoCEdAkxc4FA3T/nV9lChoBkdAXkYvsZ5zHWgHTegDaAhHQJMXsvqTr3V1fZQoaAZHQFgVHi3ocJdoB03oA2gIR0CTGCm7aqS6dX2UKGgGR0BeLpfhMrVfaAdN6ANoCEdAkxighwEQoXV9lChoBkdATmY+GGmDUWgHTegDaAhHQJMZ0Ka5PM11fZQoaAZHQGJNoj4YaYNoB03oA2gIR0CTGlfP5YYBdX2UKGgGR0BhUy8FpwjuaAdN6ANoCEdAkxtGcSXdCXV9lChoBkdAXLY/2TPjXGgHTegDaAhHQJMbif7Jnxt1fZQoaAZHQEbrT0g8r7RoB03oA2gIR0CTHUNXHR1HdX2UKGgGR0BVCrOiWVu8aAdN6ANoCEdAkx5+ws5GSnV9lChoBkdAWWB9YwIt2GgHTegDaAhHQJNLuKWLP2R1fZQoaAZHQGJopMpPRAtoB03oA2gIR0CTXIqQiiZfdX2UKGgGR0BcVyR8twrEaAdN6ANoCEdAk2w5soDxLHV9lChoBkdAWGyOOsDGLmgHTegDaAhHQJNtweS0Sh91fZQoaAZHQFazlFMIu5BoB03oA2gIR0CTca9tuUD/dX2UKGgGR0Ba1xUBGQS0aAdN6ANoCEdAk3LflZHNHHV9lChoBkdAWXK4LCvX9WgHTegDaAhHQJN1vcSGrS51fZQoaAZHQF/lV4X40uVoB03oA2gIR0CTdiU34sVddX2UKGgGR0Bi2ITCcf/4aAdN6ANoCEdAk3aGdiDujXV9lChoBkdAYRbJYkmhNGgHTegDaAhHQJN23ojfNzN1fZQoaAZHQFuCNX5nDixoB03oA2gIR0CTd6xcE/0NdX2UKGgGR0BTIsafjCHiaAdN6ANoCEdAk3gRw2l2vHV9lChoBkdAX5tjlPrOaGgHTegDaAhHQJN49AnlXBB1fZQoaAZHQFyzdfb9If9oB03oA2gIR0CTeT/I8yN5dX2UKGgGR0BelHEQ5FPSaAdN6ANoCEdAk3snPE87p3V9lChoBkdAYshtBOYYzmgHTegDaAhHQJN8/UDuBtl1fZQoaAZHQGAlExqO939oB03oA2gIR0CTqXU8FINFdX2UKGgGR0BhMjfxc3VDaAdN6ANoCEdAk7nQX2ugYnV9lChoBkdAYe/B1s+FDmgHTegDaAhHQJPHWptJnQJ1fZQoaAZHQGBO4SpR4yJoB03oA2gIR0CTyOLVnVXndX2UKGgGR0BhG2XgLqlhaAdN6ANoCEdAk8z3QD3dsXV9lChoBkdAYDZpeu3c6GgHTegDaAhHQJPN5/RVp9J1fZQoaAZHQGBdK2BreqJoB03oA2gIR0CT0Dvjfek6dX2UKGgGR0Bg2XRqoIfKaAdN6ANoCEdAk9CR8IAwPHV9lChoBkdAZpGWtU4rBmgHTegDaAhHQJPQ4cYIjW11fZQoaAZHQGF2HYQJ5VxoB03oA2gIR0CT0TCgsbvPdX2UKGgGR0BbnvgJkXk6aAdN6ANoCEdAk9Hq/IsAenV9lChoBkdAVeu9US7GvWgHTegDaAhHQJPSSkDZDiR1fZQoaAZHQGKFOlfqoqFoB03oA2gIR0CT0vdQwblzdX2UKGgGR0Bce+0G/vfCaAdN6ANoCEdAk9Mthy8zynV9lChoBkdAWudGrjo6jmgHTegDaAhHQJPUxhqj8DV1fZQoaAZHQGO/kqc3EQ5oB03oA2gIR0CT1hka/ATJdX2UKGgGR0BX75jYqXnhaAdN6ANoCEdAlANnscABDHV9lChoBkdAWY/2kBS1mmgHTegDaAhHQJQUEbaRISV1fZQoaAZHQGFDo8hcJMRoB03oA2gIR0CUI/cTrVvudX2UKGgGR0BvKFDF6zE8aAdNjQNoCEdAlCSSvX9R8HV9lChoBkdAYQHvYODraGgHTegDaAhHQJQlgExIre91fZQoaAZHQGM2G+sYEW9oB03oA2gIR0CUKXDgqEvkdX2UKGgGR0BU7gHNX5nEaAdN6ANoCEdAlC3lpTMq0HV9lChoBkdAYgOZJkGzKWgHTegDaAhHQJQuTh73PAx1fZQoaAZHQFUPtmL9/BpoB03oA2gIR0CULrJxNqQBdX2UKGgGR0BbQIH5aePJaAdN6ANoCEdAlC8RrJr+HnV9lChoBkdAXslGrjo6jmgHTegDaAhHQJQv9gmZ3LV1fZQoaAZHQFpWRFqi48VoB03oA2gIR0CUMGWluWKNdX2UKGgGR0BkWma4MF2WaAdN6ANoCEdAlDEzf779AHV9lChoBkdAXrodHUc4pGgHTegDaAhHQJQxdw5vLox1fZQoaAZHQFz2WdEsrd5oB03oA2gIR0CUM2SXt0FKdX2UKGgGR0BjucUbkwN9aAdN6ANoCEdAlDUa7NB4U3VlLg=="
49
+ },
50
+ "ep_success_buffer": {
51
+ ":type:": "<class 'collections.deque'>",
52
+ ":serialized:": "gAWVIAAAAAAAAACMC2NvbGxlY3Rpb25zlIwFZGVxdWWUk5QpS2SGlFKULg=="
53
+ },
54
+ "_n_updates": 372,
55
+ "observation_space": {
56
+ ":type:": "<class 'gymnasium.spaces.box.Box'>",
57
+ ":serialized:": "gAWVdgIAAAAAAACMFGd5bW5hc2l1bS5zcGFjZXMuYm94lIwDQm94lJOUKYGUfZQojAVkdHlwZZSMBW51bXB5lIwFZHR5cGWUk5SMAmY0lImIh5RSlChLA4wBPJROTk5K/////0r/////SwB0lGKMDWJvdW5kZWRfYmVsb3eUjBJudW1weS5jb3JlLm51bWVyaWOUjAtfZnJvbWJ1ZmZlcpSTlCiWCAAAAAAAAAABAQEBAQEBAZRoCIwCYjGUiYiHlFKUKEsDjAF8lE5OTkr/////Sv////9LAHSUYksIhZSMAUOUdJRSlIwNYm91bmRlZF9hYm92ZZRoESiWCAAAAAAAAAABAQEBAQEBAZRoFUsIhZRoGXSUUpSMBl9zaGFwZZRLCIWUjANsb3eUaBEoliAAAAAAAAAAAAC0wgAAtMIAAKDAAACgwNsPScAAAKDAAAAAgAAAAICUaAtLCIWUaBl0lFKUjARoaWdolGgRKJYgAAAAAAAAAAAAtEIAALRCAACgQAAAoEDbD0lAAACgQAAAgD8AAIA/lGgLSwiFlGgZdJRSlIwIbG93X3JlcHKUjFtbLTkwLiAgICAgICAgLTkwLiAgICAgICAgIC01LiAgICAgICAgIC01LiAgICAgICAgIC0zLjE0MTU5MjcgIC01LgogIC0wLiAgICAgICAgIC0wLiAgICAgICBdlIwJaGlnaF9yZXBylIxTWzkwLiAgICAgICAgOTAuICAgICAgICAgNS4gICAgICAgICA1LiAgICAgICAgIDMuMTQxNTkyNyAgNS4KICAxLiAgICAgICAgIDEuICAgICAgIF2UjApfbnBfcmFuZG9tlE51Yi4=",
58
+ "dtype": "float32",
59
+ "bounded_below": "[ True True True True True True True True]",
60
+ "bounded_above": "[ True True True True True True True True]",
61
+ "_shape": [
62
+ 8
63
+ ],
64
+ "low": "[-90. -90. -5. -5. -3.1415927 -5.\n -0. -0. ]",
65
+ "high": "[90. 90. 5. 5. 3.1415927 5.\n 1. 1. ]",
66
+ "low_repr": "[-90. -90. -5. -5. -3.1415927 -5.\n -0. -0. ]",
67
+ "high_repr": "[90. 90. 5. 5. 3.1415927 5.\n 1. 1. ]",
68
+ "_np_random": null
69
+ },
70
+ "action_space": {
71
+ ":type:": "<class 'gymnasium.spaces.discrete.Discrete'>",
72
+ ":serialized:": "gAWVnwEAAAAAAACMGWd5bW5hc2l1bS5zcGFjZXMuZGlzY3JldGWUjAhEaXNjcmV0ZZSTlCmBlH2UKIwBbpSMFW51bXB5LmNvcmUubXVsdGlhcnJheZSMBnNjYWxhcpSTlIwFbnVtcHmUjAVkdHlwZZSTlIwCaTiUiYiHlFKUKEsDjAE8lE5OTkr/////Sv////9LAHSUYkMIBAAAAAAAAACUhpRSlIwFc3RhcnSUaAhoDkMIAAAAAAAAAACUhpRSlIwGX3NoYXBllCmMBWR0eXBllGgOjApfbnBfcmFuZG9tlIwUbnVtcHkucmFuZG9tLl9waWNrbGWUjBBfX2dlbmVyYXRvcl9jdG9ylJOUjAVQQ0c2NJRoG4wUX19iaXRfZ2VuZXJhdG9yX2N0b3KUk5SGlFKUfZQojA1iaXRfZ2VuZXJhdG9ylIwFUENHNjSUjAVzdGF0ZZR9lChoJooQVWit40MD1/+RECJ/K8NKGIwDaW5jlIoRjS1pR1UecEBB1rNOLUJ72AB1jApoYXNfdWludDMylEsAjAh1aW50ZWdlcpRLAHVidWIu",
73
+ "n": "4",
74
+ "start": "0",
75
+ "_shape": [],
76
+ "dtype": "int64",
77
+ "_np_random": "Generator(PCG64)"
78
+ },
79
+ "n_envs": 16,
80
+ "n_steps": 1024,
81
+ "gamma": 0.999,
82
+ "gae_lambda": 0.97,
83
+ "ent_coef": 0.01,
84
+ "vf_coef": 0.5,
85
+ "max_grad_norm": 0.5,
86
+ "batch_size": 64,
87
+ "n_epochs": 6,
88
+ "clip_range": {
89
+ ":type:": "<class 'function'>",
90
+ ":serialized:": "gAWVlgIAAAAAAACMF2Nsb3VkcGlja2xlLmNsb3VkcGlja2xllIwOX21ha2VfZnVuY3Rpb26Uk5QoaACMDV9idWlsdGluX3R5cGWUk5SMCENvZGVUeXBllIWUUpQoSwFLAEsASwFLAUsTQwiVAZcAiQFTAJROhZQpjAFflIWUjFVjOlxVc2Vyc1xhZGl0eVxhbmFjb25kYTNcZW52c1xzYjNcTGliXHNpdGUtcGFja2FnZXNcc3RhYmxlX2Jhc2VsaW5lczNcY29tbW9uXHV0aWxzLnB5lIwEZnVuY5SMGWNvbnN0YW50X2ZuLjxsb2NhbHM+LmZ1bmOUS4NDCPiAANgPEogKlEMAlIwDdmFslIWUKXSUUpR9lCiMC19fcGFja2FnZV9flIwYc3RhYmxlX2Jhc2VsaW5lczMuY29tbW9ulIwIX19uYW1lX1+UjB5zdGFibGVfYmFzZWxpbmVzMy5jb21tb24udXRpbHOUjAhfX2ZpbGVfX5RoDHVOTmgAjBBfbWFrZV9lbXB0eV9jZWxslJOUKVKUhZR0lFKUjBxjbG91ZHBpY2tsZS5jbG91ZHBpY2tsZV9mYXN0lIwSX2Z1bmN0aW9uX3NldHN0YXRllJOUaCB9lH2UKGgYaA2MDF9fcXVhbG5hbWVfX5RoDowPX19hbm5vdGF0aW9uc19flH2UjA5fX2t3ZGVmYXVsdHNfX5ROjAxfX2RlZmF1bHRzX1+UTowKX19tb2R1bGVfX5RoGYwHX19kb2NfX5ROjAtfX2Nsb3N1cmVfX5RoAIwKX21ha2VfY2VsbJSTlEc/yZmZmZmZmoWUUpSFlIwXX2Nsb3VkcGlja2xlX3N1Ym1vZHVsZXOUXZSMC19fZ2xvYmFsc19flH2UdYaUhlIwLg=="
91
+ },
92
+ "clip_range_vf": null,
93
+ "normalize_advantage": true,
94
+ "target_kl": null,
95
+ "lr_schedule": {
96
+ ":type:": "<class 'function'>",
97
+ ":serialized:": "gAWVlgIAAAAAAACMF2Nsb3VkcGlja2xlLmNsb3VkcGlja2xllIwOX21ha2VfZnVuY3Rpb26Uk5QoaACMDV9idWlsdGluX3R5cGWUk5SMCENvZGVUeXBllIWUUpQoSwFLAEsASwFLAUsTQwiVAZcAiQFTAJROhZQpjAFflIWUjFVjOlxVc2Vyc1xhZGl0eVxhbmFjb25kYTNcZW52c1xzYjNcTGliXHNpdGUtcGFja2FnZXNcc3RhYmxlX2Jhc2VsaW5lczNcY29tbW9uXHV0aWxzLnB5lIwEZnVuY5SMGWNvbnN0YW50X2ZuLjxsb2NhbHM+LmZ1bmOUS4NDCPiAANgPEogKlEMAlIwDdmFslIWUKXSUUpR9lCiMC19fcGFja2FnZV9flIwYc3RhYmxlX2Jhc2VsaW5lczMuY29tbW9ulIwIX19uYW1lX1+UjB5zdGFibGVfYmFzZWxpbmVzMy5jb21tb24udXRpbHOUjAhfX2ZpbGVfX5RoDHVOTmgAjBBfbWFrZV9lbXB0eV9jZWxslJOUKVKUhZR0lFKUjBxjbG91ZHBpY2tsZS5jbG91ZHBpY2tsZV9mYXN0lIwSX2Z1bmN0aW9uX3NldHN0YXRllJOUaCB9lH2UKGgYaA2MDF9fcXVhbG5hbWVfX5RoDowPX19hbm5vdGF0aW9uc19flH2UjA5fX2t3ZGVmYXVsdHNfX5ROjAxfX2RlZmF1bHRzX1+UTowKX19tb2R1bGVfX5RoGYwHX19kb2NfX5ROjAtfX2Nsb3N1cmVfX5RoAIwKX21ha2VfY2VsbJSTlEc/M6kqMFUyYYWUUpSFlIwXX2Nsb3VkcGlja2xlX3N1Ym1vZHVsZXOUXZSMC19fZ2xvYmFsc19flH2UdYaUhlIwLg=="
98
+ }
99
+ }
ppo-LunarLander-v2/policy.optimizer.pth ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ee800822a694302fc6a217ef185e231b8286881414b18eebe244c4e435f4a72b
3
+ size 87929
ppo-LunarLander-v2/policy.pth ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:434f18f8816f8997936f66dea4c9050235e001ce1bbea9c5b67f87accbbc1bdd
3
+ size 43329
ppo-LunarLander-v2/pytorch_variables.pth ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d030ad8db708280fcae77d87e973102039acd23a11bdecc3db8eb6c0ac940ee1
3
+ size 431
ppo-LunarLander-v2/system_info.txt ADDED
@@ -0,0 +1,8 @@
 
 
 
 
 
 
 
 
 
1
+ - OS: Windows-10-10.0.22621-SP0 10.0.22621
2
+ - Python: 3.11.4
3
+ - Stable-Baselines3: 2.1.0
4
+ - PyTorch: 2.0.1
5
+ - GPU Enabled: True
6
+ - Numpy: 1.25.2
7
+ - Cloudpickle: 2.2.1
8
+ - Gymnasium: 0.28.1
results.json CHANGED
@@ -1 +1 @@
1
- {"mean_reward": 216.83668219999998, "std_reward": 99.52550730969489, "is_deterministic": true, "n_eval_episodes": 10, "eval_datetime": "2023-08-27T15:30:44.260900"}
 
1
+ {"mean_reward": 266.46527890000004, "std_reward": 20.495153794780187, "is_deterministic": true, "n_eval_episodes": 10, "eval_datetime": "2023-08-27T16:03:46.620705"}