fredchung committed on
Commit
db40e5f
·
1 Parent(s): 583008f

Increased epochs led to an increase in mean reward.

Browse files
README.md CHANGED
@@ -16,7 +16,7 @@ model-index:
16
  type: LunarLander-v2
17
  metrics:
18
  - type: mean_reward
19
- value: 268.09 +/- 20.94
20
  name: mean_reward
21
  verified: false
22
  ---
 
16
  type: LunarLander-v2
17
  metrics:
18
  - type: mean_reward
19
+ value: 277.86 +/- 11.59
20
  name: mean_reward
21
  verified: false
22
  ---
config.json CHANGED
@@ -1 +1 @@
1
- {"policy_class": {":type:": "<class 'abc.ABCMeta'>", ":serialized:": "gAWVOwAAAAAAAACMIXN0YWJsZV9iYXNlbGluZXMzLmNvbW1vbi5wb2xpY2llc5SMEUFjdG9yQ3JpdGljUG9saWN5lJOULg==", "__module__": "stable_baselines3.common.policies", "__doc__": "\n Policy class for actor-critic algorithms (has both policy and value prediction).\n Used by A2C, PPO and the likes.\n\n :param observation_space: Observation space\n :param action_space: Action space\n :param lr_schedule: Learning rate schedule (could be constant)\n :param net_arch: The specification of the policy and value networks.\n :param activation_fn: Activation function\n :param ortho_init: Whether to use or not orthogonal initialization\n :param use_sde: Whether to use State Dependent Exploration or not\n :param log_std_init: Initial value for the log standard deviation\n :param full_std: Whether to use (n_features x n_actions) parameters\n for the std instead of only (n_features,) when using gSDE\n :param use_expln: Use ``expln()`` function instead of ``exp()`` to ensure\n a positive standard deviation (cf paper). It allows to keep variance\n above zero and prevent it from growing too fast. 
In practice, ``exp()`` is usually enough.\n :param squash_output: Whether to squash the output using a tanh function,\n this allows to ensure boundaries when using gSDE.\n :param features_extractor_class: Features extractor to use.\n :param features_extractor_kwargs: Keyword arguments\n to pass to the features extractor.\n :param share_features_extractor: If True, the features extractor is shared between the policy and value networks.\n :param normalize_images: Whether to normalize images or not,\n dividing by 255.0 (True by default)\n :param optimizer_class: The optimizer to use,\n ``th.optim.Adam`` by default\n :param optimizer_kwargs: Additional keyword arguments,\n excluding the learning rate, to pass to the optimizer\n ", "__init__": "<function ActorCriticPolicy.__init__ at 0x7b29f4fcd990>", "_get_constructor_parameters": "<function ActorCriticPolicy._get_constructor_parameters at 0x7b29f4fcda20>", "reset_noise": "<function ActorCriticPolicy.reset_noise at 0x7b29f4fcdab0>", "_build_mlp_extractor": "<function ActorCriticPolicy._build_mlp_extractor at 0x7b29f4fcdb40>", "_build": "<function ActorCriticPolicy._build at 0x7b29f4fcdbd0>", "forward": "<function ActorCriticPolicy.forward at 0x7b29f4fcdc60>", "extract_features": "<function ActorCriticPolicy.extract_features at 0x7b29f4fcdcf0>", "_get_action_dist_from_latent": "<function ActorCriticPolicy._get_action_dist_from_latent at 0x7b29f4fcdd80>", "_predict": "<function ActorCriticPolicy._predict at 0x7b29f4fcde10>", "evaluate_actions": "<function ActorCriticPolicy.evaluate_actions at 0x7b29f4fcdea0>", "get_distribution": "<function ActorCriticPolicy.get_distribution at 0x7b29f4fcdf30>", "predict_values": "<function ActorCriticPolicy.predict_values at 0x7b29f4fcdfc0>", "__abstractmethods__": "frozenset()", "_abc_impl": "<_abc._abc_data object at 0x7b29f5167380>"}, "verbose": 1, "policy_kwargs": {}, "num_timesteps": 1015808, "_total_timesteps": 1000000, "_num_timesteps_at_start": 0, "seed": null, "action_noise": 
null, "start_time": 1695506330784314652, "learning_rate": 0.0003, "tensorboard_log": null, "_last_obs": {":type:": "<class 'numpy.ndarray'>", ":serialized:": "gAWVdQIAAAAAAACMEm51bXB5LmNvcmUubnVtZXJpY5SMC19mcm9tYnVmZmVylJOUKJYAAgAAAAAAAGYkd7zDCTu6vkiFtrY9N7IzR2U7ZridNQAAgD8AAIA/ZvaeO49iJrpopHM6CmqjNe/bgTt+5I25AACAPwAAgD+aEbe8FCyWusvC6brRqva1kWiyuSEUBzoAAIA/AACAP80rS70Uzr248yTeupY9NrZJiTS6f1IDOgAAgD8AAIA/ZlHHPK5LkrrsNCQ4Ri6OMyMFBzs7hju3AACAPwAAgD/NlzC9FJiEuigc8rutwSM4+K9EO7FXFbcAAIA/AACAPwBXST17IIa6zsCMufLMJLWdlg47erKfOAAAgD8AAIA/AOxivMOhdbrFPcy6x0lYtuI9kzo2T+k5AACAPwAAgD9mPg67nbysPyxgOrw7Or2+aI+oPFVqbzsAAAAAAAAAALPkJ71IG5+61ZPiumSv+rUJjus3coMCOgAAgD8AAIA/gDUPvVx7A7rLEG03dR3FMja6izq/HIq2AACAPwAAgD/NOKK9FCyfuuy4AThzusgyTTMTuIb2FLcAAIA/AACAP2ZGgTwIOaC8zXHfOjeDET3gLRG+8JXfPQAAgD8AAIA/zZIGvPZUabqcKKa6bD0dNZINljuTK5W0AACAPwAAgD/m1OQ9oeuWvG73Hr7bRpK9mDPTPa6JwT4AAIA/AACAP00VTD0pXGm6Ku9IuS93wjPGpCi7ogJmOAAAgD8AAIA/lIwFbnVtcHmUjAVkdHlwZZSTlIwCZjSUiYiHlFKUKEsDjAE8lE5OTkr/////Sv////9LAHSUYksQSwiGlIwBQ5R0lFKULg=="}, "_last_episode_starts": {":type:": "<class 'numpy.ndarray'>", ":serialized:": "gAWVgwAAAAAAAACMEm51bXB5LmNvcmUubnVtZXJpY5SMC19mcm9tYnVmZmVylJOUKJYQAAAAAAAAAAAAAAAAAAAAAAAAAAAAAACUjAVudW1weZSMBWR0eXBllJOUjAJiMZSJiIeUUpQoSwOMAXyUTk5OSv////9K/////0sAdJRiSxCFlIwBQ5R0lFKULg=="}, "_last_original_obs": null, "_episode_num": 0, "use_sde": false, "sde_sample_freq": -1, "_current_progress_remaining": -0.015808000000000044, "_stats_window_size": 100, "ep_info_buffer": {":type:": "<class 'collections.deque'>", ":serialized:": 
"gAWVOQwAAAAAAACMC2NvbGxlY3Rpb25zlIwFZGVxdWWUk5QpS2SGlFKUKH2UKIwBcpRHQGcl6MaS9uiMAWyUTegDjAF0lEdAsOyNdiUgS3V9lChoBkdAZxF07KaG6GgHTegDaAhHQLDt+gpjMFF1fZQoaAZHQHFRD4pMHr1oB02HA2gIR0Cw7jARwqAjdX2UKGgGR0BmRPEfkmx/aAdN6ANoCEdAsO5maWom5XV9lChoBkdAYwIL8aXKKmgHTegDaAhHQLDujIznA7B1fZQoaAZHQGZd6w2VE/loB03oA2gIR0Cw7tcpobn6dX2UKGgGR0Bp1hQ53kgfaAdN6ANoCEdAsO9jMEA5rHV9lChoBkdAadWqABkqc2gHTegDaAhHQLDxCsWfseJ1fZQoaAZHQGX+/BFd9lVoB03oA2gIR0Cw8juJP69CdX2UKGgGR0BjMTZFocrBaAdN6ANoCEdAsPKP8AJb+3V9lChoBkdAacUCDEm6XmgHTegDaAhHQLD0tZf2K2t1fZQoaAZHQGxfkH+qBEtoB01VA2gIR0Cw9R8JD3M7dX2UKGgGR0BnGn4fwI+oaAdN6ANoCEdAsPWgImgJ1XV9lChoBkdAZXW5uIhyKmgHTegDaAhHQLD3SvGp++d1fZQoaAZHQGLUIO6NEPVoB03oA2gIR0Cw+B1A3T/idX2UKGgGR0BjjTmKZUkwaAdN6ANoCEdAsPkMUM5OrXV9lChoBkdAYe2AOrhismgHTegDaAhHQLD5IFDfFaV1fZQoaAZHQHJu4t16mfpoB00yAmgIR0Cw+TmxY7q6dX2UKGgGR0Bnr04rBj4IaAdN6ANoCEdAsRLLoX9BKXV9lChoBkdAYFh4rz5GjWgHTegDaAhHQLETBLsrupl1fZQoaAZHQGV8LupjtoloB03oA2gIR0CxEz4Lw4KhdX2UKGgGR0ByuJ5IH1OCaAdNDwFoCEdAsRNMdLg4wXV9lChoBkdAZDKsMiKR+2gHTegDaAhHQLETZqwQlKN1fZQoaAZHQGioEPtlZoxoB03oA2gIR0CxE5f4qPOqdX2UKGgGR0Bwi5z+3pfQaAdNMQJoCEdAsROjzMA3k3V9lChoBkdAZcoqNp/PPmgHTegDaAhHQLET86gM+eR1fZQoaAZHQDWrwrlNlAhoB0uXaAhHQLEVCAvtdAx1fZQoaAZHQGfoxTCLuQZoB03oA2gIR0CxFRVd5Y5ldX2UKGgGR0BmAzSy+pOvaAdN6ANoCEdAsRYARChN/XV9lChoBkdAcTiFhoduHmgHTVsDaAhHQLEWLea8Yht1fZQoaAZHQHFZTsyBTXJoB03fAWgIR0CxGETK1XvIdX2UKGgGR0BnuIFotcv/aAdN6ANoCEdAsRiluQ6p53V9lChoBkdAcshVQQ+UyGgHTRECaAhHQLEYv4etCAt1fZQoaAZHQGTIhUaQ3gloB03oA2gIR0CxGkQIUrTZdX2UKGgGR0BmKaGL1mJ4aAdN6ANoCEdAsRwc4YJmd3V9lChoBkdAZxap++dsi2gHTegDaAhHQLEcOsQNCqp1fZQoaAZHQGQL18kUsWhoB03oA2gIR0CxHGDoUzsQdX2UKGgGR0BkWxOzposaaAdN6ANoCEdAsR58593KS3V9lChoBkdAZ1njCpFTemgHTegDaAhHQLEe1MpgCwN1fZQoaAZHQGcptdRiw0RoB03oA2gIR0CxHykCvHLidX2UKGgGR0Bw9gpKBd2QaAdNUwFoCEdAsR9BW+49YHV9lChoBkdAZVlPqLS/kGgHTegDaAhHQLEfr029+PR1fZQoaAZHQGow75uZThpoB03oA2gIR0CxIEfBJqZddX2UKGgGR0Bk3J8F6iTMaAdN6ANoCEdAsSHUG9pRGnV9lChoBkdAZUoer+5vtWgHTegDaAhHQLEh36VMVUN1fZQoaAZHQGQaaguh9LJoB03oA2gIR0CxItiXdCVsdX2UKGgGR0BmKyKYRdyDaAdN6ANoCEdAsSM
HrxAjZHV9lChoBkdARON1KXfIjmgHS5toCEdAsSTOAtnPFHV9lChoBkdAYTfaUzKs+2gHTegDaAhHQLElO+w1R+B1fZQoaAZHQGni9CNS619oB03oA2gIR0CxJZsB2fTTdX2UKGgGR0BoRdC7btZ3aAdN6ANoCEdAsSWz8n/kvXV9lChoBkdAcFZS13MY/GgHTWADaAhHQLEnX3WnTAp1fZQoaAZHQGdH2bPQfIVoB03oA2gIR0CxKK+pOvdNdX2UKGgGR0BoQMJMQEpzaAdN6ANoCEdAsSjCqhlDnnV9lChoBkdAZv3UjLSuyWgHTegDaAhHQLFCR1+AmRh1fZQoaAZHQGzaLyDqW1NoB02iA2gIR0CxQlpbY9PldX2UKGgGR0Bm4movSMLnaAdN6ANoCEdAsUJ/6YVqOHV9lChoBkdAZT9+CsfaH2gHTegDaAhHQLFCsrSE12t1fZQoaAZHQHJjSro4dZJoB00rA2gIR0CxQrpemelLdX2UKGgGR0BjL56F/QSjaAdN6ANoCEdAsULAdwNsnHV9lChoBkdAZUKuhbnoxGgHTegDaAhHQLFDY60IC2d1fZQoaAZHQHE4qUVzp5hoB016AmgIR0CxQ4dSIgvEdX2UKGgGR0BLQjrJKaodaAdLomgIR0CxQ9QG0NSZdX2UKGgGR0BEyVhLGrCFaAdLqGgIR0CxRC2qHXVcdX2UKGgGR0BTDEr08NhFaAdLvWgIR0CxRGxwMpgDdX2UKGgGR0BnQiQA+6iCaAdN6ANoCEdAsURwBxPweHV9lChoBkdAZsoYCQtBfWgHTegDaAhHQLFFRtix3V11fZQoaAZHQGNlKZtvXK9oB03oA2gIR0CxR4p1JUYLdX2UKGgGR0BmootthuwYaAdN6ANoCEdAsUfo2XLNfXV9lChoBkdAZ98Fotcv/WgHTegDaAhHQLFIARigCfZ1fZQoaAZHQHNIPa11GLFoB02HAWgIR0CxSEBE4NqhdX2UKGgGR0BxkpxAB1cMaAdNnAJoCEdAsUjp0ZFXrHV9lChoBkdAYsDeOXE61mgHTegDaAhHQLFJpjyFwkx1fZQoaAZHQE2N3os7MgVoB0u0aAhHQLFKQFvhqCZ1fZQoaAZHQGHBwnhKlHloB03oA2gIR0CxS0fduYQbdX2UKGgGR0Bj6h31SOzZaAdN6ANoCEdAsUthUDMeOnV9lChoBkdAcmCq1PWQOmgHTU0DaAhHQLFLcMQVbiZ1fZQoaAZHQGVLooE0SAZoB03oA2gIR0CxThcWXTmXdX2UKGgGR0BxxykpI+W4aAdNvgFoCEdAsU8SLpA2RHV9lChoBkdAY+S/Zdv862gHTegDaAhHQLFPHr6tT1l1fZQoaAZHQGT9MLF4s3BoB03oA2gIR0CxT03L3bmEdX2UKGgGR0Bk0c/bCaZyaAdN6ANoCEdAsU+s/D+BH3V9lChoBkdAaY6kiUxEfGgHTegDaAhHQLFQYkKu0Tl1fZQoaAZHQGbxoeYD1XhoB03oA2gIR0CxUGXscABDdX2UKGgGR0BumedK/VRUaAdN7wJoCEdAsVDlSvTw2HV9lChoBkdAcJWtShrWRWgHTRMCaAhHQLFRJvphWo51fZQoaAZHQGQpozN2TxJoB03oA2gIR0CxUVAsGxD9dX2UKGgGR0BwLQE4ecQRaAdNAwJoCEdAsVHAhmoR7XV9lChoBkdATugTh5xBFGgHS4poCEdAsVJyNm16V3V9lChoBkdAVz7Abhm5D2gHS7doCEdAsVKmp84Pw3V9lChoBkdAZIVjfek562gHTegDaAhHQLFTrp4rz5J1fZQoaAZHQGkP0QTVUddoB03oA2gIR0CxU8WmtQsPdX2UKGgGR0Bu1/c8DB/JaAdN0QFoCEdAsVRj83uNP3V9lChoBkdAN7JMYdhiLGgHS5hoCEdAsVVLhsImgXV9lChoBkdAYQTHXEqDsmgHTegDaAhHQLFVdnpB5X51fZQoaAZHQG3ov/JeVs1
oB03eAmgIR0CxVen7gsK9dX2UKGgGR0Bj1c+RoysTaAdN6ANoCEdAsVavnEETx3V9lChoBkdAZxKOEug6EWgHTegDaAhHQLFWy5xzaK11fZQoaAZHQB3of8uSOipoB0ucaAhHQLFXCA+Y+jd1fZQoaAZHQD/unyd4FA5oB0ubaAhHQLFYVyu6mO51ZS4="}, "ep_success_buffer": {":type:": "<class 'collections.deque'>", ":serialized:": "gAWVIAAAAAAAAACMC2NvbGxlY3Rpb25zlIwFZGVxdWWUk5QpS2SGlFKULg=="}, "_n_updates": 310, "observation_space": {":type:": "<class 'gymnasium.spaces.box.Box'>", ":serialized:": "gAWVcAIAAAAAAACMFGd5bW5hc2l1bS5zcGFjZXMuYm94lIwDQm94lJOUKYGUfZQojAVkdHlwZZSMBW51bXB5lGgFk5SMAmY0lImIh5RSlChLA4wBPJROTk5K/////0r/////SwB0lGKMDWJvdW5kZWRfYmVsb3eUjBJudW1weS5jb3JlLm51bWVyaWOUjAtfZnJvbWJ1ZmZlcpSTlCiWCAAAAAAAAAABAQEBAQEBAZRoB4wCYjGUiYiHlFKUKEsDjAF8lE5OTkr/////Sv////9LAHSUYksIhZSMAUOUdJRSlIwNYm91bmRlZF9hYm92ZZRoECiWCAAAAAAAAAABAQEBAQEBAZRoFEsIhZRoGHSUUpSMBl9zaGFwZZRLCIWUjANsb3eUaBAoliAAAAAAAAAAAAC0wgAAtMIAAKDAAACgwNsPScAAAKDAAAAAgAAAAICUaApLCIWUaBh0lFKUjARoaWdolGgQKJYgAAAAAAAAAAAAtEIAALRCAACgQAAAoEDbD0lAAACgQAAAgD8AAIA/lGgKSwiFlGgYdJRSlIwIbG93X3JlcHKUjFtbLTkwLiAgICAgICAgLTkwLiAgICAgICAgIC01LiAgICAgICAgIC01LiAgICAgICAgIC0zLjE0MTU5MjcgIC01LgogIC0wLiAgICAgICAgIC0wLiAgICAgICBdlIwJaGlnaF9yZXBylIxTWzkwLiAgICAgICAgOTAuICAgICAgICAgNS4gICAgICAgICA1LiAgICAgICAgIDMuMTQxNTkyNyAgNS4KICAxLiAgICAgICAgIDEuICAgICAgIF2UjApfbnBfcmFuZG9tlE51Yi4=", "dtype": "float32", "bounded_below": "[ True True True True True True True True]", "bounded_above": "[ True True True True True True True True]", "_shape": [8], "low": "[-90. -90. -5. -5. -3.1415927 -5.\n -0. -0. ]", "high": "[90. 90. 5. 5. 3.1415927 5.\n 1. 1. ]", "low_repr": "[-90. -90. -5. -5. -3.1415927 -5.\n -0. -0. ]", "high_repr": "[90. 90. 5. 5. 3.1415927 5.\n 1. 1. 
]", "_np_random": null}, "action_space": {":type:": "<class 'gymnasium.spaces.discrete.Discrete'>", ":serialized:": "gAWV1QAAAAAAAACMGWd5bW5hc2l1bS5zcGFjZXMuZGlzY3JldGWUjAhEaXNjcmV0ZZSTlCmBlH2UKIwBbpSMFW51bXB5LmNvcmUubXVsdGlhcnJheZSMBnNjYWxhcpSTlIwFbnVtcHmUjAVkdHlwZZSTlIwCaTiUiYiHlFKUKEsDjAE8lE5OTkr/////Sv////9LAHSUYkMIBAAAAAAAAACUhpRSlIwFc3RhcnSUaAhoDkMIAAAAAAAAAACUhpRSlIwGX3NoYXBllCloCmgOjApfbnBfcmFuZG9tlE51Yi4=", "n": "4", "start": "0", "_shape": [], "dtype": "int64", "_np_random": null}, "n_envs": 16, "n_steps": 2048, "gamma": 0.999, "gae_lambda": 0.98, "ent_coef": 0.01, "vf_coef": 0.5, "max_grad_norm": 0.5, "batch_size": 64, "n_epochs": 10, "clip_range": {":type:": "<class 'function'>", ":serialized:": "gAWVxQIAAAAAAACMF2Nsb3VkcGlja2xlLmNsb3VkcGlja2xllIwOX21ha2VfZnVuY3Rpb26Uk5QoaACMDV9idWlsdGluX3R5cGWUk5SMCENvZGVUeXBllIWUUpQoSwFLAEsASwFLAUsTQwSIAFMAlE6FlCmMAV+UhZSMSS91c3IvbG9jYWwvbGliL3B5dGhvbjMuMTAvZGlzdC1wYWNrYWdlcy9zdGFibGVfYmFzZWxpbmVzMy9jb21tb24vdXRpbHMucHmUjARmdW5jlEuEQwIEAZSMA3ZhbJSFlCl0lFKUfZQojAtfX3BhY2thZ2VfX5SMGHN0YWJsZV9iYXNlbGluZXMzLmNvbW1vbpSMCF9fbmFtZV9flIwec3RhYmxlX2Jhc2VsaW5lczMuY29tbW9uLnV0aWxzlIwIX19maWxlX1+UjEkvdXNyL2xvY2FsL2xpYi9weXRob24zLjEwL2Rpc3QtcGFja2FnZXMvc3RhYmxlX2Jhc2VsaW5lczMvY29tbW9uL3V0aWxzLnB5lHVOTmgAjBBfbWFrZV9lbXB0eV9jZWxslJOUKVKUhZR0lFKUjBxjbG91ZHBpY2tsZS5jbG91ZHBpY2tsZV9mYXN0lIwSX2Z1bmN0aW9uX3NldHN0YXRllJOUaB99lH2UKGgWaA2MDF9fcXVhbG5hbWVfX5SMGWNvbnN0YW50X2ZuLjxsb2NhbHM+LmZ1bmOUjA9fX2Fubm90YXRpb25zX1+UfZSMDl9fa3dkZWZhdWx0c19flE6MDF9fZGVmYXVsdHNfX5ROjApfX21vZHVsZV9flGgXjAdfX2RvY19flE6MC19fY2xvc3VyZV9flGgAjApfbWFrZV9jZWxslJOURz/JmZmZmZmahZRSlIWUjBdfY2xvdWRwaWNrbGVfc3VibW9kdWxlc5RdlIwLX19nbG9iYWxzX1+UfZR1hpSGUjAu"}, "clip_range_vf": null, "normalize_advantage": true, "target_kl": null, "lr_schedule": {":type:": "<class 'function'>", ":serialized:": 
"gAWVxQIAAAAAAACMF2Nsb3VkcGlja2xlLmNsb3VkcGlja2xllIwOX21ha2VfZnVuY3Rpb26Uk5QoaACMDV9idWlsdGluX3R5cGWUk5SMCENvZGVUeXBllIWUUpQoSwFLAEsASwFLAUsTQwSIAFMAlE6FlCmMAV+UhZSMSS91c3IvbG9jYWwvbGliL3B5dGhvbjMuMTAvZGlzdC1wYWNrYWdlcy9zdGFibGVfYmFzZWxpbmVzMy9jb21tb24vdXRpbHMucHmUjARmdW5jlEuEQwIEAZSMA3ZhbJSFlCl0lFKUfZQojAtfX3BhY2thZ2VfX5SMGHN0YWJsZV9iYXNlbGluZXMzLmNvbW1vbpSMCF9fbmFtZV9flIwec3RhYmxlX2Jhc2VsaW5lczMuY29tbW9uLnV0aWxzlIwIX19maWxlX1+UjEkvdXNyL2xvY2FsL2xpYi9weXRob24zLjEwL2Rpc3QtcGFja2FnZXMvc3RhYmxlX2Jhc2VsaW5lczMvY29tbW9uL3V0aWxzLnB5lHVOTmgAjBBfbWFrZV9lbXB0eV9jZWxslJOUKVKUhZR0lFKUjBxjbG91ZHBpY2tsZS5jbG91ZHBpY2tsZV9mYXN0lIwSX2Z1bmN0aW9uX3NldHN0YXRllJOUaB99lH2UKGgWaA2MDF9fcXVhbG5hbWVfX5SMGWNvbnN0YW50X2ZuLjxsb2NhbHM+LmZ1bmOUjA9fX2Fubm90YXRpb25zX1+UfZSMDl9fa3dkZWZhdWx0c19flE6MDF9fZGVmYXVsdHNfX5ROjApfX21vZHVsZV9flGgXjAdfX2RvY19flE6MC19fY2xvc3VyZV9flGgAjApfbWFrZV9jZWxslJOURz8zqSowVTJhhZRSlIWUjBdfY2xvdWRwaWNrbGVfc3VibW9kdWxlc5RdlIwLX19nbG9iYWxzX1+UfZR1hpSGUjAu"}, "system_info": {"OS": "Linux-5.15.120+-x86_64-with-glibc2.35 # 1 SMP Wed Aug 30 11:19:59 UTC 2023", "Python": "3.10.12", "Stable-Baselines3": "2.0.0a5", "PyTorch": "2.0.1+cu118", "GPU Enabled": "True", "Numpy": "1.23.5", "Cloudpickle": "2.2.1", "Gymnasium": "0.28.1", "OpenAI Gym": "0.25.2"}}
 
1
+ {"policy_class": {":type:": "<class 'abc.ABCMeta'>", ":serialized:": "gAWVOwAAAAAAAACMIXN0YWJsZV9iYXNlbGluZXMzLmNvbW1vbi5wb2xpY2llc5SMEUFjdG9yQ3JpdGljUG9saWN5lJOULg==", "__module__": "stable_baselines3.common.policies", "__doc__": "\n Policy class for actor-critic algorithms (has both policy and value prediction).\n Used by A2C, PPO and the likes.\n\n :param observation_space: Observation space\n :param action_space: Action space\n :param lr_schedule: Learning rate schedule (could be constant)\n :param net_arch: The specification of the policy and value networks.\n :param activation_fn: Activation function\n :param ortho_init: Whether to use or not orthogonal initialization\n :param use_sde: Whether to use State Dependent Exploration or not\n :param log_std_init: Initial value for the log standard deviation\n :param full_std: Whether to use (n_features x n_actions) parameters\n for the std instead of only (n_features,) when using gSDE\n :param use_expln: Use ``expln()`` function instead of ``exp()`` to ensure\n a positive standard deviation (cf paper). It allows to keep variance\n above zero and prevent it from growing too fast. 
In practice, ``exp()`` is usually enough.\n :param squash_output: Whether to squash the output using a tanh function,\n this allows to ensure boundaries when using gSDE.\n :param features_extractor_class: Features extractor to use.\n :param features_extractor_kwargs: Keyword arguments\n to pass to the features extractor.\n :param share_features_extractor: If True, the features extractor is shared between the policy and value networks.\n :param normalize_images: Whether to normalize images or not,\n dividing by 255.0 (True by default)\n :param optimizer_class: The optimizer to use,\n ``th.optim.Adam`` by default\n :param optimizer_kwargs: Additional keyword arguments,\n excluding the learning rate, to pass to the optimizer\n ", "__init__": "<function ActorCriticPolicy.__init__ at 0x7e2a0f6172e0>", "_get_constructor_parameters": "<function ActorCriticPolicy._get_constructor_parameters at 0x7e2a0f617370>", "reset_noise": "<function ActorCriticPolicy.reset_noise at 0x7e2a0f617400>", "_build_mlp_extractor": "<function ActorCriticPolicy._build_mlp_extractor at 0x7e2a0f617490>", "_build": "<function ActorCriticPolicy._build at 0x7e2a0f617520>", "forward": "<function ActorCriticPolicy.forward at 0x7e2a0f6175b0>", "extract_features": "<function ActorCriticPolicy.extract_features at 0x7e2a0f617640>", "_get_action_dist_from_latent": "<function ActorCriticPolicy._get_action_dist_from_latent at 0x7e2a0f6176d0>", "_predict": "<function ActorCriticPolicy._predict at 0x7e2a0f617760>", "evaluate_actions": "<function ActorCriticPolicy.evaluate_actions at 0x7e2a0f6177f0>", "get_distribution": "<function ActorCriticPolicy.get_distribution at 0x7e2a0f617880>", "predict_values": "<function ActorCriticPolicy.predict_values at 0x7e2a0f617910>", "__abstractmethods__": "frozenset()", "_abc_impl": "<_abc._abc_data object at 0x7e2a0f5c7700>"}, "verbose": 1, "policy_kwargs": {}, "num_timesteps": 1507328, "_total_timesteps": 1500000, "_num_timesteps_at_start": 0, "seed": null, "action_noise": 
null, "start_time": 1695522685106348523, "learning_rate": 0.0003, "tensorboard_log": null, "_last_obs": {":type:": "<class 'numpy.ndarray'>", ":serialized:": "gAWVdQIAAAAAAACMEm51bXB5LmNvcmUubnVtZXJpY5SMC19mcm9tYnVmZmVylJOUKJYAAgAAAAAAALOj0b2GplY/kRA4vjH/KL8Frha+da8IvQAAAAAAAAAAmh/evAqRLru6aQY8lreQPLAcTLzFank9AACAPwAAgD9APC2+TuaFP5kCBr/kdTK/IVmFviYlk74AAAAAAAAAADO4Gb4iaoY+LpmBPowNiL7lyNS8brL6PQAAAAAAAAAAppB5vuq8Wj+jRgS+h9A/v63ehr7i3pU9AAAAAAAAAACAtBG9pK8cuzBS/TmhU408p5f7u7NTdD0AAIA/AACAPxqXBr32sDG6aMSUthp+gbE/UQu7mFq0NQAAgD8AAIA/Zu3TvBRQurpaUB05VUoONDKLYzm+TDO4AACAPwAAgD/wHme+2Qn3PoaAzT3pHBC/97svvlKrHz4AAAAAAAAAAIAWaL0KynC71YlkPHtGjDwYp7g8taZwvQAAgD8AAIA/JpDevdULFj73arA+gLJovozU4j3O9aw8AAAAAAAAAAAzKW68byPEPsPEoL1KpPu+T6ZqPJI3E74AAAAAAAAAADN6jb3a4KU/8A6nvqc4Ar/2dN+9kYy8vQAAAAAAAAAAzZ6cvK5HjbjrtYY5STOrNHhd0TtKdaS4AACAPwAAgD+zGhO9eTSZPlEpoT05EdK+TSM6PfNj0joAAAAAAAAAADNbODwuo689Jlf+veTem77EQ528/kKmvQAAAAAAAAAAlIwFbnVtcHmUjAVkdHlwZZSTlIwCZjSUiYiHlFKUKEsDjAE8lE5OTkr/////Sv////9LAHSUYksQSwiGlIwBQ5R0lFKULg=="}, "_last_episode_starts": {":type:": "<class 'numpy.ndarray'>", ":serialized:": "gAWVgwAAAAAAAACMEm51bXB5LmNvcmUubnVtZXJpY5SMC19mcm9tYnVmZmVylJOUKJYQAAAAAAAAAAAAAAAAAAAAAAAAAAAAAACUjAVudW1weZSMBWR0eXBllJOUjAJiMZSJiIeUUpQoSwOMAXyUTk5OSv////9K/////0sAdJRiSxCFlIwBQ5R0lFKULg=="}, "_last_original_obs": null, "_episode_num": 0, "use_sde": false, "sde_sample_freq": -1, "_current_progress_remaining": -0.004885333333333408, "_stats_window_size": 100, "ep_info_buffer": {":type:": "<class 'collections.deque'>", ":serialized:": 
"gAWV5wsAAAAAAACMC2NvbGxlY3Rpb25zlIwFZGVxdWWUk5QpS2SGlFKUKH2UKIwBcpRHQHIVpXuE25yMAWyUS7qMAXSUR0ClplLFXJYDdX2UKGgGR0BzUdv863iJaAdL8WgIR0ClppwLNOdodX2UKGgGR0BxQsxQBPsSaAdL7WgIR0ClpqIBq9GrdX2UKGgGR0ByerLDAJswaAdLzWgIR0ClprFlbu+idX2UKGgGR0BuA1mrbQC0aAdL0mgIR0Clpr/xDst1dX2UKGgGR0BxjdpnHvMKaAdLz2gIR0Clp1U7KaG6dX2UKGgGR0Bw6Og7HQyAaAdL42gIR0Clp1qm8/UwdX2UKGgGR0BymnPiT+vRaAdL1WgIR0Clp23vx6OYdX2UKGgGR0BxlJyhi9ZiaAdL2mgIR0Clp/sx46fbdX2UKGgGR0BNO/bCaZx8aAdLnWgIR0ClqDEc0cfedX2UKGgGR0BzG4w+MZP3aAdL1WgIR0ClqK3PzFuOdX2UKGgGR0BtZ8Nc4YJmaAdLymgIR0ClqT7kGRmsdX2UKGgGR0BxCgeKbaysaAdL0mgIR0ClqabbUPQOdX2UKGgGR0Bx0ELkS26TaAdLuWgIR0ClqbeBYmsvdX2UKGgGR0BvxLRhMJyAaAdLzGgIR0ClqfMvIwM6dX2UKGgGR0BzH3giu+yraAdL5GgIR0ClqmSUC7sfdX2UKGgGR0BwlbkT6BRRaAdL2WgIR0Clqt8FhXr/dX2UKGgGR0B0KDHbRF7VaAdL/mgIR0ClqznUtqYadX2UKGgGR0ByvJFvybx3aAdL+GgIR0Clq2wuVX3hdX2UKGgGR0BwBZ40Mw10aAdL0mgIR0Clq4W6bvw3dX2UKGgGR0BynfbDdgv2aAdL+mgIR0Clq547zTWodX2UKGgGR0BQtFLBbfP5aAdLuWgIR0Clq6pYDDCQdX2UKGgGR0BxkvwKBun/aAdL5mgIR0Clq9748EFGdX2UKGgGR0B0bJdPci4baAdL8mgIR0Clq/bALy+YdX2UKGgGR0ByuhMAWBSUaAdL02gIR0ClrBbMPjGUdX2UKGgGR0BzvJ04iosJaAdNKgFoCEdApawdHvttynV9lChoBkdAcGX5dWyTp2gHS71oCEdApax1yimEXnV9lChoBkdAcfm8n/kvK2gHS+JoCEdApayMwi7kGXV9lChoBkdAcKL+pOvdM2gHS+NoCEdApa041LrX2HV9lChoBkdAcfXr6tT1kGgHS/BoCEdApa2Lp5eJHnV9lChoBkdAcwZwyIpH7WgHTQEBaAhHQKWtkJLM9r51fZQoaAZHQHOljWsijcpoB0vKaAhHQKWtonv2GqR1fZQoaAZHQHKT2ZZ0SytoB0vraAhHQKWtwTyrgfl1fZQoaAZHQG35T/hl18toB0u7aAhHQKWt66FuejF1fZQoaAZHQHObO63AmAtoB0vTaAhHQKWuIM+/xlR1fZQoaAZHQHFCBdpqREFoB0vpaAhHQKWuN+AmReV1fZQoaAZHQHDdk5yU9p1oB0vkaAhHQKWuSdCE6DJ1fZQoaAZHQHMt4OUdJatoB0vBaAhHQKWueKCQLeB1fZQoaAZHQHGf6pgkTpRoB0vtaAhHQKWuf2YfGMp1fZQoaAZHQHM0hd+ocaRoB0vdaAhHQKWuovBacI91fZQoaAZHQHAzTYI0IkZoB0vRaAhHQKWuoOmR/3F1fZQoaAZHQHPDilenhsJoB0vqaAhHQKWur8D0UXZ1fZQoaAZHQHKOwnc+JP9oB0vPaAhHQKWvCYw7DEZ1fZQoaAZHQHEifLX+VC5oB0vGaAhHQKWvl86V+ql1fZQoaAZHQHK9+VHFxXJoB00XAWgIR0Clr9RI8QqadX2UKGgGR0BwF9nh86V/aAdLv2gIR0Clr+e1a4c4dX2UKGgGR0BwJ4/OdGy5aAdLzGgIR0Clr/3k5p8GdX2UKGgGR0ByPHsHB1s+aAdLr2gIR0ClsAAjps42dX2UKGgGR0B
x8BIVdonKaAdL5WgIR0ClsEJqASWadX2UKGgGR0BxpbY/Vy3kaAdLqmgIR0ClsEVrylN2dX2UKGgGR0ByXkP+XJHRaAdL2WgIR0ClsFThYNiIdX2UKGgGR0BuUuKZUkv9aAdL2GgIR0ClsKkR8MNMdX2UKGgGR0By3tHc1wYMaAdLxmgIR0ClsNCih37ldX2UKGgGR0Bx5AwSJ0nxaAdL42gIR0ClsOKv3ai9dX2UKGgGR0Bx8wQ/X5FgaAdLy2gIR0ClsQVEuxr0dX2UKGgGR0Bwg8spXp4baAdL5WgIR0ClsSlqrR0EdX2UKGgGR0BzCLoxHoX9aAdL22gIR0ClsTbr9l3AdX2UKGgGR0BxkTSpiqhlaAdL22gIR0ClsaWNedCmdX2UKGgGR0ByjLRrrPdEaAdNAwFoCEdApbHBaC+UQnV9lChoBkdAcfbl+Vkc0mgHS+FoCEdApbJEBXCCSXV9lChoBkdAcZJaLn9vTGgHS8xoCEdApbJrNdJJ5HV9lChoBkdAcLcMjNY8uGgHS8toCEdApbJqpcX3xnV9lChoBkdAcomdDIBBA2gHS9hoCEdApbJ6fzz3AXV9lChoBkdAckGJvo/zKGgHS8VoCEdApbKfGp++d3V9lChoBkdAcej4/u9eyGgHS6xoCEdApbMhU1hsqXV9lChoBkdAc6qbMHKOk2gHS/RoCEdApbM/NHH3lHV9lChoBkdAcsuQ3xWkrWgHS8FoCEdApbNEgOjIrHV9lChoBkdAcsjsqrilzmgHS9loCEdApbNWi5/b03V9lChoBkdAcwlVxjriVGgHTQABaAhHQKWzdYGMXJp1fZQoaAZHQHD1YoE0SAZoB0vWaAhHQKWz16sySFJ1fZQoaAZHQHFiLHuJDVpoB01KAWgIR0Cls+DhUBGQdX2UKGgGR0Bya6j/MnqnaAdLsmgIR0Cls+mqHXVcdX2UKGgGR0BxD1xeb/fgaAdL2mgIR0Cls/Q4sEq2dX2UKGgGR0BxSCQEIPbxaAdLp2gIR0CltJB/qgRLdX2UKGgGR0BzgUqVhTfjaAdL52gIR0CltLQnhKlIdX2UKGgGR0ByYbpfQa73aAdLwmgIR0CltTMVclgMdX2UKGgGR0BzX0LSeAd5aAdLzmgIR0CltTR6fJ3gdX2UKGgGR0BwAW7OE/SqaAdL7WgIR0CltWrRrrPddX2UKGgGR0BxriM3qAz6aAdNbgFoCEdApbWGF10T13V9lChoBkdAdEuIBzV+Z2gHS+5oCEdApbWU/Y8MeHV9lChoBkdAcxyEZR8+imgHS7xoCEdApbWnw7T2FnV9lChoBkdAb29TRYzSC2gHS7toCEdApbW+kUKzA3V9lChoBkdAcvaziCJ40WgHS8JoCEdApbXW5jH4oXV9lChoBkdAcgYn889wFWgHS81oCEdApbYfZTQ3P3V9lChoBkfANJ98E3bVSWgHS1poCEdApbZMaVD8cnV9lChoBkdAcSSCrLhaT2gHS8NoCEdApbZ3KQq7RXV9lChoBkdAc9XeeWfK6mgHS85oCEdApbaFdRiw0XV9lChoBkdAcdig2Ifr8mgHS/hoCEdApbaIHAymAXV9lChoBkdAcPh8r7O3UmgHS9poCEdApbataUzKtHV9lChoBkdAco9zXBguy2gHS+poCEdApbbMd7v5QHV9lChoBkdAcOC37UG3WmgHS8toCEdApbcxNXYDknV9lChoBkdAcOpR6nivPmgHS99oCEdApbdRwZOzp3V9lChoBkdAcc5UlAu7H2gHS81oCEdApbehIWgvlHV9lChoBkdAcG59ph4MW2gHS7loCEdApbe2Zb6gunV9lChoBkdAbjZebd8ArGgHS8BoCEdApbe+YMOPNnV9lChoBkdAcIyWpqASWmgHS7poCEdApbfkfs/puHV9lChoBkdAc+AKAJ9iMGgHS7loCEdApbf6MJhOQHV9lChoBkdAc5J13t8eCGgHS/hoCEdApbhO2LHdXXV9lCh
oBkdAbSMTsY2sJmgHS8loCEdApbh4geRxLnV9lChoBkdAcnURcNYr8WgHS/hoCEdApbiKfg75mHVlLg=="}, "ep_success_buffer": {":type:": "<class 'collections.deque'>", ":serialized:": "gAWVIAAAAAAAAACMC2NvbGxlY3Rpb25zlIwFZGVxdWWUk5QpS2SGlFKULg=="}, "_n_updates": 690, "observation_space": {":type:": "<class 'gymnasium.spaces.box.Box'>", ":serialized:": "gAWVcAIAAAAAAACMFGd5bW5hc2l1bS5zcGFjZXMuYm94lIwDQm94lJOUKYGUfZQojAVkdHlwZZSMBW51bXB5lGgFk5SMAmY0lImIh5RSlChLA4wBPJROTk5K/////0r/////SwB0lGKMDWJvdW5kZWRfYmVsb3eUjBJudW1weS5jb3JlLm51bWVyaWOUjAtfZnJvbWJ1ZmZlcpSTlCiWCAAAAAAAAAABAQEBAQEBAZRoB4wCYjGUiYiHlFKUKEsDjAF8lE5OTkr/////Sv////9LAHSUYksIhZSMAUOUdJRSlIwNYm91bmRlZF9hYm92ZZRoECiWCAAAAAAAAAABAQEBAQEBAZRoFEsIhZRoGHSUUpSMBl9zaGFwZZRLCIWUjANsb3eUaBAoliAAAAAAAAAAAAC0wgAAtMIAAKDAAACgwNsPScAAAKDAAAAAgAAAAICUaApLCIWUaBh0lFKUjARoaWdolGgQKJYgAAAAAAAAAAAAtEIAALRCAACgQAAAoEDbD0lAAACgQAAAgD8AAIA/lGgKSwiFlGgYdJRSlIwIbG93X3JlcHKUjFtbLTkwLiAgICAgICAgLTkwLiAgICAgICAgIC01LiAgICAgICAgIC01LiAgICAgICAgIC0zLjE0MTU5MjcgIC01LgogIC0wLiAgICAgICAgIC0wLiAgICAgICBdlIwJaGlnaF9yZXBylIxTWzkwLiAgICAgICAgOTAuICAgICAgICAgNS4gICAgICAgICA1LiAgICAgICAgIDMuMTQxNTkyNyAgNS4KICAxLiAgICAgICAgIDEuICAgICAgIF2UjApfbnBfcmFuZG9tlE51Yi4=", "dtype": "float32", "bounded_below": "[ True True True True True True True True]", "bounded_above": "[ True True True True True True True True]", "_shape": [8], "low": "[-90. -90. -5. -5. -3.1415927 -5.\n -0. -0. ]", "high": "[90. 90. 5. 5. 3.1415927 5.\n 1. 1. ]", "low_repr": "[-90. -90. -5. -5. -3.1415927 -5.\n -0. -0. ]", "high_repr": "[90. 90. 5. 5. 3.1415927 5.\n 1. 1. 
]", "_np_random": null}, "action_space": {":type:": "<class 'gymnasium.spaces.discrete.Discrete'>", ":serialized:": "gAWV1QAAAAAAAACMGWd5bW5hc2l1bS5zcGFjZXMuZGlzY3JldGWUjAhEaXNjcmV0ZZSTlCmBlH2UKIwBbpSMFW51bXB5LmNvcmUubXVsdGlhcnJheZSMBnNjYWxhcpSTlIwFbnVtcHmUjAVkdHlwZZSTlIwCaTiUiYiHlFKUKEsDjAE8lE5OTkr/////Sv////9LAHSUYkMIBAAAAAAAAACUhpRSlIwFc3RhcnSUaAhoDkMIAAAAAAAAAACUhpRSlIwGX3NoYXBllCloCmgOjApfbnBfcmFuZG9tlE51Yi4=", "n": "4", "start": "0", "_shape": [], "dtype": "int64", "_np_random": null}, "n_envs": 16, "n_steps": 2048, "gamma": 0.999, "gae_lambda": 0.98, "ent_coef": 0.01, "vf_coef": 0.5, "max_grad_norm": 0.5, "batch_size": 64, "n_epochs": 15, "clip_range": {":type:": "<class 'function'>", ":serialized:": "gAWVxQIAAAAAAACMF2Nsb3VkcGlja2xlLmNsb3VkcGlja2xllIwOX21ha2VfZnVuY3Rpb26Uk5QoaACMDV9idWlsdGluX3R5cGWUk5SMCENvZGVUeXBllIWUUpQoSwFLAEsASwFLAUsTQwSIAFMAlE6FlCmMAV+UhZSMSS91c3IvbG9jYWwvbGliL3B5dGhvbjMuMTAvZGlzdC1wYWNrYWdlcy9zdGFibGVfYmFzZWxpbmVzMy9jb21tb24vdXRpbHMucHmUjARmdW5jlEuEQwIEAZSMA3ZhbJSFlCl0lFKUfZQojAtfX3BhY2thZ2VfX5SMGHN0YWJsZV9iYXNlbGluZXMzLmNvbW1vbpSMCF9fbmFtZV9flIwec3RhYmxlX2Jhc2VsaW5lczMuY29tbW9uLnV0aWxzlIwIX19maWxlX1+UjEkvdXNyL2xvY2FsL2xpYi9weXRob24zLjEwL2Rpc3QtcGFja2FnZXMvc3RhYmxlX2Jhc2VsaW5lczMvY29tbW9uL3V0aWxzLnB5lHVOTmgAjBBfbWFrZV9lbXB0eV9jZWxslJOUKVKUhZR0lFKUjBxjbG91ZHBpY2tsZS5jbG91ZHBpY2tsZV9mYXN0lIwSX2Z1bmN0aW9uX3NldHN0YXRllJOUaB99lH2UKGgWaA2MDF9fcXVhbG5hbWVfX5SMGWNvbnN0YW50X2ZuLjxsb2NhbHM+LmZ1bmOUjA9fX2Fubm90YXRpb25zX1+UfZSMDl9fa3dkZWZhdWx0c19flE6MDF9fZGVmYXVsdHNfX5ROjApfX21vZHVsZV9flGgXjAdfX2RvY19flE6MC19fY2xvc3VyZV9flGgAjApfbWFrZV9jZWxslJOURz/JmZmZmZmahZRSlIWUjBdfY2xvdWRwaWNrbGVfc3VibW9kdWxlc5RdlIwLX19nbG9iYWxzX1+UfZR1hpSGUjAu"}, "clip_range_vf": null, "normalize_advantage": true, "target_kl": null, "lr_schedule": {":type:": "<class 'function'>", ":serialized:": 
"gAWVxQIAAAAAAACMF2Nsb3VkcGlja2xlLmNsb3VkcGlja2xllIwOX21ha2VfZnVuY3Rpb26Uk5QoaACMDV9idWlsdGluX3R5cGWUk5SMCENvZGVUeXBllIWUUpQoSwFLAEsASwFLAUsTQwSIAFMAlE6FlCmMAV+UhZSMSS91c3IvbG9jYWwvbGliL3B5dGhvbjMuMTAvZGlzdC1wYWNrYWdlcy9zdGFibGVfYmFzZWxpbmVzMy9jb21tb24vdXRpbHMucHmUjARmdW5jlEuEQwIEAZSMA3ZhbJSFlCl0lFKUfZQojAtfX3BhY2thZ2VfX5SMGHN0YWJsZV9iYXNlbGluZXMzLmNvbW1vbpSMCF9fbmFtZV9flIwec3RhYmxlX2Jhc2VsaW5lczMuY29tbW9uLnV0aWxzlIwIX19maWxlX1+UjEkvdXNyL2xvY2FsL2xpYi9weXRob24zLjEwL2Rpc3QtcGFja2FnZXMvc3RhYmxlX2Jhc2VsaW5lczMvY29tbW9uL3V0aWxzLnB5lHVOTmgAjBBfbWFrZV9lbXB0eV9jZWxslJOUKVKUhZR0lFKUjBxjbG91ZHBpY2tsZS5jbG91ZHBpY2tsZV9mYXN0lIwSX2Z1bmN0aW9uX3NldHN0YXRllJOUaB99lH2UKGgWaA2MDF9fcXVhbG5hbWVfX5SMGWNvbnN0YW50X2ZuLjxsb2NhbHM+LmZ1bmOUjA9fX2Fubm90YXRpb25zX1+UfZSMDl9fa3dkZWZhdWx0c19flE6MDF9fZGVmYXVsdHNfX5ROjApfX21vZHVsZV9flGgXjAdfX2RvY19flE6MC19fY2xvc3VyZV9flGgAjApfbWFrZV9jZWxslJOURz8zqSowVTJhhZRSlIWUjBdfY2xvdWRwaWNrbGVfc3VibW9kdWxlc5RdlIwLX19nbG9iYWxzX1+UfZR1hpSGUjAu"}, "system_info": {"OS": "Linux-5.15.120+-x86_64-with-glibc2.35 # 1 SMP Wed Aug 30 11:19:59 UTC 2023", "Python": "3.10.12", "Stable-Baselines3": "2.0.0a5", "PyTorch": "2.0.1+cu118", "GPU Enabled": "True", "Numpy": "1.23.5", "Cloudpickle": "2.2.1", "Gymnasium": "0.28.1", "OpenAI Gym": "0.25.2"}}
ppo-LunarLander-v2.zip CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:ab1966635737f6ee0dde29b87aaa9fae0c7840e9b9dda7fac9b161dff522c5b6
3
- size 146755
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:043295c04ba49947fee15b10e34953a35b700c9374f96c3c239f375e485d4779
3
+ size 146636
ppo-LunarLander-v2/data CHANGED
@@ -4,34 +4,34 @@
4
  ":serialized:": "gAWVOwAAAAAAAACMIXN0YWJsZV9iYXNlbGluZXMzLmNvbW1vbi5wb2xpY2llc5SMEUFjdG9yQ3JpdGljUG9saWN5lJOULg==",
5
  "__module__": "stable_baselines3.common.policies",
6
  "__doc__": "\n Policy class for actor-critic algorithms (has both policy and value prediction).\n Used by A2C, PPO and the likes.\n\n :param observation_space: Observation space\n :param action_space: Action space\n :param lr_schedule: Learning rate schedule (could be constant)\n :param net_arch: The specification of the policy and value networks.\n :param activation_fn: Activation function\n :param ortho_init: Whether to use or not orthogonal initialization\n :param use_sde: Whether to use State Dependent Exploration or not\n :param log_std_init: Initial value for the log standard deviation\n :param full_std: Whether to use (n_features x n_actions) parameters\n for the std instead of only (n_features,) when using gSDE\n :param use_expln: Use ``expln()`` function instead of ``exp()`` to ensure\n a positive standard deviation (cf paper). It allows to keep variance\n above zero and prevent it from growing too fast. In practice, ``exp()`` is usually enough.\n :param squash_output: Whether to squash the output using a tanh function,\n this allows to ensure boundaries when using gSDE.\n :param features_extractor_class: Features extractor to use.\n :param features_extractor_kwargs: Keyword arguments\n to pass to the features extractor.\n :param share_features_extractor: If True, the features extractor is shared between the policy and value networks.\n :param normalize_images: Whether to normalize images or not,\n dividing by 255.0 (True by default)\n :param optimizer_class: The optimizer to use,\n ``th.optim.Adam`` by default\n :param optimizer_kwargs: Additional keyword arguments,\n excluding the learning rate, to pass to the optimizer\n ",
7
- "__init__": "<function ActorCriticPolicy.__init__ at 0x7b29f4fcd990>",
8
- "_get_constructor_parameters": "<function ActorCriticPolicy._get_constructor_parameters at 0x7b29f4fcda20>",
9
- "reset_noise": "<function ActorCriticPolicy.reset_noise at 0x7b29f4fcdab0>",
10
- "_build_mlp_extractor": "<function ActorCriticPolicy._build_mlp_extractor at 0x7b29f4fcdb40>",
11
- "_build": "<function ActorCriticPolicy._build at 0x7b29f4fcdbd0>",
12
- "forward": "<function ActorCriticPolicy.forward at 0x7b29f4fcdc60>",
13
- "extract_features": "<function ActorCriticPolicy.extract_features at 0x7b29f4fcdcf0>",
14
- "_get_action_dist_from_latent": "<function ActorCriticPolicy._get_action_dist_from_latent at 0x7b29f4fcdd80>",
15
- "_predict": "<function ActorCriticPolicy._predict at 0x7b29f4fcde10>",
16
- "evaluate_actions": "<function ActorCriticPolicy.evaluate_actions at 0x7b29f4fcdea0>",
17
- "get_distribution": "<function ActorCriticPolicy.get_distribution at 0x7b29f4fcdf30>",
18
- "predict_values": "<function ActorCriticPolicy.predict_values at 0x7b29f4fcdfc0>",
19
  "__abstractmethods__": "frozenset()",
20
- "_abc_impl": "<_abc._abc_data object at 0x7b29f5167380>"
21
  },
22
  "verbose": 1,
23
  "policy_kwargs": {},
24
- "num_timesteps": 1015808,
25
- "_total_timesteps": 1000000,
26
  "_num_timesteps_at_start": 0,
27
  "seed": null,
28
  "action_noise": null,
29
- "start_time": 1695503808138910790,
30
  "learning_rate": 0.0003,
31
  "tensorboard_log": null,
32
  "_last_obs": {
33
  ":type:": "<class 'numpy.ndarray'>",
34
- ":serialized:": "gAWVdQIAAAAAAACMEm51bXB5LmNvcmUubnVtZXJpY5SMC19mcm9tYnVmZmVylJOUKJYAAgAAAAAAAPODUT4K6h8/axaovP5lqL4DGZY93gHCvAAAAAAAAAAAZhBvvMSA8j0aJiK+hEtOvvsa3L06U/m8AAAAAAAAAAAzkxm6eHyuPS7YGr2O5xK+a6szOkWX+bwAAAAAAAAAAKZxdT6/kx4/fq1aPRO8k744lck9am0QPQAAAAAAAAAAmnu+vNVfXj6OPZW9erJZvsCusL0xCSa9AAAAAAAAAADg6Bg+LQosPoCEBb7m2E2+Jz47vaKrc70AAAAAAAAAAACAVTp76pG66M/WO1I2jTym9Zi6lft1vQAAgD8AAIA/zeBnPe6dn7xSp+S75yTVPDPk8j0Sy5Q9AACAPwAAgD+aTfW7H/HNPH4tNTtKkAy+MDX/ujhvuz0AAAAAAAAAAGZstL0U5Ji6rVbFuqZv0bUQ/FI6Ct/jOQAAAAAAAIA/s8BqPXuGpLpGJLY6b9lUNfGGzDojg9G5AACAPwAAgD8N/rq9r9gTPYXhZj3UvAK+MQ9GPbuO1roAAAAAAAAAAJpT9LweFlI/ljwnvYYypb41SJm8gF4KvgAAAAAAAAAAWqsaPvTWQD6zVlS+7Zc2vqBGL72aEyG9AAAAAAAAAADGkZo+3xNyP44XyT16ete+PBFDPmvDBr4AAAAAAAAAAIBBdD3sv8m7zkHpu1bt+jzCkeI8HowfPAAAgD8AAIA/lIwFbnVtcHmUjAVkdHlwZZSTlIwCZjSUiYiHlFKUKEsDjAE8lE5OTkr/////Sv////9LAHSUYksQSwiGlIwBQ5R0lFKULg=="
35
  },
36
  "_last_episode_starts": {
37
  ":type:": "<class 'numpy.ndarray'>",
@@ -41,17 +41,17 @@
41
  "_episode_num": 0,
42
  "use_sde": false,
43
  "sde_sample_freq": -1,
44
- "_current_progress_remaining": -0.015808000000000044,
45
  "_stats_window_size": 100,
46
  "ep_info_buffer": {
47
  ":type:": "<class 'collections.deque'>",
48
- ":serialized:": "gAWVQwwAAAAAAACMC2NvbGxlY3Rpb25zlIwFZGVxdWWUk5QpS2SGlFKUKH2UKIwBcpRHQHEtFDOTq0OMAWyUTSgBjAF0lEdAmE8RTGYKIHV9lChoBkdAcPI6Ae7tiWgHTe8BaAhHQJhPXIsAeaN1fZQoaAZHQGblHuAqd6NoB03oA2gIR0CYUit16mfodX2UKGgGR0BwT6FajesQaAdNwAFoCEdAmFLev+wTunV9lChoBkdAcDtNxVAAyWgHTdEBaAhHQJhTnKMefZp1fZQoaAZHQHG9jBEa2ndoB01zAWgIR0CYU9LLpzLfdX2UKGgGR0Br1sQsf7rLaAdNTAFoCEdAmFQlHe7+UHV9lChoBkdAPl8QVbiZOWgHS/doCEdAmFW1TvRZ2nV9lChoBkdAcZ8pWmxdIGgHTZMBaAhHQJhXzdl/Yrd1fZQoaAZHQHD+eyVv/BFoB02lAWgIR0CYWJJ/5LyudX2UKGgGR0BuoyKHfuTiaAdNngFoCEdAmFqeH31zyXV9lChoBkdAbJv/jKgZj2gHTSoBaAhHQJhcZS4vvjR1fZQoaAZHQHBUmTgVGkNoB003AWgIR0CYXZF1jiGWdX2UKGgGR0BuIhCfHxSYaAdNQgFoCEdAmF4Moc7yQXV9lChoBkdAcNkAVO9FnmgHTU0BaAhHQJhhy4oZydZ1fZQoaAZHQHDofjKgZjxoB02YAWgIR0CYYjvJiiItdX2UKGgGR0BwqWAmReTnaAdNFgJoCEdAmGQsabWmQHV9lChoBkdAbvNRVp9JBmgHTRcCaAhHQJhlXFWGRFJ1fZQoaAZHQG/18RtgrpdoB027AWgIR0CYftzK9wm3dX2UKGgGR0BxtgVZcLSeaAdNYwJoCEdAmH/5MpPRA3V9lChoBkdAbBMXzDn/1mgHTbcCaAhHQJiAN8eCCjF1fZQoaAZHQHIckJKJ2uBoB00OAmgIR0CYgLDf3vhIdX2UKGgGR0BylOBbwBo3aAdNuQFoCEdAmIECFPBSDXV9lChoBkdAb5EpBHCoCWgHTUYBaAhHQJiBZCF9KEp1fZQoaAZHQHKDHctXgcdoB03PAWgIR0CYhG1rIo3KdX2UKGgGR0BujZda+vhZaAdNdQFoCEdAmISm6bvw3HV9lChoBkdAcZvfpD/lyWgHTcACaAhHQJiFZ5Y5ksl1fZQoaAZHQHFWZpSJj2BoB01dAWgIR0CYhZujh1kldX2UKGgGR0BwZnmr8zhxaAdNegJoCEdAmIXY6nzg/HV9lChoBkdAbShmMfigkGgHTUoBaAhHQJiGDiVB2Oh1fZQoaAZHQHAEANPP9k1oB002AWgIR0CYj9YjjaPCdX2UKGgGR0BvyyekHlfaaAdNpQNoCEdAmJAPmLcbi3V9lChoBkdAbzWDNhVlw2gHTUABaAhHQJiUZKODJ2d1fZQoaAZHQGFbIBzV+ZxoB03oA2gIR0CYltgNgBtDdX2UKGgGR0BsXfQhOgxraAdNggFoCEdAmJbn3lCCz3V9lChoBkdAcIFi0v4/NmgHTXQBaAhHQJiXSjBVMmF1fZQoaAZHQHEKrIPsiStoB01AAWgIR0CYl7YfW+XadX2UKGgGR0Bvv+AuqWC3aAdNNgFoCEdAmJg3uuzQeHV9lChoBkdAbvju0kWykmgHTVEBaAhHQJiYoAKfFrF1fZQoaAZHQF4GNLlFMIxoB03oA2gIR0CYmPZh8YygdX2UKGgGR0BwWQCyQgcMaAdNRgFoCEdAmJk7Hhjvu3V9lChoBkdAbnz1EmY0EWgHTaMBaAhHQJictGpda+x1fZQoaAZHQHEe6JdjXnRoB00qAmgIR0CYnga+N96UdX2UKGgGR0Bxl1jawljWaAdNQAJoCEdAmJ9Uz0pVj3V9lChoBkdAcjLjtoi9qWgHTe0BaAhHQJifaDZlFtt1fZQoaAZHQF01w9q1w5xoB03oA2gIR0CYoAx0MgEEdX2UKGgGR0ByV0Ht4
RmLaAdNTQFoCEdAmKCmTC+De3V9lChoBkdAcTKQLNOdoWgHTRwBaAhHQJig+slsxfx1fZQoaAZHQHEU6lHjIaNoB005AWgIR0CYo5nOSntOdX2UKGgGR0BxfhpSJj2BaAdNPQFoCEdAmKQmBWgezXV9lChoBkdAbIqkUsWfsmgHTRsBaAhHQJikQZzgdfd1fZQoaAZHQG82BMrVe8hoB00+AWgIR0CYpJ8yvcJudX2UKGgGR0BxGO10DEFXaAdNYgFoCEdAmKTrl7tzCHV9lChoBkdAcTRFPi1iOWgHTXsBaAhHQJilx/CqIad1fZQoaAZHQG+WslLOAy5oB02MAWgIR0CYqCABT4tZdX2UKGgGR0BrjO5SWJJoaAdNNQFoCEdAmKhzcIqsl3V9lChoBkdAcmyb2Dg62mgHTScBaAhHQJi71kTYdyV1fZQoaAZHQHAv1UQ04zdoB008AWgIR0CYvAPWxyGSdX2UKGgGR0Bv/NNi6QNkaAdNKAFoCEdAmLxTYh+vyXV9lChoBkdAcFbqZ+hGpmgHTV0BaAhHQJi8113dKul1fZQoaAZHQHF4M189fTloB02bAmgIR0CYvWQuVX3hdX2UKGgGR0Bvvymbb1yvaAdNcgFoCEdAmL2TtsvZiHV9lChoBkdAcZCiExqO92gHTZUBaAhHQJi9q1jRUm51fZQoaAZHQGx4QT/Q0GhoB000AWgIR0CYwLe8f3evdX2UKGgGR0Bw8r4SHuZ1aAdNLwFoCEdAmMD3lGPPs3V9lChoBkdAa+Ho3aSLZWgHTS8BaAhHQJjBWtITXat1fZQoaAZHQHCSY065oXdoB01qAWgIR0CYwo3trsSkdX2UKGgGR0BuV4bn5i3HaAdNkgJoCEdAmMMdGmUGFHV9lChoBkdAbzX05EMLGGgHTUEBaAhHQJjGS0w8GLV1fZQoaAZHQHFqGEPDpC9oB00gAWgIR0CYya/6fra/dX2UKGgGR0BvFLLB9Cu2aAdNzQFoCEdAmMrEfPomonV9lChoBkdAcSVDYh+vyWgHTR4BaAhHQJjK8MOPNml1fZQoaAZHQHHgn6/IsAhoB002AWgIR0CYyz8pCrtFdX2UKGgGR0BtuUyP+4smaAdNFgFoCEdAmMuE70WdmXV9lChoBkdAbuKsCDEm6WgHTUIBaAhHQJjODuBtk4F1fZQoaAZHQHHiD5XU6PtoB004AWgIR0CY0XYcNpdsdX2UKGgGR0Btt/LkjopyaAdNqQFoCEdAmNHyLyc0+HV9lChoBkdAcC0Lr5ZbIWgHTZYBaAhHQJjSUrSVnmJ1fZQoaAZHQHJON12aDwpoB01KAWgIR0CY0tFJxvNvdX2UKGgGR0Bw3/y6MBIXaAdNKgFoCEdAmNMFrqMWGnV9lChoBkdAcNkxKg7HQ2gHTXMBaAhHQJjVIlE7W/d1fZQoaAZHQG+op66asp5oB006AWgIR0CY1fJwsGxEdX2UKGgGR0Bwu1yaNMoMaAdNtwFoCEdAmNYp+UhV2nV9lChoBkdAce1wN9YwI2gHTSsBaAhHQJjXatnwob51fZQoaAZHQHHebBfrrxBoB00bAWgIR0CY13UrkKeDdX2UKGgGR0Bss+3+dbxFaAdNKAFoCEdAmN1KF7D2rXV9lChoBkdAce5Yzi0fHWgHTTABaAhHQJjdXRsuWbB1fZQoaAZHQG4WtXHR1HRoB020AWgIR0CY3dsnAqNIdX2UKGgGR0ByRJ/oaDPGaAdNzAFoCEdAmN6ljy4FzXV9lChoBkdAcga+so2GZmgHTZoBaAhHQJje+6Ae7tl1fZQoaAZHQGyVfCyhSLtoB01hAWgIR0CY3yBY3eendX2UKGgGR0Bx1e9Ba9saaAdNSAFoCEdAmN8vVRUFS3V9lChoBkdAcGWCQcPvrmgHTU8BaAhHQJjfmg/Tspp1fZQoaAZHQGZ3RQJokAxoB03oA2gIR0CY38BnSOR1dX2UKGgGR0Bx1vC1qnFYaAdNMgFoCEdAm
OB5hfBvaXV9lChoBkdAcfHxSYPXkGgHTf0BaAhHQJjgjyPMjeN1fZQoaAZHQHBg71VYISloB002AWgIR0CY4pM72cridX2UKGgGR0BkV4hUzbeuaAdN6ANoCEdAmOMf5k9U0nV9lChoBkdAcEIzAvcrRWgHTXsBaAhHQJjjdUS7GvR1fZQoaAZHQHC1pEYwZfloB02FAWgIR0CY45GjsUqQdWUu"
49
  },
50
  "ep_success_buffer": {
51
  ":type:": "<class 'collections.deque'>",
52
  ":serialized:": "gAWVIAAAAAAAAACMC2NvbGxlY3Rpb25zlIwFZGVxdWWUk5QpS2SGlFKULg=="
53
  },
54
- "_n_updates": 248,
55
  "observation_space": {
56
  ":type:": "<class 'gymnasium.spaces.box.Box'>",
57
  ":serialized:": "gAWVcAIAAAAAAACMFGd5bW5hc2l1bS5zcGFjZXMuYm94lIwDQm94lJOUKYGUfZQojAVkdHlwZZSMBW51bXB5lGgFk5SMAmY0lImIh5RSlChLA4wBPJROTk5K/////0r/////SwB0lGKMDWJvdW5kZWRfYmVsb3eUjBJudW1weS5jb3JlLm51bWVyaWOUjAtfZnJvbWJ1ZmZlcpSTlCiWCAAAAAAAAAABAQEBAQEBAZRoB4wCYjGUiYiHlFKUKEsDjAF8lE5OTkr/////Sv////9LAHSUYksIhZSMAUOUdJRSlIwNYm91bmRlZF9hYm92ZZRoECiWCAAAAAAAAAABAQEBAQEBAZRoFEsIhZRoGHSUUpSMBl9zaGFwZZRLCIWUjANsb3eUaBAoliAAAAAAAAAAAAC0wgAAtMIAAKDAAACgwNsPScAAAKDAAAAAgAAAAICUaApLCIWUaBh0lFKUjARoaWdolGgQKJYgAAAAAAAAAAAAtEIAALRCAACgQAAAoEDbD0lAAACgQAAAgD8AAIA/lGgKSwiFlGgYdJRSlIwIbG93X3JlcHKUjFtbLTkwLiAgICAgICAgLTkwLiAgICAgICAgIC01LiAgICAgICAgIC01LiAgICAgICAgIC0zLjE0MTU5MjcgIC01LgogIC0wLiAgICAgICAgIC0wLiAgICAgICBdlIwJaGlnaF9yZXBylIxTWzkwLiAgICAgICAgOTAuICAgICAgICAgNS4gICAgICAgICA1LiAgICAgICAgIDMuMTQxNTkyNyAgNS4KICAxLiAgICAgICAgIDEuICAgICAgIF2UjApfbnBfcmFuZG9tlE51Yi4=",
@@ -77,14 +77,14 @@
77
  "_np_random": null
78
  },
79
  "n_envs": 16,
80
- "n_steps": 1024,
81
  "gamma": 0.999,
82
  "gae_lambda": 0.98,
83
  "ent_coef": 0.01,
84
  "vf_coef": 0.5,
85
  "max_grad_norm": 0.5,
86
  "batch_size": 64,
87
- "n_epochs": 4,
88
  "clip_range": {
89
  ":type:": "<class 'function'>",
90
  ":serialized:": "gAWVxQIAAAAAAACMF2Nsb3VkcGlja2xlLmNsb3VkcGlja2xllIwOX21ha2VfZnVuY3Rpb26Uk5QoaACMDV9idWlsdGluX3R5cGWUk5SMCENvZGVUeXBllIWUUpQoSwFLAEsASwFLAUsTQwSIAFMAlE6FlCmMAV+UhZSMSS91c3IvbG9jYWwvbGliL3B5dGhvbjMuMTAvZGlzdC1wYWNrYWdlcy9zdGFibGVfYmFzZWxpbmVzMy9jb21tb24vdXRpbHMucHmUjARmdW5jlEuEQwIEAZSMA3ZhbJSFlCl0lFKUfZQojAtfX3BhY2thZ2VfX5SMGHN0YWJsZV9iYXNlbGluZXMzLmNvbW1vbpSMCF9fbmFtZV9flIwec3RhYmxlX2Jhc2VsaW5lczMuY29tbW9uLnV0aWxzlIwIX19maWxlX1+UjEkvdXNyL2xvY2FsL2xpYi9weXRob24zLjEwL2Rpc3QtcGFja2FnZXMvc3RhYmxlX2Jhc2VsaW5lczMvY29tbW9uL3V0aWxzLnB5lHVOTmgAjBBfbWFrZV9lbXB0eV9jZWxslJOUKVKUhZR0lFKUjBxjbG91ZHBpY2tsZS5jbG91ZHBpY2tsZV9mYXN0lIwSX2Z1bmN0aW9uX3NldHN0YXRllJOUaB99lH2UKGgWaA2MDF9fcXVhbG5hbWVfX5SMGWNvbnN0YW50X2ZuLjxsb2NhbHM+LmZ1bmOUjA9fX2Fubm90YXRpb25zX1+UfZSMDl9fa3dkZWZhdWx0c19flE6MDF9fZGVmYXVsdHNfX5ROjApfX21vZHVsZV9flGgXjAdfX2RvY19flE6MC19fY2xvc3VyZV9flGgAjApfbWFrZV9jZWxslJOURz/JmZmZmZmahZRSlIWUjBdfY2xvdWRwaWNrbGVfc3VibW9kdWxlc5RdlIwLX19nbG9iYWxzX1+UfZR1hpSGUjAu"
 
4
  ":serialized:": "gAWVOwAAAAAAAACMIXN0YWJsZV9iYXNlbGluZXMzLmNvbW1vbi5wb2xpY2llc5SMEUFjdG9yQ3JpdGljUG9saWN5lJOULg==",
5
  "__module__": "stable_baselines3.common.policies",
6
  "__doc__": "\n Policy class for actor-critic algorithms (has both policy and value prediction).\n Used by A2C, PPO and the likes.\n\n :param observation_space: Observation space\n :param action_space: Action space\n :param lr_schedule: Learning rate schedule (could be constant)\n :param net_arch: The specification of the policy and value networks.\n :param activation_fn: Activation function\n :param ortho_init: Whether to use or not orthogonal initialization\n :param use_sde: Whether to use State Dependent Exploration or not\n :param log_std_init: Initial value for the log standard deviation\n :param full_std: Whether to use (n_features x n_actions) parameters\n for the std instead of only (n_features,) when using gSDE\n :param use_expln: Use ``expln()`` function instead of ``exp()`` to ensure\n a positive standard deviation (cf paper). It allows to keep variance\n above zero and prevent it from growing too fast. In practice, ``exp()`` is usually enough.\n :param squash_output: Whether to squash the output using a tanh function,\n this allows to ensure boundaries when using gSDE.\n :param features_extractor_class: Features extractor to use.\n :param features_extractor_kwargs: Keyword arguments\n to pass to the features extractor.\n :param share_features_extractor: If True, the features extractor is shared between the policy and value networks.\n :param normalize_images: Whether to normalize images or not,\n dividing by 255.0 (True by default)\n :param optimizer_class: The optimizer to use,\n ``th.optim.Adam`` by default\n :param optimizer_kwargs: Additional keyword arguments,\n excluding the learning rate, to pass to the optimizer\n ",
7
+ "__init__": "<function ActorCriticPolicy.__init__ at 0x7e2a0f6172e0>",
8
+ "_get_constructor_parameters": "<function ActorCriticPolicy._get_constructor_parameters at 0x7e2a0f617370>",
9
+ "reset_noise": "<function ActorCriticPolicy.reset_noise at 0x7e2a0f617400>",
10
+ "_build_mlp_extractor": "<function ActorCriticPolicy._build_mlp_extractor at 0x7e2a0f617490>",
11
+ "_build": "<function ActorCriticPolicy._build at 0x7e2a0f617520>",
12
+ "forward": "<function ActorCriticPolicy.forward at 0x7e2a0f6175b0>",
13
+ "extract_features": "<function ActorCriticPolicy.extract_features at 0x7e2a0f617640>",
14
+ "_get_action_dist_from_latent": "<function ActorCriticPolicy._get_action_dist_from_latent at 0x7e2a0f6176d0>",
15
+ "_predict": "<function ActorCriticPolicy._predict at 0x7e2a0f617760>",
16
+ "evaluate_actions": "<function ActorCriticPolicy.evaluate_actions at 0x7e2a0f6177f0>",
17
+ "get_distribution": "<function ActorCriticPolicy.get_distribution at 0x7e2a0f617880>",
18
+ "predict_values": "<function ActorCriticPolicy.predict_values at 0x7e2a0f617910>",
19
  "__abstractmethods__": "frozenset()",
20
+ "_abc_impl": "<_abc._abc_data object at 0x7e2a0f5c7700>"
21
  },
22
  "verbose": 1,
23
  "policy_kwargs": {},
24
+ "num_timesteps": 1507328,
25
+ "_total_timesteps": 1500000,
26
  "_num_timesteps_at_start": 0,
27
  "seed": null,
28
  "action_noise": null,
29
+ "start_time": 1695522685106348523,
30
  "learning_rate": 0.0003,
31
  "tensorboard_log": null,
32
  "_last_obs": {
33
  ":type:": "<class 'numpy.ndarray'>",
34
+ ":serialized:": "gAWVdQIAAAAAAACMEm51bXB5LmNvcmUubnVtZXJpY5SMC19mcm9tYnVmZmVylJOUKJYAAgAAAAAAALOj0b2GplY/kRA4vjH/KL8Frha+da8IvQAAAAAAAAAAmh/evAqRLru6aQY8lreQPLAcTLzFank9AACAPwAAgD9APC2+TuaFP5kCBr/kdTK/IVmFviYlk74AAAAAAAAAADO4Gb4iaoY+LpmBPowNiL7lyNS8brL6PQAAAAAAAAAAppB5vuq8Wj+jRgS+h9A/v63ehr7i3pU9AAAAAAAAAACAtBG9pK8cuzBS/TmhU408p5f7u7NTdD0AAIA/AACAPxqXBr32sDG6aMSUthp+gbE/UQu7mFq0NQAAgD8AAIA/Zu3TvBRQurpaUB05VUoONDKLYzm+TDO4AACAPwAAgD/wHme+2Qn3PoaAzT3pHBC/97svvlKrHz4AAAAAAAAAAIAWaL0KynC71YlkPHtGjDwYp7g8taZwvQAAgD8AAIA/JpDevdULFj73arA+gLJovozU4j3O9aw8AAAAAAAAAAAzKW68byPEPsPEoL1KpPu+T6ZqPJI3E74AAAAAAAAAADN6jb3a4KU/8A6nvqc4Ar/2dN+9kYy8vQAAAAAAAAAAzZ6cvK5HjbjrtYY5STOrNHhd0TtKdaS4AACAPwAAgD+zGhO9eTSZPlEpoT05EdK+TSM6PfNj0joAAAAAAAAAADNbODwuo689Jlf+veTem77EQ528/kKmvQAAAAAAAAAAlIwFbnVtcHmUjAVkdHlwZZSTlIwCZjSUiYiHlFKUKEsDjAE8lE5OTkr/////Sv////9LAHSUYksQSwiGlIwBQ5R0lFKULg=="
35
  },
36
  "_last_episode_starts": {
37
  ":type:": "<class 'numpy.ndarray'>",
 
41
  "_episode_num": 0,
42
  "use_sde": false,
43
  "sde_sample_freq": -1,
44
+ "_current_progress_remaining": -0.004885333333333408,
45
  "_stats_window_size": 100,
46
  "ep_info_buffer": {
47
  ":type:": "<class 'collections.deque'>",
48
+ ":serialized:": "gAWV5wsAAAAAAACMC2NvbGxlY3Rpb25zlIwFZGVxdWWUk5QpS2SGlFKUKH2UKIwBcpRHQHIVpXuE25yMAWyUS7qMAXSUR0ClplLFXJYDdX2UKGgGR0BzUdv863iJaAdL8WgIR0ClppwLNOdodX2UKGgGR0BxQsxQBPsSaAdL7WgIR0ClpqIBq9GrdX2UKGgGR0ByerLDAJswaAdLzWgIR0ClprFlbu+idX2UKGgGR0BuA1mrbQC0aAdL0mgIR0Clpr/xDst1dX2UKGgGR0BxjdpnHvMKaAdLz2gIR0Clp1U7KaG6dX2UKGgGR0Bw6Og7HQyAaAdL42gIR0Clp1qm8/UwdX2UKGgGR0BymnPiT+vRaAdL1WgIR0Clp23vx6OYdX2UKGgGR0BxlJyhi9ZiaAdL2mgIR0Clp/sx46fbdX2UKGgGR0BNO/bCaZx8aAdLnWgIR0ClqDEc0cfedX2UKGgGR0BzG4w+MZP3aAdL1WgIR0ClqK3PzFuOdX2UKGgGR0BtZ8Nc4YJmaAdLymgIR0ClqT7kGRmsdX2UKGgGR0BxCgeKbaysaAdL0mgIR0ClqabbUPQOdX2UKGgGR0Bx0ELkS26TaAdLuWgIR0ClqbeBYmsvdX2UKGgGR0BvxLRhMJyAaAdLzGgIR0ClqfMvIwM6dX2UKGgGR0BzH3giu+yraAdL5GgIR0ClqmSUC7sfdX2UKGgGR0BwlbkT6BRRaAdL2WgIR0Clqt8FhXr/dX2UKGgGR0B0KDHbRF7VaAdL/mgIR0ClqznUtqYadX2UKGgGR0ByvJFvybx3aAdL+GgIR0Clq2wuVX3hdX2UKGgGR0BwBZ40Mw10aAdL0mgIR0Clq4W6bvw3dX2UKGgGR0BynfbDdgv2aAdL+mgIR0Clq547zTWodX2UKGgGR0BQtFLBbfP5aAdLuWgIR0Clq6pYDDCQdX2UKGgGR0BxkvwKBun/aAdL5mgIR0Clq9748EFGdX2UKGgGR0B0bJdPci4baAdL8mgIR0Clq/bALy+YdX2UKGgGR0ByuhMAWBSUaAdL02gIR0ClrBbMPjGUdX2UKGgGR0BzvJ04iosJaAdNKgFoCEdApawdHvttynV9lChoBkdAcGX5dWyTp2gHS71oCEdApax1yimEXnV9lChoBkdAcfm8n/kvK2gHS+JoCEdApayMwi7kGXV9lChoBkdAcKL+pOvdM2gHS+NoCEdApa041LrX2HV9lChoBkdAcfXr6tT1kGgHS/BoCEdApa2Lp5eJHnV9lChoBkdAcwZwyIpH7WgHTQEBaAhHQKWtkJLM9r51fZQoaAZHQHOljWsijcpoB0vKaAhHQKWtonv2GqR1fZQoaAZHQHKT2ZZ0SytoB0vraAhHQKWtwTyrgfl1fZQoaAZHQG35T/hl18toB0u7aAhHQKWt66FuejF1fZQoaAZHQHObO63AmAtoB0vTaAhHQKWuIM+/xlR1fZQoaAZHQHFCBdpqREFoB0vpaAhHQKWuN+AmReV1fZQoaAZHQHDdk5yU9p1oB0vkaAhHQKWuSdCE6DJ1fZQoaAZHQHMt4OUdJatoB0vBaAhHQKWueKCQLeB1fZQoaAZHQHGf6pgkTpRoB0vtaAhHQKWuf2YfGMp1fZQoaAZHQHM0hd+ocaRoB0vdaAhHQKWuovBacI91fZQoaAZHQHAzTYI0IkZoB0vRaAhHQKWuoOmR/3F1fZQoaAZHQHPDilenhsJoB0vqaAhHQKWur8D0UXZ1fZQoaAZHQHKOwnc+JP9oB0vPaAhHQKWvCYw7DEZ1fZQoaAZHQHEifLX+VC5oB0vGaAhHQKWvl86V+ql1fZQoaAZHQHK9+VHFxXJoB00XAWgIR0Clr9RI8QqadX2UKGgGR0BwF9nh86V/aAdLv2gIR0Clr+e1a4c4dX2UKGgGR0BwJ4/OdGy5aAdLzGgIR0Clr/3k5p8GdX2UKGgGR0ByPHsHB1s+aAdLr2gIR0Cls
AAjps42dX2UKGgGR0Bx8BIVdonKaAdL5WgIR0ClsEJqASWadX2UKGgGR0BxpbY/Vy3kaAdLqmgIR0ClsEVrylN2dX2UKGgGR0ByXkP+XJHRaAdL2WgIR0ClsFThYNiIdX2UKGgGR0BuUuKZUkv9aAdL2GgIR0ClsKkR8MNMdX2UKGgGR0By3tHc1wYMaAdLxmgIR0ClsNCih37ldX2UKGgGR0Bx5AwSJ0nxaAdL42gIR0ClsOKv3ai9dX2UKGgGR0Bx8wQ/X5FgaAdLy2gIR0ClsQVEuxr0dX2UKGgGR0Bwg8spXp4baAdL5WgIR0ClsSlqrR0EdX2UKGgGR0BzCLoxHoX9aAdL22gIR0ClsTbr9l3AdX2UKGgGR0BxkTSpiqhlaAdL22gIR0ClsaWNedCmdX2UKGgGR0ByjLRrrPdEaAdNAwFoCEdApbHBaC+UQnV9lChoBkdAcfbl+Vkc0mgHS+FoCEdApbJEBXCCSXV9lChoBkdAcZJaLn9vTGgHS8xoCEdApbJrNdJJ5HV9lChoBkdAcLcMjNY8uGgHS8toCEdApbJqpcX3xnV9lChoBkdAcomdDIBBA2gHS9hoCEdApbJ6fzz3AXV9lChoBkdAckGJvo/zKGgHS8VoCEdApbKfGp++d3V9lChoBkdAcej4/u9eyGgHS6xoCEdApbMhU1hsqXV9lChoBkdAc6qbMHKOk2gHS/RoCEdApbM/NHH3lHV9lChoBkdAcsuQ3xWkrWgHS8FoCEdApbNEgOjIrHV9lChoBkdAcsjsqrilzmgHS9loCEdApbNWi5/b03V9lChoBkdAcwlVxjriVGgHTQABaAhHQKWzdYGMXJp1fZQoaAZHQHD1YoE0SAZoB0vWaAhHQKWz16sySFJ1fZQoaAZHQHFiLHuJDVpoB01KAWgIR0Cls+DhUBGQdX2UKGgGR0Bya6j/MnqnaAdLsmgIR0Cls+mqHXVcdX2UKGgGR0BxD1xeb/fgaAdL2mgIR0Cls/Q4sEq2dX2UKGgGR0BxSCQEIPbxaAdLp2gIR0CltJB/qgRLdX2UKGgGR0BzgUqVhTfjaAdL52gIR0CltLQnhKlIdX2UKGgGR0ByYbpfQa73aAdLwmgIR0CltTMVclgMdX2UKGgGR0BzX0LSeAd5aAdLzmgIR0CltTR6fJ3gdX2UKGgGR0BwAW7OE/SqaAdL7WgIR0CltWrRrrPddX2UKGgGR0BxriM3qAz6aAdNbgFoCEdApbWGF10T13V9lChoBkdAdEuIBzV+Z2gHS+5oCEdApbWU/Y8MeHV9lChoBkdAcxyEZR8+imgHS7xoCEdApbWnw7T2FnV9lChoBkdAb29TRYzSC2gHS7toCEdApbW+kUKzA3V9lChoBkdAcvaziCJ40WgHS8JoCEdApbXW5jH4oXV9lChoBkdAcgYn889wFWgHS81oCEdApbYfZTQ3P3V9lChoBkfANJ98E3bVSWgHS1poCEdApbZMaVD8cnV9lChoBkdAcSSCrLhaT2gHS8NoCEdApbZ3KQq7RXV9lChoBkdAc9XeeWfK6mgHS85oCEdApbaFdRiw0XV9lChoBkdAcdig2Ifr8mgHS/hoCEdApbaIHAymAXV9lChoBkdAcPh8r7O3UmgHS9poCEdApbataUzKtHV9lChoBkdAco9zXBguy2gHS+poCEdApbbMd7v5QHV9lChoBkdAcOC37UG3WmgHS8toCEdApbcxNXYDknV9lChoBkdAcOpR6nivPmgHS99oCEdApbdRwZOzp3V9lChoBkdAcc5UlAu7H2gHS81oCEdApbehIWgvlHV9lChoBkdAcG59ph4MW2gHS7loCEdApbe2Zb6gunV9lChoBkdAbjZebd8ArGgHS8BoCEdApbe+YMOPNnV9lChoBkdAcIyWpqASWmgHS7poCEdApbfkfs/puHV9lChoBkdAc+AKAJ9iMGgHS7loCEdApbf6MJhOQHV9lChoBkdAc5J13t8eCGgHS/hoC
EdApbhO2LHdXXV9lChoBkdAbSMTsY2sJmgHS8loCEdApbh4geRxLnV9lChoBkdAcnURcNYr8WgHS/hoCEdApbiKfg75mHVlLg=="
49
  },
50
  "ep_success_buffer": {
51
  ":type:": "<class 'collections.deque'>",
52
  ":serialized:": "gAWVIAAAAAAAAACMC2NvbGxlY3Rpb25zlIwFZGVxdWWUk5QpS2SGlFKULg=="
53
  },
54
+ "_n_updates": 690,
55
  "observation_space": {
56
  ":type:": "<class 'gymnasium.spaces.box.Box'>",
57
  ":serialized:": "gAWVcAIAAAAAAACMFGd5bW5hc2l1bS5zcGFjZXMuYm94lIwDQm94lJOUKYGUfZQojAVkdHlwZZSMBW51bXB5lGgFk5SMAmY0lImIh5RSlChLA4wBPJROTk5K/////0r/////SwB0lGKMDWJvdW5kZWRfYmVsb3eUjBJudW1weS5jb3JlLm51bWVyaWOUjAtfZnJvbWJ1ZmZlcpSTlCiWCAAAAAAAAAABAQEBAQEBAZRoB4wCYjGUiYiHlFKUKEsDjAF8lE5OTkr/////Sv////9LAHSUYksIhZSMAUOUdJRSlIwNYm91bmRlZF9hYm92ZZRoECiWCAAAAAAAAAABAQEBAQEBAZRoFEsIhZRoGHSUUpSMBl9zaGFwZZRLCIWUjANsb3eUaBAoliAAAAAAAAAAAAC0wgAAtMIAAKDAAACgwNsPScAAAKDAAAAAgAAAAICUaApLCIWUaBh0lFKUjARoaWdolGgQKJYgAAAAAAAAAAAAtEIAALRCAACgQAAAoEDbD0lAAACgQAAAgD8AAIA/lGgKSwiFlGgYdJRSlIwIbG93X3JlcHKUjFtbLTkwLiAgICAgICAgLTkwLiAgICAgICAgIC01LiAgICAgICAgIC01LiAgICAgICAgIC0zLjE0MTU5MjcgIC01LgogIC0wLiAgICAgICAgIC0wLiAgICAgICBdlIwJaGlnaF9yZXBylIxTWzkwLiAgICAgICAgOTAuICAgICAgICAgNS4gICAgICAgICA1LiAgICAgICAgIDMuMTQxNTkyNyAgNS4KICAxLiAgICAgICAgIDEuICAgICAgIF2UjApfbnBfcmFuZG9tlE51Yi4=",
 
77
  "_np_random": null
78
  },
79
  "n_envs": 16,
80
+ "n_steps": 2048,
81
  "gamma": 0.999,
82
  "gae_lambda": 0.98,
83
  "ent_coef": 0.01,
84
  "vf_coef": 0.5,
85
  "max_grad_norm": 0.5,
86
  "batch_size": 64,
87
+ "n_epochs": 15,
88
  "clip_range": {
89
  ":type:": "<class 'function'>",
90
  ":serialized:": "gAWVxQIAAAAAAACMF2Nsb3VkcGlja2xlLmNsb3VkcGlja2xllIwOX21ha2VfZnVuY3Rpb26Uk5QoaACMDV9idWlsdGluX3R5cGWUk5SMCENvZGVUeXBllIWUUpQoSwFLAEsASwFLAUsTQwSIAFMAlE6FlCmMAV+UhZSMSS91c3IvbG9jYWwvbGliL3B5dGhvbjMuMTAvZGlzdC1wYWNrYWdlcy9zdGFibGVfYmFzZWxpbmVzMy9jb21tb24vdXRpbHMucHmUjARmdW5jlEuEQwIEAZSMA3ZhbJSFlCl0lFKUfZQojAtfX3BhY2thZ2VfX5SMGHN0YWJsZV9iYXNlbGluZXMzLmNvbW1vbpSMCF9fbmFtZV9flIwec3RhYmxlX2Jhc2VsaW5lczMuY29tbW9uLnV0aWxzlIwIX19maWxlX1+UjEkvdXNyL2xvY2FsL2xpYi9weXRob24zLjEwL2Rpc3QtcGFja2FnZXMvc3RhYmxlX2Jhc2VsaW5lczMvY29tbW9uL3V0aWxzLnB5lHVOTmgAjBBfbWFrZV9lbXB0eV9jZWxslJOUKVKUhZR0lFKUjBxjbG91ZHBpY2tsZS5jbG91ZHBpY2tsZV9mYXN0lIwSX2Z1bmN0aW9uX3NldHN0YXRllJOUaB99lH2UKGgWaA2MDF9fcXVhbG5hbWVfX5SMGWNvbnN0YW50X2ZuLjxsb2NhbHM+LmZ1bmOUjA9fX2Fubm90YXRpb25zX1+UfZSMDl9fa3dkZWZhdWx0c19flE6MDF9fZGVmYXVsdHNfX5ROjApfX21vZHVsZV9flGgXjAdfX2RvY19flE6MC19fY2xvc3VyZV9flGgAjApfbWFrZV9jZWxslJOURz/JmZmZmZmahZRSlIWUjBdfY2xvdWRwaWNrbGVfc3VibW9kdWxlc5RdlIwLX19nbG9iYWxzX1+UfZR1hpSGUjAu"
ppo-LunarLander-v2/policy.optimizer.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:62ada79905e2f0f39a8eefd46b1087fb739a359a31f73081b0c8e1c37162e903
3
  size 87929
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:edb271825e397c34cd388228d3093c9f49748190ffd41d2afdcf5f2f566160bd
3
  size 87929
ppo-LunarLander-v2/policy.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:1ae9ad6263880d6a6022e676ed0172f1ccfc6f083098022b4c30b6d3e75f88a3
3
  size 43329
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b6c63add49864a90407bba472d2e21b9c0f0b4ed4dfff72275b3380e40cf1d8b
3
  size 43329
replay.mp4 CHANGED
Binary files a/replay.mp4 and b/replay.mp4 differ
 
results.json CHANGED
@@ -1 +1 @@
1
- {"mean_reward": 268.0932125, "std_reward": 20.940760244451525, "is_deterministic": true, "n_eval_episodes": 10, "eval_datetime": "2023-09-23T22:56:22.106896"}
 
1
+ {"mean_reward": 277.8567491, "std_reward": 11.58854152151543, "is_deterministic": true, "n_eval_episodes": 10, "eval_datetime": "2023-09-24T03:38:23.345135"}