felixdae commited on
Commit
cb53509
·
1 Parent(s): ac8ad72

Upload PPO LunarLander-v2 trained agent

Browse files
README.md CHANGED
@@ -16,7 +16,7 @@ model-index:
16
  type: LunarLander-v2
17
  metrics:
18
  - type: mean_reward
19
- value: 277.81 +/- 16.22
20
  name: mean_reward
21
  verified: false
22
  ---
 
16
  type: LunarLander-v2
17
  metrics:
18
  - type: mean_reward
19
+ value: 283.35 +/- 20.40
20
  name: mean_reward
21
  verified: false
22
  ---
config.json CHANGED
@@ -1 +1 @@
1
- {"policy_class": {":type:": "<class 'abc.ABCMeta'>", ":serialized:": "gAWVOwAAAAAAAACMIXN0YWJsZV9iYXNlbGluZXMzLmNvbW1vbi5wb2xpY2llc5SMEUFjdG9yQ3JpdGljUG9saWN5lJOULg==", "__module__": "stable_baselines3.common.policies", "__doc__": "\n Policy class for actor-critic algorithms (has both policy and value prediction).\n Used by A2C, PPO and the likes.\n\n :param observation_space: Observation space\n :param action_space: Action space\n :param lr_schedule: Learning rate schedule (could be constant)\n :param net_arch: The specification of the policy and value networks.\n :param activation_fn: Activation function\n :param ortho_init: Whether to use or not orthogonal initialization\n :param use_sde: Whether to use State Dependent Exploration or not\n :param log_std_init: Initial value for the log standard deviation\n :param full_std: Whether to use (n_features x n_actions) parameters\n for the std instead of only (n_features,) when using gSDE\n :param use_expln: Use ``expln()`` function instead of ``exp()`` to ensure\n a positive standard deviation (cf paper). It allows to keep variance\n above zero and prevent it from growing too fast. In practice, ``exp()`` is usually enough.\n :param squash_output: Whether to squash the output using a tanh function,\n this allows to ensure boundaries when using gSDE.\n :param features_extractor_class: Features extractor to use.\n :param features_extractor_kwargs: Keyword arguments\n to pass to the features extractor.\n :param share_features_extractor: If True, the features extractor is shared between the policy and value networks.\n :param normalize_images: Whether to normalize images or not,\n dividing by 255.0 (True by default)\n :param optimizer_class: The optimizer to use,\n ``th.optim.Adam`` by default\n :param optimizer_kwargs: Additional keyword arguments,\n excluding the learning rate, to pass to the optimizer\n ", "__init__": "<function ActorCriticPolicy.__init__ at 0x7f6382212cb0>", "_get_constructor_parameters": "<function ActorCriticPolicy._get_constructor_parameters at 0x7f6382212d40>", "reset_noise": "<function ActorCriticPolicy.reset_noise at 0x7f6382212dd0>", "_build_mlp_extractor": "<function ActorCriticPolicy._build_mlp_extractor at 0x7f6382212e60>", "_build": "<function ActorCriticPolicy._build at 0x7f6382212ef0>", "forward": "<function ActorCriticPolicy.forward at 0x7f6382212f80>", "extract_features": "<function ActorCriticPolicy.extract_features at 0x7f6382213010>", "_get_action_dist_from_latent": "<function ActorCriticPolicy._get_action_dist_from_latent at 0x7f63822130a0>", "_predict": "<function ActorCriticPolicy._predict at 0x7f6382213130>", "evaluate_actions": "<function ActorCriticPolicy.evaluate_actions at 0x7f63822131c0>", "get_distribution": "<function ActorCriticPolicy.get_distribution at 0x7f6382213250>", "predict_values": "<function ActorCriticPolicy.predict_values at 0x7f63822132e0>", "__abstractmethods__": "frozenset()", "_abc_impl": "<_abc._abc_data object at 0x7f6382215a00>"}, "verbose": 1, "policy_kwargs": {}, "num_timesteps": 1507328, "_total_timesteps": 1500000, "_num_timesteps_at_start": 0, "seed": null, "action_noise": null, "start_time": 1685758402973880763, "learning_rate": 0.0003, "tensorboard_log": null, "_last_obs": {":type:": "<class 'numpy.ndarray'>", ":serialized:": "gAWVdQIAAAAAAACMEm51bXB5LmNvcmUubnVtZXJpY5SMC19mcm9tYnVmZmVylJOUKJYAAgAAAAAAAACbTT7NgC0+B827vb3ufr4N3AQ+I0rBvAAAAAAAAAAAprJvPnYl+D7EHT08xD67vl2yKj4DUTI8AAAAAAAAAAA9orE+kfQTP6HpJL7+YNG+KoKTPkUB5b0AAAAAAAAAAG3gPb7kIJk/UL0Dv26f5r7Hk5G+9uCRvgAAAAAAAAAA7TUevgwDSz5qIrY+PwW0vtLObj3T0OY9AAAAAAAAAACmM9A9MbiuPzwkAz8T4LG+DbqCPUXAEz4AAAAAAAAAAM3CRbymXLU/3iHMvs+dfj2uYj48EC0+PQAAAAAAAAAAAGEJPX4Trj72q9I8TiqrvlcNlzpeE1E8AAAAAAAAAABVC5u+n2iiPz1XBb+M2Pu+CGPuvkXDt70AAAAAAAAAAM2sCbvfeLQ/LudZvpCuMr04+R875m5FPQAAAAAAAAAAABC0Oygz0j1xF8K81EldvuGQJz2n7DG8AAAAAAAAAADNdcY8KVypP4Kfpz6VUBa/oZs5PND27j0AAAAAAAAAACbKyD3EAZM+527MveYnkb5XMQc80H3iuwAAAAAAAAAAmkaSPcYhdD+q+wE+jCMJv6BhhzryPAO9AAAAAAAAAACNAUu+ZU6KPiuNgT53ye2+jGGjPHCe6D0AAAAAAAAAAGZOjL1SGOa5jnxgNSKEii4m6oC7kleVtAAAgD8AAIA/lIwFbnVtcHmUjAVkdHlwZZSTlIwCZjSUiYiHlFKUKEsDjAE8lE5OTkr/////Sv////9LAHSUYksQSwiGlIwBQ5R0lFKULg=="}, "_last_episode_starts": {":type:": "<class 'numpy.ndarray'>", ":serialized:": "gAWVgwAAAAAAAACMEm51bXB5LmNvcmUubnVtZXJpY5SMC19mcm9tYnVmZmVylJOUKJYQAAAAAAAAAAAAAAAAAAAAAAEAAAAAAACUjAVudW1weZSMBWR0eXBllJOUjAJiMZSJiIeUUpQoSwOMAXyUTk5OSv////9K/////0sAdJRiSxCFlIwBQ5R0lFKULg=="}, "_last_original_obs": null, "_episode_num": 0, "use_sde": false, "sde_sample_freq": -1, "_current_progress_remaining": -0.004885333333333408, "_stats_window_size": 100, "ep_info_buffer": {":type:": "<class 'collections.deque'>", ":serialized:": "gAWVAAwAAAAAAACMC2NvbGxlY3Rpb25zlIwFZGVxdWWUk5QpS2SGlFKUKH2UKIwBcpRHQHK7dsenyd6MAWyUTS4BjAF0lEdAmvJg79ycTnV9lChoBkdAcAhi++M6zWgHS/hoCEdAmvMWn889wHV9lChoBkdAcN7EOiFj/mgHS/RoCEdAmvOXhOxja3V9lChoBkdAcXi+OwPiDWgHTSABaAhHQJr0CnGbTc91fZQoaAZHQHCEtUsFt9BoB0v5aAhHQJr0pqesgdR1fZQoaAZHQHANUxyn1nNoB0vHaAhHQJr0jJSzgMt1fZQoaAZHQHBLNv0h/y5oB0viaAhHQJr1fLFGXol1fZQoaAZHQHH7nwob4rVoB0vmaAhHQJr1oDLbHp91fZQoaAZHQHIYCW3Sa3JoB0v7aAhHQJr1iS4e9zx1fZQoaAZHQHCpUFnqVyFoB0vtaAhHQJr1t4Uvf0p1fZQoaAZHQHI/Iqbz9TBoB0vfaAhHQJr2vLr5ZbJ1fZQoaAZHQHMAxuCPIXFoB00LAWgIR0Ca9vPWQOnVdX2UKGgGR0Bxed+DvmYCaAdNCQFoCEdAmvcxB/qgRXV9lChoBkdAcRJyVfNRnGgHS+5oCEdAmvfc9jgAInV9lChoBkdAcOwrrPdEcGgHTQcBaAhHQJr4QUXYUWV1fZQoaAZHQHCyFz2exwBoB0vyaAhHQJr5KA6Mir11fZQoaAZHQHFtsNQTEitoB00UAWgIR0Ca+Turp7kXdX2UKGgGR0BwutPqLS/kaAdNFgFoCEdAmvkz101ZT3V9lChoBkdAcNF9XLeQ+2gHS95oCEdAmvmOfNA1N3V9lChoBkdAcmcYNAkcCGgHS/JoCEdAmvmlhkRSP3V9lChoBkdAcS40Sh8IA2gHS+toCEdAmvpOXNTtLXV9lChoBkdAcWTy4FzMimgHS9NoCEdAmvrfdyksSXV9lChoBkdAcAUp2ll9SmgHTRYBaAhHQJr7d+AmReV1fZQoaAZHQHOr8DwH7gtoB0v7aAhHQJr7oO+ZgG91fZQoaAZHQHNteyu6mO5oB00AAWgIR0Ca++lWwNb1dX2UKGgGR0BxKsMc6vJSaAdL0WgIR0Ca++/2TPjXdX2UKGgGR0Bu8IbCJoCdaAdNKQFoCEdAmvzW34Kx93V9lChoBkdAcIcaA4GUwGgHS/1oCEdAmv08hs67unV9lChoBkdAcYiVyWAwwmgHS/NoCEdAmv088YAKfHV9lChoBkdAbsWmZVn27GgHS+loCEdAmv4AOe8PF3V9lChoBkdAcIZivgWJrWgHS/5oCEdAmxBHEQ5FPXV9lChoBkdAUSG+N96Tn2gHS7RoCEdAmxE3YxtYS3V9lChoBkdAced5gPVd5mgHS/VoCEdAmxHj37DVIHV9lChoBkdAcVueWv8qF2gHS/doCEdAmxH9wNsnA3V9lChoBkdAbygYsunMuGgHTQQBaAhHQJsSXp+tr9F1fZQoaAZHQG4Jr7oB7u5oB0v3aAhHQJsSk3m3fAN1fZQoaAZHQHEcy2QXAM5oB00EAWgIR0CbEySuQp4KdX2UKGgGR0Bzk7kaMrEtaAdL+WgIR0CbFYeQuEmIdX2UKGgGR0BvG3sRg7YDaAdL62gIR0CbFcVnmJWOdX2UKGgGR0BzhAomXw9aaAdNKwFoCEdAmxan+6y0KXV9lChoBkdAcgQpI+W4VmgHTRUBaAhHQJsW+UJOWSl1fZQoaAZHQG995oPCl8BoB00dAWgIR0CbF6jwhGH6dX2UKGgGR0Bw7VvkzXSSaAdL6mgIR0CbF8v2GqPwdX2UKGgGR0BxbujL0SRKaAdL+WgIR0CbGF4SYgJUdX2UKGgGR0BzKeG5+YtyaAdNCAFoCEdAmxhelsP8RHV9lChoBkdAcmJ6LOzIFWgHS/VoCEdAmxlvH5rP+nV9lChoBkdAchd8pkPMCGgHS/RoCEdAmxpMNlRP43V9lChoBkdAcSQ/o7muDGgHS+VoCEdAmxp1aGHpKXV9lChoBkdAbeHTlT3qRmgHS9xoCEdAmxp+GoJiRXV9lChoBkdAcBXqzJIUamgHS9VoCEdAmxpqekHlfnV9lChoBkdAcTqZxaPjn2gHS+1oCEdAmxqRnjABUHV9lChoBkdAcYdSjxkNF2gHS+loCEdAmxs8oQWepXV9lChoBkdAc2etI065oWgHTTsBaAhHQJsbXYUWVNZ1fZQoaAZHQG8NMijcmBxoB0vYaAhHQJscaws5GSZ1fZQoaAZHQG9Avn8sMApoB00BAWgIR0CbHVyOaOPvdX2UKGgGR0BzFKDOC5EuaAdLzGgIR0CbHWlkpZwGdX2UKGgGR0BxSiWdEsreaAdL/WgIR0CbHeTb349HdX2UKGgGR0By7pdu5z5oaAdNCwFoCEdAmx59IkJKJ3V9lChoBkdAc3kLlFMIvGgHS+9oCEdAmx6qGxlg+nV9lChoBkdAc1B2FFlTWGgHS9xoCEdAmx7kQPI4l3V9lChoBkdAcMfM2FWXC2gHTRABaAhHQJsfFIBikO91fZQoaAZHQG8+1+Zw4sFoB0vOaAhHQJsfdIkJKJ51fZQoaAZHQFRJAOavzOJoB0upaAhHQJsfebqhUR51fZQoaAZHQHJbxzzVc2RoB00YAWgIR0CbH6jsUqQSdX2UKGgGR0BwTFK8L8aXaAdL3mgIR0CbH741xbSrdX2UKGgGR0BxbmRxLkCFaAdL7GgIR0CbH/GWUr08dX2UKGgGR0Bx3DyFwkxAaAdNAgFoCEdAmyCPGVAzHnV9lChoBkdAcEu2rXDm82gHS+ZoCEdAmyCyEYfnwHV9lChoBkdAcNZ7VrhzeWgHTQ4BaAhHQJsg7posZpB1fZQoaAZHQHIEyP2f029oB00OAWgIR0CbItoFFDv3dX2UKGgGR0BwoJDTjNpuaAdL+mgIR0CbI1EYwZfldX2UKGgGR0BvTI+Sr5qNaAdL4GgIR0CbIziQDFIedX2UKGgGR0Bxcn8CPp6haAdL1GgIR0CbI4I68xsVdX2UKGgGR0BuIyWeHzpYaAdNDwFoCEdAmyPx15jYqXV9lChoBkdAcgwIbfgrH2gHS9ZoCEdAmyQs5n13+3V9lChoBkdAcEvZiuuA7WgHS/VoCEdAmySNQfp2U3V9lChoBkdAckcPKMefZmgHS9BoCEdAmySrxmTTv3V9lChoBkdAcrCtZ3cHnmgHS+5oCEdAmyU0dq+JxnV9lChoBkdAc0aeQdS2pmgHTR8BaAhHQJsl5PrOZ9d1fZQoaAZHQHGjgMUh3aBoB0vhaAhHQJsmNyHVPN51fZQoaAZHQHLfQGKQ7tBoB00FAWgIR0CbJiv/BFd+dX2UKGgGR0BzHWsp5NXYaAdNBgFoCEdAmyZw3YL9dnV9lChoBkdAb7+B/ZuhsmgHS+JoCEdAmyamQfZElXV9lChoBkdAcqwE/B3zMGgHS+5oCEdAmyax02cawXV9lChoBkdAcM1BQemvXGgHTTcBaAhHQJsnCt0V8Cx1fZQoaAZHQHCKH3ta6jFoB0v3aAhHQJspDJ8v25B1fZQoaAZHQG3RHG8274BoB0vsaAhHQJspHBSDRMN1fZQoaAZHQHDu0e+23KBoB0vqaAhHQJspVXhfjS51fZQoaAZHQHGW4S13MZBoB0v7aAhHQJsplXr+o991fZQoaAZHQG87R8twrDtoB0vWaAhHQJspzEm6XjV1fZQoaAZHQG/7dZq20AtoB0vyaAhHQJsp6wTufEp1fZQoaAZHQHHwD/ACW/toB00BAWgIR0CbKn9X9zfadX2UKGgGR0Bx/9Jbt7a7aAdL3mgIR0CbKqE+gUUPdX2UKGgGR0ByYT37DVH4aAdL4WgIR0CbK1StNi6QdX2UKGgGR0BwMWOvMbFTaAdNEwFoCEdAmytstPHktHV9lChoBkdAcN47A+IM0GgHS+5oCEdAmyv2f9P1tnV9lChoBkdAcE9j+rELpmgHS+NoCEdAmywj9sJpnHV9lChoBkdAcftC7K7qZGgHS/ZoCEdAmyxlbJOnEXV9lChoBkdAcEbtMfzSTmgHS/BoCEdAmyyDnNgSe3V9lChoBkdAcxzT1kDp1WgHTQcBaAhHQJssiya/h2p1ZS4="}, "ep_success_buffer": {":type:": "<class 'collections.deque'>", ":serialized:": "gAWVIAAAAAAAAACMC2NvbGxlY3Rpb25zlIwFZGVxdWWUk5QpS2SGlFKULg=="}, "_n_updates": 388, "observation_space": {":type:": "<class 'gymnasium.spaces.box.Box'>", ":serialized:": "gAWVcAIAAAAAAACMFGd5bW5hc2l1bS5zcGFjZXMuYm94lIwDQm94lJOUKYGUfZQojAVkdHlwZZSMBW51bXB5lGgFk5SMAmY0lImIh5RSlChLA4wBPJROTk5K/////0r/////SwB0lGKMDWJvdW5kZWRfYmVsb3eUjBJudW1weS5jb3JlLm51bWVyaWOUjAtfZnJvbWJ1ZmZlcpSTlCiWCAAAAAAAAAABAQEBAQEBAZRoB4wCYjGUiYiHlFKUKEsDjAF8lE5OTkr/////Sv////9LAHSUYksIhZSMAUOUdJRSlIwNYm91bmRlZF9hYm92ZZRoECiWCAAAAAAAAAABAQEBAQEBAZRoFEsIhZRoGHSUUpSMBl9zaGFwZZRLCIWUjANsb3eUaBAoliAAAAAAAAAAAAC0wgAAtMIAAKDAAACgwNsPScAAAKDAAAAAgAAAAICUaApLCIWUaBh0lFKUjARoaWdolGgQKJYgAAAAAAAAAAAAtEIAALRCAACgQAAAoEDbD0lAAACgQAAAgD8AAIA/lGgKSwiFlGgYdJRSlIwIbG93X3JlcHKUjFtbLTkwLiAgICAgICAgLTkwLiAgICAgICAgIC01LiAgICAgICAgIC01LiAgICAgICAgIC0zLjE0MTU5MjcgIC01LgogIC0wLiAgICAgICAgIC0wLiAgICAgICBdlIwJaGlnaF9yZXBylIxTWzkwLiAgICAgICAgOTAuICAgICAgICAgNS4gICAgICAgICA1LiAgICAgICAgIDMuMTQxNTkyNyAgNS4KICAxLiAgICAgICAgIDEuICAgICAgIF2UjApfbnBfcmFuZG9tlE51Yi4=", "dtype": "float32", "bounded_below": "[ True True True True True True True True]", "bounded_above": "[ True True True True True True True True]", "_shape": [8], "low": "[-90. -90. -5. -5. -3.1415927 -5.\n -0. -0. ]", "high": "[90. 90. 5. 5. 3.1415927 5.\n 1. 1. ]", "low_repr": "[-90. -90. -5. -5. -3.1415927 -5.\n -0. -0. ]", "high_repr": "[90. 90. 5. 5. 3.1415927 5.\n 1. 1. ]", "_np_random": null}, "action_space": {":type:": "<class 'gymnasium.spaces.discrete.Discrete'>", ":serialized:": "gAWV1QAAAAAAAACMGWd5bW5hc2l1bS5zcGFjZXMuZGlzY3JldGWUjAhEaXNjcmV0ZZSTlCmBlH2UKIwBbpSMFW51bXB5LmNvcmUubXVsdGlhcnJheZSMBnNjYWxhcpSTlIwFbnVtcHmUjAVkdHlwZZSTlIwCaTiUiYiHlFKUKEsDjAE8lE5OTkr/////Sv////9LAHSUYkMIBAAAAAAAAACUhpRSlIwFc3RhcnSUaAhoDkMIAAAAAAAAAACUhpRSlIwGX3NoYXBllCloCmgOjApfbnBfcmFuZG9tlE51Yi4=", "n": "4", "start": "0", "_shape": [], "dtype": "int64", "_np_random": null}, "n_envs": 16, "n_steps": 1024, "gamma": 0.999, "gae_lambda": 0.98, "ent_coef": 0.01, "vf_coef": 0.5, "max_grad_norm": 0.5, "batch_size": 64, "n_epochs": 4, "clip_range": {":type:": "<class 'function'>", ":serialized:": "gAWVxQIAAAAAAACMF2Nsb3VkcGlja2xlLmNsb3VkcGlja2xllIwOX21ha2VfZnVuY3Rpb26Uk5QoaACMDV9idWlsdGluX3R5cGWUk5SMCENvZGVUeXBllIWUUpQoSwFLAEsASwFLAUsTQwSIAFMAlE6FlCmMAV+UhZSMSS91c3IvbG9jYWwvbGliL3B5dGhvbjMuMTAvZGlzdC1wYWNrYWdlcy9zdGFibGVfYmFzZWxpbmVzMy9jb21tb24vdXRpbHMucHmUjARmdW5jlEuEQwIEAZSMA3ZhbJSFlCl0lFKUfZQojAtfX3BhY2thZ2VfX5SMGHN0YWJsZV9iYXNlbGluZXMzLmNvbW1vbpSMCF9fbmFtZV9flIwec3RhYmxlX2Jhc2VsaW5lczMuY29tbW9uLnV0aWxzlIwIX19maWxlX1+UjEkvdXNyL2xvY2FsL2xpYi9weXRob24zLjEwL2Rpc3QtcGFja2FnZXMvc3RhYmxlX2Jhc2VsaW5lczMvY29tbW9uL3V0aWxzLnB5lHVOTmgAjBBfbWFrZV9lbXB0eV9jZWxslJOUKVKUhZR0lFKUjBxjbG91ZHBpY2tsZS5jbG91ZHBpY2tsZV9mYXN0lIwSX2Z1bmN0aW9uX3NldHN0YXRllJOUaB99lH2UKGgWaA2MDF9fcXVhbG5hbWVfX5SMGWNvbnN0YW50X2ZuLjxsb2NhbHM+LmZ1bmOUjA9fX2Fubm90YXRpb25zX1+UfZSMDl9fa3dkZWZhdWx0c19flE6MDF9fZGVmYXVsdHNfX5ROjApfX21vZHVsZV9flGgXjAdfX2RvY19flE6MC19fY2xvc3VyZV9flGgAjApfbWFrZV9jZWxslJOURz/JmZmZmZmahZRSlIWUjBdfY2xvdWRwaWNrbGVfc3VibW9kdWxlc5RdlIwLX19nbG9iYWxzX1+UfZR1hpSGUjAu"}, "clip_range_vf": null, "normalize_advantage": true, "target_kl": null, "lr_schedule": {":type:": "<class 'function'>", ":serialized:": "gAWVxQIAAAAAAACMF2Nsb3VkcGlja2xlLmNsb3VkcGlja2xllIwOX21ha2VfZnVuY3Rpb26Uk5QoaACMDV9idWlsdGluX3R5cGWUk5SMCENvZGVUeXBllIWUUpQoSwFLAEsASwFLAUsTQwSIAFMAlE6FlCmMAV+UhZSMSS91c3IvbG9jYWwvbGliL3B5dGhvbjMuMTAvZGlzdC1wYWNrYWdlcy9zdGFibGVfYmFzZWxpbmVzMy9jb21tb24vdXRpbHMucHmUjARmdW5jlEuEQwIEAZSMA3ZhbJSFlCl0lFKUfZQojAtfX3BhY2thZ2VfX5SMGHN0YWJsZV9iYXNlbGluZXMzLmNvbW1vbpSMCF9fbmFtZV9flIwec3RhYmxlX2Jhc2VsaW5lczMuY29tbW9uLnV0aWxzlIwIX19maWxlX1+UjEkvdXNyL2xvY2FsL2xpYi9weXRob24zLjEwL2Rpc3QtcGFja2FnZXMvc3RhYmxlX2Jhc2VsaW5lczMvY29tbW9uL3V0aWxzLnB5lHVOTmgAjBBfbWFrZV9lbXB0eV9jZWxslJOUKVKUhZR0lFKUjBxjbG91ZHBpY2tsZS5jbG91ZHBpY2tsZV9mYXN0lIwSX2Z1bmN0aW9uX3NldHN0YXRllJOUaB99lH2UKGgWaA2MDF9fcXVhbG5hbWVfX5SMGWNvbnN0YW50X2ZuLjxsb2NhbHM+LmZ1bmOUjA9fX2Fubm90YXRpb25zX1+UfZSMDl9fa3dkZWZhdWx0c19flE6MDF9fZGVmYXVsdHNfX5ROjApfX21vZHVsZV9flGgXjAdfX2RvY19flE6MC19fY2xvc3VyZV9flGgAjApfbWFrZV9jZWxslJOURz8zqSowVTJhhZRSlIWUjBdfY2xvdWRwaWNrbGVfc3VibW9kdWxlc5RdlIwLX19nbG9iYWxzX1+UfZR1hpSGUjAu"}, "system_info": {"OS": "Linux-5.15.107+-x86_64-with-glibc2.31 # 1 SMP Sat Apr 29 09:15:28 UTC 2023", "Python": "3.10.11", "Stable-Baselines3": "2.0.0a5", "PyTorch": "2.0.1+cu118", "GPU Enabled": "True", "Numpy": "1.22.4", "Cloudpickle": "2.2.1", "Gymnasium": "0.28.1", "OpenAI Gym": "0.25.2"}}
 
1
+ {"policy_class": {":type:": "<class 'abc.ABCMeta'>", ":serialized:": "gAWVOwAAAAAAAACMIXN0YWJsZV9iYXNlbGluZXMzLmNvbW1vbi5wb2xpY2llc5SMEUFjdG9yQ3JpdGljUG9saWN5lJOULg==", "__module__": "stable_baselines3.common.policies", "__doc__": "\n Policy class for actor-critic algorithms (has both policy and value prediction).\n Used by A2C, PPO and the likes.\n\n :param observation_space: Observation space\n :param action_space: Action space\n :param lr_schedule: Learning rate schedule (could be constant)\n :param net_arch: The specification of the policy and value networks.\n :param activation_fn: Activation function\n :param ortho_init: Whether to use or not orthogonal initialization\n :param use_sde: Whether to use State Dependent Exploration or not\n :param log_std_init: Initial value for the log standard deviation\n :param full_std: Whether to use (n_features x n_actions) parameters\n for the std instead of only (n_features,) when using gSDE\n :param use_expln: Use ``expln()`` function instead of ``exp()`` to ensure\n a positive standard deviation (cf paper). It allows to keep variance\n above zero and prevent it from growing too fast. In practice, ``exp()`` is usually enough.\n :param squash_output: Whether to squash the output using a tanh function,\n this allows to ensure boundaries when using gSDE.\n :param features_extractor_class: Features extractor to use.\n :param features_extractor_kwargs: Keyword arguments\n to pass to the features extractor.\n :param share_features_extractor: If True, the features extractor is shared between the policy and value networks.\n :param normalize_images: Whether to normalize images or not,\n dividing by 255.0 (True by default)\n :param optimizer_class: The optimizer to use,\n ``th.optim.Adam`` by default\n :param optimizer_kwargs: Additional keyword arguments,\n excluding the learning rate, to pass to the optimizer\n ", "__init__": "<function ActorCriticPolicy.__init__ at 0x7f23f21ea680>", "_get_constructor_parameters": "<function ActorCriticPolicy._get_constructor_parameters at 0x7f23f21ea710>", "reset_noise": "<function ActorCriticPolicy.reset_noise at 0x7f23f21ea7a0>", "_build_mlp_extractor": "<function ActorCriticPolicy._build_mlp_extractor at 0x7f23f21ea830>", "_build": "<function ActorCriticPolicy._build at 0x7f23f21ea8c0>", "forward": "<function ActorCriticPolicy.forward at 0x7f23f21ea950>", "extract_features": "<function ActorCriticPolicy.extract_features at 0x7f23f21ea9e0>", "_get_action_dist_from_latent": "<function ActorCriticPolicy._get_action_dist_from_latent at 0x7f23f21eaa70>", "_predict": "<function ActorCriticPolicy._predict at 0x7f23f21eab00>", "evaluate_actions": "<function ActorCriticPolicy.evaluate_actions at 0x7f23f21eab90>", "get_distribution": "<function ActorCriticPolicy.get_distribution at 0x7f23f21eac20>", "predict_values": "<function ActorCriticPolicy.predict_values at 0x7f23f21eacb0>", "__abstractmethods__": "frozenset()", "_abc_impl": "<_abc._abc_data object at 0x7f23f21dbc80>"}, "verbose": 1, "policy_kwargs": {}, "num_timesteps": 2015232, "_total_timesteps": 2000000, "_num_timesteps_at_start": 0, "seed": null, "action_noise": null, "start_time": 1685968980168974344, "learning_rate": 0.0003, "tensorboard_log": null, "_last_obs": {":type:": "<class 'numpy.ndarray'>", ":serialized:": "gAWVdQIAAAAAAACMEm51bXB5LmNvcmUubnVtZXJpY5SMC19mcm9tYnVmZmVylJOUKJYAAgAAAAAAAM1fgL5VHko/6My+Pb8V/75aYwO/+jZkPgAAAAAAAAAAGop9PR0mkD/pyig+LU75vqq/zz1Ao3k9AAAAAAAAAADm2Ae9wxlMumjEy7P6aRkvafaDunqxszMAAIA/AACAPxoKNL08J4s/LoqWvfEw076U6iW+qEjAvQAAAAAAAAAAGkMCPh7RLT/W6WK8lIT6vpMAKz7e1Uy9AAAAAAAAAACaV5U8yyzHPQF1vr2rQZa+4uK3PNhltL0AAAAAAAAAAM3UHDwpAGi64hActjyqCbFBtg+6ouBDNQAAgD8AAIA/ZoVkvhhRgj9GV5u+eybHvtUJAL8zoB6+AAAAAAAAAADNt4u8rwatPtBx8j2Altm+LaLUPbKQjT0AAAAAAAAAAACoGb1/87I/qo88v2SpK76Nqss8pN3APAAAAAAAAAAAM6SXPDbZbrxXeMu8oFt7PR5knDozntw6AACAPwAAgD+asRw9SBWBuv3OLTcio/Exo9MWu15tS7YAAIA/AACAP3qNnT7MyQ4/KrAxvqaABL8jnoo+GtiCvgAAAAAAAAAAs8ZePY/eebr+oEqyDJ6EMPmMczjHTMwyAACAPwAAgD8AChU+pO2oP6fbIj/Sx+u+1jQ/PqFhvD4AAAAAAAAAAGYxpDz2OFi6brwzM3udILDeKIO79JjKswAAgD8AAIA/lIwFbnVtcHmUjAVkdHlwZZSTlIwCZjSUiYiHlFKUKEsDjAE8lE5OTkr/////Sv////9LAHSUYksQSwiGlIwBQ5R0lFKULg=="}, "_last_episode_starts": {":type:": "<class 'numpy.ndarray'>", ":serialized:": "gAWVgwAAAAAAAACMEm51bXB5LmNvcmUubnVtZXJpY5SMC19mcm9tYnVmZmVylJOUKJYQAAAAAAAAAAAAAAAAAAAAAAAAAAAAAACUjAVudW1weZSMBWR0eXBllJOUjAJiMZSJiIeUUpQoSwOMAXyUTk5OSv////9K/////0sAdJRiSxCFlIwBQ5R0lFKULg=="}, "_last_original_obs": null, "_episode_num": 0, "use_sde": false, "sde_sample_freq": -1, "_current_progress_remaining": -0.007616000000000067, "_stats_window_size": 100, "ep_info_buffer": {":type:": "<class 'collections.deque'>", ":serialized:": "gAWV5QsAAAAAAACMC2NvbGxlY3Rpb25zlIwFZGVxdWWUk5QpS2SGlFKUKH2UKIwBcpRHQHGDzJyQxN+MAWyUS+2MAXSUR0CbfZrTYukDdX2UKGgGR0BxXlvP1L8KaAdL3mgIR0CbfarVOKwZdX2UKGgGR8ACkTDfm9xqaAdLgWgIR0CbfarhzeXSdX2UKGgGR0Bx321pj+aSaAdL12gIR0Cbfan/1g6VdX2UKGgGR0ByC6XfIjnnaAdL7mgIR0CbfbbYsd1ddX2UKGgGR0BxNqB3A2ycaAdLyWgIR0CbfdXiR4hVdX2UKGgGR0BxoKimEXchaAdL9GgIR0CbffI0qH45dX2UKGgGR0BxfwZVGTcJaAdL3GgIR0CbfflSjxkNdX2UKGgGR0BwHmDJ2dNGaAdL0mgIR0CbfpMHryDqdX2UKGgGR0BtWxAnlXA/aAdL3mgIR0Cbfp90ihWYdX2UKGgGR0ByvpF2FFlTaAdL4GgIR0Cbftnm7rcCdX2UKGgGR0BxkO6bvw3HaAdL1GgIR0CbfxicoYvWdX2UKGgGR0Byvt2ECeVcaAdL5GgIR0Cbf619fCyhdX2UKGgGR0BMJr7O3UhFaAdLlGgIR0CbgHp22XsxdX2UKGgGR0BwbPtBv73xaAdL6mgIR0CbgIxWDHwPdX2UKGgGR0BxI45IYm9haAdL6WgIR0CbgTQFLWZrdX2UKGgGR0Bw0HsmfGuLaAdL82gIR0CbgVetjkMkdX2UKGgGR0ByMInQY1pCaAdL0mgIR0CbgeHQhOgydX2UKGgGR0BzYONYKYzBaAdL3WgIR0CbghO/L1VYdX2UKGgGR0Bwn8J9iMHbaAdL42gIR0Cbgjj2zv7WdX2UKGgGR0BwfHMY/FBIaAdL52gIR0CbgkA3T/hmdX2UKGgGR0ByxjiOvMbFaAdL6mgIR0Cbgoxsl9jPdX2UKGgGR0Bw5ATSLIgeaAdLzGgIR0Cbgs6XBxgidX2UKGgGR0BxLYm9g4OuaAdL8WgIR0CbgtcLBsQ/dX2UKGgGR0BvPhlDneSCaAdL8mgIR0CbguQ9zOopdX2UKGgGR0Byoha4c3l0aAdL2WgIR0Cbg21Gb1AadX2UKGgGR0BxT5U4rBj4aAdL9WgIR0Cbg76CDmKZdX2UKGgGR0Bx0Chwl0HRaAdL92gIR0CbhF2WpqASdX2UKGgGR0BSqm69TP0JaAdLtmgIR0CbhHZOzposdX2UKGgGR0BxG3Uaya/iaAdL7GgIR0CblK+jua4MdX2UKGgGR0BxMPvc8DB/aAdL2mgIR0CblSTPjXFtdX2UKGgGR0BwMZXKbKA8aAdL3GgIR0Cbld4xUNrkdX2UKGgGR0BwA5A+pwS8aAdL4WgIR0Cblh5P/JeWdX2UKGgGR0BxlShvitJWaAdLy2gIR0Cblp1/lQuVdX2UKGgGR0ByLX3pOerdaAdLyWgIR0Cblp2Pkq+bdX2UKGgGR0BuSyH446wMaAdL4GgIR0Cblto+wC8wdX2UKGgGR0BzKMzO5avBaAdLwmgIR0CblzzDGcWkdX2UKGgGR0ByDZr0rbxmaAdLzWgIR0Cblz01ZTybdX2UKGgGR0BwVjopx3mnaAdL3GgIR0CbmBKeTV2BdX2UKGgGR0BwiIKCxu89aAdNBgFoCEdAm5hQ3gk1M3V9lChoBkdAcbt8LKFIu2gHS/hoCEdAm5j/h2nsLXV9lChoBkdAcZqk9lmOEWgHS/FoCEdAm5mOK0lZ5nV9lChoBkdAcC0OPNmlImgHS/NoCEdAm5oM/MW43HV9lChoBkdAcnWGqxTsIGgHS9xoCEdAm5pdCiRGMHV9lChoBkdAcUfQFcIJJGgHS+VoCEdAm5qAI+nqFHV9lChoBkdAcNcnuiN83WgHS/FoCEdAm5t3YlIEsHV9lChoBkdAc0ldS2phnmgHS+poCEdAm5vpSR8tw3V9lChoBkdAcCTyn1nM+2gHS9toCEdAm5zN6gM+eXV9lChoBkdAcQUXhfjS5WgHS/doCEdAm51SP2f03HV9lChoBkdAcwrMoc7yQWgHS99oCEdAm513Ov+wT3V9lChoBkdAclg1anrIHWgHS9toCEdAm52KHfuTinV9lChoBkdAcRw+/gzguWgHS9ZoCEdAm526zE74jHV9lChoBkdAccZLxZuAJGgHS+9oCEdAm53yjk+5fHV9lChoBkdAcTXgbZOBUmgHS9JoCEdAm55koa1kUnV9lChoBkdAcIzQl8gIQmgHS/VoCEdAm56iUornT3V9lChoBkdAcfFC4z7/GWgHS79oCEdAm566FuejEnV9lChoBkdAcVFjbBXS0GgHS+FoCEdAm58Q0TDfnHV9lChoBkdAbfXXd0q6OGgHS9doCEdAm5/8XBP9DXV9lChoBkdAcStFb3XZoWgHS9ZoCEdAm6B80cfeUXV9lChoBkdAbtE+Yc/+sGgHS9doCEdAm6D8ABDG+HV9lChoBkdAcvp2P1ct5GgHTQMBaAhHQJuiTTH80k51fZQoaAZHQHQSgeV9nbtoB0vRaAhHQJuiaVpsXSB1fZQoaAZHQHHLSq6vq1RoB0v0aAhHQJujJBKL8791fZQoaAZHQHCWjCxeLNxoB0vbaAhHQJukaEsasIV1fZQoaAZHQG+CQN9YwItoB0v8aAhHQJulFOvdM0x1fZQoaAZHQHAyarvLHMloB0voaAhHQJulNVBD5TJ1fZQoaAZHQHFPxBVuJk5oB0vKaAhHQJulNe6Zpi91fZQoaAZHQHOsp1vES/VoB0vbaAhHQJulQGNaQmx1fZQoaAZHQHAFUQ9RrJtoB0viaAhHQJulPxRVIZt1fZQoaAZHQHOzu1WsA/9oB0vGaAhHQJulV9srNGF1fZQoaAZHQHFl6F/QSjBoB0vwaAhHQJulZwcYIjZ1fZQoaAZHQHDEAOe8PFxoB0vdaAhHQJumbz7MxGl1fZQoaAZHQG+d1TR6WxBoB0vxaAhHQJumr2TPjXF1fZQoaAZHQHMgTfR/mT1oB0u9aAhHQJunWt5le4V1fZQoaAZHQHFOCZ0CA+ZoB0vzaAhHQJuoDnjhky11fZQoaAZHQG9Sk87p3X9oB0vqaAhHQJuoRS9/SYx1fZQoaAZHQHGFOhbnoxJoB0vaaAhHQJup3M+u/1x1fZQoaAZHQHIhaYu01IloB0vyaAhHQJup5fnfVI91fZQoaAZHQHO3HsolUqBoB00CAWgIR0CbqlTb349HdX2UKGgGR0BxQK3BpHqeaAdL1WgIR0CbqpGUfPondX2UKGgGR0BzrbmknCwbaAdL2mgIR0CbqyeTmnwYdX2UKGgGR0BuGBb8m8dxaAdL5mgIR0Cbq1X/YJ3QdX2UKGgGR0Bv4T4DcM3IaAdL7GgIR0Cbq5Bltj0+dX2UKGgGR0Bw0y2CuloEaAdL72gIR0Cbq8ISlFc6dX2UKGgGR0BzBdqUNayKaAdL0mgIR0Cbq+1AJLM+dX2UKGgGR0BzcHmwJPZaaAdLzmgIR0CbrAir1dxAdX2UKGgGR0BySf7el9BsaAdL/GgIR0CbrAafSQYDdX2UKGgGR0BxuCLUCq6waAdNAQFoCEdAm6wQFLWZqnV9lChoBkdAcaTKvmoze2gHTREBaAhHQJusX30wrUd1fZQoaAZHQHB+oKIBRyhoB0vdaAhHQJusvgpBomJ1fZQoaAZHQHGcMJY1YQtoB0vHaAhHQJus5R2r4nF1fZQoaAZHQHA0exKQJX1oB0vsaAhHQJuthFDv3Jx1fZQoaAZHQHGRTMvAXVNoB0vdaAhHQJuusUrTYul1fZQoaAZHQG+Iz4cm0E5oB0vlaAhHQJuu2h11W811fZQoaAZHQHM3y0OVgQZoB0vVaAhHQJuvMOtnwod1fZQoaAZHQHLbWjfvWpZoB0v2aAhHQJuvry9VWCF1fZQoaAZHQHNi903fhuRoB0vbaAhHQJuv498qnWJ1fZQoaAZHQHE53Ytg8bJoB0vNaAhHQJuv9tKqXF91fZQoaAZHQHNjtSEUTL5oB0veaAhHQJuwHcHnln11fZQoaAZHQHMX5IDoyKxoB0vVaAhHQJuweW6bvw51ZS4="}, "ep_success_buffer": {":type:": "<class 'collections.deque'>", ":serialized:": "gAWVIAAAAAAAAACMC2NvbGxlY3Rpb25zlIwFZGVxdWWUk5QpS2SGlFKULg=="}, "_n_updates": 492, "observation_space": {":type:": "<class 'gymnasium.spaces.box.Box'>", ":serialized:": "gAWVcAIAAAAAAACMFGd5bW5hc2l1bS5zcGFjZXMuYm94lIwDQm94lJOUKYGUfZQojAVkdHlwZZSMBW51bXB5lGgFk5SMAmY0lImIh5RSlChLA4wBPJROTk5K/////0r/////SwB0lGKMDWJvdW5kZWRfYmVsb3eUjBJudW1weS5jb3JlLm51bWVyaWOUjAtfZnJvbWJ1ZmZlcpSTlCiWCAAAAAAAAAABAQEBAQEBAZRoB4wCYjGUiYiHlFKUKEsDjAF8lE5OTkr/////Sv////9LAHSUYksIhZSMAUOUdJRSlIwNYm91bmRlZF9hYm92ZZRoECiWCAAAAAAAAAABAQEBAQEBAZRoFEsIhZRoGHSUUpSMBl9zaGFwZZRLCIWUjANsb3eUaBAoliAAAAAAAAAAAAC0wgAAtMIAAKDAAACgwNsPScAAAKDAAAAAgAAAAICUaApLCIWUaBh0lFKUjARoaWdolGgQKJYgAAAAAAAAAAAAtEIAALRCAACgQAAAoEDbD0lAAACgQAAAgD8AAIA/lGgKSwiFlGgYdJRSlIwIbG93X3JlcHKUjFtbLTkwLiAgICAgICAgLTkwLiAgICAgICAgIC01LiAgICAgICAgIC01LiAgICAgICAgIC0zLjE0MTU5MjcgIC01LgogIC0wLiAgICAgICAgIC0wLiAgICAgICBdlIwJaGlnaF9yZXBylIxTWzkwLiAgICAgICAgOTAuICAgICAgICAgNS4gICAgICAgICA1LiAgICAgICAgIDMuMTQxNTkyNyAgNS4KICAxLiAgICAgICAgIDEuICAgICAgIF2UjApfbnBfcmFuZG9tlE51Yi4=", "dtype": "float32", "bounded_below": "[ True True True True True True True True]", "bounded_above": "[ True True True True True True True True]", "_shape": [8], "low": "[-90. -90. -5. -5. -3.1415927 -5.\n -0. -0. ]", "high": "[90. 90. 5. 5. 3.1415927 5.\n 1. 1. ]", "low_repr": "[-90. -90. -5. -5. -3.1415927 -5.\n -0. -0. ]", "high_repr": "[90. 90. 5. 5. 3.1415927 5.\n 1. 1. ]", "_np_random": null}, "action_space": {":type:": "<class 'gymnasium.spaces.discrete.Discrete'>", ":serialized:": "gAWV1QAAAAAAAACMGWd5bW5hc2l1bS5zcGFjZXMuZGlzY3JldGWUjAhEaXNjcmV0ZZSTlCmBlH2UKIwBbpSMFW51bXB5LmNvcmUubXVsdGlhcnJheZSMBnNjYWxhcpSTlIwFbnVtcHmUjAVkdHlwZZSTlIwCaTiUiYiHlFKUKEsDjAE8lE5OTkr/////Sv////9LAHSUYkMIBAAAAAAAAACUhpRSlIwFc3RhcnSUaAhoDkMIAAAAAAAAAACUhpRSlIwGX3NoYXBllCloCmgOjApfbnBfcmFuZG9tlE51Yi4=", "n": "4", "start": "0", "_shape": [], "dtype": "int64", "_np_random": null}, "n_envs": 16, "n_steps": 1024, "gamma": 0.999, "gae_lambda": 0.98, "ent_coef": 0.01, "vf_coef": 0.5, "max_grad_norm": 0.5, "batch_size": 64, "n_epochs": 4, "clip_range": {":type:": "<class 'function'>", ":serialized:": "gAWVxQIAAAAAAACMF2Nsb3VkcGlja2xlLmNsb3VkcGlja2xllIwOX21ha2VfZnVuY3Rpb26Uk5QoaACMDV9idWlsdGluX3R5cGWUk5SMCENvZGVUeXBllIWUUpQoSwFLAEsASwFLAUsTQwSIAFMAlE6FlCmMAV+UhZSMSS91c3IvbG9jYWwvbGliL3B5dGhvbjMuMTAvZGlzdC1wYWNrYWdlcy9zdGFibGVfYmFzZWxpbmVzMy9jb21tb24vdXRpbHMucHmUjARmdW5jlEuEQwIEAZSMA3ZhbJSFlCl0lFKUfZQojAtfX3BhY2thZ2VfX5SMGHN0YWJsZV9iYXNlbGluZXMzLmNvbW1vbpSMCF9fbmFtZV9flIwec3RhYmxlX2Jhc2VsaW5lczMuY29tbW9uLnV0aWxzlIwIX19maWxlX1+UjEkvdXNyL2xvY2FsL2xpYi9weXRob24zLjEwL2Rpc3QtcGFja2FnZXMvc3RhYmxlX2Jhc2VsaW5lczMvY29tbW9uL3V0aWxzLnB5lHVOTmgAjBBfbWFrZV9lbXB0eV9jZWxslJOUKVKUhZR0lFKUjBxjbG91ZHBpY2tsZS5jbG91ZHBpY2tsZV9mYXN0lIwSX2Z1bmN0aW9uX3NldHN0YXRllJOUaB99lH2UKGgWaA2MDF9fcXVhbG5hbWVfX5SMGWNvbnN0YW50X2ZuLjxsb2NhbHM+LmZ1bmOUjA9fX2Fubm90YXRpb25zX1+UfZSMDl9fa3dkZWZhdWx0c19flE6MDF9fZGVmYXVsdHNfX5ROjApfX21vZHVsZV9flGgXjAdfX2RvY19flE6MC19fY2xvc3VyZV9flGgAjApfbWFrZV9jZWxslJOURz/JmZmZmZmahZRSlIWUjBdfY2xvdWRwaWNrbGVfc3VibW9kdWxlc5RdlIwLX19nbG9iYWxzX1+UfZR1hpSGUjAu"}, "clip_range_vf": null, "normalize_advantage": true, "target_kl": null, "lr_schedule": {":type:": "<class 'function'>", ":serialized:": "gAWVxQIAAAAAAACMF2Nsb3VkcGlja2xlLmNsb3VkcGlja2xllIwOX21ha2VfZnVuY3Rpb26Uk5QoaACMDV9idWlsdGluX3R5cGWUk5SMCENvZGVUeXBllIWUUpQoSwFLAEsASwFLAUsTQwSIAFMAlE6FlCmMAV+UhZSMSS91c3IvbG9jYWwvbGliL3B5dGhvbjMuMTAvZGlzdC1wYWNrYWdlcy9zdGFibGVfYmFzZWxpbmVzMy9jb21tb24vdXRpbHMucHmUjARmdW5jlEuEQwIEAZSMA3ZhbJSFlCl0lFKUfZQojAtfX3BhY2thZ2VfX5SMGHN0YWJsZV9iYXNlbGluZXMzLmNvbW1vbpSMCF9fbmFtZV9flIwec3RhYmxlX2Jhc2VsaW5lczMuY29tbW9uLnV0aWxzlIwIX19maWxlX1+UjEkvdXNyL2xvY2FsL2xpYi9weXRob24zLjEwL2Rpc3QtcGFja2FnZXMvc3RhYmxlX2Jhc2VsaW5lczMvY29tbW9uL3V0aWxzLnB5lHVOTmgAjBBfbWFrZV9lbXB0eV9jZWxslJOUKVKUhZR0lFKUjBxjbG91ZHBpY2tsZS5jbG91ZHBpY2tsZV9mYXN0lIwSX2Z1bmN0aW9uX3NldHN0YXRllJOUaB99lH2UKGgWaA2MDF9fcXVhbG5hbWVfX5SMGWNvbnN0YW50X2ZuLjxsb2NhbHM+LmZ1bmOUjA9fX2Fubm90YXRpb25zX1+UfZSMDl9fa3dkZWZhdWx0c19flE6MDF9fZGVmYXVsdHNfX5ROjApfX21vZHVsZV9flGgXjAdfX2RvY19flE6MC19fY2xvc3VyZV9flGgAjApfbWFrZV9jZWxslJOURz8zqSowVTJhhZRSlIWUjBdfY2xvdWRwaWNrbGVfc3VibW9kdWxlc5RdlIwLX19nbG9iYWxzX1+UfZR1hpSGUjAu"}, "system_info": {"OS": "Linux-5.15.107+-x86_64-with-glibc2.31 # 1 SMP Sat Apr 29 09:15:28 UTC 2023", "Python": "3.10.11", "Stable-Baselines3": "2.0.0a5", "PyTorch": "2.0.1+cu118", "GPU Enabled": "True", "Numpy": "1.22.4", "Cloudpickle": "2.2.1", "Gymnasium": "0.28.1", "OpenAI Gym": "0.25.2"}}
ppo-LunarLander-v2.zip CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:f76cc5eb1e3eebd680f3cb02d458b53cab83fec4dee4aa991a6d4f6530293fda
3
- size 146667
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:424876a40e563d82606b66d9113a7562c5f844fd4a8c39887dd607988c94ee89
3
+ size 146631
ppo-LunarLander-v2/data CHANGED
@@ -4,54 +4,54 @@
4
  ":serialized:": "gAWVOwAAAAAAAACMIXN0YWJsZV9iYXNlbGluZXMzLmNvbW1vbi5wb2xpY2llc5SMEUFjdG9yQ3JpdGljUG9saWN5lJOULg==",
5
  "__module__": "stable_baselines3.common.policies",
6
  "__doc__": "\n Policy class for actor-critic algorithms (has both policy and value prediction).\n Used by A2C, PPO and the likes.\n\n :param observation_space: Observation space\n :param action_space: Action space\n :param lr_schedule: Learning rate schedule (could be constant)\n :param net_arch: The specification of the policy and value networks.\n :param activation_fn: Activation function\n :param ortho_init: Whether to use or not orthogonal initialization\n :param use_sde: Whether to use State Dependent Exploration or not\n :param log_std_init: Initial value for the log standard deviation\n :param full_std: Whether to use (n_features x n_actions) parameters\n for the std instead of only (n_features,) when using gSDE\n :param use_expln: Use ``expln()`` function instead of ``exp()`` to ensure\n a positive standard deviation (cf paper). It allows to keep variance\n above zero and prevent it from growing too fast. In practice, ``exp()`` is usually enough.\n :param squash_output: Whether to squash the output using a tanh function,\n this allows to ensure boundaries when using gSDE.\n :param features_extractor_class: Features extractor to use.\n :param features_extractor_kwargs: Keyword arguments\n to pass to the features extractor.\n :param share_features_extractor: If True, the features extractor is shared between the policy and value networks.\n :param normalize_images: Whether to normalize images or not,\n dividing by 255.0 (True by default)\n :param optimizer_class: The optimizer to use,\n ``th.optim.Adam`` by default\n :param optimizer_kwargs: Additional keyword arguments,\n excluding the learning rate, to pass to the optimizer\n ",
7
- "__init__": "<function ActorCriticPolicy.__init__ at 0x7f6382212cb0>",
8
- "_get_constructor_parameters": "<function ActorCriticPolicy._get_constructor_parameters at 0x7f6382212d40>",
9
- "reset_noise": "<function ActorCriticPolicy.reset_noise at 0x7f6382212dd0>",
10
- "_build_mlp_extractor": "<function ActorCriticPolicy._build_mlp_extractor at 0x7f6382212e60>",
11
- "_build": "<function ActorCriticPolicy._build at 0x7f6382212ef0>",
12
- "forward": "<function ActorCriticPolicy.forward at 0x7f6382212f80>",
13
- "extract_features": "<function ActorCriticPolicy.extract_features at 0x7f6382213010>",
14
- "_get_action_dist_from_latent": "<function ActorCriticPolicy._get_action_dist_from_latent at 0x7f63822130a0>",
15
- "_predict": "<function ActorCriticPolicy._predict at 0x7f6382213130>",
16
- "evaluate_actions": "<function ActorCriticPolicy.evaluate_actions at 0x7f63822131c0>",
17
- "get_distribution": "<function ActorCriticPolicy.get_distribution at 0x7f6382213250>",
18
- "predict_values": "<function ActorCriticPolicy.predict_values at 0x7f63822132e0>",
19
  "__abstractmethods__": "frozenset()",
20
- "_abc_impl": "<_abc._abc_data object at 0x7f6382215a00>"
21
  },
22
  "verbose": 1,
23
  "policy_kwargs": {},
24
- "num_timesteps": 1507328,
25
- "_total_timesteps": 1500000,
26
  "_num_timesteps_at_start": 0,
27
  "seed": null,
28
  "action_noise": null,
29
- "start_time": 1685758402973880763,
30
  "learning_rate": 0.0003,
31
  "tensorboard_log": null,
32
  "_last_obs": {
33
  ":type:": "<class 'numpy.ndarray'>",
34
- ":serialized:": "gAWVdQIAAAAAAACMEm51bXB5LmNvcmUubnVtZXJpY5SMC19mcm9tYnVmZmVylJOUKJYAAgAAAAAAAACbTT7NgC0+B827vb3ufr4N3AQ+I0rBvAAAAAAAAAAAprJvPnYl+D7EHT08xD67vl2yKj4DUTI8AAAAAAAAAAA9orE+kfQTP6HpJL7+YNG+KoKTPkUB5b0AAAAAAAAAAG3gPb7kIJk/UL0Dv26f5r7Hk5G+9uCRvgAAAAAAAAAA7TUevgwDSz5qIrY+PwW0vtLObj3T0OY9AAAAAAAAAACmM9A9MbiuPzwkAz8T4LG+DbqCPUXAEz4AAAAAAAAAAM3CRbymXLU/3iHMvs+dfj2uYj48EC0+PQAAAAAAAAAAAGEJPX4Trj72q9I8TiqrvlcNlzpeE1E8AAAAAAAAAABVC5u+n2iiPz1XBb+M2Pu+CGPuvkXDt70AAAAAAAAAAM2sCbvfeLQ/LudZvpCuMr04+R875m5FPQAAAAAAAAAAABC0Oygz0j1xF8K81EldvuGQJz2n7DG8AAAAAAAAAADNdcY8KVypP4Kfpz6VUBa/oZs5PND27j0AAAAAAAAAACbKyD3EAZM+527MveYnkb5XMQc80H3iuwAAAAAAAAAAmkaSPcYhdD+q+wE+jCMJv6BhhzryPAO9AAAAAAAAAACNAUu+ZU6KPiuNgT53ye2+jGGjPHCe6D0AAAAAAAAAAGZOjL1SGOa5jnxgNSKEii4m6oC7kleVtAAAgD8AAIA/lIwFbnVtcHmUjAVkdHlwZZSTlIwCZjSUiYiHlFKUKEsDjAE8lE5OTkr/////Sv////9LAHSUYksQSwiGlIwBQ5R0lFKULg=="
35
  },
36
  "_last_episode_starts": {
37
  ":type:": "<class 'numpy.ndarray'>",
38
- ":serialized:": "gAWVgwAAAAAAAACMEm51bXB5LmNvcmUubnVtZXJpY5SMC19mcm9tYnVmZmVylJOUKJYQAAAAAAAAAAAAAAAAAAAAAAEAAAAAAACUjAVudW1weZSMBWR0eXBllJOUjAJiMZSJiIeUUpQoSwOMAXyUTk5OSv////9K/////0sAdJRiSxCFlIwBQ5R0lFKULg=="
39
  },
40
  "_last_original_obs": null,
41
  "_episode_num": 0,
42
  "use_sde": false,
43
  "sde_sample_freq": -1,
44
- "_current_progress_remaining": -0.004885333333333408,
45
  "_stats_window_size": 100,
46
  "ep_info_buffer": {
47
  ":type:": "<class 'collections.deque'>",
48
- ":serialized:": "gAWVAAwAAAAAAACMC2NvbGxlY3Rpb25zlIwFZGVxdWWUk5QpS2SGlFKUKH2UKIwBcpRHQHK7dsenyd6MAWyUTS4BjAF0lEdAmvJg79ycTnV9lChoBkdAcAhi++M6zWgHS/hoCEdAmvMWn889wHV9lChoBkdAcN7EOiFj/mgHS/RoCEdAmvOXhOxja3V9lChoBkdAcXi+OwPiDWgHTSABaAhHQJr0CnGbTc91fZQoaAZHQHCEtUsFt9BoB0v5aAhHQJr0pqesgdR1fZQoaAZHQHANUxyn1nNoB0vHaAhHQJr0jJSzgMt1fZQoaAZHQHBLNv0h/y5oB0viaAhHQJr1fLFGXol1fZQoaAZHQHH7nwob4rVoB0vmaAhHQJr1oDLbHp91fZQoaAZHQHIYCW3Sa3JoB0v7aAhHQJr1iS4e9zx1fZQoaAZHQHCpUFnqVyFoB0vtaAhHQJr1t4Uvf0p1fZQoaAZHQHI/Iqbz9TBoB0vfaAhHQJr2vLr5ZbJ1fZQoaAZHQHMAxuCPIXFoB00LAWgIR0Ca9vPWQOnVdX2UKGgGR0Bxed+DvmYCaAdNCQFoCEdAmvcxB/qgRXV9lChoBkdAcRJyVfNRnGgHS+5oCEdAmvfc9jgAInV9lChoBkdAcOwrrPdEcGgHTQcBaAhHQJr4QUXYUWV1fZQoaAZHQHCyFz2exwBoB0vyaAhHQJr5KA6Mir11fZQoaAZHQHFtsNQTEitoB00UAWgIR0Ca+Turp7kXdX2UKGgGR0BwutPqLS/kaAdNFgFoCEdAmvkz101ZT3V9lChoBkdAcNF9XLeQ+2gHS95oCEdAmvmOfNA1N3V9lChoBkdAcmcYNAkcCGgHS/JoCEdAmvmlhkRSP3V9lChoBkdAcS40Sh8IA2gHS+toCEdAmvpOXNTtLXV9lChoBkdAcWTy4FzMimgHS9NoCEdAmvrfdyksSXV9lChoBkdAcAUp2ll9SmgHTRYBaAhHQJr7d+AmReV1fZQoaAZHQHOr8DwH7gtoB0v7aAhHQJr7oO+ZgG91fZQoaAZHQHNteyu6mO5oB00AAWgIR0Ca++lWwNb1dX2UKGgGR0BxKsMc6vJSaAdL0WgIR0Ca++/2TPjXdX2UKGgGR0Bu8IbCJoCdaAdNKQFoCEdAmvzW34Kx93V9lChoBkdAcIcaA4GUwGgHS/1oCEdAmv08hs67unV9lChoBkdAcYiVyWAwwmgHS/NoCEdAmv088YAKfHV9lChoBkdAbsWmZVn27GgHS+loCEdAmv4AOe8PF3V9lChoBkdAcIZivgWJrWgHS/5oCEdAmxBHEQ5FPXV9lChoBkdAUSG+N96Tn2gHS7RoCEdAmxE3YxtYS3V9lChoBkdAced5gPVd5mgHS/VoCEdAmxHj37DVIHV9lChoBkdAcVueWv8qF2gHS/doCEdAmxH9wNsnA3V9lChoBkdAbygYsunMuGgHTQQBaAhHQJsSXp+tr9F1fZQoaAZHQG4Jr7oB7u5oB0v3aAhHQJsSk3m3fAN1fZQoaAZHQHEcy2QXAM5oB00EAWgIR0CbEySuQp4KdX2UKGgGR0Bzk7kaMrEtaAdL+WgIR0CbFYeQuEmIdX2UKGgGR0BvG3sRg7YDaAdL62gIR0CbFcVnmJWOdX2UKGgGR0BzhAomXw9aaAdNKwFoCEdAmxan+6y0KXV9lChoBkdAcgQpI+W4VmgHTRUBaAhHQJsW+UJOWSl1fZQoaAZHQG995oPCl8BoB00dAWgIR0CbF6jwhGH6dX2UKGgGR0Bw7VvkzXSSaAdL6mgIR0CbF8v2GqPwdX2UKGgGR0BxbujL0SRKaAdL+WgIR0CbGF4SYgJUdX2UKGgGR0BzKeG5+YtyaAdNCAFoCEdAmxhelsP8RHV9lChoBkdAcmJ6LOzIFWgHS/VoCEdAmxlvH5rP+nV9lChoBkdAchd8pkPMCGgHS/RoCEdAmxpMNlRP43V9lChoBkdAcSQ/o7muDGgHS+VoCEdAmxp1aGHpKXV9lChoBkdAbeHTlT3qRmgHS9xoCEdAmxp+GoJiRXV9lChoBkdAcBXqzJIUamgHS9VoCEdAmxpqekHlfnV9lChoBkdAcTqZxaPjn2gHS+1oCEdAmxqRnjABUHV9lChoBkdAcYdSjxkNF2gHS+loCEdAmxs8oQWepXV9lChoBkdAc2etI065oWgHTTsBaAhHQJsbXYUWVNZ1fZQoaAZHQG8NMijcmBxoB0vYaAhHQJscaws5GSZ1fZQoaAZHQG9Avn8sMApoB00BAWgIR0CbHVyOaOPvdX2UKGgGR0BzFKDOC5EuaAdLzGgIR0CbHWlkpZwGdX2UKGgGR0BxSiWdEsreaAdL/WgIR0CbHeTb349HdX2UKGgGR0By7pdu5z5oaAdNCwFoCEdAmx59IkJKJ3V9lChoBkdAc3kLlFMIvGgHS+9oCEdAmx6qGxlg+nV9lChoBkdAc1B2FFlTWGgHS9xoCEdAmx7kQPI4l3V9lChoBkdAcMfM2FWXC2gHTRABaAhHQJsfFIBikO91fZQoaAZHQG8+1+Zw4sFoB0vOaAhHQJsfdIkJKJ51fZQoaAZHQFRJAOavzOJoB0upaAhHQJsfebqhUR51fZQoaAZHQHJbxzzVc2RoB00YAWgIR0CbH6jsUqQSdX2UKGgGR0BwTFK8L8aXaAdL3mgIR0CbH741xbSrdX2UKGgGR0BxbmRxLkCFaAdL7GgIR0CbH/GWUr08dX2UKGgGR0Bx3DyFwkxAaAdNAgFoCEdAmyCPGVAzHnV9lChoBkdAcEu2rXDm82gHS+ZoCEdAmyCyEYfnwHV9lChoBkdAcNZ7VrhzeWgHTQ4BaAhHQJsg7posZpB1fZQoaAZHQHIEyP2f029oB00OAWgIR0CbItoFFDv3dX2UKGgGR0BwoJDTjNpuaAdL+mgIR0CbI1EYwZfldX2UKGgGR0BvTI+Sr5qNaAdL4GgIR0CbIziQDFIedX2UKGgGR0Bxcn8CPp6haAdL1GgIR0CbI4I68xsVdX2UKGgGR0BuIyWeHzpYaAdNDwFoCEdAmyPx15jYqXV9lChoBkdAcgwIbfgrH2gHS9ZoCEdAmyQs5n13+3V9lChoBkdAcEvZiuuA7WgHS/VoCEdAmySNQfp2U3V9lChoBkdAckcPKMefZmgHS9BoCEdAmySrxmTTv3V9lChoBkdAcrCtZ3cHnmgHS+5oCEdAmyU0dq+JxnV9lChoBkdAc0aeQdS2pmgHTR8BaAhHQJsl5PrOZ9d1fZQoaAZHQHGjgMUh3aBoB0vhaAhHQJsmNyHVPN51fZQoaAZHQHLfQGKQ7tBoB00FAWgIR0CbJiv/BFd+dX2UKGgGR0BzHWsp5NXYaAdNBgFoCEdAmyZw3YL9dnV9lChoBkdAb7+B/ZuhsmgHS+JoCEdAmyamQfZElXV9lChoBkdAcqwE/B3zMGgHS+5oCEdAmyax02cawXV9lChoBkdAcM1BQemvXGgHTTcBaAhHQJsnCt0V8Cx1fZQoaAZHQHCKH3ta6jFoB0v3aAhHQJspDJ8v25B1fZQoaAZHQG3RHG8274BoB0vsaAhHQJspHBSDRMN1fZQoaAZHQHDu0e+23KBoB0vqaAhHQJspVXhfjS51fZQoaAZHQHGW4S13MZBoB0v7aAhHQJsplXr+o991fZQoaAZHQG87R8twrDtoB0vWaAhHQJspzEm6XjV1fZQoaAZHQG/7dZq20AtoB0vyaAhHQJsp6wTufEp1fZQoaAZHQHHwD/ACW/toB00BAWgIR0CbKn9X9zfadX2UKGgGR0Bx/9Jbt7a7aAdL3mgIR0CbKqE+gUUPdX2UKGgGR0ByYT37DVH4aAdL4WgIR0CbK1StNi6QdX2UKGgGR0BwMWOvMbFTaAdNEwFoCEdAmytstPHktHV9lChoBkdAcN47A+IM0GgHS+5oCEdAmyv2f9P1tnV9lChoBkdAcE9j+rELpmgHS+NoCEdAmywj9sJpnHV9lChoBkdAcftC7K7qZGgHS/ZoCEdAmyxlbJOnEXV9lChoBkdAcEbtMfzSTmgHS/BoCEdAmyyDnNgSe3V9lChoBkdAcxzT1kDp1WgHTQcBaAhHQJssiya/h2p1ZS4="
49
  },
50
  "ep_success_buffer": {
51
  ":type:": "<class 'collections.deque'>",
52
  ":serialized:": "gAWVIAAAAAAAAACMC2NvbGxlY3Rpb25zlIwFZGVxdWWUk5QpS2SGlFKULg=="
53
  },
54
- "_n_updates": 388,
55
  "observation_space": {
56
  ":type:": "<class 'gymnasium.spaces.box.Box'>",
57
  ":serialized:": "gAWVcAIAAAAAAACMFGd5bW5hc2l1bS5zcGFjZXMuYm94lIwDQm94lJOUKYGUfZQojAVkdHlwZZSMBW51bXB5lGgFk5SMAmY0lImIh5RSlChLA4wBPJROTk5K/////0r/////SwB0lGKMDWJvdW5kZWRfYmVsb3eUjBJudW1weS5jb3JlLm51bWVyaWOUjAtfZnJvbWJ1ZmZlcpSTlCiWCAAAAAAAAAABAQEBAQEBAZRoB4wCYjGUiYiHlFKUKEsDjAF8lE5OTkr/////Sv////9LAHSUYksIhZSMAUOUdJRSlIwNYm91bmRlZF9hYm92ZZRoECiWCAAAAAAAAAABAQEBAQEBAZRoFEsIhZRoGHSUUpSMBl9zaGFwZZRLCIWUjANsb3eUaBAoliAAAAAAAAAAAAC0wgAAtMIAAKDAAACgwNsPScAAAKDAAAAAgAAAAICUaApLCIWUaBh0lFKUjARoaWdolGgQKJYgAAAAAAAAAAAAtEIAALRCAACgQAAAoEDbD0lAAACgQAAAgD8AAIA/lGgKSwiFlGgYdJRSlIwIbG93X3JlcHKUjFtbLTkwLiAgICAgICAgLTkwLiAgICAgICAgIC01LiAgICAgICAgIC01LiAgICAgICAgIC0zLjE0MTU5MjcgIC01LgogIC0wLiAgICAgICAgIC0wLiAgICAgICBdlIwJaGlnaF9yZXBylIxTWzkwLiAgICAgICAgOTAuICAgICAgICAgNS4gICAgICAgICA1LiAgICAgICAgIDMuMTQxNTkyNyAgNS4KICAxLiAgICAgICAgIDEuICAgICAgIF2UjApfbnBfcmFuZG9tlE51Yi4=",
 
4
  ":serialized:": "gAWVOwAAAAAAAACMIXN0YWJsZV9iYXNlbGluZXMzLmNvbW1vbi5wb2xpY2llc5SMEUFjdG9yQ3JpdGljUG9saWN5lJOULg==",
5
  "__module__": "stable_baselines3.common.policies",
6
  "__doc__": "\n Policy class for actor-critic algorithms (has both policy and value prediction).\n Used by A2C, PPO and the likes.\n\n :param observation_space: Observation space\n :param action_space: Action space\n :param lr_schedule: Learning rate schedule (could be constant)\n :param net_arch: The specification of the policy and value networks.\n :param activation_fn: Activation function\n :param ortho_init: Whether to use or not orthogonal initialization\n :param use_sde: Whether to use State Dependent Exploration or not\n :param log_std_init: Initial value for the log standard deviation\n :param full_std: Whether to use (n_features x n_actions) parameters\n for the std instead of only (n_features,) when using gSDE\n :param use_expln: Use ``expln()`` function instead of ``exp()`` to ensure\n a positive standard deviation (cf paper). It allows to keep variance\n above zero and prevent it from growing too fast. In practice, ``exp()`` is usually enough.\n :param squash_output: Whether to squash the output using a tanh function,\n this allows to ensure boundaries when using gSDE.\n :param features_extractor_class: Features extractor to use.\n :param features_extractor_kwargs: Keyword arguments\n to pass to the features extractor.\n :param share_features_extractor: If True, the features extractor is shared between the policy and value networks.\n :param normalize_images: Whether to normalize images or not,\n dividing by 255.0 (True by default)\n :param optimizer_class: The optimizer to use,\n ``th.optim.Adam`` by default\n :param optimizer_kwargs: Additional keyword arguments,\n excluding the learning rate, to pass to the optimizer\n ",
7
+ "__init__": "<function ActorCriticPolicy.__init__ at 0x7f23f21ea680>",
8
+ "_get_constructor_parameters": "<function ActorCriticPolicy._get_constructor_parameters at 0x7f23f21ea710>",
9
+ "reset_noise": "<function ActorCriticPolicy.reset_noise at 0x7f23f21ea7a0>",
10
+ "_build_mlp_extractor": "<function ActorCriticPolicy._build_mlp_extractor at 0x7f23f21ea830>",
11
+ "_build": "<function ActorCriticPolicy._build at 0x7f23f21ea8c0>",
12
+ "forward": "<function ActorCriticPolicy.forward at 0x7f23f21ea950>",
13
+ "extract_features": "<function ActorCriticPolicy.extract_features at 0x7f23f21ea9e0>",
14
+ "_get_action_dist_from_latent": "<function ActorCriticPolicy._get_action_dist_from_latent at 0x7f23f21eaa70>",
15
+ "_predict": "<function ActorCriticPolicy._predict at 0x7f23f21eab00>",
16
+ "evaluate_actions": "<function ActorCriticPolicy.evaluate_actions at 0x7f23f21eab90>",
17
+ "get_distribution": "<function ActorCriticPolicy.get_distribution at 0x7f23f21eac20>",
18
+ "predict_values": "<function ActorCriticPolicy.predict_values at 0x7f23f21eacb0>",
19
  "__abstractmethods__": "frozenset()",
20
+ "_abc_impl": "<_abc._abc_data object at 0x7f23f21dbc80>"
21
  },
22
  "verbose": 1,
23
  "policy_kwargs": {},
24
+ "num_timesteps": 2015232,
25
+ "_total_timesteps": 2000000,
26
  "_num_timesteps_at_start": 0,
27
  "seed": null,
28
  "action_noise": null,
29
+ "start_time": 1685968980168974344,
30
  "learning_rate": 0.0003,
31
  "tensorboard_log": null,
32
  "_last_obs": {
33
  ":type:": "<class 'numpy.ndarray'>",
34
+ ":serialized:": "gAWVdQIAAAAAAACMEm51bXB5LmNvcmUubnVtZXJpY5SMC19mcm9tYnVmZmVylJOUKJYAAgAAAAAAAM1fgL5VHko/6My+Pb8V/75aYwO/+jZkPgAAAAAAAAAAGop9PR0mkD/pyig+LU75vqq/zz1Ao3k9AAAAAAAAAADm2Ae9wxlMumjEy7P6aRkvafaDunqxszMAAIA/AACAPxoKNL08J4s/LoqWvfEw076U6iW+qEjAvQAAAAAAAAAAGkMCPh7RLT/W6WK8lIT6vpMAKz7e1Uy9AAAAAAAAAACaV5U8yyzHPQF1vr2rQZa+4uK3PNhltL0AAAAAAAAAAM3UHDwpAGi64hActjyqCbFBtg+6ouBDNQAAgD8AAIA/ZoVkvhhRgj9GV5u+eybHvtUJAL8zoB6+AAAAAAAAAADNt4u8rwatPtBx8j2Altm+LaLUPbKQjT0AAAAAAAAAAACoGb1/87I/qo88v2SpK76Nqss8pN3APAAAAAAAAAAAM6SXPDbZbrxXeMu8oFt7PR5knDozntw6AACAPwAAgD+asRw9SBWBuv3OLTcio/Exo9MWu15tS7YAAIA/AACAP3qNnT7MyQ4/KrAxvqaABL8jnoo+GtiCvgAAAAAAAAAAs8ZePY/eebr+oEqyDJ6EMPmMczjHTMwyAACAPwAAgD8AChU+pO2oP6fbIj/Sx+u+1jQ/PqFhvD4AAAAAAAAAAGYxpDz2OFi6brwzM3udILDeKIO79JjKswAAgD8AAIA/lIwFbnVtcHmUjAVkdHlwZZSTlIwCZjSUiYiHlFKUKEsDjAE8lE5OTkr/////Sv////9LAHSUYksQSwiGlIwBQ5R0lFKULg=="
35
  },
36
  "_last_episode_starts": {
37
  ":type:": "<class 'numpy.ndarray'>",
38
+ ":serialized:": "gAWVgwAAAAAAAACMEm51bXB5LmNvcmUubnVtZXJpY5SMC19mcm9tYnVmZmVylJOUKJYQAAAAAAAAAAAAAAAAAAAAAAAAAAAAAACUjAVudW1weZSMBWR0eXBllJOUjAJiMZSJiIeUUpQoSwOMAXyUTk5OSv////9K/////0sAdJRiSxCFlIwBQ5R0lFKULg=="
39
  },
40
  "_last_original_obs": null,
41
  "_episode_num": 0,
42
  "use_sde": false,
43
  "sde_sample_freq": -1,
44
+ "_current_progress_remaining": -0.007616000000000067,
45
  "_stats_window_size": 100,
46
  "ep_info_buffer": {
47
  ":type:": "<class 'collections.deque'>",
48
+ ":serialized:": "gAWV5QsAAAAAAACMC2NvbGxlY3Rpb25zlIwFZGVxdWWUk5QpS2SGlFKUKH2UKIwBcpRHQHGDzJyQxN+MAWyUS+2MAXSUR0CbfZrTYukDdX2UKGgGR0BxXlvP1L8KaAdL3mgIR0CbfarVOKwZdX2UKGgGR8ACkTDfm9xqaAdLgWgIR0CbfarhzeXSdX2UKGgGR0Bx321pj+aSaAdL12gIR0Cbfan/1g6VdX2UKGgGR0ByC6XfIjnnaAdL7mgIR0CbfbbYsd1ddX2UKGgGR0BxNqB3A2ycaAdLyWgIR0CbfdXiR4hVdX2UKGgGR0BxoKimEXchaAdL9GgIR0CbffI0qH45dX2UKGgGR0BxfwZVGTcJaAdL3GgIR0CbfflSjxkNdX2UKGgGR0BwHmDJ2dNGaAdL0mgIR0CbfpMHryDqdX2UKGgGR0BtWxAnlXA/aAdL3mgIR0Cbfp90ihWYdX2UKGgGR0ByvpF2FFlTaAdL4GgIR0Cbftnm7rcCdX2UKGgGR0BxkO6bvw3HaAdL1GgIR0CbfxicoYvWdX2UKGgGR0Byvt2ECeVcaAdL5GgIR0Cbf619fCyhdX2UKGgGR0BMJr7O3UhFaAdLlGgIR0CbgHp22XsxdX2UKGgGR0BwbPtBv73xaAdL6mgIR0CbgIxWDHwPdX2UKGgGR0BxI45IYm9haAdL6WgIR0CbgTQFLWZrdX2UKGgGR0Bw0HsmfGuLaAdL82gIR0CbgVetjkMkdX2UKGgGR0ByMInQY1pCaAdL0mgIR0CbgeHQhOgydX2UKGgGR0BzYONYKYzBaAdL3WgIR0CbghO/L1VYdX2UKGgGR0Bwn8J9iMHbaAdL42gIR0Cbgjj2zv7WdX2UKGgGR0BwfHMY/FBIaAdL52gIR0CbgkA3T/hmdX2UKGgGR0ByxjiOvMbFaAdL6mgIR0Cbgoxsl9jPdX2UKGgGR0Bw5ATSLIgeaAdLzGgIR0Cbgs6XBxgidX2UKGgGR0BxLYm9g4OuaAdL8WgIR0CbgtcLBsQ/dX2UKGgGR0BvPhlDneSCaAdL8mgIR0CbguQ9zOopdX2UKGgGR0Byoha4c3l0aAdL2WgIR0Cbg21Gb1AadX2UKGgGR0BxT5U4rBj4aAdL9WgIR0Cbg76CDmKZdX2UKGgGR0Bx0Chwl0HRaAdL92gIR0CbhF2WpqASdX2UKGgGR0BSqm69TP0JaAdLtmgIR0CbhHZOzposdX2UKGgGR0BxG3Uaya/iaAdL7GgIR0CblK+jua4MdX2UKGgGR0BxMPvc8DB/aAdL2mgIR0CblSTPjXFtdX2UKGgGR0BwMZXKbKA8aAdL3GgIR0Cbld4xUNrkdX2UKGgGR0BwA5A+pwS8aAdL4WgIR0Cblh5P/JeWdX2UKGgGR0BxlShvitJWaAdLy2gIR0Cblp1/lQuVdX2UKGgGR0ByLX3pOerdaAdLyWgIR0Cblp2Pkq+bdX2UKGgGR0BuSyH446wMaAdL4GgIR0Cblto+wC8wdX2UKGgGR0BzKMzO5avBaAdLwmgIR0CblzzDGcWkdX2UKGgGR0ByDZr0rbxmaAdLzWgIR0Cblz01ZTybdX2UKGgGR0BwVjopx3mnaAdL3GgIR0CbmBKeTV2BdX2UKGgGR0BwiIKCxu89aAdNBgFoCEdAm5hQ3gk1M3V9lChoBkdAcbt8LKFIu2gHS/hoCEdAm5j/h2nsLXV9lChoBkdAcZqk9lmOEWgHS/FoCEdAm5mOK0lZ5nV9lChoBkdAcC0OPNmlImgHS/NoCEdAm5oM/MW43HV9lChoBkdAcnWGqxTsIGgHS9xoCEdAm5pdCiRGMHV9lChoBkdAcUfQFcIJJGgHS+VoCEdAm5qAI+nqFHV9lChoBkdAcNcnuiN83WgHS/FoCEdAm5t3YlIEsHV9lChoBkdAc0ldS2phnmgHS+poCEdAm5vpSR8tw3V9lChoBkdAcCTyn1nM+2gHS9toCEdAm5zN6gM+eXV9lChoBkdAcQUXhfjS5WgHS/doCEdAm51SP2f03HV9lChoBkdAcwrMoc7yQWgHS99oCEdAm513Ov+wT3V9lChoBkdAclg1anrIHWgHS9toCEdAm52KHfuTinV9lChoBkdAcRw+/gzguWgHS9ZoCEdAm526zE74jHV9lChoBkdAccZLxZuAJGgHS+9oCEdAm53yjk+5fHV9lChoBkdAcTXgbZOBUmgHS9JoCEdAm55koa1kUnV9lChoBkdAcIzQl8gIQmgHS/VoCEdAm56iUornT3V9lChoBkdAcfFC4z7/GWgHS79oCEdAm566FuejEnV9lChoBkdAcVFjbBXS0GgHS+FoCEdAm58Q0TDfnHV9lChoBkdAbfXXd0q6OGgHS9doCEdAm5/8XBP9DXV9lChoBkdAcStFb3XZoWgHS9ZoCEdAm6B80cfeUXV9lChoBkdAbtE+Yc/+sGgHS9doCEdAm6D8ABDG+HV9lChoBkdAcvp2P1ct5GgHTQMBaAhHQJuiTTH80k51fZQoaAZHQHQSgeV9nbtoB0vRaAhHQJuiaVpsXSB1fZQoaAZHQHHLSq6vq1RoB0v0aAhHQJujJBKL8791fZQoaAZHQHCWjCxeLNxoB0vbaAhHQJukaEsasIV1fZQoaAZHQG+CQN9YwItoB0v8aAhHQJulFOvdM0x1fZQoaAZHQHAyarvLHMloB0voaAhHQJulNVBD5TJ1fZQoaAZHQHFPxBVuJk5oB0vKaAhHQJulNe6Zpi91fZQoaAZHQHOsp1vES/VoB0vbaAhHQJulQGNaQmx1fZQoaAZHQHAFUQ9RrJtoB0viaAhHQJulPxRVIZt1fZQoaAZHQHOzu1WsA/9oB0vGaAhHQJulV9srNGF1fZQoaAZHQHFl6F/QSjBoB0vwaAhHQJulZwcYIjZ1fZQoaAZHQHDEAOe8PFxoB0vdaAhHQJumbz7MxGl1fZQoaAZHQG+d1TR6WxBoB0vxaAhHQJumr2TPjXF1fZQoaAZHQHMgTfR/mT1oB0u9aAhHQJunWt5le4V1fZQoaAZHQHFOCZ0CA+ZoB0vzaAhHQJuoDnjhky11fZQoaAZHQG9Sk87p3X9oB0vqaAhHQJuoRS9/SYx1fZQoaAZHQHGFOhbnoxJoB0vaaAhHQJup3M+u/1x1fZQoaAZHQHIhaYu01IloB0vyaAhHQJup5fnfVI91fZQoaAZHQHO3HsolUqBoB00CAWgIR0CbqlTb349HdX2UKGgGR0BxQK3BpHqeaAdL1WgIR0CbqpGUfPondX2UKGgGR0BzrbmknCwbaAdL2mgIR0CbqyeTmnwYdX2UKGgGR0BuGBb8m8dxaAdL5mgIR0Cbq1X/YJ3QdX2UKGgGR0Bv4T4DcM3IaAdL7GgIR0Cbq5Bltj0+dX2UKGgGR0Bw0y2CuloEaAdL72gIR0Cbq8ISlFc6dX2UKGgGR0BzBdqUNayKaAdL0mgIR0Cbq+1AJLM+dX2UKGgGR0BzcHmwJPZaaAdLzmgIR0CbrAir1dxAdX2UKGgGR0BySf7el9BsaAdL/GgIR0CbrAafSQYDdX2UKGgGR0BxuCLUCq6waAdNAQFoCEdAm6wQFLWZqnV9lChoBkdAcaTKvmoze2gHTREBaAhHQJusX30wrUd1fZQoaAZHQHB+oKIBRyhoB0vdaAhHQJusvgpBomJ1fZQoaAZHQHGcMJY1YQtoB0vHaAhHQJus5R2r4nF1fZQoaAZHQHA0exKQJX1oB0vsaAhHQJuthFDv3Jx1fZQoaAZHQHGRTMvAXVNoB0vdaAhHQJuusUrTYul1fZQoaAZHQG+Iz4cm0E5oB0vlaAhHQJuu2h11W811fZQoaAZHQHM3y0OVgQZoB0vVaAhHQJuvMOtnwod1fZQoaAZHQHLbWjfvWpZoB0v2aAhHQJuvry9VWCF1fZQoaAZHQHNi903fhuRoB0vbaAhHQJuv498qnWJ1fZQoaAZHQHE53Ytg8bJoB0vNaAhHQJuv9tKqXF91fZQoaAZHQHNjtSEUTL5oB0veaAhHQJuwHcHnln11fZQoaAZHQHMX5IDoyKxoB0vVaAhHQJuweW6bvw51ZS4="
49
  },
50
  "ep_success_buffer": {
51
  ":type:": "<class 'collections.deque'>",
52
  ":serialized:": "gAWVIAAAAAAAAACMC2NvbGxlY3Rpb25zlIwFZGVxdWWUk5QpS2SGlFKULg=="
53
  },
54
+ "_n_updates": 492,
55
  "observation_space": {
56
  ":type:": "<class 'gymnasium.spaces.box.Box'>",
57
  ":serialized:": "gAWVcAIAAAAAAACMFGd5bW5hc2l1bS5zcGFjZXMuYm94lIwDQm94lJOUKYGUfZQojAVkdHlwZZSMBW51bXB5lGgFk5SMAmY0lImIh5RSlChLA4wBPJROTk5K/////0r/////SwB0lGKMDWJvdW5kZWRfYmVsb3eUjBJudW1weS5jb3JlLm51bWVyaWOUjAtfZnJvbWJ1ZmZlcpSTlCiWCAAAAAAAAAABAQEBAQEBAZRoB4wCYjGUiYiHlFKUKEsDjAF8lE5OTkr/////Sv////9LAHSUYksIhZSMAUOUdJRSlIwNYm91bmRlZF9hYm92ZZRoECiWCAAAAAAAAAABAQEBAQEBAZRoFEsIhZRoGHSUUpSMBl9zaGFwZZRLCIWUjANsb3eUaBAoliAAAAAAAAAAAAC0wgAAtMIAAKDAAACgwNsPScAAAKDAAAAAgAAAAICUaApLCIWUaBh0lFKUjARoaWdolGgQKJYgAAAAAAAAAAAAtEIAALRCAACgQAAAoEDbD0lAAACgQAAAgD8AAIA/lGgKSwiFlGgYdJRSlIwIbG93X3JlcHKUjFtbLTkwLiAgICAgICAgLTkwLiAgICAgICAgIC01LiAgICAgICAgIC01LiAgICAgICAgIC0zLjE0MTU5MjcgIC01LgogIC0wLiAgICAgICAgIC0wLiAgICAgICBdlIwJaGlnaF9yZXBylIxTWzkwLiAgICAgICAgOTAuICAgICAgICAgNS4gICAgICAgICA1LiAgICAgICAgIDMuMTQxNTkyNyAgNS4KICAxLiAgICAgICAgIDEuICAgICAgIF2UjApfbnBfcmFuZG9tlE51Yi4=",
ppo-LunarLander-v2/policy.optimizer.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:d28767766512ca90900fd048bf56e7ca910b830efcda620aea07d4e1311db2a4
3
  size 87929
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0336023c1a7c573c46c504544dde67009db506392cfd3571c04770965dcbfac2
3
  size 87929
ppo-LunarLander-v2/policy.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:0487a8c4ade92684dfa3d8cc81a3b16aa00562c98e0e083b1e5c9518e6b25627
3
  size 43329
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:57a30c01c1928a1627c353ff868bd63139afb15aa3200cfc8599fb1a83b94e51
3
  size 43329
replay.mp4 CHANGED
Binary files a/replay.mp4 and b/replay.mp4 differ
 
results.json CHANGED
@@ -1 +1 @@
1
- {"mean_reward": 277.80892382852636, "std_reward": 16.215863338688838, "is_deterministic": true, "n_eval_episodes": 10, "eval_datetime": "2023-06-03T02:40:40.772755"}
 
1
+ {"mean_reward": 283.35054041649585, "std_reward": 20.401455067585868, "is_deterministic": true, "n_eval_episodes": 10, "eval_datetime": "2023-06-05T13:13:40.169995"}