Commit ·
bbb6fc1
1
Parent(s): 4f27e4a
PPO LunarLander-v2 after hpo
Browse files- README.md +1 -1
- config.json +1 -1
- ppo_lunarlander-v2_hpo.zip +3 -0
- ppo_lunarlander-v2_hpo/_stable_baselines3_version +1 -0
- ppo_lunarlander-v2_hpo/data +98 -0
- ppo_lunarlander-v2_hpo/policy.optimizer.pth +3 -0
- ppo_lunarlander-v2_hpo/policy.pth +3 -0
- ppo_lunarlander-v2_hpo/pytorch_variables.pth +3 -0
- ppo_lunarlander-v2_hpo/system_info.txt +7 -0
- replay.mp4 +0 -0
- results.json +1 -1
README.md
CHANGED
|
@@ -16,7 +16,7 @@ model-index:
|
|
| 16 |
type: LunarLander-v2
|
| 17 |
metrics:
|
| 18 |
- type: mean_reward
|
| 19 |
-
value:
|
| 20 |
name: mean_reward
|
| 21 |
verified: false
|
| 22 |
---
|
|
|
|
| 16 |
type: LunarLander-v2
|
| 17 |
metrics:
|
| 18 |
- type: mean_reward
|
| 19 |
+
value: 119.96 +/- 120.32
|
| 20 |
name: mean_reward
|
| 21 |
verified: false
|
| 22 |
---
|
config.json
CHANGED
|
@@ -1 +1 @@
|
|
| 1 |
-
{"policy_class": {":type:": "<class 'abc.ABCMeta'>", ":serialized:": "gAWVOwAAAAAAAACMIXN0YWJsZV9iYXNlbGluZXMzLmNvbW1vbi5wb2xpY2llc5SMEUFjdG9yQ3JpdGljUG9saWN5lJOULg==", "__module__": "stable_baselines3.common.policies", "__doc__": "\n Policy class for actor-critic algorithms (has both policy and value prediction).\n Used by A2C, PPO and the likes.\n\n :param observation_space: Observation space\n :param action_space: Action space\n :param lr_schedule: Learning rate schedule (could be constant)\n :param net_arch: The specification of the policy and value networks.\n :param activation_fn: Activation function\n :param ortho_init: Whether to use or not orthogonal initialization\n :param use_sde: Whether to use State Dependent Exploration or not\n :param log_std_init: Initial value for the log standard deviation\n :param full_std: Whether to use (n_features x n_actions) parameters\n for the std instead of only (n_features,) when using gSDE\n :param use_expln: Use ``expln()`` function instead of ``exp()`` to ensure\n a positive standard deviation (cf paper). It allows to keep variance\n above zero and prevent it from growing too fast. In practice, ``exp()`` is usually enough.\n :param squash_output: Whether to squash the output using a tanh function,\n this allows to ensure boundaries when using gSDE.\n :param features_extractor_class: Features extractor to use.\n :param features_extractor_kwargs: Keyword arguments\n to pass to the features extractor.\n :param share_features_extractor: If True, the features extractor is shared between the policy and value networks.\n :param normalize_images: Whether to normalize images or not,\n dividing by 255.0 (True by default)\n :param optimizer_class: The optimizer to use,\n ``th.optim.Adam`` by default\n :param optimizer_kwargs: Additional keyword arguments,\n excluding the learning rate, to pass to the optimizer\n ", "__init__": "<function ActorCriticPolicy.__init__ at 0x7fa995a5a280>", "_get_constructor_parameters": "<function ActorCriticPolicy._get_constructor_parameters at 0x7fa995a5a310>", "reset_noise": "<function ActorCriticPolicy.reset_noise at 0x7fa995a5a3a0>", "_build_mlp_extractor": "<function ActorCriticPolicy._build_mlp_extractor at 0x7fa995a5a430>", "_build": "<function ActorCriticPolicy._build at 0x7fa995a5a4c0>", "forward": "<function ActorCriticPolicy.forward at 0x7fa995a5a550>", "extract_features": "<function ActorCriticPolicy.extract_features at 0x7fa995a5a5e0>", "_get_action_dist_from_latent": "<function ActorCriticPolicy._get_action_dist_from_latent at 0x7fa995a5a670>", "_predict": "<function ActorCriticPolicy._predict at 0x7fa995a5a700>", "evaluate_actions": "<function ActorCriticPolicy.evaluate_actions at 0x7fa995a5a790>", "get_distribution": "<function ActorCriticPolicy.get_distribution at 0x7fa995a5a820>", "predict_values": "<function ActorCriticPolicy.predict_values at 0x7fa995a5a8b0>", "__abstractmethods__": "frozenset()", "_abc_impl": "<_abc_data object at 0x7fa995ad1bd0>"}, "verbose": 1, "policy_kwargs": {}, "observation_space": {":type:": "<class 'gym.spaces.box.Box'>", ":serialized:": "gAWVnwEAAAAAAACMDmd5bS5zcGFjZXMuYm94lIwDQm94lJOUKYGUfZQojAVkdHlwZZSMBW51bXB5lGgFk5SMAmY0lImIh5RSlChLA4wBPJROTk5K/////0r/////SwB0lGKMBl9zaGFwZZRLCIWUjANsb3eUjBJudW1weS5jb3JlLm51bWVyaWOUjAtfZnJvbWJ1ZmZlcpSTlCiWIAAAAAAAAAAAAID/AACA/wAAgP8AAID/AACA/wAAgP8AAID/AACA/5RoCksIhZSMAUOUdJRSlIwEaGlnaJRoEiiWIAAAAAAAAAAAAIB/AACAfwAAgH8AAIB/AACAfwAAgH8AAIB/AACAf5RoCksIhZRoFXSUUpSMDWJvdW5kZWRfYmVsb3eUaBIolggAAAAAAAAAAAAAAAAAAACUaAeMAmIxlImIh5RSlChLA4wBfJROTk5K/////0r/////SwB0lGJLCIWUaBV0lFKUjA1ib3VuZGVkX2Fib3ZllGgSKJYIAAAAAAAAAAAAAAAAAAAAlGghSwiFlGgVdJRSlIwKX25wX3JhbmRvbZROdWIu", "dtype": "float32", "_shape": [8], "low": "[-inf -inf -inf -inf -inf -inf -inf -inf]", "high": "[inf inf inf inf inf inf inf inf]", "bounded_below": "[False False False False False False False False]", "bounded_above": "[False False False False False False False False]", "_np_random": null}, "action_space": {":type:": "<class 'gym.spaces.discrete.Discrete'>", ":serialized:": "gAWVggAAAAAAAACME2d5bS5zcGFjZXMuZGlzY3JldGWUjAhEaXNjcmV0ZZSTlCmBlH2UKIwBbpRLBIwGX3NoYXBllCmMBWR0eXBllIwFbnVtcHmUaAeTlIwCaTiUiYiHlFKUKEsDjAE8lE5OTkr/////Sv////9LAHSUYowKX25wX3JhbmRvbZROdWIu", "n": 4, "_shape": [], "dtype": "int64", "_np_random": null}, "n_envs": 16, "num_timesteps": 1001472, "_total_timesteps": 1000000, "_num_timesteps_at_start": 0, "seed": null, "action_noise": null, "start_time": 1679385416731872502, "learning_rate": 0.0005022723199591951, "tensorboard_log": null, "lr_schedule": {":type:": "<class 'function'>", ":serialized:": "gAWVJQMAAAAAAACMF2Nsb3VkcGlja2xlLmNsb3VkcGlja2xllIwOX21ha2VfZnVuY3Rpb26Uk5QoaACMDV9idWlsdGluX3R5cGWUk5SMCENvZGVUeXBllIWUUpQoSwFLAEsASwFLAUsTQwSIAFMAlE6FlCmMAV+UhZSMeS9ob21lL3hhdmkvRG9jdW1lbnRzL3Byb2plY3RzL0RlZXBSTC1odWdnaW5nZmFjZS9kZWVwcmwtZW52L2xpYi9weXRob24zLjgvc2l0ZS1wYWNrYWdlcy9zdGFibGVfYmFzZWxpbmVzMy9jb21tb24vdXRpbHMucHmUjARmdW5jlEuCQwIAAZSMA3ZhbJSFlCl0lFKUfZQojAtfX3BhY2thZ2VfX5SMGHN0YWJsZV9iYXNlbGluZXMzLmNvbW1vbpSMCF9fbmFtZV9flIwec3RhYmxlX2Jhc2VsaW5lczMuY29tbW9uLnV0aWxzlIwIX19maWxlX1+UjHkvaG9tZS94YXZpL0RvY3VtZW50cy9wcm9qZWN0cy9EZWVwUkwtaHVnZ2luZ2ZhY2UvZGVlcHJsLWVudi9saWIvcHl0aG9uMy44L3NpdGUtcGFja2FnZXMvc3RhYmxlX2Jhc2VsaW5lczMvY29tbW9uL3V0aWxzLnB5lHVOTmgAjBBfbWFrZV9lbXB0eV9jZWxslJOUKVKUhZR0lFKUjBxjbG91ZHBpY2tsZS5jbG91ZHBpY2tsZV9mYXN0lIwSX2Z1bmN0aW9uX3NldHN0YXRllJOUaB99lH2UKGgWaA2MDF9fcXVhbG5hbWVfX5SMGWNvbnN0YW50X2ZuLjxsb2NhbHM+LmZ1bmOUjA9fX2Fubm90YXRpb25zX1+UfZSMDl9fa3dkZWZhdWx0c19flE6MDF9fZGVmYXVsdHNfX5ROjApfX21vZHVsZV9flGgXjAdfX2RvY19flE6MC19fY2xvc3VyZV9flGgAjApfbWFrZV9jZWxslJOURz9AdV2YDXX3hZRSlIWUjBdfY2xvdWRwaWNrbGVfc3VibW9kdWxlc5RdlIwLX19nbG9iYWxzX1+UfZR1hpSGUjAu"}, "_last_obs": {":type:": "<class 'numpy.ndarray'>", ":serialized:": "gAWVdQIAAAAAAACMEm51bXB5LmNvcmUubnVtZXJpY5SMC19mcm9tYnVmZmVylJOUKJYAAgAAAAAAAOYYFT55zGg/coeePrIPUb/G2Y8+usPZvAAAAAAAAAAAAAOtvBLkuDxnDLq8aoYDvgd8MjyaltO7AAAAAAAAAADNaNK7SAbEOy4uAzuCNKC9Y/ErPA+jQDwAAAAAAAAAAM3EYj2+4bM/Aj4pP0P0/b2xf1W8R73JPQAAAAAAAAAAGs8Jvs/7Yj7tFR8++8divvtJFD3TPlU9AAAAAAAAAAAa3wo9j34Wum9ISbt6k5s3aCA/u8wCFDoAAIA/AACAPwgwgr5SXYE8steHOn+JwLgFIAq+KnSjuQAAgD8AAIA/jZAaPsxxEj+65V88U7Rhv5oy7z3qgXe8AAAAAAAAAACGVSa+8R7JPVi9u7uCNoK9+g4aveUD/rwAAAAAAAAAAJpGjTwcox09Q6qvveLOTb3VYv68qqg1vAAAAAAAAAAATUMmPoPpVD1iYv88WuqZv2bRp7334YO+AAAAAAAAAACAoBY9e1SIumavyDpvxei0uzMgu/3T5LkAAIA/AACAP82rBL0ImA0/Elw3vH5lMb81zjg7vv+TPQAAAAAAAAAAU0Clvi3tHj/PTBa9XP4rv2ajEr6INsk9AAAAAAAAAAD6LSi+5o4pP/GdM74Jugy/PSMPvvqhfDwAAAAAAAAAAM12NLwkK7U//ZqKvkeSIjxCwGE8TbUSPQAAAAAAAAAAlIwFbnVtcHmUjAVkdHlwZZSTlIwCZjSUiYiHlFKUKEsDjAE8lE5OTkr/////Sv////9LAHSUYksQSwiGlIwBQ5R0lFKULg=="}, "_last_episode_starts": {":type:": "<class 'numpy.ndarray'>", ":serialized:": "gAWVgwAAAAAAAACMEm51bXB5LmNvcmUubnVtZXJpY5SMC19mcm9tYnVmZmVylJOUKJYQAAAAAAAAAAAAAAAAAAAAAAAAAAAAAACUjAVudW1weZSMBWR0eXBllJOUjAJiMZSJiIeUUpQoSwOMAXyUTk5OSv////9K/////0sAdJRiSxCFlIwBQ5R0lFKULg=="}, "_last_original_obs": null, "_episode_num": 0, "use_sde": false, "sde_sample_freq": -1, "_current_progress_remaining": -0.0014719999999999178, "ep_info_buffer": {":type:": "<class 'collections.deque'>", ":serialized:": "gAWVLhAAAAAAAACMC2NvbGxlY3Rpb25zlIwFZGVxdWWUk5QpS2SGlFKUKH2UKIwBcpSMFW51bXB5LmNvcmUubXVsdGlhcnJheZSMBnNjYWxhcpSTlIwFbnVtcHmUjAVkdHlwZZSTlIwCZjiUiYiHlFKUKEsDjAE8lE5OTkr/////Sv////9LAHSUYkMIdCmuKvtmOUCUhpRSlIwBbJRLdYwBdJRHQKM59lBhQWN1fZQoaAZoCWgPQwgdxw+VBuBwQJSGlFKUaBVL22gWR0CjOi0ahpQDdX2UKGgGaAloD0MIwtoYO+EVcUCUhpRSlGgVS8ZoFkdAoz7XykKu0XV9lChoBmgJaA9DCHuIRneQInFAlIaUUpRoFUvpaBZHQKM/FF8XvYx1fZQoaAZoCWgPQwiwrDQpBS1AwJSGlFKUaBVLZGgWR0CjPxjP4VRDdX2UKGgGaAloD0MIQfM5d7skR0CUhpRSlGgVS3doFkdAoz816NVBEHV9lChoBmgJaA9DCCuiJvp8F1jAlIaUUpRoFUtaaBZHQKM/POmixml1fZQoaAZoCWgPQwg1JVmHo0NtQJSGlFKUaBVLymgWR0CjP2LPD50sdX2UKGgGaAloD0MIeTwtP/CwbkCUhpRSlGgVS9toFkdAoz+sc6vJR3V9lChoBmgJaA9DCNNmnIZoDXJAlIaUUpRoFUvMaBZHQKM/zisGPgh1fZQoaAZoCWgPQwgJNUOqqFtwQJSGlFKUaBVLrGgWR0CjP80fYBeYdX2UKGgGaAloD0MIi+JV1nY+c0CUhpRSlGgVS9BoFkdAoz/ebd8ArHV9lChoBmgJaA9DCANgPIPGhHNAlIaUUpRoFUu6aBZHQKM/7P9DQZ51fZQoaAZoCWgPQwgriIGufRdOwJSGlFKUaBVLVmgWR0CjP/ZrP+n7dX2UKGgGaAloD0MI58b0hCU+ckCUhpRSlGgVS+5oFkdAo0A0jNY8uHV9lChoBmgJaA9DCM/AyMuaJDJAlIaUUpRoFUthaBZHQKNE24MnZ011fZQoaAZoCWgPQwih2uBEtFBwQJSGlFKUaBVL2GgWR0CjRNuxrzoVdX2UKGgGaAloD0MIey3ovTHqTkCUhpRSlGgVS31oFkdAo0Tqjafzz3V9lChoBmgJaA9DCIDTu3g/EHJAlIaUUpRoFUvbaBZHQKNFJ2IO6NF1fZQoaAZoCWgPQwjOcAM+P4z5v5SGlFKUaBVLXGgWR0CjRWLE9+w1dX2UKGgGaAloD0MIkUPEzSlDb0CUhpRSlGgVS91oFkdAo0Vo9aEBbXV9lChoBmgJaA9DCGuCqPvAnnBAlIaUUpRoFUuxaBZHQKNGVQ+lj3F1fZQoaAZoCWgPQwiIEFfO3ulLQJSGlFKUaBVLdGgWR0CjSqvcJtzkdX2UKGgGaAloD0MIFmniHeAOcUCUhpRSlGgVS+xoFkdAo0rBH09QoHV9lChoBmgJaA9DCL9FJ0utfHBAlIaUUpRoFUvJaBZHQKNK8ImgJ1J1fZQoaAZoCWgPQwheZtgoaztwQJSGlFKUaBVL1mgWR0CjS0vMSsbOdX2UKGgGaAloD0MI3Lqbp/rRcECUhpRSlGgVTQwBaBZHQKNLUPAfuCx1fZQoaAZoCWgPQwiI9NvXAXBxQJSGlFKUaBVLu2gWR0CjS8bx/d6+dX2UKGgGaAloD0MIBb8NMV4/cUCUhpRSlGgVS9NoFkdAo0xfJJXhfnV9lChoBmgJaA9DCEax3NLqIXJAlIaUUpRoFU0WAWgWR0CjTG4XGff5dX2UKGgGaAloD0MIKH/3jhogcUCUhpRSlGgVS9ZoFkdAo1NQ9ic5KnV9lChoBmgJaA9DCPUsCOV9XPa/lIaUUpRoFUt0aBZHQKNT4SlFc6h1fZQoaAZoCWgPQwioUx7dCCtyQJSGlFKUaBVNAAFoFkdAo1P3uXu3MXV9lChoBmgJaA9DCBsN4C0Qr3BAlIaUUpRoFUvwaBZHQKNT/1YhdMV1fZQoaAZoCWgPQwjbiCe7mVZvQJSGlFKUaBVLxWgWR0CjVI2XC0ngdX2UKGgGaAloD0MIFAfQ73szcUCUhpRSlGgVS8JoFkdAo1ViBiCrcXV9lChoBmgJaA9DCJRQ+kJIam1AlIaUUpRoFUvRaBZHQKNVfeZ5Rj11fZQoaAZoCWgPQwhywRn8fX5xQJSGlFKUaBVL2WgWR0CjVZQd8zAOdX2UKGgGaAloD0MI0/iFVxIJcECUhpRSlGgVS9doFkdAo1qNC3PRiXV9lChoBmgJaA9DCJBKsaOxOXBAlIaUUpRoFUvKaBZHQKNa1ENOM2p1fZQoaAZoCWgPQwhUrYVZaGcLQJSGlFKUaBVLimgWR0CjWuT/6wdKdX2UKGgGaAloD0MIu2QcI9knTECUhpRSlGgVS3doFkdAo1r/aDf3vnV9lChoBmgJaA9DCErP9BJjNTDAlIaUUpRoFUtZaBZHQKNcJYlpoK51fZQoaAZoCWgPQwhiLT4FQHBvQJSGlFKUaBVLuGgWR0CjXCWzF+/hdX2UKGgGaAloD0MIAp1Jm6pHcUCUhpRSlGgVS9JoFkdAo1yY2Q4jr3V9lChoBmgJaA9DCMxiYvPxuXBAlIaUUpRoFUvKaBZHQKNg/s8gZCR1fZQoaAZoCWgPQwhOmDCalfVMQJSGlFKUaBVLgWgWR0CjYYWovSMMdX2UKGgGaAloD0MI6uqOxbaDb0CUhpRSlGgVS8poFkdAo2G2iYb833V9lChoBmgJaA9DCOF/K9mxEfc/lIaUUpRoFUt2aBZHQKNipX8wYch1fZQoaAZoCWgPQwg/G7luSq5hQJSGlFKUaBVN6ANoFkdAo2O5vkzXSXV9lChoBmgJaA9DCA9iZwqdh0VAlIaUUpRoFUtmaBZHQKNoG6r/82t1fZQoaAZoCWgPQwixw5j092BGQJSGlFKUaBVLmmgWR0CjaIOB+WnkdX2UKGgGaAloD0MIVKhuLv75cECUhpRSlGgVTcwBaBZHQKNo15O8Cgd1fZQoaAZoCWgPQwitad5xSq1yQJSGlFKUaBVNVgFoFkdAo2kDyWiUPnV9lChoBmgJaA9DCKBU+3Q8mG5AlIaUUpRoFUu1aBZHQKNpod92HL11fZQoaAZoCWgPQwjXicvxCg5vQJSGlFKUaBVNCAFoFkdAo2oOgL7XQXV9lChoBmgJaA9DCM/0EmMZj2xAlIaUUpRoFU1cA2gWR0CjamE12q1gdX2UKGgGaAloD0MIr7FLVG/SUcCUhpRSlGgVSz1oFkdAo3Ect29tdnV9lChoBmgJaA9DCGiWBKjpMnBAlIaUUpRoFUvwaBZHQKNy6bwSamZ1fZQoaAZoCWgPQwg5Y5gT9IlwQJSGlFKUaBVLxGgWR0CjcvxwQ176dX2UKGgGaAloD0MIRdREn4++QsCUhpRSlGgVS2VoFkdAo3Mo1pCa7XV9lChoBmgJaA9DCGUdjq7SP0xAlIaUUpRoFUuvaBZHQKNz1KGtZFJ1fZQoaAZoCWgPQwhens4V5a9wQJSGlFKUaBVNlgNoFkdAo3RIhQm/nHV9lChoBmgJaA9DCHJsPUO4iW9AlIaUUpRoFUvfaBZHQKN0Za8Hv+h1fZQoaAZoCWgPQwhkeOxnsRQNQJSGlFKUaBVLXmgWR0CjdHasZHd5dX2UKGgGaAloD0MIbTmX4qpGNUCUhpRSlGgVS4doFkdAo3TURg7YCnV9lChoBmgJaA9DCIem7PSDbV/AlIaUUpRoFUtHaBZHQKN53jriVB51fZQoaAZoCWgPQwjItDaN7YVQwJSGlFKUaBVLWmgWR0Cjed6SDAaedX2UKGgGaAloD0MI8UbmkT8QY8CUhpRSlGgVS2hoFkdAo3oD9ZRsM3V9lChoBmgJaA9DCCo6ksv/VXRAlIaUUpRoFUv8aBZHQKN6Kt6HCXR1fZQoaAZoCWgPQwiC4seYuxZYwJSGlFKUaBVLW2gWR0CjeocvmHQAdX2UKGgGaAloD0MIJ6CJsOEmaECUhpRSlGgVTegDaBZHQKN64xW1c+t1fZQoaAZoCWgPQwgtmWN5VzZgwJSGlFKUaBVLQGgWR0Cje01X/5tWdX2UKGgGaAloD0MI1a90PjwCWMCUhpRSlGgVS3VoFkdAo3tmerdWQ3V9lChoBmgJaA9DCG2RtBt9oD/AlIaUUpRoFUuGaBZHQKN7goaUA1h1fZQoaAZoCWgPQwhMw/ARMYU0QJSGlFKUaBVLP2gWR0CjgFdTHbRGdX2UKGgGaAloD0MI3ncMj/1QMkCUhpRSlGgVS1poFkdAo4CPqoqCpXV9lChoBmgJaA9DCCMUW0FTPXBAlIaUUpRoFUvmaBZHQKOA1TqB3A51fZQoaAZoCWgPQwhi9rLttFNXwJSGlFKUaBVLPWgWR0CjgPTBRAKOdX2UKGgGaAloD0MI+WabG5MJckCUhpRSlGgVTZYBaBZHQKOBCfQKKHh1fZQoaAZoCWgPQwiQv7SoT+BvQJSGlFKUaBVL8mgWR0CjgfJPIn0DdX2UKGgGaAloD0MINrHAV3T7PUCUhpRSlGgVS3xoFkdAo4I8brC3w3V9lChoBmgJaA9DCGwFTUssyWLAlIaUUpRoFUs8aBZHQKOCYFfzBhx1fZQoaAZoCWgPQwj6f9WRIxZwQJSGlFKUaBVL1WgWR0Cjgo2Tot+TdX2UKGgGaAloD0MI/iyWIvnWTcCUhpRSlGgVS19oFkdAo4Kk2LpA2XV9lChoBmgJaA9DCNf5t8t+RS5AlIaUUpRoFUt+aBZHQKOHrBQemvZ1fZQoaAZoCWgPQwjNzMzMjO5wQJSGlFKUaBVL+GgWR0Cjh7MYuTRqdX2UKGgGaAloD0MIUtfa+xQncECUhpRSlGgVTRABaBZHQKOH6ez2OAB1fZQoaAZoCWgPQwgvUFJggaRjQJSGlFKUaBVN6ANoFkdAo4hyrilzl3V9lChoBmgJaA9DCOdwrfawPFTAlIaUUpRoFUtVaBZHQKOIffR/mT11fZQoaAZoCWgPQwh8X1yq0rJTwJSGlFKUaBVLZGgWR0CjiKHSnccmdX2UKGgGaAloD0MI/fUKC+6vL0CUhpRSlGgVS2loFkdAo5BVbHIZInV9lChoBmgJaA9DCCbhQh4BR3BAlIaUUpRoFUvyaBZHQKOQ8Y8+zMR1fZQoaAZoCWgPQwhtxf6yey9uQJSGlFKUaBVLs2gWR0CjkW05+6RRdX2UKGgGaAloD0MI53Ct9rBZUMCUhpRSlGgVS2loFkdAo5GvRqoIfXV9lChoBmgJaA9DCDEKgsc3FmNAlIaUUpRoFU3oA2gWR0Cjkg5f2K2sdX2UKGgGaAloD0MIT3l0IyydcECUhpRSlGgVTTkBaBZHQKOSdcLSeAd1fZQoaAZoCWgPQwjGT+Pe/NBsQJSGlFKUaBVL8mgWR0CjkwAR02cbdX2UKGgGaAloD0MIorYNo6CaY0CUhpRSlGgVTegDaBZHQKOUBaL4vex1fZQoaAZoCWgPQwgaa39ne5JjQJSGlFKUaBVN6ANoFkdAo5QazJIUanVlLg=="}, "ep_success_buffer": {":type:": "<class 'collections.deque'>", ":serialized:": "gAWVIAAAAAAAAACMC2NvbGxlY3Rpb25zlIwFZGVxdWWUk5QpS2SGlFKULg=="}, "_n_updates": 11736, "n_steps": 128, "gamma": 0.988045661427605, "gae_lambda": 0.9768700030979546, "ent_coef": 0.004851331424615018, "vf_coef": 0.9683727099048757, "max_grad_norm": 0.5143831585332781, "batch_size": 128, "n_epochs": 24, "clip_range": {":type:": "<class 'function'>", ":serialized:": "gAWVwwIAAAAAAACMF2Nsb3VkcGlja2xlLmNsb3VkcGlja2xllIwOX21ha2VfZnVuY3Rpb26Uk5QoaACMDV9idWlsdGluX3R5cGWUk5SMCENvZGVUeXBllIWUUpQoSwFLAEsASwFLAUsTQwSIAFMAlE6FlCmMAV+UhZSMSC91c3IvbG9jYWwvbGliL3B5dGhvbjMuOS9kaXN0LXBhY2thZ2VzL3N0YWJsZV9iYXNlbGluZXMzL2NvbW1vbi91dGlscy5weZSMBGZ1bmOUS4JDAgABlIwDdmFslIWUKXSUUpR9lCiMC19fcGFja2FnZV9flIwYc3RhYmxlX2Jhc2VsaW5lczMuY29tbW9ulIwIX19uYW1lX1+UjB5zdGFibGVfYmFzZWxpbmVzMy5jb21tb24udXRpbHOUjAhfX2ZpbGVfX5SMSC91c3IvbG9jYWwvbGliL3B5dGhvbjMuOS9kaXN0LXBhY2thZ2VzL3N0YWJsZV9iYXNlbGluZXMzL2NvbW1vbi91dGlscy5weZR1Tk5oAIwQX21ha2VfZW1wdHlfY2VsbJSTlClSlIWUdJRSlIwcY2xvdWRwaWNrbGUuY2xvdWRwaWNrbGVfZmFzdJSMEl9mdW5jdGlvbl9zZXRzdGF0ZZSTlGgffZR9lChoFmgNjAxfX3F1YWxuYW1lX1+UjBljb25zdGFudF9mbi48bG9jYWxzPi5mdW5jlIwPX19hbm5vdGF0aW9uc19flH2UjA5fX2t3ZGVmYXVsdHNfX5ROjAxfX2RlZmF1bHRzX1+UTowKX19tb2R1bGVfX5RoF4wHX19kb2NfX5ROjAtfX2Nsb3N1cmVfX5RoAIwKX21ha2VfY2VsbJSTlEc/2z1AOneYeIWUUpSFlIwXX2Nsb3VkcGlja2xlX3N1Ym1vZHVsZXOUXZSMC19fZ2xvYmFsc19flH2UdYaUhlIwLg=="}, "clip_range_vf": {":type:": "<class 'function'>", ":serialized:": "gAWVwwIAAAAAAACMF2Nsb3VkcGlja2xlLmNsb3VkcGlja2xllIwOX21ha2VfZnVuY3Rpb26Uk5QoaACMDV9idWlsdGluX3R5cGWUk5SMCENvZGVUeXBllIWUUpQoSwFLAEsASwFLAUsTQwSIAFMAlE6FlCmMAV+UhZSMSC91c3IvbG9jYWwvbGliL3B5dGhvbjMuOS9kaXN0LXBhY2thZ2VzL3N0YWJsZV9iYXNlbGluZXMzL2NvbW1vbi91dGlscy5weZSMBGZ1bmOUS4JDAgABlIwDdmFslIWUKXSUUpR9lCiMC19fcGFja2FnZV9flIwYc3RhYmxlX2Jhc2VsaW5lczMuY29tbW9ulIwIX19uYW1lX1+UjB5zdGFibGVfYmFzZWxpbmVzMy5jb21tb24udXRpbHOUjAhfX2ZpbGVfX5SMSC91c3IvbG9jYWwvbGliL3B5dGhvbjMuOS9kaXN0LXBhY2thZ2VzL3N0YWJsZV9iYXNlbGluZXMzL2NvbW1vbi91dGlscy5weZR1Tk5oAIwQX21ha2VfZW1wdHlfY2VsbJSTlClSlIWUdJRSlIwcY2xvdWRwaWNrbGUuY2xvdWRwaWNrbGVfZmFzdJSMEl9mdW5jdGlvbl9zZXRzdGF0ZZSTlGgffZR9lChoFmgNjAxfX3F1YWxuYW1lX1+UjBljb25zdGFudF9mbi48bG9jYWxzPi5mdW5jlIwPX19hbm5vdGF0aW9uc19flH2UjA5fX2t3ZGVmYXVsdHNfX5ROjAxfX2RlZmF1bHRzX1+UTowKX19tb2R1bGVfX5RoF4wHX19kb2NfX5ROjAtfX2Nsb3N1cmVfX5RoAIwKX21ha2VfY2VsbJSTlEc/2ievqsLa04WUUpSFlIwXX2Nsb3VkcGlja2xlX3N1Ym1vZHVsZXOUXZSMC19fZ2xvYmFsc19flH2UdYaUhlIwLg=="}, "normalize_advantage": true, "target_kl": null, "system_info": {"OS": "Linux-5.15.0-67-generic-x86_64-with-glibc2.29 # 74~20.04.1-Ubuntu SMP Wed Feb 22 14:52:34 UTC 2023", "Python": "3.8.10", "Stable-Baselines3": "1.7.0", "PyTorch": "2.0.0+cu117", "GPU Enabled": "True", "Numpy": "1.24.2", "Gym": "0.21.0"}}
|
|
|
|
| 1 |
+
{"policy_class": {":type:": "<class 'abc.ABCMeta'>", ":serialized:": "gAWVOwAAAAAAAACMIXN0YWJsZV9iYXNlbGluZXMzLmNvbW1vbi5wb2xpY2llc5SMEUFjdG9yQ3JpdGljUG9saWN5lJOULg==", "__module__": "stable_baselines3.common.policies", "__doc__": "\n Policy class for actor-critic algorithms (has both policy and value prediction).\n Used by A2C, PPO and the likes.\n\n :param observation_space: Observation space\n :param action_space: Action space\n :param lr_schedule: Learning rate schedule (could be constant)\n :param net_arch: The specification of the policy and value networks.\n :param activation_fn: Activation function\n :param ortho_init: Whether to use or not orthogonal initialization\n :param use_sde: Whether to use State Dependent Exploration or not\n :param log_std_init: Initial value for the log standard deviation\n :param full_std: Whether to use (n_features x n_actions) parameters\n for the std instead of only (n_features,) when using gSDE\n :param use_expln: Use ``expln()`` function instead of ``exp()`` to ensure\n a positive standard deviation (cf paper). It allows to keep variance\n above zero and prevent it from growing too fast. In practice, ``exp()`` is usually enough.\n :param squash_output: Whether to squash the output using a tanh function,\n this allows to ensure boundaries when using gSDE.\n :param features_extractor_class: Features extractor to use.\n :param features_extractor_kwargs: Keyword arguments\n to pass to the features extractor.\n :param share_features_extractor: If True, the features extractor is shared between the policy and value networks.\n :param normalize_images: Whether to normalize images or not,\n dividing by 255.0 (True by default)\n :param optimizer_class: The optimizer to use,\n ``th.optim.Adam`` by default\n :param optimizer_kwargs: Additional keyword arguments,\n excluding the learning rate, to pass to the optimizer\n ", "__init__": "<function ActorCriticPolicy.__init__ at 0x7fc080fa54c0>", "_get_constructor_parameters": "<function ActorCriticPolicy._get_constructor_parameters at 0x7fc080fa5550>", "reset_noise": "<function ActorCriticPolicy.reset_noise at 0x7fc080fa55e0>", "_build_mlp_extractor": "<function ActorCriticPolicy._build_mlp_extractor at 0x7fc080fa5670>", "_build": "<function ActorCriticPolicy._build at 0x7fc080fa5700>", "forward": "<function ActorCriticPolicy.forward at 0x7fc080fa5790>", "extract_features": "<function ActorCriticPolicy.extract_features at 0x7fc080fa5820>", "_get_action_dist_from_latent": "<function ActorCriticPolicy._get_action_dist_from_latent at 0x7fc080fa58b0>", "_predict": "<function ActorCriticPolicy._predict at 0x7fc080fa5940>", "evaluate_actions": "<function ActorCriticPolicy.evaluate_actions at 0x7fc080fa59d0>", "get_distribution": "<function ActorCriticPolicy.get_distribution at 0x7fc080fa5a60>", "predict_values": "<function ActorCriticPolicy.predict_values at 0x7fc080fa5af0>", "__abstractmethods__": "frozenset()", "_abc_impl": "<_abc_data object at 0x7fc080fa2240>"}, "verbose": 1, "policy_kwargs": {}, "observation_space": {":type:": "<class 'gym.spaces.box.Box'>", ":serialized:": "gAWVnwEAAAAAAACMDmd5bS5zcGFjZXMuYm94lIwDQm94lJOUKYGUfZQojAVkdHlwZZSMBW51bXB5lGgFk5SMAmY0lImIh5RSlChLA4wBPJROTk5K/////0r/////SwB0lGKMBl9zaGFwZZRLCIWUjANsb3eUjBJudW1weS5jb3JlLm51bWVyaWOUjAtfZnJvbWJ1ZmZlcpSTlCiWIAAAAAAAAAAAAID/AACA/wAAgP8AAID/AACA/wAAgP8AAID/AACA/5RoCksIhZSMAUOUdJRSlIwEaGlnaJRoEiiWIAAAAAAAAAAAAIB/AACAfwAAgH8AAIB/AACAfwAAgH8AAIB/AACAf5RoCksIhZRoFXSUUpSMDWJvdW5kZWRfYmVsb3eUaBIolggAAAAAAAAAAAAAAAAAAACUaAeMAmIxlImIh5RSlChLA4wBfJROTk5K/////0r/////SwB0lGJLCIWUaBV0lFKUjA1ib3VuZGVkX2Fib3ZllGgSKJYIAAAAAAAAAAAAAAAAAAAAlGghSwiFlGgVdJRSlIwKX25wX3JhbmRvbZROdWIu", "dtype": "float32", "_shape": [8], "low": "[-inf -inf -inf -inf -inf -inf -inf -inf]", "high": "[inf inf inf inf inf inf inf inf]", "bounded_below": "[False False False False False False False False]", "bounded_above": "[False False False False False False False False]", "_np_random": null}, "action_space": {":type:": "<class 'gym.spaces.discrete.Discrete'>", ":serialized:": "gAWVggAAAAAAAACME2d5bS5zcGFjZXMuZGlzY3JldGWUjAhEaXNjcmV0ZZSTlCmBlH2UKIwBbpRLBIwGX3NoYXBllCmMBWR0eXBllIwFbnVtcHmUaAeTlIwCaTiUiYiHlFKUKEsDjAE8lE5OTkr/////Sv////9LAHSUYowKX25wX3JhbmRvbZROdWIu", "n": 4, "_shape": [], "dtype": "int64", "_np_random": null}, "n_envs": 16, "num_timesteps": 500080, "_total_timesteps": 500000, "_num_timesteps_at_start": 0, "seed": null, "action_noise": null, "start_time": 1679389289642222321, "learning_rate": 0.0005022723199591951, "tensorboard_log": null, "lr_schedule": {":type:": "<class 'function'>", ":serialized:": "gAWVJQMAAAAAAACMF2Nsb3VkcGlja2xlLmNsb3VkcGlja2xllIwOX21ha2VfZnVuY3Rpb26Uk5QoaACMDV9idWlsdGluX3R5cGWUk5SMCENvZGVUeXBllIWUUpQoSwFLAEsASwFLAUsTQwSIAFMAlE6FlCmMAV+UhZSMeS9ob21lL3hhdmkvRG9jdW1lbnRzL3Byb2plY3RzL0RlZXBSTC1odWdnaW5nZmFjZS9kZWVwcmwtZW52L2xpYi9weXRob24zLjgvc2l0ZS1wYWNrYWdlcy9zdGFibGVfYmFzZWxpbmVzMy9jb21tb24vdXRpbHMucHmUjARmdW5jlEuCQwIAAZSMA3ZhbJSFlCl0lFKUfZQojAtfX3BhY2thZ2VfX5SMGHN0YWJsZV9iYXNlbGluZXMzLmNvbW1vbpSMCF9fbmFtZV9flIwec3RhYmxlX2Jhc2VsaW5lczMuY29tbW9uLnV0aWxzlIwIX19maWxlX1+UjHkvaG9tZS94YXZpL0RvY3VtZW50cy9wcm9qZWN0cy9EZWVwUkwtaHVnZ2luZ2ZhY2UvZGVlcHJsLWVudi9saWIvcHl0aG9uMy44L3NpdGUtcGFja2FnZXMvc3RhYmxlX2Jhc2VsaW5lczMvY29tbW9uL3V0aWxzLnB5lHVOTmgAjBBfbWFrZV9lbXB0eV9jZWxslJOUKVKUhZR0lFKUjBxjbG91ZHBpY2tsZS5jbG91ZHBpY2tsZV9mYXN0lIwSX2Z1bmN0aW9uX3NldHN0YXRllJOUaB99lH2UKGgWaA2MDF9fcXVhbG5hbWVfX5SMGWNvbnN0YW50X2ZuLjxsb2NhbHM+LmZ1bmOUjA9fX2Fubm90YXRpb25zX1+UfZSMDl9fa3dkZWZhdWx0c19flE6MDF9fZGVmYXVsdHNfX5ROjApfX21vZHVsZV9flGgXjAdfX2RvY19flE6MC19fY2xvc3VyZV9flGgAjApfbWFrZV9jZWxslJOURz9AdV2YDXX3hZRSlIWUjBdfY2xvdWRwaWNrbGVfc3VibW9kdWxlc5RdlIwLX19nbG9iYWxzX1+UfZR1hpSGUjAu"}, "_last_obs": {":type:": "<class 'numpy.ndarray'>", ":serialized:": "gAWVdQIAAAAAAACMEm51bXB5LmNvcmUubnVtZXJpY5SMC19mcm9tYnVmZmVylJOUKJYAAgAAAAAAAM0ioz7/r4A+Cpy/vU7c1L4oINm81xOLPQAAAAAAAAAA0DWVPiWToD6nC407+0i7vvS2tzqruR+9AAAAAAAAAAAND0w+roGVustb7TxZBTU9QgSVPepAuzoAAIA/AACAP4MoyT5EWe8+1y2hvYYAIL+Zd4i9S1dXvAAAAAAAAAAAjdvjPQpnYbntOPs6koyjtdLlE7lWBJm0AAAAAAAAgD9Ny1Q+XI+yPl3IAr2eski+KUsdvZLI0DsAAAAAAAAAAA2z5T0N7UE+x6fLu7IuV76h1Cs8paICuwAAAAAAAAAAsz2CPghzq7xtjdq5hTgfOIeeGb6CLAg5AACAPwAAgD9gfT8+pORhOjBA0jyqhmU5ajQPPANNRjoAAIA/AACAP3Pcuj0Ayog/4uVHPodz0r6/vO48mje4PAAAAAAAAAAAgOCDvtAPVz/mGUc+V86yvuNgxL71miY+AAAAAAAAAAAGPRI+z0dGvFAAvTxbn+w8SjKXvUQvQ7sAAIA/AACAP/qZS75yrEM/dvq4Pn5fC78nEKW9ihYEPwAAAAAAAAAA5mNyPQUA0jyr4kY9VhcwvgoWyDyH0Km7AAAAAAAAAAAAAHq9Ccx4PR7Tij6zCGq/GWz1PYIeEb0AAAAAAAAAABqDrT5oLuO9+xTFPidSlL0slBW/MSoRPgAAgD8AAIA/lIwFbnVtcHmUjAVkdHlwZZSTlIwCZjSUiYiHlFKUKEsDjAE8lE5OTkr/////Sv////9LAHSUYksQSwiGlIwBQ5R0lFKULg=="}, "_last_episode_starts": {":type:": "<class 'numpy.ndarray'>", ":serialized:": "gAWVgwAAAAAAAACMEm51bXB5LmNvcmUubnVtZXJpY5SMC19mcm9tYnVmZmVylJOUKJYQAAAAAAAAAAAAAAAAAAAAAAAAAAAAAACUjAVudW1weZSMBWR0eXBllJOUjAJiMZSJiIeUUpQoSwOMAXyUTk5OSv////9K/////0sAdJRiSxCFlIwBQ5R0lFKULg=="}, "_last_original_obs": null, "_episode_num": 0, "use_sde": false, "sde_sample_freq": -1, "_current_progress_remaining": -0.00015999999999993797, "ep_info_buffer": {":type:": "<class 'collections.deque'>", ":serialized:": "gAWVQhAAAAAAAACMC2NvbGxlY3Rpb25zlIwFZGVxdWWUk5QpS2SGlFKUKH2UKIwBcpSMFW51bXB5LmNvcmUubXVsdGlhcnJheZSMBnNjYWxhcpSTlIwFbnVtcHmUjAVkdHlwZZSTlIwCZjiUiYiHlFKUKEsDjAE8lE5OTkr/////Sv////9LAHSUYkMIZOWXwRjFOsCUhpRSlIwBbJRL4YwBdJRHQK441Hww0wd1fZQoaAZoCWgPQwgHexNDcjLiv5SGlFKUaBVLp2gWR0CuOp1Da4+bdX2UKGgGaAloD0MIDhDM0eMjRsCUhpRSlGgVS5BoFkdArj4mZqmCRXV9lChoBmgJaA9DCBaFXRQ98OC/lIaUUpRoFUuJaBZHQK4+KF7laKV1fZQoaAZoCWgPQwhsdqT6TlxtQJSGlFKUaBVL5GgWR0CuP+4HoouxdX2UKGgGaAloD0MIyD8ziI8iaECUhpRSlGgVTZsBaBZHQK5Bu8Tzund1fZQoaAZoCWgPQwjf/fFetRIoQJSGlFKUaBVLqmgWR0CuRUpW3jMndX2UKGgGaAloD0MIiesYV1zVbUCUhpRSlGgVTQABaBZHQK5Rwyon8bd1fZQoaAZoCWgPQwhw0clS68lIwJSGlFKUaBVLw2gWR0CuWP1loUSJdX2UKGgGaAloD0MI36XUJaOncECUhpRSlGgVS9ZoFkdArlyas6q82HV9lChoBmgJaA9DCINqgxPR7ydAlIaUUpRoFUuYaBZHQK5h8FEAo5R1fZQoaAZoCWgPQwj6m1CIgOc0QJSGlFKUaBVLlWgWR0CuY7qFZgXudX2UKGgGaAloD0MICRueXinjIsCUhpRSlGgVS5ZoFkdArmO69M9KVnV9lChoBmgJaA9DCKMfDafM525AlIaUUpRoFU0EAWgWR0CuZYnCfpUxdX2UKGgGaAloD0MIEmqGVFE4R0CUhpRSlGgVS6JoFkdArmrZrtVrAXV9lChoBmgJaA9DCBQF+kSePXFAlIaUUpRoFU0CAWgWR0CudcPddmg8dX2UKGgGaAloD0MIe0ykNBvlbUCUhpRSlGgVS9hoFkdArneOhPCVKXV9lChoBmgJaA9DCI49ey7Tcm9AlIaUUpRoFU3lAWgWR0CugJHX2/SIdX2UKGgGaAloD0MISnuDL0wm8T+UhpRSlGgVS4BoFkdAroXmplz2e3V9lChoBmgJaA9DCFbzHJHvzExAlIaUUpRoFUuWaBZHQK6LUp1ie/Z1fZQoaAZoCWgPQwibV3VWi09wQJSGlFKUaBVNNAFoFkdArpRnz8P4EnV9lChoBmgJaA9DCAQb179ru2hAlIaUUpRoFU0oAWgWR0Cunz5GKAJ+dX2UKGgGaAloD0MI1ZXP8jwmRkCUhpRSlGgVS/ZoFkdArqTKJdjXnXV9lChoBmgJaA9DCHAlOzaC7nJAlIaUUpRoFU1AAWgWR0Cur6UGVzIWdX2UKGgGaAloD0MIjpCBPDsTcECUhpRSlGgVTXQBaBZHQK64vrWRRuV1fZQoaAZoCWgPQwgvTRHg9PZtQJSGlFKUaBVL3GgWR0Cuvi4jbBXTdX2UKGgGaAloD0MIOiF00CWsL0CUhpRSlGgVS41oFkdArsOhw2l2vHV9lChoBmgJaA9DCENTdvqBNnFAlIaUUpRoFU1iAWgWR0CuxXqv3ai9dX2UKGgGaAloD0MIdeRIZ2DcPkCUhpRSlGgVS6ZoFkdArtA1iONo8XV9lChoBmgJaA9DCKbSTzi7k21AlIaUUpRoFUvyaBZHQK7T37tzCDV1fZQoaAZoCWgPQwi/DMaIBCpxQJSGlFKUaBVNdwFoFkdArteS0jTrmnV9lChoBmgJaA9DCH9QFykUq21AlIaUUpRoFU0VA2gWR0Cu2VgOz6acdX2UKGgGaAloD0MITMEaZ5OZcECUhpRSlGgVTS8BaBZHQK7ZXYISlFd1fZQoaAZoCWgPQwhegH10qu5wQJSGlFKUaBVNhgFoFkdArtsrsyBTXXV9lChoBmgJaA9DCK+V0F2SyW5AlIaUUpRoFU3iAWgWR0Cu3seTNdJKdX2UKGgGaAloD0MIGqchqvDvLkCUhpRSlGgVS8NoFkdAruJk6mwaBXV9lChoBmgJaA9DCLEVNC2xvkVAlIaUUpRoFUuuaBZHQK7l5K6nR9h1fZQoaAZoCWgPQwht5pDUQjEgQJSGlFKUaBVLomgWR0Cu56foq0+ldX2UKGgGaAloD0MIEmdF1MTGa0CUhpRSlGgVTZYBaBZHQK7pfgJkXk51fZQoaAZoCWgPQwj9E1ysKCZxQJSGlFKUaBVNuwJoFkdArutBGtp22XV9lChoBmgJaA9DCIKPwYrT0m9AlIaUUpRoFU26AmgWR0Cu7QFyq+8HdX2UKGgGaAloD0MIZARUOIIsKUCUhpRSlGgVS31oFkdArvJbEHdGiHV9lChoBmgJaA9DCLmnqzsWBz1AlIaUUpRoFUuaaBZHQK73tGn4wh51fZQoaAZoCWgPQwh7uyU5YB80QJSGlFKUaBVLx2gWR0Cu+XgWSEDhdX2UKGgGaAloD0MInBn9aDipRkCUhpRSlGgVS4VoFkdArvtDiS7oS3V9lChoBmgJaA9DCIQpyqXx/UBAlIaUUpRoFUuMaBZHQK79DCAtnPF1fZQoaAZoCWgPQwirl99pMhtOQJSGlFKUaBVLlGgWR0CvAKHp8neBdX2UKGgGaAloD0MIa378pUXJOkCUhpRSlGgVS6doFkdArwJmc8TzunV9lChoBmgJaA9DCKX5Y1qblk1AlIaUUpRoFUuTaBZHQK8EILUkOZt1fZQoaAZoCWgPQwisVFBR9TNFQJSGlFKUaBVLqWgWR0CvDPqZML4OdX2UKGgGaAloD0MId4U+WMa6N0CUhpRSlGgVS4hoFkdArw66hYeT3nV9lChoBmgJaA9DCFd5AmHnTHJAlIaUUpRoFU0qAWgWR0CvDsL56+nJdX2UKGgGaAloD0MIGCZTBaNCKUCUhpRSlGgVS49oFkdArxCOmzjWCnV9lChoBmgJaA9DCL9gN2xb1DRAlIaUUpRoFUulaBZHQK8UI+0PYnR1fZQoaAZoCWgPQwg/qIsUymo/QJSGlFKUaBVLuGgWR0CvFCWC2+fzdX2UKGgGaAloD0MIYAX4bvN2HcCUhpRSlGgVS7doFkdArxXpY1YQrnV9lChoBmgJaA9DCHLe/8cJY2BAlIaUUpRoFU3oA2gWR0CvHtPUaybAdX2UKGgGaAloD0MInrEv2XgQB0CUhpRSlGgVS55oFkdAryCc6T4cm3V9lChoBmgJaA9DCIgRwqONP0BAlIaUUpRoFUuUaBZHQK8goqslsxh1fZQoaAZoCWgPQwjC3Vm77cLqv5SGlFKUaBVLzmgWR0CvJ7Mr/bTMdX2UKGgGaAloD0MIH4ZWJ2foQ0CUhpRSlGgVS5xoFkdArytEIPbwjXV9lChoBmgJaA9DCE9AE2HDMx5AlIaUUpRoFUuPaBZHQK8wpBQemvZ1fZQoaAZoCWgPQwjKiXYVUuBuQJSGlFKUaBVL0mgWR0CvMmOAy2x6dX2UKGgGaAloD0MIBJKwbyftPkCUhpRSlGgVS5BoFkdArzJn/JeVs3V9lChoBmgJaA9DCBpOmZtvGlBAlIaUUpRoFUuVaBZHQK83xOVxCIF1fZQoaAZoCWgPQwjtZdtpayJHQJSGlFKUaBVLomgWR0CvN8yquKXOdX2UKGgGaAloD0MIqG3DKAi8RUCUhpRSlGgVS49oFkdArzmGX5WRzXV9lChoBmgJaA9DCC+ob5nTS0BAlIaUUpRoFUuOaBZHQK87TnA6+391fZQoaAZoCWgPQwhUqG4uvkdwQJSGlFKUaBVL52gWR0CvPRTcynDSdX2UKGgGaAloD0MIKGVSQxsAA8CUhpRSlGgVS4poFkdAr0JvD1oQF3V9lChoBmgJaA9DCFDgnXx6bD1AlIaUUpRoFUuCaBZHQK9SZ2VVxS51fZQoaAZoCWgPQwjjcOZXc3A9QJSGlFKUaBVLwWgWR0CvXPuXmeUZdX2UKGgGaAloD0MI+1ksRfJXRUCUhpRSlGgVS5RoFkdAr17EGA08/3V9lChoBmgJaA9DCOAsJctJiCBAlIaUUpRoFUuXaBZHQK9ezEroW591fZQoaAZoCWgPQwhrnE1HAPs7QJSGlFKUaBVLoWgWR0CvYJdE1EVndX2UKGgGaAloD0MIrd9MTBeYRUCUhpRSlGgVS7loFkdAr2CZSLqD9XV9lChoBmgJaA9DCNxLGqM1SnBAlIaUUpRoFUvkaBZHQK9goKSgXdl1fZQoaAZoCWgPQwhRTrSr0LBwQJSGlFKUaBVNUwFoFkdAr2mNJSR8t3V9lChoBmgJaA9DCEKVmj1Q0nFAlIaUUpRoFU1XAWgWR0Cvd+Ak9lmOdX2UKGgGaAloD0MIrvNvl/3ccECUhpRSlGgVTfgBaBZHQK95pDa4+bF1fZQoaAZoCWgPQwihgO1gBJpxQJSGlFKUaBVNcAFoFkdAr301AX2ugnV9lChoBmgJaA9DCBiWP98WpW9AlIaUUpRoFU2GAWgWR0CvnZPomoitdX2UKGgGaAloD0MIprbUQV6TUUCUhpRSlGgVS5poFkdAr6Eiw0O3D3V9lChoBmgJaA9DCDuJCP+ih3FAlIaUUpRoFU0OAWgWR0CvoSroW56MdX2UKGgGaAloD0MILqwb704hc0CUhpRSlGgVTRUBaBZHQK+xagB91EF1fZQoaAZoCWgPQwgr3V1ngzhwQJSGlFKUaBVNWgFoFkdAr7islzEJjXV9lChoBmgJaA9DCF1vm6kQiHNAlIaUUpRoFU3VAmgWR0CvumxF7UobdX2UKGgGaAloD0MI5US7Cimab0CUhpRSlGgVTWYBaBZHQK+6bOX3QD51fZQoaAZoCWgPQwhzu5f7JNRyQJSGlFKUaBVNHAJoFkdAr7xHuRcNY3V9lChoBmgJaA9DCK2/JQB/SW9AlIaUUpRoFU3yAWgWR0CvvEhsQ/X5dX2UKGgGaAloD0MIqb7zi9JKcUCUhpRSlGgVTWgBaBZHQK++DxZuAI91fZQoaAZoCWgPQwiWzRySmt5wQJSGlFKUaBVNEAFoFkdAr74RNfw7T3V9lChoBmgJaA9DCBd/2xMkIEFAlIaUUpRoFUuJaBZHQK/Bot16mfp1fZQoaAZoCWgPQwg+daxSekI2QJSGlFKUaBVLfGgWR0CvwaUXYUWVdX2UKGgGaAloD0MIIEHxY0yOcECUhpRSlGgVTYsBaBZHQK/FQx9oexR1fZQoaAZoCWgPQwiELXb7rNdyQJSGlFKUaBVNEwJoFkdAr8qdqagElnV9lChoBmgJaA9DCCWuY1xxRmlAlIaUUpRoFU3AAWgWR0Cv0bq46Oo6dX2UKGgGaAloD0MIG5sdqb7zJsCUhpRSlGgVS2doFkdAr9N8NYr8SHV9lChoBmgJaA9DCIcYr3lVpx5AlIaUUpRoFUtraBZHQK/Y3+OOsDJ1fZQoaAZoCWgPQwh4gCctXFJFQJSGlFKUaBVLjWgWR0Cv4ApON5t4dWUu"}, "ep_success_buffer": {":type:": "<class 'collections.deque'>", ":serialized:": "gAWVIAAAAAAAAACMC2NvbGxlY3Rpb25zlIwFZGVxdWWUk5QpS2SGlFKULg=="}, "_n_updates": 107160, "n_steps": 7, "gamma": 0.988045661427605, "gae_lambda": 0.9768700030979546, "ent_coef": 0.004851331424615018, "vf_coef": 0.9683727099048757, "max_grad_norm": 0.5143831585332781, "batch_size": 7, "n_epochs": 24, "clip_range": {":type:": "<class 'function'>", ":serialized:": "gAWVJQMAAAAAAACMF2Nsb3VkcGlja2xlLmNsb3VkcGlja2xllIwOX21ha2VfZnVuY3Rpb26Uk5QoaACMDV9idWlsdGluX3R5cGWUk5SMCENvZGVUeXBllIWUUpQoSwFLAEsASwFLAUsTQwSIAFMAlE6FlCmMAV+UhZSMeS9ob21lL3hhdmkvRG9jdW1lbnRzL3Byb2plY3RzL0RlZXBSTC1odWdnaW5nZmFjZS9kZWVwcmwtZW52L2xpYi9weXRob24zLjgvc2l0ZS1wYWNrYWdlcy9zdGFibGVfYmFzZWxpbmVzMy9jb21tb24vdXRpbHMucHmUjARmdW5jlEuCQwIAAZSMA3ZhbJSFlCl0lFKUfZQojAtfX3BhY2thZ2VfX5SMGHN0YWJsZV9iYXNlbGluZXMzLmNvbW1vbpSMCF9fbmFtZV9flIwec3RhYmxlX2Jhc2VsaW5lczMuY29tbW9uLnV0aWxzlIwIX19maWxlX1+UjHkvaG9tZS94YXZpL0RvY3VtZW50cy9wcm9qZWN0cy9EZWVwUkwtaHVnZ2luZ2ZhY2UvZGVlcHJsLWVudi9saWIvcHl0aG9uMy44L3NpdGUtcGFja2FnZXMvc3RhYmxlX2Jhc2VsaW5lczMvY29tbW9uL3V0aWxzLnB5lHVOTmgAjBBfbWFrZV9lbXB0eV9jZWxslJOUKVKUhZR0lFKUjBxjbG91ZHBpY2tsZS5jbG91ZHBpY2tsZV9mYXN0lIwSX2Z1bmN0aW9uX3NldHN0YXRllJOUaB99lH2UKGgWaA2MDF9fcXVhbG5hbWVfX5SMGWNvbnN0YW50X2ZuLjxsb2NhbHM+LmZ1bmOUjA9fX2Fubm90YXRpb25zX1+UfZSMDl9fa3dkZWZhdWx0c19flE6MDF9fZGVmYXVsdHNfX5ROjApfX21vZHVsZV9flGgXjAdfX2RvY19flE6MC19fY2xvc3VyZV9flGgAjApfbWFrZV9jZWxslJOURz/bPUA6d5h4hZRSlIWUjBdfY2xvdWRwaWNrbGVfc3VibW9kdWxlc5RdlIwLX19nbG9iYWxzX1+UfZR1hpSGUjAu"}, "clip_range_vf": {":type:": "<class 'function'>", ":serialized:": "gAWVJQMAAAAAAACMF2Nsb3VkcGlja2xlLmNsb3VkcGlja2xllIwOX21ha2VfZnVuY3Rpb26Uk5QoaACMDV9idWlsdGluX3R5cGWUk5SMCENvZGVUeXBllIWUUpQoSwFLAEsASwFLAUsTQwSIAFMAlE6FlCmMAV+UhZSMeS9ob21lL3hhdmkvRG9jdW1lbnRzL3Byb2plY3RzL0RlZXBSTC1odWdnaW5nZmFjZS9kZWVwcmwtZW52L2xpYi9weXRob24zLjgvc2l0ZS1wYWNrYWdlcy9zdGFibGVfYmFzZWxpbmVzMy9jb21tb24vdXRpbHMucHmUjARmdW5jlEuCQwIAAZSMA3ZhbJSFlCl0lFKUfZQojAtfX3BhY2thZ2VfX5SMGHN0YWJsZV9iYXNlbGluZXMzLmNvbW1vbpSMCF9fbmFtZV9flIwec3RhYmxlX2Jhc2VsaW5lczMuY29tbW9uLnV0aWxzlIwIX19maWxlX1+UjHkvaG9tZS94YXZpL0RvY3VtZW50cy9wcm9qZWN0cy9EZWVwUkwtaHVnZ2luZ2ZhY2UvZGVlcHJsLWVudi9saWIvcHl0aG9uMy44L3NpdGUtcGFja2FnZXMvc3RhYmxlX2Jhc2VsaW5lczMvY29tbW9uL3V0aWxzLnB5lHVOTmgAjBBfbWFrZV9lbXB0eV9jZWxslJOUKVKUhZR0lFKUjBxjbG91ZHBpY2tsZS5jbG91ZHBpY2tsZV9mYXN0lIwSX2Z1bmN0aW9uX3NldHN0YXRllJOUaB99lH2UKGgWaA2MDF9fcXVhbG5hbWVfX5SMGWNvbnN0YW50X2ZuLjxsb2NhbHM+LmZ1bmOUjA9fX2Fubm90YXRpb25zX1+UfZSMDl9fa3dkZWZhdWx0c19flE6MDF9fZGVmYXVsdHNfX5ROjApfX21vZHVsZV9flGgXjAdfX2RvY19flE6MC19fY2xvc3VyZV9flGgAjApfbWFrZV9jZWxslJOURz/aJ6+qwtrThZRSlIWUjBdfY2xvdWRwaWNrbGVfc3VibW9kdWxlc5RdlIwLX19nbG9iYWxzX1+UfZR1hpSGUjAu"}, "normalize_advantage": true, "target_kl": null, "system_info": {"OS": "Linux-5.15.0-67-generic-x86_64-with-glibc2.29 # 74~20.04.1-Ubuntu SMP Wed Feb 22 14:52:34 UTC 2023", "Python": "3.8.10", "Stable-Baselines3": "1.7.0", "PyTorch": "2.0.0+cu117", "GPU Enabled": "True", "Numpy": "1.24.2", "Gym": "0.21.0"}}
|
ppo_lunarlander-v2_hpo.zip
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:efd77a6600cb63ba60c03e7fa2a187703ad6b53c41eacc247cf41d2c12651d50
|
| 3 |
+
size 148864
|
ppo_lunarlander-v2_hpo/_stable_baselines3_version
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
1.7.0
|
ppo_lunarlander-v2_hpo/data
ADDED
|
@@ -0,0 +1,98 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"policy_class": {
|
| 3 |
+
":type:": "<class 'abc.ABCMeta'>",
|
| 4 |
+
":serialized:": "gAWVOwAAAAAAAACMIXN0YWJsZV9iYXNlbGluZXMzLmNvbW1vbi5wb2xpY2llc5SMEUFjdG9yQ3JpdGljUG9saWN5lJOULg==",
|
| 5 |
+
"__module__": "stable_baselines3.common.policies",
|
| 6 |
+
"__doc__": "\n Policy class for actor-critic algorithms (has both policy and value prediction).\n Used by A2C, PPO and the likes.\n\n :param observation_space: Observation space\n :param action_space: Action space\n :param lr_schedule: Learning rate schedule (could be constant)\n :param net_arch: The specification of the policy and value networks.\n :param activation_fn: Activation function\n :param ortho_init: Whether to use or not orthogonal initialization\n :param use_sde: Whether to use State Dependent Exploration or not\n :param log_std_init: Initial value for the log standard deviation\n :param full_std: Whether to use (n_features x n_actions) parameters\n for the std instead of only (n_features,) when using gSDE\n :param use_expln: Use ``expln()`` function instead of ``exp()`` to ensure\n a positive standard deviation (cf paper). It allows to keep variance\n above zero and prevent it from growing too fast. In practice, ``exp()`` is usually enough.\n :param squash_output: Whether to squash the output using a tanh function,\n this allows to ensure boundaries when using gSDE.\n :param features_extractor_class: Features extractor to use.\n :param features_extractor_kwargs: Keyword arguments\n to pass to the features extractor.\n :param share_features_extractor: If True, the features extractor is shared between the policy and value networks.\n :param normalize_images: Whether to normalize images or not,\n dividing by 255.0 (True by default)\n :param optimizer_class: The optimizer to use,\n ``th.optim.Adam`` by default\n :param optimizer_kwargs: Additional keyword arguments,\n excluding the learning rate, to pass to the optimizer\n ",
|
| 7 |
+
"__init__": "<function ActorCriticPolicy.__init__ at 0x7fc080fa54c0>",
|
| 8 |
+
"_get_constructor_parameters": "<function ActorCriticPolicy._get_constructor_parameters at 0x7fc080fa5550>",
|
| 9 |
+
"reset_noise": "<function ActorCriticPolicy.reset_noise at 0x7fc080fa55e0>",
|
| 10 |
+
"_build_mlp_extractor": "<function ActorCriticPolicy._build_mlp_extractor at 0x7fc080fa5670>",
|
| 11 |
+
"_build": "<function ActorCriticPolicy._build at 0x7fc080fa5700>",
|
| 12 |
+
"forward": "<function ActorCriticPolicy.forward at 0x7fc080fa5790>",
|
| 13 |
+
"extract_features": "<function ActorCriticPolicy.extract_features at 0x7fc080fa5820>",
|
| 14 |
+
"_get_action_dist_from_latent": "<function ActorCriticPolicy._get_action_dist_from_latent at 0x7fc080fa58b0>",
|
| 15 |
+
"_predict": "<function ActorCriticPolicy._predict at 0x7fc080fa5940>",
|
| 16 |
+
"evaluate_actions": "<function ActorCriticPolicy.evaluate_actions at 0x7fc080fa59d0>",
|
| 17 |
+
"get_distribution": "<function ActorCriticPolicy.get_distribution at 0x7fc080fa5a60>",
|
| 18 |
+
"predict_values": "<function ActorCriticPolicy.predict_values at 0x7fc080fa5af0>",
|
| 19 |
+
"__abstractmethods__": "frozenset()",
|
| 20 |
+
"_abc_impl": "<_abc_data object at 0x7fc080fa2240>"
|
| 21 |
+
},
|
| 22 |
+
"verbose": 1,
|
| 23 |
+
"policy_kwargs": {},
|
| 24 |
+
"observation_space": {
|
| 25 |
+
":type:": "<class 'gym.spaces.box.Box'>",
|
| 26 |
+
":serialized:": "gAWVnwEAAAAAAACMDmd5bS5zcGFjZXMuYm94lIwDQm94lJOUKYGUfZQojAVkdHlwZZSMBW51bXB5lGgFk5SMAmY0lImIh5RSlChLA4wBPJROTk5K/////0r/////SwB0lGKMBl9zaGFwZZRLCIWUjANsb3eUjBJudW1weS5jb3JlLm51bWVyaWOUjAtfZnJvbWJ1ZmZlcpSTlCiWIAAAAAAAAAAAAID/AACA/wAAgP8AAID/AACA/wAAgP8AAID/AACA/5RoCksIhZSMAUOUdJRSlIwEaGlnaJRoEiiWIAAAAAAAAAAAAIB/AACAfwAAgH8AAIB/AACAfwAAgH8AAIB/AACAf5RoCksIhZRoFXSUUpSMDWJvdW5kZWRfYmVsb3eUaBIolggAAAAAAAAAAAAAAAAAAACUaAeMAmIxlImIh5RSlChLA4wBfJROTk5K/////0r/////SwB0lGJLCIWUaBV0lFKUjA1ib3VuZGVkX2Fib3ZllGgSKJYIAAAAAAAAAAAAAAAAAAAAlGghSwiFlGgVdJRSlIwKX25wX3JhbmRvbZROdWIu",
|
| 27 |
+
"dtype": "float32",
|
| 28 |
+
"_shape": [
|
| 29 |
+
8
|
| 30 |
+
],
|
| 31 |
+
"low": "[-inf -inf -inf -inf -inf -inf -inf -inf]",
|
| 32 |
+
"high": "[inf inf inf inf inf inf inf inf]",
|
| 33 |
+
"bounded_below": "[False False False False False False False False]",
|
| 34 |
+
"bounded_above": "[False False False False False False False False]",
|
| 35 |
+
"_np_random": null
|
| 36 |
+
},
|
| 37 |
+
"action_space": {
|
| 38 |
+
":type:": "<class 'gym.spaces.discrete.Discrete'>",
|
| 39 |
+
":serialized:": "gAWVggAAAAAAAACME2d5bS5zcGFjZXMuZGlzY3JldGWUjAhEaXNjcmV0ZZSTlCmBlH2UKIwBbpRLBIwGX3NoYXBllCmMBWR0eXBllIwFbnVtcHmUaAeTlIwCaTiUiYiHlFKUKEsDjAE8lE5OTkr/////Sv////9LAHSUYowKX25wX3JhbmRvbZROdWIu",
|
| 40 |
+
"n": 4,
|
| 41 |
+
"_shape": [],
|
| 42 |
+
"dtype": "int64",
|
| 43 |
+
"_np_random": null
|
| 44 |
+
},
|
| 45 |
+
"n_envs": 16,
|
| 46 |
+
"num_timesteps": 500080,
|
| 47 |
+
"_total_timesteps": 500000,
|
| 48 |
+
"_num_timesteps_at_start": 0,
|
| 49 |
+
"seed": null,
|
| 50 |
+
"action_noise": null,
|
| 51 |
+
"start_time": 1679389289642222321,
|
| 52 |
+
"learning_rate": 0.0005022723199591951,
|
| 53 |
+
"tensorboard_log": null,
|
| 54 |
+
"lr_schedule": {
|
| 55 |
+
":type:": "<class 'function'>",
|
| 56 |
+
":serialized:": "gAWVJQMAAAAAAACMF2Nsb3VkcGlja2xlLmNsb3VkcGlja2xllIwOX21ha2VfZnVuY3Rpb26Uk5QoaACMDV9idWlsdGluX3R5cGWUk5SMCENvZGVUeXBllIWUUpQoSwFLAEsASwFLAUsTQwSIAFMAlE6FlCmMAV+UhZSMeS9ob21lL3hhdmkvRG9jdW1lbnRzL3Byb2plY3RzL0RlZXBSTC1odWdnaW5nZmFjZS9kZWVwcmwtZW52L2xpYi9weXRob24zLjgvc2l0ZS1wYWNrYWdlcy9zdGFibGVfYmFzZWxpbmVzMy9jb21tb24vdXRpbHMucHmUjARmdW5jlEuCQwIAAZSMA3ZhbJSFlCl0lFKUfZQojAtfX3BhY2thZ2VfX5SMGHN0YWJsZV9iYXNlbGluZXMzLmNvbW1vbpSMCF9fbmFtZV9flIwec3RhYmxlX2Jhc2VsaW5lczMuY29tbW9uLnV0aWxzlIwIX19maWxlX1+UjHkvaG9tZS94YXZpL0RvY3VtZW50cy9wcm9qZWN0cy9EZWVwUkwtaHVnZ2luZ2ZhY2UvZGVlcHJsLWVudi9saWIvcHl0aG9uMy44L3NpdGUtcGFja2FnZXMvc3RhYmxlX2Jhc2VsaW5lczMvY29tbW9uL3V0aWxzLnB5lHVOTmgAjBBfbWFrZV9lbXB0eV9jZWxslJOUKVKUhZR0lFKUjBxjbG91ZHBpY2tsZS5jbG91ZHBpY2tsZV9mYXN0lIwSX2Z1bmN0aW9uX3NldHN0YXRllJOUaB99lH2UKGgWaA2MDF9fcXVhbG5hbWVfX5SMGWNvbnN0YW50X2ZuLjxsb2NhbHM+LmZ1bmOUjA9fX2Fubm90YXRpb25zX1+UfZSMDl9fa3dkZWZhdWx0c19flE6MDF9fZGVmYXVsdHNfX5ROjApfX21vZHVsZV9flGgXjAdfX2RvY19flE6MC19fY2xvc3VyZV9flGgAjApfbWFrZV9jZWxslJOURz9AdV2YDXX3hZRSlIWUjBdfY2xvdWRwaWNrbGVfc3VibW9kdWxlc5RdlIwLX19nbG9iYWxzX1+UfZR1hpSGUjAu"
|
| 57 |
+
},
|
| 58 |
+
"_last_obs": {
|
| 59 |
+
":type:": "<class 'numpy.ndarray'>",
|
| 60 |
+
":serialized:": "gAWVdQIAAAAAAACMEm51bXB5LmNvcmUubnVtZXJpY5SMC19mcm9tYnVmZmVylJOUKJYAAgAAAAAAAM0ioz7/r4A+Cpy/vU7c1L4oINm81xOLPQAAAAAAAAAA0DWVPiWToD6nC407+0i7vvS2tzqruR+9AAAAAAAAAAAND0w+roGVustb7TxZBTU9QgSVPepAuzoAAIA/AACAP4MoyT5EWe8+1y2hvYYAIL+Zd4i9S1dXvAAAAAAAAAAAjdvjPQpnYbntOPs6koyjtdLlE7lWBJm0AAAAAAAAgD9Ny1Q+XI+yPl3IAr2eski+KUsdvZLI0DsAAAAAAAAAAA2z5T0N7UE+x6fLu7IuV76h1Cs8paICuwAAAAAAAAAAsz2CPghzq7xtjdq5hTgfOIeeGb6CLAg5AACAPwAAgD9gfT8+pORhOjBA0jyqhmU5ajQPPANNRjoAAIA/AACAP3Pcuj0Ayog/4uVHPodz0r6/vO48mje4PAAAAAAAAAAAgOCDvtAPVz/mGUc+V86yvuNgxL71miY+AAAAAAAAAAAGPRI+z0dGvFAAvTxbn+w8SjKXvUQvQ7sAAIA/AACAP/qZS75yrEM/dvq4Pn5fC78nEKW9ihYEPwAAAAAAAAAA5mNyPQUA0jyr4kY9VhcwvgoWyDyH0Km7AAAAAAAAAAAAAHq9Ccx4PR7Tij6zCGq/GWz1PYIeEb0AAAAAAAAAABqDrT5oLuO9+xTFPidSlL0slBW/MSoRPgAAgD8AAIA/lIwFbnVtcHmUjAVkdHlwZZSTlIwCZjSUiYiHlFKUKEsDjAE8lE5OTkr/////Sv////9LAHSUYksQSwiGlIwBQ5R0lFKULg=="
|
| 61 |
+
},
|
| 62 |
+
"_last_episode_starts": {
|
| 63 |
+
":type:": "<class 'numpy.ndarray'>",
|
| 64 |
+
":serialized:": "gAWVgwAAAAAAAACMEm51bXB5LmNvcmUubnVtZXJpY5SMC19mcm9tYnVmZmVylJOUKJYQAAAAAAAAAAAAAAAAAAAAAAAAAAAAAACUjAVudW1weZSMBWR0eXBllJOUjAJiMZSJiIeUUpQoSwOMAXyUTk5OSv////9K/////0sAdJRiSxCFlIwBQ5R0lFKULg=="
|
| 65 |
+
},
|
| 66 |
+
"_last_original_obs": null,
|
| 67 |
+
"_episode_num": 0,
|
| 68 |
+
"use_sde": false,
|
| 69 |
+
"sde_sample_freq": -1,
|
| 70 |
+
"_current_progress_remaining": -0.00015999999999993797,
|
| 71 |
+
"ep_info_buffer": {
|
| 72 |
+
":type:": "<class 'collections.deque'>",
|
| 73 |
+
":serialized:": "gAWVQhAAAAAAAACMC2NvbGxlY3Rpb25zlIwFZGVxdWWUk5QpS2SGlFKUKH2UKIwBcpSMFW51bXB5LmNvcmUubXVsdGlhcnJheZSMBnNjYWxhcpSTlIwFbnVtcHmUjAVkdHlwZZSTlIwCZjiUiYiHlFKUKEsDjAE8lE5OTkr/////Sv////9LAHSUYkMIZOWXwRjFOsCUhpRSlIwBbJRL4YwBdJRHQK441Hww0wd1fZQoaAZoCWgPQwgHexNDcjLiv5SGlFKUaBVLp2gWR0CuOp1Da4+bdX2UKGgGaAloD0MIDhDM0eMjRsCUhpRSlGgVS5BoFkdArj4mZqmCRXV9lChoBmgJaA9DCBaFXRQ98OC/lIaUUpRoFUuJaBZHQK4+KF7laKV1fZQoaAZoCWgPQwhsdqT6TlxtQJSGlFKUaBVL5GgWR0CuP+4HoouxdX2UKGgGaAloD0MIyD8ziI8iaECUhpRSlGgVTZsBaBZHQK5Bu8Tzund1fZQoaAZoCWgPQwjf/fFetRIoQJSGlFKUaBVLqmgWR0CuRUpW3jMndX2UKGgGaAloD0MIiesYV1zVbUCUhpRSlGgVTQABaBZHQK5Rwyon8bd1fZQoaAZoCWgPQwhw0clS68lIwJSGlFKUaBVLw2gWR0CuWP1loUSJdX2UKGgGaAloD0MI36XUJaOncECUhpRSlGgVS9ZoFkdArlyas6q82HV9lChoBmgJaA9DCINqgxPR7ydAlIaUUpRoFUuYaBZHQK5h8FEAo5R1fZQoaAZoCWgPQwj6m1CIgOc0QJSGlFKUaBVLlWgWR0CuY7qFZgXudX2UKGgGaAloD0MICRueXinjIsCUhpRSlGgVS5ZoFkdArmO69M9KVnV9lChoBmgJaA9DCKMfDafM525AlIaUUpRoFU0EAWgWR0CuZYnCfpUxdX2UKGgGaAloD0MIEmqGVFE4R0CUhpRSlGgVS6JoFkdArmrZrtVrAXV9lChoBmgJaA9DCBQF+kSePXFAlIaUUpRoFU0CAWgWR0CudcPddmg8dX2UKGgGaAloD0MIe0ykNBvlbUCUhpRSlGgVS9hoFkdArneOhPCVKXV9lChoBmgJaA9DCI49ey7Tcm9AlIaUUpRoFU3lAWgWR0CugJHX2/SIdX2UKGgGaAloD0MISnuDL0wm8T+UhpRSlGgVS4BoFkdAroXmplz2e3V9lChoBmgJaA9DCFbzHJHvzExAlIaUUpRoFUuWaBZHQK6LUp1ie/Z1fZQoaAZoCWgPQwibV3VWi09wQJSGlFKUaBVNNAFoFkdArpRnz8P4EnV9lChoBmgJaA9DCAQb179ru2hAlIaUUpRoFU0oAWgWR0Cunz5GKAJ+dX2UKGgGaAloD0MI1ZXP8jwmRkCUhpRSlGgVS/ZoFkdArqTKJdjXnXV9lChoBmgJaA9DCHAlOzaC7nJAlIaUUpRoFU1AAWgWR0Cur6UGVzIWdX2UKGgGaAloD0MIjpCBPDsTcECUhpRSlGgVTXQBaBZHQK64vrWRRuV1fZQoaAZoCWgPQwgvTRHg9PZtQJSGlFKUaBVL3GgWR0Cuvi4jbBXTdX2UKGgGaAloD0MIOiF00CWsL0CUhpRSlGgVS41oFkdArsOhw2l2vHV9lChoBmgJaA9DCENTdvqBNnFAlIaUUpRoFU1iAWgWR0CuxXqv3ai9dX2UKGgGaAloD0MIdeRIZ2DcPkCUhpRSlGgVS6ZoFkdArtA1iONo8XV9lChoBmgJaA9DCKbSTzi7k21AlIaUUpRoFUvyaBZHQK7T37tzCDV1fZQoaAZoCWgPQwi/DMaIBCpxQJSGlFKUaBVNdwFoFkdArteS0jTrmnV9lChoBmgJaA9DCH9QFykUq21AlIaUUpRoFU0VA2gWR0Cu2VgOz6acdX2UKGgGaAloD0MITMEaZ5OZcECUhpRSlGgVTS8BaBZHQK7ZXYISlFd1fZQoaAZoCWgPQwhegH10qu5wQJSGlFKUaBVNhgFoFkdArtsrsyBTXXV9lChoBmgJaA9DCK+V0F2SyW5AlIaUUpRoFU3iAWgWR0Cu3seTNdJKdX2UKGgGaAloD0MIGqchqvDvLkCUhpRSlGgVS8NoFkdAruJk6mwaBXV9lChoBmgJaA9DCLEVNC2xvkVAlIaUUpRoFUuuaBZHQK7l5K6nR9h1fZQoaAZoCWgPQwht5pDUQjEgQJSGlFKUaBVLomgWR0Cu56foq0+ldX2UKGgGaAloD0MIEmdF1MTGa0CUhpRSlGgVTZYBaBZHQK7pfgJkXk51fZQoaAZoCWgPQwj9E1ysKCZxQJSGlFKUaBVNuwJoFkdArutBGtp22XV9lChoBmgJaA9DCIKPwYrT0m9AlIaUUpRoFU26AmgWR0Cu7QFyq+8HdX2UKGgGaAloD0MIZARUOIIsKUCUhpRSlGgVS31oFkdArvJbEHdGiHV9lChoBmgJaA9DCLmnqzsWBz1AlIaUUpRoFUuaaBZHQK73tGn4wh51fZQoaAZoCWgPQwh7uyU5YB80QJSGlFKUaBVLx2gWR0Cu+XgWSEDhdX2UKGgGaAloD0MInBn9aDipRkCUhpRSlGgVS4VoFkdArvtDiS7oS3V9lChoBmgJaA9DCIQpyqXx/UBAlIaUUpRoFUuMaBZHQK79DCAtnPF1fZQoaAZoCWgPQwirl99pMhtOQJSGlFKUaBVLlGgWR0CvAKHp8neBdX2UKGgGaAloD0MIa378pUXJOkCUhpRSlGgVS6doFkdArwJmc8TzunV9lChoBmgJaA9DCKX5Y1qblk1AlIaUUpRoFUuTaBZHQK8EILUkOZt1fZQoaAZoCWgPQwisVFBR9TNFQJSGlFKUaBVLqWgWR0CvDPqZML4OdX2UKGgGaAloD0MId4U+WMa6N0CUhpRSlGgVS4hoFkdArw66hYeT3nV9lChoBmgJaA9DCFd5AmHnTHJAlIaUUpRoFU0qAWgWR0CvDsL56+nJdX2UKGgGaAloD0MIGCZTBaNCKUCUhpRSlGgVS49oFkdArxCOmzjWCnV9lChoBmgJaA9DCL9gN2xb1DRAlIaUUpRoFUulaBZHQK8UI+0PYnR1fZQoaAZoCWgPQwg/qIsUymo/QJSGlFKUaBVLuGgWR0CvFCWC2+fzdX2UKGgGaAloD0MIYAX4bvN2HcCUhpRSlGgVS7doFkdArxXpY1YQrnV9lChoBmgJaA9DCHLe/8cJY2BAlIaUUpRoFU3oA2gWR0CvHtPUaybAdX2UKGgGaAloD0MInrEv2XgQB0CUhpRSlGgVS55oFkdAryCc6T4cm3V9lChoBmgJaA9DCIgRwqONP0BAlIaUUpRoFUuUaBZHQK8goqslsxh1fZQoaAZoCWgPQwjC3Vm77cLqv5SGlFKUaBVLzmgWR0CvJ7Mr/bTMdX2UKGgGaAloD0MIH4ZWJ2foQ0CUhpRSlGgVS5xoFkdArytEIPbwjXV9lChoBmgJaA9DCE9AE2HDMx5AlIaUUpRoFUuPaBZHQK8wpBQemvZ1fZQoaAZoCWgPQwjKiXYVUuBuQJSGlFKUaBVL0mgWR0CvMmOAy2x6dX2UKGgGaAloD0MIBJKwbyftPkCUhpRSlGgVS5BoFkdArzJn/JeVs3V9lChoBmgJaA9DCBpOmZtvGlBAlIaUUpRoFUuVaBZHQK83xOVxCIF1fZQoaAZoCWgPQwjtZdtpayJHQJSGlFKUaBVLomgWR0CvN8yquKXOdX2UKGgGaAloD0MIqG3DKAi8RUCUhpRSlGgVS49oFkdArzmGX5WRzXV9lChoBmgJaA9DCC+ob5nTS0BAlIaUUpRoFUuOaBZHQK87TnA6+391fZQoaAZoCWgPQwhUqG4uvkdwQJSGlFKUaBVL52gWR0CvPRTcynDSdX2UKGgGaAloD0MIKGVSQxsAA8CUhpRSlGgVS4poFkdAr0JvD1oQF3V9lChoBmgJaA9DCFDgnXx6bD1AlIaUUpRoFUuCaBZHQK9SZ2VVxS51fZQoaAZoCWgPQwjjcOZXc3A9QJSGlFKUaBVLwWgWR0CvXPuXmeUZdX2UKGgGaAloD0MI+1ksRfJXRUCUhpRSlGgVS5RoFkdAr17EGA08/3V9lChoBmgJaA9DCOAsJctJiCBAlIaUUpRoFUuXaBZHQK9ezEroW591fZQoaAZoCWgPQwhrnE1HAPs7QJSGlFKUaBVLoWgWR0CvYJdE1EVndX2UKGgGaAloD0MIrd9MTBeYRUCUhpRSlGgVS7loFkdAr2CZSLqD9XV9lChoBmgJaA9DCNxLGqM1SnBAlIaUUpRoFUvkaBZHQK9goKSgXdl1fZQoaAZoCWgPQwhRTrSr0LBwQJSGlFKUaBVNUwFoFkdAr2mNJSR8t3V9lChoBmgJaA9DCEKVmj1Q0nFAlIaUUpRoFU1XAWgWR0Cvd+Ak9lmOdX2UKGgGaAloD0MIrvNvl/3ccECUhpRSlGgVTfgBaBZHQK95pDa4+bF1fZQoaAZoCWgPQwihgO1gBJpxQJSGlFKUaBVNcAFoFkdAr301AX2ugnV9lChoBmgJaA9DCBiWP98WpW9AlIaUUpRoFU2GAWgWR0CvnZPomoitdX2UKGgGaAloD0MIprbUQV6TUUCUhpRSlGgVS5poFkdAr6Eiw0O3D3V9lChoBmgJaA9DCDuJCP+ih3FAlIaUUpRoFU0OAWgWR0CvoSroW56MdX2UKGgGaAloD0MILqwb704hc0CUhpRSlGgVTRUBaBZHQK+xagB91EF1fZQoaAZoCWgPQwgr3V1ngzhwQJSGlFKUaBVNWgFoFkdAr7islzEJjXV9lChoBmgJaA9DCF1vm6kQiHNAlIaUUpRoFU3VAmgWR0CvumxF7UobdX2UKGgGaAloD0MI5US7Cimab0CUhpRSlGgVTWYBaBZHQK+6bOX3QD51fZQoaAZoCWgPQwhzu5f7JNRyQJSGlFKUaBVNHAJoFkdAr7xHuRcNY3V9lChoBmgJaA9DCK2/JQB/SW9AlIaUUpRoFU3yAWgWR0CvvEhsQ/X5dX2UKGgGaAloD0MIqb7zi9JKcUCUhpRSlGgVTWgBaBZHQK++DxZuAI91fZQoaAZoCWgPQwiWzRySmt5wQJSGlFKUaBVNEAFoFkdAr74RNfw7T3V9lChoBmgJaA9DCBd/2xMkIEFAlIaUUpRoFUuJaBZHQK/Bot16mfp1fZQoaAZoCWgPQwg+daxSekI2QJSGlFKUaBVLfGgWR0CvwaUXYUWVdX2UKGgGaAloD0MIIEHxY0yOcECUhpRSlGgVTYsBaBZHQK/FQx9oexR1fZQoaAZoCWgPQwiELXb7rNdyQJSGlFKUaBVNEwJoFkdAr8qdqagElnV9lChoBmgJaA9DCCWuY1xxRmlAlIaUUpRoFU3AAWgWR0Cv0bq46Oo6dX2UKGgGaAloD0MIG5sdqb7zJsCUhpRSlGgVS2doFkdAr9N8NYr8SHV9lChoBmgJaA9DCIcYr3lVpx5AlIaUUpRoFUtraBZHQK/Y3+OOsDJ1fZQoaAZoCWgPQwh4gCctXFJFQJSGlFKUaBVLjWgWR0Cv4ApON5t4dWUu"
|
| 74 |
+
},
|
| 75 |
+
"ep_success_buffer": {
|
| 76 |
+
":type:": "<class 'collections.deque'>",
|
| 77 |
+
":serialized:": "gAWVIAAAAAAAAACMC2NvbGxlY3Rpb25zlIwFZGVxdWWUk5QpS2SGlFKULg=="
|
| 78 |
+
},
|
| 79 |
+
"_n_updates": 107160,
|
| 80 |
+
"n_steps": 7,
|
| 81 |
+
"gamma": 0.988045661427605,
|
| 82 |
+
"gae_lambda": 0.9768700030979546,
|
| 83 |
+
"ent_coef": 0.004851331424615018,
|
| 84 |
+
"vf_coef": 0.9683727099048757,
|
| 85 |
+
"max_grad_norm": 0.5143831585332781,
|
| 86 |
+
"batch_size": 7,
|
| 87 |
+
"n_epochs": 24,
|
| 88 |
+
"clip_range": {
|
| 89 |
+
":type:": "<class 'function'>",
|
| 90 |
+
":serialized:": "gAWVJQMAAAAAAACMF2Nsb3VkcGlja2xlLmNsb3VkcGlja2xllIwOX21ha2VfZnVuY3Rpb26Uk5QoaACMDV9idWlsdGluX3R5cGWUk5SMCENvZGVUeXBllIWUUpQoSwFLAEsASwFLAUsTQwSIAFMAlE6FlCmMAV+UhZSMeS9ob21lL3hhdmkvRG9jdW1lbnRzL3Byb2plY3RzL0RlZXBSTC1odWdnaW5nZmFjZS9kZWVwcmwtZW52L2xpYi9weXRob24zLjgvc2l0ZS1wYWNrYWdlcy9zdGFibGVfYmFzZWxpbmVzMy9jb21tb24vdXRpbHMucHmUjARmdW5jlEuCQwIAAZSMA3ZhbJSFlCl0lFKUfZQojAtfX3BhY2thZ2VfX5SMGHN0YWJsZV9iYXNlbGluZXMzLmNvbW1vbpSMCF9fbmFtZV9flIwec3RhYmxlX2Jhc2VsaW5lczMuY29tbW9uLnV0aWxzlIwIX19maWxlX1+UjHkvaG9tZS94YXZpL0RvY3VtZW50cy9wcm9qZWN0cy9EZWVwUkwtaHVnZ2luZ2ZhY2UvZGVlcHJsLWVudi9saWIvcHl0aG9uMy44L3NpdGUtcGFja2FnZXMvc3RhYmxlX2Jhc2VsaW5lczMvY29tbW9uL3V0aWxzLnB5lHVOTmgAjBBfbWFrZV9lbXB0eV9jZWxslJOUKVKUhZR0lFKUjBxjbG91ZHBpY2tsZS5jbG91ZHBpY2tsZV9mYXN0lIwSX2Z1bmN0aW9uX3NldHN0YXRllJOUaB99lH2UKGgWaA2MDF9fcXVhbG5hbWVfX5SMGWNvbnN0YW50X2ZuLjxsb2NhbHM+LmZ1bmOUjA9fX2Fubm90YXRpb25zX1+UfZSMDl9fa3dkZWZhdWx0c19flE6MDF9fZGVmYXVsdHNfX5ROjApfX21vZHVsZV9flGgXjAdfX2RvY19flE6MC19fY2xvc3VyZV9flGgAjApfbWFrZV9jZWxslJOURz/bPUA6d5h4hZRSlIWUjBdfY2xvdWRwaWNrbGVfc3VibW9kdWxlc5RdlIwLX19nbG9iYWxzX1+UfZR1hpSGUjAu"
|
| 91 |
+
},
|
| 92 |
+
"clip_range_vf": {
|
| 93 |
+
":type:": "<class 'function'>",
|
| 94 |
+
":serialized:": "gAWVJQMAAAAAAACMF2Nsb3VkcGlja2xlLmNsb3VkcGlja2xllIwOX21ha2VfZnVuY3Rpb26Uk5QoaACMDV9idWlsdGluX3R5cGWUk5SMCENvZGVUeXBllIWUUpQoSwFLAEsASwFLAUsTQwSIAFMAlE6FlCmMAV+UhZSMeS9ob21lL3hhdmkvRG9jdW1lbnRzL3Byb2plY3RzL0RlZXBSTC1odWdnaW5nZmFjZS9kZWVwcmwtZW52L2xpYi9weXRob24zLjgvc2l0ZS1wYWNrYWdlcy9zdGFibGVfYmFzZWxpbmVzMy9jb21tb24vdXRpbHMucHmUjARmdW5jlEuCQwIAAZSMA3ZhbJSFlCl0lFKUfZQojAtfX3BhY2thZ2VfX5SMGHN0YWJsZV9iYXNlbGluZXMzLmNvbW1vbpSMCF9fbmFtZV9flIwec3RhYmxlX2Jhc2VsaW5lczMuY29tbW9uLnV0aWxzlIwIX19maWxlX1+UjHkvaG9tZS94YXZpL0RvY3VtZW50cy9wcm9qZWN0cy9EZWVwUkwtaHVnZ2luZ2ZhY2UvZGVlcHJsLWVudi9saWIvcHl0aG9uMy44L3NpdGUtcGFja2FnZXMvc3RhYmxlX2Jhc2VsaW5lczMvY29tbW9uL3V0aWxzLnB5lHVOTmgAjBBfbWFrZV9lbXB0eV9jZWxslJOUKVKUhZR0lFKUjBxjbG91ZHBpY2tsZS5jbG91ZHBpY2tsZV9mYXN0lIwSX2Z1bmN0aW9uX3NldHN0YXRllJOUaB99lH2UKGgWaA2MDF9fcXVhbG5hbWVfX5SMGWNvbnN0YW50X2ZuLjxsb2NhbHM+LmZ1bmOUjA9fX2Fubm90YXRpb25zX1+UfZSMDl9fa3dkZWZhdWx0c19flE6MDF9fZGVmYXVsdHNfX5ROjApfX21vZHVsZV9flGgXjAdfX2RvY19flE6MC19fY2xvc3VyZV9flGgAjApfbWFrZV9jZWxslJOURz/aJ6+qwtrThZRSlIWUjBdfY2xvdWRwaWNrbGVfc3VibW9kdWxlc5RdlIwLX19nbG9iYWxzX1+UfZR1hpSGUjAu"
|
| 95 |
+
},
|
| 96 |
+
"normalize_advantage": true,
|
| 97 |
+
"target_kl": null
|
| 98 |
+
}
|
ppo_lunarlander-v2_hpo/policy.optimizer.pth
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:5e9c033ff4db4b4c5d4635215bf72989d7f283c10b9ec9787e50b8a02058b626
|
| 3 |
+
size 87929
|
ppo_lunarlander-v2_hpo/policy.pth
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:c5bcf2715d44705fe7d110bffa428469603c527bc88a3b0238f510424ae535f2
|
| 3 |
+
size 43393
|
ppo_lunarlander-v2_hpo/pytorch_variables.pth
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:d030ad8db708280fcae77d87e973102039acd23a11bdecc3db8eb6c0ac940ee1
|
| 3 |
+
size 431
|
ppo_lunarlander-v2_hpo/system_info.txt
ADDED
|
@@ -0,0 +1,7 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
- OS: Linux-5.15.0-67-generic-x86_64-with-glibc2.29 # 74~20.04.1-Ubuntu SMP Wed Feb 22 14:52:34 UTC 2023
|
| 2 |
+
- Python: 3.8.10
|
| 3 |
+
- Stable-Baselines3: 1.7.0
|
| 4 |
+
- PyTorch: 2.0.0+cu117
|
| 5 |
+
- GPU Enabled: True
|
| 6 |
+
- Numpy: 1.24.2
|
| 7 |
+
- Gym: 0.21.0
|
replay.mp4
CHANGED
|
Binary files a/replay.mp4 and b/replay.mp4 differ
|
|
|
results.json
CHANGED
|
@@ -1 +1 @@
|
|
| 1 |
-
{"mean_reward":
|
|
|
|
| 1 |
+
{"mean_reward": 119.96047343111745, "std_reward": 120.32348713766541, "is_deterministic": true, "n_eval_episodes": 10, "eval_datetime": "2023-03-21T11:57:57.841700"}
|