Commit ·
7f32eae
1
Parent(s): da9c2a6
Upload PPO LunarLander-v2 trained agent
Browse files- README.md +1 -1
- config.json +1 -1
- ppo-LunarLander-v2.zip +1 -1
- ppo-LunarLander-v2/data +24 -24
- ppo-LunarLander-v2/policy.optimizer.pth +1 -1
- ppo-LunarLander-v2/policy.pth +1 -1
- replay.mp4 +0 -0
- results.json +1 -1
README.md
CHANGED
|
@@ -16,7 +16,7 @@ model-index:
|
|
| 16 |
type: LunarLander-v2
|
| 17 |
metrics:
|
| 18 |
- type: mean_reward
|
| 19 |
-
value:
|
| 20 |
name: mean_reward
|
| 21 |
verified: false
|
| 22 |
---
|
|
|
|
| 16 |
type: LunarLander-v2
|
| 17 |
metrics:
|
| 18 |
- type: mean_reward
|
| 19 |
+
value: 292.03 +/- 14.79
|
| 20 |
name: mean_reward
|
| 21 |
verified: false
|
| 22 |
---
|
config.json
CHANGED
|
@@ -1 +1 @@
|
|
| 1 |
-
{"policy_class": {":type:": "<class 'abc.ABCMeta'>", ":serialized:": "gAWVOwAAAAAAAACMIXN0YWJsZV9iYXNlbGluZXMzLmNvbW1vbi5wb2xpY2llc5SMEUFjdG9yQ3JpdGljUG9saWN5lJOULg==", "__module__": "stable_baselines3.common.policies", "__doc__": "\n Policy class for actor-critic algorithms (has both policy and value prediction).\n Used by A2C, PPO and the likes.\n\n :param observation_space: Observation space\n :param action_space: Action space\n :param lr_schedule: Learning rate schedule (could be constant)\n :param net_arch: The specification of the policy and value networks.\n :param activation_fn: Activation function\n :param ortho_init: Whether to use or not orthogonal initialization\n :param use_sde: Whether to use State Dependent Exploration or not\n :param log_std_init: Initial value for the log standard deviation\n :param full_std: Whether to use (n_features x n_actions) parameters\n for the std instead of only (n_features,) when using gSDE\n :param use_expln: Use ``expln()`` function instead of ``exp()`` to ensure\n a positive standard deviation (cf paper). It allows to keep variance\n above zero and prevent it from growing too fast. In practice, ``exp()`` is usually enough.\n :param squash_output: Whether to squash the output using a tanh function,\n this allows to ensure boundaries when using gSDE.\n :param features_extractor_class: Features extractor to use.\n :param features_extractor_kwargs: Keyword arguments\n to pass to the features extractor.\n :param share_features_extractor: If True, the features extractor is shared between the policy and value networks.\n :param normalize_images: Whether to normalize images or not,\n dividing by 255.0 (True by default)\n :param optimizer_class: The optimizer to use,\n ``th.optim.Adam`` by default\n :param optimizer_kwargs: Additional keyword arguments,\n excluding the learning rate, to pass to the optimizer\n ", "__init__": "<function ActorCriticPolicy.__init__ at 0x7d69072093f0>", "_get_constructor_parameters": "<function ActorCriticPolicy._get_constructor_parameters at 0x7d6907209480>", "reset_noise": "<function ActorCriticPolicy.reset_noise at 0x7d6907209510>", "_build_mlp_extractor": "<function ActorCriticPolicy._build_mlp_extractor at 0x7d69072095a0>", "_build": "<function ActorCriticPolicy._build at 0x7d6907209630>", "forward": "<function ActorCriticPolicy.forward at 0x7d69072096c0>", "extract_features": "<function ActorCriticPolicy.extract_features at 0x7d6907209750>", "_get_action_dist_from_latent": "<function ActorCriticPolicy._get_action_dist_from_latent at 0x7d69072097e0>", "_predict": "<function ActorCriticPolicy._predict at 0x7d6907209870>", "evaluate_actions": "<function ActorCriticPolicy.evaluate_actions at 0x7d6907209900>", "get_distribution": "<function ActorCriticPolicy.get_distribution at 0x7d6907209990>", "predict_values": "<function ActorCriticPolicy.predict_values at 0x7d6907209a20>", "__abstractmethods__": "frozenset()", "_abc_impl": "<_abc._abc_data object at 0x7d6907210b80>"}, "verbose": 1, "policy_kwargs": {}, "num_timesteps": 5046272, "_total_timesteps": 5000000, "_num_timesteps_at_start": 0, "seed": null, "action_noise": null, "start_time": 1690227444805570883, "learning_rate": 0.0003, "tensorboard_log": null, "_last_obs": {":type:": "<class 'numpy.ndarray'>", ":serialized:": "gAWVdQIAAAAAAACMEm51bXB5LmNvcmUubnVtZXJpY5SMC19mcm9tYnVmZmVylJOUKJYAAgAAAAAAALNnJj6gkvM+qHvKvX2zEb8NfIU+rQ5uvQAAAAAAAAAA2nOePYywvD7ru9m9G7krv7fZCD6V3b+9AAAAAAAAAACgDmY+m8zEPqKztr6CXBu/sCtyPtkgmr4AAAAAAAAAABP0SD6uaJk/dBgZP9e1Jr94QcE+lg6hPgAAAAAAAAAAmqW+vb9QBD+dBlM9PT5Iv/J3U779Pv09AAAAAAAAAAAA4Ow7HPdOvLpaEb5p6ui7fwMfPdojpT0AAIA/AACAP5r0Dj3ZtFw/S0WYPcyNk7+tqS49aIxQPQAAAAAAAAAAZmaOOgXKl7t+ilO7pGMXPKOXyjwyxgq9AACAPwAAgD+z3Dg+cwigP5vT7D4Pxxy/CwinPjJGgz4AAAAAAAAAAADgGLzS+oC7tV9+vK0eazwXDMG8DXhLPQAAgD8AAIA/AFOaPF9jsz+j5us+PUgUvrs5LLxmPt+5AAAAAAAAAACmOqU9LlfdO7Xol77WLRS+m39XvTk9FD8AAIA/AAAAAM2YNjzDYV66oZaavDoPVDJwhFc6ZmX+swAAgD8AAIA/AKAUO+6BoT8o2qo8smA8vyI2KLsY5Ji7AAAAAAAAAABmhI88FMCzuqfkIbiJZRqzrFIGuo4HOTcAAIA/AACAP2aCyzvcuWu88rmgvgXziz1GpsM8uQnDuwAAgD8AAIA/lIwFbnVtcHmUjAVkdHlwZZSTlIwCZjSUiYiHlFKUKEsDjAE8lE5OTkr/////Sv////9LAHSUYksQSwiGlIwBQ5R0lFKULg=="}, "_last_episode_starts": {":type:": "<class 'numpy.ndarray'>", ":serialized:": "gAWVgwAAAAAAAACMEm51bXB5LmNvcmUubnVtZXJpY5SMC19mcm9tYnVmZmVylJOUKJYQAAAAAAAAAAAAAAAAAAAAAAAAAAAAAACUjAVudW1weZSMBWR0eXBllJOUjAJiMZSJiIeUUpQoSwOMAXyUTk5OSv////9K/////0sAdJRiSxCFlIwBQ5R0lFKULg=="}, "_last_original_obs": null, "_episode_num": 0, "use_sde": false, "sde_sample_freq": -1, "_current_progress_remaining": -0.009254400000000107, "_stats_window_size": 100, "ep_info_buffer": {":type:": "<class 'collections.deque'>", ":serialized:": "gAWV4AsAAAAAAACMC2NvbGxlY3Rpb25zlIwFZGVxdWWUk5QpS2SGlFKUKH2UKIwBcpRHQHHKdW2gFouMAWyUS4yMAXSUR0C12pjEJjUedX2UKGgGR0Bxqh1fVqetaAdLkGgIR0C12rMs6JZXdX2UKGgGR0ByYanVG0/oaAdLkWgIR0C12sWF36hydX2UKGgGR0By9/08NhE0aAdLyWgIR0C12tALVnVYdX2UKGgGR0BzA3KSxJNCaAdLrWgIR0C12tHf/FR6dX2UKGgGR0By1Uis4ku6aAdLk2gIR0C12uWrfcesdX2UKGgGR0BvTvU6PsAvaAdLmmgIR0C12vVPva11dX2UKGgGR0Bwi4Qrc0tRaAdLk2gIR0C12wFKkEcLdX2UKGgGR0Bz1wvugHu7aAdLqmgIR0C12wlaOgg6dX2UKGgGR0BybhUyYXwcaAdLvWgIR0C12w9z8xbjdX2UKGgGR0ByMFd5Y5ktaAdLnmgIR0C12zTA31jBdX2UKGgGR0Bw+vMKTjebaAdLoWgIR0C12z8P4EfUdX2UKGgGR0Bx2NW912aEaAdLqWgIR0C12z0EovzwdX2UKGgGR0BybGIsRQJpaAdLuGgIR0C120OR9w3pdX2UKGgGR0BxntHe7+UAaAdLm2gIR0C122PMwDeTdX2UKGgGR0BxaaO938oAaAdLt2gIR0C122jURWcSdX2UKGgGR0BwZAHLRrrPaAdLlmgIR0C123SVbA1vdX2UKGgGR0BzbtCKJl8PaAdLrGgIR0C123IhY/3WdX2UKGgGR0Bye3Tqjaf0aAdLemgIR0C124ABLf1pdX2UKGgGR0BxOH2USqVAaAdLp2gIR0C125giiZfEdX2UKGgGR0ByHEJTl1bJaAdLj2gIR0C126oePq9odX2UKGgGR0ByGwE/0NBoaAdLuGgIR0C127oLofSydX2UKGgGR0BzD3ZrYXfqaAdLwmgIR0C128feLvTgdX2UKGgGR0BwgAmReTmoaAdLmmgIR0C129AXZXdTdX2UKGgGR0BxdgSnLq2SaAdLn2gIR0C129yUX531dX2UKGgGR0BxjKpyZKFqaAdLqGgIR0C129pDE3sHdX2UKGgGR0BzEvZK3/gjaAdLo2gIR0C13AZ80DU3dX2UKGgGR0BxsSDnNgSfaAdLrWgIR0C13Bur2g3+dX2UKGgGR0BzLhX2dupCaAdLs2gIR0C13Cpf6XSjdX2UKGgGR0B0G6cc2itaaAdLuWgIR0C13C33g1m8dX2UKGgGR0BzQDS2H+IeaAdLomgIR0C13DpJkGzKdX2UKGgGR0BykWgam4y5aAdLqGgIR0C13D1K5CnhdX2UKGgGR0Byx4QRPGhmaAdLm2gIR0C13EgzUI9ldX2UKGgGR0BwIxefI0ZWaAdLqGgIR0C13E1cD8tPdX2UKGgGR0Bxd5z0Yj0MaAdLtWgIR0C13IUgW8AadX2UKGgGR0BzFtcNYr8SaAdL1mgIR0C13Iko8ZDRdX2UKGgGR0Bw63HFPznSaAdLi2gIR0C13JHGsFMadX2UKGgGR0ByK8W1twaSaAdLuGgIR0C13J9NJvpAdX2UKGgGR0BzYw14xDb8aAdLv2gIR0C13LmDDjzadX2UKGgGR0BzMji6xxDLaAdLt2gIR0C13MQkgOjJdX2UKGgGR0BydO6MBIWhaAdLx2gIR0C13NKB/ZuidX2UKGgGR0Byjd7IDHOsaAdLumgIR0C13NbGR3eOdX2UKGgGR0ByY3hl18suaAdLlmgIR0C13OiosI3SdX2UKGgGR0Bzhl4VymygaAdLm2gIR0C13PzAaef7dX2UKGgGR0By4BBC2MKkaAdLimgIR0C13QnL3bmEdX2UKGgGR0B0c0aNuLrHaAdLx2gIR0C13RMXBP9DdX2UKGgGR0BxeAL/jsD5aAdLmmgIR0C13Rojnmq6dX2UKGgGR0BzYlLcsUZfaAdLuGgIR0C13SWsvIwNdX2UKGgGR0BxYdSydFvyaAdLrmgIR0C13SV6Rhc8dX2UKGgGR0BymVYdQwbmaAdLtWgIR0C13TCDh99ddX2UKGgGR0BxUYVJtix3aAdLmWgIR0C13VkEcKgJdX2UKGgGR0BydM2XLNfPaAdLoGgIR0C13VvjKgZkdX2UKGgGR0ByVKnDR+jNaAdLtWgIR0C13XQN5MURdX2UKGgGR0Bxeqf029+PaAdLlWgIR0C13ZYzabnYdX2UKGgGR0By0kdcSoOyaAdLumgIR0C13ZSWAwwkdX2UKGgGR0Bw1mESM98raAdLrGgIR0C13ZsP4EfUdX2UKGgGR0BwOX1schkiaAdLjGgIR0C13Z3HmzSkdX2UKGgGR0Bw0lsk6cRUaAdLnWgIR0C13Z251/2CdX2UKGgGR0BzP2DpTuOTaAdLrmgIR0C13adilSCOdX2UKGgGR0Bw2mAiFCb+aAdLlmgIR0C13c8NhE0BdX2UKGgGR0B0MMzl90A+aAdLrGgIR0C13eC5y2hJdX2UKGgGR0Bx5SFev6j4aAdLqGgIR0C13fGapgkUdX2UKGgGR0Bykfi5uqFRaAdLlGgIR0C13fY5PuXvdX2UKGgGR0BzmCxY7q6faAdLs2gIR0C13gXWrfcfdX2UKGgGR0ByzguxrzoVaAdLt2gIR0C13hZT6zmfdX2UKGgGR0ByjIsTWXkYaAdLwWgIR0C13iNdE9dNdX2UKGgGR0BzJh6Z6UqyaAdLr2gIR0C13kfTTfBOdX2UKGgGR0BzQQIyCWeIaAdLvmgIR0C13ljGHYYjdX2UKGgGR0ByPEzl90A+aAdLq2gIR0C13lrj1f3OdX2UKGgGR0BzYUi0OVgQaAdLn2gIR0C13nQDvE0jdX2UKGgGR0BwN9/BnBciaAdLoGgIR0C13oPpD/lydX2UKGgGR0BxeO0D2alUaAdLrGgIR0C13ousHSncdX2UKGgGR0BzuYeIVM24aAdLv2gIR0C13rRSxZ+ydX2UKGgGR0BzpEGSpzcRaAdLyGgIR0C13rkvkBCEdX2UKGgGR0B0itUgjhUBaAdLyWgIR0C13r3b212JdX2UKGgGR0BxCGaAnUlSaAdLhmgIR0C13r9yxRl6dX2UKGgGR0Bx22K508vFaAdLtWgIR0C13udlAeJYdX2UKGgGR0BxhYGJN0vHaAdLo2gIR0C13xFD8cdYdX2UKGgGR0BxtsV1wHZ9aAdLtGgIR0C13xmm1pj+dX2UKGgGR0BzYuh24d6taAdLyGgIR0C13yDuKGcndX2UKGgGR0By82I42jwhaAdLomgIR0C13ylijL0SdX2UKGgGR0BycIQf6oETaAdLtmgIR0C132Cbc45tdX2UKGgGR0BwocmjTKDDaAdLn2gIR0C132kwBYFJdX2UKGgGR0ByM2sIVuaXaAdLmmgIR0C133gWBSUDdX2UKGgGR0BwQ+CAc1fmaAdLkmgIR0C134re67NCdX2UKGgGR0BwHxDv3JxOaAdLkGgIR0C138MYMvytdX2UKGgGR0BwIHNY8uBdaAdLlmgIR0C139PW6K+BdX2UKGgGR0BzrV83Mpw0aAdLr2gIR0C139fJeVs2dX2UKGgGR0B0zqJP69CeaAdLzmgIR0C1390RSP2gdX2UKGgGR0BwnfeZXuE3aAdLm2gIR0C13+IzN2TxdX2UKGgGR0ByuuPYFqzraAdLwGgIR0C13/HXmNipdX2UKGgGR0BzEbE0iyIIaAdLvmgIR0C14B9/FzdUdX2UKGgGR0BwvNmSQo1DaAdLnGgIR0C14DH8TBZZdX2UKGgGR0BxvxzCDVYqaAdLtGgIR0C14DOrp7kXdX2UKGgGR0BxdcQHzH0caAdLsGgIR0C14FwRGtp3dX2UKGgGR0ByOxC8e0XxaAdLumgIR0C14H7SeAd5dX2UKGgGR0Bv0l0V8CxNaAdLo2gIR0C14I0CeVcEdX2UKGgGR0BzwfvlU6xPaAdLxWgIR0C14I3K8tf5dX2UKGgGR0BzpJemelKsaAdLsGgIR0C14LALmZE2dX2UKGgGR0BvPKIi1RceaAdLpWgIR0C14L5M+NcXdWUu"}, "ep_success_buffer": {":type:": "<class 'collections.deque'>", ":serialized:": "gAWVIAAAAAAAAACMC2NvbGxlY3Rpb25zlIwFZGVxdWWUk5QpS2SGlFKULg=="}, "_n_updates": 616, "observation_space": {":type:": "<class 'gymnasium.spaces.box.Box'>", ":serialized:": "gAWVcAIAAAAAAACMFGd5bW5hc2l1bS5zcGFjZXMuYm94lIwDQm94lJOUKYGUfZQojAVkdHlwZZSMBW51bXB5lGgFk5SMAmY0lImIh5RSlChLA4wBPJROTk5K/////0r/////SwB0lGKMDWJvdW5kZWRfYmVsb3eUjBJudW1weS5jb3JlLm51bWVyaWOUjAtfZnJvbWJ1ZmZlcpSTlCiWCAAAAAAAAAABAQEBAQEBAZRoB4wCYjGUiYiHlFKUKEsDjAF8lE5OTkr/////Sv////9LAHSUYksIhZSMAUOUdJRSlIwNYm91bmRlZF9hYm92ZZRoECiWCAAAAAAAAAABAQEBAQEBAZRoFEsIhZRoGHSUUpSMBl9zaGFwZZRLCIWUjANsb3eUaBAoliAAAAAAAAAAAAC0wgAAtMIAAKDAAACgwNsPScAAAKDAAAAAgAAAAICUaApLCIWUaBh0lFKUjARoaWdolGgQKJYgAAAAAAAAAAAAtEIAALRCAACgQAAAoEDbD0lAAACgQAAAgD8AAIA/lGgKSwiFlGgYdJRSlIwIbG93X3JlcHKUjFtbLTkwLiAgICAgICAgLTkwLiAgICAgICAgIC01LiAgICAgICAgIC01LiAgICAgICAgIC0zLjE0MTU5MjcgIC01LgogIC0wLiAgICAgICAgIC0wLiAgICAgICBdlIwJaGlnaF9yZXBylIxTWzkwLiAgICAgICAgOTAuICAgICAgICAgNS4gICAgICAgICA1LiAgICAgICAgIDMuMTQxNTkyNyAgNS4KICAxLiAgICAgICAgIDEuICAgICAgIF2UjApfbnBfcmFuZG9tlE51Yi4=", "dtype": "float32", "bounded_below": "[ True True True True True True True True]", "bounded_above": "[ True True True True True True True True]", "_shape": [8], "low": "[-90. -90. -5. -5. -3.1415927 -5.\n -0. -0. ]", "high": "[90. 90. 5. 5. 3.1415927 5.\n 1. 1. ]", "low_repr": "[-90. -90. -5. -5. -3.1415927 -5.\n -0. -0. ]", "high_repr": "[90. 90. 5. 5. 3.1415927 5.\n 1. 1. ]", "_np_random": null}, "action_space": {":type:": "<class 'gymnasium.spaces.discrete.Discrete'>", ":serialized:": "gAWV1QAAAAAAAACMGWd5bW5hc2l1bS5zcGFjZXMuZGlzY3JldGWUjAhEaXNjcmV0ZZSTlCmBlH2UKIwBbpSMFW51bXB5LmNvcmUubXVsdGlhcnJheZSMBnNjYWxhcpSTlIwFbnVtcHmUjAVkdHlwZZSTlIwCaTiUiYiHlFKUKEsDjAE8lE5OTkr/////Sv////9LAHSUYkMIBAAAAAAAAACUhpRSlIwFc3RhcnSUaAhoDkMIAAAAAAAAAACUhpRSlIwGX3NoYXBllCloCmgOjApfbnBfcmFuZG9tlE51Yi4=", "n": "4", "start": "0", "_shape": [], "dtype": "int64", "_np_random": null}, "n_envs": 16, "n_steps": 4096, "gamma": 0.9965591734846347, "gae_lambda": 0.9788057367973633, "ent_coef": 0.006067412634309154, "vf_coef": 0.5, "max_grad_norm": 0.5, "batch_size": 64, "n_epochs": 8, "clip_range": {":type:": "<class 'function'>", ":serialized:": "gAWVxQIAAAAAAACMF2Nsb3VkcGlja2xlLmNsb3VkcGlja2xllIwOX21ha2VfZnVuY3Rpb26Uk5QoaACMDV9idWlsdGluX3R5cGWUk5SMCENvZGVUeXBllIWUUpQoSwFLAEsASwFLAUsTQwSIAFMAlE6FlCmMAV+UhZSMSS91c3IvbG9jYWwvbGliL3B5dGhvbjMuMTAvZGlzdC1wYWNrYWdlcy9zdGFibGVfYmFzZWxpbmVzMy9jb21tb24vdXRpbHMucHmUjARmdW5jlEuEQwIEAZSMA3ZhbJSFlCl0lFKUfZQojAtfX3BhY2thZ2VfX5SMGHN0YWJsZV9iYXNlbGluZXMzLmNvbW1vbpSMCF9fbmFtZV9flIwec3RhYmxlX2Jhc2VsaW5lczMuY29tbW9uLnV0aWxzlIwIX19maWxlX1+UjEkvdXNyL2xvY2FsL2xpYi9weXRob24zLjEwL2Rpc3QtcGFja2FnZXMvc3RhYmxlX2Jhc2VsaW5lczMvY29tbW9uL3V0aWxzLnB5lHVOTmgAjBBfbWFrZV9lbXB0eV9jZWxslJOUKVKUhZR0lFKUjBxjbG91ZHBpY2tsZS5jbG91ZHBpY2tsZV9mYXN0lIwSX2Z1bmN0aW9uX3NldHN0YXRllJOUaB99lH2UKGgWaA2MDF9fcXVhbG5hbWVfX5SMGWNvbnN0YW50X2ZuLjxsb2NhbHM+LmZ1bmOUjA9fX2Fubm90YXRpb25zX1+UfZSMDl9fa3dkZWZhdWx0c19flE6MDF9fZGVmYXVsdHNfX5ROjApfX21vZHVsZV9flGgXjAdfX2RvY19flE6MC19fY2xvc3VyZV9flGgAjApfbWFrZV9jZWxslJOURz/JmZmZmZmahZRSlIWUjBdfY2xvdWRwaWNrbGVfc3VibW9kdWxlc5RdlIwLX19nbG9iYWxzX1+UfZR1hpSGUjAu"}, "clip_range_vf": null, "normalize_advantage": true, "target_kl": null, "lr_schedule": {":type:": "<class 'function'>", ":serialized:": "gAWVxQIAAAAAAACMF2Nsb3VkcGlja2xlLmNsb3VkcGlja2xllIwOX21ha2VfZnVuY3Rpb26Uk5QoaACMDV9idWlsdGluX3R5cGWUk5SMCENvZGVUeXBllIWUUpQoSwFLAEsASwFLAUsTQwSIAFMAlE6FlCmMAV+UhZSMSS91c3IvbG9jYWwvbGliL3B5dGhvbjMuMTAvZGlzdC1wYWNrYWdlcy9zdGFibGVfYmFzZWxpbmVzMy9jb21tb24vdXRpbHMucHmUjARmdW5jlEuEQwIEAZSMA3ZhbJSFlCl0lFKUfZQojAtfX3BhY2thZ2VfX5SMGHN0YWJsZV9iYXNlbGluZXMzLmNvbW1vbpSMCF9fbmFtZV9flIwec3RhYmxlX2Jhc2VsaW5lczMuY29tbW9uLnV0aWxzlIwIX19maWxlX1+UjEkvdXNyL2xvY2FsL2xpYi9weXRob24zLjEwL2Rpc3QtcGFja2FnZXMvc3RhYmxlX2Jhc2VsaW5lczMvY29tbW9uL3V0aWxzLnB5lHVOTmgAjBBfbWFrZV9lbXB0eV9jZWxslJOUKVKUhZR0lFKUjBxjbG91ZHBpY2tsZS5jbG91ZHBpY2tsZV9mYXN0lIwSX2Z1bmN0aW9uX3NldHN0YXRllJOUaB99lH2UKGgWaA2MDF9fcXVhbG5hbWVfX5SMGWNvbnN0YW50X2ZuLjxsb2NhbHM+LmZ1bmOUjA9fX2Fubm90YXRpb25zX1+UfZSMDl9fa3dkZWZhdWx0c19flE6MDF9fZGVmYXVsdHNfX5ROjApfX21vZHVsZV9flGgXjAdfX2RvY19flE6MC19fY2xvc3VyZV9flGgAjApfbWFrZV9jZWxslJOURz8zqSowVTJhhZRSlIWUjBdfY2xvdWRwaWNrbGVfc3VibW9kdWxlc5RdlIwLX19nbG9iYWxzX1+UfZR1hpSGUjAu"}, "system_info": {"OS": "Linux-5.15.109+-x86_64-with-glibc2.35 # 1 SMP Fri Jun 9 10:57:30 UTC 2023", "Python": "3.10.6", "Stable-Baselines3": "2.0.0a5", "PyTorch": "2.0.1+cu118", "GPU Enabled": "True", "Numpy": "1.22.4", "Cloudpickle": "2.2.1", "Gymnasium": "0.28.1", "OpenAI Gym": "0.25.2"}}
|
|
|
|
| 1 |
+
{"policy_class": {":type:": "<class 'abc.ABCMeta'>", ":serialized:": "gAWVOwAAAAAAAACMIXN0YWJsZV9iYXNlbGluZXMzLmNvbW1vbi5wb2xpY2llc5SMEUFjdG9yQ3JpdGljUG9saWN5lJOULg==", "__module__": "stable_baselines3.common.policies", "__doc__": "\n Policy class for actor-critic algorithms (has both policy and value prediction).\n Used by A2C, PPO and the likes.\n\n :param observation_space: Observation space\n :param action_space: Action space\n :param lr_schedule: Learning rate schedule (could be constant)\n :param net_arch: The specification of the policy and value networks.\n :param activation_fn: Activation function\n :param ortho_init: Whether to use or not orthogonal initialization\n :param use_sde: Whether to use State Dependent Exploration or not\n :param log_std_init: Initial value for the log standard deviation\n :param full_std: Whether to use (n_features x n_actions) parameters\n for the std instead of only (n_features,) when using gSDE\n :param use_expln: Use ``expln()`` function instead of ``exp()`` to ensure\n a positive standard deviation (cf paper). It allows to keep variance\n above zero and prevent it from growing too fast. In practice, ``exp()`` is usually enough.\n :param squash_output: Whether to squash the output using a tanh function,\n this allows to ensure boundaries when using gSDE.\n :param features_extractor_class: Features extractor to use.\n :param features_extractor_kwargs: Keyword arguments\n to pass to the features extractor.\n :param share_features_extractor: If True, the features extractor is shared between the policy and value networks.\n :param normalize_images: Whether to normalize images or not,\n dividing by 255.0 (True by default)\n :param optimizer_class: The optimizer to use,\n ``th.optim.Adam`` by default\n :param optimizer_kwargs: Additional keyword arguments,\n excluding the learning rate, to pass to the optimizer\n ", "__init__": "<function ActorCriticPolicy.__init__ at 0x7f7be8202a70>", "_get_constructor_parameters": "<function ActorCriticPolicy._get_constructor_parameters at 0x7f7be8202b00>", "reset_noise": "<function ActorCriticPolicy.reset_noise at 0x7f7be8202b90>", "_build_mlp_extractor": "<function ActorCriticPolicy._build_mlp_extractor at 0x7f7be8202c20>", "_build": "<function ActorCriticPolicy._build at 0x7f7be8202cb0>", "forward": "<function ActorCriticPolicy.forward at 0x7f7be8202d40>", "extract_features": "<function ActorCriticPolicy.extract_features at 0x7f7be8202dd0>", "_get_action_dist_from_latent": "<function ActorCriticPolicy._get_action_dist_from_latent at 0x7f7be8202e60>", "_predict": "<function ActorCriticPolicy._predict at 0x7f7be8202ef0>", "evaluate_actions": "<function ActorCriticPolicy.evaluate_actions at 0x7f7be8202f80>", "get_distribution": "<function ActorCriticPolicy.get_distribution at 0x7f7be8203010>", "predict_values": "<function ActorCriticPolicy.predict_values at 0x7f7be82030a0>", "__abstractmethods__": "frozenset()", "_abc_impl": "<_abc._abc_data object at 0x7f7be820c780>"}, "verbose": 1, "policy_kwargs": {}, "num_timesteps": 6029312, "_total_timesteps": 6000000, "_num_timesteps_at_start": 0, "seed": null, "action_noise": null, "start_time": 1690313243737686727, "learning_rate": 0.0003, "tensorboard_log": null, "_last_obs": {":type:": "<class 'numpy.ndarray'>", ":serialized:": "gAWVdQIAAAAAAACMEm51bXB5LmNvcmUubnVtZXJpY5SMC19mcm9tYnVmZmVylJOUKJYAAgAAAAAAAE2js735iqo/iqGcvif+774tLqG9bPkxvgAAAAAAAAAAgOQtvfagcbqtDS24Xiyqskq9+rrx80g3AACAPwAAgD/mwQi+/PFOP073B74622i/pV5gvk054zoAAAAAAAAAAAD/Yz3wUZs/WOmuPsyPRb/zYLQ9thlYPgAAAAAAAAAAszYsPWx8Lz6WPcC8LfQYvxMloz2FrC28AAAAAAAAAAAztka+25OWPlyKmD60k/S+MIhTvstifj4AAAAAAAAAAFp7LT567yI/hSFXvdbMNr9PcpA+iP85vgAAAAAAAAAAmtxoPbRWiz+w0/U9qSJiv0rUyT2dEuc9AAAAAAAAAACaZ/A88bgzPMhbVr7pm6y9O1bmvR06cT8AAIA/AAAAAIDi5r3x8qM9k5DnPl57wL7A36A90GpUPgAAAAAAAAAAzQyaOwrYNbsiNH29/IwEPGZVZrzdH/M8AACAPwAAgD9aErW9id9dPc79VT5H7La+6ppBvfKJIT0AAAAAAAAAAGZX270Nqq0/pamHvkLkCL/qGYS9+YYivgAAAAAAAAAAQNLAvSkIM7pt8ss8pQ7IOwB+ULtKda48AACAPwAAgD+ztim9XMMGuoy/JjR0jdkv+GbgO7UNtLMAAIA/AACAP3PY+71MrJ8/cPInv4dOJL+5yvu9TMLEvgAAAAAAAAAAlIwFbnVtcHmUjAVkdHlwZZSTlIwCZjSUiYiHlFKUKEsDjAE8lE5OTkr/////Sv////9LAHSUYksQSwiGlIwBQ5R0lFKULg=="}, "_last_episode_starts": {":type:": "<class 'numpy.ndarray'>", ":serialized:": "gAWVgwAAAAAAAACMEm51bXB5LmNvcmUubnVtZXJpY5SMC19mcm9tYnVmZmVylJOUKJYQAAAAAAAAAAAAAAAAAAAAAAAAAAAAAACUjAVudW1weZSMBWR0eXBllJOUjAJiMZSJiIeUUpQoSwOMAXyUTk5OSv////9K/////0sAdJRiSxCFlIwBQ5R0lFKULg=="}, "_last_original_obs": null, "_episode_num": 0, "use_sde": false, "sde_sample_freq": -1, "_current_progress_remaining": -0.004885333333333408, "_stats_window_size": 100, "ep_info_buffer": {":type:": "<class 'collections.deque'>", ":serialized:": "gAWV4AsAAAAAAACMC2NvbGxlY3Rpb25zlIwFZGVxdWWUk5QpS2SGlFKUKH2UKIwBcpRHQHKlF/QSi/SMAWyUS92MAXSUR0C5UEIRVZLadX2UKGgGR0ByhnpX6qKhaAdLn2gIR0C5UFq3VkMDdX2UKGgGR0Bzuw2zfJmvaAdLyWgIR0C5UGzYEnstdX2UKGgGR0BwOsd92HLzaAdLkGgIR0C5UHGdRR/FdX2UKGgGR0ByTRtXPqs2aAdLrWgIR0C5UIQLiMo+dX2UKGgGR0BzR/rcCYCyaAdLzWgIR0C5UKYA0bcXdX2UKGgGR0Byixlbu+h5aAdLiGgIR0C5ULGykbgkdX2UKGgGR0A98HJtBOYZaAdLX2gIR0C5ULw+Y+jedX2UKGgGR0BzgHd1uBMBaAdLrGgIR0C5UL9vbXYldX2UKGgGR0ByLnV9Wp6yaAdLs2gIR0C5UMORYA80dX2UKGgGR0By22iRGMGYaAdLr2gIR0C5UNm5Yoy9dX2UKGgGR0BybN1jiGWVaAdLm2gIR0C5UNk7nxJ/dX2UKGgGR0Bx3YgJTl1baAdLsmgIR0C5UNuFpPAPdX2UKGgGR0Bw6lXGOuJUaAdLlGgIR0C5UQSEQGwBdX2UKGgGR0ByXC704BFNaAdLu2gIR0C5URUUKzAvdX2UKGgGR0BynzuF6AvtaAdLnGgIR0C5URRKtga4dX2UKGgGR0ByeXf0mMOxaAdLq2gIR0C5URptvXK9dX2UKGgGR0BxASPKdQO4aAdLl2gIR0C5USx0lqrSdX2UKGgGR0BzBZIg/1QJaAdLomgIR0C5USq+evpydX2UKGgGR0BxKE96kZaWaAdLpGgIR0C5UTb9MsYmdX2UKGgGR0BxJmarmyPdaAdLqGgIR0C5UUpcgQpXdX2UKGgGR0Bz2PyiEg4faAdLlWgIR0C5UU3ssxwidX2UKGgGR0ByHsMy8BdVaAdLpmgIR0C5UWvYvnKXdX2UKGgGR0BwuD6hxo7FaAdLnWgIR0C5UW+NkvsadX2UKGgGR0ByLjaews5GaAdLoWgIR0C5UXgcDKYBdX2UKGgGR0BzvnktEofCaAdLp2gIR0C5UXf3JxNqdX2UKGgGR0BxhxwuM+/yaAdLoGgIR0C5UYxNmDlHdX2UKGgGR0ByKkAYHgP3aAdLsGgIR0C5UaPLDAJtdX2UKGgGR0BzoZfICEHuaAdLvWgIR0C5UbZWV/tqdX2UKGgGR0BzSLm0VrRCaAdLnWgIR0C5UdHB+F10dX2UKGgGR0Bz93KdQO4HaAdLs2gIR0C5UdyIcinpdX2UKGgGR0Bzeq48U21laAdLpWgIR0C5UfRnvlU7dX2UKGgGR0By2BwKjSG8aAdLv2gIR0C5UfzLOiWWdX2UKGgGR0By7ayB06o3aAdLpGgIR0C5UgBMvh60dX2UKGgGR0BzeyoVEd/8aAdLlmgIR0C5UgduLrHEdX2UKGgGR0BzhaOn2qT9aAdLxWgIR0C5UgldxAB1dX2UKGgGR0B0WmGpMpPRaAdLxWgIR0C5UhrMHKOldX2UKGgGR0ByOvGEPDpDaAdLs2gIR0C5UiUpqh11dX2UKGgGR0Bw/95HEuQIaAdLi2gIR0C5UiQZ88cNdX2UKGgGR0B0AiB4D9wWaAdLnGgIR0C5Uje+Eh7mdX2UKGgGR0BxTVjFyaNNaAdLpmgIR0C5UjgC0WuYdX2UKGgGR0Bx/LEBKcuraAdLpmgIR0C5UlgZsKsudX2UKGgGR0By0BQxesxPaAdLwWgIR0C5Ulk9ZA6ddX2UKGgGR0ByZZqmCROlaAdLp2gIR0C5Ums1baAXdX2UKGgGR0BxdO9ytFKDaAdLiWgIR0C5UnwlF+d9dX2UKGgGR0BzszoePq9oaAdLsGgIR0C5UohMSK3vdX2UKGgGR0BK8ZxiobXIaAdLYWgIR0C5Uot4RmK7dX2UKGgGR0Byt8oYvWYnaAdLoWgIR0C5Uq6rJbMYdX2UKGgGR0BzNp/mT1TSaAdLmWgIR0C5UrFMZgogdX2UKGgGR0Bx6fIfbKzSaAdLnmgIR0C5UrPzBhx6dX2UKGgGR0BzfoQvpQk5aAdLwWgIR0C5UrRIFvAHdX2UKGgGR0BxDkAhje9BaAdLiWgIR0C5UsGygPEsdX2UKGgGR0By3jfcer+6aAdLrGgIR0C5UszPrv9cdX2UKGgGR0Bzi8UFjd56aAdLuGgIR0C5UttTkyULdX2UKGgGR0BxwbxhDw6RaAdLo2gIR0C5Ut9vGZNPdX2UKGgGR0BwpnOE/SpjaAdLmmgIR0C5UuZ8WsRydX2UKGgGR0BwR1W6shgWaAdLiWgIR0C5UvMjiXIEdX2UKGgGR0BwXrzasZHeaAdLpmgIR0C5UvPrGBFvdX2UKGgGR0BxBnrSmZVoaAdLmGgIR0C5UwRHkLhKdX2UKGgGR0Bv96r5qM3qaAdLmmgIR0C5Uxd5Y5ktdX2UKGgGR0BwWggq3EydaAdLnWgIR0C5UzTAzpHJdX2UKGgGR0BygQjIJZ4faAdLqGgIR0C5UzW/rSmZdX2UKGgGR0BwwNHSWqtHaAdLnmgIR0C5UzjvE0iydX2UKGgGR0BxrsEHMUypaAdLgGgIR0C5Uz31OCXhdX2UKGgGR0Bx9nrLQokSaAdLpWgIR0C5U2ExM36zdX2UKGgGR0BxoGaAnUlSaAdLpmgIR0C5U2QsCkoGdX2UKGgGR0ByKwtmL9/CaAdLr2gIR0C5U3B9XtBwdX2UKGgGR0ByBpVea8YiaAdLi2gIR0C5U3Un1FpgdX2UKGgGR0BxTQf3evZAaAdLnGgIR0C5U3UVJtiydX2UKGgGR0BytH/FR51OaAdLhWgIR0C5U3cqvvBrdX2UKGgGR0BzNXnGKhtcaAdLp2gIR0C5U3fBN21VdX2UKGgGR0BvbxDArQPaaAdLlGgIR0C5U5IigTRIdX2UKGgGR0ByRdiMHbAUaAdLtWgIR0C5U51Bt1p1dX2UKGgGR0Bwc9zcRDkVaAdLmGgIR0C5U6czEaVEdX2UKGgGR0ByacOTaCcxaAdLs2gIR0C5U7PugHu7dX2UKGgGR0B0M97JGOMmaAdLtWgIR0C5U97NbC79dX2UKGgGR0BxX0mlZX+3aAdLm2gIR0C5U+OgctGvdX2UKGgGR0BxWxI5HVgAaAdLsWgIR0C5U/n8O09hdX2UKGgGR0ByAuEIw/PgaAdLsGgIR0C5VAFvIfbLdX2UKGgGR0Bz/zpu/DceaAdLvWgIR0C5VAbiIciodX2UKGgGR0BxM8/7iyY5aAdLhGgIR0C5VApu63AmdX2UKGgGR0Byo+VJL/S6aAdLnWgIR0C5VBB7mdRSdX2UKGgGR0Bzk0UO/cnFaAdLlWgIR0C5VBy8jAzpdX2UKGgGR0BybbBi1AqvaAdLmmgIR0C5VB3BciW3dX2UKGgGR0BzelzbN8mbaAdLnWgIR0C5VCUjcEeRdX2UKGgGR0ByF962OQyRaAdLqmgIR0C5VCJ4nndPdX2UKGgGR0BwXaGFi8WcaAdLsWgIR0C5VDm6bvw3dX2UKGgGR0BxUjbItDlYaAdLmGgIR0C5VEdrKvFFdX2UKGgGR0ByU22SdOIqaAdLuWgIR0C5VGJ8WsRydX2UKGgGR0Bw+id5IH1OaAdLqmgIR0C5VGhGpda/dX2UKGgGR0BxhCW4Vh1DaAdLn2gIR0C5VGk+C9RKdX2UKGgGR0BwN+Y/mknDaAdLlmgIR0C5VIhLoOhCdX2UKGgGR0BxbppztCzDaAdLiWgIR0C5VJRPO6d2dX2UKGgGR0Bx4IymALApaAdLgWgIR0C5VJvVAiV0dX2UKGgGR0BylnPJJXhgaAdLf2gIR0C5VKztsvZidX2UKGgGR0ByGwbp/wy7aAdLhmgIR0C5VLcLv1DjdX2UKGgGR0BzmClhw2l3aAdLo2gIR0C5VLvDxb0OdX2UKGgGR0B0KA+s5n14aAdLyWgIR0C5VMljy4FzdX2UKGgGR0BwrrX05EMLaAdLmGgIR0C5VNAXMyJsdX2UKGgGR0ByjKfpUxVRaAdLtWgIR0C5VNSEtdzGdWUu"}, "ep_success_buffer": {":type:": "<class 'collections.deque'>", ":serialized:": "gAWVIAAAAAAAAACMC2NvbGxlY3Rpb25zlIwFZGVxdWWUk5QpS2SGlFKULg=="}, "_n_updates": 920, "observation_space": {":type:": "<class 'gymnasium.spaces.box.Box'>", ":serialized:": "gAWVcAIAAAAAAACMFGd5bW5hc2l1bS5zcGFjZXMuYm94lIwDQm94lJOUKYGUfZQojAVkdHlwZZSMBW51bXB5lGgFk5SMAmY0lImIh5RSlChLA4wBPJROTk5K/////0r/////SwB0lGKMDWJvdW5kZWRfYmVsb3eUjBJudW1weS5jb3JlLm51bWVyaWOUjAtfZnJvbWJ1ZmZlcpSTlCiWCAAAAAAAAAABAQEBAQEBAZRoB4wCYjGUiYiHlFKUKEsDjAF8lE5OTkr/////Sv////9LAHSUYksIhZSMAUOUdJRSlIwNYm91bmRlZF9hYm92ZZRoECiWCAAAAAAAAAABAQEBAQEBAZRoFEsIhZRoGHSUUpSMBl9zaGFwZZRLCIWUjANsb3eUaBAoliAAAAAAAAAAAAC0wgAAtMIAAKDAAACgwNsPScAAAKDAAAAAgAAAAICUaApLCIWUaBh0lFKUjARoaWdolGgQKJYgAAAAAAAAAAAAtEIAALRCAACgQAAAoEDbD0lAAACgQAAAgD8AAIA/lGgKSwiFlGgYdJRSlIwIbG93X3JlcHKUjFtbLTkwLiAgICAgICAgLTkwLiAgICAgICAgIC01LiAgICAgICAgIC01LiAgICAgICAgIC0zLjE0MTU5MjcgIC01LgogIC0wLiAgICAgICAgIC0wLiAgICAgICBdlIwJaGlnaF9yZXBylIxTWzkwLiAgICAgICAgOTAuICAgICAgICAgNS4gICAgICAgICA1LiAgICAgICAgIDMuMTQxNTkyNyAgNS4KICAxLiAgICAgICAgIDEuICAgICAgIF2UjApfbnBfcmFuZG9tlE51Yi4=", "dtype": "float32", "bounded_below": "[ True True True True True True True True]", "bounded_above": "[ True True True True True True True True]", "_shape": [8], "low": "[-90. -90. -5. -5. -3.1415927 -5.\n -0. -0. ]", "high": "[90. 90. 5. 5. 3.1415927 5.\n 1. 1. ]", "low_repr": "[-90. -90. -5. -5. -3.1415927 -5.\n -0. -0. ]", "high_repr": "[90. 90. 5. 5. 3.1415927 5.\n 1. 1. ]", "_np_random": null}, "action_space": {":type:": "<class 'gymnasium.spaces.discrete.Discrete'>", ":serialized:": "gAWV1QAAAAAAAACMGWd5bW5hc2l1bS5zcGFjZXMuZGlzY3JldGWUjAhEaXNjcmV0ZZSTlCmBlH2UKIwBbpSMFW51bXB5LmNvcmUubXVsdGlhcnJheZSMBnNjYWxhcpSTlIwFbnVtcHmUjAVkdHlwZZSTlIwCaTiUiYiHlFKUKEsDjAE8lE5OTkr/////Sv////9LAHSUYkMIBAAAAAAAAACUhpRSlIwFc3RhcnSUaAhoDkMIAAAAAAAAAACUhpRSlIwGX3NoYXBllCloCmgOjApfbnBfcmFuZG9tlE51Yi4=", "n": "4", "start": "0", "_shape": [], "dtype": "int64", "_np_random": null}, "n_envs": 16, "n_steps": 4096, "gamma": 0.9917626079449092, "gae_lambda": 0.9646639489615664, "ent_coef": 0.00606441490506668, "vf_coef": 0.5, "max_grad_norm": 0.5, "batch_size": 64, "n_epochs": 10, "clip_range": {":type:": "<class 'function'>", ":serialized:": "gAWVxQIAAAAAAACMF2Nsb3VkcGlja2xlLmNsb3VkcGlja2xllIwOX21ha2VfZnVuY3Rpb26Uk5QoaACMDV9idWlsdGluX3R5cGWUk5SMCENvZGVUeXBllIWUUpQoSwFLAEsASwFLAUsTQwSIAFMAlE6FlCmMAV+UhZSMSS91c3IvbG9jYWwvbGliL3B5dGhvbjMuMTAvZGlzdC1wYWNrYWdlcy9zdGFibGVfYmFzZWxpbmVzMy9jb21tb24vdXRpbHMucHmUjARmdW5jlEuEQwIEAZSMA3ZhbJSFlCl0lFKUfZQojAtfX3BhY2thZ2VfX5SMGHN0YWJsZV9iYXNlbGluZXMzLmNvbW1vbpSMCF9fbmFtZV9flIwec3RhYmxlX2Jhc2VsaW5lczMuY29tbW9uLnV0aWxzlIwIX19maWxlX1+UjEkvdXNyL2xvY2FsL2xpYi9weXRob24zLjEwL2Rpc3QtcGFja2FnZXMvc3RhYmxlX2Jhc2VsaW5lczMvY29tbW9uL3V0aWxzLnB5lHVOTmgAjBBfbWFrZV9lbXB0eV9jZWxslJOUKVKUhZR0lFKUjBxjbG91ZHBpY2tsZS5jbG91ZHBpY2tsZV9mYXN0lIwSX2Z1bmN0aW9uX3NldHN0YXRllJOUaB99lH2UKGgWaA2MDF9fcXVhbG5hbWVfX5SMGWNvbnN0YW50X2ZuLjxsb2NhbHM+LmZ1bmOUjA9fX2Fubm90YXRpb25zX1+UfZSMDl9fa3dkZWZhdWx0c19flE6MDF9fZGVmYXVsdHNfX5ROjApfX21vZHVsZV9flGgXjAdfX2RvY19flE6MC19fY2xvc3VyZV9flGgAjApfbWFrZV9jZWxslJOURz/JmZmZmZmahZRSlIWUjBdfY2xvdWRwaWNrbGVfc3VibW9kdWxlc5RdlIwLX19nbG9iYWxzX1+UfZR1hpSGUjAu"}, "clip_range_vf": null, "normalize_advantage": true, "target_kl": null, "lr_schedule": {":type:": "<class 'function'>", ":serialized:": "gAWVxQIAAAAAAACMF2Nsb3VkcGlja2xlLmNsb3VkcGlja2xllIwOX21ha2VfZnVuY3Rpb26Uk5QoaACMDV9idWlsdGluX3R5cGWUk5SMCENvZGVUeXBllIWUUpQoSwFLAEsASwFLAUsTQwSIAFMAlE6FlCmMAV+UhZSMSS91c3IvbG9jYWwvbGliL3B5dGhvbjMuMTAvZGlzdC1wYWNrYWdlcy9zdGFibGVfYmFzZWxpbmVzMy9jb21tb24vdXRpbHMucHmUjARmdW5jlEuEQwIEAZSMA3ZhbJSFlCl0lFKUfZQojAtfX3BhY2thZ2VfX5SMGHN0YWJsZV9iYXNlbGluZXMzLmNvbW1vbpSMCF9fbmFtZV9flIwec3RhYmxlX2Jhc2VsaW5lczMuY29tbW9uLnV0aWxzlIwIX19maWxlX1+UjEkvdXNyL2xvY2FsL2xpYi9weXRob24zLjEwL2Rpc3QtcGFja2FnZXMvc3RhYmxlX2Jhc2VsaW5lczMvY29tbW9uL3V0aWxzLnB5lHVOTmgAjBBfbWFrZV9lbXB0eV9jZWxslJOUKVKUhZR0lFKUjBxjbG91ZHBpY2tsZS5jbG91ZHBpY2tsZV9mYXN0lIwSX2Z1bmN0aW9uX3NldHN0YXRllJOUaB99lH2UKGgWaA2MDF9fcXVhbG5hbWVfX5SMGWNvbnN0YW50X2ZuLjxsb2NhbHM+LmZ1bmOUjA9fX2Fubm90YXRpb25zX1+UfZSMDl9fa3dkZWZhdWx0c19flE6MDF9fZGVmYXVsdHNfX5ROjApfX21vZHVsZV9flGgXjAdfX2RvY19flE6MC19fY2xvc3VyZV9flGgAjApfbWFrZV9jZWxslJOURz8zqSowVTJhhZRSlIWUjBdfY2xvdWRwaWNrbGVfc3VibW9kdWxlc5RdlIwLX19nbG9iYWxzX1+UfZR1hpSGUjAu"}, "system_info": {"OS": "Linux-5.15.109+-x86_64-with-glibc2.35 # 1 SMP Fri Jun 9 10:57:30 UTC 2023", "Python": "3.10.6", "Stable-Baselines3": "2.0.0a5", "PyTorch": "2.0.1+cu118", "GPU Enabled": "True", "Numpy": "1.22.4", "Cloudpickle": "2.2.1", "Gymnasium": "0.28.1", "OpenAI Gym": "0.25.2"}}
|
ppo-LunarLander-v2.zip
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 146664
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:ca391b1c835be79689e79040f7e0e24f26174265ff8fcfc29725559a30460cde
|
| 3 |
size 146664
|
ppo-LunarLander-v2/data
CHANGED
|
@@ -4,34 +4,34 @@
|
|
| 4 |
":serialized:": "gAWVOwAAAAAAAACMIXN0YWJsZV9iYXNlbGluZXMzLmNvbW1vbi5wb2xpY2llc5SMEUFjdG9yQ3JpdGljUG9saWN5lJOULg==",
|
| 5 |
"__module__": "stable_baselines3.common.policies",
|
| 6 |
"__doc__": "\n Policy class for actor-critic algorithms (has both policy and value prediction).\n Used by A2C, PPO and the likes.\n\n :param observation_space: Observation space\n :param action_space: Action space\n :param lr_schedule: Learning rate schedule (could be constant)\n :param net_arch: The specification of the policy and value networks.\n :param activation_fn: Activation function\n :param ortho_init: Whether to use or not orthogonal initialization\n :param use_sde: Whether to use State Dependent Exploration or not\n :param log_std_init: Initial value for the log standard deviation\n :param full_std: Whether to use (n_features x n_actions) parameters\n for the std instead of only (n_features,) when using gSDE\n :param use_expln: Use ``expln()`` function instead of ``exp()`` to ensure\n a positive standard deviation (cf paper). It allows to keep variance\n above zero and prevent it from growing too fast. In practice, ``exp()`` is usually enough.\n :param squash_output: Whether to squash the output using a tanh function,\n this allows to ensure boundaries when using gSDE.\n :param features_extractor_class: Features extractor to use.\n :param features_extractor_kwargs: Keyword arguments\n to pass to the features extractor.\n :param share_features_extractor: If True, the features extractor is shared between the policy and value networks.\n :param normalize_images: Whether to normalize images or not,\n dividing by 255.0 (True by default)\n :param optimizer_class: The optimizer to use,\n ``th.optim.Adam`` by default\n :param optimizer_kwargs: Additional keyword arguments,\n excluding the learning rate, to pass to the optimizer\n ",
|
| 7 |
-
"__init__": "<function ActorCriticPolicy.__init__ at
|
| 8 |
-
"_get_constructor_parameters": "<function ActorCriticPolicy._get_constructor_parameters at
|
| 9 |
-
"reset_noise": "<function ActorCriticPolicy.reset_noise at
|
| 10 |
-
"_build_mlp_extractor": "<function ActorCriticPolicy._build_mlp_extractor at
|
| 11 |
-
"_build": "<function ActorCriticPolicy._build at
|
| 12 |
-
"forward": "<function ActorCriticPolicy.forward at
|
| 13 |
-
"extract_features": "<function ActorCriticPolicy.extract_features at
|
| 14 |
-
"_get_action_dist_from_latent": "<function ActorCriticPolicy._get_action_dist_from_latent at
|
| 15 |
-
"_predict": "<function ActorCriticPolicy._predict at
|
| 16 |
-
"evaluate_actions": "<function ActorCriticPolicy.evaluate_actions at
|
| 17 |
-
"get_distribution": "<function ActorCriticPolicy.get_distribution at
|
| 18 |
-
"predict_values": "<function ActorCriticPolicy.predict_values at
|
| 19 |
"__abstractmethods__": "frozenset()",
|
| 20 |
-
"_abc_impl": "<_abc._abc_data object at
|
| 21 |
},
|
| 22 |
"verbose": 1,
|
| 23 |
"policy_kwargs": {},
|
| 24 |
-
"num_timesteps":
|
| 25 |
-
"_total_timesteps":
|
| 26 |
"_num_timesteps_at_start": 0,
|
| 27 |
"seed": null,
|
| 28 |
"action_noise": null,
|
| 29 |
-
"start_time":
|
| 30 |
"learning_rate": 0.0003,
|
| 31 |
"tensorboard_log": null,
|
| 32 |
"_last_obs": {
|
| 33 |
":type:": "<class 'numpy.ndarray'>",
|
| 34 |
-
":serialized:": "
|
| 35 |
},
|
| 36 |
"_last_episode_starts": {
|
| 37 |
":type:": "<class 'numpy.ndarray'>",
|
|
@@ -41,17 +41,17 @@
|
|
| 41 |
"_episode_num": 0,
|
| 42 |
"use_sde": false,
|
| 43 |
"sde_sample_freq": -1,
|
| 44 |
-
"_current_progress_remaining": -0.
|
| 45 |
"_stats_window_size": 100,
|
| 46 |
"ep_info_buffer": {
|
| 47 |
":type:": "<class 'collections.deque'>",
|
| 48 |
-
":serialized:": "
|
| 49 |
},
|
| 50 |
"ep_success_buffer": {
|
| 51 |
":type:": "<class 'collections.deque'>",
|
| 52 |
":serialized:": "gAWVIAAAAAAAAACMC2NvbGxlY3Rpb25zlIwFZGVxdWWUk5QpS2SGlFKULg=="
|
| 53 |
},
|
| 54 |
-
"_n_updates":
|
| 55 |
"observation_space": {
|
| 56 |
":type:": "<class 'gymnasium.spaces.box.Box'>",
|
| 57 |
":serialized:": "gAWVcAIAAAAAAACMFGd5bW5hc2l1bS5zcGFjZXMuYm94lIwDQm94lJOUKYGUfZQojAVkdHlwZZSMBW51bXB5lGgFk5SMAmY0lImIh5RSlChLA4wBPJROTk5K/////0r/////SwB0lGKMDWJvdW5kZWRfYmVsb3eUjBJudW1weS5jb3JlLm51bWVyaWOUjAtfZnJvbWJ1ZmZlcpSTlCiWCAAAAAAAAAABAQEBAQEBAZRoB4wCYjGUiYiHlFKUKEsDjAF8lE5OTkr/////Sv////9LAHSUYksIhZSMAUOUdJRSlIwNYm91bmRlZF9hYm92ZZRoECiWCAAAAAAAAAABAQEBAQEBAZRoFEsIhZRoGHSUUpSMBl9zaGFwZZRLCIWUjANsb3eUaBAoliAAAAAAAAAAAAC0wgAAtMIAAKDAAACgwNsPScAAAKDAAAAAgAAAAICUaApLCIWUaBh0lFKUjARoaWdolGgQKJYgAAAAAAAAAAAAtEIAALRCAACgQAAAoEDbD0lAAACgQAAAgD8AAIA/lGgKSwiFlGgYdJRSlIwIbG93X3JlcHKUjFtbLTkwLiAgICAgICAgLTkwLiAgICAgICAgIC01LiAgICAgICAgIC01LiAgICAgICAgIC0zLjE0MTU5MjcgIC01LgogIC0wLiAgICAgICAgIC0wLiAgICAgICBdlIwJaGlnaF9yZXBylIxTWzkwLiAgICAgICAgOTAuICAgICAgICAgNS4gICAgICAgICA1LiAgICAgICAgIDMuMTQxNTkyNyAgNS4KICAxLiAgICAgICAgIDEuICAgICAgIF2UjApfbnBfcmFuZG9tlE51Yi4=",
|
|
@@ -78,13 +78,13 @@
|
|
| 78 |
},
|
| 79 |
"n_envs": 16,
|
| 80 |
"n_steps": 4096,
|
| 81 |
-
"gamma": 0.
|
| 82 |
-
"gae_lambda": 0.
|
| 83 |
-
"ent_coef": 0.
|
| 84 |
"vf_coef": 0.5,
|
| 85 |
"max_grad_norm": 0.5,
|
| 86 |
"batch_size": 64,
|
| 87 |
-
"n_epochs":
|
| 88 |
"clip_range": {
|
| 89 |
":type:": "<class 'function'>",
|
| 90 |
":serialized:": "gAWVxQIAAAAAAACMF2Nsb3VkcGlja2xlLmNsb3VkcGlja2xllIwOX21ha2VfZnVuY3Rpb26Uk5QoaACMDV9idWlsdGluX3R5cGWUk5SMCENvZGVUeXBllIWUUpQoSwFLAEsASwFLAUsTQwSIAFMAlE6FlCmMAV+UhZSMSS91c3IvbG9jYWwvbGliL3B5dGhvbjMuMTAvZGlzdC1wYWNrYWdlcy9zdGFibGVfYmFzZWxpbmVzMy9jb21tb24vdXRpbHMucHmUjARmdW5jlEuEQwIEAZSMA3ZhbJSFlCl0lFKUfZQojAtfX3BhY2thZ2VfX5SMGHN0YWJsZV9iYXNlbGluZXMzLmNvbW1vbpSMCF9fbmFtZV9flIwec3RhYmxlX2Jhc2VsaW5lczMuY29tbW9uLnV0aWxzlIwIX19maWxlX1+UjEkvdXNyL2xvY2FsL2xpYi9weXRob24zLjEwL2Rpc3QtcGFja2FnZXMvc3RhYmxlX2Jhc2VsaW5lczMvY29tbW9uL3V0aWxzLnB5lHVOTmgAjBBfbWFrZV9lbXB0eV9jZWxslJOUKVKUhZR0lFKUjBxjbG91ZHBpY2tsZS5jbG91ZHBpY2tsZV9mYXN0lIwSX2Z1bmN0aW9uX3NldHN0YXRllJOUaB99lH2UKGgWaA2MDF9fcXVhbG5hbWVfX5SMGWNvbnN0YW50X2ZuLjxsb2NhbHM+LmZ1bmOUjA9fX2Fubm90YXRpb25zX1+UfZSMDl9fa3dkZWZhdWx0c19flE6MDF9fZGVmYXVsdHNfX5ROjApfX21vZHVsZV9flGgXjAdfX2RvY19flE6MC19fY2xvc3VyZV9flGgAjApfbWFrZV9jZWxslJOURz/JmZmZmZmahZRSlIWUjBdfY2xvdWRwaWNrbGVfc3VibW9kdWxlc5RdlIwLX19nbG9iYWxzX1+UfZR1hpSGUjAu"
|
|
|
|
| 4 |
":serialized:": "gAWVOwAAAAAAAACMIXN0YWJsZV9iYXNlbGluZXMzLmNvbW1vbi5wb2xpY2llc5SMEUFjdG9yQ3JpdGljUG9saWN5lJOULg==",
|
| 5 |
"__module__": "stable_baselines3.common.policies",
|
| 6 |
"__doc__": "\n Policy class for actor-critic algorithms (has both policy and value prediction).\n Used by A2C, PPO and the likes.\n\n :param observation_space: Observation space\n :param action_space: Action space\n :param lr_schedule: Learning rate schedule (could be constant)\n :param net_arch: The specification of the policy and value networks.\n :param activation_fn: Activation function\n :param ortho_init: Whether to use or not orthogonal initialization\n :param use_sde: Whether to use State Dependent Exploration or not\n :param log_std_init: Initial value for the log standard deviation\n :param full_std: Whether to use (n_features x n_actions) parameters\n for the std instead of only (n_features,) when using gSDE\n :param use_expln: Use ``expln()`` function instead of ``exp()`` to ensure\n a positive standard deviation (cf paper). It allows to keep variance\n above zero and prevent it from growing too fast. In practice, ``exp()`` is usually enough.\n :param squash_output: Whether to squash the output using a tanh function,\n this allows to ensure boundaries when using gSDE.\n :param features_extractor_class: Features extractor to use.\n :param features_extractor_kwargs: Keyword arguments\n to pass to the features extractor.\n :param share_features_extractor: If True, the features extractor is shared between the policy and value networks.\n :param normalize_images: Whether to normalize images or not,\n dividing by 255.0 (True by default)\n :param optimizer_class: The optimizer to use,\n ``th.optim.Adam`` by default\n :param optimizer_kwargs: Additional keyword arguments,\n excluding the learning rate, to pass to the optimizer\n ",
|
| 7 |
+
"__init__": "<function ActorCriticPolicy.__init__ at 0x7f7be8202a70>",
|
| 8 |
+
"_get_constructor_parameters": "<function ActorCriticPolicy._get_constructor_parameters at 0x7f7be8202b00>",
|
| 9 |
+
"reset_noise": "<function ActorCriticPolicy.reset_noise at 0x7f7be8202b90>",
|
| 10 |
+
"_build_mlp_extractor": "<function ActorCriticPolicy._build_mlp_extractor at 0x7f7be8202c20>",
|
| 11 |
+
"_build": "<function ActorCriticPolicy._build at 0x7f7be8202cb0>",
|
| 12 |
+
"forward": "<function ActorCriticPolicy.forward at 0x7f7be8202d40>",
|
| 13 |
+
"extract_features": "<function ActorCriticPolicy.extract_features at 0x7f7be8202dd0>",
|
| 14 |
+
"_get_action_dist_from_latent": "<function ActorCriticPolicy._get_action_dist_from_latent at 0x7f7be8202e60>",
|
| 15 |
+
"_predict": "<function ActorCriticPolicy._predict at 0x7f7be8202ef0>",
|
| 16 |
+
"evaluate_actions": "<function ActorCriticPolicy.evaluate_actions at 0x7f7be8202f80>",
|
| 17 |
+
"get_distribution": "<function ActorCriticPolicy.get_distribution at 0x7f7be8203010>",
|
| 18 |
+
"predict_values": "<function ActorCriticPolicy.predict_values at 0x7f7be82030a0>",
|
| 19 |
"__abstractmethods__": "frozenset()",
|
| 20 |
+
"_abc_impl": "<_abc._abc_data object at 0x7f7be820c780>"
|
| 21 |
},
|
| 22 |
"verbose": 1,
|
| 23 |
"policy_kwargs": {},
|
| 24 |
+
"num_timesteps": 6029312,
|
| 25 |
+
"_total_timesteps": 6000000,
|
| 26 |
"_num_timesteps_at_start": 0,
|
| 27 |
"seed": null,
|
| 28 |
"action_noise": null,
|
| 29 |
+
"start_time": 1690313243737686727,
|
| 30 |
"learning_rate": 0.0003,
|
| 31 |
"tensorboard_log": null,
|
| 32 |
"_last_obs": {
|
| 33 |
":type:": "<class 'numpy.ndarray'>",
|
| 34 |
+
":serialized:": "gAWVdQIAAAAAAACMEm51bXB5LmNvcmUubnVtZXJpY5SMC19mcm9tYnVmZmVylJOUKJYAAgAAAAAAAE2js735iqo/iqGcvif+774tLqG9bPkxvgAAAAAAAAAAgOQtvfagcbqtDS24Xiyqskq9+rrx80g3AACAPwAAgD/mwQi+/PFOP073B74622i/pV5gvk054zoAAAAAAAAAAAD/Yz3wUZs/WOmuPsyPRb/zYLQ9thlYPgAAAAAAAAAAszYsPWx8Lz6WPcC8LfQYvxMloz2FrC28AAAAAAAAAAAztka+25OWPlyKmD60k/S+MIhTvstifj4AAAAAAAAAAFp7LT567yI/hSFXvdbMNr9PcpA+iP85vgAAAAAAAAAAmtxoPbRWiz+w0/U9qSJiv0rUyT2dEuc9AAAAAAAAAACaZ/A88bgzPMhbVr7pm6y9O1bmvR06cT8AAIA/AAAAAIDi5r3x8qM9k5DnPl57wL7A36A90GpUPgAAAAAAAAAAzQyaOwrYNbsiNH29/IwEPGZVZrzdH/M8AACAPwAAgD9aErW9id9dPc79VT5H7La+6ppBvfKJIT0AAAAAAAAAAGZX270Nqq0/pamHvkLkCL/qGYS9+YYivgAAAAAAAAAAQNLAvSkIM7pt8ss8pQ7IOwB+ULtKda48AACAPwAAgD+ztim9XMMGuoy/JjR0jdkv+GbgO7UNtLMAAIA/AACAP3PY+71MrJ8/cPInv4dOJL+5yvu9TMLEvgAAAAAAAAAAlIwFbnVtcHmUjAVkdHlwZZSTlIwCZjSUiYiHlFKUKEsDjAE8lE5OTkr/////Sv////9LAHSUYksQSwiGlIwBQ5R0lFKULg=="
|
| 35 |
},
|
| 36 |
"_last_episode_starts": {
|
| 37 |
":type:": "<class 'numpy.ndarray'>",
|
|
|
|
| 41 |
"_episode_num": 0,
|
| 42 |
"use_sde": false,
|
| 43 |
"sde_sample_freq": -1,
|
| 44 |
+
"_current_progress_remaining": -0.004885333333333408,
|
| 45 |
"_stats_window_size": 100,
|
| 46 |
"ep_info_buffer": {
|
| 47 |
":type:": "<class 'collections.deque'>",
|
| 48 |
+
":serialized:": "gAWV4AsAAAAAAACMC2NvbGxlY3Rpb25zlIwFZGVxdWWUk5QpS2SGlFKUKH2UKIwBcpRHQHKlF/QSi/SMAWyUS92MAXSUR0C5UEIRVZLadX2UKGgGR0ByhnpX6qKhaAdLn2gIR0C5UFq3VkMDdX2UKGgGR0Bzuw2zfJmvaAdLyWgIR0C5UGzYEnstdX2UKGgGR0BwOsd92HLzaAdLkGgIR0C5UHGdRR/FdX2UKGgGR0ByTRtXPqs2aAdLrWgIR0C5UIQLiMo+dX2UKGgGR0BzR/rcCYCyaAdLzWgIR0C5UKYA0bcXdX2UKGgGR0Byixlbu+h5aAdLiGgIR0C5ULGykbgkdX2UKGgGR0A98HJtBOYZaAdLX2gIR0C5ULw+Y+jedX2UKGgGR0BzgHd1uBMBaAdLrGgIR0C5UL9vbXYldX2UKGgGR0ByLnV9Wp6yaAdLs2gIR0C5UMORYA80dX2UKGgGR0By22iRGMGYaAdLr2gIR0C5UNm5Yoy9dX2UKGgGR0BybN1jiGWVaAdLm2gIR0C5UNk7nxJ/dX2UKGgGR0Bx3YgJTl1baAdLsmgIR0C5UNuFpPAPdX2UKGgGR0Bw6lXGOuJUaAdLlGgIR0C5UQSEQGwBdX2UKGgGR0ByXC704BFNaAdLu2gIR0C5URUUKzAvdX2UKGgGR0BynzuF6AvtaAdLnGgIR0C5URRKtga4dX2UKGgGR0ByeXf0mMOxaAdLq2gIR0C5URptvXK9dX2UKGgGR0BxASPKdQO4aAdLl2gIR0C5USx0lqrSdX2UKGgGR0BzBZIg/1QJaAdLomgIR0C5USq+evpydX2UKGgGR0BxKE96kZaWaAdLpGgIR0C5UTb9MsYmdX2UKGgGR0BxJmarmyPdaAdLqGgIR0C5UUpcgQpXdX2UKGgGR0Bz2PyiEg4faAdLlWgIR0C5UU3ssxwidX2UKGgGR0ByHsMy8BdVaAdLpmgIR0C5UWvYvnKXdX2UKGgGR0BwuD6hxo7FaAdLnWgIR0C5UW+NkvsadX2UKGgGR0ByLjaews5GaAdLoWgIR0C5UXgcDKYBdX2UKGgGR0BzvnktEofCaAdLp2gIR0C5UXf3JxNqdX2UKGgGR0BxhxwuM+/yaAdLoGgIR0C5UYxNmDlHdX2UKGgGR0ByKkAYHgP3aAdLsGgIR0C5UaPLDAJtdX2UKGgGR0BzoZfICEHuaAdLvWgIR0C5UbZWV/tqdX2UKGgGR0BzSLm0VrRCaAdLnWgIR0C5UdHB+F10dX2UKGgGR0Bz93KdQO4HaAdLs2gIR0C5UdyIcinpdX2UKGgGR0Bzeq48U21laAdLpWgIR0C5UfRnvlU7dX2UKGgGR0By2BwKjSG8aAdLv2gIR0C5UfzLOiWWdX2UKGgGR0By7ayB06o3aAdLpGgIR0C5UgBMvh60dX2UKGgGR0BzeyoVEd/8aAdLlmgIR0C5UgduLrHEdX2UKGgGR0BzhaOn2qT9aAdLxWgIR0C5UgldxAB1dX2UKGgGR0B0WmGpMpPRaAdLxWgIR0C5UhrMHKOldX2UKGgGR0ByOvGEPDpDaAdLs2gIR0C5UiUpqh11dX2UKGgGR0Bw/95HEuQIaAdLi2gIR0C5UiQZ88cNdX2UKGgGR0B0AiB4D9wWaAdLnGgIR0C5Uje+Eh7mdX2UKGgGR0BxTVjFyaNNaAdLpmgIR0C5UjgC0WuYdX2UKGgGR0Bx/LEBKcuraAdLpmgIR0C5UlgZsKsudX2UKGgGR0By0BQxesxPaAdLwWgIR0C5Ulk9ZA6ddX2UKGgGR0ByZZqmCROlaAdLp2gIR0C5Ums1baAXdX2UKGgGR0BxdO9ytFKDaAdLiWgIR0C5UnwlF+d9dX2UKGgGR0BzszoePq9oaAdLsGgIR0C5UohMSK3vdX2UKGgGR0BK8ZxiobXIaAdLYWgIR0C5Uot4RmK7dX2UKGgGR0Byt8oYvWYnaAdLoWgIR0C5Uq6rJbMYdX2UKGgGR0BzNp/mT1TSaAdLmWgIR0C5UrFMZgogdX2UKGgGR0Bx6fIfbKzSaAdLnmgIR0C5UrPzBhx6dX2UKGgGR0BzfoQvpQk5aAdLwWgIR0C5UrRIFvAHdX2UKGgGR0BxDkAhje9BaAdLiWgIR0C5UsGygPEsdX2UKGgGR0By3jfcer+6aAdLrGgIR0C5UszPrv9cdX2UKGgGR0Bzi8UFjd56aAdLuGgIR0C5UttTkyULdX2UKGgGR0BxwbxhDw6RaAdLo2gIR0C5Ut9vGZNPdX2UKGgGR0BwpnOE/SpjaAdLmmgIR0C5UuZ8WsRydX2UKGgGR0BwR1W6shgWaAdLiWgIR0C5UvMjiXIEdX2UKGgGR0BwXrzasZHeaAdLpmgIR0C5UvPrGBFvdX2UKGgGR0BxBnrSmZVoaAdLmGgIR0C5UwRHkLhKdX2UKGgGR0Bv96r5qM3qaAdLmmgIR0C5Uxd5Y5ktdX2UKGgGR0BwWggq3EydaAdLnWgIR0C5UzTAzpHJdX2UKGgGR0BygQjIJZ4faAdLqGgIR0C5UzW/rSmZdX2UKGgGR0BwwNHSWqtHaAdLnmgIR0C5UzjvE0iydX2UKGgGR0BxrsEHMUypaAdLgGgIR0C5Uz31OCXhdX2UKGgGR0Bx9nrLQokSaAdLpWgIR0C5U2ExM36zdX2UKGgGR0BxoGaAnUlSaAdLpmgIR0C5U2QsCkoGdX2UKGgGR0ByKwtmL9/CaAdLr2gIR0C5U3B9XtBwdX2UKGgGR0ByBpVea8YiaAdLi2gIR0C5U3Un1FpgdX2UKGgGR0BxTQf3evZAaAdLnGgIR0C5U3UVJtiydX2UKGgGR0BytH/FR51OaAdLhWgIR0C5U3cqvvBrdX2UKGgGR0BzNXnGKhtcaAdLp2gIR0C5U3fBN21VdX2UKGgGR0BvbxDArQPaaAdLlGgIR0C5U5IigTRIdX2UKGgGR0ByRdiMHbAUaAdLtWgIR0C5U51Bt1p1dX2UKGgGR0Bwc9zcRDkVaAdLmGgIR0C5U6czEaVEdX2UKGgGR0ByacOTaCcxaAdLs2gIR0C5U7PugHu7dX2UKGgGR0B0M97JGOMmaAdLtWgIR0C5U97NbC79dX2UKGgGR0BxX0mlZX+3aAdLm2gIR0C5U+OgctGvdX2UKGgGR0BxWxI5HVgAaAdLsWgIR0C5U/n8O09hdX2UKGgGR0ByAuEIw/PgaAdLsGgIR0C5VAFvIfbLdX2UKGgGR0Bz/zpu/DceaAdLvWgIR0C5VAbiIciodX2UKGgGR0BxM8/7iyY5aAdLhGgIR0C5VApu63AmdX2UKGgGR0Byo+VJL/S6aAdLnWgIR0C5VBB7mdRSdX2UKGgGR0Bzk0UO/cnFaAdLlWgIR0C5VBy8jAzpdX2UKGgGR0BybbBi1AqvaAdLmmgIR0C5VB3BciW3dX2UKGgGR0BzelzbN8mbaAdLnWgIR0C5VCUjcEeRdX2UKGgGR0ByF962OQyRaAdLqmgIR0C5VCJ4nndPdX2UKGgGR0BwXaGFi8WcaAdLsWgIR0C5VDm6bvw3dX2UKGgGR0BxUjbItDlYaAdLmGgIR0C5VEdrKvFFdX2UKGgGR0ByU22SdOIqaAdLuWgIR0C5VGJ8WsRydX2UKGgGR0Bw+id5IH1OaAdLqmgIR0C5VGhGpda/dX2UKGgGR0BxhCW4Vh1DaAdLn2gIR0C5VGk+C9RKdX2UKGgGR0BwN+Y/mknDaAdLlmgIR0C5VIhLoOhCdX2UKGgGR0BxbppztCzDaAdLiWgIR0C5VJRPO6d2dX2UKGgGR0Bx4IymALApaAdLgWgIR0C5VJvVAiV0dX2UKGgGR0BylnPJJXhgaAdLf2gIR0C5VKztsvZidX2UKGgGR0ByGwbp/wy7aAdLhmgIR0C5VLcLv1DjdX2UKGgGR0BzmClhw2l3aAdLo2gIR0C5VLvDxb0OdX2UKGgGR0B0KA+s5n14aAdLyWgIR0C5VMljy4FzdX2UKGgGR0BwrrX05EMLaAdLmGgIR0C5VNAXMyJsdX2UKGgGR0ByjKfpUxVRaAdLtWgIR0C5VNSEtdzGdWUu"
|
| 49 |
},
|
| 50 |
"ep_success_buffer": {
|
| 51 |
":type:": "<class 'collections.deque'>",
|
| 52 |
":serialized:": "gAWVIAAAAAAAAACMC2NvbGxlY3Rpb25zlIwFZGVxdWWUk5QpS2SGlFKULg=="
|
| 53 |
},
|
| 54 |
+
"_n_updates": 920,
|
| 55 |
"observation_space": {
|
| 56 |
":type:": "<class 'gymnasium.spaces.box.Box'>",
|
| 57 |
":serialized:": "gAWVcAIAAAAAAACMFGd5bW5hc2l1bS5zcGFjZXMuYm94lIwDQm94lJOUKYGUfZQojAVkdHlwZZSMBW51bXB5lGgFk5SMAmY0lImIh5RSlChLA4wBPJROTk5K/////0r/////SwB0lGKMDWJvdW5kZWRfYmVsb3eUjBJudW1weS5jb3JlLm51bWVyaWOUjAtfZnJvbWJ1ZmZlcpSTlCiWCAAAAAAAAAABAQEBAQEBAZRoB4wCYjGUiYiHlFKUKEsDjAF8lE5OTkr/////Sv////9LAHSUYksIhZSMAUOUdJRSlIwNYm91bmRlZF9hYm92ZZRoECiWCAAAAAAAAAABAQEBAQEBAZRoFEsIhZRoGHSUUpSMBl9zaGFwZZRLCIWUjANsb3eUaBAoliAAAAAAAAAAAAC0wgAAtMIAAKDAAACgwNsPScAAAKDAAAAAgAAAAICUaApLCIWUaBh0lFKUjARoaWdolGgQKJYgAAAAAAAAAAAAtEIAALRCAACgQAAAoEDbD0lAAACgQAAAgD8AAIA/lGgKSwiFlGgYdJRSlIwIbG93X3JlcHKUjFtbLTkwLiAgICAgICAgLTkwLiAgICAgICAgIC01LiAgICAgICAgIC01LiAgICAgICAgIC0zLjE0MTU5MjcgIC01LgogIC0wLiAgICAgICAgIC0wLiAgICAgICBdlIwJaGlnaF9yZXBylIxTWzkwLiAgICAgICAgOTAuICAgICAgICAgNS4gICAgICAgICA1LiAgICAgICAgIDMuMTQxNTkyNyAgNS4KICAxLiAgICAgICAgIDEuICAgICAgIF2UjApfbnBfcmFuZG9tlE51Yi4=",
|
|
|
|
| 78 |
},
|
| 79 |
"n_envs": 16,
|
| 80 |
"n_steps": 4096,
|
| 81 |
+
"gamma": 0.9917626079449092,
|
| 82 |
+
"gae_lambda": 0.9646639489615664,
|
| 83 |
+
"ent_coef": 0.00606441490506668,
|
| 84 |
"vf_coef": 0.5,
|
| 85 |
"max_grad_norm": 0.5,
|
| 86 |
"batch_size": 64,
|
| 87 |
+
"n_epochs": 10,
|
| 88 |
"clip_range": {
|
| 89 |
":type:": "<class 'function'>",
|
| 90 |
":serialized:": "gAWVxQIAAAAAAACMF2Nsb3VkcGlja2xlLmNsb3VkcGlja2xllIwOX21ha2VfZnVuY3Rpb26Uk5QoaACMDV9idWlsdGluX3R5cGWUk5SMCENvZGVUeXBllIWUUpQoSwFLAEsASwFLAUsTQwSIAFMAlE6FlCmMAV+UhZSMSS91c3IvbG9jYWwvbGliL3B5dGhvbjMuMTAvZGlzdC1wYWNrYWdlcy9zdGFibGVfYmFzZWxpbmVzMy9jb21tb24vdXRpbHMucHmUjARmdW5jlEuEQwIEAZSMA3ZhbJSFlCl0lFKUfZQojAtfX3BhY2thZ2VfX5SMGHN0YWJsZV9iYXNlbGluZXMzLmNvbW1vbpSMCF9fbmFtZV9flIwec3RhYmxlX2Jhc2VsaW5lczMuY29tbW9uLnV0aWxzlIwIX19maWxlX1+UjEkvdXNyL2xvY2FsL2xpYi9weXRob24zLjEwL2Rpc3QtcGFja2FnZXMvc3RhYmxlX2Jhc2VsaW5lczMvY29tbW9uL3V0aWxzLnB5lHVOTmgAjBBfbWFrZV9lbXB0eV9jZWxslJOUKVKUhZR0lFKUjBxjbG91ZHBpY2tsZS5jbG91ZHBpY2tsZV9mYXN0lIwSX2Z1bmN0aW9uX3NldHN0YXRllJOUaB99lH2UKGgWaA2MDF9fcXVhbG5hbWVfX5SMGWNvbnN0YW50X2ZuLjxsb2NhbHM+LmZ1bmOUjA9fX2Fubm90YXRpb25zX1+UfZSMDl9fa3dkZWZhdWx0c19flE6MDF9fZGVmYXVsdHNfX5ROjApfX21vZHVsZV9flGgXjAdfX2RvY19flE6MC19fY2xvc3VyZV9flGgAjApfbWFrZV9jZWxslJOURz/JmZmZmZmahZRSlIWUjBdfY2xvdWRwaWNrbGVfc3VibW9kdWxlc5RdlIwLX19nbG9iYWxzX1+UfZR1hpSGUjAu"
|
ppo-LunarLander-v2/policy.optimizer.pth
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 87929
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:ca6d9130895f6904dfda444f91dfbf8421da8d56c932f67c9016f0bf5606d1ee
|
| 3 |
size 87929
|
ppo-LunarLander-v2/policy.pth
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 43329
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:2466cb7314128898643eafb6611397f04614d1a7c3a93bb7153d35c63d4a3dce
|
| 3 |
size 43329
|
replay.mp4
CHANGED
|
Binary files a/replay.mp4 and b/replay.mp4 differ
|
|
|
results.json
CHANGED
|
@@ -1 +1 @@
|
|
| 1 |
-
{"mean_reward":
|
|
|
|
| 1 |
+
{"mean_reward": 292.0318324753425, "std_reward": 14.787519524814575, "is_deterministic": true, "n_eval_episodes": 10, "eval_datetime": "2023-07-25T21:15:05.129483"}
|