aidenlee committed on
Commit
fd9fc9a
·
1 Parent(s): 82cfc7f
README.md CHANGED
@@ -16,7 +16,7 @@ model-index:
16
  type: LunarLander-v2
17
  metrics:
18
  - type: mean_reward
19
- value: -311.75 +/- 143.84
20
  name: mean_reward
21
  verified: false
22
  ---
 
16
  type: LunarLander-v2
17
  metrics:
18
  - type: mean_reward
19
+ value: -47.08 +/- 134.68
20
  name: mean_reward
21
  verified: false
22
  ---
config.json CHANGED
@@ -1 +1 @@
1
- {"policy_class": {":type:": "<class 'abc.ABCMeta'>", ":serialized:": "gAWVOwAAAAAAAACMIXN0YWJsZV9iYXNlbGluZXMzLmNvbW1vbi5wb2xpY2llc5SMEUFjdG9yQ3JpdGljUG9saWN5lJOULg==", "__module__": "stable_baselines3.common.policies", "__doc__": "\n Policy class for actor-critic algorithms (has both policy and value prediction).\n Used by A2C, PPO and the likes.\n\n :param observation_space: Observation space\n :param action_space: Action space\n :param lr_schedule: Learning rate schedule (could be constant)\n :param net_arch: The specification of the policy and value networks.\n :param activation_fn: Activation function\n :param ortho_init: Whether to use or not orthogonal initialization\n :param use_sde: Whether to use State Dependent Exploration or not\n :param log_std_init: Initial value for the log standard deviation\n :param full_std: Whether to use (n_features x n_actions) parameters\n for the std instead of only (n_features,) when using gSDE\n :param use_expln: Use ``expln()`` function instead of ``exp()`` to ensure\n a positive standard deviation (cf paper). It allows to keep variance\n above zero and prevent it from growing too fast. 
In practice, ``exp()`` is usually enough.\n :param squash_output: Whether to squash the output using a tanh function,\n this allows to ensure boundaries when using gSDE.\n :param features_extractor_class: Features extractor to use.\n :param features_extractor_kwargs: Keyword arguments\n to pass to the features extractor.\n :param share_features_extractor: If True, the features extractor is shared between the policy and value networks.\n :param normalize_images: Whether to normalize images or not,\n dividing by 255.0 (True by default)\n :param optimizer_class: The optimizer to use,\n ``th.optim.Adam`` by default\n :param optimizer_kwargs: Additional keyword arguments,\n excluding the learning rate, to pass to the optimizer\n ", "__init__": "<function ActorCriticPolicy.__init__ at 0x7f36fbd8c3a0>", "_get_constructor_parameters": "<function ActorCriticPolicy._get_constructor_parameters at 0x7f36fbd8c430>", "reset_noise": "<function ActorCriticPolicy.reset_noise at 0x7f36fbd8c4c0>", "_build_mlp_extractor": "<function ActorCriticPolicy._build_mlp_extractor at 0x7f36fbd8c550>", "_build": "<function ActorCriticPolicy._build at 0x7f36fbd8c5e0>", "forward": "<function ActorCriticPolicy.forward at 0x7f36fbd8c670>", "extract_features": "<function ActorCriticPolicy.extract_features at 0x7f36fbd8c700>", "_get_action_dist_from_latent": "<function ActorCriticPolicy._get_action_dist_from_latent at 0x7f36fbd8c790>", "_predict": "<function ActorCriticPolicy._predict at 0x7f36fbd8c820>", "evaluate_actions": "<function ActorCriticPolicy.evaluate_actions at 0x7f36fbd8c8b0>", "get_distribution": "<function ActorCriticPolicy.get_distribution at 0x7f36fbd8c940>", "predict_values": "<function ActorCriticPolicy.predict_values at 0x7f36fbd8c9d0>", "__abstractmethods__": "frozenset()", "_abc_impl": "<_abc._abc_data object at 0x7f36fbd90a80>"}, "verbose": 1, "policy_kwargs": {}, "observation_space": {":type:": "<class 'gym.spaces.box.Box'>", ":serialized:": 
"gAWVnwEAAAAAAACMDmd5bS5zcGFjZXMuYm94lIwDQm94lJOUKYGUfZQojAVkdHlwZZSMBW51bXB5lGgFk5SMAmY0lImIh5RSlChLA4wBPJROTk5K/////0r/////SwB0lGKMBl9zaGFwZZRLCIWUjANsb3eUjBJudW1weS5jb3JlLm51bWVyaWOUjAtfZnJvbWJ1ZmZlcpSTlCiWIAAAAAAAAAAAAID/AACA/wAAgP8AAID/AACA/wAAgP8AAID/AACA/5RoCksIhZSMAUOUdJRSlIwEaGlnaJRoEiiWIAAAAAAAAAAAAIB/AACAfwAAgH8AAIB/AACAfwAAgH8AAIB/AACAf5RoCksIhZRoFXSUUpSMDWJvdW5kZWRfYmVsb3eUaBIolggAAAAAAAAAAAAAAAAAAACUaAeMAmIxlImIh5RSlChLA4wBfJROTk5K/////0r/////SwB0lGJLCIWUaBV0lFKUjA1ib3VuZGVkX2Fib3ZllGgSKJYIAAAAAAAAAAAAAAAAAAAAlGghSwiFlGgVdJRSlIwKX25wX3JhbmRvbZROdWIu", "dtype": "float32", "_shape": [8], "low": "[-inf -inf -inf -inf -inf -inf -inf -inf]", "high": "[inf inf inf inf inf inf inf inf]", "bounded_below": "[False False False False False False False False]", "bounded_above": "[False False False False False False False False]", "_np_random": null}, "action_space": {":type:": "<class 'gym.spaces.discrete.Discrete'>", ":serialized:": "gAWVggAAAAAAAACME2d5bS5zcGFjZXMuZGlzY3JldGWUjAhEaXNjcmV0ZZSTlCmBlH2UKIwBbpRLBIwGX3NoYXBllCmMBWR0eXBllIwFbnVtcHmUaAeTlIwCaTiUiYiHlFKUKEsDjAE8lE5OTkr/////Sv////9LAHSUYowKX25wX3JhbmRvbZROdWIu", "n": 4, "_shape": [], "dtype": "int64", "_np_random": null}, "n_envs": 1, "num_timesteps": 0, "_total_timesteps": 0, "_num_timesteps_at_start": 0, "seed": null, "action_noise": null, "start_time": null, "learning_rate": 0.0003, "tensorboard_log": null, "lr_schedule": {":type:": "<class 'function'>", ":serialized:": 
"gAWVwwIAAAAAAACMF2Nsb3VkcGlja2xlLmNsb3VkcGlja2xllIwOX21ha2VfZnVuY3Rpb26Uk5QoaACMDV9idWlsdGluX3R5cGWUk5SMCENvZGVUeXBllIWUUpQoSwFLAEsASwFLAUsTQwSIAFMAlE6FlCmMAV+UhZSMSC91c3IvbG9jYWwvbGliL3B5dGhvbjMuOS9kaXN0LXBhY2thZ2VzL3N0YWJsZV9iYXNlbGluZXMzL2NvbW1vbi91dGlscy5weZSMBGZ1bmOUS4JDAgABlIwDdmFslIWUKXSUUpR9lCiMC19fcGFja2FnZV9flIwYc3RhYmxlX2Jhc2VsaW5lczMuY29tbW9ulIwIX19uYW1lX1+UjB5zdGFibGVfYmFzZWxpbmVzMy5jb21tb24udXRpbHOUjAhfX2ZpbGVfX5SMSC91c3IvbG9jYWwvbGliL3B5dGhvbjMuOS9kaXN0LXBhY2thZ2VzL3N0YWJsZV9iYXNlbGluZXMzL2NvbW1vbi91dGlscy5weZR1Tk5oAIwQX21ha2VfZW1wdHlfY2VsbJSTlClSlIWUdJRSlIwcY2xvdWRwaWNrbGUuY2xvdWRwaWNrbGVfZmFzdJSMEl9mdW5jdGlvbl9zZXRzdGF0ZZSTlGgffZR9lChoFmgNjAxfX3F1YWxuYW1lX1+UjBljb25zdGFudF9mbi48bG9jYWxzPi5mdW5jlIwPX19hbm5vdGF0aW9uc19flH2UjA5fX2t3ZGVmYXVsdHNfX5ROjAxfX2RlZmF1bHRzX1+UTowKX19tb2R1bGVfX5RoF4wHX19kb2NfX5ROjAtfX2Nsb3N1cmVfX5RoAIwKX21ha2VfY2VsbJSTlEc/M6kqMFUyYYWUUpSFlIwXX2Nsb3VkcGlja2xlX3N1Ym1vZHVsZXOUXZSMC19fZ2xvYmFsc19flH2UdYaUhlIwLg=="}, "_last_obs": null, "_last_episode_starts": null, "_last_original_obs": null, "_episode_num": 0, "use_sde": false, "sde_sample_freq": -1, "_current_progress_remaining": 1, "ep_info_buffer": null, "ep_success_buffer": null, "_n_updates": 0, "n_steps": 1024, "gamma": 0.999, "gae_lambda": 0.98, "ent_coef": 0.01, "vf_coef": 0.5, "max_grad_norm": 0.5, "batch_size": 64, "n_epochs": 4, "clip_range": {":type:": "<class 'function'>", ":serialized:": 
"gAWVwwIAAAAAAACMF2Nsb3VkcGlja2xlLmNsb3VkcGlja2xllIwOX21ha2VfZnVuY3Rpb26Uk5QoaACMDV9idWlsdGluX3R5cGWUk5SMCENvZGVUeXBllIWUUpQoSwFLAEsASwFLAUsTQwSIAFMAlE6FlCmMAV+UhZSMSC91c3IvbG9jYWwvbGliL3B5dGhvbjMuOS9kaXN0LXBhY2thZ2VzL3N0YWJsZV9iYXNlbGluZXMzL2NvbW1vbi91dGlscy5weZSMBGZ1bmOUS4JDAgABlIwDdmFslIWUKXSUUpR9lCiMC19fcGFja2FnZV9flIwYc3RhYmxlX2Jhc2VsaW5lczMuY29tbW9ulIwIX19uYW1lX1+UjB5zdGFibGVfYmFzZWxpbmVzMy5jb21tb24udXRpbHOUjAhfX2ZpbGVfX5SMSC91c3IvbG9jYWwvbGliL3B5dGhvbjMuOS9kaXN0LXBhY2thZ2VzL3N0YWJsZV9iYXNlbGluZXMzL2NvbW1vbi91dGlscy5weZR1Tk5oAIwQX21ha2VfZW1wdHlfY2VsbJSTlClSlIWUdJRSlIwcY2xvdWRwaWNrbGUuY2xvdWRwaWNrbGVfZmFzdJSMEl9mdW5jdGlvbl9zZXRzdGF0ZZSTlGgffZR9lChoFmgNjAxfX3F1YWxuYW1lX1+UjBljb25zdGFudF9mbi48bG9jYWxzPi5mdW5jlIwPX19hbm5vdGF0aW9uc19flH2UjA5fX2t3ZGVmYXVsdHNfX5ROjAxfX2RlZmF1bHRzX1+UTowKX19tb2R1bGVfX5RoF4wHX19kb2NfX5ROjAtfX2Nsb3N1cmVfX5RoAIwKX21ha2VfY2VsbJSTlEc/yZmZmZmZmoWUUpSFlIwXX2Nsb3VkcGlja2xlX3N1Ym1vZHVsZXOUXZSMC19fZ2xvYmFsc19flH2UdYaUhlIwLg=="}, "clip_range_vf": null, "normalize_advantage": true, "target_kl": null, "system_info": {"OS": "Linux-5.10.147+-x86_64-with-glibc2.31 # 1 SMP Sat Dec 10 16:00:40 UTC 2022", "Python": "3.9.16", "Stable-Baselines3": "1.7.0", "PyTorch": "1.13.1+cu116", "GPU Enabled": "False", "Numpy": "1.22.4", "Gym": "0.21.0"}}
 
1
+ {"policy_class": {":type:": "<class 'abc.ABCMeta'>", ":serialized:": "gAWVOwAAAAAAAACMIXN0YWJsZV9iYXNlbGluZXMzLmNvbW1vbi5wb2xpY2llc5SMEUFjdG9yQ3JpdGljUG9saWN5lJOULg==", "__module__": "stable_baselines3.common.policies", "__doc__": "\n Policy class for actor-critic algorithms (has both policy and value prediction).\n Used by A2C, PPO and the likes.\n\n :param observation_space: Observation space\n :param action_space: Action space\n :param lr_schedule: Learning rate schedule (could be constant)\n :param net_arch: The specification of the policy and value networks.\n :param activation_fn: Activation function\n :param ortho_init: Whether to use or not orthogonal initialization\n :param use_sde: Whether to use State Dependent Exploration or not\n :param log_std_init: Initial value for the log standard deviation\n :param full_std: Whether to use (n_features x n_actions) parameters\n for the std instead of only (n_features,) when using gSDE\n :param use_expln: Use ``expln()`` function instead of ``exp()`` to ensure\n a positive standard deviation (cf paper). It allows to keep variance\n above zero and prevent it from growing too fast. 
In practice, ``exp()`` is usually enough.\n :param squash_output: Whether to squash the output using a tanh function,\n this allows to ensure boundaries when using gSDE.\n :param features_extractor_class: Features extractor to use.\n :param features_extractor_kwargs: Keyword arguments\n to pass to the features extractor.\n :param share_features_extractor: If True, the features extractor is shared between the policy and value networks.\n :param normalize_images: Whether to normalize images or not,\n dividing by 255.0 (True by default)\n :param optimizer_class: The optimizer to use,\n ``th.optim.Adam`` by default\n :param optimizer_kwargs: Additional keyword arguments,\n excluding the learning rate, to pass to the optimizer\n ", "__init__": "<function ActorCriticPolicy.__init__ at 0x7f36fbd8c3a0>", "_get_constructor_parameters": "<function ActorCriticPolicy._get_constructor_parameters at 0x7f36fbd8c430>", "reset_noise": "<function ActorCriticPolicy.reset_noise at 0x7f36fbd8c4c0>", "_build_mlp_extractor": "<function ActorCriticPolicy._build_mlp_extractor at 0x7f36fbd8c550>", "_build": "<function ActorCriticPolicy._build at 0x7f36fbd8c5e0>", "forward": "<function ActorCriticPolicy.forward at 0x7f36fbd8c670>", "extract_features": "<function ActorCriticPolicy.extract_features at 0x7f36fbd8c700>", "_get_action_dist_from_latent": "<function ActorCriticPolicy._get_action_dist_from_latent at 0x7f36fbd8c790>", "_predict": "<function ActorCriticPolicy._predict at 0x7f36fbd8c820>", "evaluate_actions": "<function ActorCriticPolicy.evaluate_actions at 0x7f36fbd8c8b0>", "get_distribution": "<function ActorCriticPolicy.get_distribution at 0x7f36fbd8c940>", "predict_values": "<function ActorCriticPolicy.predict_values at 0x7f36fbd8c9d0>", "__abstractmethods__": "frozenset()", "_abc_impl": "<_abc._abc_data object at 0x7f36fbd90a80>"}, "verbose": 1, "policy_kwargs": {}, "observation_space": {":type:": "<class 'gym.spaces.box.Box'>", ":serialized:": 
"gAWVnwEAAAAAAACMDmd5bS5zcGFjZXMuYm94lIwDQm94lJOUKYGUfZQojAVkdHlwZZSMBW51bXB5lGgFk5SMAmY0lImIh5RSlChLA4wBPJROTk5K/////0r/////SwB0lGKMBl9zaGFwZZRLCIWUjANsb3eUjBJudW1weS5jb3JlLm51bWVyaWOUjAtfZnJvbWJ1ZmZlcpSTlCiWIAAAAAAAAAAAAID/AACA/wAAgP8AAID/AACA/wAAgP8AAID/AACA/5RoCksIhZSMAUOUdJRSlIwEaGlnaJRoEiiWIAAAAAAAAAAAAIB/AACAfwAAgH8AAIB/AACAfwAAgH8AAIB/AACAf5RoCksIhZRoFXSUUpSMDWJvdW5kZWRfYmVsb3eUaBIolggAAAAAAAAAAAAAAAAAAACUaAeMAmIxlImIh5RSlChLA4wBfJROTk5K/////0r/////SwB0lGJLCIWUaBV0lFKUjA1ib3VuZGVkX2Fib3ZllGgSKJYIAAAAAAAAAAAAAAAAAAAAlGghSwiFlGgVdJRSlIwKX25wX3JhbmRvbZROdWIu", "dtype": "float32", "_shape": [8], "low": "[-inf -inf -inf -inf -inf -inf -inf -inf]", "high": "[inf inf inf inf inf inf inf inf]", "bounded_below": "[False False False False False False False False]", "bounded_above": "[False False False False False False False False]", "_np_random": null}, "action_space": {":type:": "<class 'gym.spaces.discrete.Discrete'>", ":serialized:": "gAWVggAAAAAAAACME2d5bS5zcGFjZXMuZGlzY3JldGWUjAhEaXNjcmV0ZZSTlCmBlH2UKIwBbpRLBIwGX3NoYXBllCmMBWR0eXBllIwFbnVtcHmUaAeTlIwCaTiUiYiHlFKUKEsDjAE8lE5OTkr/////Sv////9LAHSUYowKX25wX3JhbmRvbZROdWIu", "n": 4, "_shape": [], "dtype": "int64", "_np_random": null}, "n_envs": 1, "num_timesteps": 100352, "_total_timesteps": 100000.0, "_num_timesteps_at_start": 0, "seed": null, "action_noise": null, "start_time": 1679408570305682247, "learning_rate": 0.0003, "tensorboard_log": null, "lr_schedule": {":type:": "<class 'function'>", ":serialized:": 
"gAWVwwIAAAAAAACMF2Nsb3VkcGlja2xlLmNsb3VkcGlja2xllIwOX21ha2VfZnVuY3Rpb26Uk5QoaACMDV9idWlsdGluX3R5cGWUk5SMCENvZGVUeXBllIWUUpQoSwFLAEsASwFLAUsTQwSIAFMAlE6FlCmMAV+UhZSMSC91c3IvbG9jYWwvbGliL3B5dGhvbjMuOS9kaXN0LXBhY2thZ2VzL3N0YWJsZV9iYXNlbGluZXMzL2NvbW1vbi91dGlscy5weZSMBGZ1bmOUS4JDAgABlIwDdmFslIWUKXSUUpR9lCiMC19fcGFja2FnZV9flIwYc3RhYmxlX2Jhc2VsaW5lczMuY29tbW9ulIwIX19uYW1lX1+UjB5zdGFibGVfYmFzZWxpbmVzMy5jb21tb24udXRpbHOUjAhfX2ZpbGVfX5SMSC91c3IvbG9jYWwvbGliL3B5dGhvbjMuOS9kaXN0LXBhY2thZ2VzL3N0YWJsZV9iYXNlbGluZXMzL2NvbW1vbi91dGlscy5weZR1Tk5oAIwQX21ha2VfZW1wdHlfY2VsbJSTlClSlIWUdJRSlIwcY2xvdWRwaWNrbGUuY2xvdWRwaWNrbGVfZmFzdJSMEl9mdW5jdGlvbl9zZXRzdGF0ZZSTlGgffZR9lChoFmgNjAxfX3F1YWxuYW1lX1+UjBljb25zdGFudF9mbi48bG9jYWxzPi5mdW5jlIwPX19hbm5vdGF0aW9uc19flH2UjA5fX2t3ZGVmYXVsdHNfX5ROjAxfX2RlZmF1bHRzX1+UTowKX19tb2R1bGVfX5RoF4wHX19kb2NfX5ROjAtfX2Nsb3N1cmVfX5RoAIwKX21ha2VfY2VsbJSTlEc/M6kqMFUyYYWUUpSFlIwXX2Nsb3VkcGlja2xlX3N1Ym1vZHVsZXOUXZSMC19fZ2xvYmFsc19flH2UdYaUhlIwLg=="}, "_last_obs": {":type:": "<class 'numpy.ndarray'>", ":serialized:": "gAWVlQAAAAAAAACMEm51bXB5LmNvcmUubnVtZXJpY5SMC19mcm9tYnVmZmVylJOUKJYgAAAAAAAAAIC8G7+cTfc+6goavgbY372tG1S8jeDRPAAAAAAAAAAAlIwFbnVtcHmUjAVkdHlwZZSTlIwCZjSUiYiHlFKUKEsDjAE8lE5OTkr/////Sv////9LAHSUYksBSwiGlIwBQ5R0lFKULg=="}, "_last_episode_starts": {":type:": "<class 'numpy.ndarray'>", ":serialized:": "gAWVdAAAAAAAAACMEm51bXB5LmNvcmUubnVtZXJpY5SMC19mcm9tYnVmZmVylJOUKJYBAAAAAAAAAACUjAVudW1weZSMBWR0eXBllJOUjAJiMZSJiIeUUpQoSwOMAXyUTk5OSv////9K/////0sAdJRiSwGFlIwBQ5R0lFKULg=="}, "_last_original_obs": null, "_episode_num": 0, "use_sde": false, "sde_sample_freq": -1, "_current_progress_remaining": -0.0035199999999999676, "ep_info_buffer": {":type:": "<class 'collections.deque'>", ":serialized:": 
"gAWVQRAAAAAAAACMC2NvbGxlY3Rpb25zlIwFZGVxdWWUk5QpS2SGlFKUKH2UKIwBcpSMFW51bXB5LmNvcmUubXVsdGlhcnJheZSMBnNjYWxhcpSTlIwFbnVtcHmUjAVkdHlwZZSTlIwCZjiUiYiHlFKUKEsDjAE8lE5OTkr/////Sv////9LAHSUYkMIHzF6bqGJRsCUhpRSlIwBbJRL0YwBdJRHQFy9IRywOe91fZQoaAZoCWgPQwh9CRUcXuAswJSGlFKUaBVL42gWR0BczZWFN+LFdX2UKGgGaAloD0MIMC3qk9wJQ8CUhpRSlGgVS9hoFkdAXNy8pTdcjnV9lChoBmgJaA9DCLyyCwbXS1ZAlIaUUpRoFU3oA2gWR0Bdj5X6qKgqdX2UKGgGaAloD0MILxfxnZjGX8CUhpRSlGgVS8BoFkdAXZ1rYXfqHHV9lChoBmgJaA9DCEZFnE6ya11AlIaUUpRoFU3oA2gWR0BeYOZb6guidX2UKGgGaAloD0MIzxJkBFR0NUCUhpRSlGgVS45oFkdAXmxiXpnpS3V9lChoBmgJaA9DCChIbHcPqEvAlIaUUpRoFUu2aBZHQF59Qd0aIep1fZQoaAZoCWgPQwi8k0+Pbf5SwJSGlFKUaBVLjWgWR0Bex8/hVENOdX2UKGgGaAloD0MIoiqm0k+QL0CUhpRSlGgVS41oFkdAXtNQP7N0NnV9lChoBmgJaA9DCGhAvRk1gzlAlIaUUpRoFUuGaBZHQF7dieumrKh1fZQoaAZoCWgPQwixijcyj6wgQJSGlFKUaBVLjmgWR0Be5t92HLzPdX2UKGgGaAloD0MIMA3DR8S0FkCUhpRSlGgVS3FoFkdAXu56F/QSjHV9lChoBmgJaA9DCP6Bctu++zdAlIaUUpRoFUunaBZHQF77pEQXhwV1fZQoaAZoCWgPQwh8KxIT1G5KQJSGlFKUaBVLnWgWR0BfCyJ9AooedX2UKGgGaAloD0MI8wGBzqQFJMCUhpRSlGgVS3NoFkdAX0MAYHgP3HV9lChoBmgJaA9DCBb59UNsMD/AlIaUUpRoFUtxaBZHQF9KIsiB5HF1fZQoaAZoCWgPQwh9BtSbUUJiQJSGlFKUaBVN6ANoFkdAYANKhcqvvHV9lChoBmgJaA9DCEga3NYWxEnAlIaUUpRoFUuTaBZHQGAJTkyULUl1fZQoaAZoCWgPQwgVNgNckLFRQJSGlFKUaBVN6ANoFkdAYGHrOZ9d/3V9lChoBmgJaA9DCJ0Rpb3BGzpAlIaUUpRoFUtnaBZHQGBl9rO7g891fZQoaAZoCWgPQwg9gbBTrOY3wJSGlFKUaBVLYmgWR0BgacG5c1O1dX2UKGgGaAloD0MI5EhnYORFMUCUhpRSlGgVS5ZoFkdAYG/lQMx46nV9lChoBmgJaA9DCHaKVYMwLyBAlIaUUpRoFUtlaBZHQGBzg2606YF1fZQoaAZoCWgPQwj3PlWFBnI0wJSGlFKUaBVLXGgWR0BgdqQV9F4LdX2UKGgGaAloD0MIpTFaR1VhW0CUhpRSlGgVTegDaBZHQGDZELH+6y11fZQoaAZoCWgPQwitp1ZfXaU9QJSGlFKUaBVLbWgWR0Bg3co4MnZ1dX2UKGgGaAloD0MIyorh6gBYN0CUhpRSlGgVS5VoFkdAYQaTfzjFQ3V9lChoBmgJaA9DCEdaKm9HBDtAlIaUUpRoFUudaBZHQGENJRoAXEZ1fZQoaAZoCWgPQwg0Tdh+MlhPQJSGlFKUaBVLl2gWR0BhE/GS6lLwdX2UKGgGaAloD0MI4Zf6eVOBGECUhpRSlGgVS4loFkdAYRu0IkZ75XV9lChoBmgJaA9DCE+WWu83mj3AlIaUUpRoFUubaBZHQGEjhmwqy4Z1fZQoaAZoCWgPQwhhN2xblLEgQJSGlFKUaBVLc2gWR0BhKMQVbiZOdX2UKGgGaAloD0MIChLb3QPoMECUhpRSlGgVS4BoFkdAYS5vZRKpUHV
9lChoBmgJaA9DCKtCA7FsZvQ/lIaUUpRoFUuBaBZHQGEzjzyz5XV1fZQoaAZoCWgPQwgNcEG2LA1OQJSGlFKUaBVLpmgWR0BhV7oEB8x9dX2UKGgGaAloD0MIwOrIkc7QEcCUhpRSlGgVS3JoFkdAYVupw0fozXV9lChoBmgJaA9DCJcBZylZwjDAlIaUUpRoFUuNaBZHQGFglfZ26kJ1fZQoaAZoCWgPQwhCP1OvW8QwQJSGlFKUaBVLiGgWR0BhZdu+AVfvdX2UKGgGaAloD0MIUFPL1vp0RECUhpRSlGgVS2doFkdAYWnTsIE8rHV9lChoBmgJaA9DCJsb0xOWqBlAlIaUUpRoFUt4aBZHQGFuAmiQDFJ1fZQoaAZoCWgPQwiCjla1pIlDwJSGlFKUaBVLiGgWR0BhcstRNyo5dX2UKGgGaAloD0MIQX+hR4yeDkCUhpRSlGgVS2toFkdAYXZ6QeV9nnV9lChoBmgJaA9DCGfttgvNnTBAlIaUUpRoFUuUaBZHQGGTjsD4gzR1fZQoaAZoCWgPQwi0AdiACJk9QJSGlFKUaBVLpWgWR0BhmUxoIv8JdX2UKGgGaAloD0MIje4gdqYAJcCUhpRSlGgVS5loFkdAYZ5VrAP/aXV9lChoBmgJaA9DCFOwxtl0cFhAlIaUUpRoFU3oA2gWR0Bh/jM/yGzsdX2UKGgGaAloD0MIUd7H0Ry5JsCUhpRSlGgVS5poFkdAYgNuzhP0qnV9lChoBmgJaA9DCMNF7unqPhJAlIaUUpRoFUuIaBZHQGIINZmqYJF1fZQoaAZoCWgPQwjDnnb4a/ZcQJSGlFKUaBVN6ANoFkdAYmdFF2FFlXV9lChoBmgJaA9DCCklBKvq9T5AlIaUUpRoFUu8aBZHQGJt3PZ7HAB1fZQoaAZoCWgPQwjQ04BB0ss6QJSGlFKUaBVLf2gWR0BicgwoLG70dX2UKGgGaAloD0MIIM8u3/oEZECUhpRSlGgVTegDaBZHQGLPSXD3ueB1fZQoaAZoCWgPQwgFTraBO2NRQJSGlFKUaBVN6ANoFkdAYypwy6+WW3V9lChoBmgJaA9DCFOvWwTGKirAlIaUUpRoFUuJaBZHQGNHvGQ0XP91fZQoaAZoCWgPQwhU5BBxc0FUwJSGlFKUaBVLiGgWR0BjTUOqebuudX2UKGgGaAloD0MIQ41CklkVSkCUhpRSlGgVS6VoFkdAY1MpQUHpr3V9lChoBmgJaA9DCJZ5q65DVRJAlIaUUpRoFUt1aBZHQGNXiwr1/Uh1fZQoaAZoCWgPQwgFhqxu9dQ7wJSGlFKUaBVLXWgWR0BjWqFVT72tdX2UKGgGaAloD0MIUTOkiuJNQkCUhpRSlGgVS51oFkdAY1/SeiBXjnV9lChoBmgJaA9DCEHw+PauOTDAlIaUUpRoFUukaBZHQGNlSpBHCoF1fZQoaAZoCWgPQwgPfAxWnAVjQJSGlFKUaBVN6ANoFkdAY7Fy/9Hc13V9lChoBmgJaA9DCGCsb2ByEU1AlIaUUpRoFUtsaBZHQGO01tfoicJ1fZQoaAZoCWgPQwj0/j9OmDDVv5SGlFKUaBVLZGgWR0Bj0DV6NVBEdX2UKGgGaAloD0MIImx4eqXRYkCUhpRSlGgVTegDaBZHQGQjBxYJVsF1fZQoaAZoCWgPQwhGJ0ut99MrQJSGlFKUaBVLcGgWR0BkJsyBTXJ6dX2UKGgGaAloD0MI6j2V0x7rZkCUhpRSlGgVTegDaBZHQGR28jzI3it1fZQoaAZoCWgPQwjb3QN0X0IwQJSGlFKUaBVLpmgWR0Bkfxs9B8hLdX2UKGgGaAloD0MImYBfI0lqSkCUhpRSlGgVS7RoFkdAZIca9bor4HV9lChoBmgJaA9DCG78icqGjT3AlIaUUpRoFUvLaBZHQGSQIDgZTAF1fZQoaAZoCWgPQwjoL/SIUUVgQJSGlFKUaBVN6ANoFkdAZPrE6T4cm3V9lChoBmgJaA9DCFj
k1w+x+F9AlIaUUpRoFU3oA2gWR0BlVtKPGQ0XdX2UKGgGaAloD0MItDo5Q/FGY0CUhpRSlGgVTegDaBZHQGWnlQdjoZB1fZQoaAZoCWgPQwiULv1LUmhTQJSGlFKUaBVLwGgWR0Blr3qZ+hGpdX2UKGgGaAloD0MIEXAIVWq2W0CUhpRSlGgVTegDaBZHQGYRVuBMBZJ1fZQoaAZoCWgPQwjd7A+U2wxPQJSGlFKUaBVLsmgWR0BmGN6ol2NedX2UKGgGaAloD0MI+Db92Q9VZ0CUhpRSlGgVTegDaBZHQGZmw5eZ5Rl1fZQoaAZoCWgPQwjU1ohgnPhiQJSGlFKUaBVN6ANoFkdAZtN/vv0AcXV9lChoBmgJaA9DCB1Z+WUw/F1AlIaUUpRoFU3oA2gWR0BnKv4yoGY8dX2UKGgGaAloD0MI6lil9MyiZECUhpRSlGgVTegDaBZHQGeE6hpQDV91fZQoaAZoCWgPQwhNLVvri4QpwJSGlFKUaBVL52gWR0BnqCNsFdLQdX2UKGgGaAloD0MIb59VZkr3YECUhpRSlGgVTegDaBZHQGfzzOHFglZ1fZQoaAZoCWgPQwgVGR2QhMJdQJSGlFKUaBVN6ANoFkdAaFpwFTvRZ3V9lChoBmgJaA9DCHfbhea6AmJAlIaUUpRoFU3oA2gWR0BopgTRIBikdX2UKGgGaAloD0MIvTjx1Y46QkCUhpRSlGgVS9BoFkdAaMnS5RTCL3V9lChoBmgJaA9DCCswZHWr/UfAlIaUUpRoFUvyaBZHQGjTg93bEgp1fZQoaAZoCWgPQwiN74tLVUReQJSGlFKUaBVN6ANoFkdAaTg12JSBLHV9lChoBmgJaA9DCA4viEhN2l9AlIaUUpRoFU3oA2gWR0BpoFS2phnbdX2UKGgGaAloD0MIat/cXz1FXECUhpRSlGgVTegDaBZHQGnmymALApN1fZQoaAZoCWgPQwgyWdx/ZM9hQJSGlFKUaBVN6ANoFkdAajPmDDjzZ3V9lChoBmgJaA9DCP0RhgFLe1xAlIaUUpRoFU3oA2gWR0BqhA4p+c6OdX2UKGgGaAloD0MIGO5cGOlBXkCUhpRSlGgVTegDaBZHQGrjCI+GGmF1fZQoaAZoCWgPQwhU46WbxBhDwJSGlFKUaBVN2AFoFkdAavuuloDgZXV9lChoBmgJaA9DCAlrY+yEk1xAlIaUUpRoFU3oA2gWR0BrT68vmHQAdX2UKGgGaAloD0MIhNkEGJanW8CUhpRSlGgVTWgDaBZHQGuYXos7MgV1fZQoaAZoCWgPQwgrTrUWZtxewJSGlFKUaBVNAgFoFkdAa6I9h7Vrh3V9lChoBmgJaA9DCPgb7bjhN0rAlIaUUpRoFUv7aBZHQGvCxxtHhCN1fZQoaAZoCWgPQwhvZB75g5pkQJSGlFKUaBVN6ANoFkdAbChriVB2OnV9lChoBmgJaA9DCCJxj6WP92RAlIaUUpRoFU3gAWgWR0BsRGK64Ds/dX2UKGgGaAloD0MI81meBzftcUCUhpRSlGgVTUQBaBZHQGxVWFvhqCZ1ZS4="}, "ep_success_buffer": {":type:": "<class 'collections.deque'>", ":serialized:": "gAWVIAAAAAAAAACMC2NvbGxlY3Rpb25zlIwFZGVxdWWUk5QpS2SGlFKULg=="}, "_n_updates": 980, "n_steps": 1024, "gamma": 0.999, "gae_lambda": 0.98, "ent_coef": 0.01, "vf_coef": 0.5, "max_grad_norm": 0.5, "batch_size": 64, "n_epochs": 10, "clip_range": {":type:": "<class 'function'>", ":serialized:": 
"gAWVwwIAAAAAAACMF2Nsb3VkcGlja2xlLmNsb3VkcGlja2xllIwOX21ha2VfZnVuY3Rpb26Uk5QoaACMDV9idWlsdGluX3R5cGWUk5SMCENvZGVUeXBllIWUUpQoSwFLAEsASwFLAUsTQwSIAFMAlE6FlCmMAV+UhZSMSC91c3IvbG9jYWwvbGliL3B5dGhvbjMuOS9kaXN0LXBhY2thZ2VzL3N0YWJsZV9iYXNlbGluZXMzL2NvbW1vbi91dGlscy5weZSMBGZ1bmOUS4JDAgABlIwDdmFslIWUKXSUUpR9lCiMC19fcGFja2FnZV9flIwYc3RhYmxlX2Jhc2VsaW5lczMuY29tbW9ulIwIX19uYW1lX1+UjB5zdGFibGVfYmFzZWxpbmVzMy5jb21tb24udXRpbHOUjAhfX2ZpbGVfX5SMSC91c3IvbG9jYWwvbGliL3B5dGhvbjMuOS9kaXN0LXBhY2thZ2VzL3N0YWJsZV9iYXNlbGluZXMzL2NvbW1vbi91dGlscy5weZR1Tk5oAIwQX21ha2VfZW1wdHlfY2VsbJSTlClSlIWUdJRSlIwcY2xvdWRwaWNrbGUuY2xvdWRwaWNrbGVfZmFzdJSMEl9mdW5jdGlvbl9zZXRzdGF0ZZSTlGgffZR9lChoFmgNjAxfX3F1YWxuYW1lX1+UjBljb25zdGFudF9mbi48bG9jYWxzPi5mdW5jlIwPX19hbm5vdGF0aW9uc19flH2UjA5fX2t3ZGVmYXVsdHNfX5ROjAxfX2RlZmF1bHRzX1+UTowKX19tb2R1bGVfX5RoF4wHX19kb2NfX5ROjAtfX2Nsb3N1cmVfX5RoAIwKX21ha2VfY2VsbJSTlEc/yZmZmZmZmoWUUpSFlIwXX2Nsb3VkcGlja2xlX3N1Ym1vZHVsZXOUXZSMC19fZ2xvYmFsc19flH2UdYaUhlIwLg=="}, "clip_range_vf": null, "normalize_advantage": true, "target_kl": null, "system_info": {"OS": "Linux-5.10.147+-x86_64-with-glibc2.31 # 1 SMP Sat Dec 10 16:00:40 UTC 2022", "Python": "3.9.16", "Stable-Baselines3": "1.7.0", "PyTorch": "1.13.1+cu116", "GPU Enabled": "False", "Numpy": "1.22.4", "Gym": "0.21.0"}}
ppo-LunarLander-v2_1.zip ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:1327bbb128128b6f11b09e512011906587e667bd8fcd6a4e753ffe9a44024337
3
+ size 146175
ppo-LunarLander-v2_1/_stable_baselines3_version ADDED
@@ -0,0 +1 @@
 
 
1
+ 1.7.0
ppo-LunarLander-v2_1/data ADDED
@@ -0,0 +1,95 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "policy_class": {
3
+ ":type:": "<class 'abc.ABCMeta'>",
4
+ ":serialized:": "gAWVOwAAAAAAAACMIXN0YWJsZV9iYXNlbGluZXMzLmNvbW1vbi5wb2xpY2llc5SMEUFjdG9yQ3JpdGljUG9saWN5lJOULg==",
5
+ "__module__": "stable_baselines3.common.policies",
6
+ "__doc__": "\n Policy class for actor-critic algorithms (has both policy and value prediction).\n Used by A2C, PPO and the likes.\n\n :param observation_space: Observation space\n :param action_space: Action space\n :param lr_schedule: Learning rate schedule (could be constant)\n :param net_arch: The specification of the policy and value networks.\n :param activation_fn: Activation function\n :param ortho_init: Whether to use or not orthogonal initialization\n :param use_sde: Whether to use State Dependent Exploration or not\n :param log_std_init: Initial value for the log standard deviation\n :param full_std: Whether to use (n_features x n_actions) parameters\n for the std instead of only (n_features,) when using gSDE\n :param use_expln: Use ``expln()`` function instead of ``exp()`` to ensure\n a positive standard deviation (cf paper). It allows to keep variance\n above zero and prevent it from growing too fast. In practice, ``exp()`` is usually enough.\n :param squash_output: Whether to squash the output using a tanh function,\n this allows to ensure boundaries when using gSDE.\n :param features_extractor_class: Features extractor to use.\n :param features_extractor_kwargs: Keyword arguments\n to pass to the features extractor.\n :param share_features_extractor: If True, the features extractor is shared between the policy and value networks.\n :param normalize_images: Whether to normalize images or not,\n dividing by 255.0 (True by default)\n :param optimizer_class: The optimizer to use,\n ``th.optim.Adam`` by default\n :param optimizer_kwargs: Additional keyword arguments,\n excluding the learning rate, to pass to the optimizer\n ",
7
+ "__init__": "<function ActorCriticPolicy.__init__ at 0x7f36fbd8c3a0>",
8
+ "_get_constructor_parameters": "<function ActorCriticPolicy._get_constructor_parameters at 0x7f36fbd8c430>",
9
+ "reset_noise": "<function ActorCriticPolicy.reset_noise at 0x7f36fbd8c4c0>",
10
+ "_build_mlp_extractor": "<function ActorCriticPolicy._build_mlp_extractor at 0x7f36fbd8c550>",
11
+ "_build": "<function ActorCriticPolicy._build at 0x7f36fbd8c5e0>",
12
+ "forward": "<function ActorCriticPolicy.forward at 0x7f36fbd8c670>",
13
+ "extract_features": "<function ActorCriticPolicy.extract_features at 0x7f36fbd8c700>",
14
+ "_get_action_dist_from_latent": "<function ActorCriticPolicy._get_action_dist_from_latent at 0x7f36fbd8c790>",
15
+ "_predict": "<function ActorCriticPolicy._predict at 0x7f36fbd8c820>",
16
+ "evaluate_actions": "<function ActorCriticPolicy.evaluate_actions at 0x7f36fbd8c8b0>",
17
+ "get_distribution": "<function ActorCriticPolicy.get_distribution at 0x7f36fbd8c940>",
18
+ "predict_values": "<function ActorCriticPolicy.predict_values at 0x7f36fbd8c9d0>",
19
+ "__abstractmethods__": "frozenset()",
20
+ "_abc_impl": "<_abc._abc_data object at 0x7f36fbd90a80>"
21
+ },
22
+ "verbose": 1,
23
+ "policy_kwargs": {},
24
+ "observation_space": {
25
+ ":type:": "<class 'gym.spaces.box.Box'>",
26
+ ":serialized:": "gAWVnwEAAAAAAACMDmd5bS5zcGFjZXMuYm94lIwDQm94lJOUKYGUfZQojAVkdHlwZZSMBW51bXB5lGgFk5SMAmY0lImIh5RSlChLA4wBPJROTk5K/////0r/////SwB0lGKMBl9zaGFwZZRLCIWUjANsb3eUjBJudW1weS5jb3JlLm51bWVyaWOUjAtfZnJvbWJ1ZmZlcpSTlCiWIAAAAAAAAAAAAID/AACA/wAAgP8AAID/AACA/wAAgP8AAID/AACA/5RoCksIhZSMAUOUdJRSlIwEaGlnaJRoEiiWIAAAAAAAAAAAAIB/AACAfwAAgH8AAIB/AACAfwAAgH8AAIB/AACAf5RoCksIhZRoFXSUUpSMDWJvdW5kZWRfYmVsb3eUaBIolggAAAAAAAAAAAAAAAAAAACUaAeMAmIxlImIh5RSlChLA4wBfJROTk5K/////0r/////SwB0lGJLCIWUaBV0lFKUjA1ib3VuZGVkX2Fib3ZllGgSKJYIAAAAAAAAAAAAAAAAAAAAlGghSwiFlGgVdJRSlIwKX25wX3JhbmRvbZROdWIu",
27
+ "dtype": "float32",
28
+ "_shape": [
29
+ 8
30
+ ],
31
+ "low": "[-inf -inf -inf -inf -inf -inf -inf -inf]",
32
+ "high": "[inf inf inf inf inf inf inf inf]",
33
+ "bounded_below": "[False False False False False False False False]",
34
+ "bounded_above": "[False False False False False False False False]",
35
+ "_np_random": null
36
+ },
37
+ "action_space": {
38
+ ":type:": "<class 'gym.spaces.discrete.Discrete'>",
39
+ ":serialized:": "gAWVggAAAAAAAACME2d5bS5zcGFjZXMuZGlzY3JldGWUjAhEaXNjcmV0ZZSTlCmBlH2UKIwBbpRLBIwGX3NoYXBllCmMBWR0eXBllIwFbnVtcHmUaAeTlIwCaTiUiYiHlFKUKEsDjAE8lE5OTkr/////Sv////9LAHSUYowKX25wX3JhbmRvbZROdWIu",
40
+ "n": 4,
41
+ "_shape": [],
42
+ "dtype": "int64",
43
+ "_np_random": null
44
+ },
45
+ "n_envs": 1,
46
+ "num_timesteps": 100352,
47
+ "_total_timesteps": 100000.0,
48
+ "_num_timesteps_at_start": 0,
49
+ "seed": null,
50
+ "action_noise": null,
51
+ "start_time": 1679408570305682247,
52
+ "learning_rate": 0.0003,
53
+ "tensorboard_log": null,
54
+ "lr_schedule": {
55
+ ":type:": "<class 'function'>",
56
+ ":serialized:": "gAWVwwIAAAAAAACMF2Nsb3VkcGlja2xlLmNsb3VkcGlja2xllIwOX21ha2VfZnVuY3Rpb26Uk5QoaACMDV9idWlsdGluX3R5cGWUk5SMCENvZGVUeXBllIWUUpQoSwFLAEsASwFLAUsTQwSIAFMAlE6FlCmMAV+UhZSMSC91c3IvbG9jYWwvbGliL3B5dGhvbjMuOS9kaXN0LXBhY2thZ2VzL3N0YWJsZV9iYXNlbGluZXMzL2NvbW1vbi91dGlscy5weZSMBGZ1bmOUS4JDAgABlIwDdmFslIWUKXSUUpR9lCiMC19fcGFja2FnZV9flIwYc3RhYmxlX2Jhc2VsaW5lczMuY29tbW9ulIwIX19uYW1lX1+UjB5zdGFibGVfYmFzZWxpbmVzMy5jb21tb24udXRpbHOUjAhfX2ZpbGVfX5SMSC91c3IvbG9jYWwvbGliL3B5dGhvbjMuOS9kaXN0LXBhY2thZ2VzL3N0YWJsZV9iYXNlbGluZXMzL2NvbW1vbi91dGlscy5weZR1Tk5oAIwQX21ha2VfZW1wdHlfY2VsbJSTlClSlIWUdJRSlIwcY2xvdWRwaWNrbGUuY2xvdWRwaWNrbGVfZmFzdJSMEl9mdW5jdGlvbl9zZXRzdGF0ZZSTlGgffZR9lChoFmgNjAxfX3F1YWxuYW1lX1+UjBljb25zdGFudF9mbi48bG9jYWxzPi5mdW5jlIwPX19hbm5vdGF0aW9uc19flH2UjA5fX2t3ZGVmYXVsdHNfX5ROjAxfX2RlZmF1bHRzX1+UTowKX19tb2R1bGVfX5RoF4wHX19kb2NfX5ROjAtfX2Nsb3N1cmVfX5RoAIwKX21ha2VfY2VsbJSTlEc/M6kqMFUyYYWUUpSFlIwXX2Nsb3VkcGlja2xlX3N1Ym1vZHVsZXOUXZSMC19fZ2xvYmFsc19flH2UdYaUhlIwLg=="
57
+ },
58
+ "_last_obs": {
59
+ ":type:": "<class 'numpy.ndarray'>",
60
+ ":serialized:": "gAWVlQAAAAAAAACMEm51bXB5LmNvcmUubnVtZXJpY5SMC19mcm9tYnVmZmVylJOUKJYgAAAAAAAAAIC8G7+cTfc+6goavgbY372tG1S8jeDRPAAAAAAAAAAAlIwFbnVtcHmUjAVkdHlwZZSTlIwCZjSUiYiHlFKUKEsDjAE8lE5OTkr/////Sv////9LAHSUYksBSwiGlIwBQ5R0lFKULg=="
61
+ },
62
+ "_last_episode_starts": {
63
+ ":type:": "<class 'numpy.ndarray'>",
64
+ ":serialized:": "gAWVdAAAAAAAAACMEm51bXB5LmNvcmUubnVtZXJpY5SMC19mcm9tYnVmZmVylJOUKJYBAAAAAAAAAACUjAVudW1weZSMBWR0eXBllJOUjAJiMZSJiIeUUpQoSwOMAXyUTk5OSv////9K/////0sAdJRiSwGFlIwBQ5R0lFKULg=="
65
+ },
66
+ "_last_original_obs": null,
67
+ "_episode_num": 0,
68
+ "use_sde": false,
69
+ "sde_sample_freq": -1,
70
+ "_current_progress_remaining": -0.0035199999999999676,
71
+ "ep_info_buffer": {
72
+ ":type:": "<class 'collections.deque'>",
73
+ ":serialized:": "gAWVQRAAAAAAAACMC2NvbGxlY3Rpb25zlIwFZGVxdWWUk5QpS2SGlFKUKH2UKIwBcpSMFW51bXB5LmNvcmUubXVsdGlhcnJheZSMBnNjYWxhcpSTlIwFbnVtcHmUjAVkdHlwZZSTlIwCZjiUiYiHlFKUKEsDjAE8lE5OTkr/////Sv////9LAHSUYkMIHzF6bqGJRsCUhpRSlIwBbJRL0YwBdJRHQFy9IRywOe91fZQoaAZoCWgPQwh9CRUcXuAswJSGlFKUaBVL42gWR0BczZWFN+LFdX2UKGgGaAloD0MIMC3qk9wJQ8CUhpRSlGgVS9hoFkdAXNy8pTdcjnV9lChoBmgJaA9DCLyyCwbXS1ZAlIaUUpRoFU3oA2gWR0Bdj5X6qKgqdX2UKGgGaAloD0MILxfxnZjGX8CUhpRSlGgVS8BoFkdAXZ1rYXfqHHV9lChoBmgJaA9DCEZFnE6ya11AlIaUUpRoFU3oA2gWR0BeYOZb6guidX2UKGgGaAloD0MIzxJkBFR0NUCUhpRSlGgVS45oFkdAXmxiXpnpS3V9lChoBmgJaA9DCChIbHcPqEvAlIaUUpRoFUu2aBZHQF59Qd0aIep1fZQoaAZoCWgPQwi8k0+Pbf5SwJSGlFKUaBVLjWgWR0Bex8/hVENOdX2UKGgGaAloD0MIoiqm0k+QL0CUhpRSlGgVS41oFkdAXtNQP7N0NnV9lChoBmgJaA9DCGhAvRk1gzlAlIaUUpRoFUuGaBZHQF7dieumrKh1fZQoaAZoCWgPQwixijcyj6wgQJSGlFKUaBVLjmgWR0Be5t92HLzPdX2UKGgGaAloD0MIMA3DR8S0FkCUhpRSlGgVS3FoFkdAXu56F/QSjHV9lChoBmgJaA9DCP6Bctu++zdAlIaUUpRoFUunaBZHQF77pEQXhwV1fZQoaAZoCWgPQwh8KxIT1G5KQJSGlFKUaBVLnWgWR0BfCyJ9AooedX2UKGgGaAloD0MI8wGBzqQFJMCUhpRSlGgVS3NoFkdAX0MAYHgP3HV9lChoBmgJaA9DCBb59UNsMD/AlIaUUpRoFUtxaBZHQF9KIsiB5HF1fZQoaAZoCWgPQwh9BtSbUUJiQJSGlFKUaBVN6ANoFkdAYANKhcqvvHV9lChoBmgJaA9DCEga3NYWxEnAlIaUUpRoFUuTaBZHQGAJTkyULUl1fZQoaAZoCWgPQwgVNgNckLFRQJSGlFKUaBVN6ANoFkdAYGHrOZ9d/3V9lChoBmgJaA9DCJ0Rpb3BGzpAlIaUUpRoFUtnaBZHQGBl9rO7g891fZQoaAZoCWgPQwg9gbBTrOY3wJSGlFKUaBVLYmgWR0BgacG5c1O1dX2UKGgGaAloD0MI5EhnYORFMUCUhpRSlGgVS5ZoFkdAYG/lQMx46nV9lChoBmgJaA9DCHaKVYMwLyBAlIaUUpRoFUtlaBZHQGBzg2606YF1fZQoaAZoCWgPQwj3PlWFBnI0wJSGlFKUaBVLXGgWR0BgdqQV9F4LdX2UKGgGaAloD0MIpTFaR1VhW0CUhpRSlGgVTegDaBZHQGDZELH+6y11fZQoaAZoCWgPQwitp1ZfXaU9QJSGlFKUaBVLbWgWR0Bg3co4MnZ1dX2UKGgGaAloD0MIyorh6gBYN0CUhpRSlGgVS5VoFkdAYQaTfzjFQ3V9lChoBmgJaA9DCEdaKm9HBDtAlIaUUpRoFUudaBZHQGENJRoAXEZ1fZQoaAZoCWgPQwg0Tdh+MlhPQJSGlFKUaBVLl2gWR0BhE/GS6lLwdX2UKGgGaAloD0MI4Zf6eVOBGECUhpRSlGgVS4loFkdAYRu0IkZ75XV9lChoBmgJaA9DCE+WWu83mj3AlIaUUpRoFUubaBZHQGEjhmwqy4Z1fZQoaAZoCWgPQwhhN2xblLEgQJSGlFKUaBVLc2gWR0BhKMQVbiZOdX2UKGgGaAloD0MIChLb3QPoMECUhpRSlGgVS
4BoFkdAYS5vZRKpUHV9lChoBmgJaA9DCKtCA7FsZvQ/lIaUUpRoFUuBaBZHQGEzjzyz5XV1fZQoaAZoCWgPQwgNcEG2LA1OQJSGlFKUaBVLpmgWR0BhV7oEB8x9dX2UKGgGaAloD0MIwOrIkc7QEcCUhpRSlGgVS3JoFkdAYVupw0fozXV9lChoBmgJaA9DCJcBZylZwjDAlIaUUpRoFUuNaBZHQGFglfZ26kJ1fZQoaAZoCWgPQwhCP1OvW8QwQJSGlFKUaBVLiGgWR0BhZdu+AVfvdX2UKGgGaAloD0MIUFPL1vp0RECUhpRSlGgVS2doFkdAYWnTsIE8rHV9lChoBmgJaA9DCJsb0xOWqBlAlIaUUpRoFUt4aBZHQGFuAmiQDFJ1fZQoaAZoCWgPQwiCjla1pIlDwJSGlFKUaBVLiGgWR0BhcstRNyo5dX2UKGgGaAloD0MIQX+hR4yeDkCUhpRSlGgVS2toFkdAYXZ6QeV9nnV9lChoBmgJaA9DCGfttgvNnTBAlIaUUpRoFUuUaBZHQGGTjsD4gzR1fZQoaAZoCWgPQwi0AdiACJk9QJSGlFKUaBVLpWgWR0BhmUxoIv8JdX2UKGgGaAloD0MIje4gdqYAJcCUhpRSlGgVS5loFkdAYZ5VrAP/aXV9lChoBmgJaA9DCFOwxtl0cFhAlIaUUpRoFU3oA2gWR0Bh/jM/yGzsdX2UKGgGaAloD0MIUd7H0Ry5JsCUhpRSlGgVS5poFkdAYgNuzhP0qnV9lChoBmgJaA9DCMNF7unqPhJAlIaUUpRoFUuIaBZHQGIINZmqYJF1fZQoaAZoCWgPQwjDnnb4a/ZcQJSGlFKUaBVN6ANoFkdAYmdFF2FFlXV9lChoBmgJaA9DCCklBKvq9T5AlIaUUpRoFUu8aBZHQGJt3PZ7HAB1fZQoaAZoCWgPQwjQ04BB0ss6QJSGlFKUaBVLf2gWR0BicgwoLG70dX2UKGgGaAloD0MIIM8u3/oEZECUhpRSlGgVTegDaBZHQGLPSXD3ueB1fZQoaAZoCWgPQwgFTraBO2NRQJSGlFKUaBVN6ANoFkdAYypwy6+WW3V9lChoBmgJaA9DCFOvWwTGKirAlIaUUpRoFUuJaBZHQGNHvGQ0XP91fZQoaAZoCWgPQwhU5BBxc0FUwJSGlFKUaBVLiGgWR0BjTUOqebuudX2UKGgGaAloD0MIQ41CklkVSkCUhpRSlGgVS6VoFkdAY1MpQUHpr3V9lChoBmgJaA9DCJZ5q65DVRJAlIaUUpRoFUt1aBZHQGNXiwr1/Uh1fZQoaAZoCWgPQwgFhqxu9dQ7wJSGlFKUaBVLXWgWR0BjWqFVT72tdX2UKGgGaAloD0MIUTOkiuJNQkCUhpRSlGgVS51oFkdAY1/SeiBXjnV9lChoBmgJaA9DCEHw+PauOTDAlIaUUpRoFUukaBZHQGNlSpBHCoF1fZQoaAZoCWgPQwgPfAxWnAVjQJSGlFKUaBVN6ANoFkdAY7Fy/9Hc13V9lChoBmgJaA9DCGCsb2ByEU1AlIaUUpRoFUtsaBZHQGO01tfoicJ1fZQoaAZoCWgPQwj0/j9OmDDVv5SGlFKUaBVLZGgWR0Bj0DV6NVBEdX2UKGgGaAloD0MIImx4eqXRYkCUhpRSlGgVTegDaBZHQGQjBxYJVsF1fZQoaAZoCWgPQwhGJ0ut99MrQJSGlFKUaBVLcGgWR0BkJsyBTXJ6dX2UKGgGaAloD0MI6j2V0x7rZkCUhpRSlGgVTegDaBZHQGR28jzI3it1fZQoaAZoCWgPQwjb3QN0X0IwQJSGlFKUaBVLpmgWR0Bkfxs9B8hLdX2UKGgGaAloD0MImYBfI0lqSkCUhpRSlGgVS7RoFkdAZIca9bor4HV9lChoBmgJaA9DCG78icqGjT3AlIaUUpRoFUvLaBZHQGSQIDgZTAF1fZQoaAZoCWgPQwjoL/SIUUVgQJSGlFKUaBVN6ANoFkdAZPrE6T4cm
3V9lChoBmgJaA9DCFjk1w+x+F9AlIaUUpRoFU3oA2gWR0BlVtKPGQ0XdX2UKGgGaAloD0MItDo5Q/FGY0CUhpRSlGgVTegDaBZHQGWnlQdjoZB1fZQoaAZoCWgPQwiULv1LUmhTQJSGlFKUaBVLwGgWR0Blr3qZ+hGpdX2UKGgGaAloD0MIEXAIVWq2W0CUhpRSlGgVTegDaBZHQGYRVuBMBZJ1fZQoaAZoCWgPQwjd7A+U2wxPQJSGlFKUaBVLsmgWR0BmGN6ol2NedX2UKGgGaAloD0MI+Db92Q9VZ0CUhpRSlGgVTegDaBZHQGZmw5eZ5Rl1fZQoaAZoCWgPQwjU1ohgnPhiQJSGlFKUaBVN6ANoFkdAZtN/vv0AcXV9lChoBmgJaA9DCB1Z+WUw/F1AlIaUUpRoFU3oA2gWR0BnKv4yoGY8dX2UKGgGaAloD0MI6lil9MyiZECUhpRSlGgVTegDaBZHQGeE6hpQDV91fZQoaAZoCWgPQwhNLVvri4QpwJSGlFKUaBVL52gWR0BnqCNsFdLQdX2UKGgGaAloD0MIb59VZkr3YECUhpRSlGgVTegDaBZHQGfzzOHFglZ1fZQoaAZoCWgPQwgVGR2QhMJdQJSGlFKUaBVN6ANoFkdAaFpwFTvRZ3V9lChoBmgJaA9DCHfbhea6AmJAlIaUUpRoFU3oA2gWR0BopgTRIBikdX2UKGgGaAloD0MIvTjx1Y46QkCUhpRSlGgVS9BoFkdAaMnS5RTCL3V9lChoBmgJaA9DCCswZHWr/UfAlIaUUpRoFUvyaBZHQGjTg93bEgp1fZQoaAZoCWgPQwiN74tLVUReQJSGlFKUaBVN6ANoFkdAaTg12JSBLHV9lChoBmgJaA9DCA4viEhN2l9AlIaUUpRoFU3oA2gWR0BpoFS2phnbdX2UKGgGaAloD0MIat/cXz1FXECUhpRSlGgVTegDaBZHQGnmymALApN1fZQoaAZoCWgPQwgyWdx/ZM9hQJSGlFKUaBVN6ANoFkdAajPmDDjzZ3V9lChoBmgJaA9DCP0RhgFLe1xAlIaUUpRoFU3oA2gWR0BqhA4p+c6OdX2UKGgGaAloD0MIGO5cGOlBXkCUhpRSlGgVTegDaBZHQGrjCI+GGmF1fZQoaAZoCWgPQwhU46WbxBhDwJSGlFKUaBVN2AFoFkdAavuuloDgZXV9lChoBmgJaA9DCAlrY+yEk1xAlIaUUpRoFU3oA2gWR0BrT68vmHQAdX2UKGgGaAloD0MIhNkEGJanW8CUhpRSlGgVTWgDaBZHQGuYXos7MgV1fZQoaAZoCWgPQwgrTrUWZtxewJSGlFKUaBVNAgFoFkdAa6I9h7Vrh3V9lChoBmgJaA9DCPgb7bjhN0rAlIaUUpRoFUv7aBZHQGvCxxtHhCN1fZQoaAZoCWgPQwhvZB75g5pkQJSGlFKUaBVN6ANoFkdAbChriVB2OnV9lChoBmgJaA9DCCJxj6WP92RAlIaUUpRoFU3gAWgWR0BsRGK64Ds/dX2UKGgGaAloD0MI81meBzftcUCUhpRSlGgVTUQBaBZHQGxVWFvhqCZ1ZS4="
74
+ },
75
+ "ep_success_buffer": {
76
+ ":type:": "<class 'collections.deque'>",
77
+ ":serialized:": "gAWVIAAAAAAAAACMC2NvbGxlY3Rpb25zlIwFZGVxdWWUk5QpS2SGlFKULg=="
78
+ },
79
+ "_n_updates": 980,
80
+ "n_steps": 1024,
81
+ "gamma": 0.999,
82
+ "gae_lambda": 0.98,
83
+ "ent_coef": 0.01,
84
+ "vf_coef": 0.5,
85
+ "max_grad_norm": 0.5,
86
+ "batch_size": 64,
87
+ "n_epochs": 10,
88
+ "clip_range": {
89
+ ":type:": "<class 'function'>",
90
+ ":serialized:": "gAWVwwIAAAAAAACMF2Nsb3VkcGlja2xlLmNsb3VkcGlja2xllIwOX21ha2VfZnVuY3Rpb26Uk5QoaACMDV9idWlsdGluX3R5cGWUk5SMCENvZGVUeXBllIWUUpQoSwFLAEsASwFLAUsTQwSIAFMAlE6FlCmMAV+UhZSMSC91c3IvbG9jYWwvbGliL3B5dGhvbjMuOS9kaXN0LXBhY2thZ2VzL3N0YWJsZV9iYXNlbGluZXMzL2NvbW1vbi91dGlscy5weZSMBGZ1bmOUS4JDAgABlIwDdmFslIWUKXSUUpR9lCiMC19fcGFja2FnZV9flIwYc3RhYmxlX2Jhc2VsaW5lczMuY29tbW9ulIwIX19uYW1lX1+UjB5zdGFibGVfYmFzZWxpbmVzMy5jb21tb24udXRpbHOUjAhfX2ZpbGVfX5SMSC91c3IvbG9jYWwvbGliL3B5dGhvbjMuOS9kaXN0LXBhY2thZ2VzL3N0YWJsZV9iYXNlbGluZXMzL2NvbW1vbi91dGlscy5weZR1Tk5oAIwQX21ha2VfZW1wdHlfY2VsbJSTlClSlIWUdJRSlIwcY2xvdWRwaWNrbGUuY2xvdWRwaWNrbGVfZmFzdJSMEl9mdW5jdGlvbl9zZXRzdGF0ZZSTlGgffZR9lChoFmgNjAxfX3F1YWxuYW1lX1+UjBljb25zdGFudF9mbi48bG9jYWxzPi5mdW5jlIwPX19hbm5vdGF0aW9uc19flH2UjA5fX2t3ZGVmYXVsdHNfX5ROjAxfX2RlZmF1bHRzX1+UTowKX19tb2R1bGVfX5RoF4wHX19kb2NfX5ROjAtfX2Nsb3N1cmVfX5RoAIwKX21ha2VfY2VsbJSTlEc/yZmZmZmZmoWUUpSFlIwXX2Nsb3VkcGlja2xlX3N1Ym1vZHVsZXOUXZSMC19fZ2xvYmFsc19flH2UdYaUhlIwLg=="
91
+ },
92
+ "clip_range_vf": null,
93
+ "normalize_advantage": true,
94
+ "target_kl": null
95
+ }
ppo-LunarLander-v2_1/policy.optimizer.pth ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:80cafaf39c7cfede6b990f781df90a7ffcab5596540e2e002fd0e08d3275d3b5
3
+ size 87545
ppo-LunarLander-v2_1/policy.pth ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:dc720cfb7141cc07c6c228faef75c3041891a17eb4927161df7021dff42fce3d
3
+ size 43265
ppo-LunarLander-v2_1/pytorch_variables.pth ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d030ad8db708280fcae77d87e973102039acd23a11bdecc3db8eb6c0ac940ee1
3
+ size 431
ppo-LunarLander-v2_1/system_info.txt ADDED
@@ -0,0 +1,7 @@
 
 
 
 
 
 
 
 
1
+ - OS: Linux-5.10.147+-x86_64-with-glibc2.31 # 1 SMP Sat Dec 10 16:00:40 UTC 2022
2
+ - Python: 3.9.16
3
+ - Stable-Baselines3: 1.7.0
4
+ - PyTorch: 1.13.1+cu116
5
+ - GPU Enabled: False
6
+ - Numpy: 1.22.4
7
+ - Gym: 0.21.0
replay.mp4 CHANGED
Binary files a/replay.mp4 and b/replay.mp4 differ
 
results.json CHANGED
@@ -1 +1 @@
1
- {"mean_reward": -311.7473829105496, "std_reward": 143.83528969072057, "is_deterministic": true, "n_eval_episodes": 10, "eval_datetime": "2023-03-21T14:18:04.141235"}
 
1
+ {"mean_reward": -47.08261518846532, "std_reward": 134.67678425843607, "is_deterministic": true, "n_eval_episodes": 10, "eval_datetime": "2023-03-21T14:27:57.098334"}