deanvanaswegen commited on
Commit
0a4b465
·
1 Parent(s): 115f90d

Upload PPO LunarLander-v2 trained agent

Browse files
README.md CHANGED
@@ -16,7 +16,7 @@ model-index:
16
  type: LunarLander-v2
17
  metrics:
18
  - type: mean_reward
19
- value: 227.59 +/- 33.91
20
  name: mean_reward
21
  verified: false
22
  ---
 
16
  type: LunarLander-v2
17
  metrics:
18
  - type: mean_reward
19
+ value: 270.37 +/- 17.72
20
  name: mean_reward
21
  verified: false
22
  ---
config.json CHANGED
@@ -1 +1 @@
1
- {"policy_class": {":type:": "<class 'abc.ABCMeta'>", ":serialized:": "gAWVOwAAAAAAAACMIXN0YWJsZV9iYXNlbGluZXMzLmNvbW1vbi5wb2xpY2llc5SMEUFjdG9yQ3JpdGljUG9saWN5lJOULg==", "__module__": "stable_baselines3.common.policies", "__doc__": "\n Policy class for actor-critic algorithms (has both policy and value prediction).\n Used by A2C, PPO and the likes.\n\n :param observation_space: Observation space\n :param action_space: Action space\n :param lr_schedule: Learning rate schedule (could be constant)\n :param net_arch: The specification of the policy and value networks.\n :param activation_fn: Activation function\n :param ortho_init: Whether to use or not orthogonal initialization\n :param use_sde: Whether to use State Dependent Exploration or not\n :param log_std_init: Initial value for the log standard deviation\n :param full_std: Whether to use (n_features x n_actions) parameters\n for the std instead of only (n_features,) when using gSDE\n :param sde_net_arch: Network architecture for extracting features\n when using gSDE. If None, the latent features from the policy will be used.\n Pass an empty list to use the states as features.\n :param use_expln: Use ``expln()`` function instead of ``exp()`` to ensure\n a positive standard deviation (cf paper). It allows to keep variance\n above zero and prevent it from growing too fast. In practice, ``exp()`` is usually enough.\n :param squash_output: Whether to squash the output using a tanh function,\n this allows to ensure boundaries when using gSDE.\n :param features_extractor_class: Features extractor to use.\n :param features_extractor_kwargs: Keyword arguments\n to pass to the features extractor.\n :param normalize_images: Whether to normalize images or not,\n dividing by 255.0 (True by default)\n :param optimizer_class: The optimizer to use,\n ``th.optim.Adam`` by default\n :param optimizer_kwargs: Additional keyword arguments,\n excluding the learning rate, to pass to the optimizer\n ", "__init__": "<function ActorCriticPolicy.__init__ at 0x7f9eacc9aee0>", "_get_constructor_parameters": "<function ActorCriticPolicy._get_constructor_parameters at 0x7f9eacc9af70>", "reset_noise": "<function ActorCriticPolicy.reset_noise at 0x7f9eacc9e040>", "_build_mlp_extractor": "<function ActorCriticPolicy._build_mlp_extractor at 0x7f9eacc9e0d0>", "_build": "<function ActorCriticPolicy._build at 0x7f9eacc9e160>", "forward": "<function ActorCriticPolicy.forward at 0x7f9eacc9e1f0>", "_get_action_dist_from_latent": "<function ActorCriticPolicy._get_action_dist_from_latent at 0x7f9eacc9e280>", "_predict": "<function ActorCriticPolicy._predict at 0x7f9eacc9e310>", "evaluate_actions": "<function ActorCriticPolicy.evaluate_actions at 0x7f9eacc9e3a0>", "get_distribution": "<function ActorCriticPolicy.get_distribution at 0x7f9eacc9e430>", "predict_values": "<function ActorCriticPolicy.predict_values at 0x7f9eacc9e4c0>", "__abstractmethods__": "frozenset()", "_abc_impl": "<_abc_data object at 0x7f9eacc94f00>"}, "verbose": 1, "policy_kwargs": {}, "observation_space": {":type:": "<class 'gym.spaces.box.Box'>", ":serialized:": "gAWVnwEAAAAAAACMDmd5bS5zcGFjZXMuYm94lIwDQm94lJOUKYGUfZQojAVkdHlwZZSMBW51bXB5lGgFk5SMAmY0lImIh5RSlChLA4wBPJROTk5K/////0r/////SwB0lGKMBl9zaGFwZZRLCIWUjANsb3eUjBJudW1weS5jb3JlLm51bWVyaWOUjAtfZnJvbWJ1ZmZlcpSTlCiWIAAAAAAAAAAAAID/AACA/wAAgP8AAID/AACA/wAAgP8AAID/AACA/5RoCksIhZSMAUOUdJRSlIwEaGlnaJRoEiiWIAAAAAAAAAAAAIB/AACAfwAAgH8AAIB/AACAfwAAgH8AAIB/AACAf5RoCksIhZRoFXSUUpSMDWJvdW5kZWRfYmVsb3eUaBIolggAAAAAAAAAAAAAAAAAAACUaAeMAmIxlImIh5RSlChLA4wBfJROTk5K/////0r/////SwB0lGJLCIWUaBV0lFKUjA1ib3VuZGVkX2Fib3ZllGgSKJYIAAAAAAAAAAAAAAAAAAAAlGghSwiFlGgVdJRSlIwKX25wX3JhbmRvbZROdWIu", "dtype": "float32", "_shape": [8], "low": "[-inf -inf -inf -inf -inf -inf -inf -inf]", "high": "[inf inf inf inf inf inf inf inf]", "bounded_below": "[False False False False False False False False]", "bounded_above": "[False False False False False False False False]", "_np_random": null}, "action_space": {":type:": "<class 'gym.spaces.discrete.Discrete'>", ":serialized:": "gAWVggAAAAAAAACME2d5bS5zcGFjZXMuZGlzY3JldGWUjAhEaXNjcmV0ZZSTlCmBlH2UKIwBbpRLBIwGX3NoYXBllCmMBWR0eXBllIwFbnVtcHmUaAeTlIwCaTiUiYiHlFKUKEsDjAE8lE5OTkr/////Sv////9LAHSUYowKX25wX3JhbmRvbZROdWIu", "n": 4, "_shape": [], "dtype": "int64", "_np_random": null}, "n_envs": 32, "num_timesteps": 1048576, "_total_timesteps": 1000000, "_num_timesteps_at_start": 0, "seed": null, "action_noise": null, "start_time": 1671807920230630791, "learning_rate": 0.0003, "tensorboard_log": null, "lr_schedule": {":type:": "<class 'function'>", ":serialized:": "gAWVwwIAAAAAAACMF2Nsb3VkcGlja2xlLmNsb3VkcGlja2xllIwOX21ha2VfZnVuY3Rpb26Uk5QoaACMDV9idWlsdGluX3R5cGWUk5SMCENvZGVUeXBllIWUUpQoSwFLAEsASwFLAUsTQwSIAFMAlE6FlCmMAV+UhZSMSC91c3IvbG9jYWwvbGliL3B5dGhvbjMuOC9kaXN0LXBhY2thZ2VzL3N0YWJsZV9iYXNlbGluZXMzL2NvbW1vbi91dGlscy5weZSMBGZ1bmOUS4BDAgABlIwDdmFslIWUKXSUUpR9lCiMC19fcGFja2FnZV9flIwYc3RhYmxlX2Jhc2VsaW5lczMuY29tbW9ulIwIX19uYW1lX1+UjB5zdGFibGVfYmFzZWxpbmVzMy5jb21tb24udXRpbHOUjAhfX2ZpbGVfX5SMSC91c3IvbG9jYWwvbGliL3B5dGhvbjMuOC9kaXN0LXBhY2thZ2VzL3N0YWJsZV9iYXNlbGluZXMzL2NvbW1vbi91dGlscy5weZR1Tk5oAIwQX21ha2VfZW1wdHlfY2VsbJSTlClSlIWUdJRSlIwcY2xvdWRwaWNrbGUuY2xvdWRwaWNrbGVfZmFzdJSMEl9mdW5jdGlvbl9zZXRzdGF0ZZSTlGgffZR9lChoFmgNjAxfX3F1YWxuYW1lX1+UjBljb25zdGFudF9mbi48bG9jYWxzPi5mdW5jlIwPX19hbm5vdGF0aW9uc19flH2UjA5fX2t3ZGVmYXVsdHNfX5ROjAxfX2RlZmF1bHRzX1+UTowKX19tb2R1bGVfX5RoF4wHX19kb2NfX5ROjAtfX2Nsb3N1cmVfX5RoAIwKX21ha2VfY2VsbJSTlEc/M6kqMFUyYYWUUpSFlIwXX2Nsb3VkcGlja2xlX3N1Ym1vZHVsZXOUXZSMC19fZ2xvYmFsc19flH2UdYaUhlIwLg=="}, "_last_obs": {":type:": "<class 'numpy.ndarray'>", ":serialized:": "gAWVdQQAAAAAAACMEm51bXB5LmNvcmUubnVtZXJpY5SMC19mcm9tYnVmZmVylJOUKJYABAAAAAAAAPqjLL7sL6W7v6m8OTQQETec0vs8CgrfuAAAgD8AAIA/mpF0PVzLFrpGEN+4zatbNRBOW7gzNAA4AACAPwAAgD/gg6Y+SUwHPU4N6rl93we4+5wXPhJ5IzkAAIA/AACAP2bgZ73tGww+5VlnPnocOL7Zfao9QWYmPQAAAAAAAAAApvQcvlKFr7sXpzc7MXPROJgWHT3ypme6AACAPwAAgD9ANU8+PtyTP2su+D4B2Yi+E4EqPgrh9TwAAAAAAAAAAGYvzbwO3W0/Kb0evXfkub7Qhxu9DToqvQAAAAAAAAAAzeyZvER9vj+2K0y+ea6MPsLbCjyEWrq8AAAAAAAAAAAzyWI+lId6PkE5x70xnkG9KXolvWCpW70AAAAAAAAAAA1Pz70UvNi69UaQvBEPL72Zlau7/tUYvgAAAAAAAIA/JqScPeGam7jzpmu7zp8pOPSiijvNiBE5AACAPwAAgD8A9m48QAy3P02Y9D5E5IM+TgIgvP8DjrwAAAAAAAAAAGbewjvDKTm6Spuiu5L/CDeVx6C6Njl3tgAAgD8AAIA/s6R9PY+GfbqFujU6I3WENSVLQDvlWlK5AACAPwAAgD9Thzc+GyGpvFBPGDrSlmC4J4MVvk3cTrkAAIA/AACAP+Y4MT0UDrs5fVCEOYlhxjOSvNa7K4OguAAAgD8AAIA/WoELPsO6Ijsi7f26UTQouJzq4zzJeRs6AACAPwAAgD/N/JO8Kfg2usMMzjrNDyQ2NanMuqa58LkAAIA/AACAP/PMsb3DuSe64tQMuUZ2l7W2vqE69dUjOAAAgD8AAIA/Jv03PkghzTn7FyU5rmnMNS5xUzyeUTy4AACAPwAAgD8Nbok9SCeBuiKAvDrJSX01Xs7uOe1E2bkAAIA/AACAP6aV9r2um8a6bWTtPaxmTL17W2476+rdvAAAgD8AAIA/s4FqPuSCFzypXoU7pINdOUnboT2EApq6AACAPwAAgD+a7de8FKKMul39YTpqTpo2fs01OygdgLkAAIA/AACAP+bXHb2Fa4u58s+mPDmZ5TxWsiQ7Pd9sPAAAgD8AAIA/848ovo8KYLzVHCk6ZRgSOJ31xz2GkVS5AACAPwAAgD+A9Lc+mH21Pgk4xrxBt06+MAkrvH5EPb0AAAAAAAAAAA1+Qb49QE27jKugOYEZuDZ3vbs8hj2/uAAAgD8AAIA/GhN1vVLIirnGOJI5WubHNKnLIjvO6Km4AACAPwAAgD/mEj+99qwpurJ8uLskADI4YTkcOkAEbzcAAIA/AACAP3DHXr7hEv05PkUaOkHnkLbWiTu8UnEzuQAAgD8AAIA/k45NPiphhj+qWew9f+SvvlJwrj3d2gM7AAAAAAAAAACUjAVudW1weZSMBWR0eXBllJOUjAJmNJSJiIeUUpQoSwOMATyUTk5OSv////9K/////0sAdJRiSyBLCIaUjAFDlHSUUpQu"}, "_last_episode_starts": {":type:": "<class 'numpy.ndarray'>", ":serialized:": "gAWVkwAAAAAAAACMEm51bXB5LmNvcmUubnVtZXJpY5SMC19mcm9tYnVmZmVylJOUKJYgAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAlIwFbnVtcHmUjAVkdHlwZZSTlIwCYjGUiYiHlFKUKEsDjAF8lE5OTkr/////Sv////9LAHSUYksghZSMAUOUdJRSlC4="}, "_last_original_obs": null, "_episode_num": 0, "use_sde": false, "sde_sample_freq": -1, "_current_progress_remaining": -0.04857599999999995, "ep_info_buffer": {":type:": "<class 'collections.deque'>", ":serialized:": "gAWVfxAAAAAAAACMC2NvbGxlY3Rpb25zlIwFZGVxdWWUk5QpS2SGlFKUKH2UKIwBcpSMFW51bXB5LmNvcmUubXVsdGlhcnJheZSMBnNjYWxhcpSTlIwFbnVtcHmUjAVkdHlwZZSTlIwCZjiUiYiHlFKUKEsDjAE8lE5OTkr/////Sv////9LAHSUYkMIQ8cOKvHaYECUhpRSlIwBbJRN6AOMAXSUR0CYQ8YKpkwwdX2UKGgGaAloD0MI08H6P4fIXUCUhpRSlGgVTegDaBZHQJhFigPEsJ91fZQoaAZoCWgPQwhh/gqZq3FiQJSGlFKUaBVN6ANoFkdAmEf2Ifr8i3V9lChoBmgJaA9DCPtcbcV+QmVAlIaUUpRoFU3eAmgWR0CYSLXLeQ+2dX2UKGgGaAloD0MIAB5RoTrGYUCUhpRSlGgVTegDaBZHQJhJbf/FR511fZQoaAZoCWgPQwgBFvn1Q25kQJSGlFKUaBVN6ANoFkdAmEv3erMkhXV9lChoBmgJaA9DCI7NjlTfvGNAlIaUUpRoFU3oA2gWR0CYTWHlfZ27dX2UKGgGaAloD0MIOuenOA7SXECUhpRSlGgVTegDaBZHQJhQGfVZs9B1fZQoaAZoCWgPQwhLrfcb7VAqQJSGlFKUaBVNCgFoFkdAmFShvvSc9XV9lChoBmgJaA9DCOKxn8VSHVxAlIaUUpRoFU3oA2gWR0CYVYCL/CIldX2UKGgGaAloD0MI7rH0oQu+ZECUhpRSlGgVTegDaBZHQJhWR77bcoJ1fZQoaAZoCWgPQwiZSj/h7OYeQJSGlFKUaBVL8GgWR0CYW1lhw2l3dX2UKGgGaAloD0MIoIhFDDvGYECUhpRSlGgVTegDaBZHQJhbW8VYZEV1fZQoaAZoCWgPQwjo2hfQC91ZQJSGlFKUaBVN6ANoFkdAmF1Wv4dp7HV9lChoBmgJaA9DCMAjKlQ3AWZAlIaUUpRoFU3oA2gWR0CYX/klNUOvdX2UKGgGaAloD0MI+Ppal5r8YUCUhpRSlGgVTegDaBZHQJhi+a6STyJ1fZQoaAZoCWgPQwgAVHHjlrllQJSGlFKUaBVN6ANoFkdAmHDbxqfvnnV9lChoBmgJaA9DCBvXv+uzR2NAlIaUUpRoFU3oA2gWR0CYfRPk7wKCdX2UKGgGaAloD0MIMBAEyNCSZUCUhpRSlGgVTegDaBZHQJiBB05lvqF1fZQoaAZoCWgPQwiKIM7DCawYwJSGlFKUaBVNEQFoFkdAmIQVCHARCnV9lChoBmgJaA9DCHWPbK4avWNAlIaUUpRoFU3oA2gWR0CYhFcEeQuFdX2UKGgGaAloD0MIpFLsaBy0YECUhpRSlGgVTegDaBZHQJiE8/iYLLJ1fZQoaAZoCWgPQwhfYFYo0g1jQJSGlFKUaBVN6ANoFkdAmIZtb5dnkHV9lChoBmgJaA9DCCXJc30flmBAlIaUUpRoFU3oA2gWR0CYjXLq2SdOdX2UKGgGaAloD0MInmFqS51aYkCUhpRSlGgVTegDaBZHQJiVmvbGm1p1fZQoaAZoCWgPQwgucHmsGfBiQJSGlFKUaBVN6ANoFkdAmJf9vfj0c3V9lChoBmgJaA9DCJoF2h3S2mNAlIaUUpRoFU3oA2gWR0CZg4rFOwgUdX2UKGgGaAloD0MIDjLJyNlkbkCUhpRSlGgVTSQCaBZHQJmHJp8F6iV1fZQoaAZoCWgPQwhPz7uxoCpOQJSGlFKUaBVN6ANoFkdAmYmY+wC8vnV9lChoBmgJaA9DCBX/d0SFvV1AlIaUUpRoFU3oA2gWR0CZkX9hJAdGdX2UKGgGaAloD0MIjQ3d7A+7XECUhpRSlGgVTegDaBZHQJmSXIzWPLh1fZQoaAZoCWgPQwhVNNb+TnxhQJSGlFKUaBVN6ANoFkdAmZPN2gWadHV9lChoBmgJaA9DCL/Rjht+q1tAlIaUUpRoFU3oA2gWR0CZmNIre67NdX2UKGgGaAloD0MIvYv343ara0CUhpRSlGgVTakDaBZHQJmaptpEhJR1fZQoaAZoCWgPQwi6oSk7/ZRiQJSGlFKUaBVN6ANoFkdAmZyGL9/BnHV9lChoBmgJaA9DCPjgtUubVGFAlIaUUpRoFU3oA2gWR0CZncwt8NQTdX2UKGgGaAloD0MIZXCUvDqDYUCUhpRSlGgVTegDaBZHQJmfxDw6QvJ1fZQoaAZoCWgPQwhuT5DY7mtlQJSGlFKUaBVN6ANoFkdAmaNPEGZ/kXV9lChoBmgJaA9DCFJlGHeD3lpAlIaUUpRoFU3oA2gWR0CZpCGHpKSQdX2UKGgGaAloD0MIntLB+j/5YkCUhpRSlGgVTegDaBZHQJmnEllbu+h1fZQoaAZoCWgPQwi9yAT8Gv5eQJSGlFKUaBVN6ANoFkdAmaiaFIuoP3V9lChoBmgJaA9DCNyCpbqAFV5AlIaUUpRoFU3oA2gWR0CZq5LvkRzzdX2UKGgGaAloD0MIz9iXbDyaYECUhpRSlGgVTegDaBZHQJmwc9C/oJR1fZQoaAZoCWgPQwglOzYC8TRdQJSGlFKUaBVN6ANoFkdAmbFjrqt5lnV9lChoBmgJaA9DCKwfm+RHdGVAlIaUUpRoFU3oA2gWR0CZsgx9XtBwdX2UKGgGaAloD0MIdEF9yxxWbUCUhpRSlGgVTdECaBZHQJm1/XSSeRR1fZQoaAZoCWgPQwjByMuaWBlfQJSGlFKUaBVN6ANoFkdAmbcmPo3aSXV9lChoBmgJaA9DCF7b2y3JHF5AlIaUUpRoFU3oA2gWR0CZtyicoYvWdX2UKGgGaAloD0MImRJJ9LJbakCUhpRSlGgVTd4DaBZHQJm4AWTHKfZ1fZQoaAZoCWgPQwgYlGk0OcFgQJSGlFKUaBVN6ANoFkdAmc09RFZxJnV9lChoBmgJaA9DCOtwdJVuJW9AlIaUUpRoFU1eAWgWR0CZ0pKEFnqWdX2UKGgGaAloD0MIlgfpKXIALkCUhpRSlGgVTRQBaBZHQJnZYw482aV1fZQoaAZoCWgPQwhM/5JUJtlhQJSGlFKUaBVN6ANoFkdAmdvgfZElV3V9lChoBmgJaA9DCBRa1v1ji15AlIaUUpRoFU3oA2gWR0CZ3n/x2B8QdX2UKGgGaAloD0MIycuaWGBBZkCUhpRSlGgVTegDaBZHQJneuhtcfNl1fZQoaAZoCWgPQwhJ1uHoqotiQJSGlFKUaBVN6ANoFkdAmd9DpHI6sHV9lChoBmgJaA9DCI3xYfYyxWNAlIaUUpRoFU3oA2gWR0CZ4IDZUT+OdX2UKGgGaAloD0MIeQWiJ2VCY0CUhpRSlGgVTegDaBZHQJnmY6+36RB1fZQoaAZoCWgPQwgaTS7GwIlsQJSGlFKUaBVNZQJoFkdAmemxWPtD2XV9lChoBmgJaA9DCEdVE0RdzWpAlIaUUpRoFU3PA2gWR0CZ6oisny/cdX2UKGgGaAloD0MItOidCrg8XUCUhpRSlGgVTegDaBZHQJnvM3ZPEbZ1fZQoaAZoCWgPQwhZpl8i3sVfQJSGlFKUaBVN6ANoFkdAmf8BdpqREHV9lChoBmgJaA9DCBwj2SPUMF5AlIaUUpRoFU3oA2gWR0CaAiHDrJKbdX2UKGgGaAloD0MIqOFbWLfsakCUhpRSlGgVTVMDaBZHQJoC8cp9ZzR1fZQoaAZoCWgPQwjVJHhDGsNiQJSGlFKUaBVN6ANoFkdAmgQuHnEET3V9lChoBmgJaA9DCCMShZZ1NFxAlIaUUpRoFU3oA2gWR0CaCum8M/hVdX2UKGgGaAloD0MIGqN1VDWrVUCUhpRSlGgVTegDaBZHQJoLr9cbBGh1fZQoaAZoCWgPQwiCAYQPJYplQJSGlFKUaBVN6ANoFkdAmgz2X9itrHV9lChoBmgJaA9DCMpUwagkzW9AlIaUUpRoFU2zAWgWR0CaD5r8R+SbdX2UKGgGaAloD0MITDWzloKYZECUhpRSlGgVTegDaBZHQJoRJM+NcW11fZQoaAZoCWgPQwh07KAS1/hiQJSGlFKUaBVN6ANoFkdAmhK44hllLHV9lChoBmgJaA9DCPkwe9n2XWtAlIaUUpRoFU19AWgWR0CaE3OBUaQ4dX2UKGgGaAloD0MIUWnEzD4UY0CUhpRSlGgVTegDaBZHQJoVXNcGC7N1fZQoaAZoCWgPQwgJxOv6RWZwQJSGlFKUaBVNLgNoFkdAmhiqLXL/0nV9lChoBmgJaA9DCOqURzfCJVhAlIaUUpRoFU3oA2gWR0CaGiokRjBmdX2UKGgGaAloD0MINxd/2xNdXUCUhpRSlGgVTegDaBZHQJoa2plz2ex1fZQoaAZoCWgPQwi+Ly5V6UdlQJSGlFKUaBVN6ANoFkdAmh00s8PnS3V9lChoBmgJaA9DCIGYhAt5OmBAlIaUUpRoFU3oA2gWR0CaIRU8FINFdX2UKGgGaAloD0MIgEV+/RBdZECUhpRSlGgVTegDaBZHQJoli0x/NJR1fZQoaAZoCWgPQwj76T9r/q5jQJSGlFKUaBVN6ANoFkdAmiZEqUeMh3V9lChoBmgJaA9DCMwHBDoTWGRAlIaUUpRoFU3oA2gWR0CaJthCdBjXdX2UKGgGaAloD0MInkXvVMAGYUCUhpRSlGgVTegDaBZHQJoqcPoV2zR1fZQoaAZoCWgPQwgSE9TwLVVeQJSGlFKUaBVN6ANoFkdAmixYChew93V9lChoBmgJaA9DCEbtfhXg9W9AlIaUUpRoFU1NAWgWR0CaMjNI9TxYdX2UKGgGaAloD0MI2Lj+XZ+zYECUhpRSlGgVTegDaBZHQJpAyjCYTkB1fZQoaAZoCWgPQwiKc9TR8UljQJSGlFKUaBVN6ANoFkdAmkXg1BMSK3V9lChoBmgJaA9DCBCU2/Y9y1ZAlIaUUpRoFU3oA2gWR0CaTKDdxhlUdX2UKGgGaAloD0MId/hrskYXb0CUhpRSlGgVTc4DaBZHQJpQf5ylvZR1fZQoaAZoCWgPQwhaZaa0/mxaQJSGlFKUaBVN6ANoFkdAmlGh/3Fkx3V9lChoBmgJaA9DCM8UOq+xj2VAlIaUUpRoFU3oA2gWR0CaUdoTfzjFdX2UKGgGaAloD0MImYBfI0nCZ0CUhpRSlGgVTegDaBZHQJpSV13dKul1fZQoaAZoCWgPQwg/jXvzm5tuQJSGlFKUaBVNEwJoFkdAmlc9Wp6yB3V9lChoBmgJaA9DCMUB9Pv+I2NAlIaUUpRoFU3oA2gWR0CaXJPBi1ArdX2UKGgGaAloD0MIsiyY+KOQYUCUhpRSlGgVTegDaBZHQJpdW6MBIWh1fZQoaAZoCWgPQwj2tS41wulkQJSGlFKUaBVN6ANoFkdAmmIatPpIMHV9lChoBmgJaA9DCGIQWDm0fDpAlIaUUpRoFUvsaBZHQJps0PTXrdF1fZQoaAZoCWgPQwi86gHzkJkoQJSGlFKUaBVNHAFoFkdAmm2/8uSOinV9lChoBmgJaA9DCKmj42rkNWVAlIaUUpRoFU3oA2gWR0Cacds41gpjdX2UKGgGaAloD0MIhUTaxp++YkCUhpRSlGgVTegDaBZHQJp07YbsF+x1fZQoaAZoCWgPQwjjFvNzQ31jQJSGlFKUaBVN6ANoFkdAmnWfgNwzcnVlLg=="}, "ep_success_buffer": {":type:": "<class 'collections.deque'>", ":serialized:": "gAWVIAAAAAAAAACMC2NvbGxlY3Rpb25zlIwFZGVxdWWUk5QpS2SGlFKULg=="}, "_n_updates": 160, "n_steps": 2048, "gamma": 0.99, "gae_lambda": 0.95, "ent_coef": 0.0, "vf_coef": 0.5, "max_grad_norm": 0.5, "batch_size": 64, "n_epochs": 10, "clip_range": {":type:": "<class 'function'>", ":serialized:": "gAWVwwIAAAAAAACMF2Nsb3VkcGlja2xlLmNsb3VkcGlja2xllIwOX21ha2VfZnVuY3Rpb26Uk5QoaACMDV9idWlsdGluX3R5cGWUk5SMCENvZGVUeXBllIWUUpQoSwFLAEsASwFLAUsTQwSIAFMAlE6FlCmMAV+UhZSMSC91c3IvbG9jYWwvbGliL3B5dGhvbjMuOC9kaXN0LXBhY2thZ2VzL3N0YWJsZV9iYXNlbGluZXMzL2NvbW1vbi91dGlscy5weZSMBGZ1bmOUS4BDAgABlIwDdmFslIWUKXSUUpR9lCiMC19fcGFja2FnZV9flIwYc3RhYmxlX2Jhc2VsaW5lczMuY29tbW9ulIwIX19uYW1lX1+UjB5zdGFibGVfYmFzZWxpbmVzMy5jb21tb24udXRpbHOUjAhfX2ZpbGVfX5SMSC91c3IvbG9jYWwvbGliL3B5dGhvbjMuOC9kaXN0LXBhY2thZ2VzL3N0YWJsZV9iYXNlbGluZXMzL2NvbW1vbi91dGlscy5weZR1Tk5oAIwQX21ha2VfZW1wdHlfY2VsbJSTlClSlIWUdJRSlIwcY2xvdWRwaWNrbGUuY2xvdWRwaWNrbGVfZmFzdJSMEl9mdW5jdGlvbl9zZXRzdGF0ZZSTlGgffZR9lChoFmgNjAxfX3F1YWxuYW1lX1+UjBljb25zdGFudF9mbi48bG9jYWxzPi5mdW5jlIwPX19hbm5vdGF0aW9uc19flH2UjA5fX2t3ZGVmYXVsdHNfX5ROjAxfX2RlZmF1bHRzX1+UTowKX19tb2R1bGVfX5RoF4wHX19kb2NfX5ROjAtfX2Nsb3N1cmVfX5RoAIwKX21ha2VfY2VsbJSTlEc/yZmZmZmZmoWUUpSFlIwXX2Nsb3VkcGlja2xlX3N1Ym1vZHVsZXOUXZSMC19fZ2xvYmFsc19flH2UdYaUhlIwLg=="}, "clip_range_vf": null, "normalize_advantage": true, "target_kl": null, "system_info": {"OS": "Linux-5.10.133+-x86_64-with-glibc2.27 #1 SMP Fri Aug 26 08:44:51 UTC 2022", "Python": "3.8.16", "Stable-Baselines3": "1.6.2", "PyTorch": "1.13.0+cu116", "GPU Enabled": "True", "Numpy": "1.21.6", "Gym": "0.21.0"}}
 
1
+ {"policy_class": {":type:": "<class 'abc.ABCMeta'>", ":serialized:": "gAWVOwAAAAAAAACMIXN0YWJsZV9iYXNlbGluZXMzLmNvbW1vbi5wb2xpY2llc5SMEUFjdG9yQ3JpdGljUG9saWN5lJOULg==", "__module__": "stable_baselines3.common.policies", "__doc__": "\n Policy class for actor-critic algorithms (has both policy and value prediction).\n Used by A2C, PPO and the likes.\n\n :param observation_space: Observation space\n :param action_space: Action space\n :param lr_schedule: Learning rate schedule (could be constant)\n :param net_arch: The specification of the policy and value networks.\n :param activation_fn: Activation function\n :param ortho_init: Whether to use or not orthogonal initialization\n :param use_sde: Whether to use State Dependent Exploration or not\n :param log_std_init: Initial value for the log standard deviation\n :param full_std: Whether to use (n_features x n_actions) parameters\n for the std instead of only (n_features,) when using gSDE\n :param sde_net_arch: Network architecture for extracting features\n when using gSDE. If None, the latent features from the policy will be used.\n Pass an empty list to use the states as features.\n :param use_expln: Use ``expln()`` function instead of ``exp()`` to ensure\n a positive standard deviation (cf paper). It allows to keep variance\n above zero and prevent it from growing too fast. In practice, ``exp()`` is usually enough.\n :param squash_output: Whether to squash the output using a tanh function,\n this allows to ensure boundaries when using gSDE.\n :param features_extractor_class: Features extractor to use.\n :param features_extractor_kwargs: Keyword arguments\n to pass to the features extractor.\n :param normalize_images: Whether to normalize images or not,\n dividing by 255.0 (True by default)\n :param optimizer_class: The optimizer to use,\n ``th.optim.Adam`` by default\n :param optimizer_kwargs: Additional keyword arguments,\n excluding the learning rate, to pass to the optimizer\n ", "__init__": "<function ActorCriticPolicy.__init__ at 0x7f021a647ca0>", "_get_constructor_parameters": "<function ActorCriticPolicy._get_constructor_parameters at 0x7f021a647d30>", "reset_noise": "<function ActorCriticPolicy.reset_noise at 0x7f021a647dc0>", "_build_mlp_extractor": "<function ActorCriticPolicy._build_mlp_extractor at 0x7f021a647e50>", "_build": "<function ActorCriticPolicy._build at 0x7f021a647ee0>", "forward": "<function ActorCriticPolicy.forward at 0x7f021a647f70>", "_get_action_dist_from_latent": "<function ActorCriticPolicy._get_action_dist_from_latent at 0x7f021a64b040>", "_predict": "<function ActorCriticPolicy._predict at 0x7f021a64b0d0>", "evaluate_actions": "<function ActorCriticPolicy.evaluate_actions at 0x7f021a64b160>", "get_distribution": "<function ActorCriticPolicy.get_distribution at 0x7f021a64b1f0>", "predict_values": "<function ActorCriticPolicy.predict_values at 0x7f021a64b280>", "__abstractmethods__": "frozenset()", "_abc_impl": "<_abc_data object at 0x7f021a644570>"}, "verbose": 1, "policy_kwargs": {}, "observation_space": {":type:": "<class 'gym.spaces.box.Box'>", ":serialized:": "gAWVnwEAAAAAAACMDmd5bS5zcGFjZXMuYm94lIwDQm94lJOUKYGUfZQojAVkdHlwZZSMBW51bXB5lGgFk5SMAmY0lImIh5RSlChLA4wBPJROTk5K/////0r/////SwB0lGKMBl9zaGFwZZRLCIWUjANsb3eUjBJudW1weS5jb3JlLm51bWVyaWOUjAtfZnJvbWJ1ZmZlcpSTlCiWIAAAAAAAAAAAAID/AACA/wAAgP8AAID/AACA/wAAgP8AAID/AACA/5RoCksIhZSMAUOUdJRSlIwEaGlnaJRoEiiWIAAAAAAAAAAAAIB/AACAfwAAgH8AAIB/AACAfwAAgH8AAIB/AACAf5RoCksIhZRoFXSUUpSMDWJvdW5kZWRfYmVsb3eUaBIolggAAAAAAAAAAAAAAAAAAACUaAeMAmIxlImIh5RSlChLA4wBfJROTk5K/////0r/////SwB0lGJLCIWUaBV0lFKUjA1ib3VuZGVkX2Fib3ZllGgSKJYIAAAAAAAAAAAAAAAAAAAAlGghSwiFlGgVdJRSlIwKX25wX3JhbmRvbZROdWIu", "dtype": "float32", "_shape": [8], "low": "[-inf -inf -inf -inf -inf -inf -inf -inf]", "high": "[inf inf inf inf inf inf inf inf]", "bounded_below": "[False False False False False False False False]", "bounded_above": "[False False False False False False False False]", "_np_random": null}, "action_space": {":type:": "<class 'gym.spaces.discrete.Discrete'>", ":serialized:": "gAWVggAAAAAAAACME2d5bS5zcGFjZXMuZGlzY3JldGWUjAhEaXNjcmV0ZZSTlCmBlH2UKIwBbpRLBIwGX3NoYXBllCmMBWR0eXBllIwFbnVtcHmUaAeTlIwCaTiUiYiHlFKUKEsDjAE8lE5OTkr/////Sv////9LAHSUYowKX25wX3JhbmRvbZROdWIu", "n": 4, "_shape": [], "dtype": "int64", "_np_random": null}, "n_envs": 10, "num_timesteps": 102400, "_total_timesteps": 100000, "_num_timesteps_at_start": 0, "seed": null, "action_noise": null, "start_time": 1671871118506073747, "learning_rate": 0.0003, "tensorboard_log": null, "lr_schedule": {":type:": "<class 'function'>", ":serialized:": "gAWVwwIAAAAAAACMF2Nsb3VkcGlja2xlLmNsb3VkcGlja2xllIwOX21ha2VfZnVuY3Rpb26Uk5QoaACMDV9idWlsdGluX3R5cGWUk5SMCENvZGVUeXBllIWUUpQoSwFLAEsASwFLAUsTQwSIAFMAlE6FlCmMAV+UhZSMSC91c3IvbG9jYWwvbGliL3B5dGhvbjMuOC9kaXN0LXBhY2thZ2VzL3N0YWJsZV9iYXNlbGluZXMzL2NvbW1vbi91dGlscy5weZSMBGZ1bmOUS4BDAgABlIwDdmFslIWUKXSUUpR9lCiMC19fcGFja2FnZV9flIwYc3RhYmxlX2Jhc2VsaW5lczMuY29tbW9ulIwIX19uYW1lX1+UjB5zdGFibGVfYmFzZWxpbmVzMy5jb21tb24udXRpbHOUjAhfX2ZpbGVfX5SMSC91c3IvbG9jYWwvbGliL3B5dGhvbjMuOC9kaXN0LXBhY2thZ2VzL3N0YWJsZV9iYXNlbGluZXMzL2NvbW1vbi91dGlscy5weZR1Tk5oAIwQX21ha2VfZW1wdHlfY2VsbJSTlClSlIWUdJRSlIwcY2xvdWRwaWNrbGUuY2xvdWRwaWNrbGVfZmFzdJSMEl9mdW5jdGlvbl9zZXRzdGF0ZZSTlGgffZR9lChoFmgNjAxfX3F1YWxuYW1lX1+UjBljb25zdGFudF9mbi48bG9jYWxzPi5mdW5jlIwPX19hbm5vdGF0aW9uc19flH2UjA5fX2t3ZGVmYXVsdHNfX5ROjAxfX2RlZmF1bHRzX1+UTowKX19tb2R1bGVfX5RoF4wHX19kb2NfX5ROjAtfX2Nsb3N1cmVfX5RoAIwKX21ha2VfY2VsbJSTlEc/M6kqMFUyYYWUUpSFlIwXX2Nsb3VkcGlja2xlX3N1Ym1vZHVsZXOUXZSMC19fZ2xvYmFsc19flH2UdYaUhlIwLg=="}, "_last_obs": {":type:": "<class 'numpy.ndarray'>", ":serialized:": "gAWVtQEAAAAAAACMEm51bXB5LmNvcmUubnVtZXJpY5SMC19mcm9tYnVmZmVylJOUKJZAAQAAAAAAAGZ27DtekbU/qx07PxByrD4K5Ai8zIkpvgAAAAAAAAAAzYKrPF7otD+a6zE/onchPDimlLzMtau9AAAAAAAAAAAAAD+9uN+iu9ZJ/j1Q4BA9ChjfvJvC8D0AAIA/AACAP/OcLL7TCgU/axR5PW6TDb+9j1a+k6TuPQAAAAAAAAAAGpX2PVPsHz9aUZk8sfIiv4A0GD5u3c+5AAAAAAAAAADa2549NPOIPQ/rgb4zTIi+RtJSvVitnL0AAAAAAAAAAOONmj6jBRE/pTpqvvBKC7/qMnw+68d0vgAAAAAAAAAA0xwdvo8uP7wW1+86BT4zOf1trz3Prkm6AACAPwAAgD8FcI++P0cHPxbu5ruLFgi/t5DavpIOpT0AAAAAAAAAAJpdfzw4AZ672vgoviD9xbwdljI9+mWuvgAAAAAAAIA/lIwFbnVtcHmUjAVkdHlwZZSTlIwCZjSUiYiHlFKUKEsDjAE8lE5OTkr/////Sv////9LAHSUYksKSwiGlIwBQ5R0lFKULg=="}, "_last_episode_starts": {":type:": "<class 'numpy.ndarray'>", ":serialized:": "gAWVfQAAAAAAAACMEm51bXB5LmNvcmUubnVtZXJpY5SMC19mcm9tYnVmZmVylJOUKJYKAAAAAAAAAAEAAAAAAAAAAACUjAVudW1weZSMBWR0eXBllJOUjAJiMZSJiIeUUpQoSwOMAXyUTk5OSv////9K/////0sAdJRiSwqFlIwBQ5R0lFKULg=="}, "_last_original_obs": null, "_episode_num": 0, "use_sde": false, "sde_sample_freq": -1, "_current_progress_remaining": -0.02400000000000002, "ep_info_buffer": {":type:": "<class 'collections.deque'>", ":serialized:": "gAWVHxAAAAAAAACMC2NvbGxlY3Rpb25zlIwFZGVxdWWUk5QpS2SGlFKUKH2UKIwBcpSMFW51bXB5LmNvcmUubXVsdGlhcnJheZSMBnNjYWxhcpSTlIwFbnVtcHmUjAVkdHlwZZSTlIwCZjiUiYiHlFKUKEsDjAE8lE5OTkr/////Sv////9LAHSUYkMIaFn3j8UwckCUhpRSlIwBbJRL54wBdJRHQJ5ywiRnvlV1fZQoaAZoCWgPQwiwWS4bXR9wQJSGlFKUaBVLzWgWR0Cecsm1YyO8dX2UKGgGaAloD0MI76gxIWbYcECUhpRSlGgVS6FoFkdAnnLq/Efkm3V9lChoBmgJaA9DCPZBlgUTjXNAlIaUUpRoFUu/aBZHQJ5y7ArQPZt1fZQoaAZoCWgPQwgqc/ONqJRyQJSGlFKUaBVLvWgWR0Cec5VeruIAdX2UKGgGaAloD0MIwAXZsvxJcUCUhpRSlGgVS8BoFkdAnnOYdZJTVHV9lChoBmgJaA9DCFfqWRBKknFAlIaUUpRoFUu9aBZHQJ50Xa8Hv+h1fZQoaAZoCWgPQwj7PbFO1VNyQJSGlFKUaBVLxmgWR0CedfkSVW0adX2UKGgGaAloD0MIXWxaKQSEbUCUhpRSlGgVS6loFkdAnnYggcLjP3V9lChoBmgJaA9DCBKJQsv6UHJAlIaUUpRoFUuyaBZHQJ52Ypz90ih1fZQoaAZoCWgPQwiYM9sVOs1zQJSGlFKUaBVL2GgWR0Cedol4TsY3dX2UKGgGaAloD0MIZqIIqdsbckCUhpRSlGgVS8RoFkdAnnbdcjZ+QXV9lChoBmgJaA9DCJUoe0v5vXNAlIaUUpRoFUvaaBZHQJ53Vn3+MqB1fZQoaAZoCWgPQwiNQSeETudxQJSGlFKUaBVLnGgWR0Ced7rRBu4xdX2UKGgGaAloD0MIK6Im+nyycUCUhpRSlGgVS8NoFkdAnnfCNKh+OXV9lChoBmgJaA9DCEIkQ47tU3NAlIaUUpRoFUv9aBZHQJ55EdKdxyZ1fZQoaAZoCWgPQwiwyRr1EMNxQJSGlFKUaBVLm2gWR0CeedJ3gUDddX2UKGgGaAloD0MITBsOSwPGcUCUhpRSlGgVS8ZoFkdAnnppfdAPd3V9lChoBmgJaA9DCLmOccWFanJAlIaUUpRoFUvNaBZHQJ56x8b70nR1fZQoaAZoCWgPQwj1FDlEXAJ0QJSGlFKUaBVLt2gWR0CeewFXaJyidX2UKGgGaAloD0MIu5unOuQfbUCUhpRSlGgVS8loFkdAnnsdSydFv3V9lChoBmgJaA9DCCR872/QCHJAlIaUUpRoFUvcaBZHQJ58W1stTUB1fZQoaAZoCWgPQwhHrptSXvRxQJSGlFKUaBVLzGgWR0CefGyAhB7edX2UKGgGaAloD0MIf/YjReQbcUCUhpRSlGgVS85oFkdAnnx9srNGE3V9lChoBmgJaA9DCIF4Xb+g7HFAlIaUUpRoFUuuaBZHQJ59CgqVhTh1fZQoaAZoCWgPQwilpIeh1WRxQJSGlFKUaBVLuWgWR0CeffxOclPadX2UKGgGaAloD0MIam0a26sXcUCUhpRSlGgVS79oFkdAnn7AP/aQFXV9lChoBmgJaA9DCCjU00fgUnFAlIaUUpRoFUu6aBZHQJ5/NbkfcN91fZQoaAZoCWgPQwgfgqrRqwVxQJSGlFKUaBVLu2gWR0Cef00Cih38dX2UKGgGaAloD0MIarx0k5gPdECUhpRSlGgVS+poFkdAnoATqbBoEnV9lChoBmgJaA9DCKM/NPNkB3JAlIaUUpRoFUumaBZHQJ6AR8QZn+R1fZQoaAZoCWgPQwiC4seYOzRyQJSGlFKUaBVLq2gWR0CegPUIcBEKdX2UKGgGaAloD0MI81XysTudcUCUhpRSlGgVS9JoFkdAnoExb8m8d3V9lChoBmgJaA9DCL1yvW0maXFAlIaUUpRoFUvYaBZHQJ6BRf+jua51fZQoaAZoCWgPQwjEtG/ur/9yQJSGlFKUaBVLy2gWR0Cegp0EovzwdX2UKGgGaAloD0MInlxTIDNscUCUhpRSlGgVS6doFkdAnoL7Tx5LRXV9lChoBmgJaA9DCN7jTBM2AXRAlIaUUpRoFUu9aBZHQJ6DBZuAI6d1fZQoaAZoCWgPQwjRQCybuR5uQJSGlFKUaBVLuWgWR0Ceg3rTH80ldX2UKGgGaAloD0MIAcPy59svc0CUhpRSlGgVS79oFkdAnoRcDbJwKnV9lChoBmgJaA9DCAK37uap+HBAlIaUUpRoFUvIaBZHQJ6ExlTWGyp1fZQoaAZoCWgPQwhWgVoM3kBwQJSGlFKUaBVLrmgWR0CehORc/t6YdX2UKGgGaAloD0MIz6EMVbGUckCUhpRSlGgVS7VoFkdAnoVafSQYDXV9lChoBmgJaA9DCJz7q8c9SnFAlIaUUpRoFUvPaBZHQJ6F5NGmUGF1fZQoaAZoCWgPQwhEhermYilkQJSGlFKUaBVN6ANoFkdAnoZqiblRxnV9lChoBmgJaA9DCKyL22iA7G1AlIaUUpRoFUu0aBZHQJ6Gstsenyd1fZQoaAZoCWgPQwhbmfBL/TBxQJSGlFKUaBVLtWgWR0CehwQcghbGdX2UKGgGaAloD0MIXB0AcRc1cUCUhpRSlGgVS9ZoFkdAnoeVBppN9HV9lChoBmgJaA9DCJLNVfOccnJAlIaUUpRoFUvRaBZHQJ6H4jfNzKd1fZQoaAZoCWgPQwhN2H4yhjByQJSGlFKUaBVLs2gWR0CeiBgBcRlIdX2UKGgGaAloD0MIizidZKvAbkCUhpRSlGgVS7BoFkdAnohXPqs2enV9lChoBmgJaA9DCG1VEtmHIXFAlIaUUpRoFUudaBZHQJ6IgGUwBYF1fZQoaAZoCWgPQwhzhXe5iNlxQJSGlFKUaBVL02gWR0CeiSND+irUdX2UKGgGaAloD0MIrcJmgAtlc0CUhpRSlGgVS71oFkdAnopQ5aNdaHV9lChoBmgJaA9DCIBEEyji4nJAlIaUUpRoFUvXaBZHQJ6KgyeqaPV1fZQoaAZoCWgPQwj5o6gzdzZxQJSGlFKUaBVNAgFoFkdAnorspsoDxXV9lChoBmgJaA9DCENWt3pOz3JAlIaUUpRoFUu2aBZHQJ6LndsSCe51fZQoaAZoCWgPQwh0et6NxT1zQJSGlFKUaBVL6GgWR0Cei6fSx7iRdX2UKGgGaAloD0MIfJkoQqqMckCUhpRSlGgVS99oFkdAnowgWrOqvXV9lChoBmgJaA9DCJxrmKHxfHJAlIaUUpRoFUu0aBZHQJ6ML/rB0p51fZQoaAZoCWgPQwjW/WMh+vhzQJSGlFKUaBVLymgWR0CejDVEuxr0dX2UKGgGaAloD0MIBfwaSUJ6ckCUhpRSlGgVS8hoFkdAnoxsuWa+e3V9lChoBmgJaA9DCIwv2uOFK3NAlIaUUpRoFUvUaBZHQJ6NXhR64Uh1fZQoaAZoCWgPQwg/i6VI/p1xQJSGlFKUaBVLoGgWR0CejaT5ftx/dX2UKGgGaAloD0MInS0gtN5ZdECUhpRSlGgVS7ZoFkdAno3da6jFh3V9lChoBmgJaA9DCJeo3hoY13JAlIaUUpRoFUu7aBZHQJ6OeumrKeV1fZQoaAZoCWgPQwj8UGnEDNRxQJSGlFKUaBVLs2gWR0CejuNZvDP4dX2UKGgGaAloD0MIu7a3W9L4cUCUhpRSlGgVS7xoFkdAno8aMWGh3HV9lChoBmgJaA9DCCKphZJJ2W9AlIaUUpRoFUuzaBZHQJ6PT3bmEGt1fZQoaAZoCWgPQwgIrYcvEzdyQJSGlFKUaBVLuGgWR0Cej4dVvMr3dX2UKGgGaAloD0MIGOsbmFx5c0CUhpRSlGgVS9RoFkdAnpBRyS3b23V9lChoBmgJaA9DCPUR+MMP03BAlIaUUpRoFUunaBZHQJ6Qyu3c5811fZQoaAZoCWgPQwglWvJ42sVvQJSGlFKUaBVLumgWR0CekNDwH7gsdX2UKGgGaAloD0MI/n4xW7IYcECUhpRSlGgVS7loFkdAnpFdipeeF3V9lChoBmgJaA9DCL9k48FW83BAlIaUUpRoFUu/aBZHQJ6TIbkwN9Z1fZQoaAZoCWgPQwgSEmkb/wZyQJSGlFKUaBVL2mgWR0CekzTot+TedX2UKGgGaAloD0MIU+knnJ2GcUCUhpRSlGgVS/BoFkdAnpM2AXl8xHV9lChoBmgJaA9DCOi/B6+dB3NAlIaUUpRoFUvdaBZHQJ6Tghje9Bd1fZQoaAZoCWgPQwi4rpgR3h1vQJSGlFKUaBVLo2gWR0Cek5UG3WnTdX2UKGgGaAloD0MICp3X2OWScUCUhpRSlGgVS9NoFkdAnpPB8QZn+XV9lChoBmgJaA9DCPqZet3iTHJAlIaUUpRoFUukaBZHQJ6UC8f3evZ1fZQoaAZoCWgPQwhv05/9yLFyQJSGlFKUaBVL1GgWR0CelOzGxUvPdX2UKGgGaAloD0MIn48y4kJ0cECUhpRSlGgVS7toFkdAnpUQBPsRhHV9lChoBmgJaA9DCIQPJVoyWXFAlIaUUpRoFUuqaBZHQJ6WY+7lJYl1fZQoaAZoCWgPQwha2T7kLbxwQJSGlFKUaBVLqGgWR0Celmqmj0tidX2UKGgGaAloD0MIhbUxdsJFcUCUhpRSlGgVS5VoFkdAnpaL1mJ3xHV9lChoBmgJaA9DCM8SZASUW3JAlIaUUpRoFUvDaBZHQJ6W+6shgVp1fZQoaAZoCWgPQwiTHRuBuC90QJSGlFKUaBVLtGgWR0CelwtHxz7udX2UKGgGaAloD0MIVDVB1L3WcUCUhpRSlGgVS8BoFkdAnpc16zE74nV9lChoBmgJaA9DCKSrdHedq25AlIaUUpRoFUuwaBZHQJ6XeJemelN1fZQoaAZoCWgPQwiIu3oVGW9vQJSGlFKUaBVLuWgWR0CemJXIEKVqdX2UKGgGaAloD0MIzse1oaLQcUCUhpRSlGgVS8JoFkdAnpjcDGLk0nV9lChoBmgJaA9DCH3O3a6XjXBAlIaUUpRoFUumaBZHQJ6ZuTcIqsl1fZQoaAZoCWgPQwhOet/4mnpxQJSGlFKUaBVLrGgWR0Cemd1Gb1AadX2UKGgGaAloD0MIi6azk0G6bkCUhpRSlGgVS7FoFkdAnpomDDjzZ3V9lChoBmgJaA9DCE7yI36FYXFAlIaUUpRoFUu8aBZHQJ6a0MOPNml1fZQoaAZoCWgPQwiiJvp8VJRxQJSGlFKUaBVLymgWR0Cem1DW9US7dX2UKGgGaAloD0MIeSRens5vcUCUhpRSlGgVS7poFkdAnptTxCpm3HV9lChoBmgJaA9DCN7n+Ghx0nFAlIaUUpRoFUvXaBZHQJ6beMm4RVZ1fZQoaAZoCWgPQwi7Cik/qZdtQJSGlFKUaBVLr2gWR0CenIkyk9EDdX2UKGgGaAloD0MIsz9QbhsJcUCUhpRSlGgVS75oFkdAnpyUAxSHd3VlLg=="}, "ep_success_buffer": {":type:": "<class 'collections.deque'>", ":serialized:": "gAWVIAAAAAAAAACMC2NvbGxlY3Rpb25zlIwFZGVxdWWUk5QpS2SGlFKULg=="}, "_n_updates": 540, "n_steps": 2048, "gamma": 0.99, "gae_lambda": 0.95, "ent_coef": 0.0, "vf_coef": 0.5, "max_grad_norm": 0.5, "batch_size": 64, "n_epochs": 10, "clip_range": {":type:": "<class 'function'>", ":serialized:": "gAWVwwIAAAAAAACMF2Nsb3VkcGlja2xlLmNsb3VkcGlja2xllIwOX21ha2VfZnVuY3Rpb26Uk5QoaACMDV9idWlsdGluX3R5cGWUk5SMCENvZGVUeXBllIWUUpQoSwFLAEsASwFLAUsTQwSIAFMAlE6FlCmMAV+UhZSMSC91c3IvbG9jYWwvbGliL3B5dGhvbjMuOC9kaXN0LXBhY2thZ2VzL3N0YWJsZV9iYXNlbGluZXMzL2NvbW1vbi91dGlscy5weZSMBGZ1bmOUS4BDAgABlIwDdmFslIWUKXSUUpR9lCiMC19fcGFja2FnZV9flIwYc3RhYmxlX2Jhc2VsaW5lczMuY29tbW9ulIwIX19uYW1lX1+UjB5zdGFibGVfYmFzZWxpbmVzMy5jb21tb24udXRpbHOUjAhfX2ZpbGVfX5SMSC91c3IvbG9jYWwvbGliL3B5dGhvbjMuOC9kaXN0LXBhY2thZ2VzL3N0YWJsZV9iYXNlbGluZXMzL2NvbW1vbi91dGlscy5weZR1Tk5oAIwQX21ha2VfZW1wdHlfY2VsbJSTlClSlIWUdJRSlIwcY2xvdWRwaWNrbGUuY2xvdWRwaWNrbGVfZmFzdJSMEl9mdW5jdGlvbl9zZXRzdGF0ZZSTlGgffZR9lChoFmgNjAxfX3F1YWxuYW1lX1+UjBljb25zdGFudF9mbi48bG9jYWxzPi5mdW5jlIwPX19hbm5vdGF0aW9uc19flH2UjA5fX2t3ZGVmYXVsdHNfX5ROjAxfX2RlZmF1bHRzX1+UTowKX19tb2R1bGVfX5RoF4wHX19kb2NfX5ROjAtfX2Nsb3N1cmVfX5RoAIwKX21ha2VfY2VsbJSTlEc/yZmZmZmZmoWUUpSFlIwXX2Nsb3VkcGlja2xlX3N1Ym1vZHVsZXOUXZSMC19fZ2xvYmFsc19flH2UdYaUhlIwLg=="}, "clip_range_vf": null, "normalize_advantage": true, "target_kl": null, "system_info": {"OS": "Linux-5.10.133+-x86_64-with-glibc2.27 #1 SMP Fri Aug 26 08:44:51 UTC 2022", "Python": "3.8.16", "Stable-Baselines3": "1.6.2", "PyTorch": "1.13.0+cu116", "GPU Enabled": "True", "Numpy": "1.21.6", "Gym": "0.21.0"}}
ppo-LunarLander-v2.zip CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:baf5575f655e351468348ba9d2d23a9e8203b17eb2d3fc1b43e5ece2f6b15c20
3
- size 147916
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:afbb46aa5a0939b02751dcc9e45750fca2eb50904626cc69dbcfded0a723cdc0
3
+ size 146822
ppo-LunarLander-v2/data CHANGED
@@ -4,19 +4,19 @@
4
  ":serialized:": "gAWVOwAAAAAAAACMIXN0YWJsZV9iYXNlbGluZXMzLmNvbW1vbi5wb2xpY2llc5SMEUFjdG9yQ3JpdGljUG9saWN5lJOULg==",
5
  "__module__": "stable_baselines3.common.policies",
6
  "__doc__": "\n Policy class for actor-critic algorithms (has both policy and value prediction).\n Used by A2C, PPO and the likes.\n\n :param observation_space: Observation space\n :param action_space: Action space\n :param lr_schedule: Learning rate schedule (could be constant)\n :param net_arch: The specification of the policy and value networks.\n :param activation_fn: Activation function\n :param ortho_init: Whether to use or not orthogonal initialization\n :param use_sde: Whether to use State Dependent Exploration or not\n :param log_std_init: Initial value for the log standard deviation\n :param full_std: Whether to use (n_features x n_actions) parameters\n for the std instead of only (n_features,) when using gSDE\n :param sde_net_arch: Network architecture for extracting features\n when using gSDE. If None, the latent features from the policy will be used.\n Pass an empty list to use the states as features.\n :param use_expln: Use ``expln()`` function instead of ``exp()`` to ensure\n a positive standard deviation (cf paper). It allows to keep variance\n above zero and prevent it from growing too fast. In practice, ``exp()`` is usually enough.\n :param squash_output: Whether to squash the output using a tanh function,\n this allows to ensure boundaries when using gSDE.\n :param features_extractor_class: Features extractor to use.\n :param features_extractor_kwargs: Keyword arguments\n to pass to the features extractor.\n :param normalize_images: Whether to normalize images or not,\n dividing by 255.0 (True by default)\n :param optimizer_class: The optimizer to use,\n ``th.optim.Adam`` by default\n :param optimizer_kwargs: Additional keyword arguments,\n excluding the learning rate, to pass to the optimizer\n ",
7
- "__init__": "<function ActorCriticPolicy.__init__ at 0x7f9eacc9aee0>",
8
- "_get_constructor_parameters": "<function ActorCriticPolicy._get_constructor_parameters at 0x7f9eacc9af70>",
9
- "reset_noise": "<function ActorCriticPolicy.reset_noise at 0x7f9eacc9e040>",
10
- "_build_mlp_extractor": "<function ActorCriticPolicy._build_mlp_extractor at 0x7f9eacc9e0d0>",
11
- "_build": "<function ActorCriticPolicy._build at 0x7f9eacc9e160>",
12
- "forward": "<function ActorCriticPolicy.forward at 0x7f9eacc9e1f0>",
13
- "_get_action_dist_from_latent": "<function ActorCriticPolicy._get_action_dist_from_latent at 0x7f9eacc9e280>",
14
- "_predict": "<function ActorCriticPolicy._predict at 0x7f9eacc9e310>",
15
- "evaluate_actions": "<function ActorCriticPolicy.evaluate_actions at 0x7f9eacc9e3a0>",
16
- "get_distribution": "<function ActorCriticPolicy.get_distribution at 0x7f9eacc9e430>",
17
- "predict_values": "<function ActorCriticPolicy.predict_values at 0x7f9eacc9e4c0>",
18
  "__abstractmethods__": "frozenset()",
19
- "_abc_impl": "<_abc_data object at 0x7f9eacc94f00>"
20
  },
21
  "verbose": 1,
22
  "policy_kwargs": {},
@@ -41,13 +41,13 @@
41
  "dtype": "int64",
42
  "_np_random": null
43
  },
44
- "n_envs": 32,
45
- "num_timesteps": 1048576,
46
- "_total_timesteps": 1000000,
47
  "_num_timesteps_at_start": 0,
48
  "seed": null,
49
  "action_noise": null,
50
- "start_time": 1671807920230630791,
51
  "learning_rate": 0.0003,
52
  "tensorboard_log": null,
53
  "lr_schedule": {
@@ -56,26 +56,26 @@
56
  },
57
  "_last_obs": {
58
  ":type:": "<class 'numpy.ndarray'>",
59
- ":serialized:": "gAWVdQQAAAAAAACMEm51bXB5LmNvcmUubnVtZXJpY5SMC19mcm9tYnVmZmVylJOUKJYABAAAAAAAAPqjLL7sL6W7v6m8OTQQETec0vs8CgrfuAAAgD8AAIA/mpF0PVzLFrpGEN+4zatbNRBOW7gzNAA4AACAPwAAgD/gg6Y+SUwHPU4N6rl93we4+5wXPhJ5IzkAAIA/AACAP2bgZ73tGww+5VlnPnocOL7Zfao9QWYmPQAAAAAAAAAApvQcvlKFr7sXpzc7MXPROJgWHT3ypme6AACAPwAAgD9ANU8+PtyTP2su+D4B2Yi+E4EqPgrh9TwAAAAAAAAAAGYvzbwO3W0/Kb0evXfkub7Qhxu9DToqvQAAAAAAAAAAzeyZvER9vj+2K0y+ea6MPsLbCjyEWrq8AAAAAAAAAAAzyWI+lId6PkE5x70xnkG9KXolvWCpW70AAAAAAAAAAA1Pz70UvNi69UaQvBEPL72Zlau7/tUYvgAAAAAAAIA/JqScPeGam7jzpmu7zp8pOPSiijvNiBE5AACAPwAAgD8A9m48QAy3P02Y9D5E5IM+TgIgvP8DjrwAAAAAAAAAAGbewjvDKTm6Spuiu5L/CDeVx6C6Njl3tgAAgD8AAIA/s6R9PY+GfbqFujU6I3WENSVLQDvlWlK5AACAPwAAgD9Thzc+GyGpvFBPGDrSlmC4J4MVvk3cTrkAAIA/AACAP+Y4MT0UDrs5fVCEOYlhxjOSvNa7K4OguAAAgD8AAIA/WoELPsO6Ijsi7f26UTQouJzq4zzJeRs6AACAPwAAgD/N/JO8Kfg2usMMzjrNDyQ2NanMuqa58LkAAIA/AACAP/PMsb3DuSe64tQMuUZ2l7W2vqE69dUjOAAAgD8AAIA/Jv03PkghzTn7FyU5rmnMNS5xUzyeUTy4AACAPwAAgD8Nbok9SCeBuiKAvDrJSX01Xs7uOe1E2bkAAIA/AACAP6aV9r2um8a6bWTtPaxmTL17W2476+rdvAAAgD8AAIA/s4FqPuSCFzypXoU7pINdOUnboT2EApq6AACAPwAAgD+a7de8FKKMul39YTpqTpo2fs01OygdgLkAAIA/AACAP+bXHb2Fa4u58s+mPDmZ5TxWsiQ7Pd9sPAAAgD8AAIA/848ovo8KYLzVHCk6ZRgSOJ31xz2GkVS5AACAPwAAgD+A9Lc+mH21Pgk4xrxBt06+MAkrvH5EPb0AAAAAAAAAAA1+Qb49QE27jKugOYEZuDZ3vbs8hj2/uAAAgD8AAIA/GhN1vVLIirnGOJI5WubHNKnLIjvO6Km4AACAPwAAgD/mEj+99qwpurJ8uLskADI4YTkcOkAEbzcAAIA/AACAP3DHXr7hEv05PkUaOkHnkLbWiTu8UnEzuQAAgD8AAIA/k45NPiphhj+qWew9f+SvvlJwrj3d2gM7AAAAAAAAAACUjAVudW1weZSMBWR0eXBllJOUjAJmNJSJiIeUUpQoSwOMATyUTk5OSv////9K/////0sAdJRiSyBLCIaUjAFDlHSUUpQu"
60
  },
61
  "_last_episode_starts": {
62
  ":type:": "<class 'numpy.ndarray'>",
63
- ":serialized:": "gAWVkwAAAAAAAACMEm51bXB5LmNvcmUubnVtZXJpY5SMC19mcm9tYnVmZmVylJOUKJYgAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAlIwFbnVtcHmUjAVkdHlwZZSTlIwCYjGUiYiHlFKUKEsDjAF8lE5OTkr/////Sv////9LAHSUYksghZSMAUOUdJRSlC4="
64
  },
65
  "_last_original_obs": null,
66
  "_episode_num": 0,
67
  "use_sde": false,
68
  "sde_sample_freq": -1,
69
- "_current_progress_remaining": -0.04857599999999995,
70
  "ep_info_buffer": {
71
  ":type:": "<class 'collections.deque'>",
72
- ":serialized:": "gAWVfxAAAAAAAACMC2NvbGxlY3Rpb25zlIwFZGVxdWWUk5QpS2SGlFKUKH2UKIwBcpSMFW51bXB5LmNvcmUubXVsdGlhcnJheZSMBnNjYWxhcpSTlIwFbnVtcHmUjAVkdHlwZZSTlIwCZjiUiYiHlFKUKEsDjAE8lE5OTkr/////Sv////9LAHSUYkMIQ8cOKvHaYECUhpRSlIwBbJRN6AOMAXSUR0CYQ8YKpkwwdX2UKGgGaAloD0MI08H6P4fIXUCUhpRSlGgVTegDaBZHQJhFigPEsJ91fZQoaAZoCWgPQwhh/gqZq3FiQJSGlFKUaBVN6ANoFkdAmEf2Ifr8i3V9lChoBmgJaA9DCPtcbcV+QmVAlIaUUpRoFU3eAmgWR0CYSLXLeQ+2dX2UKGgGaAloD0MIAB5RoTrGYUCUhpRSlGgVTegDaBZHQJhJbf/FR511fZQoaAZoCWgPQwgBFvn1Q25kQJSGlFKUaBVN6ANoFkdAmEv3erMkhXV9lChoBmgJaA9DCI7NjlTfvGNAlIaUUpRoFU3oA2gWR0CYTWHlfZ27dX2UKGgGaAloD0MIOuenOA7SXECUhpRSlGgVTegDaBZHQJhQGfVZs9B1fZQoaAZoCWgPQwhLrfcb7VAqQJSGlFKUaBVNCgFoFkdAmFShvvSc9XV9lChoBmgJaA9DCOKxn8VSHVxAlIaUUpRoFU3oA2gWR0CYVYCL/CIldX2UKGgGaAloD0MI7rH0oQu+ZECUhpRSlGgVTegDaBZHQJhWR77bcoJ1fZQoaAZoCWgPQwiZSj/h7OYeQJSGlFKUaBVL8GgWR0CYW1lhw2l3dX2UKGgGaAloD0MIoIhFDDvGYECUhpRSlGgVTegDaBZHQJhbW8VYZEV1fZQoaAZoCWgPQwjo2hfQC91ZQJSGlFKUaBVN6ANoFkdAmF1Wv4dp7HV9lChoBmgJaA9DCMAjKlQ3AWZAlIaUUpRoFU3oA2gWR0CYX/klNUOvdX2UKGgGaAloD0MI+Ppal5r8YUCUhpRSlGgVTegDaBZHQJhi+a6STyJ1fZQoaAZoCWgPQwgAVHHjlrllQJSGlFKUaBVN6ANoFkdAmHDbxqfvnnV9lChoBmgJaA9DCBvXv+uzR2NAlIaUUpRoFU3oA2gWR0CYfRPk7wKCdX2UKGgGaAloD0MIMBAEyNCSZUCUhpRSlGgVTegDaBZHQJiBB05lvqF1fZQoaAZoCWgPQwiKIM7DCawYwJSGlFKUaBVNEQFoFkdAmIQVCHARCnV9lChoBmgJaA9DCHWPbK4avWNAlIaUUpRoFU3oA2gWR0CYhFcEeQuFdX2UKGgGaAloD0MIpFLsaBy0YECUhpRSlGgVTegDaBZHQJiE8/iYLLJ1fZQoaAZoCWgPQwhfYFYo0g1jQJSGlFKUaBVN6ANoFkdAmIZtb5dnkHV9lChoBmgJaA9DCCXJc30flmBAlIaUUpRoFU3oA2gWR0CYjXLq2SdOdX2UKGgGaAloD0MInmFqS51aYkCUhpRSlGgVTegDaBZHQJiVmvbGm1p1fZQoaAZoCWgPQwgucHmsGfBiQJSGlFKUaBVN6ANoFkdAmJf9vfj0c3V9lChoBmgJaA9DCJoF2h3S2mNAlIaUUpRoFU3oA2gWR0CZg4rFOwgUdX2UKGgGaAloD0MIDjLJyNlkbkCUhpRSlGgVTSQCaBZHQJmHJp8F6iV1fZQoaAZoCWgPQwhPz7uxoCpOQJSGlFKUaBVN6ANoFkdAmYmY+wC8vnV9lChoBmgJaA9DCBX/d0SFvV1AlIaUUpRoFU3oA2gWR0CZkX9hJAdGdX2UKGgGaAloD0MIjQ3d7A+7XECUhpRSlGgVTegDaBZHQJmSXIzWPLh1fZQoaAZoCWgPQwhVNNb+TnxhQJSGlFKUaBVN6ANoFkdAmZPN2gWadHV9lChoBmgJaA9DCL/Rjht+q1tAlIaUUpRoFU3oA2gWR0CZmNIre67NdX2UKGgGaAloD0MIvYv343ara0CUhpRSlGgVTakDaBZHQJmaptpEhJR1fZQoaAZoCWgPQwi6oSk7/ZRiQJSGlFKUaBVN6ANoFkdAmZyGL9/BnHV9lChoBmgJaA9DCPjgtUubVGFAlIaUUpRoFU3oA2gWR0CZncwt8NQTdX2UKGgGaAloD0MIZXCUvDqDYUCUhpRSlGgVTegDaBZHQJmfxDw6QvJ1fZQoaAZoCWgPQwhuT5DY7mtlQJSGlFKUaBVN6ANoFkdAmaNPEGZ/kXV9lChoBmgJaA9DCFJlGHeD3lpAlIaUUpRoFU3oA2gWR0CZpCGHpKSQdX2UKGgGaAloD0MIntLB+j/5YkCUhpRSlGgVTegDaBZHQJmnEllbu+h1fZQoaAZoCWgPQwi9yAT8Gv5eQJSGlFKUaBVN6ANoFkdAmaiaFIuoP3V9lChoBmgJaA9DCNyCpbqAFV5AlIaUUpRoFU3oA2gWR0CZq5LvkRzzdX2UKGgGaAloD0MIz9iXbDyaYECUhpRSlGgVTegDaBZHQJmwc9C/oJR1fZQoaAZoCWgPQwglOzYC8TRdQJSGlFKUaBVN6ANoFkdAmbFjrqt5lnV9lChoBmgJaA9DCKwfm+RHdGVAlIaUUpRoFU3oA2gWR0CZsgx9XtBwdX2UKGgGaAloD0MIdEF9yxxWbUCUhpRSlGgVTdECaBZHQJm1/XSSeRR1fZQoaAZoCWgPQwjByMuaWBlfQJSGlFKUaBVN6ANoFkdAmbcmPo3aSXV9lChoBmgJaA9DCF7b2y3JHF5AlIaUUpRoFU3oA2gWR0CZtyicoYvWdX2UKGgGaAloD0MImRJJ9LJbakCUhpRSlGgVTd4DaBZHQJm4AWTHKfZ1fZQoaAZoCWgPQwgYlGk0OcFgQJSGlFKUaBVN6ANoFkdAmc09RFZxJnV9lChoBmgJaA9DCOtwdJVuJW9AlIaUUpRoFU1eAWgWR0CZ0pKEFnqWdX2UKGgGaAloD0MIlgfpKXIALkCUhpRSlGgVTRQBaBZHQJnZYw482aV1fZQoaAZoCWgPQwhM/5JUJtlhQJSGlFKUaBVN6ANoFkdAmdvgfZElV3V9lChoBmgJaA9DCBRa1v1ji15AlIaUUpRoFU3oA2gWR0CZ3n/x2B8QdX2UKGgGaAloD0MIycuaWGBBZkCUhpRSlGgVTegDaBZHQJneuhtcfNl1fZQoaAZoCWgPQwhJ1uHoqotiQJSGlFKUaBVN6ANoFkdAmd9DpHI6sHV9lChoBmgJaA9DCI3xYfYyxWNAlIaUUpRoFU3oA2gWR0CZ4IDZUT+OdX2UKGgGaAloD0MIeQWiJ2VCY0CUhpRSlGgVTegDaBZHQJnmY6+36RB1fZQoaAZoCWgPQwgaTS7GwIlsQJSGlFKUaBVNZQJoFkdAmemxWPtD2XV9lChoBmgJaA9DCEdVE0RdzWpAlIaUUpRoFU3PA2gWR0CZ6oisny/cdX2UKGgGaAloD0MItOidCrg8XUCUhpRSlGgVTegDaBZHQJnvM3ZPEbZ1fZQoaAZoCWgPQwhZpl8i3sVfQJSGlFKUaBVN6ANoFkdAmf8BdpqREHV9lChoBmgJaA9DCBwj2SPUMF5AlIaUUpRoFU3oA2gWR0CaAiHDrJKbdX2UKGgGaAloD0MIqOFbWLfsakCUhpRSlGgVTVMDaBZHQJoC8cp9ZzR1fZQoaAZoCWgPQwjVJHhDGsNiQJSGlFKUaBVN6ANoFkdAmgQuHnEET3V9lChoBmgJaA9DCCMShZZ1NFxAlIaUUpRoFU3oA2gWR0CaCum8M/hVdX2UKGgGaAloD0MIGqN1VDWrVUCUhpRSlGgVTegDaBZHQJoLr9cbBGh1fZQoaAZoCWgPQwiCAYQPJYplQJSGlFKUaBVN6ANoFkdAmgz2X9itrHV9lChoBmgJaA9DCMpUwagkzW9AlIaUUpRoFU2zAWgWR0CaD5r8R+SbdX2UKGgGaAloD0MITDWzloKYZECUhpRSlGgVTegDaBZHQJoRJM+NcW11fZQoaAZoCWgPQwh07KAS1/hiQJSGlFKUaBVN6ANoFkdAmhK44hllLHV9lChoBmgJaA9DCPkwe9n2XWtAlIaUUpRoFU19AWgWR0CaE3OBUaQ4dX2UKGgGaAloD0MIUWnEzD4UY0CUhpRSlGgVTegDaBZHQJoVXNcGC7N1fZQoaAZoCWgPQwgJxOv6RWZwQJSGlFKUaBVNLgNoFkdAmhiqLXL/0nV9lChoBmgJaA9DCOqURzfCJVhAlIaUUpRoFU3oA2gWR0CaGiokRjBmdX2UKGgGaAloD0MINxd/2xNdXUCUhpRSlGgVTegDaBZHQJoa2plz2ex1fZQoaAZoCWgPQwi+Ly5V6UdlQJSGlFKUaBVN6ANoFkdAmh00s8PnS3V9lChoBmgJaA9DCIGYhAt5OmBAlIaUUpRoFU3oA2gWR0CaIRU8FINFdX2UKGgGaAloD0MIgEV+/RBdZECUhpRSlGgVTegDaBZHQJoli0x/NJR1fZQoaAZoCWgPQwj76T9r/q5jQJSGlFKUaBVN6ANoFkdAmiZEqUeMh3V9lChoBmgJaA9DCMwHBDoTWGRAlIaUUpRoFU3oA2gWR0CaJthCdBjXdX2UKGgGaAloD0MInkXvVMAGYUCUhpRSlGgVTegDaBZHQJoqcPoV2zR1fZQoaAZoCWgPQwgSE9TwLVVeQJSGlFKUaBVN6ANoFkdAmixYChew93V9lChoBmgJaA9DCEbtfhXg9W9AlIaUUpRoFU1NAWgWR0CaMjNI9TxYdX2UKGgGaAloD0MI2Lj+XZ+zYECUhpRSlGgVTegDaBZHQJpAyjCYTkB1fZQoaAZoCWgPQwiKc9TR8UljQJSGlFKUaBVN6ANoFkdAmkXg1BMSK3V9lChoBmgJaA9DCBCU2/Y9y1ZAlIaUUpRoFU3oA2gWR0CaTKDdxhlUdX2UKGgGaAloD0MId/hrskYXb0CUhpRSlGgVTc4DaBZHQJpQf5ylvZR1fZQoaAZoCWgPQwhaZaa0/mxaQJSGlFKUaBVN6ANoFkdAmlGh/3Fkx3V9lChoBmgJaA9DCM8UOq+xj2VAlIaUUpRoFU3oA2gWR0CaUdoTfzjFdX2UKGgGaAloD0MImYBfI0nCZ0CUhpRSlGgVTegDaBZHQJpSV13dKul1fZQoaAZoCWgPQwg/jXvzm5tuQJSGlFKUaBVNEwJoFkdAmlc9Wp6yB3V9lChoBmgJaA9DCMUB9Pv+I2NAlIaUUpRoFU3oA2gWR0CaXJPBi1ArdX2UKGgGaAloD0MIsiyY+KOQYUCUhpRSlGgVTegDaBZHQJpdW6MBIWh1fZQoaAZoCWgPQwj2tS41wulkQJSGlFKUaBVN6ANoFkdAmmIatPpIMHV9lChoBmgJaA9DCGIQWDm0fDpAlIaUUpRoFUvsaBZHQJps0PTXrdF1fZQoaAZoCWgPQwi86gHzkJkoQJSGlFKUaBVNHAFoFkdAmm2/8uSOinV9lChoBmgJaA9DCKmj42rkNWVAlIaUUpRoFU3oA2gWR0Cacds41gpjdX2UKGgGaAloD0MIhUTaxp++YkCUhpRSlGgVTegDaBZHQJp07YbsF+x1fZQoaAZoCWgPQwjjFvNzQ31jQJSGlFKUaBVN6ANoFkdAmnWfgNwzcnVlLg=="
73
  },
74
  "ep_success_buffer": {
75
  ":type:": "<class 'collections.deque'>",
76
  ":serialized:": "gAWVIAAAAAAAAACMC2NvbGxlY3Rpb25zlIwFZGVxdWWUk5QpS2SGlFKULg=="
77
  },
78
- "_n_updates": 160,
79
  "n_steps": 2048,
80
  "gamma": 0.99,
81
  "gae_lambda": 0.95,
 
4
  ":serialized:": "gAWVOwAAAAAAAACMIXN0YWJsZV9iYXNlbGluZXMzLmNvbW1vbi5wb2xpY2llc5SMEUFjdG9yQ3JpdGljUG9saWN5lJOULg==",
5
  "__module__": "stable_baselines3.common.policies",
6
  "__doc__": "\n Policy class for actor-critic algorithms (has both policy and value prediction).\n Used by A2C, PPO and the likes.\n\n :param observation_space: Observation space\n :param action_space: Action space\n :param lr_schedule: Learning rate schedule (could be constant)\n :param net_arch: The specification of the policy and value networks.\n :param activation_fn: Activation function\n :param ortho_init: Whether to use or not orthogonal initialization\n :param use_sde: Whether to use State Dependent Exploration or not\n :param log_std_init: Initial value for the log standard deviation\n :param full_std: Whether to use (n_features x n_actions) parameters\n for the std instead of only (n_features,) when using gSDE\n :param sde_net_arch: Network architecture for extracting features\n when using gSDE. If None, the latent features from the policy will be used.\n Pass an empty list to use the states as features.\n :param use_expln: Use ``expln()`` function instead of ``exp()`` to ensure\n a positive standard deviation (cf paper). It allows to keep variance\n above zero and prevent it from growing too fast. In practice, ``exp()`` is usually enough.\n :param squash_output: Whether to squash the output using a tanh function,\n this allows to ensure boundaries when using gSDE.\n :param features_extractor_class: Features extractor to use.\n :param features_extractor_kwargs: Keyword arguments\n to pass to the features extractor.\n :param normalize_images: Whether to normalize images or not,\n dividing by 255.0 (True by default)\n :param optimizer_class: The optimizer to use,\n ``th.optim.Adam`` by default\n :param optimizer_kwargs: Additional keyword arguments,\n excluding the learning rate, to pass to the optimizer\n ",
7
+ "__init__": "<function ActorCriticPolicy.__init__ at 0x7f021a647ca0>",
8
+ "_get_constructor_parameters": "<function ActorCriticPolicy._get_constructor_parameters at 0x7f021a647d30>",
9
+ "reset_noise": "<function ActorCriticPolicy.reset_noise at 0x7f021a647dc0>",
10
+ "_build_mlp_extractor": "<function ActorCriticPolicy._build_mlp_extractor at 0x7f021a647e50>",
11
+ "_build": "<function ActorCriticPolicy._build at 0x7f021a647ee0>",
12
+ "forward": "<function ActorCriticPolicy.forward at 0x7f021a647f70>",
13
+ "_get_action_dist_from_latent": "<function ActorCriticPolicy._get_action_dist_from_latent at 0x7f021a64b040>",
14
+ "_predict": "<function ActorCriticPolicy._predict at 0x7f021a64b0d0>",
15
+ "evaluate_actions": "<function ActorCriticPolicy.evaluate_actions at 0x7f021a64b160>",
16
+ "get_distribution": "<function ActorCriticPolicy.get_distribution at 0x7f021a64b1f0>",
17
+ "predict_values": "<function ActorCriticPolicy.predict_values at 0x7f021a64b280>",
18
  "__abstractmethods__": "frozenset()",
19
+ "_abc_impl": "<_abc_data object at 0x7f021a644570>"
20
  },
21
  "verbose": 1,
22
  "policy_kwargs": {},
 
41
  "dtype": "int64",
42
  "_np_random": null
43
  },
44
+ "n_envs": 10,
45
+ "num_timesteps": 102400,
46
+ "_total_timesteps": 100000,
47
  "_num_timesteps_at_start": 0,
48
  "seed": null,
49
  "action_noise": null,
50
+ "start_time": 1671871118506073747,
51
  "learning_rate": 0.0003,
52
  "tensorboard_log": null,
53
  "lr_schedule": {
 
56
  },
57
  "_last_obs": {
58
  ":type:": "<class 'numpy.ndarray'>",
59
+ ":serialized:": "gAWVtQEAAAAAAACMEm51bXB5LmNvcmUubnVtZXJpY5SMC19mcm9tYnVmZmVylJOUKJZAAQAAAAAAAGZ27DtekbU/qx07PxByrD4K5Ai8zIkpvgAAAAAAAAAAzYKrPF7otD+a6zE/onchPDimlLzMtau9AAAAAAAAAAAAAD+9uN+iu9ZJ/j1Q4BA9ChjfvJvC8D0AAIA/AACAP/OcLL7TCgU/axR5PW6TDb+9j1a+k6TuPQAAAAAAAAAAGpX2PVPsHz9aUZk8sfIiv4A0GD5u3c+5AAAAAAAAAADa2549NPOIPQ/rgb4zTIi+RtJSvVitnL0AAAAAAAAAAOONmj6jBRE/pTpqvvBKC7/qMnw+68d0vgAAAAAAAAAA0xwdvo8uP7wW1+86BT4zOf1trz3Prkm6AACAPwAAgD8FcI++P0cHPxbu5ruLFgi/t5DavpIOpT0AAAAAAAAAAJpdfzw4AZ672vgoviD9xbwdljI9+mWuvgAAAAAAAIA/lIwFbnVtcHmUjAVkdHlwZZSTlIwCZjSUiYiHlFKUKEsDjAE8lE5OTkr/////Sv////9LAHSUYksKSwiGlIwBQ5R0lFKULg=="
60
  },
61
  "_last_episode_starts": {
62
  ":type:": "<class 'numpy.ndarray'>",
63
+ ":serialized:": "gAWVfQAAAAAAAACMEm51bXB5LmNvcmUubnVtZXJpY5SMC19mcm9tYnVmZmVylJOUKJYKAAAAAAAAAAEAAAAAAAAAAACUjAVudW1weZSMBWR0eXBllJOUjAJiMZSJiIeUUpQoSwOMAXyUTk5OSv////9K/////0sAdJRiSwqFlIwBQ5R0lFKULg=="
64
  },
65
  "_last_original_obs": null,
66
  "_episode_num": 0,
67
  "use_sde": false,
68
  "sde_sample_freq": -1,
69
+ "_current_progress_remaining": -0.02400000000000002,
70
  "ep_info_buffer": {
71
  ":type:": "<class 'collections.deque'>",
72
+ ":serialized:": "gAWVHxAAAAAAAACMC2NvbGxlY3Rpb25zlIwFZGVxdWWUk5QpS2SGlFKUKH2UKIwBcpSMFW51bXB5LmNvcmUubXVsdGlhcnJheZSMBnNjYWxhcpSTlIwFbnVtcHmUjAVkdHlwZZSTlIwCZjiUiYiHlFKUKEsDjAE8lE5OTkr/////Sv////9LAHSUYkMIaFn3j8UwckCUhpRSlIwBbJRL54wBdJRHQJ5ywiRnvlV1fZQoaAZoCWgPQwiwWS4bXR9wQJSGlFKUaBVLzWgWR0Cecsm1YyO8dX2UKGgGaAloD0MI76gxIWbYcECUhpRSlGgVS6FoFkdAnnLq/Efkm3V9lChoBmgJaA9DCPZBlgUTjXNAlIaUUpRoFUu/aBZHQJ5y7ArQPZt1fZQoaAZoCWgPQwgqc/ONqJRyQJSGlFKUaBVLvWgWR0Cec5VeruIAdX2UKGgGaAloD0MIwAXZsvxJcUCUhpRSlGgVS8BoFkdAnnOYdZJTVHV9lChoBmgJaA9DCFfqWRBKknFAlIaUUpRoFUu9aBZHQJ50Xa8Hv+h1fZQoaAZoCWgPQwj7PbFO1VNyQJSGlFKUaBVLxmgWR0CedfkSVW0adX2UKGgGaAloD0MIXWxaKQSEbUCUhpRSlGgVS6loFkdAnnYggcLjP3V9lChoBmgJaA9DCBKJQsv6UHJAlIaUUpRoFUuyaBZHQJ52Ypz90ih1fZQoaAZoCWgPQwiYM9sVOs1zQJSGlFKUaBVL2GgWR0Cedol4TsY3dX2UKGgGaAloD0MIZqIIqdsbckCUhpRSlGgVS8RoFkdAnnbdcjZ+QXV9lChoBmgJaA9DCJUoe0v5vXNAlIaUUpRoFUvaaBZHQJ53Vn3+MqB1fZQoaAZoCWgPQwiNQSeETudxQJSGlFKUaBVLnGgWR0Ced7rRBu4xdX2UKGgGaAloD0MIK6Im+nyycUCUhpRSlGgVS8NoFkdAnnfCNKh+OXV9lChoBmgJaA9DCEIkQ47tU3NAlIaUUpRoFUv9aBZHQJ55EdKdxyZ1fZQoaAZoCWgPQwiwyRr1EMNxQJSGlFKUaBVLm2gWR0CeedJ3gUDddX2UKGgGaAloD0MITBsOSwPGcUCUhpRSlGgVS8ZoFkdAnnppfdAPd3V9lChoBmgJaA9DCLmOccWFanJAlIaUUpRoFUvNaBZHQJ56x8b70nR1fZQoaAZoCWgPQwj1FDlEXAJ0QJSGlFKUaBVLt2gWR0CeewFXaJyidX2UKGgGaAloD0MIu5unOuQfbUCUhpRSlGgVS8loFkdAnnsdSydFv3V9lChoBmgJaA9DCCR872/QCHJAlIaUUpRoFUvcaBZHQJ58W1stTUB1fZQoaAZoCWgPQwhHrptSXvRxQJSGlFKUaBVLzGgWR0CefGyAhB7edX2UKGgGaAloD0MIf/YjReQbcUCUhpRSlGgVS85oFkdAnnx9srNGE3V9lChoBmgJaA9DCIF4Xb+g7HFAlIaUUpRoFUuuaBZHQJ59CgqVhTh1fZQoaAZoCWgPQwilpIeh1WRxQJSGlFKUaBVLuWgWR0CeffxOclPadX2UKGgGaAloD0MIam0a26sXcUCUhpRSlGgVS79oFkdAnn7AP/aQFXV9lChoBmgJaA9DCCjU00fgUnFAlIaUUpRoFUu6aBZHQJ5/NbkfcN91fZQoaAZoCWgPQwgfgqrRqwVxQJSGlFKUaBVLu2gWR0Cef00Cih38dX2UKGgGaAloD0MIarx0k5gPdECUhpRSlGgVS+poFkdAnoATqbBoEnV9lChoBmgJaA9DCKM/NPNkB3JAlIaUUpRoFUumaBZHQJ6AR8QZn+R1fZQoaAZoCWgPQwiC4seYOzRyQJSGlFKUaBVLq2gWR0CegPUIcBEKdX2UKGgGaAloD0MI81XysTudcUCUhpRSlGgVS9JoFkdAnoExb8m8d3V9lChoBmgJaA9DCL1yvW0maXFAlIaUUpRoFUvYaBZHQJ6BRf+jua51fZQoaAZoCWgPQwjEtG/ur/9yQJSGlFKUaBVLy2gWR0Cegp0EovzwdX2UKGgGaAloD0MInlxTIDNscUCUhpRSlGgVS6doFkdAnoL7Tx5LRXV9lChoBmgJaA9DCN7jTBM2AXRAlIaUUpRoFUu9aBZHQJ6DBZuAI6d1fZQoaAZoCWgPQwjRQCybuR5uQJSGlFKUaBVLuWgWR0Ceg3rTH80ldX2UKGgGaAloD0MIAcPy59svc0CUhpRSlGgVS79oFkdAnoRcDbJwKnV9lChoBmgJaA9DCAK37uap+HBAlIaUUpRoFUvIaBZHQJ6ExlTWGyp1fZQoaAZoCWgPQwhWgVoM3kBwQJSGlFKUaBVLrmgWR0CehORc/t6YdX2UKGgGaAloD0MIz6EMVbGUckCUhpRSlGgVS7VoFkdAnoVafSQYDXV9lChoBmgJaA9DCJz7q8c9SnFAlIaUUpRoFUvPaBZHQJ6F5NGmUGF1fZQoaAZoCWgPQwhEhermYilkQJSGlFKUaBVN6ANoFkdAnoZqiblRxnV9lChoBmgJaA9DCKyL22iA7G1AlIaUUpRoFUu0aBZHQJ6Gstsenyd1fZQoaAZoCWgPQwhbmfBL/TBxQJSGlFKUaBVLtWgWR0CehwQcghbGdX2UKGgGaAloD0MIXB0AcRc1cUCUhpRSlGgVS9ZoFkdAnoeVBppN9HV9lChoBmgJaA9DCJLNVfOccnJAlIaUUpRoFUvRaBZHQJ6H4jfNzKd1fZQoaAZoCWgPQwhN2H4yhjByQJSGlFKUaBVLs2gWR0CeiBgBcRlIdX2UKGgGaAloD0MIizidZKvAbkCUhpRSlGgVS7BoFkdAnohXPqs2enV9lChoBmgJaA9DCG1VEtmHIXFAlIaUUpRoFUudaBZHQJ6IgGUwBYF1fZQoaAZoCWgPQwhzhXe5iNlxQJSGlFKUaBVL02gWR0CeiSND+irUdX2UKGgGaAloD0MIrcJmgAtlc0CUhpRSlGgVS71oFkdAnopQ5aNdaHV9lChoBmgJaA9DCIBEEyji4nJAlIaUUpRoFUvXaBZHQJ6KgyeqaPV1fZQoaAZoCWgPQwj5o6gzdzZxQJSGlFKUaBVNAgFoFkdAnorspsoDxXV9lChoBmgJaA9DCENWt3pOz3JAlIaUUpRoFUu2aBZHQJ6LndsSCe51fZQoaAZoCWgPQwh0et6NxT1zQJSGlFKUaBVL6GgWR0Cei6fSx7iRdX2UKGgGaAloD0MIfJkoQqqMckCUhpRSlGgVS99oFkdAnowgWrOqvXV9lChoBmgJaA9DCJxrmKHxfHJAlIaUUpRoFUu0aBZHQJ6ML/rB0p51fZQoaAZoCWgPQwjW/WMh+vhzQJSGlFKUaBVLymgWR0CejDVEuxr0dX2UKGgGaAloD0MIBfwaSUJ6ckCUhpRSlGgVS8hoFkdAnoxsuWa+e3V9lChoBmgJaA9DCIwv2uOFK3NAlIaUUpRoFUvUaBZHQJ6NXhR64Uh1fZQoaAZoCWgPQwg/i6VI/p1xQJSGlFKUaBVLoGgWR0CejaT5ftx/dX2UKGgGaAloD0MInS0gtN5ZdECUhpRSlGgVS7ZoFkdAno3da6jFh3V9lChoBmgJaA9DCJeo3hoY13JAlIaUUpRoFUu7aBZHQJ6OeumrKeV1fZQoaAZoCWgPQwj8UGnEDNRxQJSGlFKUaBVLs2gWR0CejuNZvDP4dX2UKGgGaAloD0MIu7a3W9L4cUCUhpRSlGgVS7xoFkdAno8aMWGh3HV9lChoBmgJaA9DCCKphZJJ2W9AlIaUUpRoFUuzaBZHQJ6PT3bmEGt1fZQoaAZoCWgPQwgIrYcvEzdyQJSGlFKUaBVLuGgWR0Cej4dVvMr3dX2UKGgGaAloD0MIGOsbmFx5c0CUhpRSlGgVS9RoFkdAnpBRyS3b23V9lChoBmgJaA9DCPUR+MMP03BAlIaUUpRoFUunaBZHQJ6Qyu3c5811fZQoaAZoCWgPQwglWvJ42sVvQJSGlFKUaBVLumgWR0CekNDwH7gsdX2UKGgGaAloD0MI/n4xW7IYcECUhpRSlGgVS7loFkdAnpFdipeeF3V9lChoBmgJaA9DCL9k48FW83BAlIaUUpRoFUu/aBZHQJ6TIbkwN9Z1fZQoaAZoCWgPQwgSEmkb/wZyQJSGlFKUaBVL2mgWR0CekzTot+TedX2UKGgGaAloD0MIU+knnJ2GcUCUhpRSlGgVS/BoFkdAnpM2AXl8xHV9lChoBmgJaA9DCOi/B6+dB3NAlIaUUpRoFUvdaBZHQJ6Tghje9Bd1fZQoaAZoCWgPQwi4rpgR3h1vQJSGlFKUaBVLo2gWR0Cek5UG3WnTdX2UKGgGaAloD0MICp3X2OWScUCUhpRSlGgVS9NoFkdAnpPB8QZn+XV9lChoBmgJaA9DCPqZet3iTHJAlIaUUpRoFUukaBZHQJ6UC8f3evZ1fZQoaAZoCWgPQwhv05/9yLFyQJSGlFKUaBVL1GgWR0CelOzGxUvPdX2UKGgGaAloD0MIn48y4kJ0cECUhpRSlGgVS7toFkdAnpUQBPsRhHV9lChoBmgJaA9DCIQPJVoyWXFAlIaUUpRoFUuqaBZHQJ6WY+7lJYl1fZQoaAZoCWgPQwha2T7kLbxwQJSGlFKUaBVLqGgWR0Celmqmj0tidX2UKGgGaAloD0MIhbUxdsJFcUCUhpRSlGgVS5VoFkdAnpaL1mJ3xHV9lChoBmgJaA9DCM8SZASUW3JAlIaUUpRoFUvDaBZHQJ6W+6shgVp1fZQoaAZoCWgPQwiTHRuBuC90QJSGlFKUaBVLtGgWR0CelwtHxz7udX2UKGgGaAloD0MIVDVB1L3WcUCUhpRSlGgVS8BoFkdAnpc16zE74nV9lChoBmgJaA9DCKSrdHedq25AlIaUUpRoFUuwaBZHQJ6XeJemelN1fZQoaAZoCWgPQwiIu3oVGW9vQJSGlFKUaBVLuWgWR0CemJXIEKVqdX2UKGgGaAloD0MIzse1oaLQcUCUhpRSlGgVS8JoFkdAnpjcDGLk0nV9lChoBmgJaA9DCH3O3a6XjXBAlIaUUpRoFUumaBZHQJ6ZuTcIqsl1fZQoaAZoCWgPQwhOet/4mnpxQJSGlFKUaBVLrGgWR0Cemd1Gb1AadX2UKGgGaAloD0MIi6azk0G6bkCUhpRSlGgVS7FoFkdAnpomDDjzZ3V9lChoBmgJaA9DCE7yI36FYXFAlIaUUpRoFUu8aBZHQJ6a0MOPNml1fZQoaAZoCWgPQwiiJvp8VJRxQJSGlFKUaBVLymgWR0Cem1DW9US7dX2UKGgGaAloD0MIeSRens5vcUCUhpRSlGgVS7poFkdAnptTxCpm3HV9lChoBmgJaA9DCN7n+Ghx0nFAlIaUUpRoFUvXaBZHQJ6beMm4RVZ1fZQoaAZoCWgPQwi7Cik/qZdtQJSGlFKUaBVLr2gWR0CenIkyk9EDdX2UKGgGaAloD0MIsz9QbhsJcUCUhpRSlGgVS75oFkdAnpyUAxSHd3VlLg=="
73
  },
74
  "ep_success_buffer": {
75
  ":type:": "<class 'collections.deque'>",
76
  ":serialized:": "gAWVIAAAAAAAAACMC2NvbGxlY3Rpb25zlIwFZGVxdWWUk5QpS2SGlFKULg=="
77
  },
78
+ "_n_updates": 540,
79
  "n_steps": 2048,
80
  "gamma": 0.99,
81
  "gae_lambda": 0.95,
ppo-LunarLander-v2/policy.optimizer.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:58ce81ffb1df1d0744c8efb0d6e1abc4f2e0d3d257994f15ea5555bd7cf7fbaa
3
  size 87929
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:1b6085d055d68d006f8477528243fe5fc985682426bef123cad2698701cfcbfc
3
  size 87929
ppo-LunarLander-v2/policy.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:aea9d585846c61662ab7e6b6f96532e5b114b02eadb910dfb28151c7f3750ffe
3
  size 43201
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:66039977789bf2843aabb27a2d437dae37b190178b6cc335cb2467459a364bb1
3
  size 43201
replay.mp4 CHANGED
Binary files a/replay.mp4 and b/replay.mp4 differ
 
results.json CHANGED
@@ -1 +1 @@
1
- {"mean_reward": 227.594549432059, "std_reward": 33.913351031198125, "is_deterministic": true, "n_eval_episodes": 10, "eval_datetime": "2022-12-23T15:36:06.565486"}
 
1
+ {"mean_reward": 270.3729659526125, "std_reward": 17.716298513489033, "is_deterministic": true, "n_eval_episodes": 10, "eval_datetime": "2022-12-24T08:44:57.099753"}