Upload PPO LunarLander-v2 trained agent with 1e6 total timesteps
Browse files- README.md +1 -1
- config.json +1 -1
- ppo_LunarLander-v2_vec_env.zip +2 -2
- ppo_LunarLander-v2_vec_env/data +4 -4
- ppo_LunarLander-v2_vec_env/policy.optimizer.pth +1 -1
- ppo_LunarLander-v2_vec_env/policy.pth +1 -1
- replay.mp4 +0 -0
- results.json +1 -1
README.md
CHANGED
|
@@ -16,7 +16,7 @@ model-index:
|
|
| 16 |
type: LunarLander-v2
|
| 17 |
metrics:
|
| 18 |
- type: mean_reward
|
| 19 |
-
value:
|
| 20 |
name: mean_reward
|
| 21 |
verified: false
|
| 22 |
---
|
|
|
|
| 16 |
type: LunarLander-v2
|
| 17 |
metrics:
|
| 18 |
- type: mean_reward
|
| 19 |
+
value: 230.65 +/- 65.94
|
| 20 |
name: mean_reward
|
| 21 |
verified: false
|
| 22 |
---
|
config.json
CHANGED
|
@@ -1 +1 @@
|
|
| 1 |
-
{"policy_class": {":type:": "<class 'abc.ABCMeta'>", ":serialized:": "gAWVOwAAAAAAAACMIXN0YWJsZV9iYXNlbGluZXMzLmNvbW1vbi5wb2xpY2llc5SMEUFjdG9yQ3JpdGljUG9saWN5lJOULg==", "__module__": "stable_baselines3.common.policies", "__doc__": "\n Policy class for actor-critic algorithms (has both policy and value prediction).\n Used by A2C, PPO and the likes.\n\n :param observation_space: Observation space\n :param action_space: Action space\n :param lr_schedule: Learning rate schedule (could be constant)\n :param net_arch: The specification of the policy and value networks.\n :param activation_fn: Activation function\n :param ortho_init: Whether to use or not orthogonal initialization\n :param use_sde: Whether to use State Dependent Exploration or not\n :param log_std_init: Initial value for the log standard deviation\n :param full_std: Whether to use (n_features x n_actions) parameters\n for the std instead of only (n_features,) when using gSDE\n :param use_expln: Use ``expln()`` function instead of ``exp()`` to ensure\n a positive standard deviation (cf paper). It allows to keep variance\n above zero and prevent it from growing too fast. In practice, ``exp()`` is usually enough.\n :param squash_output: Whether to squash the output using a tanh function,\n this allows to ensure boundaries when using gSDE.\n :param features_extractor_class: Features extractor to use.\n :param features_extractor_kwargs: Keyword arguments\n to pass to the features extractor.\n :param share_features_extractor: If True, the features extractor is shared between the policy and value networks.\n :param normalize_images: Whether to normalize images or not,\n dividing by 255.0 (True by default)\n :param optimizer_class: The optimizer to use,\n ``th.optim.Adam`` by default\n :param optimizer_kwargs: Additional keyword arguments,\n excluding the learning rate, to pass to the optimizer\n ", "__init__": "<function ActorCriticPolicy.__init__ at 0x7a1cd0b5feb0>", "_get_constructor_parameters": "<function ActorCriticPolicy._get_constructor_parameters at 0x7a1cd0b5ff40>", "reset_noise": "<function ActorCriticPolicy.reset_noise at 0x7a1cd0b64040>", "_build_mlp_extractor": "<function ActorCriticPolicy._build_mlp_extractor at 0x7a1cd0b640d0>", "_build": "<function ActorCriticPolicy._build at 0x7a1cd0b64160>", "forward": "<function ActorCriticPolicy.forward at 0x7a1cd0b641f0>", "extract_features": "<function ActorCriticPolicy.extract_features at 0x7a1cd0b64280>", "_get_action_dist_from_latent": "<function ActorCriticPolicy._get_action_dist_from_latent at 0x7a1cd0b64310>", "_predict": "<function ActorCriticPolicy._predict at 0x7a1cd0b643a0>", "evaluate_actions": "<function ActorCriticPolicy.evaluate_actions at 0x7a1cd0b64430>", "get_distribution": "<function ActorCriticPolicy.get_distribution at 0x7a1cd0b644c0>", "predict_values": "<function ActorCriticPolicy.predict_values at 0x7a1cd0b64550>", "__abstractmethods__": "frozenset()", "_abc_impl": "<_abc._abc_data object at 0x7a1cd0aedbc0>"}, "verbose": 1, "policy_kwargs": {}, "num_timesteps": 1015808, "_total_timesteps": 1000000, "_num_timesteps_at_start": 0, "seed": null, "action_noise": null, "start_time": 1734951495033123187, "learning_rate": 0.0002, "tensorboard_log": null, "_last_obs": null, "_last_episode_starts": {":type:": "<class 'numpy.ndarray'>", ":serialized:": "gAWVgwAAAAAAAACMEm51bXB5LmNvcmUubnVtZXJpY5SMC19mcm9tYnVmZmVylJOUKJYQAAAAAAAAAAAAAAAAAAAAAAAAAAAAAACUjAVudW1weZSMBWR0eXBllJOUjAJiMZSJiIeUUpQoSwOMAXyUTk5OSv////9K/////0sAdJRiSxCFlIwBQ5R0lFKULg=="}, "_last_original_obs": null, "_episode_num": 0, "use_sde": false, "sde_sample_freq": -1, "_current_progress_remaining": -0.015808000000000044, "_stats_window_size": 100, "ep_info_buffer": {":type:": "<class 'collections.deque'>", ":serialized:": "gAWVHQwAAAAAAACMC2NvbGxlY3Rpb25zlIwFZGVxdWWUk5QpS2SGlFKUKH2UKIwBcpRHQG/VsXrMTvmMAWyUTXUBjAF0lEdAoUnczbeuWHV9lChoBkdAbsCRISUTtmgHS/loCEdAoUrAP7N0NnV9lChoBkdAcAU52hZha2gHTQABaAhHQKFLiHoHLRt1fZQoaAZHQG5X84o7V8VoB01LA2gIR0ChTDci4axYdX2UKGgGR0Bw+fWnTAnEaAdNGAFoCEdAoUzfaYeDF3V9lChoBkdAYcJLhaTwD2gHTegDaAhHQKFNuGY8dPt1fZQoaAZHQG6xTEJjUd9oB00VAWgIR0ChTkfhuO0cdX2UKGgGR0Bw8gRnOB1+aAdNEAFoCEdAoU565AhStXV9lChoBkdAakh2EkB0ZGgHTQkBaAhHQKFO02BreqJ1fZQoaAZHQHDcT9OymhxoB02qAmgIR0ChT716Vt4zdX2UKGgGR0Bs+g6uGKyfaAdNGgFoCEdAoVCG4PPLPnV9lChoBkdAbVgoDPnjhmgHS+doCEdAoVGe8qWkanV9lChoBkdAbsWFsYVIqmgHS+NoCEdAoVStOwgTy3V9lChoBkdAbXoc94eLemgHTTMBaAhHQKFXV6WPcSJ1fZQoaAZHQG4u38GcFyJoB0vqaAhHQKFYmrmyPdV1fZQoaAZHQHJZc6vJRwZoB00YAWgIR0ChWKZxiobXdX2UKGgGR0BhHI6ZH/cWaAdN6ANoCEdAoVinpfQa73V9lChoBkdAcbdaPS2H+WgHTQwBaAhHQKFYyICU5dZ1fZQoaAZHQHEjQ8W9DhNoB025AWgIR0ChWUSOJcgRdX2UKGgGR0BiBHc580DVaAdN6ANoCEdAoVomdXko4XV9lChoBkdAb6Mll9SdfGgHTQYBaAhHQKGZKdq+Jxh1fZQoaAZHQG741ie/YapoB0vwaAhHQKGZoE+Pikx1fZQoaAZHQHBjPIwM6R1oB028AWgIR0Chmg4/u9eydX2UKGgGR0BiJODUVi4KaAdN6ANoCEdAoZrhywOe8XV9lChoBkdAcVOQpF1B+mgHS/hoCEdAoZw+3Ytg8nV9lChoBkdAbdiwBYFJQWgHS/RoCEdAoZ2/TmW+oXV9lChoBkdAQcm4b0e2eGgHS+loCEdAoZ43pW3jMnV9lChoBkdAcZWZfUnXumgHTTkCaAhHQKGf2MG5c1R1fZQoaAZHQFyX+AVfu1FoB03oA2gIR0ChoAb0WdmQdX2UKGgGR0By9D9itq59aAdNJgFoCEdAoaA2Qr+YMXV9lChoBkdAbulfw7T2FmgHS/poCEdAoaCXsXzlLnV9lChoBkdAcDnm2b5M12gHTTMBaAhHQKGg+NhE0BR1fZQoaAZHQHDS8r/bTMJoB00PAWgIR0ChocA3cYZVdX2UKGgGR0Bt36ohpxm1aAdNYQFoCEdAoaIUxdpqRHV9lChoBkdAcCpPJq7AcmgHS/hoCEdAoaJ3vlU6xXV9lChoBkdAbvYkQf6oEWgHTZcBaAhHQKGksLiMo+h1fZQoaAZHQHBe/fsNUfhoB0vVaAhHQKGk0wgTyrh1fZQoaAZHQG8GSq2jO9poB0v2aAhHQKGlbDG96C11fZQoaAZHQG12nbRF7UpoB0vraAhHQKGnSw8GLUF1fZQoaAZHQGBTjx0+1ShoB03oA2gIR0Chp2fjS5RTdX2UKGgGR0BpyX+S8rZraAdNcQFoCEdAoafirJbMYHV9lChoBkdAcTzCQcPvrmgHS+NoCEdAoahEep4r0HV9lChoBkdAcTghib2DhGgHTQoBaAhHQKGouTt9hJB1fZQoaAZHQHAZbvCuU2VoB0vqaAhHQKGp/fZVXFN1fZQoaAZHQGBluwxFiKBoB03oA2gIR0Chq1z+WGATdX2UKGgGR0Bw+XY+Sr5qaAdL52gIR0ChrZIDgZTAdX2UKGgGR0BwSuJBPbfxaAdNHQFoCEdAobCQwCbMHXV9lChoBkdAbtlIcR15jmgHS/ZoCEdAobFA7YChe3V9lChoBkdAbfG96C17Y2gHTQIBaAhHQKGyh/nW8RN1fZQoaAZHQGyNC+De0oloB00KAmgIR0Chs2SV4X41dX2UKGgGR0BuyDjYI0IkaAdL8WgIR0Chs3O+RHPNdX2UKGgGR0Bs+pK3/givaAdN3AFoCEdAobPt85S3s3V9lChoBkdAcK/wD/2kBWgHS/doCEdAobTF54W1t3V9lChoBkdAcRs+sHSncmgHTXsBaAhHQKG2YkCV8kV1fZQoaAZHQG+GeqR2bG5oB00aAWgIR0Cht6kPczqKdX2UKGgGR0BiZbb8FY+0aAdN6ANoCEdAobkxSeiBXnV9lChoBkdAcBpDuBtk4GgHS+BoCEdAobu0rsjVx3V9lChoBkdAb/+zZ6D5CWgHTQIBaAhHQKG8U2OQyRB1fZQoaAZHQFwAe3hGYrtoB03oA2gIR0ChvGzWGyoodX2UKGgGR0BsOUpy6tknaAdNGgFoCEdAob1Hu5SWJXV9lChoBkdAcHTH5aePJmgHTakCaAhHQKG90L2pQ1t1fZQoaAZHQGvmAuAZsKtoB0v9aAhHQKG/VWBjFyd1fZQoaAZHQG297LEDQqtoB0veaAhHQKG/kk5ZKWd1fZQoaAZHQEHTIMjNY8xoB0vTaAhHQKHAvDej2zx1fZQoaAZHQGOcNwzch1VoB03oA2gIR0Chw3iyQgcMdX2UKGgGR0BhmZNfw7T2aAdN6ANoCEdAocaNMIu5BnV9lChoBkdAb7Y/9Hc1wmgHTQMBaAhHQKHGw3c580F1fZQoaAZHQHASubiIcipoB00mAWgIR0Chx5s8HObBdX2UKGgGR0BwPsrlNlAeaAdL/WgIR0Chx7TBRAKOdX2UKGgGR0BstjASFoL5aAdL9mgIR0ChyA5AQg9vdX2UKGgGR0BtAMW69TP0aAdL5WgIR0ChyUNz8xbjdX2UKGgGR0BtgV/Ue+23aAdL6GgIR0ChybS5I6KcdX2UKGgGR0BwQZSUC7sfaAdL6mgIR0ChzavpY9xIdX2UKGgGR0BiSZkoWpIdaAdN6ANoCEdAoc34KlYU4HV9lChoBkdAYPBJeVs1sWgHTegDaAhHQKHPFB8hLXd1fZQoaAZHQGwWAogFHJ9oB00DA2gIR0Chz7og/1QJdX2UKGgGR0BubjVFx4puaAdL62gIR0Chz+oaLn9vdX2UKGgGR0BwkAhGH58CaAdL4WgIR0Ch0CW/i5uqdX2UKGgGR0BwAVGQSzw+aAdL82gIR0Ch0OXSSeRQdX2UKGgGR0BxY5mmLtNSaAdL/mgIR0Ch0OxMFlkIdX2UKGgGR0BxeaotL+PzaAdL52gIR0Ch0VqzZ6D5dX2UKGgGR0BtLN4NZvDQaAdNhANoCEdAodHfF98Z1nV9lChoBkdAb3tQswtap2gHTXQDaAhHQKHR+CvovBd1fZQoaAZHQG5GBHLA57xoB00+AWgIR0Ch0i6dDpkgdX2UKGgGR0BtkpLK3d9EaAdNHQFoCEdAodLqqOtGNXV9lChoBkdAMzBLbpNbkmgHS9poCEdAodQrcqOLi3V9lChoBkdAcPV3VkMCtGgHS/RoCEdAodSbhisnzHV9lChoBkdAb7ukVvddmmgHS+RoCEdAodYT4L1EmnV9lChoBkdAb+gC4Bmwq2gHTQQBaAhHQKHWVuejEeh1fZQoaAZHQHC3ukHlfZ5oB0v/aAhHQKHXF/vv0Ad1fZQoaAZHQHBvNaEBbOhoB00WAWgIR0Ch12wfhddFdX2UKGgGR0BhWZ9gF5fMaAdN6ANoCEdAodfhP/JeV3V9lChoBkdAcU90MPSUkmgHS+FoCEdAodgMqMFUynV9lChoBkdAcK/jGkvboWgHS+doCEdAodglg6U7jnV9lChoBkdAcTfz+FUQ1GgHTQMBaAhHQKHYXHS4OMF1fZQoaAZHQG/BQlKK509oB00AAWgIR0Ch2ggYpDu0dX2UKGgGR0BvWCUNayKOaAdNSQFoCEdAodsllmOENHV9lChoBkdAcFLHyEtdzGgHTSgBaAhHQKHdMGRFI/Z1fZQoaAZHQGEYiO3lS0loB03oA2gIR0Ch3jPBi1ArdX2UKGgGR0Bv0qb6P8yfaAdNWAFoCEdAod5BntfG/HVlLg=="}, "ep_success_buffer": {":type:": "<class 'collections.deque'>", ":serialized:": "gAWVIAAAAAAAAACMC2NvbGxlY3Rpb25zlIwFZGVxdWWUk5QpS2SGlFKULg=="}, "_n_updates": 310, "observation_space": {":type:": "<class 'gymnasium.spaces.box.Box'>", ":serialized:": "gAWVdgIAAAAAAACMFGd5bW5hc2l1bS5zcGFjZXMuYm94lIwDQm94lJOUKYGUfZQojAVkdHlwZZSMBW51bXB5lIwFZHR5cGWUk5SMAmY0lImIh5RSlChLA4wBPJROTk5K/////0r/////SwB0lGKMDWJvdW5kZWRfYmVsb3eUjBJudW1weS5jb3JlLm51bWVyaWOUjAtfZnJvbWJ1ZmZlcpSTlCiWCAAAAAAAAAABAQEBAQEBAZRoCIwCYjGUiYiHlFKUKEsDjAF8lE5OTkr/////Sv////9LAHSUYksIhZSMAUOUdJRSlIwNYm91bmRlZF9hYm92ZZRoESiWCAAAAAAAAAABAQEBAQEBAZRoFUsIhZRoGXSUUpSMBl9zaGFwZZRLCIWUjANsb3eUaBEoliAAAAAAAAAAAAC0wgAAtMIAAKDAAACgwNsPScAAAKDAAAAAgAAAAICUaAtLCIWUaBl0lFKUjARoaWdolGgRKJYgAAAAAAAAAAAAtEIAALRCAACgQAAAoEDbD0lAAACgQAAAgD8AAIA/lGgLSwiFlGgZdJRSlIwIbG93X3JlcHKUjFtbLTkwLiAgICAgICAgLTkwLiAgICAgICAgIC01LiAgICAgICAgIC01LiAgICAgICAgIC0zLjE0MTU5MjcgIC01LgogIC0wLiAgICAgICAgIC0wLiAgICAgICBdlIwJaGlnaF9yZXBylIxTWzkwLiAgICAgICAgOTAuICAgICAgICAgNS4gICAgICAgICA1LiAgICAgICAgIDMuMTQxNTkyNyAgNS4KICAxLiAgICAgICAgIDEuICAgICAgIF2UjApfbnBfcmFuZG9tlE51Yi4=", "dtype": "float32", "bounded_below": "[ True True True True True True True True]", "bounded_above": "[ True True True True True True True True]", "_shape": [8], "low": "[-90. -90. -5. -5. -3.1415927 -5.\n -0. -0. ]", "high": "[90. 90. 5. 5. 3.1415927 5.\n 1. 1. ]", "low_repr": "[-90. -90. -5. -5. -3.1415927 -5.\n -0. -0. ]", "high_repr": "[90. 90. 5. 5. 3.1415927 5.\n 1. 1. ]", "_np_random": null}, "action_space": {":type:": "<class 'gymnasium.spaces.discrete.Discrete'>", ":serialized:": "gAWV/QAAAAAAAACMGWd5bW5hc2l1bS5zcGFjZXMuZGlzY3JldGWUjAhEaXNjcmV0ZZSTlCmBlH2UKIwBbpSMFW51bXB5LmNvcmUubXVsdGlhcnJheZSMBnNjYWxhcpSTlIwFbnVtcHmUjAVkdHlwZZSTlIwCaTiUiYiHlFKUKEsDjAE8lE5OTkr/////Sv////9LAHSUYkMIBAAAAAAAAACUhpRSlIwFc3RhcnSUaAhoDkMIAAAAAAAAAACUhpRSlIwGX3NoYXBllCmMBWR0eXBllGgLjAJpOJSJiIeUUpQoSwNoD05OTkr/////Sv////9LAHSUYowKX25wX3JhbmRvbZROdWIu", "n": "4", "start": "0", "_shape": [], "dtype": "int64", "_np_random": null}, "n_envs": 1, "n_steps": 2048, "gamma": 0.99, "gae_lambda": 0.95, "ent_coef": 0.0, "vf_coef": 0.5, "max_grad_norm": 0.5, "batch_size": 64, "n_epochs": 10, "clip_range": {":type:": "<class 'function'>", ":serialized:": "gAWVrQIAAAAAAACMF2Nsb3VkcGlja2xlLmNsb3VkcGlja2xllIwOX21ha2VfZnVuY3Rpb26Uk5QoaACMDV9idWlsdGluX3R5cGWUk5SMCENvZGVUeXBllIWUUpQoSwFLAEsASwFLAUsTQwSIAFMAlE6FlCmMAV+UhZSMSS91c3IvbG9jYWwvbGliL3B5dGhvbjMuMTAvZGlzdC1wYWNrYWdlcy9zdGFibGVfYmFzZWxpbmVzMy9jb21tb24vdXRpbHMucHmUjARmdW5jlEuEQwIEAZSMA3ZhbJSFlCl0lFKUfZQojAtfX3BhY2thZ2VfX5SMGHN0YWJsZV9iYXNlbGluZXMzLmNvbW1vbpSMCF9fbmFtZV9flIwec3RhYmxlX2Jhc2VsaW5lczMuY29tbW9uLnV0aWxzlIwIX19maWxlX1+UjEkvdXNyL2xvY2FsL2xpYi9weXRob24zLjEwL2Rpc3QtcGFja2FnZXMvc3RhYmxlX2Jhc2VsaW5lczMvY29tbW9uL3V0aWxzLnB5lHVOTmgAjBBfbWFrZV9lbXB0eV9jZWxslJOUKVKUhZR0lFKUaACMEl9mdW5jdGlvbl9zZXRzdGF0ZZSTlGgffZR9lChoFowEZnVuY5SMDF9fcXVhbG5hbWVfX5SMGWNvbnN0YW50X2ZuLjxsb2NhbHM+LmZ1bmOUjA9fX2Fubm90YXRpb25zX1+UfZSMDl9fa3dkZWZhdWx0c19flE6MDF9fZGVmYXVsdHNfX5ROjApfX21vZHVsZV9flGgXjAdfX2RvY19flE6MC19fY2xvc3VyZV9flGgAjApfbWFrZV9jZWxslJOURz/JmZmZmZmahZRSlIWUjBdfY2xvdWRwaWNrbGVfc3VibW9kdWxlc5RdlIwLX19nbG9iYWxzX1+UfZR1hpSGUjAu"}, "clip_range_vf": null, "normalize_advantage": true, "target_kl": null, "lr_schedule": {":type:": "<class 'function'>", ":serialized:": "gAWVrQIAAAAAAACMF2Nsb3VkcGlja2xlLmNsb3VkcGlja2xllIwOX21ha2VfZnVuY3Rpb26Uk5QoaACMDV9idWlsdGluX3R5cGWUk5SMCENvZGVUeXBllIWUUpQoSwFLAEsASwFLAUsTQwSIAFMAlE6FlCmMAV+UhZSMSS91c3IvbG9jYWwvbGliL3B5dGhvbjMuMTAvZGlzdC1wYWNrYWdlcy9zdGFibGVfYmFzZWxpbmVzMy9jb21tb24vdXRpbHMucHmUjARmdW5jlEuEQwIEAZSMA3ZhbJSFlCl0lFKUfZQojAtfX3BhY2thZ2VfX5SMGHN0YWJsZV9iYXNlbGluZXMzLmNvbW1vbpSMCF9fbmFtZV9flIwec3RhYmxlX2Jhc2VsaW5lczMuY29tbW9uLnV0aWxzlIwIX19maWxlX1+UjEkvdXNyL2xvY2FsL2xpYi9weXRob24zLjEwL2Rpc3QtcGFja2FnZXMvc3RhYmxlX2Jhc2VsaW5lczMvY29tbW9uL3V0aWxzLnB5lHVOTmgAjBBfbWFrZV9lbXB0eV9jZWxslJOUKVKUhZR0lFKUaACMEl9mdW5jdGlvbl9zZXRzdGF0ZZSTlGgffZR9lChoFowEZnVuY5SMDF9fcXVhbG5hbWVfX5SMGWNvbnN0YW50X2ZuLjxsb2NhbHM+LmZ1bmOUjA9fX2Fubm90YXRpb25zX1+UfZSMDl9fa3dkZWZhdWx0c19flE6MDF9fZGVmYXVsdHNfX5ROjApfX21vZHVsZV9flGgXjAdfX2RvY19flE6MC19fY2xvc3VyZV9flGgAjApfbWFrZV9jZWxslJOURz8qNuLrHEMthZRSlIWUjBdfY2xvdWRwaWNrbGVfc3VibW9kdWxlc5RdlIwLX19nbG9iYWxzX1+UfZR1hpSGUjAu"}, "system_info": {"OS": "Linux-6.1.85+-x86_64-with-glibc2.35 # 1 SMP PREEMPT_DYNAMIC Thu Jun 27 21:05:47 UTC 2024", "Python": "3.10.12", "Stable-Baselines3": "2.0.0a5", "PyTorch": "2.5.1+cu121", "GPU Enabled": "False", "Numpy": "1.26.4", "Cloudpickle": "3.1.0", "Gymnasium": "0.28.1", "OpenAI Gym": "0.25.2"}}
|
|
|
|
| 1 |
+
{"policy_class": {":type:": "<class 'abc.ABCMeta'>", ":serialized:": "gAWVOwAAAAAAAACMIXN0YWJsZV9iYXNlbGluZXMzLmNvbW1vbi5wb2xpY2llc5SMEUFjdG9yQ3JpdGljUG9saWN5lJOULg==", "__module__": "stable_baselines3.common.policies", "__doc__": "\n Policy class for actor-critic algorithms (has both policy and value prediction).\n Used by A2C, PPO and the likes.\n\n :param observation_space: Observation space\n :param action_space: Action space\n :param lr_schedule: Learning rate schedule (could be constant)\n :param net_arch: The specification of the policy and value networks.\n :param activation_fn: Activation function\n :param ortho_init: Whether to use or not orthogonal initialization\n :param use_sde: Whether to use State Dependent Exploration or not\n :param log_std_init: Initial value for the log standard deviation\n :param full_std: Whether to use (n_features x n_actions) parameters\n for the std instead of only (n_features,) when using gSDE\n :param use_expln: Use ``expln()`` function instead of ``exp()`` to ensure\n a positive standard deviation (cf paper). It allows to keep variance\n above zero and prevent it from growing too fast. In practice, ``exp()`` is usually enough.\n :param squash_output: Whether to squash the output using a tanh function,\n this allows to ensure boundaries when using gSDE.\n :param features_extractor_class: Features extractor to use.\n :param features_extractor_kwargs: Keyword arguments\n to pass to the features extractor.\n :param share_features_extractor: If True, the features extractor is shared between the policy and value networks.\n :param normalize_images: Whether to normalize images or not,\n dividing by 255.0 (True by default)\n :param optimizer_class: The optimizer to use,\n ``th.optim.Adam`` by default\n :param optimizer_kwargs: Additional keyword arguments,\n excluding the learning rate, to pass to the optimizer\n ", "__init__": "<function ActorCriticPolicy.__init__ at 0x7a1cd0b5feb0>", "_get_constructor_parameters": "<function ActorCriticPolicy._get_constructor_parameters at 0x7a1cd0b5ff40>", "reset_noise": "<function ActorCriticPolicy.reset_noise at 0x7a1cd0b64040>", "_build_mlp_extractor": "<function ActorCriticPolicy._build_mlp_extractor at 0x7a1cd0b640d0>", "_build": "<function ActorCriticPolicy._build at 0x7a1cd0b64160>", "forward": "<function ActorCriticPolicy.forward at 0x7a1cd0b641f0>", "extract_features": "<function ActorCriticPolicy.extract_features at 0x7a1cd0b64280>", "_get_action_dist_from_latent": "<function ActorCriticPolicy._get_action_dist_from_latent at 0x7a1cd0b64310>", "_predict": "<function ActorCriticPolicy._predict at 0x7a1cd0b643a0>", "evaluate_actions": "<function ActorCriticPolicy.evaluate_actions at 0x7a1cd0b64430>", "get_distribution": "<function ActorCriticPolicy.get_distribution at 0x7a1cd0b644c0>", "predict_values": "<function ActorCriticPolicy.predict_values at 0x7a1cd0b64550>", "__abstractmethods__": "frozenset()", "_abc_impl": "<_abc._abc_data object at 0x7a1cd0aedbc0>"}, "verbose": 1, "policy_kwargs": {}, "num_timesteps": 1015808, "_total_timesteps": 1000000, "_num_timesteps_at_start": 0, "seed": null, "action_noise": null, "start_time": 1734958162878472251, "learning_rate": 0.0003, "tensorboard_log": null, "_last_obs": null, "_last_episode_starts": {":type:": "<class 'numpy.ndarray'>", ":serialized:": "gAWVgwAAAAAAAACMEm51bXB5LmNvcmUubnVtZXJpY5SMC19mcm9tYnVmZmVylJOUKJYQAAAAAAAAAAAAAAAAAAAAAAAAAAAAAACUjAVudW1weZSMBWR0eXBllJOUjAJiMZSJiIeUUpQoSwOMAXyUTk5OSv////9K/////0sAdJRiSxCFlIwBQ5R0lFKULg=="}, "_last_original_obs": null, "_episode_num": 0, "use_sde": false, "sde_sample_freq": -1, "_current_progress_remaining": -0.015808000000000044, "_stats_window_size": 100, "ep_info_buffer": {":type:": "<class 'collections.deque'>", ":serialized:": "gAWVQAwAAAAAAACMC2NvbGxlY3Rpb25zlIwFZGVxdWWUk5QpS2SGlFKUKH2UKIwBcpRHQG5yYgzP8huMAWyUTQsBjAF0lEdAoxRy9M9KVnV9lChoBkdAcbVbobGWEGgHTScBaAhHQKMU1KcNH6N1fZQoaAZHQGxjuW0JF9doB00UAWgIR0CjFlasp5NXdX2UKGgGR0BhPnQBxPweaAdN6ANoCEdAoxZ27J4jbHV9lChoBkdAb2GiYb83uWgHTRwBaAhHQKMW1qsU7CB1fZQoaAZHQHGTH/Pw/gRoB00mAWgIR0CjF0JkGzKLdX2UKGgGR0BhmmXqqwQlaAdN6ANoCEdAoxjXqeK8+XV9lChoBkdAbVsrYoRZlmgHTRMBaAhHQKMZK7LdN351fZQoaAZHQGHN73fyf+VoB03oA2gIR0CjGZmM4tHydX2UKGgGR0Bu/OFev6j4aAdN5gJoCEdAoxuEXSBsh3V9lChoBkdAcCIx/ustCmgHTTUCaAhHQKMbr5O8Cgd1fZQoaAZHQHHFDMibDuVoB00vAWgIR0CjG9nxBmf5dX2UKGgGR0BwLn+n62v0aAdNCgFoCEdAox2RqsU7CHV9lChoBkdAb4EhM8HObGgHTdgBaAhHQKMd2I55qud1fZQoaAZHQHG71sHjZL9oB00vAWgIR0CjHw12Rq46dX2UKGgGR0BwvQPOIInjaAdNCgFoCEdAox87IRywOnV9lChoBkdAbwUH31zySWgHTR0BaAhHQKMfvGn4wh51fZQoaAZHQHFzCIk7fYVoB00TAWgIR0CjaPpNTLntdX2UKGgGR0BwLj1nM+vAaAdNJAFoCEdAo2kXGwRoRXV9lChoBkdAbBEXMQmNR2gHTRgBaAhHQKNqy0GeMAF1fZQoaAZHQHFjmc8TzupoB00oAWgIR0CjavQn6VMVdX2UKGgGR0BgF8idJ8OTaAdN6ANoCEdAo20Q0ZWJanV9lChoBkdAcI4p+MIeHWgHTSUBaAhHQKNtcsTWXkZ1fZQoaAZHQHDkL9uP3i9oB01UAWgIR0Cjby1YhdMTdX2UKGgGR0Bf+UelsP8RaAdN6ANoCEdAo2/3nB+F13V9lChoBkdAcMcbLEDQq2gHTS4BaAhHQKNwO4rjHXF1fZQoaAZHQHFEt/FzdUNoB00PAWgIR0CjcKuv+wTudX2UKGgGR0BvaRR/EwWWaAdNRwFoCEdAo3DOGIsRQXV9lChoBkdAcP5q33Hq/2gHTQcBaAhHQKNxZr/sE7p1fZQoaAZHQG++7HIZIhBoB00uAWgIR0CjcX181Gb1dX2UKGgGR0BwWrvw3HaOaAdNUwFoCEdAo3QQt4A0bnV9lChoBkdAcEyAdn0032gHTS8CaAhHQKN0WUY8+zN1fZQoaAZHQG/yjHOryUdoB01EAWgIR0CjdaTzVc2SdX2UKGgGR0BgeUygwoLHaAdN6ANoCEdAo3YmHck+o3V9lChoBkdAcGDBnBciW2gHTQwBaAhHQKN2ZcvduYR1fZQoaAZHQHETkPlMh5hoB03HAWgIR0CjdyJfhMrVdX2UKGgGR0BubURL9MsZaAdNBQFoCEdAo3fkFyJbdXV9lChoBkdAchj2ZAprlGgHTRQBaAhHQKN5GrK/2011fZQoaAZHQCQR2dNFjNJoB00PAWgIR0CjeTFQl8gIdX2UKGgGR0Brw5yQxN7CaAdNJAFoCEdAo3qAY1pCbHV9lChoBkdAbqnfsu3+dmgHTY4BaAhHQKN6jZXdTHd1fZQoaAZHQHDPCqIacZtoB00rAWgIR0Cje/wvg3tKdX2UKGgGR0BxORwKjSG8aAdNaQFoCEdAo32pCBwuNHV9lChoBkdAbFBa6BiCrmgHTRUBaAhHQKN+eXE61b91fZQoaAZHQG9Txj8UEgZoB01JAmgIR0Cjf6h68g6mdX2UKGgGR0BIEdPLxI8RaAdL9GgIR0CjgB52IO6NdX2UKGgGR0ByWde6Zpi7aAdNEgFoCEdAo4CDdk8RtnV9lChoBkdAcJfkuYhMamgHTREBaAhHQKOCyvqTr3V1fZQoaAZHQHDEZM10knloB00eAWgIR0CjhEWCmMwUdX2UKGgGR0BtCvjfek57aAdNGQFoCEdAo4VLj1f3OHV9lChoBkdAcF5z5XU6P2gHTQMBaAhHQKOHGk5ZKWd1fZQoaAZHQHCCP+0gKWtoB008AWgIR0CjiAU4BFNMdX2UKGgGR0Bb/Tspobn6aAdN6ANoCEdAo4h7p1RtQHV9lChoBkdAcMkNutOmBWgHTTQBaAhHQKOKT1IRRMx1fZQoaAZHQGuHBl+Vkc1oB00TAWgIR0CjiqmBOHnEdX2UKGgGR0BxiqvW6K+BaAdNDQFoCEdAo4rLlA/s3XV9lChoBkdAbKrlGPPszGgHTQcBaAhHQKOK5YChew91fZQoaAZHQHIhE8eS0ShoB01FAWgIR0Cji2LMs6JZdX2UKGgGR0BvLr79AHE/aAdNOQFoCEdAo44ESVW0Z3V9lChoBkdAcM9XSjQAuWgHTRYBaAhHQKOO9um78Nx1fZQoaAZHQHAF6J/G2kVoB007AWgIR0Cjjy/G2kSFdX2UKGgGR0Bv+yXyAhB7aAdL/2gIR0CjkMAiml67dX2UKGgGR0Bunc7yQPqcaAdNKgFoCEdAo5F3mDDjznV9lChoBkdAbJzFn7Hhj2gHTRMBaAhHQKOSF5qM3qB1fZQoaAZHQHIKSon8baRoB00FAWgIR0Cjk2lpoK2KdX2UKGgGR0Buk2qkuYhMaAdNCgFoCEdAo5RWKfnOjnV9lChoBkdAbKcdCE6DG2gHTR8BaAhHQKOU8UJOWSl1fZQoaAZHQHHlKHoHLRtoB00bAWgIR0CjlY/Q0GeMdX2UKGgGR0Bef3G8274BaAdN6ANoCEdAo5bgkZ75VXV9lChoBkdAbIJeBxxT9GgHTSIBaAhHQKOYzu63AmB1fZQoaAZHQHEpAR9PUKBoB00OAWgIR0CjmYp2ECeVdX2UKGgGR0BxGGVzIV/MaAdNGwFoCEdAo5npuyeI23V9lChoBkdAXfLb212JSGgHTegDaAhHQKOaypfhMrV1fZQoaAZHQFvhLidat9xoB03oA2gIR0CjnUzXz19OdX2UKGgGR0BvuZHf/FR6aAdNJwFoCEdAo53mf/WDpXV9lChoBkdAbvNyq+8Gs2gHTTUBaAhHQKOfPorWiDd1fZQoaAZHQHG1rX6InBtoB00iAWgIR0CjoB9QoCuEdX2UKGgGR0BiHHlZHNHIaAdN6ANoCEdAo6Gao/A0sXV9lChoBkdAbL6FQl8gIWgHTR4BaAhHQKOhts/pt791fZQoaAZHQHCBacVgx8FoB00+AWgIR0Cjoid2ovSMdX2UKGgGR0BuERON5t3waAdNJAFoCEdAo6JgNRWLgnV9lChoBkdAYtlWKdhAnmgHTegDaAhHQKOirteD3/R1fZQoaAZHQHFjeIEbHZNoB0v7aAhHQKOkGn2qT8p1fZQoaAZHQHELUl3Qla9oB00fAWgIR0CjpLQ9A5aNdX2UKGgGR0BtMTnzQNTcaAdNIAFoCEdAo6VOkP+XJHV9lChoBkdAbcN3aBZpz2gHTSsBaAhHQKOmRWluWKN1fZQoaAZHQHCQ+k56t1ZoB00yAWgIR0CjqB8AzYVZdX2UKGgGR0Bx95Grjo6kaAdNHwFoCEdAo6jJCY1HfHV9lChoBkdAcKHvUBnzx2gHTUEBaAhHQKOo7NN8E3d1fZQoaAZHQHAWVzhgmZ5oB00lAWgIR0CjqYi0v4/NdX2UKGgGR0Bw8mKWLP2PaAdNDwFoCEdAo6oJkmQbM3V9lChoBkdAcRb2ECeVcGgHS/loCEdAo6pm0Re1KHV9lChoBkdAbxz4EfT1CmgHTTEBaAhHQKOq8/Rmbsp1fZQoaAZHQHA+kAYHgP5oB00nAWgIR0Cjqyc7QswtdX2UKGgGR0ByvPq5byH3aAdNDQFoCEdAo620bFS88XV9lChoBkdAcVb1zySV4WgHTTwBaAhHQKOt2sdT5wh1fZQoaAZHQHCQcinpB5ZoB00CAWgIR0CjrlBk7OmjdX2UKGgGR0BgTHcSGrS3aAdN6ANoCEdAo66tTLns9nV9lChoBkdAb0ipn6Eal2gHTREBaAhHQKOxT6xgRbt1fZQoaAZHQG05Aqd6LO1oB00fAWgIR0CjshXgUDdQdWUu"}, "ep_success_buffer": {":type:": "<class 'collections.deque'>", ":serialized:": "gAWVIAAAAAAAAACMC2NvbGxlY3Rpb25zlIwFZGVxdWWUk5QpS2SGlFKULg=="}, "_n_updates": 310, "observation_space": {":type:": "<class 'gymnasium.spaces.box.Box'>", ":serialized:": "gAWVdgIAAAAAAACMFGd5bW5hc2l1bS5zcGFjZXMuYm94lIwDQm94lJOUKYGUfZQojAVkdHlwZZSMBW51bXB5lIwFZHR5cGWUk5SMAmY0lImIh5RSlChLA4wBPJROTk5K/////0r/////SwB0lGKMDWJvdW5kZWRfYmVsb3eUjBJudW1weS5jb3JlLm51bWVyaWOUjAtfZnJvbWJ1ZmZlcpSTlCiWCAAAAAAAAAABAQEBAQEBAZRoCIwCYjGUiYiHlFKUKEsDjAF8lE5OTkr/////Sv////9LAHSUYksIhZSMAUOUdJRSlIwNYm91bmRlZF9hYm92ZZRoESiWCAAAAAAAAAABAQEBAQEBAZRoFUsIhZRoGXSUUpSMBl9zaGFwZZRLCIWUjANsb3eUaBEoliAAAAAAAAAAAAC0wgAAtMIAAKDAAACgwNsPScAAAKDAAAAAgAAAAICUaAtLCIWUaBl0lFKUjARoaWdolGgRKJYgAAAAAAAAAAAAtEIAALRCAACgQAAAoEDbD0lAAACgQAAAgD8AAIA/lGgLSwiFlGgZdJRSlIwIbG93X3JlcHKUjFtbLTkwLiAgICAgICAgLTkwLiAgICAgICAgIC01LiAgICAgICAgIC01LiAgICAgICAgIC0zLjE0MTU5MjcgIC01LgogIC0wLiAgICAgICAgIC0wLiAgICAgICBdlIwJaGlnaF9yZXBylIxTWzkwLiAgICAgICAgOTAuICAgICAgICAgNS4gICAgICAgICA1LiAgICAgICAgIDMuMTQxNTkyNyAgNS4KICAxLiAgICAgICAgIDEuICAgICAgIF2UjApfbnBfcmFuZG9tlE51Yi4=", "dtype": "float32", "bounded_below": "[ True True True True True True True True]", "bounded_above": "[ True True True True True True True True]", "_shape": [8], "low": "[-90. -90. -5. -5. -3.1415927 -5.\n -0. -0. ]", "high": "[90. 90. 5. 5. 3.1415927 5.\n 1. 1. ]", "low_repr": "[-90. -90. -5. -5. -3.1415927 -5.\n -0. -0. ]", "high_repr": "[90. 90. 5. 5. 3.1415927 5.\n 1. 1. ]", "_np_random": null}, "action_space": {":type:": "<class 'gymnasium.spaces.discrete.Discrete'>", ":serialized:": "gAWV/QAAAAAAAACMGWd5bW5hc2l1bS5zcGFjZXMuZGlzY3JldGWUjAhEaXNjcmV0ZZSTlCmBlH2UKIwBbpSMFW51bXB5LmNvcmUubXVsdGlhcnJheZSMBnNjYWxhcpSTlIwFbnVtcHmUjAVkdHlwZZSTlIwCaTiUiYiHlFKUKEsDjAE8lE5OTkr/////Sv////9LAHSUYkMIBAAAAAAAAACUhpRSlIwFc3RhcnSUaAhoDkMIAAAAAAAAAACUhpRSlIwGX3NoYXBllCmMBWR0eXBllGgLjAJpOJSJiIeUUpQoSwNoD05OTkr/////Sv////9LAHSUYowKX25wX3JhbmRvbZROdWIu", "n": "4", "start": "0", "_shape": [], "dtype": "int64", "_np_random": null}, "n_envs": 1, "n_steps": 2048, "gamma": 0.99, "gae_lambda": 0.95, "ent_coef": 0.0, "vf_coef": 0.5, "max_grad_norm": 0.5, "batch_size": 64, "n_epochs": 10, "clip_range": {":type:": "<class 'function'>", ":serialized:": "gAWVrQIAAAAAAACMF2Nsb3VkcGlja2xlLmNsb3VkcGlja2xllIwOX21ha2VfZnVuY3Rpb26Uk5QoaACMDV9idWlsdGluX3R5cGWUk5SMCENvZGVUeXBllIWUUpQoSwFLAEsASwFLAUsTQwSIAFMAlE6FlCmMAV+UhZSMSS91c3IvbG9jYWwvbGliL3B5dGhvbjMuMTAvZGlzdC1wYWNrYWdlcy9zdGFibGVfYmFzZWxpbmVzMy9jb21tb24vdXRpbHMucHmUjARmdW5jlEuEQwIEAZSMA3ZhbJSFlCl0lFKUfZQojAtfX3BhY2thZ2VfX5SMGHN0YWJsZV9iYXNlbGluZXMzLmNvbW1vbpSMCF9fbmFtZV9flIwec3RhYmxlX2Jhc2VsaW5lczMuY29tbW9uLnV0aWxzlIwIX19maWxlX1+UjEkvdXNyL2xvY2FsL2xpYi9weXRob24zLjEwL2Rpc3QtcGFja2FnZXMvc3RhYmxlX2Jhc2VsaW5lczMvY29tbW9uL3V0aWxzLnB5lHVOTmgAjBBfbWFrZV9lbXB0eV9jZWxslJOUKVKUhZR0lFKUaACMEl9mdW5jdGlvbl9zZXRzdGF0ZZSTlGgffZR9lChoFowEZnVuY5SMDF9fcXVhbG5hbWVfX5SMGWNvbnN0YW50X2ZuLjxsb2NhbHM+LmZ1bmOUjA9fX2Fubm90YXRpb25zX1+UfZSMDl9fa3dkZWZhdWx0c19flE6MDF9fZGVmYXVsdHNfX5ROjApfX21vZHVsZV9flGgXjAdfX2RvY19flE6MC19fY2xvc3VyZV9flGgAjApfbWFrZV9jZWxslJOURz/JmZmZmZmahZRSlIWUjBdfY2xvdWRwaWNrbGVfc3VibW9kdWxlc5RdlIwLX19nbG9iYWxzX1+UfZR1hpSGUjAu"}, "clip_range_vf": null, "normalize_advantage": true, "target_kl": null, "lr_schedule": {":type:": "<class 'function'>", ":serialized:": "gAWVrQIAAAAAAACMF2Nsb3VkcGlja2xlLmNsb3VkcGlja2xllIwOX21ha2VfZnVuY3Rpb26Uk5QoaACMDV9idWlsdGluX3R5cGWUk5SMCENvZGVUeXBllIWUUpQoSwFLAEsASwFLAUsTQwSIAFMAlE6FlCmMAV+UhZSMSS91c3IvbG9jYWwvbGliL3B5dGhvbjMuMTAvZGlzdC1wYWNrYWdlcy9zdGFibGVfYmFzZWxpbmVzMy9jb21tb24vdXRpbHMucHmUjARmdW5jlEuEQwIEAZSMA3ZhbJSFlCl0lFKUfZQojAtfX3BhY2thZ2VfX5SMGHN0YWJsZV9iYXNlbGluZXMzLmNvbW1vbpSMCF9fbmFtZV9flIwec3RhYmxlX2Jhc2VsaW5lczMuY29tbW9uLnV0aWxzlIwIX19maWxlX1+UjEkvdXNyL2xvY2FsL2xpYi9weXRob24zLjEwL2Rpc3QtcGFja2FnZXMvc3RhYmxlX2Jhc2VsaW5lczMvY29tbW9uL3V0aWxzLnB5lHVOTmgAjBBfbWFrZV9lbXB0eV9jZWxslJOUKVKUhZR0lFKUaACMEl9mdW5jdGlvbl9zZXRzdGF0ZZSTlGgffZR9lChoFowEZnVuY5SMDF9fcXVhbG5hbWVfX5SMGWNvbnN0YW50X2ZuLjxsb2NhbHM+LmZ1bmOUjA9fX2Fubm90YXRpb25zX1+UfZSMDl9fa3dkZWZhdWx0c19flE6MDF9fZGVmYXVsdHNfX5ROjApfX21vZHVsZV9flGgXjAdfX2RvY19flE6MC19fY2xvc3VyZV9flGgAjApfbWFrZV9jZWxslJOURz8zqSowVTJhhZRSlIWUjBdfY2xvdWRwaWNrbGVfc3VibW9kdWxlc5RdlIwLX19nbG9iYWxzX1+UfZR1hpSGUjAu"}, "system_info": {"OS": "Linux-6.1.85+-x86_64-with-glibc2.35 # 1 SMP PREEMPT_DYNAMIC Thu Jun 27 21:05:47 UTC 2024", "Python": "3.10.12", "Stable-Baselines3": "2.0.0a5", "PyTorch": "2.5.1+cu121", "GPU Enabled": "False", "Numpy": "1.26.4", "Cloudpickle": "3.1.0", "Gymnasium": "0.28.1", "OpenAI Gym": "0.25.2"}}
|
ppo_LunarLander-v2_vec_env.zip
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
-
size
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:30ea2bcd8ab7298c3877f7833464ed09a94e665f3628a48458155c4b2734cfb4
|
| 3 |
+
size 146616
|
ppo_LunarLander-v2_vec_env/data
CHANGED
|
@@ -26,8 +26,8 @@
|
|
| 26 |
"_num_timesteps_at_start": 0,
|
| 27 |
"seed": null,
|
| 28 |
"action_noise": null,
|
| 29 |
-
"start_time":
|
| 30 |
-
"learning_rate": 0.
|
| 31 |
"tensorboard_log": null,
|
| 32 |
"_last_obs": null,
|
| 33 |
"_last_episode_starts": {
|
|
@@ -42,7 +42,7 @@
|
|
| 42 |
"_stats_window_size": 100,
|
| 43 |
"ep_info_buffer": {
|
| 44 |
":type:": "<class 'collections.deque'>",
|
| 45 |
-
":serialized:": "
|
| 46 |
},
|
| 47 |
"ep_success_buffer": {
|
| 48 |
":type:": "<class 'collections.deque'>",
|
|
@@ -91,6 +91,6 @@
|
|
| 91 |
"target_kl": null,
|
| 92 |
"lr_schedule": {
|
| 93 |
":type:": "<class 'function'>",
|
| 94 |
-
":serialized:": "gAWVrQIAAAAAAACMF2Nsb3VkcGlja2xlLmNsb3VkcGlja2xllIwOX21ha2VfZnVuY3Rpb26Uk5QoaACMDV9idWlsdGluX3R5cGWUk5SMCENvZGVUeXBllIWUUpQoSwFLAEsASwFLAUsTQwSIAFMAlE6FlCmMAV+UhZSMSS91c3IvbG9jYWwvbGliL3B5dGhvbjMuMTAvZGlzdC1wYWNrYWdlcy9zdGFibGVfYmFzZWxpbmVzMy9jb21tb24vdXRpbHMucHmUjARmdW5jlEuEQwIEAZSMA3ZhbJSFlCl0lFKUfZQojAtfX3BhY2thZ2VfX5SMGHN0YWJsZV9iYXNlbGluZXMzLmNvbW1vbpSMCF9fbmFtZV9flIwec3RhYmxlX2Jhc2VsaW5lczMuY29tbW9uLnV0aWxzlIwIX19maWxlX1+UjEkvdXNyL2xvY2FsL2xpYi9weXRob24zLjEwL2Rpc3QtcGFja2FnZXMvc3RhYmxlX2Jhc2VsaW5lczMvY29tbW9uL3V0aWxzLnB5lHVOTmgAjBBfbWFrZV9lbXB0eV9jZWxslJOUKVKUhZR0lFKUaACMEl9mdW5jdGlvbl9zZXRzdGF0ZZSTlGgffZR9lChoFowEZnVuY5SMDF9fcXVhbG5hbWVfX5SMGWNvbnN0YW50X2ZuLjxsb2NhbHM+LmZ1bmOUjA9fX2Fubm90YXRpb25zX1+
|
| 95 |
}
|
| 96 |
}
|
|
|
|
| 26 |
"_num_timesteps_at_start": 0,
|
| 27 |
"seed": null,
|
| 28 |
"action_noise": null,
|
| 29 |
+
"start_time": 1734958162878472251,
|
| 30 |
+
"learning_rate": 0.0003,
|
| 31 |
"tensorboard_log": null,
|
| 32 |
"_last_obs": null,
|
| 33 |
"_last_episode_starts": {
|
|
|
|
| 42 |
"_stats_window_size": 100,
|
| 43 |
"ep_info_buffer": {
|
| 44 |
":type:": "<class 'collections.deque'>",
|
| 45 |
+
":serialized:": "gAWVQAwAAAAAAACMC2NvbGxlY3Rpb25zlIwFZGVxdWWUk5QpS2SGlFKUKH2UKIwBcpRHQG5yYgzP8huMAWyUTQsBjAF0lEdAoxRy9M9KVnV9lChoBkdAcbVbobGWEGgHTScBaAhHQKMU1KcNH6N1fZQoaAZHQGxjuW0JF9doB00UAWgIR0CjFlasp5NXdX2UKGgGR0BhPnQBxPweaAdN6ANoCEdAoxZ27J4jbHV9lChoBkdAb2GiYb83uWgHTRwBaAhHQKMW1qsU7CB1fZQoaAZHQHGTH/Pw/gRoB00mAWgIR0CjF0JkGzKLdX2UKGgGR0BhmmXqqwQlaAdN6ANoCEdAoxjXqeK8+XV9lChoBkdAbVsrYoRZlmgHTRMBaAhHQKMZK7LdN351fZQoaAZHQGHN73fyf+VoB03oA2gIR0CjGZmM4tHydX2UKGgGR0Bu/OFev6j4aAdN5gJoCEdAoxuEXSBsh3V9lChoBkdAcCIx/ustCmgHTTUCaAhHQKMbr5O8Cgd1fZQoaAZHQHHFDMibDuVoB00vAWgIR0CjG9nxBmf5dX2UKGgGR0BwLn+n62v0aAdNCgFoCEdAox2RqsU7CHV9lChoBkdAb4EhM8HObGgHTdgBaAhHQKMd2I55qud1fZQoaAZHQHG71sHjZL9oB00vAWgIR0CjHw12Rq46dX2UKGgGR0BwvQPOIInjaAdNCgFoCEdAox87IRywOnV9lChoBkdAbwUH31zySWgHTR0BaAhHQKMfvGn4wh51fZQoaAZHQHFzCIk7fYVoB00TAWgIR0CjaPpNTLntdX2UKGgGR0BwLj1nM+vAaAdNJAFoCEdAo2kXGwRoRXV9lChoBkdAbBEXMQmNR2gHTRgBaAhHQKNqy0GeMAF1fZQoaAZHQHFjmc8TzupoB00oAWgIR0CjavQn6VMVdX2UKGgGR0BgF8idJ8OTaAdN6ANoCEdAo20Q0ZWJanV9lChoBkdAcI4p+MIeHWgHTSUBaAhHQKNtcsTWXkZ1fZQoaAZHQHDkL9uP3i9oB01UAWgIR0Cjby1YhdMTdX2UKGgGR0Bf+UelsP8RaAdN6ANoCEdAo2/3nB+F13V9lChoBkdAcMcbLEDQq2gHTS4BaAhHQKNwO4rjHXF1fZQoaAZHQHFEt/FzdUNoB00PAWgIR0CjcKuv+wTudX2UKGgGR0BvaRR/EwWWaAdNRwFoCEdAo3DOGIsRQXV9lChoBkdAcP5q33Hq/2gHTQcBaAhHQKNxZr/sE7p1fZQoaAZHQG++7HIZIhBoB00uAWgIR0CjcX181Gb1dX2UKGgGR0BwWrvw3HaOaAdNUwFoCEdAo3QQt4A0bnV9lChoBkdAcEyAdn0032gHTS8CaAhHQKN0WUY8+zN1fZQoaAZHQG/yjHOryUdoB01EAWgIR0CjdaTzVc2SdX2UKGgGR0BgeUygwoLHaAdN6ANoCEdAo3YmHck+o3V9lChoBkdAcGDBnBciW2gHTQwBaAhHQKN2ZcvduYR1fZQoaAZHQHETkPlMh5hoB03HAWgIR0CjdyJfhMrVdX2UKGgGR0BubURL9MsZaAdNBQFoCEdAo3fkFyJbdXV9lChoBkdAchj2ZAprlGgHTRQBaAhHQKN5GrK/2011fZQoaAZHQCQR2dNFjNJoB00PAWgIR0CjeTFQl8gIdX2UKGgGR0Brw5yQxN7CaAdNJAFoCEdAo3qAY1pCbHV9lChoBkdAbqnfsu3+dmgHTY4BaAhHQKN6jZXdTHd1fZQoaAZHQHDPCqIacZtoB00rAWgIR0Cje/wvg3tKdX2UKGgGR0BxORwKjSG8aAdNaQFoCEdAo32pCBwuNHV9lChoBkdAbFBa6BiCrmgHTRUBaAhHQKN+eXE61b91fZQoaAZHQG9Txj8UEgZoB01JAmgIR0Cjf6h68g6mdX2UKGgGR0BIEdPLxI8RaAdL9GgIR0CjgB52IO6NdX2UKGgGR0ByWde6Zpi7aAdNEgFoCEdAo4CDdk8RtnV9lChoBkdAcJfkuYhMamgHTREBaAhHQKOCyvqTr3V1fZQoaAZHQHDEZM10knloB00eAWgIR0CjhEWCmMwUdX2UKGgGR0BtCvjfek57aAdNGQFoCEdAo4VLj1f3OHV9lChoBkdAcF5z5XU6P2gHTQMBaAhHQKOHGk5ZKWd1fZQoaAZHQHCCP+0gKWtoB008AWgIR0CjiAU4BFNMdX2UKGgGR0Bb/Tspobn6aAdN6ANoCEdAo4h7p1RtQHV9lChoBkdAcMkNutOmBWgHTTQBaAhHQKOKT1IRRMx1fZQoaAZHQGuHBl+Vkc1oB00TAWgIR0CjiqmBOHnEdX2UKGgGR0BxiqvW6K+BaAdNDQFoCEdAo4rLlA/s3XV9lChoBkdAbKrlGPPszGgHTQcBaAhHQKOK5YChew91fZQoaAZHQHIhE8eS0ShoB01FAWgIR0Cji2LMs6JZdX2UKGgGR0BvLr79AHE/aAdNOQFoCEdAo44ESVW0Z3V9lChoBkdAcM9XSjQAuWgHTRYBaAhHQKOO9um78Nx1fZQoaAZHQHAF6J/G2kVoB007AWgIR0Cjjy/G2kSFdX2UKGgGR0Bv+yXyAhB7aAdL/2gIR0CjkMAiml67dX2UKGgGR0Bunc7yQPqcaAdNKgFoCEdAo5F3mDDjznV9lChoBkdAbJzFn7Hhj2gHTRMBaAhHQKOSF5qM3qB1fZQoaAZHQHIKSon8baRoB00FAWgIR0Cjk2lpoK2KdX2UKGgGR0Buk2qkuYhMaAdNCgFoCEdAo5RWKfnOjnV9lChoBkdAbKcdCE6DG2gHTR8BaAhHQKOU8UJOWSl1fZQoaAZHQHHlKHoHLRtoB00bAWgIR0CjlY/Q0GeMdX2UKGgGR0Bef3G8274BaAdN6ANoCEdAo5bgkZ75VXV9lChoBkdAbIJeBxxT9GgHTSIBaAhHQKOYzu63AmB1fZQoaAZHQHEpAR9PUKBoB00OAWgIR0CjmYp2ECeVdX2UKGgGR0BxGGVzIV/MaAdNGwFoCEdAo5npuyeI23V9lChoBkdAXfLb212JSGgHTegDaAhHQKOaypfhMrV1fZQoaAZHQFvhLidat9xoB03oA2gIR0CjnUzXz19OdX2UKGgGR0BvuZHf/FR6aAdNJwFoCEdAo53mf/WDpXV9lChoBkdAbvNyq+8Gs2gHTTUBaAhHQKOfPorWiDd1fZQoaAZHQHG1rX6InBtoB00iAWgIR0CjoB9QoCuEdX2UKGgGR0BiHHlZHNHIaAdN6ANoCEdAo6Gao/A0sXV9lChoBkdAbL6FQl8gIWgHTR4BaAhHQKOhts/pt791fZQoaAZHQHCBacVgx8FoB00+AWgIR0Cjoid2ovSMdX2UKGgGR0BuERON5t3waAdNJAFoCEdAo6JgNRWLgnV9lChoBkdAYtlWKdhAnmgHTegDaAhHQKOirteD3/R1fZQoaAZHQHFjeIEbHZNoB0v7aAhHQKOkGn2qT8p1fZQoaAZHQHELUl3Qla9oB00fAWgIR0CjpLQ9A5aNdX2UKGgGR0BtMTnzQNTcaAdNIAFoCEdAo6VOkP+XJHV9lChoBkdAbcN3aBZpz2gHTSsBaAhHQKOmRWluWKN1fZQoaAZHQHCQ+k56t1ZoB00yAWgIR0CjqB8AzYVZdX2UKGgGR0Bx95Grjo6kaAdNHwFoCEdAo6jJCY1HfHV9lChoBkdAcKHvUBnzx2gHTUEBaAhHQKOo7NN8E3d1fZQoaAZHQHAWVzhgmZ5oB00lAWgIR0CjqYi0v4/NdX2UKGgGR0Bw8mKWLP2PaAdNDwFoCEdAo6oJkmQbM3V9lChoBkdAcRb2ECeVcGgHS/loCEdAo6pm0Re1KHV9lChoBkdAbxz4EfT1CmgHTTEBaAhHQKOq8/Rmbsp1fZQoaAZHQHA+kAYHgP5oB00nAWgIR0Cjqyc7QswtdX2UKGgGR0ByvPq5byH3aAdNDQFoCEdAo620bFS88XV9lChoBkdAcVb1zySV4WgHTTwBaAhHQKOt2sdT5wh1fZQoaAZHQHCQcinpB5ZoB00CAWgIR0CjrlBk7OmjdX2UKGgGR0BgTHcSGrS3aAdN6ANoCEdAo66tTLns9nV9lChoBkdAb0ipn6Eal2gHTREBaAhHQKOxT6xgRbt1fZQoaAZHQG05Aqd6LO1oB00fAWgIR0CjshXgUDdQdWUu"
|
| 46 |
},
|
| 47 |
"ep_success_buffer": {
|
| 48 |
":type:": "<class 'collections.deque'>",
|
|
|
|
| 91 |
"target_kl": null,
|
| 92 |
"lr_schedule": {
|
| 93 |
":type:": "<class 'function'>",
|
| 94 |
+
":serialized:": "gAWVrQIAAAAAAACMF2Nsb3VkcGlja2xlLmNsb3VkcGlja2xllIwOX21ha2VfZnVuY3Rpb26Uk5QoaACMDV9idWlsdGluX3R5cGWUk5SMCENvZGVUeXBllIWUUpQoSwFLAEsASwFLAUsTQwSIAFMAlE6FlCmMAV+UhZSMSS91c3IvbG9jYWwvbGliL3B5dGhvbjMuMTAvZGlzdC1wYWNrYWdlcy9zdGFibGVfYmFzZWxpbmVzMy9jb21tb24vdXRpbHMucHmUjARmdW5jlEuEQwIEAZSMA3ZhbJSFlCl0lFKUfZQojAtfX3BhY2thZ2VfX5SMGHN0YWJsZV9iYXNlbGluZXMzLmNvbW1vbpSMCF9fbmFtZV9flIwec3RhYmxlX2Jhc2VsaW5lczMuY29tbW9uLnV0aWxzlIwIX19maWxlX1+UjEkvdXNyL2xvY2FsL2xpYi9weXRob24zLjEwL2Rpc3QtcGFja2FnZXMvc3RhYmxlX2Jhc2VsaW5lczMvY29tbW9uL3V0aWxzLnB5lHVOTmgAjBBfbWFrZV9lbXB0eV9jZWxslJOUKVKUhZR0lFKUaACMEl9mdW5jdGlvbl9zZXRzdGF0ZZSTlGgffZR9lChoFowEZnVuY5SMDF9fcXVhbG5hbWVfX5SMGWNvbnN0YW50X2ZuLjxsb2NhbHM+LmZ1bmOUjA9fX2Fubm90YXRpb25zX1+UfZSMDl9fa3dkZWZhdWx0c19flE6MDF9fZGVmYXVsdHNfX5ROjApfX21vZHVsZV9flGgXjAdfX2RvY19flE6MC19fY2xvc3VyZV9flGgAjApfbWFrZV9jZWxslJOURz8zqSowVTJhhZRSlIWUjBdfY2xvdWRwaWNrbGVfc3VibW9kdWxlc5RdlIwLX19nbG9iYWxzX1+UfZR1hpSGUjAu"
|
| 95 |
}
|
| 96 |
}
|
ppo_LunarLander-v2_vec_env/policy.optimizer.pth
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 87978
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:8b642920187319a33162122ff24c29f0c9c96aaf1f0f6112079f360dfe13ced4
|
| 3 |
size 87978
|
ppo_LunarLander-v2_vec_env/policy.pth
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 43634
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:ee0f80dfd778b41f1f8d8f626eba5c264d05d5c20df05172af5eba6cccbdb0b4
|
| 3 |
size 43634
|
replay.mp4
CHANGED
|
Binary files a/replay.mp4 and b/replay.mp4 differ
|
|
|
results.json
CHANGED
|
@@ -1 +1 @@
|
|
| 1 |
-
{"mean_reward":
|
|
|
|
| 1 |
+
{"mean_reward": 230.65221566998284, "std_reward": 65.93931362009614, "is_deterministic": true, "n_eval_episodes": 10, "eval_datetime": "2024-12-23T13:33:54.535690"}
|