hung3r committed on
Commit
21f332c
·
verified ·
1 Parent(s): fe35179

Upload PPO LunarLander-v2 trained agent

Browse files
.gitattributes CHANGED
@@ -33,3 +33,4 @@ saved_model/**/* filter=lfs diff=lfs merge=lfs -text
33
  *.zip filter=lfs diff=lfs merge=lfs -text
34
  *.zst filter=lfs diff=lfs merge=lfs -text
35
  *tfevents* filter=lfs diff=lfs merge=lfs -text
 
 
33
  *.zip filter=lfs diff=lfs merge=lfs -text
34
  *.zst filter=lfs diff=lfs merge=lfs -text
35
  *tfevents* filter=lfs diff=lfs merge=lfs -text
36
+ replay.mp4 filter=lfs diff=lfs merge=lfs -text
README.md ADDED
@@ -0,0 +1,37 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ ---
2
+ library_name: stable-baselines3
3
+ tags:
4
+ - LunarLander-v2
5
+ - deep-reinforcement-learning
6
+ - reinforcement-learning
7
+ - stable-baselines3
8
+ model-index:
9
+ - name: PPO
10
+ results:
11
+ - task:
12
+ type: reinforcement-learning
13
+ name: reinforcement-learning
14
+ dataset:
15
+ name: LunarLander-v2
16
+ type: LunarLander-v2
17
+ metrics:
18
+ - type: mean_reward
19
+ value: 242.98 +/- 34.61
20
+ name: mean_reward
21
+ verified: false
22
+ ---
23
+
24
+ # **PPO** Agent playing **LunarLander-v2**
25
+ This is a trained model of a **PPO** agent playing **LunarLander-v2**
26
+ using the [stable-baselines3 library](https://github.com/DLR-RM/stable-baselines3).
27
+
28
+ ## Usage (with Stable-Baselines3)
29
+ TODO: Add your code showing how to load this model from the Hub with `load_from_hub` and run the agent.
30
+
31
+
32
+ ```python
33
+ from stable_baselines3 import ...
34
+ from huggingface_sb3 import load_from_hub
35
+
36
+ ...
37
+ ```
config.json ADDED
@@ -0,0 +1 @@
 
 
1
+ {"policy_class": {":type:": "<class 'abc.ABCMeta'>", ":serialized:": "gAWVOwAAAAAAAACMIXN0YWJsZV9iYXNlbGluZXMzLmNvbW1vbi5wb2xpY2llc5SMEUFjdG9yQ3JpdGljUG9saWN5lJOULg==", "__module__": "stable_baselines3.common.policies", "__firstlineno__": 390, "__doc__": "\nPolicy class for actor-critic algorithms (has both policy and value prediction).\nUsed by A2C, PPO and the likes.\n\n:param observation_space: Observation space\n:param action_space: Action space\n:param lr_schedule: Learning rate schedule (could be constant)\n:param net_arch: The specification of the policy and value networks.\n:param activation_fn: Activation function\n:param ortho_init: Whether to use or not orthogonal initialization\n:param use_sde: Whether to use State Dependent Exploration or not\n:param log_std_init: Initial value for the log standard deviation\n:param full_std: Whether to use (n_features x n_actions) parameters\n for the std instead of only (n_features,) when using gSDE\n:param use_expln: Use ``expln()`` function instead of ``exp()`` to ensure\n a positive standard deviation (cf paper). It allows to keep variance\n above zero and prevent it from growing too fast. 
In practice, ``exp()`` is usually enough.\n:param squash_output: Whether to squash the output using a tanh function,\n this allows to ensure boundaries when using gSDE.\n:param features_extractor_class: Features extractor to use.\n:param features_extractor_kwargs: Keyword arguments\n to pass to the features extractor.\n:param share_features_extractor: If True, the features extractor is shared between the policy and value networks.\n:param normalize_images: Whether to normalize images or not,\n dividing by 255.0 (True by default)\n:param optimizer_class: The optimizer to use,\n ``th.optim.Adam`` by default\n:param optimizer_kwargs: Additional keyword arguments,\n excluding the learning rate, to pass to the optimizer\n", "__init__": "<function ActorCriticPolicy.__init__ at 0x109c449a0>", "_get_constructor_parameters": "<function ActorCriticPolicy._get_constructor_parameters at 0x109c44a40>", "reset_noise": "<function ActorCriticPolicy.reset_noise at 0x109c44ae0>", "_build_mlp_extractor": "<function ActorCriticPolicy._build_mlp_extractor at 0x109c44b80>", "_build": "<function ActorCriticPolicy._build at 0x109c44c20>", "forward": "<function ActorCriticPolicy.forward at 0x109c44cc0>", "extract_features": "<function ActorCriticPolicy.extract_features at 0x109c44d60>", "_get_action_dist_from_latent": "<function ActorCriticPolicy._get_action_dist_from_latent at 0x109c44e00>", "_predict": "<function ActorCriticPolicy._predict at 0x109c44ea0>", "evaluate_actions": "<function ActorCriticPolicy.evaluate_actions at 0x109c44f40>", "get_distribution": "<function ActorCriticPolicy.get_distribution at 0x109c44fe0>", "predict_values": "<function ActorCriticPolicy.predict_values at 0x109c45080>", "__static_attributes__": ["action_dist", "action_net", "activation_fn", "dist_kwargs", "features_dim", "features_extractor", "log_std", "log_std_init", "mlp_extractor", "net_arch", "optimizer", "ortho_init", "pi_features_extractor", "share_features_extractor", "use_sde", "value_net", 
"vf_features_extractor"], "__abstractmethods__": "frozenset()", "_abc_impl": "<_abc._abc_data object at 0x109c3e9c0>"}, "verbose": 1, "policy_kwargs": {}, "num_timesteps": 1000448, "_total_timesteps": 1000000, "_num_timesteps_at_start": 0, "seed": null, "action_noise": null, "start_time": 1756209889085469000, "learning_rate": 0.0003, "tensorboard_log": null, "_last_obs": {":type:": "<class 'numpy.ndarray'>", ":serialized:": "gAWVlgAAAAAAAACME251bXB5Ll9jb3JlLm51bWVyaWOUjAtfZnJvbWJ1ZmZlcpSTlCiWIAAAAAAAAACzMxK9KRBeuv2tSTcX1B8zGfhHu7aHbbYAAIA/AACAP5SMBW51bXB5lIwFZHR5cGWUk5SMAmY0lImIh5RSlChLA4wBPJROTk5K/////0r/////SwB0lGJLAUsIhpSMAUOUdJRSlC4="}, "_last_episode_starts": {":type:": "<class 'numpy.ndarray'>", ":serialized:": "gAWVdQAAAAAAAACME251bXB5Ll9jb3JlLm51bWVyaWOUjAtfZnJvbWJ1ZmZlcpSTlCiWAQAAAAAAAAAAlIwFbnVtcHmUjAVkdHlwZZSTlIwCYjGUiYiHlFKUKEsDjAF8lE5OTkr/////Sv////9LAHSUYksBhZSMAUOUdJRSlC4="}, "_last_original_obs": null, "_episode_num": 0, "use_sde": false, "sde_sample_freq": -1, "_current_progress_remaining": -0.00044800000000000395, "_stats_window_size": 100, "ep_info_buffer": {":type:": "<class 'collections.deque'>", ":serialized:": 
"gAWVQwwAAAAAAACMC2NvbGxlY3Rpb25zlIwFZGVxdWWUk5QpS2SGlFKUKH2UKIwBcpRHQG6lzGo73f2MAWyUTV4BjAF0lEdAagF+S8rZrnV9lChoBkdAbTXiF0xM4GgHTbYBaAhHQGoDnnlnyup1fZQoaAZHQGv5qKgqVhVoB00VAmgIR0BqCDImw7kodX2UKGgGR0BtiO6NEPUbaAdNdwFoCEdAagn4qwyIpHV9lChoBkdAcN+rv9cbBGgHTUgBaAhHQGoLhVMmF8J1fZQoaAZHQHFWCpJf6XVoB01vAWgIR0BqDzZHuqm1dX2UKGgGR0BGXBC2MKkVaAdNiQFoCEdAahEM4LkS3HV9lChoBkdAXY4c81XNkmgHTegDaAhHQGoZOn/DLr51fZQoaAZHQHEFt12aDwpoB03FAWgIR0BqHWJvYODrdX2UKGgGR0Bwl6aCtihGaAdNlAFoCEdAah9ej2zv7XV9lChoBkdAba4DyOJcgWgHTXkBaAhHQGohNFz+3ph1fZQoaAZHQHBNoV2zOX5oB01NAWgIR0BqJMUIsyzpdX2UKGgGR0Bw6ow1zhgmaAdNdAFoCEdAaiaP2f02+HV9lChoBkdAcbjVC5VfeGgHTX8BaAhHQGooZj6N2kl1fZQoaAZHQG+UE0zj3mFoB03YAWgIR0BqLKAxzq8ldX2UKGgGR0BsvOznied1aAdNhgFoCEdAai6bIcR15nV9lChoBkdAbXt5MURFqmgHTcIBaAhHQGoyyk9ECvJ1fZQoaAZHQG/llTvRZ2ZoB02eAWgIR0BqNML8aXKKdX2UKGgGR0Bvv/qC6H0saAdNsgFoCEdAajbQ9A5aNnV9lChoBkdAbTY1/DtPYWgHTWwBaAhHQGo6hiTdLxt1fZQoaAZHQG/hxMN+b3JoB01lAWgIR0BqPD9fkWAPdX2UKGgGR0Br3WR1X/5taAdNfwFoCEdAakAT7l7tzHV9lChoBkdAbrCQ/X5FgGgHTWUBaAhHQGpBzTvy9VZ1fZQoaAZHQHG47kKeCkJoB02rAWgIR0BqQ9mcvugIdX2UKGgGR0Bw1e+AVfu1aAdN1gFoCEdAakgSwnpjc3V9lChoBkdAcHL7/n4fwWgHTYEBaAhHQGpJ7F85S3t1fZQoaAZHQGsH6XSjQAxoB01oAWgIR0BqS6htcfNidX2UKGgGR0BslNzKcNH6aAdNhAFoCEdAak98WKuSwHV9lChoBkdAcAsyNn5BTmgHTZ0BaAhHQGpRfWDpTuR1fZQoaAZHQG2maDwpe/poB02XAWgIR0BqVW+Eh7mddX2UKGgGR0BhjUY0l7dBaAdN6ANoCEdAalxuUliSaHV9lChoBkdAcGYPPszEaWgHTZ4BaAhHQGpebcwg1WN1fZQoaAZHQHBcwEEC/49oB022AWgIR0BqYIogFHJ+dX2UKGgGR0ByBngccU/OaAdNkQFoCEdAamR1AZ88cXV9lChoBkdAaq5ga3qiXmgHTVcBaAhHQGpmGq5sj3V1fZQoaAZHQG8JUwaisXBoB02EAWgIR0Bqaer2g398dX2UKGgGR0BwFimEXcgyaAdNeQFoCEdAamu7HyVfNXV9lChoBkdAa+kuSwGGEmgHTVwBaAhHQGptb7TDwYt1fZQoaAZHQHCXNsvZh8ZoB02ZAWgIR0Bqcv+XJHRUdX2UKGgGR0BtzPMwDeTFaAdNdAFoCEdAanTVkMCtBHV9lChoBkdAcGUq1PWQOmgHTcABaAhHQGp29vjwQUZ1fZQoaAZHQHCFHVkMCtBoB01mAWgIR0BqeqcG1QZXdX2UKGgGR0BttfeWOZLJaAdNlwFoCEdAanyZFXq7iHV9lChoBkdAac7/dZaFEmgHTZoBaAhHQGqAgRkEs8R1fZQoaAZHQHBAC/47A+JoB01DAWgIR0BqghKFqSHNdX2UKGgGR0BtstOsT37DaAdNqgFoCEdAaoQewLVnVXV9lChoBkdAat14ubqhUWgHTZUBaAhHQGq
IDFId2gZ1fZQoaAZHQG53RMWXTmZoB016AWgIR0BqiePBBRhudX2UKGgGR0BxNCjafzz3aAdNTgFoCEdAaouCFsYVI3V9lChoBkdARbkEzO5avGgHS/JoCEdAao6evIOpbXV9lChoBkdAcHYPSlWOqGgHTdsCaAhHQGqSrpaA4GV1fZQoaAZHQHAnDtG/etVoB01YAWgIR0BqlmBxxT86dX2UKGgGR0BtUQzUI9kjaAdNaAFoCEdAapgdS2phnnV9lChoBkdAcSiY64lQdmgHTagDaAhHQGqe2saKk2x1fZQoaAZHQHALtlAeJYVoB02DAWgIR0BqoLksBhhIdX2UKGgGR0Bsr7jYI0IkaAdNigFoCEdAaqSXKr7wa3V9lChoBkdAbF2Fh5PdmGgHTWABaAhHQGqmSI55qud1fZQoaAZHQG56YaP0Zm9oB01xAWgIR0BqqBFAmiQDdX2UKGgGR0ByMtCXyAhCaAdNQwFoCEdAaquWi1y/9HV9lChoBkdAb78ynk1dgWgHTWsBaAhHQGqtUCih37l1fZQoaAZHQG2wAvtdAxBoB01fAWgIR0BqrvkxREWqdX2UKGgGR0ByYHJNj9XLaAdNWQFoCEdAarKyE+Pik3V9lChoBkdAcI9udf9gnmgHTZQCaAhHQGq196cAiml1fZQoaAZHQHAYeLvTgEVoB01mAWgIR0BquazzErGzdX2UKGgGR0BsJaMm4RVZaAdNkQFoCEdAarueA/cFhXV9lChoBkdAb8TW1c+qzmgHTVEBaAhHQGq/OT7l7t11fZQoaAZHQG5S2tdRiw1oB02LAWgIR0BqwRul41P4dX2UKGgGR0BsbHMW43FUaAdNggFoCEdAasLtFa0Qb3V9lChoBkdAbZvXLeQ+2WgHTcUBaAhHQGrHEGJN0vJ1fZQoaAZHQG5iHFo+OfdoB02lAWgIR0BqyRnBciW3dX2UKGgGR0Bvs4Q176YWaAdN3gFoCEdAas1egL7XQXV9lChoBkdAcRcIAwPAf2gHTYYBaAhHQGrPQb+98JF1fZQoaAZHQGyEhMJx//hoB01XAWgIR0Bq0OgpSaVldX2UKGgGR0Bwj5tpEhJRaAdNuQFoCEdAatUM1CPZI3V9lChoBkdActyEx7AtWmgHTUEBaAhHQGrWmXPZ7HB1fZQoaAZHQGvohIvrWy1oB02VAWgIR0Bq2IJVsDW9dX2UKGgGR0Bqqkn7YTTOaAdNmgFoCEdAatx04BFNL3V9lChoBkdAbGqS2Yv38GgHTVsBaAhHQGreIP9UCJZ1fZQoaAZHQHH+KXrt3OhoB02JAWgIR0Bq4fp0OmSAdX2UKGgGR0BuABZSvTw2aAdNhgFoCEdAauPSv1UVBXV9lChoBkdAcnxXpnpSrGgHTZQBaAhHQGrlvrOZ9eB1fZQoaAZHQG/7ECvHLidoB02EAWgIR0Bq6Ymois4ldX2UKGgGR0BwrRp/PPcBaAdNdAFoCEdAautcNYr8SHV9lChoBkdAcBIa/RE4N2gHTcQBaAhHQGrvhDw6QvJ1fZQoaAZHQG93s+NcW0toB010AWgIR0Bq8VMPBi1BdX2UKGgGR0Bu+4cWCVbBaAdNcAFoCEdAavMmZVn27HV9lChoBkdAcUdf+CK77WgHTXQBaAhHQGr2+S0Sh8J1fZQoaAZHQGznD1XeWOZoB02KAWgIR0Bq+N50KZ2IdX2UKGgGR0Bvgyp3os7NaAdNiwFoCEdAavrCqIacZ3V9lChoBkdAcaiKxs2vS2gHTaUDaAhHQGsBg93bEgp1fZQoaAZHQG6yTFl05lxoB02VAWgIR0BrBWr+5vtMdX2UKGgGR0BvcE+JP69CaAdNFANoCEdAawlGza9K3HV9lChoBkdAb7T51vES/WgHTcoDaAhHQGsQpPRArx11fZQoaAZHQHDdp4GD+R5oB02bAWgIR0BrFPYe1a4ddX2UKGgGR0Bu3BZQpF1CaAdNjwFoCEdAaxbeuV5a/3V9lChoBkd
AcH5OUdJaq2gHTbsBaAhHQGsbAood+5R1fZQoaAZHQHAthBzFMqVoB01bAWgIR0BrHLMgU1yedX2UKGgGR0BvgsqWkaddaAdNcwFoCEdAax58iOearnV9lChoBkdAcKY8Djin52gHTbEBaAhHQGsihyCFsYV1fZQoaAZHQHDo09lmOENoB01tAWgIR0BrJEV8CxNZdWUu"}, "ep_success_buffer": {":type:": "<class 'collections.deque'>", ":serialized:": "gAWVIAAAAAAAAACMC2NvbGxlY3Rpb25zlIwFZGVxdWWUk5QpS2SGlFKULg=="}, "_n_updates": 3908, "observation_space": {":type:": "<class 'gymnasium.spaces.box.Box'>", ":serialized:": "gAWVdwIAAAAAAACMFGd5bW5hc2l1bS5zcGFjZXMuYm94lIwDQm94lJOUKYGUfZQojAVkdHlwZZSMBW51bXB5lIwFZHR5cGWUk5SMAmY0lImIh5RSlChLA4wBPJROTk5K/////0r/////SwB0lGKMDWJvdW5kZWRfYmVsb3eUjBNudW1weS5fY29yZS5udW1lcmljlIwLX2Zyb21idWZmZXKUk5QolggAAAAAAAAAAQEBAQEBAQGUaAiMAmIxlImIh5RSlChLA4wBfJROTk5K/////0r/////SwB0lGJLCIWUjAFDlHSUUpSMDWJvdW5kZWRfYWJvdmWUaBEolggAAAAAAAAAAQEBAQEBAQGUaBVLCIWUaBl0lFKUjAZfc2hhcGWUSwiFlIwDbG93lGgRKJYgAAAAAAAAAAAAtMIAALTCAACgwAAAoMDbD0nAAACgwAAAAIAAAACAlGgLSwiFlGgZdJRSlIwEaGlnaJRoESiWIAAAAAAAAAAAALRCAAC0QgAAoEAAAKBA2w9JQAAAoEAAAIA/AACAP5RoC0sIhZRoGXSUUpSMCGxvd19yZXBylIxbWy05MC4gICAgICAgIC05MC4gICAgICAgICAtNS4gICAgICAgICAtNS4gICAgICAgICAtMy4xNDE1OTI3ICAtNS4KICAtMC4gICAgICAgICAtMC4gICAgICAgXZSMCWhpZ2hfcmVwcpSMU1s5MC4gICAgICAgIDkwLiAgICAgICAgIDUuICAgICAgICAgNS4gICAgICAgICAzLjE0MTU5MjcgIDUuCiAgMS4gICAgICAgICAxLiAgICAgICBdlIwKX25wX3JhbmRvbZROdWIu", "dtype": "float32", "bounded_below": "[ True True True True True True True True]", "bounded_above": "[ True True True True True True True True]", "_shape": [8], "low": "[-90. -90. -5. -5. -3.1415927 -5.\n -0. -0. ]", "high": "[90. 90. 5. 5. 3.1415927 5.\n 1. 1. ]", "low_repr": "[-90. -90. -5. -5. -3.1415927 -5.\n -0. -0. ]", "high_repr": "[90. 90. 5. 5. 3.1415927 5.\n 1. 1. 
]", "_np_random": null}, "action_space": {":type:": "<class 'gymnasium.spaces.discrete.Discrete'>", ":serialized:": "gAWV3AAAAAAAAACMGWd5bW5hc2l1bS5zcGFjZXMuZGlzY3JldGWUjAhEaXNjcmV0ZZSTlCmBlH2UKIwBbpSMFm51bXB5Ll9jb3JlLm11bHRpYXJyYXmUjAZzY2FsYXKUk5SMBW51bXB5lIwFZHR5cGWUk5SMAmk4lImIh5RSlChLA4wBPJROTk5K/////0r/////SwB0lGJDCAQAAAAAAAAAlIaUUpSMBXN0YXJ0lGgIaA5DCAAAAAAAAAAAlIaUUpSMBl9zaGFwZZQpjAVkdHlwZZRoDowKX25wX3JhbmRvbZROdWIu", "n": "4", "start": "0", "_shape": [], "dtype": "int64", "_np_random": null}, "n_envs": 1, "n_steps": 1024, "gamma": 0.999, "gae_lambda": 0.98, "ent_coef": 0.01, "vf_coef": 0.5, "max_grad_norm": 0.5, "batch_size": 64, "n_epochs": 4, "clip_range": {":type:": "<class 'function'>", ":serialized:": "gAWVEgMAAAAAAACMF2Nsb3VkcGlja2xlLmNsb3VkcGlja2xllIwOX21ha2VfZnVuY3Rpb26Uk5QoaACMDV9idWlsdGluX3R5cGWUk5SMCENvZGVUeXBllIWUUpQoSwFLAEsASwFLAUsTQwg+AZUAVAEkAJROhZQpjAFflIWUjGcvVXNlcnMvc2FtcGxpbmcvV29ya3NwYWNlL1JML3VuaXQxLy52ZW52L2xpYi9weXRob24zLjEzL3NpdGUtcGFja2FnZXMvc3RhYmxlX2Jhc2VsaW5lczMvY29tbW9uL3V0aWxzLnB5lIwEZnVuY5SMGWNvbnN0YW50X2ZuLjxsb2NhbHM+LmZ1bmOUS4RDCPiAANgPEogKlEMAlIwDdmFslIWUKXSUUpR9lCiMC19fcGFja2FnZV9flIwYc3RhYmxlX2Jhc2VsaW5lczMuY29tbW9ulIwIX19uYW1lX1+UjB5zdGFibGVfYmFzZWxpbmVzMy5jb21tb24udXRpbHOUjAhfX2ZpbGVfX5SMZy9Vc2Vycy9zYW1wbGluZy9Xb3Jrc3BhY2UvUkwvdW5pdDEvLnZlbnYvbGliL3B5dGhvbjMuMTMvc2l0ZS1wYWNrYWdlcy9zdGFibGVfYmFzZWxpbmVzMy9jb21tb24vdXRpbHMucHmUdU5OaACMEF9tYWtlX2VtcHR5X2NlbGyUk5QpUpSFlHSUUpRoAIwSX2Z1bmN0aW9uX3NldHN0YXRllJOUaCF9lH2UKGgYjARmdW5jlIwMX19xdWFsbmFtZV9flIwZY29uc3RhbnRfZm4uPGxvY2Fscz4uZnVuY5SMD19fYW5ub3RhdGlvbnNfX5R9lIwOX19rd2RlZmF1bHRzX1+UTowMX19kZWZhdWx0c19flE6MCl9fbW9kdWxlX1+UaBmMB19fZG9jX1+UTowLX19jbG9zdXJlX1+UaACMCl9tYWtlX2NlbGyUk5RHP8mZmZmZmZqFlFKUhZSMF19jbG91ZHBpY2tsZV9zdWJtb2R1bGVzlF2UjAtfX2dsb2JhbHNfX5R9lHWGlIZSMC4="}, "clip_range_vf": null, "normalize_advantage": true, "target_kl": null, "lr_schedule": {":type:": "<class 'function'>", ":serialized:": 
"gAWVEgMAAAAAAACMF2Nsb3VkcGlja2xlLmNsb3VkcGlja2xllIwOX21ha2VfZnVuY3Rpb26Uk5QoaACMDV9idWlsdGluX3R5cGWUk5SMCENvZGVUeXBllIWUUpQoSwFLAEsASwFLAUsTQwg+AZUAVAEkAJROhZQpjAFflIWUjGcvVXNlcnMvc2FtcGxpbmcvV29ya3NwYWNlL1JML3VuaXQxLy52ZW52L2xpYi9weXRob24zLjEzL3NpdGUtcGFja2FnZXMvc3RhYmxlX2Jhc2VsaW5lczMvY29tbW9uL3V0aWxzLnB5lIwEZnVuY5SMGWNvbnN0YW50X2ZuLjxsb2NhbHM+LmZ1bmOUS4RDCPiAANgPEogKlEMAlIwDdmFslIWUKXSUUpR9lCiMC19fcGFja2FnZV9flIwYc3RhYmxlX2Jhc2VsaW5lczMuY29tbW9ulIwIX19uYW1lX1+UjB5zdGFibGVfYmFzZWxpbmVzMy5jb21tb24udXRpbHOUjAhfX2ZpbGVfX5SMZy9Vc2Vycy9zYW1wbGluZy9Xb3Jrc3BhY2UvUkwvdW5pdDEvLnZlbnYvbGliL3B5dGhvbjMuMTMvc2l0ZS1wYWNrYWdlcy9zdGFibGVfYmFzZWxpbmVzMy9jb21tb24vdXRpbHMucHmUdU5OaACMEF9tYWtlX2VtcHR5X2NlbGyUk5QpUpSFlHSUUpRoAIwSX2Z1bmN0aW9uX3NldHN0YXRllJOUaCF9lH2UKGgYjARmdW5jlIwMX19xdWFsbmFtZV9flIwZY29uc3RhbnRfZm4uPGxvY2Fscz4uZnVuY5SMD19fYW5ub3RhdGlvbnNfX5R9lIwOX19rd2RlZmF1bHRzX1+UTowMX19kZWZhdWx0c19flE6MCl9fbW9kdWxlX1+UaBmMB19fZG9jX1+UTowLX19jbG9zdXJlX1+UaACMCl9tYWtlX2NlbGyUk5RHPzOpKjBVMmGFlFKUhZSMF19jbG91ZHBpY2tsZV9zdWJtb2R1bGVzlF2UjAtfX2dsb2JhbHNfX5R9lHWGlIZSMC4="}, "system_info": {"OS": "macOS-15.6.1-arm64-arm-64bit-Mach-O Darwin Kernel Version 24.6.0: Mon Jul 14 11:30:34 PDT 2025; root:xnu-11417.140.69~1/RELEASE_ARM64_T8103", "Python": "3.13.4", "Stable-Baselines3": "2.0.0a5", "PyTorch": "2.8.0", "GPU Enabled": "False", "Numpy": "2.3.2", "Cloudpickle": "3.1.1", "Gymnasium": "0.28.1"}}
ppo-LunarLander-v2.zip ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:bf0ae0a21b457c65cef9c793c70cca9d9c0385d92c224d571cc74fd357152003
3
+ size 148686
ppo-LunarLander-v2/_stable_baselines3_version ADDED
@@ -0,0 +1 @@
 
 
1
+ 2.0.0a5
ppo-LunarLander-v2/data ADDED
@@ -0,0 +1,119 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "policy_class": {
3
+ ":type:": "<class 'abc.ABCMeta'>",
4
+ ":serialized:": "gAWVOwAAAAAAAACMIXN0YWJsZV9iYXNlbGluZXMzLmNvbW1vbi5wb2xpY2llc5SMEUFjdG9yQ3JpdGljUG9saWN5lJOULg==",
5
+ "__module__": "stable_baselines3.common.policies",
6
+ "__firstlineno__": 390,
7
+ "__doc__": "\nPolicy class for actor-critic algorithms (has both policy and value prediction).\nUsed by A2C, PPO and the likes.\n\n:param observation_space: Observation space\n:param action_space: Action space\n:param lr_schedule: Learning rate schedule (could be constant)\n:param net_arch: The specification of the policy and value networks.\n:param activation_fn: Activation function\n:param ortho_init: Whether to use or not orthogonal initialization\n:param use_sde: Whether to use State Dependent Exploration or not\n:param log_std_init: Initial value for the log standard deviation\n:param full_std: Whether to use (n_features x n_actions) parameters\n for the std instead of only (n_features,) when using gSDE\n:param use_expln: Use ``expln()`` function instead of ``exp()`` to ensure\n a positive standard deviation (cf paper). It allows to keep variance\n above zero and prevent it from growing too fast. In practice, ``exp()`` is usually enough.\n:param squash_output: Whether to squash the output using a tanh function,\n this allows to ensure boundaries when using gSDE.\n:param features_extractor_class: Features extractor to use.\n:param features_extractor_kwargs: Keyword arguments\n to pass to the features extractor.\n:param share_features_extractor: If True, the features extractor is shared between the policy and value networks.\n:param normalize_images: Whether to normalize images or not,\n dividing by 255.0 (True by default)\n:param optimizer_class: The optimizer to use,\n ``th.optim.Adam`` by default\n:param optimizer_kwargs: Additional keyword arguments,\n excluding the learning rate, to pass to the optimizer\n",
8
+ "__init__": "<function ActorCriticPolicy.__init__ at 0x109c449a0>",
9
+ "_get_constructor_parameters": "<function ActorCriticPolicy._get_constructor_parameters at 0x109c44a40>",
10
+ "reset_noise": "<function ActorCriticPolicy.reset_noise at 0x109c44ae0>",
11
+ "_build_mlp_extractor": "<function ActorCriticPolicy._build_mlp_extractor at 0x109c44b80>",
12
+ "_build": "<function ActorCriticPolicy._build at 0x109c44c20>",
13
+ "forward": "<function ActorCriticPolicy.forward at 0x109c44cc0>",
14
+ "extract_features": "<function ActorCriticPolicy.extract_features at 0x109c44d60>",
15
+ "_get_action_dist_from_latent": "<function ActorCriticPolicy._get_action_dist_from_latent at 0x109c44e00>",
16
+ "_predict": "<function ActorCriticPolicy._predict at 0x109c44ea0>",
17
+ "evaluate_actions": "<function ActorCriticPolicy.evaluate_actions at 0x109c44f40>",
18
+ "get_distribution": "<function ActorCriticPolicy.get_distribution at 0x109c44fe0>",
19
+ "predict_values": "<function ActorCriticPolicy.predict_values at 0x109c45080>",
20
+ "__static_attributes__": [
21
+ "action_dist",
22
+ "action_net",
23
+ "activation_fn",
24
+ "dist_kwargs",
25
+ "features_dim",
26
+ "features_extractor",
27
+ "log_std",
28
+ "log_std_init",
29
+ "mlp_extractor",
30
+ "net_arch",
31
+ "optimizer",
32
+ "ortho_init",
33
+ "pi_features_extractor",
34
+ "share_features_extractor",
35
+ "use_sde",
36
+ "value_net",
37
+ "vf_features_extractor"
38
+ ],
39
+ "__abstractmethods__": "frozenset()",
40
+ "_abc_impl": "<_abc._abc_data object at 0x109c3e9c0>"
41
+ },
42
+ "verbose": 1,
43
+ "policy_kwargs": {},
44
+ "num_timesteps": 1000448,
45
+ "_total_timesteps": 1000000,
46
+ "_num_timesteps_at_start": 0,
47
+ "seed": null,
48
+ "action_noise": null,
49
+ "start_time": 1756209889085469000,
50
+ "learning_rate": 0.0003,
51
+ "tensorboard_log": null,
52
+ "_last_obs": {
53
+ ":type:": "<class 'numpy.ndarray'>",
54
+ ":serialized:": "gAWVlgAAAAAAAACME251bXB5Ll9jb3JlLm51bWVyaWOUjAtfZnJvbWJ1ZmZlcpSTlCiWIAAAAAAAAACzMxK9KRBeuv2tSTcX1B8zGfhHu7aHbbYAAIA/AACAP5SMBW51bXB5lIwFZHR5cGWUk5SMAmY0lImIh5RSlChLA4wBPJROTk5K/////0r/////SwB0lGJLAUsIhpSMAUOUdJRSlC4="
55
+ },
56
+ "_last_episode_starts": {
57
+ ":type:": "<class 'numpy.ndarray'>",
58
+ ":serialized:": "gAWVdQAAAAAAAACME251bXB5Ll9jb3JlLm51bWVyaWOUjAtfZnJvbWJ1ZmZlcpSTlCiWAQAAAAAAAAAAlIwFbnVtcHmUjAVkdHlwZZSTlIwCYjGUiYiHlFKUKEsDjAF8lE5OTkr/////Sv////9LAHSUYksBhZSMAUOUdJRSlC4="
59
+ },
60
+ "_last_original_obs": null,
61
+ "_episode_num": 0,
62
+ "use_sde": false,
63
+ "sde_sample_freq": -1,
64
+ "_current_progress_remaining": -0.00044800000000000395,
65
+ "_stats_window_size": 100,
66
+ "ep_info_buffer": {
67
+ ":type:": "<class 'collections.deque'>",
68
+ ":serialized:": "gAWVQwwAAAAAAACMC2NvbGxlY3Rpb25zlIwFZGVxdWWUk5QpS2SGlFKUKH2UKIwBcpRHQG6lzGo73f2MAWyUTV4BjAF0lEdAagF+S8rZrnV9lChoBkdAbTXiF0xM4GgHTbYBaAhHQGoDnnlnyup1fZQoaAZHQGv5qKgqVhVoB00VAmgIR0BqCDImw7kodX2UKGgGR0BtiO6NEPUbaAdNdwFoCEdAagn4qwyIpHV9lChoBkdAcN+rv9cbBGgHTUgBaAhHQGoLhVMmF8J1fZQoaAZHQHFWCpJf6XVoB01vAWgIR0BqDzZHuqm1dX2UKGgGR0BGXBC2MKkVaAdNiQFoCEdAahEM4LkS3HV9lChoBkdAXY4c81XNkmgHTegDaAhHQGoZOn/DLr51fZQoaAZHQHEFt12aDwpoB03FAWgIR0BqHWJvYODrdX2UKGgGR0Bwl6aCtihGaAdNlAFoCEdAah9ej2zv7XV9lChoBkdAba4DyOJcgWgHTXkBaAhHQGohNFz+3ph1fZQoaAZHQHBNoV2zOX5oB01NAWgIR0BqJMUIsyzpdX2UKGgGR0Bw6ow1zhgmaAdNdAFoCEdAaiaP2f02+HV9lChoBkdAcbjVC5VfeGgHTX8BaAhHQGooZj6N2kl1fZQoaAZHQG+UE0zj3mFoB03YAWgIR0BqLKAxzq8ldX2UKGgGR0BsvOznied1aAdNhgFoCEdAai6bIcR15nV9lChoBkdAbXt5MURFqmgHTcIBaAhHQGoyyk9ECvJ1fZQoaAZHQG/llTvRZ2ZoB02eAWgIR0BqNML8aXKKdX2UKGgGR0Bvv/qC6H0saAdNsgFoCEdAajbQ9A5aNnV9lChoBkdAbTY1/DtPYWgHTWwBaAhHQGo6hiTdLxt1fZQoaAZHQG/hxMN+b3JoB01lAWgIR0BqPD9fkWAPdX2UKGgGR0Br3WR1X/5taAdNfwFoCEdAakAT7l7tzHV9lChoBkdAbrCQ/X5FgGgHTWUBaAhHQGpBzTvy9VZ1fZQoaAZHQHG47kKeCkJoB02rAWgIR0BqQ9mcvugIdX2UKGgGR0Bw1e+AVfu1aAdN1gFoCEdAakgSwnpjc3V9lChoBkdAcHL7/n4fwWgHTYEBaAhHQGpJ7F85S3t1fZQoaAZHQGsH6XSjQAxoB01oAWgIR0BqS6htcfNidX2UKGgGR0BslNzKcNH6aAdNhAFoCEdAak98WKuSwHV9lChoBkdAcAsyNn5BTmgHTZ0BaAhHQGpRfWDpTuR1fZQoaAZHQG2maDwpe/poB02XAWgIR0BqVW+Eh7mddX2UKGgGR0BhjUY0l7dBaAdN6ANoCEdAalxuUliSaHV9lChoBkdAcGYPPszEaWgHTZ4BaAhHQGpebcwg1WN1fZQoaAZHQHBcwEEC/49oB022AWgIR0BqYIogFHJ+dX2UKGgGR0ByBngccU/OaAdNkQFoCEdAamR1AZ88cXV9lChoBkdAaq5ga3qiXmgHTVcBaAhHQGpmGq5sj3V1fZQoaAZHQG8JUwaisXBoB02EAWgIR0Bqaer2g398dX2UKGgGR0BwFimEXcgyaAdNeQFoCEdAamu7HyVfNXV9lChoBkdAa+kuSwGGEmgHTVwBaAhHQGptb7TDwYt1fZQoaAZHQHCXNsvZh8ZoB02ZAWgIR0Bqcv+XJHRUdX2UKGgGR0BtzPMwDeTFaAdNdAFoCEdAanTVkMCtBHV9lChoBkdAcGUq1PWQOmgHTcABaAhHQGp29vjwQUZ1fZQoaAZHQHCFHVkMCtBoB01mAWgIR0BqeqcG1QZXdX2UKGgGR0BttfeWOZLJaAdNlwFoCEdAanyZFXq7iHV9lChoBkdAac7/dZaFEmgHTZoBaAhHQGqAgRkEs8R1fZQoaAZHQHBAC/47A+JoB01DAWgIR0BqghKFqSHNdX2UKGgGR0BtstOsT37DaAdNqgFoCEdAaoQewLVnVXV9lChoBkdAat14u
bqhUWgHTZUBaAhHQGqIDFId2gZ1fZQoaAZHQG53RMWXTmZoB016AWgIR0BqiePBBRhudX2UKGgGR0BxNCjafzz3aAdNTgFoCEdAaouCFsYVI3V9lChoBkdARbkEzO5avGgHS/JoCEdAao6evIOpbXV9lChoBkdAcHYPSlWOqGgHTdsCaAhHQGqSrpaA4GV1fZQoaAZHQHAnDtG/etVoB01YAWgIR0BqlmBxxT86dX2UKGgGR0BtUQzUI9kjaAdNaAFoCEdAapgdS2phnnV9lChoBkdAcSiY64lQdmgHTagDaAhHQGqe2saKk2x1fZQoaAZHQHALtlAeJYVoB02DAWgIR0BqoLksBhhIdX2UKGgGR0Bsr7jYI0IkaAdNigFoCEdAaqSXKr7wa3V9lChoBkdAbF2Fh5PdmGgHTWABaAhHQGqmSI55qud1fZQoaAZHQG56YaP0Zm9oB01xAWgIR0BqqBFAmiQDdX2UKGgGR0ByMtCXyAhCaAdNQwFoCEdAaquWi1y/9HV9lChoBkdAb78ynk1dgWgHTWsBaAhHQGqtUCih37l1fZQoaAZHQG2wAvtdAxBoB01fAWgIR0BqrvkxREWqdX2UKGgGR0ByYHJNj9XLaAdNWQFoCEdAarKyE+Pik3V9lChoBkdAcI9udf9gnmgHTZQCaAhHQGq196cAiml1fZQoaAZHQHAYeLvTgEVoB01mAWgIR0BquazzErGzdX2UKGgGR0BsJaMm4RVZaAdNkQFoCEdAarueA/cFhXV9lChoBkdAb8TW1c+qzmgHTVEBaAhHQGq/OT7l7t11fZQoaAZHQG5S2tdRiw1oB02LAWgIR0BqwRul41P4dX2UKGgGR0BsbHMW43FUaAdNggFoCEdAasLtFa0Qb3V9lChoBkdAbZvXLeQ+2WgHTcUBaAhHQGrHEGJN0vJ1fZQoaAZHQG5iHFo+OfdoB02lAWgIR0BqyRnBciW3dX2UKGgGR0Bvs4Q176YWaAdN3gFoCEdAas1egL7XQXV9lChoBkdAcRcIAwPAf2gHTYYBaAhHQGrPQb+98JF1fZQoaAZHQGyEhMJx//hoB01XAWgIR0Bq0OgpSaVldX2UKGgGR0Bwj5tpEhJRaAdNuQFoCEdAatUM1CPZI3V9lChoBkdActyEx7AtWmgHTUEBaAhHQGrWmXPZ7HB1fZQoaAZHQGvohIvrWy1oB02VAWgIR0Bq2IJVsDW9dX2UKGgGR0Bqqkn7YTTOaAdNmgFoCEdAatx04BFNL3V9lChoBkdAbGqS2Yv38GgHTVsBaAhHQGreIP9UCJZ1fZQoaAZHQHH+KXrt3OhoB02JAWgIR0Bq4fp0OmSAdX2UKGgGR0BuABZSvTw2aAdNhgFoCEdAauPSv1UVBXV9lChoBkdAcnxXpnpSrGgHTZQBaAhHQGrlvrOZ9eB1fZQoaAZHQG/7ECvHLidoB02EAWgIR0Bq6Ymois4ldX2UKGgGR0BwrRp/PPcBaAdNdAFoCEdAautcNYr8SHV9lChoBkdAcBIa/RE4N2gHTcQBaAhHQGrvhDw6QvJ1fZQoaAZHQG93s+NcW0toB010AWgIR0Bq8VMPBi1BdX2UKGgGR0Bu+4cWCVbBaAdNcAFoCEdAavMmZVn27HV9lChoBkdAcUdf+CK77WgHTXQBaAhHQGr2+S0Sh8J1fZQoaAZHQGznD1XeWOZoB02KAWgIR0Bq+N50KZ2IdX2UKGgGR0Bvgyp3os7NaAdNiwFoCEdAavrCqIacZ3V9lChoBkdAcaiKxs2vS2gHTaUDaAhHQGsBg93bEgp1fZQoaAZHQG6yTFl05lxoB02VAWgIR0BrBWr+5vtMdX2UKGgGR0BvcE+JP69CaAdNFANoCEdAawlGza9K3HV9lChoBkdAb7T51vES/WgHTcoDaAhHQGsQpPRArx11fZQoaAZHQHDdp4GD+R5oB02bAWgIR0BrFPYe1a4ddX2UKGgGR0Bu3BZQpF1CaAdNjwFoCEdAa
xbeuV5a/3V9lChoBkdAcH5OUdJaq2gHTbsBaAhHQGsbAood+5R1fZQoaAZHQHAthBzFMqVoB01bAWgIR0BrHLMgU1yedX2UKGgGR0BvgsqWkaddaAdNcwFoCEdAax58iOearnV9lChoBkdAcKY8Djin52gHTbEBaAhHQGsihyCFsYV1fZQoaAZHQHDo09lmOENoB01tAWgIR0BrJEV8CxNZdWUu"
69
+ },
70
+ "ep_success_buffer": {
71
+ ":type:": "<class 'collections.deque'>",
72
+ ":serialized:": "gAWVIAAAAAAAAACMC2NvbGxlY3Rpb25zlIwFZGVxdWWUk5QpS2SGlFKULg=="
73
+ },
74
+ "_n_updates": 3908,
75
+ "observation_space": {
76
+ ":type:": "<class 'gymnasium.spaces.box.Box'>",
77
+ ":serialized:": "gAWVdwIAAAAAAACMFGd5bW5hc2l1bS5zcGFjZXMuYm94lIwDQm94lJOUKYGUfZQojAVkdHlwZZSMBW51bXB5lIwFZHR5cGWUk5SMAmY0lImIh5RSlChLA4wBPJROTk5K/////0r/////SwB0lGKMDWJvdW5kZWRfYmVsb3eUjBNudW1weS5fY29yZS5udW1lcmljlIwLX2Zyb21idWZmZXKUk5QolggAAAAAAAAAAQEBAQEBAQGUaAiMAmIxlImIh5RSlChLA4wBfJROTk5K/////0r/////SwB0lGJLCIWUjAFDlHSUUpSMDWJvdW5kZWRfYWJvdmWUaBEolggAAAAAAAAAAQEBAQEBAQGUaBVLCIWUaBl0lFKUjAZfc2hhcGWUSwiFlIwDbG93lGgRKJYgAAAAAAAAAAAAtMIAALTCAACgwAAAoMDbD0nAAACgwAAAAIAAAACAlGgLSwiFlGgZdJRSlIwEaGlnaJRoESiWIAAAAAAAAAAAALRCAAC0QgAAoEAAAKBA2w9JQAAAoEAAAIA/AACAP5RoC0sIhZRoGXSUUpSMCGxvd19yZXBylIxbWy05MC4gICAgICAgIC05MC4gICAgICAgICAtNS4gICAgICAgICAtNS4gICAgICAgICAtMy4xNDE1OTI3ICAtNS4KICAtMC4gICAgICAgICAtMC4gICAgICAgXZSMCWhpZ2hfcmVwcpSMU1s5MC4gICAgICAgIDkwLiAgICAgICAgIDUuICAgICAgICAgNS4gICAgICAgICAzLjE0MTU5MjcgIDUuCiAgMS4gICAgICAgICAxLiAgICAgICBdlIwKX25wX3JhbmRvbZROdWIu",
78
+ "dtype": "float32",
79
+ "bounded_below": "[ True True True True True True True True]",
80
+ "bounded_above": "[ True True True True True True True True]",
81
+ "_shape": [
82
+ 8
83
+ ],
84
+ "low": "[-90. -90. -5. -5. -3.1415927 -5.\n -0. -0. ]",
85
+ "high": "[90. 90. 5. 5. 3.1415927 5.\n 1. 1. ]",
86
+ "low_repr": "[-90. -90. -5. -5. -3.1415927 -5.\n -0. -0. ]",
87
+ "high_repr": "[90. 90. 5. 5. 3.1415927 5.\n 1. 1. ]",
88
+ "_np_random": null
89
+ },
90
+ "action_space": {
91
+ ":type:": "<class 'gymnasium.spaces.discrete.Discrete'>",
92
+ ":serialized:": "gAWV3AAAAAAAAACMGWd5bW5hc2l1bS5zcGFjZXMuZGlzY3JldGWUjAhEaXNjcmV0ZZSTlCmBlH2UKIwBbpSMFm51bXB5Ll9jb3JlLm11bHRpYXJyYXmUjAZzY2FsYXKUk5SMBW51bXB5lIwFZHR5cGWUk5SMAmk4lImIh5RSlChLA4wBPJROTk5K/////0r/////SwB0lGJDCAQAAAAAAAAAlIaUUpSMBXN0YXJ0lGgIaA5DCAAAAAAAAAAAlIaUUpSMBl9zaGFwZZQpjAVkdHlwZZRoDowKX25wX3JhbmRvbZROdWIu",
93
+ "n": "4",
94
+ "start": "0",
95
+ "_shape": [],
96
+ "dtype": "int64",
97
+ "_np_random": null
98
+ },
99
+ "n_envs": 1,
100
+ "n_steps": 1024,
101
+ "gamma": 0.999,
102
+ "gae_lambda": 0.98,
103
+ "ent_coef": 0.01,
104
+ "vf_coef": 0.5,
105
+ "max_grad_norm": 0.5,
106
+ "batch_size": 64,
107
+ "n_epochs": 4,
108
+ "clip_range": {
109
+ ":type:": "<class 'function'>",
110
+ ":serialized:": "gAWVEgMAAAAAAACMF2Nsb3VkcGlja2xlLmNsb3VkcGlja2xllIwOX21ha2VfZnVuY3Rpb26Uk5QoaACMDV9idWlsdGluX3R5cGWUk5SMCENvZGVUeXBllIWUUpQoSwFLAEsASwFLAUsTQwg+AZUAVAEkAJROhZQpjAFflIWUjGcvVXNlcnMvc2FtcGxpbmcvV29ya3NwYWNlL1JML3VuaXQxLy52ZW52L2xpYi9weXRob24zLjEzL3NpdGUtcGFja2FnZXMvc3RhYmxlX2Jhc2VsaW5lczMvY29tbW9uL3V0aWxzLnB5lIwEZnVuY5SMGWNvbnN0YW50X2ZuLjxsb2NhbHM+LmZ1bmOUS4RDCPiAANgPEogKlEMAlIwDdmFslIWUKXSUUpR9lCiMC19fcGFja2FnZV9flIwYc3RhYmxlX2Jhc2VsaW5lczMuY29tbW9ulIwIX19uYW1lX1+UjB5zdGFibGVfYmFzZWxpbmVzMy5jb21tb24udXRpbHOUjAhfX2ZpbGVfX5SMZy9Vc2Vycy9zYW1wbGluZy9Xb3Jrc3BhY2UvUkwvdW5pdDEvLnZlbnYvbGliL3B5dGhvbjMuMTMvc2l0ZS1wYWNrYWdlcy9zdGFibGVfYmFzZWxpbmVzMy9jb21tb24vdXRpbHMucHmUdU5OaACMEF9tYWtlX2VtcHR5X2NlbGyUk5QpUpSFlHSUUpRoAIwSX2Z1bmN0aW9uX3NldHN0YXRllJOUaCF9lH2UKGgYjARmdW5jlIwMX19xdWFsbmFtZV9flIwZY29uc3RhbnRfZm4uPGxvY2Fscz4uZnVuY5SMD19fYW5ub3RhdGlvbnNfX5R9lIwOX19rd2RlZmF1bHRzX1+UTowMX19kZWZhdWx0c19flE6MCl9fbW9kdWxlX1+UaBmMB19fZG9jX1+UTowLX19jbG9zdXJlX1+UaACMCl9tYWtlX2NlbGyUk5RHP8mZmZmZmZqFlFKUhZSMF19jbG91ZHBpY2tsZV9zdWJtb2R1bGVzlF2UjAtfX2dsb2JhbHNfX5R9lHWGlIZSMC4="
111
+ },
112
+ "clip_range_vf": null,
113
+ "normalize_advantage": true,
114
+ "target_kl": null,
115
+ "lr_schedule": {
116
+ ":type:": "<class 'function'>",
117
+ ":serialized:": "gAWVEgMAAAAAAACMF2Nsb3VkcGlja2xlLmNsb3VkcGlja2xllIwOX21ha2VfZnVuY3Rpb26Uk5QoaACMDV9idWlsdGluX3R5cGWUk5SMCENvZGVUeXBllIWUUpQoSwFLAEsASwFLAUsTQwg+AZUAVAEkAJROhZQpjAFflIWUjGcvVXNlcnMvc2FtcGxpbmcvV29ya3NwYWNlL1JML3VuaXQxLy52ZW52L2xpYi9weXRob24zLjEzL3NpdGUtcGFja2FnZXMvc3RhYmxlX2Jhc2VsaW5lczMvY29tbW9uL3V0aWxzLnB5lIwEZnVuY5SMGWNvbnN0YW50X2ZuLjxsb2NhbHM+LmZ1bmOUS4RDCPiAANgPEogKlEMAlIwDdmFslIWUKXSUUpR9lCiMC19fcGFja2FnZV9flIwYc3RhYmxlX2Jhc2VsaW5lczMuY29tbW9ulIwIX19uYW1lX1+UjB5zdGFibGVfYmFzZWxpbmVzMy5jb21tb24udXRpbHOUjAhfX2ZpbGVfX5SMZy9Vc2Vycy9zYW1wbGluZy9Xb3Jrc3BhY2UvUkwvdW5pdDEvLnZlbnYvbGliL3B5dGhvbjMuMTMvc2l0ZS1wYWNrYWdlcy9zdGFibGVfYmFzZWxpbmVzMy9jb21tb24vdXRpbHMucHmUdU5OaACMEF9tYWtlX2VtcHR5X2NlbGyUk5QpUpSFlHSUUpRoAIwSX2Z1bmN0aW9uX3NldHN0YXRllJOUaCF9lH2UKGgYjARmdW5jlIwMX19xdWFsbmFtZV9flIwZY29uc3RhbnRfZm4uPGxvY2Fscz4uZnVuY5SMD19fYW5ub3RhdGlvbnNfX5R9lIwOX19rd2RlZmF1bHRzX1+UTowMX19kZWZhdWx0c19flE6MCl9fbW9kdWxlX1+UaBmMB19fZG9jX1+UTowLX19jbG9zdXJlX1+UaACMCl9tYWtlX2NlbGyUk5RHPzOpKjBVMmGFlFKUhZSMF19jbG91ZHBpY2tsZV9zdWJtb2R1bGVzlF2UjAtfX2dsb2JhbHNfX5R9lHWGlIZSMC4="
118
+ }
119
+ }
ppo-LunarLander-v2/policy.optimizer.pth ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:27560c1d0f29b23bdbf4805137716d65f3ff1b1ac777e1e20529981bb133ebde
3
+ size 88375
ppo-LunarLander-v2/policy.pth ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:fea19844ed4e715e6f5a78c5c4b8f52f753b64a2e930686e7f0d9557840c4884
3
+ size 43967
ppo-LunarLander-v2/pytorch_variables.pth ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:7b6bbfc035aeac78f3ee425960893ff8bb7927d3cf3425470ac4b6c6ce280c5d
3
+ size 1261
ppo-LunarLander-v2/system_info.txt ADDED
@@ -0,0 +1,8 @@
 
 
 
 
 
 
 
 
 
1
+ - OS: macOS-15.6.1-arm64-arm-64bit-Mach-O Darwin Kernel Version 24.6.0: Mon Jul 14 11:30:34 PDT 2025; root:xnu-11417.140.69~1/RELEASE_ARM64_T8103
2
+ - Python: 3.13.4
3
+ - Stable-Baselines3: 2.0.0a5
4
+ - PyTorch: 2.8.0
5
+ - GPU Enabled: False
6
+ - Numpy: 2.3.2
7
+ - Cloudpickle: 3.1.1
8
+ - Gymnasium: 0.28.1
replay.mp4 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:6d60c508ca6138e15e3ad44814b5ca996a7fc436de3d8800b58351ce8c793aa7
3
+ size 180147
results.json ADDED
@@ -0,0 +1 @@
 
 
1
+ {"mean_reward": 242.9787788215837, "std_reward": 34.6137894715336, "is_deterministic": true, "n_eval_episodes": 10, "eval_datetime": "2025-08-26T21:08:30.885733"}