Upload PPO LunarLander-v2 trained agent
Browse files- README.md +1 -1
- config.json +1 -1
- ppo-LunarLander-v2.zip +2 -2
- ppo-LunarLander-v2/data +29 -37
- ppo-LunarLander-v2/policy.optimizer.pth +2 -2
- ppo-LunarLander-v2/policy.pth +2 -2
- ppo-LunarLander-v2/pytorch_variables.pth +1 -1
- ppo-LunarLander-v2/system_info.txt +7 -7
- replay.mp4 +2 -2
- results.json +1 -1
README.md
CHANGED
|
@@ -16,7 +16,7 @@ model-index:
|
|
| 16 |
type: LunarLander-v2
|
| 17 |
metrics:
|
| 18 |
- type: mean_reward
|
| 19 |
-
value:
|
| 20 |
name: mean_reward
|
| 21 |
verified: false
|
| 22 |
---
|
|
|
|
| 16 |
type: LunarLander-v2
|
| 17 |
metrics:
|
| 18 |
- type: mean_reward
|
| 19 |
+
value: 275.78 +/- 17.29
|
| 20 |
name: mean_reward
|
| 21 |
verified: false
|
| 22 |
---
|
config.json
CHANGED
|
@@ -1 +1 @@
|
|
| 1 |
-
{"policy_class": {":type:": "<class 'abc.ABCMeta'>", ":serialized:": "gAWVOwAAAAAAAACMIXN0YWJsZV9iYXNlbGluZXMzLmNvbW1vbi5wb2xpY2llc5SMEUFjdG9yQ3JpdGljUG9saWN5lJOULg==", "__module__": "stable_baselines3.common.policies", "__doc__": "\n Policy class for actor-critic algorithms (has both policy and value prediction).\n Used by A2C, PPO and the likes.\n\n :param observation_space: Observation space\n :param action_space: Action space\n :param lr_schedule: Learning rate schedule (could be constant)\n :param net_arch: The specification of the policy and value networks.\n :param activation_fn: Activation function\n :param ortho_init: Whether to use or not orthogonal initialization\n :param use_sde: Whether to use State Dependent Exploration or not\n :param log_std_init: Initial value for the log standard deviation\n :param full_std: Whether to use (n_features x n_actions) parameters\n for the std instead of only (n_features,) when using gSDE\n :param use_expln: Use ``expln()`` function instead of ``exp()`` to ensure\n a positive standard deviation (cf paper). It allows to keep variance\n above zero and prevent it from growing too fast. In practice, ``exp()`` is usually enough.\n :param squash_output: Whether to squash the output using a tanh function,\n this allows to ensure boundaries when using gSDE.\n :param features_extractor_class: Features extractor to use.\n :param features_extractor_kwargs: Keyword arguments\n to pass to the features extractor.\n :param share_features_extractor: If True, the features extractor is shared between the policy and value networks.\n :param normalize_images: Whether to normalize images or not,\n dividing by 255.0 (True by default)\n :param optimizer_class: The optimizer to use,\n ``th.optim.Adam`` by default\n :param optimizer_kwargs: Additional keyword arguments,\n excluding the learning rate, to pass to the optimizer\n ", "__init__": "<function ActorCriticPolicy.__init__ at 0x37cc609a0>", "_get_constructor_parameters": "<function ActorCriticPolicy._get_constructor_parameters at 0x37cc60a40>", "reset_noise": "<function ActorCriticPolicy.reset_noise at 0x37cc60ae0>", "_build_mlp_extractor": "<function ActorCriticPolicy._build_mlp_extractor at 0x37cc60b80>", "_build": "<function ActorCriticPolicy._build at 0x37cc60c20>", "forward": "<function ActorCriticPolicy.forward at 0x37cc60cc0>", "extract_features": "<function ActorCriticPolicy.extract_features at 0x37cc60d60>", "_get_action_dist_from_latent": "<function ActorCriticPolicy._get_action_dist_from_latent at 0x37cc60e00>", "_predict": "<function ActorCriticPolicy._predict at 0x37cc60ea0>", "evaluate_actions": "<function ActorCriticPolicy.evaluate_actions at 0x37cc60f40>", "get_distribution": "<function ActorCriticPolicy.get_distribution at 0x37cc60fe0>", "predict_values": "<function ActorCriticPolicy.predict_values at 0x37cc61080>", "__abstractmethods__": "frozenset()", "_abc_impl": "<_abc._abc_data object at 0x37cafad00>"}, "verbose": 1, "policy_kwargs": {"net_arch": [256, 256]}, "num_timesteps": 1507328, "_total_timesteps": 1500000, "_num_timesteps_at_start": 0, "seed": null, "action_noise": null, "start_time": 1765036791869687000, "learning_rate": {":type:": "<class 'function'>", ":serialized:": "gAWV+QEAAAAAAACMF2Nsb3VkcGlja2xlLmNsb3VkcGlja2xllIwOX21ha2VfZnVuY3Rpb26Uk5QoaACMDV9idWlsdGluX3R5cGWUk5SMCENvZGVUeXBllIWUUpQoSwFLAEsASwFLA0sDQxKXAGQBZAJ8AHoKAAB6BQAAUwCUTkc/Gjbi6xxDLUsBh5QpjAFflIWUjE4vdmFyL2ZvbGRlcnMva2wveTE3cGtxNG4zeHoycXk3YnZyYmRwaHFjMDAwMGduL1QvaXB5a2VybmVsXzU1NDM4LzM5Mzg1NjQwMjkucHmUjAg8bGFtYmRhPpRoDUsTQw6AAJhEoEGoAaFFmU6AAJRDAJQpKXSUUpR9lCiMC19fcGFja2FnZV9flE6MCF9fbmFtZV9flIwIX19tYWluX1+UdU5OTnSUUpRoAIwSX2Z1bmN0aW9uX3NldHN0YXRllJOUaBd9lH2UKGgUaA2MDF9fcXVhbG5hbWVfX5RoDYwPX19hbm5vdGF0aW9uc19flH2UjA5fX2t3ZGVmYXVsdHNfX5ROjAxfX2RlZmF1bHRzX1+UTowKX19tb2R1bGVfX5RoFYwHX19kb2NfX5ROjAtfX2Nsb3N1cmVfX5ROjBdfY2xvdWRwaWNrbGVfc3VibW9kdWxlc5RdlIwLX19nbG9iYWxzX1+UfZR1hpSGUjAu"}, "tensorboard_log": null, "_last_obs": {":type:": "<class 'numpy.ndarray'>", ":serialized:": "gAWVdQIAAAAAAACMEm51bXB5LmNvcmUubnVtZXJpY5SMC19mcm9tYnVmZmVylJOUKJYAAgAAAAAAADP+KL5XzGo/eMy6vWmtT75vQQK+cYGUPQAAAAAAAAAAzYyYuVJc9rvYCkK+rvpLu97JRz2ryd89AACAPwAAgD/gjSa+wSdNP7oMnL3DuZi+lmawvedJJL0AAAAAAAAAAIA7r70DTHI9mVWiPu/qK76afBA9ttolvQAAAAAAAAAAps7FvaQKMzybEWE9y5A1vpRBdL2AcT09AAAAAAAAAACalfy7ycUDPguVjT5BzDK+BAV1PdPEbD0AAAAAAAAAAA13mD2S4h0/ZfgTvjIRhb4F/WK86L6JvQAAAAAAAAAAM6tIPa+ApT4gD0s8NhBbvvIte7v4xf86AAAAAAAAAADNeLq9Roo0P+bCEb5itZ++WknMvTZ0GTwAAAAAAAAAAADYpzwc1Vi8bdvBOylotjw217m9efiSPQAAgD8AAIA/c4qqvfbkV7pW6T49sKcDNuaZzToIF/g0AAAAAAAAAADqrV6+4/MMP6D35zzaaW++2I6svTHliz0AAAAAAAAAANDBmj59a5o/XkO2PkeXur7vCng+inIevgAAAAAAAAAATYg/vRLa8jwe6cY8Zz1Zvu2KETyYu2S9AAAAAAAAAAAAfnu8i++vP6oavb5ZkeO+xJTPO0YqB70AAAAAAAAAANKenL4ROkg/JhLOvYYFtb6RCSy+phBfPQAAAAAAAAAAlIwFbnVtcHmUjAVkdHlwZZSTlIwCZjSUiYiHlFKUKEsDjAE8lE5OTkr/////Sv////9LAHSUYksQSwiGlIwBQ5R0lFKULg=="}, "_last_episode_starts": {":type:": "<class 'numpy.ndarray'>", ":serialized:": "gAWVgwAAAAAAAACMEm51bXB5LmNvcmUubnVtZXJpY5SMC19mcm9tYnVmZmVylJOUKJYQAAAAAAAAAAAAAAAAAAAAAAAAAAAAAACUjAVudW1weZSMBWR0eXBllJOUjAJiMZSJiIeUUpQoSwOMAXyUTk5OSv////9K/////0sAdJRiSxCFlIwBQ5R0lFKULg=="}, "_last_original_obs": null, "_episode_num": 0, "use_sde": false, "sde_sample_freq": -1, "_current_progress_remaining": -0.004885333333333408, "_stats_window_size": 100, "ep_info_buffer": {":type:": "<class 'collections.deque'>", ":serialized:": "gAWVQAwAAAAAAACMC2NvbGxlY3Rpb25zlIwFZGVxdWWUk5QpS2SGlFKUKH2UKIwBcpRHQG6Ibs4T9KqMAWyUTU4BjAF0lEdAire2H1vl2nV9lChoBkdAcXcEdeY2KmgHTRkBaAhHQIq4Wn4wh4d1fZQoaAZHQGxXFQ2uPmxoB00oAWgIR0CKuKj/uLJkdX2UKGgGR0AoVhWo3rD7aAdL82gIR0CKuecx0uDjdX2UKGgGR0Bw6hQGfPHDaAdNVQFoCEdAirsgTZg5R3V9lChoBkdAbIGNI9TxXmgHTToBaAhHQIq8bo0Q9Rt1fZQoaAZHQG15srNGEwpoB00lAWgIR0CKvRWo3rD7dX2UKGgGR0BvQ0fcN6PbaAdNDgFoCEdAir0ebNKRMnV9lChoBkdAcnQa72+PBGgHTTIBaAhHQIq9XJYDDCR1fZQoaAZHQG4fPrWy1NRoB003AWgIR0CKvdz+WGATdX2UKGgGR0Bx62ePJaJRaAdNQwFoCEdAir6MiB5HE3V9lChoBkdAcUEiiZfD12gHTTABaAhHQIq+rSqlxfh1fZQoaAZHQG8h6uOjqOdoB00iAWgIR0CKvyCROk+HdX2UKGgGR0Bx+m65Gz8haAdNIQFoCEdAir+FRP420nV9lChoBkdAcb0HxjJ+2GgHTT8BaAhHQIrA4Wi1y/91fZQoaAZHQHDLtyYG+sZoB004AWgIR0CKwUydnTRZdX2UKGgGR0Bu6zTWoWHlaAdNNwFoCEdAisJRmbsniXV9lChoBkdAcM9+ERJ2+2gHTU0BaAhHQIrCpEWqLjx1fZQoaAZHQCJUTBZZB9loB0vpaAhHQIrDpnDiwSt1fZQoaAZHQESwe8PFvQ5oB0veaAhHQIrD1ELH+611fZQoaAZHQHBKc+qzZ6FoB01AAWgIR0CKxArhisnzdX2UKGgGR0BwVdRFZxJeaAdNPwFoCEdAisU3+dbxE3V9lChoBkdAbnzRl6JIlWgHTSkBaAhHQIrGV6Vt4zJ1fZQoaAZHQHD/b4Ju2qloB002AWgIR0CKx7pRoAXEdX2UKGgGR0Budz2g3974aAdNJAFoCEdAisfn4fwI+nV9lChoBkdAcS5de6ZpjGgHTV0BaAhHQIrIfcFhXsB1fZQoaAZHQHEKfoA4n4RoB00lAWgIR0CKyIzoEB8ydX2UKGgGR0BryXtx+8XfaAdNJAFoCEdAisjpwsGxEHV9lChoBkdAbs/OKO1fFGgHTVsBaAhHQIrJvYBeXzF1fZQoaAZHQG4XVQ66reZoB00rAWgIR0CKyoElE7W/dX2UKGgGR0BxbG2d/axpaAdNKQFoCEdAisraLfk3j3V9lChoBkdAbct5M10knmgHTRkBaAhHQIrLYFiay8l1fZQoaAZHQHHLZRXOnl5oB01FAWgIR0CKzRDNyHVPdX2UKGgGR0Bx6cM9bHIZaAdNHQFoCEdAis0/s3Q2M3V9lChoBkdAb/6+VTrE+GgHTS8BaAhHQIrNbIT4+KV1fZQoaAZHQHBlqubI91VoB005AWgIR0CKze2FWXC1dX2UKGgGR0BwpNRQ79ycaAdNNAFoCEdAis9IBJZntnV9lChoBkdAbmJa/RE4N2gHTTYBaAhHQIrQhid8Rcx1fZQoaAZHQGzUJ4B3iaRoB00fAWgIR0CK0P9Wp6yCdX2UKGgGR0BvgNEgGKQ8aAdNEAFoCEdAitFAXEZR9HV9lChoBkdAcbVfEn9ehWgHTQsBaAhHQIrRg/xDst11fZQoaAZHQG9m02tMfzVoB00wAWgIR0CK0kgoPTXrdX2UKGgGR0Bw03lmvnr6aAdNTAFoCEdAitKLtmcvunV9lChoBkdAcYQlRxcVxmgHTSoBaAhHQIrTS/Efkmx1fZQoaAZHQGBxoqLCN0hoB03oA2gIR0CK1FVQyhzvdX2UKGgGR0BwRQWKuSwGaAdNLAFoCEdAitUKJEYwZnV9lChoBkdAcHG+WGATZmgHTRQBaAhHQIrWLPIGQjl1fZQoaAZHQHFBOyquKXRoB01vAWgIR0CK1pwFTvRadX2UKGgGR0BxJToePq9oaAdNGQFoCEdAitb7y6MBIXV9lChoBkdAcbnlruYx+WgHTUsBaAhHQIrXr15B1Ld1fZQoaAZHQHIY6VdHDrJoB01VAWgIR0CK2FVFQVKxdX2UKGgGR0BwgnFtKqXGaAdNFAFoCEdAitnQ04zabnV9lChoBkdAckNtShrWRWgHTVgBaAhHQIraTfLs8gZ1fZQoaAZHQG5X181Gb1BoB00bAWgIR0CK2l3225QQdX2UKGgGR0BvlSkEcKgJaAdNMwFoCEdAitqeiSJTEXV9lChoBkdAbrtQqqfe12gHTUQBaAhHQIrau4G2TgV1fZQoaAZHQHBxpzPrv9doB00mAWgIR0CK22UO/cnFdX2UKGgGR0BxjUtvn8sMaAdNNAFoCEdAitwMMAmzB3V9lChoBkdAcW3PLPldT2gHTQEBaAhHQIrcS4SYgJV1fZQoaAZHQG9Jgntv4udoB002AWgIR0CK3MwTufEodX2UKGgGR0BwVqAqd6LPaAdNLAFoCEdAit4jr7fpEHV9lChoBkdAccBpbD/EO2gHTSoBaAhHQIrfKx5cC5p1fZQoaAZHQG5PFQMx46hoB00nAWgIR0CK3/Bt1p0wdX2UKGgGR0BwvZHz6JqJaAdNSgFoCEdAiuC37+DODHV9lChoBkdAcML3ljmSyWgHTTQBaAhHQIrhN6LOzIF1fZQoaAZHQG3Krh73PAxoB00oAWgIR0CK4YXuVopQdX2UKGgGR0ByQoYAKfFraAdNLwFoCEdAiuPr0J4SpXV9lChoBkdAcd6TUiILxGgHS/doCEdAiuQLiuMdcXV9lChoBkdAa2WsIVuaW2gHTTABaAhHQIrkbhNucc51fZQoaAZHQG4UG9xp+MJoB01DAWgIR0CK5J+TeO4odX2UKGgGR0ByBHY287IUaAdNVwFoCEdAiuTT/IbOvHV9lChoBkdAcDagMc6vJWgHTUQBaAhHQIrk+0ojOcF1fZQoaAZHQHFFo9kjHGVoB009AWgIR0CK5Zkd3jdYdX2UKGgGR0BwSmWE9MbnaAdNEwFoCEdAiuXV89fTkXV9lChoBkdAbXv1ZkkKNWgHTUIBaAhHQIrmpjhDPWx1fZQoaAZHQHDYrnTy8SRoB00gAWgIR0CK559zfaYedX2UKGgGR0Br6aufVZs9aAdNNgFoCEdAiulyeRPoFHV9lChoBkdAXaU5OrQw9WgHTegDaAhHQIrqXn8sMAp1fZQoaAZHQHB3S/O+qR5oB00xAWgIR0CK6tdrwe/6dX2UKGgGR0ByW62rn1WbaAdNUwFoCEdAius4FA3T/nV9lChoBkdAa/TBTn7pFGgHTSgBaAhHQIrrS1y/9Hd1fZQoaAZHQHGmugxrSE1oB00yAWgIR0CK61Jo0ygxdX2UKGgGR0Bu9WZ5Rjz7aAdNGgFoCEdAiuzhPCVKPHV9lChoBkdAcDnvAGjbjGgHTSwBaAhHQIruJI1+AmR1fZQoaAZHQHCphjawljVoB00UAWgIR0CK7jIyTINmdX2UKGgGR0Bx8uEg4ffXaAdNPwFoCEdAiu5hg/keZHV9lChoBkdAcdEVh1DBuWgHTToBaAhHQIrutJjDsMR1fZQoaAZHQG/6nUlRgqpoB003AWgIR0CK73P0I1LrdX2UKGgGR0ByA7VRUFSsaAdNZAFoCEdAiu+aVMVUM3V9lChoBkdAbTadTYNAkmgHTSgBaAhHQIrvzl3hXKd1fZQoaAZHQHG3fZElVtJoB00lAWgIR0CK8IgxJul5dX2UKGgGR0Bxm3jhky1vaAdNoAFoCEdAivCiosI3SHV9lChoBkdAcKgDIikftGgHTR4BaAhHQIryxOWSlnB1fZQoaAZHQG8aL/82rGRoB01AAWgIR0CK8wbz9S/CdX2UKGgGR0BuJEwvg3tKaAdNGwFoCEdAivODTBqKxnV9lChoBkdAcC4GMXJo02gHTSgBaAhHQIr0BJ2+wkh1fZQoaAZHQHE8CgPEsJ9oB009AWgIR0CK9DBvaURndX2UKGgGR0BwIolXzUZvaAdNSAFoCEdAivTsnJDE33V9lChoBkdAbFsf0VafSWgHTRIBaAhHQIr09pZfUnZ1fZQoaAZHQG/FJFCswL5oB00YAWgIR0CK9obS7Xg+dWUu"}, "ep_success_buffer": {":type:": "<class 'collections.deque'>", ":serialized:": "gAWVIAAAAAAAAACMC2NvbGxlY3Rpb25zlIwFZGVxdWWUk5QpS2SGlFKULg=="}, "_n_updates": 460, "observation_space": {":type:": "<class 'gymnasium.spaces.box.Box'>", ":serialized:": "gAWVdgIAAAAAAACMFGd5bW5hc2l1bS5zcGFjZXMuYm94lIwDQm94lJOUKYGUfZQojAVkdHlwZZSMBW51bXB5lIwFZHR5cGWUk5SMAmY0lImIh5RSlChLA4wBPJROTk5K/////0r/////SwB0lGKMDWJvdW5kZWRfYmVsb3eUjBJudW1weS5jb3JlLm51bWVyaWOUjAtfZnJvbWJ1ZmZlcpSTlCiWCAAAAAAAAAABAQEBAQEBAZRoCIwCYjGUiYiHlFKUKEsDjAF8lE5OTkr/////Sv////9LAHSUYksIhZSMAUOUdJRSlIwNYm91bmRlZF9hYm92ZZRoESiWCAAAAAAAAAABAQEBAQEBAZRoFUsIhZRoGXSUUpSMBl9zaGFwZZRLCIWUjANsb3eUaBEoliAAAAAAAAAAAAC0wgAAtMIAAKDAAACgwNsPScAAAKDAAAAAgAAAAICUaAtLCIWUaBl0lFKUjARoaWdolGgRKJYgAAAAAAAAAAAAtEIAALRCAACgQAAAoEDbD0lAAACgQAAAgD8AAIA/lGgLSwiFlGgZdJRSlIwIbG93X3JlcHKUjFtbLTkwLiAgICAgICAgLTkwLiAgICAgICAgIC01LiAgICAgICAgIC01LiAgICAgICAgIC0zLjE0MTU5MjcgIC01LgogIC0wLiAgICAgICAgIC0wLiAgICAgICBdlIwJaGlnaF9yZXBylIxTWzkwLiAgICAgICAgOTAuICAgICAgICAgNS4gICAgICAgICA1LiAgICAgICAgIDMuMTQxNTkyNyAgNS4KICAxLiAgICAgICAgIDEuICAgICAgIF2UjApfbnBfcmFuZG9tlE51Yi4=", "dtype": "float32", "bounded_below": "[ True True True True True True True True]", "bounded_above": "[ True True True True True True True True]", "_shape": [8], "low": "[-90. -90. -5. -5. -3.1415927 -5.\n -0. -0. ]", "high": "[90. 90. 5. 5. 3.1415927 5.\n 1. 1. ]", "low_repr": "[-90. -90. -5. -5. -3.1415927 -5.\n -0. -0. ]", "high_repr": "[90. 90. 5. 5. 3.1415927 5.\n 1. 1. ]", "_np_random": null}, "action_space": {":type:": "<class 'gymnasium.spaces.discrete.Discrete'>", ":serialized:": "gAWV2wAAAAAAAACMGWd5bW5hc2l1bS5zcGFjZXMuZGlzY3JldGWUjAhEaXNjcmV0ZZSTlCmBlH2UKIwBbpSMFW51bXB5LmNvcmUubXVsdGlhcnJheZSMBnNjYWxhcpSTlIwFbnVtcHmUjAVkdHlwZZSTlIwCaTiUiYiHlFKUKEsDjAE8lE5OTkr/////Sv////9LAHSUYkMIBAAAAAAAAACUhpRSlIwFc3RhcnSUaAhoDkMIAAAAAAAAAACUhpRSlIwGX3NoYXBllCmMBWR0eXBllGgOjApfbnBfcmFuZG9tlE51Yi4=", "n": "4", "start": "0", "_shape": [], "dtype": "int64", "_np_random": null}, "n_envs": 16, "n_steps": 2048, "gamma": 0.99, "gae_lambda": 0.97, "ent_coef": 0.0005, "vf_coef": 0.5, "max_grad_norm": 0.5, "batch_size": 64, "n_epochs": 10, "clip_range": {":type:": "<class 'function'>", ":serialized:": "gAWVvwIAAAAAAACMF2Nsb3VkcGlja2xlLmNsb3VkcGlja2xllIwOX21ha2VfZnVuY3Rpb26Uk5QoaACMDV9idWlsdGluX3R5cGWUk5SMCENvZGVUeXBllIWUUpQoSwFLAEsASwFLAUsTQwiVAZcAiQFTAJROhZQpjAFflIWUjE0vb3B0L2FuYWNvbmRhMy9saWIvcHl0aG9uMy4xMi9zaXRlLXBhY2thZ2VzL3N0YWJsZV9iYXNlbGluZXMzL2NvbW1vbi91dGlscy5weZSMBGZ1bmOUjBljb25zdGFudF9mbi48bG9jYWxzPi5mdW5jlEuEQwj4gADYDxKICpRDAJSMA3ZhbJSFlCl0lFKUfZQojAtfX3BhY2thZ2VfX5SMGHN0YWJsZV9iYXNlbGluZXMzLmNvbW1vbpSMCF9fbmFtZV9flIwec3RhYmxlX2Jhc2VsaW5lczMuY29tbW9uLnV0aWxzlIwIX19maWxlX1+UjE0vb3B0L2FuYWNvbmRhMy9saWIvcHl0aG9uMy4xMi9zaXRlLXBhY2thZ2VzL3N0YWJsZV9iYXNlbGluZXMzL2NvbW1vbi91dGlscy5weZR1Tk5oAIwQX21ha2VfZW1wdHlfY2VsbJSTlClSlIWUdJRSlGgAjBJfZnVuY3Rpb25fc2V0c3RhdGWUk5RoIX2UfZQoaBhoDYwMX19xdWFsbmFtZV9flGgOjA9fX2Fubm90YXRpb25zX1+UfZSMDl9fa3dkZWZhdWx0c19flE6MDF9fZGVmYXVsdHNfX5ROjApfX21vZHVsZV9flGgZjAdfX2RvY19flE6MC19fY2xvc3VyZV9flGgAjApfbWFrZV9jZWxslJOURz/JmZmZmZmahZRSlIWUjBdfY2xvdWRwaWNrbGVfc3VibW9kdWxlc5RdlIwLX19nbG9iYWxzX1+UfZR1hpSGUjAu"}, "clip_range_vf": null, "normalize_advantage": true, "target_kl": null, "lr_schedule": {":type:": "<class 'function'>", ":serialized:": "gAWV+QEAAAAAAACMF2Nsb3VkcGlja2xlLmNsb3VkcGlja2xllIwOX21ha2VfZnVuY3Rpb26Uk5QoaACMDV9idWlsdGluX3R5cGWUk5SMCENvZGVUeXBllIWUUpQoSwFLAEsASwFLA0sDQxKXAGQBZAJ8AHoKAAB6BQAAUwCUTkc/Gjbi6xxDLUsBh5QpjAFflIWUjE4vdmFyL2ZvbGRlcnMva2wveTE3cGtxNG4zeHoycXk3YnZyYmRwaHFjMDAwMGduL1QvaXB5a2VybmVsXzU1NDM4LzM5Mzg1NjQwMjkucHmUjAg8bGFtYmRhPpRoDUsTQw6AAJhEoEGoAaFFmU6AAJRDAJQpKXSUUpR9lCiMC19fcGFja2FnZV9flE6MCF9fbmFtZV9flIwIX19tYWluX1+UdU5OTnSUUpRoAIwSX2Z1bmN0aW9uX3NldHN0YXRllJOUaBd9lH2UKGgUaA2MDF9fcXVhbG5hbWVfX5RoDYwPX19hbm5vdGF0aW9uc19flH2UjA5fX2t3ZGVmYXVsdHNfX5ROjAxfX2RlZmF1bHRzX1+UTowKX19tb2R1bGVfX5RoFYwHX19kb2NfX5ROjAtfX2Nsb3N1cmVfX5ROjBdfY2xvdWRwaWNrbGVfc3VibW9kdWxlc5RdlIwLX19nbG9iYWxzX1+UfZR1hpSGUjAu"}, "system_info": {"OS": "macOS-15.6.1-arm64-arm-64bit Darwin Kernel Version 24.6.0: Mon Jul 14 11:30:40 PDT 2025; root:xnu-11417.140.69~1/RELEASE_ARM64_T6041", "Python": "3.12.2", "Stable-Baselines3": "2.0.0a5", "PyTorch": "2.7.0", "GPU Enabled": "False", "Numpy": "1.26.4", "Cloudpickle": "3.0.0", "Gymnasium": "0.28.1", "OpenAI Gym": "0.26.2"}}
|
|
|
|
| 1 |
+
{"policy_class": {":type:": "<class 'abc.ABCMeta'>", ":serialized:": "gAWVOwAAAAAAAACMIXN0YWJsZV9iYXNlbGluZXMzLmNvbW1vbi5wb2xpY2llc5SMEUFjdG9yQ3JpdGljUG9saWN5lJOULg==", "__module__": "stable_baselines3.common.policies", "__doc__": "\n Policy class for actor-critic algorithms (has both policy and value prediction).\n Used by A2C, PPO and the likes.\n\n :param observation_space: Observation space\n :param action_space: Action space\n :param lr_schedule: Learning rate schedule (could be constant)\n :param net_arch: The specification of the policy and value networks.\n :param activation_fn: Activation function\n :param ortho_init: Whether to use or not orthogonal initialization\n :param use_sde: Whether to use State Dependent Exploration or not\n :param log_std_init: Initial value for the log standard deviation\n :param full_std: Whether to use (n_features x n_actions) parameters\n for the std instead of only (n_features,) when using gSDE\n :param use_expln: Use ``expln()`` function instead of ``exp()`` to ensure\n a positive standard deviation (cf paper). It allows to keep variance\n above zero and prevent it from growing too fast. In practice, ``exp()`` is usually enough.\n :param squash_output: Whether to squash the output using a tanh function,\n this allows to ensure boundaries when using gSDE.\n :param features_extractor_class: Features extractor to use.\n :param features_extractor_kwargs: Keyword arguments\n to pass to the features extractor.\n :param share_features_extractor: If True, the features extractor is shared between the policy and value networks.\n :param normalize_images: Whether to normalize images or not,\n dividing by 255.0 (True by default)\n :param optimizer_class: The optimizer to use,\n ``th.optim.Adam`` by default\n :param optimizer_kwargs: Additional keyword arguments,\n excluding the learning rate, to pass to the optimizer\n ", "__init__": "<function ActorCriticPolicy.__init__ at 0x79dd3027fce0>", "_get_constructor_parameters": "<function ActorCriticPolicy._get_constructor_parameters at 0x79dd3027fd80>", "reset_noise": "<function ActorCriticPolicy.reset_noise at 0x79dd3027fe20>", "_build_mlp_extractor": "<function ActorCriticPolicy._build_mlp_extractor at 0x79dd3027fec0>", "_build": "<function ActorCriticPolicy._build at 0x79dd3027ff60>", "forward": "<function ActorCriticPolicy.forward at 0x79dd30280040>", "extract_features": "<function ActorCriticPolicy.extract_features at 0x79dd302800e0>", "_get_action_dist_from_latent": "<function ActorCriticPolicy._get_action_dist_from_latent at 0x79dd30280180>", "_predict": "<function ActorCriticPolicy._predict at 0x79dd30280220>", "evaluate_actions": "<function ActorCriticPolicy.evaluate_actions at 0x79dd302802c0>", "get_distribution": "<function ActorCriticPolicy.get_distribution at 0x79dd30280360>", "predict_values": "<function ActorCriticPolicy.predict_values at 0x79dd30280400>", "__abstractmethods__": "frozenset()", "_abc_impl": "<_abc._abc_data object at 0x79dd303e7780>"}, "verbose": 1, "policy_kwargs": {}, "num_timesteps": 1507328, "_total_timesteps": 1500000, "_num_timesteps_at_start": 0, "seed": null, "action_noise": null, "start_time": 1765473389146329985, "learning_rate": 0.0003, "tensorboard_log": null, "_last_obs": {":type:": "<class 'numpy.ndarray'>", ":serialized:": "gAWVdgIAAAAAAACME251bXB5Ll9jb3JlLm51bWVyaWOUjAtfZnJvbWJ1ZmZlcpSTlCiWAAIAAAAAAACm/7K9gueQPui4oT50P8y+ocIePj+5HT4AAAAAAAAAAM0oUTzL7K8935JHvgV4Ub6Hs7i9MaLGPAAAAAAAAAAAM/nMPLs0qrwGokC8xIhzPe0bmz01ebW8AACAPwAAgD/mbSA9CCOfPZNnYL0/JVa+2c6HPLLKpTwAAAAAAAAAAACfQj1k3vQ+JuEEvYKDlL7q/gE9jk98OAAAAAAAAAAAM0epO08rWj336BG+V9SBvuyZNbzeEZy9AAAAAAAAAABtrkQ+DVn1Pp7Eg72d4qG+JtGGPfZHRj0AAAAAAAAAABqfST0VRTA/znaivUaDt75Zfek8QOUavQAAAAAAAAAAmtuYvMEy8T2pXwK9ooGMvjJgrTygj808AAAAAAAAAADtHAm+2xC1PzpoF7+taoW+ddIWvr2El74AAAAAAAAAAICY4r2h1bY946USPjmhlL7adWw9lpmJPAAAAAAAAAAAM7PevGxr1LuBHjE+K1zpO9YmJ72Wj9E8AACAPwAAgD/I1Ya+UPCJP0eYnr47ReO+Bs7EvsIBLr0AAAAAAAAAAEAQtL16bI8/ghKlvZHI574zth6+/UjavAAAAAAAAAAAsw+NvVs9bz/abrO9ZmHOvnrU/r0uOHq8AAAAAAAAAAAQxqE+VEVePwLtmb0M9ae+S7xqPrfGtr0AAAAAAAAAAJSMBW51bXB5lIwFZHR5cGWUk5SMAmY0lImIh5RSlChLA4wBPJROTk5K/////0r/////SwB0lGJLEEsIhpSMAUOUdJRSlC4="}, "_last_episode_starts": {":type:": "<class 'numpy.ndarray'>", ":serialized:": "gAWVhAAAAAAAAACME251bXB5Ll9jb3JlLm51bWVyaWOUjAtfZnJvbWJ1ZmZlcpSTlCiWEAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAlIwFbnVtcHmUjAVkdHlwZZSTlIwCYjGUiYiHlFKUKEsDjAF8lE5OTkr/////Sv////9LAHSUYksQhZSMAUOUdJRSlC4="}, "_last_original_obs": null, "_episode_num": 0, "use_sde": false, "sde_sample_freq": -1, "_current_progress_remaining": -0.004885333333333408, "_stats_window_size": 100, "ep_info_buffer": {":type:": "<class 'collections.deque'>", ":serialized:": "gAWVFQwAAAAAAACMC2NvbGxlY3Rpb25zlIwFZGVxdWWUk5QpS2SGlFKUKH2UKIwBcpRHQHEFle4TbnKMAWyUS+OMAXSUR0CYamL876pHdX2UKGgGR0Bxcvvx6OYIaAdL6mgIR0CYard5IH1OdX2UKGgGR0BzFQRSP2f1aAdNLwFoCEdAmGrWrfcesHV9lChoBkdAcdasOoYNzGgHTQMBaAhHQJhrIdU83dd1fZQoaAZHQHB8Ey+HrQhoB00rAWgIR0CYa4VEd/8VdX2UKGgGR0BwcwqAjIJaaAdNMwFoCEdAmGuS79Q40nV9lChoBkdAcQQmU4aP0mgHS/ZoCEdAmG3GUfPom3V9lChoBkdAcTpmtyPuHGgHS+VoCEdAmG4Mhs67unV9lChoBkdAcP3k9ECvHWgHTRMBaAhHQJhuWI1tO211fZQoaAZHQHGN3gP3BYVoB0vjaAhHQJhu7lRxcVx1fZQoaAZHQHCzEadc0LtoB0v0aAhHQJhvOnivPkd1fZQoaAZHQHEom8yvcJtoB00LAWgIR0CYb9Qw9JSSdX2UKGgGR0Bv+gsZpBX0aAdNFAFoCEdAmG//Qv6CUXV9lChoBkdAcS/xzaK1omgHS+1oCEdAmHAZSzgMt3V9lChoBkdAbp9ijL0SRWgHS+loCEdAmHCUtNBWxXV9lChoBkdAcCiMPSUkfWgHS/loCEdAmHCmPYFqz3V9lChoBkdAbbgDRtxdZGgHTQABaAhHQJhyM8r7O3V1fZQoaAZHQHAzWf5DZ15oB00SAWgIR0CYcjtPHktFdX2UKGgGR0BxKz9XLeQ/aAdNKAFoCEdAmHJ8/+sHSnV9lChoBkdAcEvxKg7HQ2gHTSUBaAhHQJhzPdoFmnR1fZQoaAZHQHIbrU1AJLNoB00dAmgIR0CYc8byH2ytdX2UKGgGR0BxSukTHsC1aAdNAwFoCEdAmHURTfixV3V9lChoBkdAcYoEg4ffXWgHS+NoCEdAmHV3qzJIUnV9lChoBkdAcptUvf0mMWgHS/9oCEdAmHX8CYCyQnV9lChoBkdAcmU9kBjnWGgHTTMBaAhHQJh2TbblA/t1fZQoaAZHQHI1V2aDwphoB0v0aAhHQJh22s6q8151fZQoaAZHQHGT5e/pMYdoB0v3aAhHQJh3NM7EHdJ1fZQoaAZHQHNU41k1/DtoB01RAWgIR0CYeFyd4FA3dX2UKGgGR0BxHTZmI0qIaAdNFwFoCEdAmHih8pkPMHV9lChoBkdAc2NoS+QEIWgHTR0BaAhHQJh5pgeA/cF1fZQoaAZHQG5X1vVEuxtoB00DAWgIR0CYerdhiLEUdX2UKGgGR0BvDuxY7q6faAdL+WgIR0CYerhBZ6lddX2UKGgGR0ByiIbZOBUaaAdNBwFoCEdAmHrjlxOtXHV9lChoBkdAbHWKF7D2rWgHS+xoCEdAmHwWe18b73V9lChoBkdAcXkkDZDiO2gHTQwBaAhHQJh8iZPVNHp1fZQoaAZHQHJ3AU1yeZpoB0vbaAhHQJh92PS2H+J1fZQoaAZHQHElczyjHn5oB0vnaAhHQJh+zI+4b0h1fZQoaAZHQG73KgyuZCxoB00GAWgIR0CYftxvNu+AdX2UKGgGR0BvxqKYRdyDaAdL6WgIR0CYki5P/JeWdX2UKGgGR0Bw2vXxvvSdaAdNAQFoCEdAmJKPyXlbNnV9lChoBkdAcFaQ79ycTmgHS+poCEdAmJOFWCEpRXV9lChoBkdAcejsLv1DjWgHTRABaAhHQJiTlGSZBs11fZQoaAZHQHAuB6v7m+1oB0v2aAhHQJiUojX4CZF1fZQoaAZHQG4jWhh6SkloB00jAWgIR0CYlPZbILgGdX2UKGgGR0BuY+38XN1RaAdL6WgIR0CYlRnUUfxMdX2UKGgGR0Bw0wDklu3uaAdNAAFoCEdAmJW6QJXyRXV9lChoBkdActhT3qRlpWgHTQsBaAhHQJiWJVWCEpR1fZQoaAZHQEpwSyMUAT9oB0vPaAhHQJiXbWxyGSJ1fZQoaAZHQHLzxzaK1ohoB00nAWgIR0CYl/MHKOktdX2UKGgGR0BxBc/iYLLIaAdNBwFoCEdAmJg/n0TURXV9lChoBkdAcsK3Sro4dmgHS/NoCEdAmJiDguRLb3V9lChoBkdAcMO72tdRi2gHTTgBaAhHQJiYzVPN3W51fZQoaAZHQGQ0VWCEpRZoB03oA2gIR0CYmachkiD/dX2UKGgGR0BwANSHdoFnaAdNAwFoCEdAmJnlqN6w+3V9lChoBkdAcaLWGATZhGgHTQ4BaAhHQJiZ5hx5s0p1fZQoaAZHQEy9G8VYZEVoB0vraAhHQJiaNnM+u/11fZQoaAZHQHLGc3uNPxhoB00BAWgIR0CYmrq0MPSVdX2UKGgGR0ByDFCUornUaAdL5WgIR0CYm0lTFVDKdX2UKGgGR0BxPrcYZVGTaAdNAwFoCEdAmJvdETg2qHV9lChoBkdAbhokTpPhymgHS+loCEdAmJw1TR6WxHV9lChoBkdAbvBRaX8fm2gHS9toCEdAmJxCFPBSDXV9lChoBkdAcWwSAYpDu2gHTSwBaAhHQJidUxVQyh11fZQoaAZHQHKzCyyD7IloB0vcaAhHQJidbLV4HHF1fZQoaAZHQHHTt+CsfaJoB0vtaAhHQJieggkka/B1fZQoaAZHQHBJQpF1B+poB0v9aAhHQJieuIdlum91fZQoaAZHQHDrPIbOu7poB00WAWgIR0CYoGOJ+DvmdX2UKGgGR0ByXUN4JNTMaAdL8WgIR0CYoIedTYNBdX2UKGgGR0BxjCqU/wAmaAdNKAFoCEdAmKCnXd0q6XV9lChoBkdAZkPr2QGOdWgHTegDaAhHQJihvaL4vex1fZQoaAZHQHDbx/qgRK9oB00bAWgIR0CYoc5jYqXodX2UKGgGR0By+GmelKsdaAdNJgFoCEdAmKHb5IpYtHV9lChoBkdAcxw0SRKYiWgHS9ZoCEdAmKHvu1F6RnV9lChoBkdAbjyK8cuJ12gHS/BoCEdAmKIdWdVebHV9lChoBkdAcO8XiBGx2WgHTQwBaAhHQJiiQrmQr+Z1fZQoaAZHQHFGYbn5i3JoB00qAWgIR0CYonqS5iEydX2UKGgGR0BwrsNQTEiuaAdL42gIR0CYo5gAp8WsdX2UKGgGR0Bw/+KdhAnlaAdL42gIR0CYo7JO32EkdX2UKGgGR0A5cRP420iRaAdLemgIR0CYo7fKp1ifdX2UKGgGR0BxTs+RoysTaAdNHQFoCEdAmKP3qmj0tnV9lChoBkdAbe8er+5vtWgHTSQBaAhHQJikFESdvsJ1fZQoaAZHQHLKjFZPl+5oB00CAWgIR0CYpUY/3WWhdX2UKGgGR0BxvZYigTRIaAdL/mgIR0CYpVmzByjpdX2UKGgGR0Bw/VFEy+HraAdL0mgIR0CYpY8a4tpVdX2UKGgGR0BxCGvmozeoaAdL7GgIR0CYpqTHKfWddX2UKGgGR0BzDUOlO45MaAdL2WgIR0CYqIiOearndX2UKGgGR0BwYF1dPci4aAdNBAFoCEdAmKkZNj9XLnV9lChoBkdAbYTFglWwNmgHS/FoCEdAmKkliz9jw3V9lChoBkdAc07p84Pwu2gHTRQBaAhHQJip5YFJQLx1fZQoaAZHQHJZIkVvddpoB00XAWgIR0CYql9bX6IndX2UKGgGR0BxYzkkrwvyaAdNKAFoCEdAmKqOUD+zdHV9lChoBkdAcN/lOoHcDmgHTSwBaAhHQJiq23b212J1fZQoaAZHQHNM4d+5OJtoB0vwaAhHQJirR13dKul1fZQoaAZHQG4TivPkaMtoB0v6aAhHQJirgIv8IiV1fZQoaAZHQHLutM0xdptoB0v1aAhHQJirgUFjd591fZQoaAZHQHN/zSLIgeRoB00CAWgIR0CYrGQxN7BwdX2UKGgGR0Bvwc+u/1xsaAdNHQFoCEdAmK0kfozN2XV9lChoBkdAcelEIgNgB2gHS/xoCEdAmK4zoMa0hXV9lChoBkdAcO55WRzRyGgHS/RoCEdAmK467EpAlnV9lChoBkdAb6RdAxBVuWgHTQMBaAhHQJiuTFUADJV1fZQoaAZHQHMPE/GEPDpoB0vqaAhHQJiuudZq20B1ZS4="}, "ep_success_buffer": {":type:": "<class 'collections.deque'>", ":serialized:": "gAWVIAAAAAAAAACMC2NvbGxlY3Rpb25zlIwFZGVxdWWUk5QpS2SGlFKULg=="}, "_n_updates": 368, "observation_space": {":type:": "<class 'gymnasium.spaces.box.Box'>", ":serialized:": "gAWVdwIAAAAAAACMFGd5bW5hc2l1bS5zcGFjZXMuYm94lIwDQm94lJOUKYGUfZQojAVkdHlwZZSMBW51bXB5lIwFZHR5cGWUk5SMAmY0lImIh5RSlChLA4wBPJROTk5K/////0r/////SwB0lGKMDWJvdW5kZWRfYmVsb3eUjBNudW1weS5fY29yZS5udW1lcmljlIwLX2Zyb21idWZmZXKUk5QolggAAAAAAAAAAQEBAQEBAQGUaAiMAmIxlImIh5RSlChLA4wBfJROTk5K/////0r/////SwB0lGJLCIWUjAFDlHSUUpSMDWJvdW5kZWRfYWJvdmWUaBEolggAAAAAAAAAAQEBAQEBAQGUaBVLCIWUaBl0lFKUjAZfc2hhcGWUSwiFlIwDbG93lGgRKJYgAAAAAAAAAAAAtMIAALTCAACgwAAAoMDbD0nAAACgwAAAAIAAAACAlGgLSwiFlGgZdJRSlIwEaGlnaJRoESiWIAAAAAAAAAAAALRCAAC0QgAAoEAAAKBA2w9JQAAAoEAAAIA/AACAP5RoC0sIhZRoGXSUUpSMCGxvd19yZXBylIxbWy05MC4gICAgICAgIC05MC4gICAgICAgICAtNS4gICAgICAgICAtNS4gICAgICAgICAtMy4xNDE1OTI3ICAtNS4KICAtMC4gICAgICAgICAtMC4gICAgICAgXZSMCWhpZ2hfcmVwcpSMU1s5MC4gICAgICAgIDkwLiAgICAgICAgIDUuICAgICAgICAgNS4gICAgICAgICAzLjE0MTU5MjcgIDUuCiAgMS4gICAgICAgICAxLiAgICAgICBdlIwKX25wX3JhbmRvbZROdWIu", "dtype": "float32", "bounded_below": "[ True True True True True True True True]", "bounded_above": "[ True True True True True True True True]", "_shape": [8], "low": "[-90. -90. -5. -5. -3.1415927 -5.\n -0. -0. ]", "high": "[90. 90. 5. 5. 3.1415927 5.\n 1. 1. ]", "low_repr": "[-90. -90. -5. -5. -3.1415927 -5.\n -0. -0. ]", "high_repr": "[90. 90. 5. 5. 3.1415927 5.\n 1. 1. ]", "_np_random": null}, "action_space": {":type:": "<class 'gymnasium.spaces.discrete.Discrete'>", ":serialized:": "gAWV3AAAAAAAAACMGWd5bW5hc2l1bS5zcGFjZXMuZGlzY3JldGWUjAhEaXNjcmV0ZZSTlCmBlH2UKIwBbpSMFm51bXB5Ll9jb3JlLm11bHRpYXJyYXmUjAZzY2FsYXKUk5SMBW51bXB5lIwFZHR5cGWUk5SMAmk4lImIh5RSlChLA4wBPJROTk5K/////0r/////SwB0lGJDCAQAAAAAAAAAlIaUUpSMBXN0YXJ0lGgIaA5DCAAAAAAAAAAAlIaUUpSMBl9zaGFwZZQpjAVkdHlwZZRoDowKX25wX3JhbmRvbZROdWIu", "n": "4", "start": "0", "_shape": [], "dtype": "int64", "_np_random": null}, "n_envs": 16, "n_steps": 1024, "gamma": 0.999, "gae_lambda": 0.98, "ent_coef": 0.01, "vf_coef": 0.5, "max_grad_norm": 0.5, "batch_size": 64, "n_epochs": 4, "clip_range": {":type:": "<class 'function'>", ":serialized:": "gAWV1gIAAAAAAACMF2Nsb3VkcGlja2xlLmNsb3VkcGlja2xllIwOX21ha2VfZnVuY3Rpb26Uk5QoaACMDV9idWlsdGluX3R5cGWUk5SMCENvZGVUeXBllIWUUpQoSwFLAEsASwFLAUsTQwiVAZcAiQFTAJROhZQpjAFflIWUjEkvdXNyL2xvY2FsL2xpYi9weXRob24zLjEyL2Rpc3QtcGFja2FnZXMvc3RhYmxlX2Jhc2VsaW5lczMvY29tbW9uL3V0aWxzLnB5lIwEZnVuY5SMGWNvbnN0YW50X2ZuLjxsb2NhbHM+LmZ1bmOUS4RDCPiAANgPEogKlEMAlIwDdmFslIWUKXSUUpR9lCiMC19fcGFja2FnZV9flIwYc3RhYmxlX2Jhc2VsaW5lczMuY29tbW9ulIwIX19uYW1lX1+UjB5zdGFibGVfYmFzZWxpbmVzMy5jb21tb24udXRpbHOUjAhfX2ZpbGVfX5SMSS91c3IvbG9jYWwvbGliL3B5dGhvbjMuMTIvZGlzdC1wYWNrYWdlcy9zdGFibGVfYmFzZWxpbmVzMy9jb21tb24vdXRpbHMucHmUdU5OaACMEF9tYWtlX2VtcHR5X2NlbGyUk5QpUpSFlHSUUpRoAIwSX2Z1bmN0aW9uX3NldHN0YXRllJOUaCF9lH2UKGgYjARmdW5jlIwMX19xdWFsbmFtZV9flIwZY29uc3RhbnRfZm4uPGxvY2Fscz4uZnVuY5SMD19fYW5ub3RhdGlvbnNfX5R9lIwOX19rd2RlZmF1bHRzX1+UTowMX19kZWZhdWx0c19flE6MCl9fbW9kdWxlX1+UaBmMB19fZG9jX1+UTowLX19jbG9zdXJlX1+UaACMCl9tYWtlX2NlbGyUk5RHP8mZmZmZmZqFlFKUhZSMF19jbG91ZHBpY2tsZV9zdWJtb2R1bGVzlF2UjAtfX2dsb2JhbHNfX5R9lHWGlIZSMC4="}, "clip_range_vf": null, "normalize_advantage": true, "target_kl": null, "lr_schedule": {":type:": "<class 'function'>", ":serialized:": "gAWV1gIAAAAAAACMF2Nsb3VkcGlja2xlLmNsb3VkcGlja2xllIwOX21ha2VfZnVuY3Rpb26Uk5QoaACMDV9idWlsdGluX3R5cGWUk5SMCENvZGVUeXBllIWUUpQoSwFLAEsASwFLAUsTQwiVAZcAiQFTAJROhZQpjAFflIWUjEkvdXNyL2xvY2FsL2xpYi9weXRob24zLjEyL2Rpc3QtcGFja2FnZXMvc3RhYmxlX2Jhc2VsaW5lczMvY29tbW9uL3V0aWxzLnB5lIwEZnVuY5SMGWNvbnN0YW50X2ZuLjxsb2NhbHM+LmZ1bmOUS4RDCPiAANgPEogKlEMAlIwDdmFslIWUKXSUUpR9lCiMC19fcGFja2FnZV9flIwYc3RhYmxlX2Jhc2VsaW5lczMuY29tbW9ulIwIX19uYW1lX1+UjB5zdGFibGVfYmFzZWxpbmVzMy5jb21tb24udXRpbHOUjAhfX2ZpbGVfX5SMSS91c3IvbG9jYWwvbGliL3B5dGhvbjMuMTIvZGlzdC1wYWNrYWdlcy9zdGFibGVfYmFzZWxpbmVzMy9jb21tb24vdXRpbHMucHmUdU5OaACMEF9tYWtlX2VtcHR5X2NlbGyUk5QpUpSFlHSUUpRoAIwSX2Z1bmN0aW9uX3NldHN0YXRllJOUaCF9lH2UKGgYjARmdW5jlIwMX19xdWFsbmFtZV9flIwZY29uc3RhbnRfZm4uPGxvY2Fscz4uZnVuY5SMD19fYW5ub3RhdGlvbnNfX5R9lIwOX19rd2RlZmF1bHRzX1+UTowMX19kZWZhdWx0c19flE6MCl9fbW9kdWxlX1+UaBmMB19fZG9jX1+UTowLX19jbG9zdXJlX1+UaACMCl9tYWtlX2NlbGyUk5RHPzOpKjBVMmGFlFKUhZSMF19jbG91ZHBpY2tsZV9zdWJtb2R1bGVzlF2UjAtfX2dsb2JhbHNfX5R9lHWGlIZSMC4="}, "system_info": {"OS": "Linux-6.6.105+-x86_64-with-glibc2.35 # 1 SMP Thu Oct 2 10:42:05 UTC 2025", "Python": "3.12.12", "Stable-Baselines3": "2.0.0a5", "PyTorch": "2.9.0+cu126", "GPU Enabled": "True", "Numpy": "2.0.2", "Cloudpickle": "3.1.2", "Gymnasium": "0.28.1", "OpenAI Gym": "0.25.2"}}
|
ppo-LunarLander-v2.zip
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
-
size
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:7e57cabf84425751b7860bd200819d976843ad957f124c809111b7ef6de5ff9e
|
| 3 |
+
size 149119
|
ppo-LunarLander-v2/data
CHANGED
|
@@ -4,46 +4,38 @@
|
|
| 4 |
":serialized:": "gAWVOwAAAAAAAACMIXN0YWJsZV9iYXNlbGluZXMzLmNvbW1vbi5wb2xpY2llc5SMEUFjdG9yQ3JpdGljUG9saWN5lJOULg==",
|
| 5 |
"__module__": "stable_baselines3.common.policies",
|
| 6 |
"__doc__": "\n Policy class for actor-critic algorithms (has both policy and value prediction).\n Used by A2C, PPO and the likes.\n\n :param observation_space: Observation space\n :param action_space: Action space\n :param lr_schedule: Learning rate schedule (could be constant)\n :param net_arch: The specification of the policy and value networks.\n :param activation_fn: Activation function\n :param ortho_init: Whether to use or not orthogonal initialization\n :param use_sde: Whether to use State Dependent Exploration or not\n :param log_std_init: Initial value for the log standard deviation\n :param full_std: Whether to use (n_features x n_actions) parameters\n for the std instead of only (n_features,) when using gSDE\n :param use_expln: Use ``expln()`` function instead of ``exp()`` to ensure\n a positive standard deviation (cf paper). It allows to keep variance\n above zero and prevent it from growing too fast. In practice, ``exp()`` is usually enough.\n :param squash_output: Whether to squash the output using a tanh function,\n this allows to ensure boundaries when using gSDE.\n :param features_extractor_class: Features extractor to use.\n :param features_extractor_kwargs: Keyword arguments\n to pass to the features extractor.\n :param share_features_extractor: If True, the features extractor is shared between the policy and value networks.\n :param normalize_images: Whether to normalize images or not,\n dividing by 255.0 (True by default)\n :param optimizer_class: The optimizer to use,\n ``th.optim.Adam`` by default\n :param optimizer_kwargs: Additional keyword arguments,\n excluding the learning rate, to pass to the optimizer\n ",
|
| 7 |
-
"__init__": "<function ActorCriticPolicy.__init__ at
|
| 8 |
-
"_get_constructor_parameters": "<function ActorCriticPolicy._get_constructor_parameters at
|
| 9 |
-
"reset_noise": "<function ActorCriticPolicy.reset_noise at
|
| 10 |
-
"_build_mlp_extractor": "<function ActorCriticPolicy._build_mlp_extractor at
|
| 11 |
-
"_build": "<function ActorCriticPolicy._build at
|
| 12 |
-
"forward": "<function ActorCriticPolicy.forward at
|
| 13 |
-
"extract_features": "<function ActorCriticPolicy.extract_features at
|
| 14 |
-
"_get_action_dist_from_latent": "<function ActorCriticPolicy._get_action_dist_from_latent at
|
| 15 |
-
"_predict": "<function ActorCriticPolicy._predict at
|
| 16 |
-
"evaluate_actions": "<function ActorCriticPolicy.evaluate_actions at
|
| 17 |
-
"get_distribution": "<function ActorCriticPolicy.get_distribution at
|
| 18 |
-
"predict_values": "<function ActorCriticPolicy.predict_values at
|
| 19 |
"__abstractmethods__": "frozenset()",
|
| 20 |
-
"_abc_impl": "<_abc._abc_data object at
|
| 21 |
},
|
| 22 |
"verbose": 1,
|
| 23 |
-
"policy_kwargs": {
|
| 24 |
-
"net_arch": [
|
| 25 |
-
256,
|
| 26 |
-
256
|
| 27 |
-
]
|
| 28 |
-
},
|
| 29 |
"num_timesteps": 1507328,
|
| 30 |
"_total_timesteps": 1500000,
|
| 31 |
"_num_timesteps_at_start": 0,
|
| 32 |
"seed": null,
|
| 33 |
"action_noise": null,
|
| 34 |
-
"start_time":
|
| 35 |
-
"learning_rate":
|
| 36 |
-
":type:": "<class 'function'>",
|
| 37 |
-
":serialized:": "gAWV+QEAAAAAAACMF2Nsb3VkcGlja2xlLmNsb3VkcGlja2xllIwOX21ha2VfZnVuY3Rpb26Uk5QoaACMDV9idWlsdGluX3R5cGWUk5SMCENvZGVUeXBllIWUUpQoSwFLAEsASwFLA0sDQxKXAGQBZAJ8AHoKAAB6BQAAUwCUTkc/Gjbi6xxDLUsBh5QpjAFflIWUjE4vdmFyL2ZvbGRlcnMva2wveTE3cGtxNG4zeHoycXk3YnZyYmRwaHFjMDAwMGduL1QvaXB5a2VybmVsXzU1NDM4LzM5Mzg1NjQwMjkucHmUjAg8bGFtYmRhPpRoDUsTQw6AAJhEoEGoAaFFmU6AAJRDAJQpKXSUUpR9lCiMC19fcGFja2FnZV9flE6MCF9fbmFtZV9flIwIX19tYWluX1+UdU5OTnSUUpRoAIwSX2Z1bmN0aW9uX3NldHN0YXRllJOUaBd9lH2UKGgUaA2MDF9fcXVhbG5hbWVfX5RoDYwPX19hbm5vdGF0aW9uc19flH2UjA5fX2t3ZGVmYXVsdHNfX5ROjAxfX2RlZmF1bHRzX1+UTowKX19tb2R1bGVfX5RoFYwHX19kb2NfX5ROjAtfX2Nsb3N1cmVfX5ROjBdfY2xvdWRwaWNrbGVfc3VibW9kdWxlc5RdlIwLX19nbG9iYWxzX1+UfZR1hpSGUjAu"
|
| 38 |
-
},
|
| 39 |
"tensorboard_log": null,
|
| 40 |
"_last_obs": {
|
| 41 |
":type:": "<class 'numpy.ndarray'>",
|
| 42 |
-
":serialized:": "
|
| 43 |
},
|
| 44 |
"_last_episode_starts": {
|
| 45 |
":type:": "<class 'numpy.ndarray'>",
|
| 46 |
-
":serialized:": "
|
| 47 |
},
|
| 48 |
"_last_original_obs": null,
|
| 49 |
"_episode_num": 0,
|
|
@@ -53,16 +45,16 @@
|
|
| 53 |
"_stats_window_size": 100,
|
| 54 |
"ep_info_buffer": {
|
| 55 |
":type:": "<class 'collections.deque'>",
|
| 56 |
-
":serialized:": "
|
| 57 |
},
|
| 58 |
"ep_success_buffer": {
|
| 59 |
":type:": "<class 'collections.deque'>",
|
| 60 |
":serialized:": "gAWVIAAAAAAAAACMC2NvbGxlY3Rpb25zlIwFZGVxdWWUk5QpS2SGlFKULg=="
|
| 61 |
},
|
| 62 |
-
"_n_updates":
|
| 63 |
"observation_space": {
|
| 64 |
":type:": "<class 'gymnasium.spaces.box.Box'>",
|
| 65 |
-
":serialized:": "
|
| 66 |
"dtype": "float32",
|
| 67 |
"bounded_below": "[ True True True True True True True True]",
|
| 68 |
"bounded_above": "[ True True True True True True True True]",
|
|
@@ -77,7 +69,7 @@
|
|
| 77 |
},
|
| 78 |
"action_space": {
|
| 79 |
":type:": "<class 'gymnasium.spaces.discrete.Discrete'>",
|
| 80 |
-
":serialized:": "
|
| 81 |
"n": "4",
|
| 82 |
"start": "0",
|
| 83 |
"_shape": [],
|
|
@@ -85,23 +77,23 @@
|
|
| 85 |
"_np_random": null
|
| 86 |
},
|
| 87 |
"n_envs": 16,
|
| 88 |
-
"n_steps":
|
| 89 |
-
"gamma": 0.
|
| 90 |
-
"gae_lambda": 0.
|
| 91 |
-
"ent_coef": 0.
|
| 92 |
"vf_coef": 0.5,
|
| 93 |
"max_grad_norm": 0.5,
|
| 94 |
"batch_size": 64,
|
| 95 |
-
"n_epochs":
|
| 96 |
"clip_range": {
|
| 97 |
":type:": "<class 'function'>",
|
| 98 |
-
":serialized:": "
|
| 99 |
},
|
| 100 |
"clip_range_vf": null,
|
| 101 |
"normalize_advantage": true,
|
| 102 |
"target_kl": null,
|
| 103 |
"lr_schedule": {
|
| 104 |
":type:": "<class 'function'>",
|
| 105 |
-
":serialized:": "
|
| 106 |
}
|
| 107 |
}
|
|
|
|
| 4 |
":serialized:": "gAWVOwAAAAAAAACMIXN0YWJsZV9iYXNlbGluZXMzLmNvbW1vbi5wb2xpY2llc5SMEUFjdG9yQ3JpdGljUG9saWN5lJOULg==",
|
| 5 |
"__module__": "stable_baselines3.common.policies",
|
| 6 |
"__doc__": "\n Policy class for actor-critic algorithms (has both policy and value prediction).\n Used by A2C, PPO and the likes.\n\n :param observation_space: Observation space\n :param action_space: Action space\n :param lr_schedule: Learning rate schedule (could be constant)\n :param net_arch: The specification of the policy and value networks.\n :param activation_fn: Activation function\n :param ortho_init: Whether to use or not orthogonal initialization\n :param use_sde: Whether to use State Dependent Exploration or not\n :param log_std_init: Initial value for the log standard deviation\n :param full_std: Whether to use (n_features x n_actions) parameters\n for the std instead of only (n_features,) when using gSDE\n :param use_expln: Use ``expln()`` function instead of ``exp()`` to ensure\n a positive standard deviation (cf paper). It allows to keep variance\n above zero and prevent it from growing too fast. In practice, ``exp()`` is usually enough.\n :param squash_output: Whether to squash the output using a tanh function,\n this allows to ensure boundaries when using gSDE.\n :param features_extractor_class: Features extractor to use.\n :param features_extractor_kwargs: Keyword arguments\n to pass to the features extractor.\n :param share_features_extractor: If True, the features extractor is shared between the policy and value networks.\n :param normalize_images: Whether to normalize images or not,\n dividing by 255.0 (True by default)\n :param optimizer_class: The optimizer to use,\n ``th.optim.Adam`` by default\n :param optimizer_kwargs: Additional keyword arguments,\n excluding the learning rate, to pass to the optimizer\n ",
|
| 7 |
+
"__init__": "<function ActorCriticPolicy.__init__ at 0x79dd3027fce0>",
|
| 8 |
+
"_get_constructor_parameters": "<function ActorCriticPolicy._get_constructor_parameters at 0x79dd3027fd80>",
|
| 9 |
+
"reset_noise": "<function ActorCriticPolicy.reset_noise at 0x79dd3027fe20>",
|
| 10 |
+
"_build_mlp_extractor": "<function ActorCriticPolicy._build_mlp_extractor at 0x79dd3027fec0>",
|
| 11 |
+
"_build": "<function ActorCriticPolicy._build at 0x79dd3027ff60>",
|
| 12 |
+
"forward": "<function ActorCriticPolicy.forward at 0x79dd30280040>",
|
| 13 |
+
"extract_features": "<function ActorCriticPolicy.extract_features at 0x79dd302800e0>",
|
| 14 |
+
"_get_action_dist_from_latent": "<function ActorCriticPolicy._get_action_dist_from_latent at 0x79dd30280180>",
|
| 15 |
+
"_predict": "<function ActorCriticPolicy._predict at 0x79dd30280220>",
|
| 16 |
+
"evaluate_actions": "<function ActorCriticPolicy.evaluate_actions at 0x79dd302802c0>",
|
| 17 |
+
"get_distribution": "<function ActorCriticPolicy.get_distribution at 0x79dd30280360>",
|
| 18 |
+
"predict_values": "<function ActorCriticPolicy.predict_values at 0x79dd30280400>",
|
| 19 |
"__abstractmethods__": "frozenset()",
|
| 20 |
+
"_abc_impl": "<_abc._abc_data object at 0x79dd303e7780>"
|
| 21 |
},
|
| 22 |
"verbose": 1,
|
| 23 |
+
"policy_kwargs": {},
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 24 |
"num_timesteps": 1507328,
|
| 25 |
"_total_timesteps": 1500000,
|
| 26 |
"_num_timesteps_at_start": 0,
|
| 27 |
"seed": null,
|
| 28 |
"action_noise": null,
|
| 29 |
+
"start_time": 1765473389146329985,
|
| 30 |
+
"learning_rate": 0.0003,
|
|
|
|
|
|
|
|
|
|
| 31 |
"tensorboard_log": null,
|
| 32 |
"_last_obs": {
|
| 33 |
":type:": "<class 'numpy.ndarray'>",
|
| 34 |
+
":serialized:": "gAWVdgIAAAAAAACME251bXB5Ll9jb3JlLm51bWVyaWOUjAtfZnJvbWJ1ZmZlcpSTlCiWAAIAAAAAAACm/7K9gueQPui4oT50P8y+ocIePj+5HT4AAAAAAAAAAM0oUTzL7K8935JHvgV4Ub6Hs7i9MaLGPAAAAAAAAAAAM/nMPLs0qrwGokC8xIhzPe0bmz01ebW8AACAPwAAgD/mbSA9CCOfPZNnYL0/JVa+2c6HPLLKpTwAAAAAAAAAAACfQj1k3vQ+JuEEvYKDlL7q/gE9jk98OAAAAAAAAAAAM0epO08rWj336BG+V9SBvuyZNbzeEZy9AAAAAAAAAABtrkQ+DVn1Pp7Eg72d4qG+JtGGPfZHRj0AAAAAAAAAABqfST0VRTA/znaivUaDt75Zfek8QOUavQAAAAAAAAAAmtuYvMEy8T2pXwK9ooGMvjJgrTygj808AAAAAAAAAADtHAm+2xC1PzpoF7+taoW+ddIWvr2El74AAAAAAAAAAICY4r2h1bY946USPjmhlL7adWw9lpmJPAAAAAAAAAAAM7PevGxr1LuBHjE+K1zpO9YmJ72Wj9E8AACAPwAAgD/I1Ya+UPCJP0eYnr47ReO+Bs7EvsIBLr0AAAAAAAAAAEAQtL16bI8/ghKlvZHI574zth6+/UjavAAAAAAAAAAAsw+NvVs9bz/abrO9ZmHOvnrU/r0uOHq8AAAAAAAAAAAQxqE+VEVePwLtmb0M9ae+S7xqPrfGtr0AAAAAAAAAAJSMBW51bXB5lIwFZHR5cGWUk5SMAmY0lImIh5RSlChLA4wBPJROTk5K/////0r/////SwB0lGJLEEsIhpSMAUOUdJRSlC4="
|
| 35 |
},
|
| 36 |
"_last_episode_starts": {
|
| 37 |
":type:": "<class 'numpy.ndarray'>",
|
| 38 |
+
":serialized:": "gAWVhAAAAAAAAACME251bXB5Ll9jb3JlLm51bWVyaWOUjAtfZnJvbWJ1ZmZlcpSTlCiWEAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAlIwFbnVtcHmUjAVkdHlwZZSTlIwCYjGUiYiHlFKUKEsDjAF8lE5OTkr/////Sv////9LAHSUYksQhZSMAUOUdJRSlC4="
|
| 39 |
},
|
| 40 |
"_last_original_obs": null,
|
| 41 |
"_episode_num": 0,
|
|
|
|
| 45 |
"_stats_window_size": 100,
|
| 46 |
"ep_info_buffer": {
|
| 47 |
":type:": "<class 'collections.deque'>",
|
| 48 |
+
":serialized:": "gAWVFQwAAAAAAACMC2NvbGxlY3Rpb25zlIwFZGVxdWWUk5QpS2SGlFKUKH2UKIwBcpRHQHEFle4TbnKMAWyUS+OMAXSUR0CYamL876pHdX2UKGgGR0Bxcvvx6OYIaAdL6mgIR0CYard5IH1OdX2UKGgGR0BzFQRSP2f1aAdNLwFoCEdAmGrWrfcesHV9lChoBkdAcdasOoYNzGgHTQMBaAhHQJhrIdU83dd1fZQoaAZHQHB8Ey+HrQhoB00rAWgIR0CYa4VEd/8VdX2UKGgGR0BwcwqAjIJaaAdNMwFoCEdAmGuS79Q40nV9lChoBkdAcQQmU4aP0mgHS/ZoCEdAmG3GUfPom3V9lChoBkdAcTpmtyPuHGgHS+VoCEdAmG4Mhs67unV9lChoBkdAcP3k9ECvHWgHTRMBaAhHQJhuWI1tO211fZQoaAZHQHGN3gP3BYVoB0vjaAhHQJhu7lRxcVx1fZQoaAZHQHCzEadc0LtoB0v0aAhHQJhvOnivPkd1fZQoaAZHQHEom8yvcJtoB00LAWgIR0CYb9Qw9JSSdX2UKGgGR0Bv+gsZpBX0aAdNFAFoCEdAmG//Qv6CUXV9lChoBkdAcS/xzaK1omgHS+1oCEdAmHAZSzgMt3V9lChoBkdAbp9ijL0SRWgHS+loCEdAmHCUtNBWxXV9lChoBkdAcCiMPSUkfWgHS/loCEdAmHCmPYFqz3V9lChoBkdAbbgDRtxdZGgHTQABaAhHQJhyM8r7O3V1fZQoaAZHQHAzWf5DZ15oB00SAWgIR0CYcjtPHktFdX2UKGgGR0BxKz9XLeQ/aAdNKAFoCEdAmHJ8/+sHSnV9lChoBkdAcEvxKg7HQ2gHTSUBaAhHQJhzPdoFmnR1fZQoaAZHQHIbrU1AJLNoB00dAmgIR0CYc8byH2ytdX2UKGgGR0BxSukTHsC1aAdNAwFoCEdAmHURTfixV3V9lChoBkdAcYoEg4ffXWgHS+NoCEdAmHV3qzJIUnV9lChoBkdAcptUvf0mMWgHS/9oCEdAmHX8CYCyQnV9lChoBkdAcmU9kBjnWGgHTTMBaAhHQJh2TbblA/t1fZQoaAZHQHI1V2aDwphoB0v0aAhHQJh22s6q8151fZQoaAZHQHGT5e/pMYdoB0v3aAhHQJh3NM7EHdJ1fZQoaAZHQHNU41k1/DtoB01RAWgIR0CYeFyd4FA3dX2UKGgGR0BxHTZmI0qIaAdNFwFoCEdAmHih8pkPMHV9lChoBkdAc2NoS+QEIWgHTR0BaAhHQJh5pgeA/cF1fZQoaAZHQG5X1vVEuxtoB00DAWgIR0CYerdhiLEUdX2UKGgGR0BvDuxY7q6faAdL+WgIR0CYerhBZ6lddX2UKGgGR0ByiIbZOBUaaAdNBwFoCEdAmHrjlxOtXHV9lChoBkdAbHWKF7D2rWgHS+xoCEdAmHwWe18b73V9lChoBkdAcXkkDZDiO2gHTQwBaAhHQJh8iZPVNHp1fZQoaAZHQHJ3AU1yeZpoB0vbaAhHQJh92PS2H+J1fZQoaAZHQHElczyjHn5oB0vnaAhHQJh+zI+4b0h1fZQoaAZHQG73KgyuZCxoB00GAWgIR0CYftxvNu+AdX2UKGgGR0BvxqKYRdyDaAdL6WgIR0CYki5P/JeWdX2UKGgGR0Bw2vXxvvSdaAdNAQFoCEdAmJKPyXlbNnV9lChoBkdAcFaQ79ycTmgHS+poCEdAmJOFWCEpRXV9lChoBkdAcejsLv1DjWgHTRABaAhHQJiTlGSZBs11fZQoaAZHQHAuB6v7m+1oB0v2aAhHQJiUojX4CZF1fZQoaAZHQG4jWhh6SkloB00jAWgIR0CYlPZbILgGdX2UKGgGR0BuY+38XN1RaAdL6WgIR0CYlRnUUfxMdX2UKGgGR0Bw0wDklu3uaAdNAAFoCEdAmJW6QJXyRXV9lChoBkdActhT3qRlpWgHTQsBaAhHQJiWJVWCEpR1fZQoaAZHQEpwSyMUAT9oB0vPaAhHQJiXbWxyGSJ1fZQoaAZHQHLzxzaK1ohoB00nAWgIR0CYl/MHKOktdX2UKGgGR0BxBc/iYLLIaAdNBwFoCEdAmJg/n0TURXV9lChoBkdAcsK3Sro4dmgHS/NoCEdAmJiDguRLb3V9lChoBkdAcMO72tdRi2gHTTgBaAhHQJiYzVPN3W51fZQoaAZHQGQ0VWCEpRZoB03oA2gIR0CYmachkiD/dX2UKGgGR0BwANSHdoFnaAdNAwFoCEdAmJnlqN6w+3V9lChoBkdAcaLWGATZhGgHTQ4BaAhHQJiZ5hx5s0p1fZQoaAZHQEy9G8VYZEVoB0vraAhHQJiaNnM+u/11fZQoaAZHQHLGc3uNPxhoB00BAWgIR0CYmrq0MPSVdX2UKGgGR0ByDFCUornUaAdL5WgIR0CYm0lTFVDKdX2UKGgGR0BxPrcYZVGTaAdNAwFoCEdAmJvdETg2qHV9lChoBkdAbhokTpPhymgHS+loCEdAmJw1TR6WxHV9lChoBkdAbvBRaX8fm2gHS9toCEdAmJxCFPBSDXV9lChoBkdAcWwSAYpDu2gHTSwBaAhHQJidUxVQyh11fZQoaAZHQHKzCyyD7IloB0vcaAhHQJidbLV4HHF1fZQoaAZHQHHTt+CsfaJoB0vtaAhHQJieggkka/B1fZQoaAZHQHBJQpF1B+poB0v9aAhHQJieuIdlum91fZQoaAZHQHDrPIbOu7poB00WAWgIR0CYoGOJ+DvmdX2UKGgGR0ByXUN4JNTMaAdL8WgIR0CYoIedTYNBdX2UKGgGR0BxjCqU/wAmaAdNKAFoCEdAmKCnXd0q6XV9lChoBkdAZkPr2QGOdWgHTegDaAhHQJihvaL4vex1fZQoaAZHQHDbx/qgRK9oB00bAWgIR0CYoc5jYqXodX2UKGgGR0By+GmelKsdaAdNJgFoCEdAmKHb5IpYtHV9lChoBkdAcxw0SRKYiWgHS9ZoCEdAmKHvu1F6RnV9lChoBkdAbjyK8cuJ12gHS/BoCEdAmKIdWdVebHV9lChoBkdAcO8XiBGx2WgHTQwBaAhHQJiiQrmQr+Z1fZQoaAZHQHFGYbn5i3JoB00qAWgIR0CYonqS5iEydX2UKGgGR0BwrsNQTEiuaAdL42gIR0CYo5gAp8WsdX2UKGgGR0Bw/+KdhAnlaAdL42gIR0CYo7JO32EkdX2UKGgGR0A5cRP420iRaAdLemgIR0CYo7fKp1ifdX2UKGgGR0BxTs+RoysTaAdNHQFoCEdAmKP3qmj0tnV9lChoBkdAbe8er+5vtWgHTSQBaAhHQJikFESdvsJ1fZQoaAZHQHLKjFZPl+5oB00CAWgIR0CYpUY/3WWhdX2UKGgGR0BxvZYigTRIaAdL/mgIR0CYpVmzByjpdX2UKGgGR0Bw/VFEy+HraAdL0mgIR0CYpY8a4tpVdX2UKGgGR0BxCGvmozeoaAdL7GgIR0CYpqTHKfWddX2UKGgGR0BzDUOlO45MaAdL2WgIR0CYqIiOearndX2UKGgGR0BwYF1dPci4aAdNBAFoCEdAmKkZNj9XLnV9lChoBkdAbYTFglWwNmgHS/FoCEdAmKkliz9jw3V9lChoBkdAc07p84Pwu2gHTRQBaAhHQJip5YFJQLx1fZQoaAZHQHJZIkVvddpoB00XAWgIR0CYql9bX6IndX2UKGgGR0BxYzkkrwvyaAdNKAFoCEdAmKqOUD+zdHV9lChoBkdAcN/lOoHcDmgHTSwBaAhHQJiq23b212J1fZQoaAZHQHNM4d+5OJtoB0vwaAhHQJirR13dKul1fZQoaAZHQG4TivPkaMtoB0v6aAhHQJirgIv8IiV1fZQoaAZHQHLutM0xdptoB0v1aAhHQJirgUFjd591fZQoaAZHQHN/zSLIgeRoB00CAWgIR0CYrGQxN7BwdX2UKGgGR0Bvwc+u/1xsaAdNHQFoCEdAmK0kfozN2XV9lChoBkdAcelEIgNgB2gHS/xoCEdAmK4zoMa0hXV9lChoBkdAcO55WRzRyGgHS/RoCEdAmK467EpAlnV9lChoBkdAb6RdAxBVuWgHTQMBaAhHQJiuTFUADJV1fZQoaAZHQHMPE/GEPDpoB0vqaAhHQJiuudZq20B1ZS4="
|
| 49 |
},
|
| 50 |
"ep_success_buffer": {
|
| 51 |
":type:": "<class 'collections.deque'>",
|
| 52 |
":serialized:": "gAWVIAAAAAAAAACMC2NvbGxlY3Rpb25zlIwFZGVxdWWUk5QpS2SGlFKULg=="
|
| 53 |
},
|
| 54 |
+
"_n_updates": 368,
|
| 55 |
"observation_space": {
|
| 56 |
":type:": "<class 'gymnasium.spaces.box.Box'>",
|
| 57 |
+
":serialized:": "gAWVdwIAAAAAAACMFGd5bW5hc2l1bS5zcGFjZXMuYm94lIwDQm94lJOUKYGUfZQojAVkdHlwZZSMBW51bXB5lIwFZHR5cGWUk5SMAmY0lImIh5RSlChLA4wBPJROTk5K/////0r/////SwB0lGKMDWJvdW5kZWRfYmVsb3eUjBNudW1weS5fY29yZS5udW1lcmljlIwLX2Zyb21idWZmZXKUk5QolggAAAAAAAAAAQEBAQEBAQGUaAiMAmIxlImIh5RSlChLA4wBfJROTk5K/////0r/////SwB0lGJLCIWUjAFDlHSUUpSMDWJvdW5kZWRfYWJvdmWUaBEolggAAAAAAAAAAQEBAQEBAQGUaBVLCIWUaBl0lFKUjAZfc2hhcGWUSwiFlIwDbG93lGgRKJYgAAAAAAAAAAAAtMIAALTCAACgwAAAoMDbD0nAAACgwAAAAIAAAACAlGgLSwiFlGgZdJRSlIwEaGlnaJRoESiWIAAAAAAAAAAAALRCAAC0QgAAoEAAAKBA2w9JQAAAoEAAAIA/AACAP5RoC0sIhZRoGXSUUpSMCGxvd19yZXBylIxbWy05MC4gICAgICAgIC05MC4gICAgICAgICAtNS4gICAgICAgICAtNS4gICAgICAgICAtMy4xNDE1OTI3ICAtNS4KICAtMC4gICAgICAgICAtMC4gICAgICAgXZSMCWhpZ2hfcmVwcpSMU1s5MC4gICAgICAgIDkwLiAgICAgICAgIDUuICAgICAgICAgNS4gICAgICAgICAzLjE0MTU5MjcgIDUuCiAgMS4gICAgICAgICAxLiAgICAgICBdlIwKX25wX3JhbmRvbZROdWIu",
|
| 58 |
"dtype": "float32",
|
| 59 |
"bounded_below": "[ True True True True True True True True]",
|
| 60 |
"bounded_above": "[ True True True True True True True True]",
|
|
|
|
| 69 |
},
|
| 70 |
"action_space": {
|
| 71 |
":type:": "<class 'gymnasium.spaces.discrete.Discrete'>",
|
| 72 |
+
":serialized:": "gAWV3AAAAAAAAACMGWd5bW5hc2l1bS5zcGFjZXMuZGlzY3JldGWUjAhEaXNjcmV0ZZSTlCmBlH2UKIwBbpSMFm51bXB5Ll9jb3JlLm11bHRpYXJyYXmUjAZzY2FsYXKUk5SMBW51bXB5lIwFZHR5cGWUk5SMAmk4lImIh5RSlChLA4wBPJROTk5K/////0r/////SwB0lGJDCAQAAAAAAAAAlIaUUpSMBXN0YXJ0lGgIaA5DCAAAAAAAAAAAlIaUUpSMBl9zaGFwZZQpjAVkdHlwZZRoDowKX25wX3JhbmRvbZROdWIu",
|
| 73 |
"n": "4",
|
| 74 |
"start": "0",
|
| 75 |
"_shape": [],
|
|
|
|
| 77 |
"_np_random": null
|
| 78 |
},
|
| 79 |
"n_envs": 16,
|
| 80 |
+
"n_steps": 1024,
|
| 81 |
+
"gamma": 0.999,
|
| 82 |
+
"gae_lambda": 0.98,
|
| 83 |
+
"ent_coef": 0.01,
|
| 84 |
"vf_coef": 0.5,
|
| 85 |
"max_grad_norm": 0.5,
|
| 86 |
"batch_size": 64,
|
| 87 |
+
"n_epochs": 4,
|
| 88 |
"clip_range": {
|
| 89 |
":type:": "<class 'function'>",
|
| 90 |
+
":serialized:": "gAWV1gIAAAAAAACMF2Nsb3VkcGlja2xlLmNsb3VkcGlja2xllIwOX21ha2VfZnVuY3Rpb26Uk5QoaACMDV9idWlsdGluX3R5cGWUk5SMCENvZGVUeXBllIWUUpQoSwFLAEsASwFLAUsTQwiVAZcAiQFTAJROhZQpjAFflIWUjEkvdXNyL2xvY2FsL2xpYi9weXRob24zLjEyL2Rpc3QtcGFja2FnZXMvc3RhYmxlX2Jhc2VsaW5lczMvY29tbW9uL3V0aWxzLnB5lIwEZnVuY5SMGWNvbnN0YW50X2ZuLjxsb2NhbHM+LmZ1bmOUS4RDCPiAANgPEogKlEMAlIwDdmFslIWUKXSUUpR9lCiMC19fcGFja2FnZV9flIwYc3RhYmxlX2Jhc2VsaW5lczMuY29tbW9ulIwIX19uYW1lX1+UjB5zdGFibGVfYmFzZWxpbmVzMy5jb21tb24udXRpbHOUjAhfX2ZpbGVfX5SMSS91c3IvbG9jYWwvbGliL3B5dGhvbjMuMTIvZGlzdC1wYWNrYWdlcy9zdGFibGVfYmFzZWxpbmVzMy9jb21tb24vdXRpbHMucHmUdU5OaACMEF9tYWtlX2VtcHR5X2NlbGyUk5QpUpSFlHSUUpRoAIwSX2Z1bmN0aW9uX3NldHN0YXRllJOUaCF9lH2UKGgYjARmdW5jlIwMX19xdWFsbmFtZV9flIwZY29uc3RhbnRfZm4uPGxvY2Fscz4uZnVuY5SMD19fYW5ub3RhdGlvbnNfX5R9lIwOX19rd2RlZmF1bHRzX1+UTowMX19kZWZhdWx0c19flE6MCl9fbW9kdWxlX1+UaBmMB19fZG9jX1+UTowLX19jbG9zdXJlX1+UaACMCl9tYWtlX2NlbGyUk5RHP8mZmZmZmZqFlFKUhZSMF19jbG91ZHBpY2tsZV9zdWJtb2R1bGVzlF2UjAtfX2dsb2JhbHNfX5R9lHWGlIZSMC4="
|
| 91 |
},
|
| 92 |
"clip_range_vf": null,
|
| 93 |
"normalize_advantage": true,
|
| 94 |
"target_kl": null,
|
| 95 |
"lr_schedule": {
|
| 96 |
":type:": "<class 'function'>",
|
| 97 |
+
":serialized:": "gAWV1gIAAAAAAACMF2Nsb3VkcGlja2xlLmNsb3VkcGlja2xllIwOX21ha2VfZnVuY3Rpb26Uk5QoaACMDV9idWlsdGluX3R5cGWUk5SMCENvZGVUeXBllIWUUpQoSwFLAEsASwFLAUsTQwiVAZcAiQFTAJROhZQpjAFflIWUjEkvdXNyL2xvY2FsL2xpYi9weXRob24zLjEyL2Rpc3QtcGFja2FnZXMvc3RhYmxlX2Jhc2VsaW5lczMvY29tbW9uL3V0aWxzLnB5lIwEZnVuY5SMGWNvbnN0YW50X2ZuLjxsb2NhbHM+LmZ1bmOUS4RDCPiAANgPEogKlEMAlIwDdmFslIWUKXSUUpR9lCiMC19fcGFja2FnZV9flIwYc3RhYmxlX2Jhc2VsaW5lczMuY29tbW9ulIwIX19uYW1lX1+UjB5zdGFibGVfYmFzZWxpbmVzMy5jb21tb24udXRpbHOUjAhfX2ZpbGVfX5SMSS91c3IvbG9jYWwvbGliL3B5dGhvbjMuMTIvZGlzdC1wYWNrYWdlcy9zdGFibGVfYmFzZWxpbmVzMy9jb21tb24vdXRpbHMucHmUdU5OaACMEF9tYWtlX2VtcHR5X2NlbGyUk5QpUpSFlHSUUpRoAIwSX2Z1bmN0aW9uX3NldHN0YXRllJOUaCF9lH2UKGgYjARmdW5jlIwMX19xdWFsbmFtZV9flIwZY29uc3RhbnRfZm4uPGxvY2Fscz4uZnVuY5SMD19fYW5ub3RhdGlvbnNfX5R9lIwOX19rd2RlZmF1bHRzX1+UTowMX19kZWZhdWx0c19flE6MCl9fbW9kdWxlX1+UaBmMB19fZG9jX1+UTowLX19jbG9zdXJlX1+UaACMCl9tYWtlX2NlbGyUk5RHPzOpKjBVMmGFlFKUhZSMF19jbG91ZHBpY2tsZV9zdWJtb2R1bGVzlF2UjAtfX2dsb2JhbHNfX5R9lHWGlIZSMC4="
|
| 98 |
}
|
| 99 |
}
|
ppo-LunarLander-v2/policy.optimizer.pth
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
-
size
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:e5a8b82a91cf3cdfe41aeafecbe0fc52038e1a3592406ead2b06fc4885244e91
|
| 3 |
+
size 88695
|
ppo-LunarLander-v2/policy.pth
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
-
size
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:3b4220b30a703513238096fd1a75956ba205314d4dfe112638d0e2a007aeb647
|
| 3 |
+
size 44095
|
ppo-LunarLander-v2/pytorch_variables.pth
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 1261
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:07c7431cf6005e7d8f367d79e995f63e2f9b981a37e3437b795d058f9af4308b
|
| 3 |
size 1261
|
ppo-LunarLander-v2/system_info.txt
CHANGED
|
@@ -1,9 +1,9 @@
|
|
| 1 |
-
- OS:
|
| 2 |
-
- Python: 3.12.
|
| 3 |
- Stable-Baselines3: 2.0.0a5
|
| 4 |
-
- PyTorch: 2.
|
| 5 |
-
- GPU Enabled:
|
| 6 |
-
- Numpy:
|
| 7 |
-
- Cloudpickle: 3.
|
| 8 |
- Gymnasium: 0.28.1
|
| 9 |
-
- OpenAI Gym: 0.
|
|
|
|
| 1 |
+
- OS: Linux-6.6.105+-x86_64-with-glibc2.35 # 1 SMP Thu Oct 2 10:42:05 UTC 2025
|
| 2 |
+
- Python: 3.12.12
|
| 3 |
- Stable-Baselines3: 2.0.0a5
|
| 4 |
+
- PyTorch: 2.9.0+cu126
|
| 5 |
+
- GPU Enabled: True
|
| 6 |
+
- Numpy: 2.0.2
|
| 7 |
+
- Cloudpickle: 3.1.2
|
| 8 |
- Gymnasium: 0.28.1
|
| 9 |
+
- OpenAI Gym: 0.25.2
|
replay.mp4
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
-
size
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:33c60f47cb8fc1d053f797569ccf8f41ced461123b4fa2a7becac136d21804f7
|
| 3 |
+
size 147427
|
results.json
CHANGED
|
@@ -1 +1 @@
|
|
| 1 |
-
{"mean_reward":
|
|
|
|
| 1 |
+
{"mean_reward": 275.7800392308601, "std_reward": 17.288160639183115, "is_deterministic": true, "n_eval_episodes": 10, "eval_datetime": "2025-12-11T17:42:51.775045"}
|