metapat973 commited on
Commit
6e1b18a
·
verified ·
1 Parent(s): c06605c

Upload PPO LunarLander-v2 trained agent

Browse files
README.md CHANGED
@@ -16,7 +16,7 @@ model-index:
16
  type: LunarLander-v2
17
  metrics:
18
  - type: mean_reward
19
- value: 209.82 +/- 73.31
20
  name: mean_reward
21
  verified: false
22
  ---
 
16
  type: LunarLander-v2
17
  metrics:
18
  - type: mean_reward
19
+ value: 275.78 +/- 17.29
20
  name: mean_reward
21
  verified: false
22
  ---
config.json CHANGED
@@ -1 +1 @@
1
- {"policy_class": {":type:": "<class 'abc.ABCMeta'>", ":serialized:": "gAWVOwAAAAAAAACMIXN0YWJsZV9iYXNlbGluZXMzLmNvbW1vbi5wb2xpY2llc5SMEUFjdG9yQ3JpdGljUG9saWN5lJOULg==", "__module__": "stable_baselines3.common.policies", "__doc__": "\n Policy class for actor-critic algorithms (has both policy and value prediction).\n Used by A2C, PPO and the likes.\n\n :param observation_space: Observation space\n :param action_space: Action space\n :param lr_schedule: Learning rate schedule (could be constant)\n :param net_arch: The specification of the policy and value networks.\n :param activation_fn: Activation function\n :param ortho_init: Whether to use or not orthogonal initialization\n :param use_sde: Whether to use State Dependent Exploration or not\n :param log_std_init: Initial value for the log standard deviation\n :param full_std: Whether to use (n_features x n_actions) parameters\n for the std instead of only (n_features,) when using gSDE\n :param use_expln: Use ``expln()`` function instead of ``exp()`` to ensure\n a positive standard deviation (cf paper). It allows to keep variance\n above zero and prevent it from growing too fast. In practice, ``exp()`` is usually enough.\n :param squash_output: Whether to squash the output using a tanh function,\n this allows to ensure boundaries when using gSDE.\n :param features_extractor_class: Features extractor to use.\n :param features_extractor_kwargs: Keyword arguments\n to pass to the features extractor.\n :param share_features_extractor: If True, the features extractor is shared between the policy and value networks.\n :param normalize_images: Whether to normalize images or not,\n dividing by 255.0 (True by default)\n :param optimizer_class: The optimizer to use,\n ``th.optim.Adam`` by default\n :param optimizer_kwargs: Additional keyword arguments,\n excluding the learning rate, to pass to the optimizer\n ", "__init__": "<function ActorCriticPolicy.__init__ at 0x37cc609a0>", "_get_constructor_parameters": "<function ActorCriticPolicy._get_constructor_parameters at 0x37cc60a40>", "reset_noise": "<function ActorCriticPolicy.reset_noise at 0x37cc60ae0>", "_build_mlp_extractor": "<function ActorCriticPolicy._build_mlp_extractor at 0x37cc60b80>", "_build": "<function ActorCriticPolicy._build at 0x37cc60c20>", "forward": "<function ActorCriticPolicy.forward at 0x37cc60cc0>", "extract_features": "<function ActorCriticPolicy.extract_features at 0x37cc60d60>", "_get_action_dist_from_latent": "<function ActorCriticPolicy._get_action_dist_from_latent at 0x37cc60e00>", "_predict": "<function ActorCriticPolicy._predict at 0x37cc60ea0>", "evaluate_actions": "<function ActorCriticPolicy.evaluate_actions at 0x37cc60f40>", "get_distribution": "<function ActorCriticPolicy.get_distribution at 0x37cc60fe0>", "predict_values": "<function ActorCriticPolicy.predict_values at 0x37cc61080>", "__abstractmethods__": "frozenset()", "_abc_impl": "<_abc._abc_data object at 0x37cafad00>"}, "verbose": 1, "policy_kwargs": {"net_arch": [256, 256]}, "num_timesteps": 1507328, "_total_timesteps": 1500000, "_num_timesteps_at_start": 0, "seed": null, "action_noise": null, "start_time": 1765036791869687000, "learning_rate": {":type:": "<class 'function'>", ":serialized:": "gAWV+QEAAAAAAACMF2Nsb3VkcGlja2xlLmNsb3VkcGlja2xllIwOX21ha2VfZnVuY3Rpb26Uk5QoaACMDV9idWlsdGluX3R5cGWUk5SMCENvZGVUeXBllIWUUpQoSwFLAEsASwFLA0sDQxKXAGQBZAJ8AHoKAAB6BQAAUwCUTkc/Gjbi6xxDLUsBh5QpjAFflIWUjE4vdmFyL2ZvbGRlcnMva2wveTE3cGtxNG4zeHoycXk3YnZyYmRwaHFjMDAwMGduL1QvaXB5a2VybmVsXzU1NDM4LzM5Mzg1NjQwMjkucHmUjAg8bGFtYmRhPpRoDUsTQw6AAJhEoEGoAaFFmU6AAJRDAJQpKXSUUpR9lCiMC19fcGFja2FnZV9flE6MCF9fbmFtZV9flIwIX19tYWluX1+UdU5OTnSUUpRoAIwSX2Z1bmN0aW9uX3NldHN0YXRllJOUaBd9lH2UKGgUaA2MDF9fcXVhbG5hbWVfX5RoDYwPX19hbm5vdGF0aW9uc19flH2UjA5fX2t3ZGVmYXVsdHNfX5ROjAxfX2RlZmF1bHRzX1+UTowKX19tb2R1bGVfX5RoFYwHX19kb2NfX5ROjAtfX2Nsb3N1cmVfX5ROjBdfY2xvdWRwaWNrbGVfc3VibW9kdWxlc5RdlIwLX19nbG9iYWxzX1+UfZR1hpSGUjAu"}, "tensorboard_log": null, "_last_obs": {":type:": "<class 'numpy.ndarray'>", ":serialized:": "gAWVdQIAAAAAAACMEm51bXB5LmNvcmUubnVtZXJpY5SMC19mcm9tYnVmZmVylJOUKJYAAgAAAAAAADP+KL5XzGo/eMy6vWmtT75vQQK+cYGUPQAAAAAAAAAAzYyYuVJc9rvYCkK+rvpLu97JRz2ryd89AACAPwAAgD/gjSa+wSdNP7oMnL3DuZi+lmawvedJJL0AAAAAAAAAAIA7r70DTHI9mVWiPu/qK76afBA9ttolvQAAAAAAAAAAps7FvaQKMzybEWE9y5A1vpRBdL2AcT09AAAAAAAAAACalfy7ycUDPguVjT5BzDK+BAV1PdPEbD0AAAAAAAAAAA13mD2S4h0/ZfgTvjIRhb4F/WK86L6JvQAAAAAAAAAAM6tIPa+ApT4gD0s8NhBbvvIte7v4xf86AAAAAAAAAADNeLq9Roo0P+bCEb5itZ++WknMvTZ0GTwAAAAAAAAAAADYpzwc1Vi8bdvBOylotjw217m9efiSPQAAgD8AAIA/c4qqvfbkV7pW6T49sKcDNuaZzToIF/g0AAAAAAAAAADqrV6+4/MMP6D35zzaaW++2I6svTHliz0AAAAAAAAAANDBmj59a5o/XkO2PkeXur7vCng+inIevgAAAAAAAAAATYg/vRLa8jwe6cY8Zz1Zvu2KETyYu2S9AAAAAAAAAAAAfnu8i++vP6oavb5ZkeO+xJTPO0YqB70AAAAAAAAAANKenL4ROkg/JhLOvYYFtb6RCSy+phBfPQAAAAAAAAAAlIwFbnVtcHmUjAVkdHlwZZSTlIwCZjSUiYiHlFKUKEsDjAE8lE5OTkr/////Sv////9LAHSUYksQSwiGlIwBQ5R0lFKULg=="}, "_last_episode_starts": {":type:": "<class 'numpy.ndarray'>", ":serialized:": "gAWVgwAAAAAAAACMEm51bXB5LmNvcmUubnVtZXJpY5SMC19mcm9tYnVmZmVylJOUKJYQAAAAAAAAAAAAAAAAAAAAAAAAAAAAAACUjAVudW1weZSMBWR0eXBllJOUjAJiMZSJiIeUUpQoSwOMAXyUTk5OSv////9K/////0sAdJRiSxCFlIwBQ5R0lFKULg=="}, "_last_original_obs": null, "_episode_num": 0, "use_sde": false, "sde_sample_freq": -1, "_current_progress_remaining": -0.004885333333333408, "_stats_window_size": 100, "ep_info_buffer": {":type:": "<class 'collections.deque'>", ":serialized:": "gAWVQAwAAAAAAACMC2NvbGxlY3Rpb25zlIwFZGVxdWWUk5QpS2SGlFKUKH2UKIwBcpRHQG6Ibs4T9KqMAWyUTU4BjAF0lEdAire2H1vl2nV9lChoBkdAcXcEdeY2KmgHTRkBaAhHQIq4Wn4wh4d1fZQoaAZHQGxXFQ2uPmxoB00oAWgIR0CKuKj/uLJkdX2UKGgGR0AoVhWo3rD7aAdL82gIR0CKuecx0uDjdX2UKGgGR0Bw6hQGfPHDaAdNVQFoCEdAirsgTZg5R3V9lChoBkdAbIGNI9TxXmgHTToBaAhHQIq8bo0Q9Rt1fZQoaAZHQG15srNGEwpoB00lAWgIR0CKvRWo3rD7dX2UKGgGR0BvQ0fcN6PbaAdNDgFoCEdAir0ebNKRMnV9lChoBkdAcnQa72+PBGgHTTIBaAhHQIq9XJYDDCR1fZQoaAZHQG4fPrWy1NRoB003AWgIR0CKvdz+WGATdX2UKGgGR0Bx62ePJaJRaAdNQwFoCEdAir6MiB5HE3V9lChoBkdAcUEiiZfD12gHTTABaAhHQIq+rSqlxfh1fZQoaAZHQG8h6uOjqOdoB00iAWgIR0CKvyCROk+HdX2UKGgGR0Bx+m65Gz8haAdNIQFoCEdAir+FRP420nV9lChoBkdAcb0HxjJ+2GgHTT8BaAhHQIrA4Wi1y/91fZQoaAZHQHDLtyYG+sZoB004AWgIR0CKwUydnTRZdX2UKGgGR0Bu6zTWoWHlaAdNNwFoCEdAisJRmbsniXV9lChoBkdAcM9+ERJ2+2gHTU0BaAhHQIrCpEWqLjx1fZQoaAZHQCJUTBZZB9loB0vpaAhHQIrDpnDiwSt1fZQoaAZHQESwe8PFvQ5oB0veaAhHQIrD1ELH+611fZQoaAZHQHBKc+qzZ6FoB01AAWgIR0CKxArhisnzdX2UKGgGR0BwVdRFZxJeaAdNPwFoCEdAisU3+dbxE3V9lChoBkdAbnzRl6JIlWgHTSkBaAhHQIrGV6Vt4zJ1fZQoaAZHQHD/b4Ju2qloB002AWgIR0CKx7pRoAXEdX2UKGgGR0Budz2g3974aAdNJAFoCEdAisfn4fwI+nV9lChoBkdAcS5de6ZpjGgHTV0BaAhHQIrIfcFhXsB1fZQoaAZHQHEKfoA4n4RoB00lAWgIR0CKyIzoEB8ydX2UKGgGR0BryXtx+8XfaAdNJAFoCEdAisjpwsGxEHV9lChoBkdAbs/OKO1fFGgHTVsBaAhHQIrJvYBeXzF1fZQoaAZHQG4XVQ66reZoB00rAWgIR0CKyoElE7W/dX2UKGgGR0BxbG2d/axpaAdNKQFoCEdAisraLfk3j3V9lChoBkdAbct5M10knmgHTRkBaAhHQIrLYFiay8l1fZQoaAZHQHHLZRXOnl5oB01FAWgIR0CKzRDNyHVPdX2UKGgGR0Bx6cM9bHIZaAdNHQFoCEdAis0/s3Q2M3V9lChoBkdAb/6+VTrE+GgHTS8BaAhHQIrNbIT4+KV1fZQoaAZHQHBlqubI91VoB005AWgIR0CKze2FWXC1dX2UKGgGR0BwpNRQ79ycaAdNNAFoCEdAis9IBJZntnV9lChoBkdAbmJa/RE4N2gHTTYBaAhHQIrQhid8Rcx1fZQoaAZHQGzUJ4B3iaRoB00fAWgIR0CK0P9Wp6yCdX2UKGgGR0BvgNEgGKQ8aAdNEAFoCEdAitFAXEZR9HV9lChoBkdAcbVfEn9ehWgHTQsBaAhHQIrRg/xDst11fZQoaAZHQG9m02tMfzVoB00wAWgIR0CK0kgoPTXrdX2UKGgGR0Bw03lmvnr6aAdNTAFoCEdAitKLtmcvunV9lChoBkdAcYQlRxcVxmgHTSoBaAhHQIrTS/Efkmx1fZQoaAZHQGBxoqLCN0hoB03oA2gIR0CK1FVQyhzvdX2UKGgGR0BwRQWKuSwGaAdNLAFoCEdAitUKJEYwZnV9lChoBkdAcHG+WGATZmgHTRQBaAhHQIrWLPIGQjl1fZQoaAZHQHFBOyquKXRoB01vAWgIR0CK1pwFTvRadX2UKGgGR0BxJToePq9oaAdNGQFoCEdAitb7y6MBIXV9lChoBkdAcbnlruYx+WgHTUsBaAhHQIrXr15B1Ld1fZQoaAZHQHIY6VdHDrJoB01VAWgIR0CK2FVFQVKxdX2UKGgGR0BwgnFtKqXGaAdNFAFoCEdAitnQ04zabnV9lChoBkdAckNtShrWRWgHTVgBaAhHQIraTfLs8gZ1fZQoaAZHQG5X181Gb1BoB00bAWgIR0CK2l3225QQdX2UKGgGR0BvlSkEcKgJaAdNMwFoCEdAitqeiSJTEXV9lChoBkdAbrtQqqfe12gHTUQBaAhHQIrau4G2TgV1fZQoaAZHQHBxpzPrv9doB00mAWgIR0CK22UO/cnFdX2UKGgGR0BxjUtvn8sMaAdNNAFoCEdAitwMMAmzB3V9lChoBkdAcW3PLPldT2gHTQEBaAhHQIrcS4SYgJV1fZQoaAZHQG9Jgntv4udoB002AWgIR0CK3MwTufEodX2UKGgGR0BwVqAqd6LPaAdNLAFoCEdAit4jr7fpEHV9lChoBkdAccBpbD/EO2gHTSoBaAhHQIrfKx5cC5p1fZQoaAZHQG5PFQMx46hoB00nAWgIR0CK3/Bt1p0wdX2UKGgGR0BwvZHz6JqJaAdNSgFoCEdAiuC37+DODHV9lChoBkdAcML3ljmSyWgHTTQBaAhHQIrhN6LOzIF1fZQoaAZHQG3Krh73PAxoB00oAWgIR0CK4YXuVopQdX2UKGgGR0ByQoYAKfFraAdNLwFoCEdAiuPr0J4SpXV9lChoBkdAcd6TUiILxGgHS/doCEdAiuQLiuMdcXV9lChoBkdAa2WsIVuaW2gHTTABaAhHQIrkbhNucc51fZQoaAZHQG4UG9xp+MJoB01DAWgIR0CK5J+TeO4odX2UKGgGR0ByBHY287IUaAdNVwFoCEdAiuTT/IbOvHV9lChoBkdAcDagMc6vJWgHTUQBaAhHQIrk+0ojOcF1fZQoaAZHQHFFo9kjHGVoB009AWgIR0CK5Zkd3jdYdX2UKGgGR0BwSmWE9MbnaAdNEwFoCEdAiuXV89fTkXV9lChoBkdAbXv1ZkkKNWgHTUIBaAhHQIrmpjhDPWx1fZQoaAZHQHDYrnTy8SRoB00gAWgIR0CK559zfaYedX2UKGgGR0Br6aufVZs9aAdNNgFoCEdAiulyeRPoFHV9lChoBkdAXaU5OrQw9WgHTegDaAhHQIrqXn8sMAp1fZQoaAZHQHB3S/O+qR5oB00xAWgIR0CK6tdrwe/6dX2UKGgGR0ByW62rn1WbaAdNUwFoCEdAius4FA3T/nV9lChoBkdAa/TBTn7pFGgHTSgBaAhHQIrrS1y/9Hd1fZQoaAZHQHGmugxrSE1oB00yAWgIR0CK61Jo0ygxdX2UKGgGR0Bu9WZ5Rjz7aAdNGgFoCEdAiuzhPCVKPHV9lChoBkdAcDnvAGjbjGgHTSwBaAhHQIruJI1+AmR1fZQoaAZHQHCphjawljVoB00UAWgIR0CK7jIyTINmdX2UKGgGR0Bx8uEg4ffXaAdNPwFoCEdAiu5hg/keZHV9lChoBkdAcdEVh1DBuWgHTToBaAhHQIrutJjDsMR1fZQoaAZHQG/6nUlRgqpoB003AWgIR0CK73P0I1LrdX2UKGgGR0ByA7VRUFSsaAdNZAFoCEdAiu+aVMVUM3V9lChoBkdAbTadTYNAkmgHTSgBaAhHQIrvzl3hXKd1fZQoaAZHQHG3fZElVtJoB00lAWgIR0CK8IgxJul5dX2UKGgGR0Bxm3jhky1vaAdNoAFoCEdAivCiosI3SHV9lChoBkdAcKgDIikftGgHTR4BaAhHQIryxOWSlnB1fZQoaAZHQG8aL/82rGRoB01AAWgIR0CK8wbz9S/CdX2UKGgGR0BuJEwvg3tKaAdNGwFoCEdAivODTBqKxnV9lChoBkdAcC4GMXJo02gHTSgBaAhHQIr0BJ2+wkh1fZQoaAZHQHE8CgPEsJ9oB009AWgIR0CK9DBvaURndX2UKGgGR0BwIolXzUZvaAdNSAFoCEdAivTsnJDE33V9lChoBkdAbFsf0VafSWgHTRIBaAhHQIr09pZfUnZ1fZQoaAZHQG/FJFCswL5oB00YAWgIR0CK9obS7Xg+dWUu"}, "ep_success_buffer": {":type:": "<class 'collections.deque'>", ":serialized:": "gAWVIAAAAAAAAACMC2NvbGxlY3Rpb25zlIwFZGVxdWWUk5QpS2SGlFKULg=="}, "_n_updates": 460, "observation_space": {":type:": "<class 'gymnasium.spaces.box.Box'>", ":serialized:": "gAWVdgIAAAAAAACMFGd5bW5hc2l1bS5zcGFjZXMuYm94lIwDQm94lJOUKYGUfZQojAVkdHlwZZSMBW51bXB5lIwFZHR5cGWUk5SMAmY0lImIh5RSlChLA4wBPJROTk5K/////0r/////SwB0lGKMDWJvdW5kZWRfYmVsb3eUjBJudW1weS5jb3JlLm51bWVyaWOUjAtfZnJvbWJ1ZmZlcpSTlCiWCAAAAAAAAAABAQEBAQEBAZRoCIwCYjGUiYiHlFKUKEsDjAF8lE5OTkr/////Sv////9LAHSUYksIhZSMAUOUdJRSlIwNYm91bmRlZF9hYm92ZZRoESiWCAAAAAAAAAABAQEBAQEBAZRoFUsIhZRoGXSUUpSMBl9zaGFwZZRLCIWUjANsb3eUaBEoliAAAAAAAAAAAAC0wgAAtMIAAKDAAACgwNsPScAAAKDAAAAAgAAAAICUaAtLCIWUaBl0lFKUjARoaWdolGgRKJYgAAAAAAAAAAAAtEIAALRCAACgQAAAoEDbD0lAAACgQAAAgD8AAIA/lGgLSwiFlGgZdJRSlIwIbG93X3JlcHKUjFtbLTkwLiAgICAgICAgLTkwLiAgICAgICAgIC01LiAgICAgICAgIC01LiAgICAgICAgIC0zLjE0MTU5MjcgIC01LgogIC0wLiAgICAgICAgIC0wLiAgICAgICBdlIwJaGlnaF9yZXBylIxTWzkwLiAgICAgICAgOTAuICAgICAgICAgNS4gICAgICAgICA1LiAgICAgICAgIDMuMTQxNTkyNyAgNS4KICAxLiAgICAgICAgIDEuICAgICAgIF2UjApfbnBfcmFuZG9tlE51Yi4=", "dtype": "float32", "bounded_below": "[ True True True True True True True True]", "bounded_above": "[ True True True True True True True True]", "_shape": [8], "low": "[-90. -90. -5. -5. -3.1415927 -5.\n -0. -0. ]", "high": "[90. 90. 5. 5. 3.1415927 5.\n 1. 1. ]", "low_repr": "[-90. -90. -5. -5. -3.1415927 -5.\n -0. -0. ]", "high_repr": "[90. 90. 5. 5. 3.1415927 5.\n 1. 1. ]", "_np_random": null}, "action_space": {":type:": "<class 'gymnasium.spaces.discrete.Discrete'>", ":serialized:": "gAWV2wAAAAAAAACMGWd5bW5hc2l1bS5zcGFjZXMuZGlzY3JldGWUjAhEaXNjcmV0ZZSTlCmBlH2UKIwBbpSMFW51bXB5LmNvcmUubXVsdGlhcnJheZSMBnNjYWxhcpSTlIwFbnVtcHmUjAVkdHlwZZSTlIwCaTiUiYiHlFKUKEsDjAE8lE5OTkr/////Sv////9LAHSUYkMIBAAAAAAAAACUhpRSlIwFc3RhcnSUaAhoDkMIAAAAAAAAAACUhpRSlIwGX3NoYXBllCmMBWR0eXBllGgOjApfbnBfcmFuZG9tlE51Yi4=", "n": "4", "start": "0", "_shape": [], "dtype": "int64", "_np_random": null}, "n_envs": 16, "n_steps": 2048, "gamma": 0.99, "gae_lambda": 0.97, "ent_coef": 0.0005, "vf_coef": 0.5, "max_grad_norm": 0.5, "batch_size": 64, "n_epochs": 10, "clip_range": {":type:": "<class 'function'>", ":serialized:": "gAWVvwIAAAAAAACMF2Nsb3VkcGlja2xlLmNsb3VkcGlja2xllIwOX21ha2VfZnVuY3Rpb26Uk5QoaACMDV9idWlsdGluX3R5cGWUk5SMCENvZGVUeXBllIWUUpQoSwFLAEsASwFLAUsTQwiVAZcAiQFTAJROhZQpjAFflIWUjE0vb3B0L2FuYWNvbmRhMy9saWIvcHl0aG9uMy4xMi9zaXRlLXBhY2thZ2VzL3N0YWJsZV9iYXNlbGluZXMzL2NvbW1vbi91dGlscy5weZSMBGZ1bmOUjBljb25zdGFudF9mbi48bG9jYWxzPi5mdW5jlEuEQwj4gADYDxKICpRDAJSMA3ZhbJSFlCl0lFKUfZQojAtfX3BhY2thZ2VfX5SMGHN0YWJsZV9iYXNlbGluZXMzLmNvbW1vbpSMCF9fbmFtZV9flIwec3RhYmxlX2Jhc2VsaW5lczMuY29tbW9uLnV0aWxzlIwIX19maWxlX1+UjE0vb3B0L2FuYWNvbmRhMy9saWIvcHl0aG9uMy4xMi9zaXRlLXBhY2thZ2VzL3N0YWJsZV9iYXNlbGluZXMzL2NvbW1vbi91dGlscy5weZR1Tk5oAIwQX21ha2VfZW1wdHlfY2VsbJSTlClSlIWUdJRSlGgAjBJfZnVuY3Rpb25fc2V0c3RhdGWUk5RoIX2UfZQoaBhoDYwMX19xdWFsbmFtZV9flGgOjA9fX2Fubm90YXRpb25zX1+UfZSMDl9fa3dkZWZhdWx0c19flE6MDF9fZGVmYXVsdHNfX5ROjApfX21vZHVsZV9flGgZjAdfX2RvY19flE6MC19fY2xvc3VyZV9flGgAjApfbWFrZV9jZWxslJOURz/JmZmZmZmahZRSlIWUjBdfY2xvdWRwaWNrbGVfc3VibW9kdWxlc5RdlIwLX19nbG9iYWxzX1+UfZR1hpSGUjAu"}, "clip_range_vf": null, "normalize_advantage": true, "target_kl": null, "lr_schedule": {":type:": "<class 'function'>", ":serialized:": "gAWV+QEAAAAAAACMF2Nsb3VkcGlja2xlLmNsb3VkcGlja2xllIwOX21ha2VfZnVuY3Rpb26Uk5QoaACMDV9idWlsdGluX3R5cGWUk5SMCENvZGVUeXBllIWUUpQoSwFLAEsASwFLA0sDQxKXAGQBZAJ8AHoKAAB6BQAAUwCUTkc/Gjbi6xxDLUsBh5QpjAFflIWUjE4vdmFyL2ZvbGRlcnMva2wveTE3cGtxNG4zeHoycXk3YnZyYmRwaHFjMDAwMGduL1QvaXB5a2VybmVsXzU1NDM4LzM5Mzg1NjQwMjkucHmUjAg8bGFtYmRhPpRoDUsTQw6AAJhEoEGoAaFFmU6AAJRDAJQpKXSUUpR9lCiMC19fcGFja2FnZV9flE6MCF9fbmFtZV9flIwIX19tYWluX1+UdU5OTnSUUpRoAIwSX2Z1bmN0aW9uX3NldHN0YXRllJOUaBd9lH2UKGgUaA2MDF9fcXVhbG5hbWVfX5RoDYwPX19hbm5vdGF0aW9uc19flH2UjA5fX2t3ZGVmYXVsdHNfX5ROjAxfX2RlZmF1bHRzX1+UTowKX19tb2R1bGVfX5RoFYwHX19kb2NfX5ROjAtfX2Nsb3N1cmVfX5ROjBdfY2xvdWRwaWNrbGVfc3VibW9kdWxlc5RdlIwLX19nbG9iYWxzX1+UfZR1hpSGUjAu"}, "system_info": {"OS": "macOS-15.6.1-arm64-arm-64bit Darwin Kernel Version 24.6.0: Mon Jul 14 11:30:40 PDT 2025; root:xnu-11417.140.69~1/RELEASE_ARM64_T6041", "Python": "3.12.2", "Stable-Baselines3": "2.0.0a5", "PyTorch": "2.7.0", "GPU Enabled": "False", "Numpy": "1.26.4", "Cloudpickle": "3.0.0", "Gymnasium": "0.28.1", "OpenAI Gym": "0.26.2"}}
 
1
+ {"policy_class": {":type:": "<class 'abc.ABCMeta'>", ":serialized:": "gAWVOwAAAAAAAACMIXN0YWJsZV9iYXNlbGluZXMzLmNvbW1vbi5wb2xpY2llc5SMEUFjdG9yQ3JpdGljUG9saWN5lJOULg==", "__module__": "stable_baselines3.common.policies", "__doc__": "\n Policy class for actor-critic algorithms (has both policy and value prediction).\n Used by A2C, PPO and the likes.\n\n :param observation_space: Observation space\n :param action_space: Action space\n :param lr_schedule: Learning rate schedule (could be constant)\n :param net_arch: The specification of the policy and value networks.\n :param activation_fn: Activation function\n :param ortho_init: Whether to use or not orthogonal initialization\n :param use_sde: Whether to use State Dependent Exploration or not\n :param log_std_init: Initial value for the log standard deviation\n :param full_std: Whether to use (n_features x n_actions) parameters\n for the std instead of only (n_features,) when using gSDE\n :param use_expln: Use ``expln()`` function instead of ``exp()`` to ensure\n a positive standard deviation (cf paper). It allows to keep variance\n above zero and prevent it from growing too fast. In practice, ``exp()`` is usually enough.\n :param squash_output: Whether to squash the output using a tanh function,\n this allows to ensure boundaries when using gSDE.\n :param features_extractor_class: Features extractor to use.\n :param features_extractor_kwargs: Keyword arguments\n to pass to the features extractor.\n :param share_features_extractor: If True, the features extractor is shared between the policy and value networks.\n :param normalize_images: Whether to normalize images or not,\n dividing by 255.0 (True by default)\n :param optimizer_class: The optimizer to use,\n ``th.optim.Adam`` by default\n :param optimizer_kwargs: Additional keyword arguments,\n excluding the learning rate, to pass to the optimizer\n ", "__init__": "<function ActorCriticPolicy.__init__ at 0x79dd3027fce0>", "_get_constructor_parameters": "<function ActorCriticPolicy._get_constructor_parameters at 0x79dd3027fd80>", "reset_noise": "<function ActorCriticPolicy.reset_noise at 0x79dd3027fe20>", "_build_mlp_extractor": "<function ActorCriticPolicy._build_mlp_extractor at 0x79dd3027fec0>", "_build": "<function ActorCriticPolicy._build at 0x79dd3027ff60>", "forward": "<function ActorCriticPolicy.forward at 0x79dd30280040>", "extract_features": "<function ActorCriticPolicy.extract_features at 0x79dd302800e0>", "_get_action_dist_from_latent": "<function ActorCriticPolicy._get_action_dist_from_latent at 0x79dd30280180>", "_predict": "<function ActorCriticPolicy._predict at 0x79dd30280220>", "evaluate_actions": "<function ActorCriticPolicy.evaluate_actions at 0x79dd302802c0>", "get_distribution": "<function ActorCriticPolicy.get_distribution at 0x79dd30280360>", "predict_values": "<function ActorCriticPolicy.predict_values at 0x79dd30280400>", "__abstractmethods__": "frozenset()", "_abc_impl": "<_abc._abc_data object at 0x79dd303e7780>"}, "verbose": 1, "policy_kwargs": {}, "num_timesteps": 1507328, "_total_timesteps": 1500000, "_num_timesteps_at_start": 0, "seed": null, "action_noise": null, "start_time": 1765473389146329985, "learning_rate": 0.0003, "tensorboard_log": null, "_last_obs": {":type:": "<class 'numpy.ndarray'>", ":serialized:": "gAWVdgIAAAAAAACME251bXB5Ll9jb3JlLm51bWVyaWOUjAtfZnJvbWJ1ZmZlcpSTlCiWAAIAAAAAAACm/7K9gueQPui4oT50P8y+ocIePj+5HT4AAAAAAAAAAM0oUTzL7K8935JHvgV4Ub6Hs7i9MaLGPAAAAAAAAAAAM/nMPLs0qrwGokC8xIhzPe0bmz01ebW8AACAPwAAgD/mbSA9CCOfPZNnYL0/JVa+2c6HPLLKpTwAAAAAAAAAAACfQj1k3vQ+JuEEvYKDlL7q/gE9jk98OAAAAAAAAAAAM0epO08rWj336BG+V9SBvuyZNbzeEZy9AAAAAAAAAABtrkQ+DVn1Pp7Eg72d4qG+JtGGPfZHRj0AAAAAAAAAABqfST0VRTA/znaivUaDt75Zfek8QOUavQAAAAAAAAAAmtuYvMEy8T2pXwK9ooGMvjJgrTygj808AAAAAAAAAADtHAm+2xC1PzpoF7+taoW+ddIWvr2El74AAAAAAAAAAICY4r2h1bY946USPjmhlL7adWw9lpmJPAAAAAAAAAAAM7PevGxr1LuBHjE+K1zpO9YmJ72Wj9E8AACAPwAAgD/I1Ya+UPCJP0eYnr47ReO+Bs7EvsIBLr0AAAAAAAAAAEAQtL16bI8/ghKlvZHI574zth6+/UjavAAAAAAAAAAAsw+NvVs9bz/abrO9ZmHOvnrU/r0uOHq8AAAAAAAAAAAQxqE+VEVePwLtmb0M9ae+S7xqPrfGtr0AAAAAAAAAAJSMBW51bXB5lIwFZHR5cGWUk5SMAmY0lImIh5RSlChLA4wBPJROTk5K/////0r/////SwB0lGJLEEsIhpSMAUOUdJRSlC4="}, "_last_episode_starts": {":type:": "<class 'numpy.ndarray'>", ":serialized:": "gAWVhAAAAAAAAACME251bXB5Ll9jb3JlLm51bWVyaWOUjAtfZnJvbWJ1ZmZlcpSTlCiWEAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAlIwFbnVtcHmUjAVkdHlwZZSTlIwCYjGUiYiHlFKUKEsDjAF8lE5OTkr/////Sv////9LAHSUYksQhZSMAUOUdJRSlC4="}, "_last_original_obs": null, "_episode_num": 0, "use_sde": false, "sde_sample_freq": -1, "_current_progress_remaining": -0.004885333333333408, "_stats_window_size": 100, "ep_info_buffer": {":type:": "<class 'collections.deque'>", ":serialized:": "gAWVFQwAAAAAAACMC2NvbGxlY3Rpb25zlIwFZGVxdWWUk5QpS2SGlFKUKH2UKIwBcpRHQHEFle4TbnKMAWyUS+OMAXSUR0CYamL876pHdX2UKGgGR0Bxcvvx6OYIaAdL6mgIR0CYard5IH1OdX2UKGgGR0BzFQRSP2f1aAdNLwFoCEdAmGrWrfcesHV9lChoBkdAcdasOoYNzGgHTQMBaAhHQJhrIdU83dd1fZQoaAZHQHB8Ey+HrQhoB00rAWgIR0CYa4VEd/8VdX2UKGgGR0BwcwqAjIJaaAdNMwFoCEdAmGuS79Q40nV9lChoBkdAcQQmU4aP0mgHS/ZoCEdAmG3GUfPom3V9lChoBkdAcTpmtyPuHGgHS+VoCEdAmG4Mhs67unV9lChoBkdAcP3k9ECvHWgHTRMBaAhHQJhuWI1tO211fZQoaAZHQHGN3gP3BYVoB0vjaAhHQJhu7lRxcVx1fZQoaAZHQHCzEadc0LtoB0v0aAhHQJhvOnivPkd1fZQoaAZHQHEom8yvcJtoB00LAWgIR0CYb9Qw9JSSdX2UKGgGR0Bv+gsZpBX0aAdNFAFoCEdAmG//Qv6CUXV9lChoBkdAcS/xzaK1omgHS+1oCEdAmHAZSzgMt3V9lChoBkdAbp9ijL0SRWgHS+loCEdAmHCUtNBWxXV9lChoBkdAcCiMPSUkfWgHS/loCEdAmHCmPYFqz3V9lChoBkdAbbgDRtxdZGgHTQABaAhHQJhyM8r7O3V1fZQoaAZHQHAzWf5DZ15oB00SAWgIR0CYcjtPHktFdX2UKGgGR0BxKz9XLeQ/aAdNKAFoCEdAmHJ8/+sHSnV9lChoBkdAcEvxKg7HQ2gHTSUBaAhHQJhzPdoFmnR1fZQoaAZHQHIbrU1AJLNoB00dAmgIR0CYc8byH2ytdX2UKGgGR0BxSukTHsC1aAdNAwFoCEdAmHURTfixV3V9lChoBkdAcYoEg4ffXWgHS+NoCEdAmHV3qzJIUnV9lChoBkdAcptUvf0mMWgHS/9oCEdAmHX8CYCyQnV9lChoBkdAcmU9kBjnWGgHTTMBaAhHQJh2TbblA/t1fZQoaAZHQHI1V2aDwphoB0v0aAhHQJh22s6q8151fZQoaAZHQHGT5e/pMYdoB0v3aAhHQJh3NM7EHdJ1fZQoaAZHQHNU41k1/DtoB01RAWgIR0CYeFyd4FA3dX2UKGgGR0BxHTZmI0qIaAdNFwFoCEdAmHih8pkPMHV9lChoBkdAc2NoS+QEIWgHTR0BaAhHQJh5pgeA/cF1fZQoaAZHQG5X1vVEuxtoB00DAWgIR0CYerdhiLEUdX2UKGgGR0BvDuxY7q6faAdL+WgIR0CYerhBZ6lddX2UKGgGR0ByiIbZOBUaaAdNBwFoCEdAmHrjlxOtXHV9lChoBkdAbHWKF7D2rWgHS+xoCEdAmHwWe18b73V9lChoBkdAcXkkDZDiO2gHTQwBaAhHQJh8iZPVNHp1fZQoaAZHQHJ3AU1yeZpoB0vbaAhHQJh92PS2H+J1fZQoaAZHQHElczyjHn5oB0vnaAhHQJh+zI+4b0h1fZQoaAZHQG73KgyuZCxoB00GAWgIR0CYftxvNu+AdX2UKGgGR0BvxqKYRdyDaAdL6WgIR0CYki5P/JeWdX2UKGgGR0Bw2vXxvvSdaAdNAQFoCEdAmJKPyXlbNnV9lChoBkdAcFaQ79ycTmgHS+poCEdAmJOFWCEpRXV9lChoBkdAcejsLv1DjWgHTRABaAhHQJiTlGSZBs11fZQoaAZHQHAuB6v7m+1oB0v2aAhHQJiUojX4CZF1fZQoaAZHQG4jWhh6SkloB00jAWgIR0CYlPZbILgGdX2UKGgGR0BuY+38XN1RaAdL6WgIR0CYlRnUUfxMdX2UKGgGR0Bw0wDklu3uaAdNAAFoCEdAmJW6QJXyRXV9lChoBkdActhT3qRlpWgHTQsBaAhHQJiWJVWCEpR1fZQoaAZHQEpwSyMUAT9oB0vPaAhHQJiXbWxyGSJ1fZQoaAZHQHLzxzaK1ohoB00nAWgIR0CYl/MHKOktdX2UKGgGR0BxBc/iYLLIaAdNBwFoCEdAmJg/n0TURXV9lChoBkdAcsK3Sro4dmgHS/NoCEdAmJiDguRLb3V9lChoBkdAcMO72tdRi2gHTTgBaAhHQJiYzVPN3W51fZQoaAZHQGQ0VWCEpRZoB03oA2gIR0CYmachkiD/dX2UKGgGR0BwANSHdoFnaAdNAwFoCEdAmJnlqN6w+3V9lChoBkdAcaLWGATZhGgHTQ4BaAhHQJiZ5hx5s0p1fZQoaAZHQEy9G8VYZEVoB0vraAhHQJiaNnM+u/11fZQoaAZHQHLGc3uNPxhoB00BAWgIR0CYmrq0MPSVdX2UKGgGR0ByDFCUornUaAdL5WgIR0CYm0lTFVDKdX2UKGgGR0BxPrcYZVGTaAdNAwFoCEdAmJvdETg2qHV9lChoBkdAbhokTpPhymgHS+loCEdAmJw1TR6WxHV9lChoBkdAbvBRaX8fm2gHS9toCEdAmJxCFPBSDXV9lChoBkdAcWwSAYpDu2gHTSwBaAhHQJidUxVQyh11fZQoaAZHQHKzCyyD7IloB0vcaAhHQJidbLV4HHF1fZQoaAZHQHHTt+CsfaJoB0vtaAhHQJieggkka/B1fZQoaAZHQHBJQpF1B+poB0v9aAhHQJieuIdlum91fZQoaAZHQHDrPIbOu7poB00WAWgIR0CYoGOJ+DvmdX2UKGgGR0ByXUN4JNTMaAdL8WgIR0CYoIedTYNBdX2UKGgGR0BxjCqU/wAmaAdNKAFoCEdAmKCnXd0q6XV9lChoBkdAZkPr2QGOdWgHTegDaAhHQJihvaL4vex1fZQoaAZHQHDbx/qgRK9oB00bAWgIR0CYoc5jYqXodX2UKGgGR0By+GmelKsdaAdNJgFoCEdAmKHb5IpYtHV9lChoBkdAcxw0SRKYiWgHS9ZoCEdAmKHvu1F6RnV9lChoBkdAbjyK8cuJ12gHS/BoCEdAmKIdWdVebHV9lChoBkdAcO8XiBGx2WgHTQwBaAhHQJiiQrmQr+Z1fZQoaAZHQHFGYbn5i3JoB00qAWgIR0CYonqS5iEydX2UKGgGR0BwrsNQTEiuaAdL42gIR0CYo5gAp8WsdX2UKGgGR0Bw/+KdhAnlaAdL42gIR0CYo7JO32EkdX2UKGgGR0A5cRP420iRaAdLemgIR0CYo7fKp1ifdX2UKGgGR0BxTs+RoysTaAdNHQFoCEdAmKP3qmj0tnV9lChoBkdAbe8er+5vtWgHTSQBaAhHQJikFESdvsJ1fZQoaAZHQHLKjFZPl+5oB00CAWgIR0CYpUY/3WWhdX2UKGgGR0BxvZYigTRIaAdL/mgIR0CYpVmzByjpdX2UKGgGR0Bw/VFEy+HraAdL0mgIR0CYpY8a4tpVdX2UKGgGR0BxCGvmozeoaAdL7GgIR0CYpqTHKfWddX2UKGgGR0BzDUOlO45MaAdL2WgIR0CYqIiOearndX2UKGgGR0BwYF1dPci4aAdNBAFoCEdAmKkZNj9XLnV9lChoBkdAbYTFglWwNmgHS/FoCEdAmKkliz9jw3V9lChoBkdAc07p84Pwu2gHTRQBaAhHQJip5YFJQLx1fZQoaAZHQHJZIkVvddpoB00XAWgIR0CYql9bX6IndX2UKGgGR0BxYzkkrwvyaAdNKAFoCEdAmKqOUD+zdHV9lChoBkdAcN/lOoHcDmgHTSwBaAhHQJiq23b212J1fZQoaAZHQHNM4d+5OJtoB0vwaAhHQJirR13dKul1fZQoaAZHQG4TivPkaMtoB0v6aAhHQJirgIv8IiV1fZQoaAZHQHLutM0xdptoB0v1aAhHQJirgUFjd591fZQoaAZHQHN/zSLIgeRoB00CAWgIR0CYrGQxN7BwdX2UKGgGR0Bvwc+u/1xsaAdNHQFoCEdAmK0kfozN2XV9lChoBkdAcelEIgNgB2gHS/xoCEdAmK4zoMa0hXV9lChoBkdAcO55WRzRyGgHS/RoCEdAmK467EpAlnV9lChoBkdAb6RdAxBVuWgHTQMBaAhHQJiuTFUADJV1fZQoaAZHQHMPE/GEPDpoB0vqaAhHQJiuudZq20B1ZS4="}, "ep_success_buffer": {":type:": "<class 'collections.deque'>", ":serialized:": "gAWVIAAAAAAAAACMC2NvbGxlY3Rpb25zlIwFZGVxdWWUk5QpS2SGlFKULg=="}, "_n_updates": 368, "observation_space": {":type:": "<class 'gymnasium.spaces.box.Box'>", ":serialized:": "gAWVdwIAAAAAAACMFGd5bW5hc2l1bS5zcGFjZXMuYm94lIwDQm94lJOUKYGUfZQojAVkdHlwZZSMBW51bXB5lIwFZHR5cGWUk5SMAmY0lImIh5RSlChLA4wBPJROTk5K/////0r/////SwB0lGKMDWJvdW5kZWRfYmVsb3eUjBNudW1weS5fY29yZS5udW1lcmljlIwLX2Zyb21idWZmZXKUk5QolggAAAAAAAAAAQEBAQEBAQGUaAiMAmIxlImIh5RSlChLA4wBfJROTk5K/////0r/////SwB0lGJLCIWUjAFDlHSUUpSMDWJvdW5kZWRfYWJvdmWUaBEolggAAAAAAAAAAQEBAQEBAQGUaBVLCIWUaBl0lFKUjAZfc2hhcGWUSwiFlIwDbG93lGgRKJYgAAAAAAAAAAAAtMIAALTCAACgwAAAoMDbD0nAAACgwAAAAIAAAACAlGgLSwiFlGgZdJRSlIwEaGlnaJRoESiWIAAAAAAAAAAAALRCAAC0QgAAoEAAAKBA2w9JQAAAoEAAAIA/AACAP5RoC0sIhZRoGXSUUpSMCGxvd19yZXBylIxbWy05MC4gICAgICAgIC05MC4gICAgICAgICAtNS4gICAgICAgICAtNS4gICAgICAgICAtMy4xNDE1OTI3ICAtNS4KICAtMC4gICAgICAgICAtMC4gICAgICAgXZSMCWhpZ2hfcmVwcpSMU1s5MC4gICAgICAgIDkwLiAgICAgICAgIDUuICAgICAgICAgNS4gICAgICAgICAzLjE0MTU5MjcgIDUuCiAgMS4gICAgICAgICAxLiAgICAgICBdlIwKX25wX3JhbmRvbZROdWIu", "dtype": "float32", "bounded_below": "[ True True True True True True True True]", "bounded_above": "[ True True True True True True True True]", "_shape": [8], "low": "[-90. -90. -5. -5. -3.1415927 -5.\n -0. -0. ]", "high": "[90. 90. 5. 5. 3.1415927 5.\n 1. 1. ]", "low_repr": "[-90. -90. -5. -5. -3.1415927 -5.\n -0. -0. ]", "high_repr": "[90. 90. 5. 5. 3.1415927 5.\n 1. 1. ]", "_np_random": null}, "action_space": {":type:": "<class 'gymnasium.spaces.discrete.Discrete'>", ":serialized:": "gAWV3AAAAAAAAACMGWd5bW5hc2l1bS5zcGFjZXMuZGlzY3JldGWUjAhEaXNjcmV0ZZSTlCmBlH2UKIwBbpSMFm51bXB5Ll9jb3JlLm11bHRpYXJyYXmUjAZzY2FsYXKUk5SMBW51bXB5lIwFZHR5cGWUk5SMAmk4lImIh5RSlChLA4wBPJROTk5K/////0r/////SwB0lGJDCAQAAAAAAAAAlIaUUpSMBXN0YXJ0lGgIaA5DCAAAAAAAAAAAlIaUUpSMBl9zaGFwZZQpjAVkdHlwZZRoDowKX25wX3JhbmRvbZROdWIu", "n": "4", "start": "0", "_shape": [], "dtype": "int64", "_np_random": null}, "n_envs": 16, "n_steps": 1024, "gamma": 0.999, "gae_lambda": 0.98, "ent_coef": 0.01, "vf_coef": 0.5, "max_grad_norm": 0.5, "batch_size": 64, "n_epochs": 4, "clip_range": {":type:": "<class 'function'>", ":serialized:": "gAWV1gIAAAAAAACMF2Nsb3VkcGlja2xlLmNsb3VkcGlja2xllIwOX21ha2VfZnVuY3Rpb26Uk5QoaACMDV9idWlsdGluX3R5cGWUk5SMCENvZGVUeXBllIWUUpQoSwFLAEsASwFLAUsTQwiVAZcAiQFTAJROhZQpjAFflIWUjEkvdXNyL2xvY2FsL2xpYi9weXRob24zLjEyL2Rpc3QtcGFja2FnZXMvc3RhYmxlX2Jhc2VsaW5lczMvY29tbW9uL3V0aWxzLnB5lIwEZnVuY5SMGWNvbnN0YW50X2ZuLjxsb2NhbHM+LmZ1bmOUS4RDCPiAANgPEogKlEMAlIwDdmFslIWUKXSUUpR9lCiMC19fcGFja2FnZV9flIwYc3RhYmxlX2Jhc2VsaW5lczMuY29tbW9ulIwIX19uYW1lX1+UjB5zdGFibGVfYmFzZWxpbmVzMy5jb21tb24udXRpbHOUjAhfX2ZpbGVfX5SMSS91c3IvbG9jYWwvbGliL3B5dGhvbjMuMTIvZGlzdC1wYWNrYWdlcy9zdGFibGVfYmFzZWxpbmVzMy9jb21tb24vdXRpbHMucHmUdU5OaACMEF9tYWtlX2VtcHR5X2NlbGyUk5QpUpSFlHSUUpRoAIwSX2Z1bmN0aW9uX3NldHN0YXRllJOUaCF9lH2UKGgYjARmdW5jlIwMX19xdWFsbmFtZV9flIwZY29uc3RhbnRfZm4uPGxvY2Fscz4uZnVuY5SMD19fYW5ub3RhdGlvbnNfX5R9lIwOX19rd2RlZmF1bHRzX1+UTowMX19kZWZhdWx0c19flE6MCl9fbW9kdWxlX1+UaBmMB19fZG9jX1+UTowLX19jbG9zdXJlX1+UaACMCl9tYWtlX2NlbGyUk5RHP8mZmZmZmZqFlFKUhZSMF19jbG91ZHBpY2tsZV9zdWJtb2R1bGVzlF2UjAtfX2dsb2JhbHNfX5R9lHWGlIZSMC4="}, "clip_range_vf": null, "normalize_advantage": true, "target_kl": null, "lr_schedule": {":type:": "<class 'function'>", ":serialized:": "gAWV1gIAAAAAAACMF2Nsb3VkcGlja2xlLmNsb3VkcGlja2xllIwOX21ha2VfZnVuY3Rpb26Uk5QoaACMDV9idWlsdGluX3R5cGWUk5SMCENvZGVUeXBllIWUUpQoSwFLAEsASwFLAUsTQwiVAZcAiQFTAJROhZQpjAFflIWUjEkvdXNyL2xvY2FsL2xpYi9weXRob24zLjEyL2Rpc3QtcGFja2FnZXMvc3RhYmxlX2Jhc2VsaW5lczMvY29tbW9uL3V0aWxzLnB5lIwEZnVuY5SMGWNvbnN0YW50X2ZuLjxsb2NhbHM+LmZ1bmOUS4RDCPiAANgPEogKlEMAlIwDdmFslIWUKXSUUpR9lCiMC19fcGFja2FnZV9flIwYc3RhYmxlX2Jhc2VsaW5lczMuY29tbW9ulIwIX19uYW1lX1+UjB5zdGFibGVfYmFzZWxpbmVzMy5jb21tb24udXRpbHOUjAhfX2ZpbGVfX5SMSS91c3IvbG9jYWwvbGliL3B5dGhvbjMuMTIvZGlzdC1wYWNrYWdlcy9zdGFibGVfYmFzZWxpbmVzMy9jb21tb24vdXRpbHMucHmUdU5OaACMEF9tYWtlX2VtcHR5X2NlbGyUk5QpUpSFlHSUUpRoAIwSX2Z1bmN0aW9uX3NldHN0YXRllJOUaCF9lH2UKGgYjARmdW5jlIwMX19xdWFsbmFtZV9flIwZY29uc3RhbnRfZm4uPGxvY2Fscz4uZnVuY5SMD19fYW5ub3RhdGlvbnNfX5R9lIwOX19rd2RlZmF1bHRzX1+UTowMX19kZWZhdWx0c19flE6MCl9fbW9kdWxlX1+UaBmMB19fZG9jX1+UTowLX19jbG9zdXJlX1+UaACMCl9tYWtlX2NlbGyUk5RHPzOpKjBVMmGFlFKUhZSMF19jbG91ZHBpY2tsZV9zdWJtb2R1bGVzlF2UjAtfX2dsb2JhbHNfX5R9lHWGlIZSMC4="}, "system_info": {"OS": "Linux-6.6.105+-x86_64-with-glibc2.35 # 1 SMP Thu Oct 2 10:42:05 UTC 2025", "Python": "3.12.12", "Stable-Baselines3": "2.0.0a5", "PyTorch": "2.9.0+cu126", "GPU Enabled": "True", "Numpy": "2.0.2", "Cloudpickle": "3.1.2", "Gymnasium": "0.28.1", "OpenAI Gym": "0.25.2"}}
ppo-LunarLander-v2.zip CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:401049f780bc1355c4fd9e66dc2005df42b317bc3d3a0cabe997aac772608a98
3
- size 1681530
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:7e57cabf84425751b7860bd200819d976843ad957f124c809111b7ef6de5ff9e
3
+ size 149119
ppo-LunarLander-v2/data CHANGED
@@ -4,46 +4,38 @@
4
  ":serialized:": "gAWVOwAAAAAAAACMIXN0YWJsZV9iYXNlbGluZXMzLmNvbW1vbi5wb2xpY2llc5SMEUFjdG9yQ3JpdGljUG9saWN5lJOULg==",
5
  "__module__": "stable_baselines3.common.policies",
6
  "__doc__": "\n Policy class for actor-critic algorithms (has both policy and value prediction).\n Used by A2C, PPO and the likes.\n\n :param observation_space: Observation space\n :param action_space: Action space\n :param lr_schedule: Learning rate schedule (could be constant)\n :param net_arch: The specification of the policy and value networks.\n :param activation_fn: Activation function\n :param ortho_init: Whether to use or not orthogonal initialization\n :param use_sde: Whether to use State Dependent Exploration or not\n :param log_std_init: Initial value for the log standard deviation\n :param full_std: Whether to use (n_features x n_actions) parameters\n for the std instead of only (n_features,) when using gSDE\n :param use_expln: Use ``expln()`` function instead of ``exp()`` to ensure\n a positive standard deviation (cf paper). It allows to keep variance\n above zero and prevent it from growing too fast. In practice, ``exp()`` is usually enough.\n :param squash_output: Whether to squash the output using a tanh function,\n this allows to ensure boundaries when using gSDE.\n :param features_extractor_class: Features extractor to use.\n :param features_extractor_kwargs: Keyword arguments\n to pass to the features extractor.\n :param share_features_extractor: If True, the features extractor is shared between the policy and value networks.\n :param normalize_images: Whether to normalize images or not,\n dividing by 255.0 (True by default)\n :param optimizer_class: The optimizer to use,\n ``th.optim.Adam`` by default\n :param optimizer_kwargs: Additional keyword arguments,\n excluding the learning rate, to pass to the optimizer\n ",
7
- "__init__": "<function ActorCriticPolicy.__init__ at 0x37cc609a0>",
8
- "_get_constructor_parameters": "<function ActorCriticPolicy._get_constructor_parameters at 0x37cc60a40>",
9
- "reset_noise": "<function ActorCriticPolicy.reset_noise at 0x37cc60ae0>",
10
- "_build_mlp_extractor": "<function ActorCriticPolicy._build_mlp_extractor at 0x37cc60b80>",
11
- "_build": "<function ActorCriticPolicy._build at 0x37cc60c20>",
12
- "forward": "<function ActorCriticPolicy.forward at 0x37cc60cc0>",
13
- "extract_features": "<function ActorCriticPolicy.extract_features at 0x37cc60d60>",
14
- "_get_action_dist_from_latent": "<function ActorCriticPolicy._get_action_dist_from_latent at 0x37cc60e00>",
15
- "_predict": "<function ActorCriticPolicy._predict at 0x37cc60ea0>",
16
- "evaluate_actions": "<function ActorCriticPolicy.evaluate_actions at 0x37cc60f40>",
17
- "get_distribution": "<function ActorCriticPolicy.get_distribution at 0x37cc60fe0>",
18
- "predict_values": "<function ActorCriticPolicy.predict_values at 0x37cc61080>",
19
  "__abstractmethods__": "frozenset()",
20
- "_abc_impl": "<_abc._abc_data object at 0x37cafad00>"
21
  },
22
  "verbose": 1,
23
- "policy_kwargs": {
24
- "net_arch": [
25
- 256,
26
- 256
27
- ]
28
- },
29
  "num_timesteps": 1507328,
30
  "_total_timesteps": 1500000,
31
  "_num_timesteps_at_start": 0,
32
  "seed": null,
33
  "action_noise": null,
34
- "start_time": 1765036791869687000,
35
- "learning_rate": {
36
- ":type:": "<class 'function'>",
37
- ":serialized:": "gAWV+QEAAAAAAACMF2Nsb3VkcGlja2xlLmNsb3VkcGlja2xllIwOX21ha2VfZnVuY3Rpb26Uk5QoaACMDV9idWlsdGluX3R5cGWUk5SMCENvZGVUeXBllIWUUpQoSwFLAEsASwFLA0sDQxKXAGQBZAJ8AHoKAAB6BQAAUwCUTkc/Gjbi6xxDLUsBh5QpjAFflIWUjE4vdmFyL2ZvbGRlcnMva2wveTE3cGtxNG4zeHoycXk3YnZyYmRwaHFjMDAwMGduL1QvaXB5a2VybmVsXzU1NDM4LzM5Mzg1NjQwMjkucHmUjAg8bGFtYmRhPpRoDUsTQw6AAJhEoEGoAaFFmU6AAJRDAJQpKXSUUpR9lCiMC19fcGFja2FnZV9flE6MCF9fbmFtZV9flIwIX19tYWluX1+UdU5OTnSUUpRoAIwSX2Z1bmN0aW9uX3NldHN0YXRllJOUaBd9lH2UKGgUaA2MDF9fcXVhbG5hbWVfX5RoDYwPX19hbm5vdGF0aW9uc19flH2UjA5fX2t3ZGVmYXVsdHNfX5ROjAxfX2RlZmF1bHRzX1+UTowKX19tb2R1bGVfX5RoFYwHX19kb2NfX5ROjAtfX2Nsb3N1cmVfX5ROjBdfY2xvdWRwaWNrbGVfc3VibW9kdWxlc5RdlIwLX19nbG9iYWxzX1+UfZR1hpSGUjAu"
38
- },
39
  "tensorboard_log": null,
40
  "_last_obs": {
41
  ":type:": "<class 'numpy.ndarray'>",
42
- ":serialized:": "gAWVdQIAAAAAAACMEm51bXB5LmNvcmUubnVtZXJpY5SMC19mcm9tYnVmZmVylJOUKJYAAgAAAAAAADP+KL5XzGo/eMy6vWmtT75vQQK+cYGUPQAAAAAAAAAAzYyYuVJc9rvYCkK+rvpLu97JRz2ryd89AACAPwAAgD/gjSa+wSdNP7oMnL3DuZi+lmawvedJJL0AAAAAAAAAAIA7r70DTHI9mVWiPu/qK76afBA9ttolvQAAAAAAAAAAps7FvaQKMzybEWE9y5A1vpRBdL2AcT09AAAAAAAAAACalfy7ycUDPguVjT5BzDK+BAV1PdPEbD0AAAAAAAAAAA13mD2S4h0/ZfgTvjIRhb4F/WK86L6JvQAAAAAAAAAAM6tIPa+ApT4gD0s8NhBbvvIte7v4xf86AAAAAAAAAADNeLq9Roo0P+bCEb5itZ++WknMvTZ0GTwAAAAAAAAAAADYpzwc1Vi8bdvBOylotjw217m9efiSPQAAgD8AAIA/c4qqvfbkV7pW6T49sKcDNuaZzToIF/g0AAAAAAAAAADqrV6+4/MMP6D35zzaaW++2I6svTHliz0AAAAAAAAAANDBmj59a5o/XkO2PkeXur7vCng+inIevgAAAAAAAAAATYg/vRLa8jwe6cY8Zz1Zvu2KETyYu2S9AAAAAAAAAAAAfnu8i++vP6oavb5ZkeO+xJTPO0YqB70AAAAAAAAAANKenL4ROkg/JhLOvYYFtb6RCSy+phBfPQAAAAAAAAAAlIwFbnVtcHmUjAVkdHlwZZSTlIwCZjSUiYiHlFKUKEsDjAE8lE5OTkr/////Sv////9LAHSUYksQSwiGlIwBQ5R0lFKULg=="
43
  },
44
  "_last_episode_starts": {
45
  ":type:": "<class 'numpy.ndarray'>",
46
- ":serialized:": "gAWVgwAAAAAAAACMEm51bXB5LmNvcmUubnVtZXJpY5SMC19mcm9tYnVmZmVylJOUKJYQAAAAAAAAAAAAAAAAAAAAAAAAAAAAAACUjAVudW1weZSMBWR0eXBllJOUjAJiMZSJiIeUUpQoSwOMAXyUTk5OSv////9K/////0sAdJRiSxCFlIwBQ5R0lFKULg=="
47
  },
48
  "_last_original_obs": null,
49
  "_episode_num": 0,
@@ -53,16 +45,16 @@
53
  "_stats_window_size": 100,
54
  "ep_info_buffer": {
55
  ":type:": "<class 'collections.deque'>",
56
- ":serialized:": "gAWVQAwAAAAAAACMC2NvbGxlY3Rpb25zlIwFZGVxdWWUk5QpS2SGlFKUKH2UKIwBcpRHQG6Ibs4T9KqMAWyUTU4BjAF0lEdAire2H1vl2nV9lChoBkdAcXcEdeY2KmgHTRkBaAhHQIq4Wn4wh4d1fZQoaAZHQGxXFQ2uPmxoB00oAWgIR0CKuKj/uLJkdX2UKGgGR0AoVhWo3rD7aAdL82gIR0CKuecx0uDjdX2UKGgGR0Bw6hQGfPHDaAdNVQFoCEdAirsgTZg5R3V9lChoBkdAbIGNI9TxXmgHTToBaAhHQIq8bo0Q9Rt1fZQoaAZHQG15srNGEwpoB00lAWgIR0CKvRWo3rD7dX2UKGgGR0BvQ0fcN6PbaAdNDgFoCEdAir0ebNKRMnV9lChoBkdAcnQa72+PBGgHTTIBaAhHQIq9XJYDDCR1fZQoaAZHQG4fPrWy1NRoB003AWgIR0CKvdz+WGATdX2UKGgGR0Bx62ePJaJRaAdNQwFoCEdAir6MiB5HE3V9lChoBkdAcUEiiZfD12gHTTABaAhHQIq+rSqlxfh1fZQoaAZHQG8h6uOjqOdoB00iAWgIR0CKvyCROk+HdX2UKGgGR0Bx+m65Gz8haAdNIQFoCEdAir+FRP420nV9lChoBkdAcb0HxjJ+2GgHTT8BaAhHQIrA4Wi1y/91fZQoaAZHQHDLtyYG+sZoB004AWgIR0CKwUydnTRZdX2UKGgGR0Bu6zTWoWHlaAdNNwFoCEdAisJRmbsniXV9lChoBkdAcM9+ERJ2+2gHTU0BaAhHQIrCpEWqLjx1fZQoaAZHQCJUTBZZB9loB0vpaAhHQIrDpnDiwSt1fZQoaAZHQESwe8PFvQ5oB0veaAhHQIrD1ELH+611fZQoaAZHQHBKc+qzZ6FoB01AAWgIR0CKxArhisnzdX2UKGgGR0BwVdRFZxJeaAdNPwFoCEdAisU3+dbxE3V9lChoBkdAbnzRl6JIlWgHTSkBaAhHQIrGV6Vt4zJ1fZQoaAZHQHD/b4Ju2qloB002AWgIR0CKx7pRoAXEdX2UKGgGR0Budz2g3974aAdNJAFoCEdAisfn4fwI+nV9lChoBkdAcS5de6ZpjGgHTV0BaAhHQIrIfcFhXsB1fZQoaAZHQHEKfoA4n4RoB00lAWgIR0CKyIzoEB8ydX2UKGgGR0BryXtx+8XfaAdNJAFoCEdAisjpwsGxEHV9lChoBkdAbs/OKO1fFGgHTVsBaAhHQIrJvYBeXzF1fZQoaAZHQG4XVQ66reZoB00rAWgIR0CKyoElE7W/dX2UKGgGR0BxbG2d/axpaAdNKQFoCEdAisraLfk3j3V9lChoBkdAbct5M10knmgHTRkBaAhHQIrLYFiay8l1fZQoaAZHQHHLZRXOnl5oB01FAWgIR0CKzRDNyHVPdX2UKGgGR0Bx6cM9bHIZaAdNHQFoCEdAis0/s3Q2M3V9lChoBkdAb/6+VTrE+GgHTS8BaAhHQIrNbIT4+KV1fZQoaAZHQHBlqubI91VoB005AWgIR0CKze2FWXC1dX2UKGgGR0BwpNRQ79ycaAdNNAFoCEdAis9IBJZntnV9lChoBkdAbmJa/RE4N2gHTTYBaAhHQIrQhid8Rcx1fZQoaAZHQGzUJ4B3iaRoB00fAWgIR0CK0P9Wp6yCdX2UKGgGR0BvgNEgGKQ8aAdNEAFoCEdAitFAXEZR9HV9lChoBkdAcbVfEn9ehWgHTQsBaAhHQIrRg/xDst11fZQoaAZHQG9m02tMfzVoB00wAWgIR0CK0kgoPTXrdX2UKGgGR0Bw03lmvnr6aAdNTAFoCEdAitKLtmcvunV9lChoBkdAcYQlRxcVxmgHTSoBaAhHQIrTS/Efkmx1fZQoaAZHQGBxoqLCN0hoB03oA2gIR0CK1FVQyhzvdX2UKGgGR0BwRQWKuSwGaAdNLAFoCEdAitUKJEYwZnV9lChoBkdAcHG+WGATZmgHTRQBaAhHQIrWLPIGQjl1fZQoaAZHQHFBOyquKXRoB01vAWgIR0CK1pwFTvRadX2UKGgGR0BxJToePq9oaAdNGQFoCEdAitb7y6MBIXV9lChoBkdAcbnlruYx+WgHTUsBaAhHQIrXr15B1Ld1fZQoaAZHQHIY6VdHDrJoB01VAWgIR0CK2FVFQVKxdX2UKGgGR0BwgnFtKqXGaAdNFAFoCEdAitnQ04zabnV9lChoBkdAckNtShrWRWgHTVgBaAhHQIraTfLs8gZ1fZQoaAZHQG5X181Gb1BoB00bAWgIR0CK2l3225QQdX2UKGgGR0BvlSkEcKgJaAdNMwFoCEdAitqeiSJTEXV9lChoBkdAbrtQqqfe12gHTUQBaAhHQIrau4G2TgV1fZQoaAZHQHBxpzPrv9doB00mAWgIR0CK22UO/cnFdX2UKGgGR0BxjUtvn8sMaAdNNAFoCEdAitwMMAmzB3V9lChoBkdAcW3PLPldT2gHTQEBaAhHQIrcS4SYgJV1fZQoaAZHQG9Jgntv4udoB002AWgIR0CK3MwTufEodX2UKGgGR0BwVqAqd6LPaAdNLAFoCEdAit4jr7fpEHV9lChoBkdAccBpbD/EO2gHTSoBaAhHQIrfKx5cC5p1fZQoaAZHQG5PFQMx46hoB00nAWgIR0CK3/Bt1p0wdX2UKGgGR0BwvZHz6JqJaAdNSgFoCEdAiuC37+DODHV9lChoBkdAcML3ljmSyWgHTTQBaAhHQIrhN6LOzIF1fZQoaAZHQG3Krh73PAxoB00oAWgIR0CK4YXuVopQdX2UKGgGR0ByQoYAKfFraAdNLwFoCEdAiuPr0J4SpXV9lChoBkdAcd6TUiILxGgHS/doCEdAiuQLiuMdcXV9lChoBkdAa2WsIVuaW2gHTTABaAhHQIrkbhNucc51fZQoaAZHQG4UG9xp+MJoB01DAWgIR0CK5J+TeO4odX2UKGgGR0ByBHY287IUaAdNVwFoCEdAiuTT/IbOvHV9lChoBkdAcDagMc6vJWgHTUQBaAhHQIrk+0ojOcF1fZQoaAZHQHFFo9kjHGVoB009AWgIR0CK5Zkd3jdYdX2UKGgGR0BwSmWE9MbnaAdNEwFoCEdAiuXV89fTkXV9lChoBkdAbXv1ZkkKNWgHTUIBaAhHQIrmpjhDPWx1fZQoaAZHQHDYrnTy8SRoB00gAWgIR0CK559zfaYedX2UKGgGR0Br6aufVZs9aAdNNgFoCEdAiulyeRPoFHV9lChoBkdAXaU5OrQw9WgHTegDaAhHQIrqXn8sMAp1fZQoaAZHQHB3S/O+qR5oB00xAWgIR0CK6tdrwe/6dX2UKGgGR0ByW62rn1WbaAdNUwFoCEdAius4FA3T/nV9lChoBkdAa/TBTn7pFGgHTSgBaAhHQIrrS1y/9Hd1fZQoaAZHQHGmugxrSE1oB00yAWgIR0CK61Jo0ygxdX2UKGgGR0Bu9WZ5Rjz7aAdNGgFoCEdAiuzhPCVKPHV9lChoBkdAcDnvAGjbjGgHTSwBaAhHQIruJI1+AmR1fZQoaAZHQHCphjawljVoB00UAWgIR0CK7jIyTINmdX2UKGgGR0Bx8uEg4ffXaAdNPwFoCEdAiu5hg/keZHV9lChoBkdAcdEVh1DBuWgHTToBaAhHQIrutJjDsMR1fZQoaAZHQG/6nUlRgqpoB003AWgIR0CK73P0I1LrdX2UKGgGR0ByA7VRUFSsaAdNZAFoCEdAiu+aVMVUM3V9lChoBkdAbTadTYNAkmgHTSgBaAhHQIrvzl3hXKd1fZQoaAZHQHG3fZElVtJoB00lAWgIR0CK8IgxJul5dX2UKGgGR0Bxm3jhky1vaAdNoAFoCEdAivCiosI3SHV9lChoBkdAcKgDIikftGgHTR4BaAhHQIryxOWSlnB1fZQoaAZHQG8aL/82rGRoB01AAWgIR0CK8wbz9S/CdX2UKGgGR0BuJEwvg3tKaAdNGwFoCEdAivODTBqKxnV9lChoBkdAcC4GMXJo02gHTSgBaAhHQIr0BJ2+wkh1fZQoaAZHQHE8CgPEsJ9oB009AWgIR0CK9DBvaURndX2UKGgGR0BwIolXzUZvaAdNSAFoCEdAivTsnJDE33V9lChoBkdAbFsf0VafSWgHTRIBaAhHQIr09pZfUnZ1fZQoaAZHQG/FJFCswL5oB00YAWgIR0CK9obS7Xg+dWUu"
57
  },
58
  "ep_success_buffer": {
59
  ":type:": "<class 'collections.deque'>",
60
  ":serialized:": "gAWVIAAAAAAAAACMC2NvbGxlY3Rpb25zlIwFZGVxdWWUk5QpS2SGlFKULg=="
61
  },
62
- "_n_updates": 460,
63
  "observation_space": {
64
  ":type:": "<class 'gymnasium.spaces.box.Box'>",
65
- ":serialized:": "gAWVdgIAAAAAAACMFGd5bW5hc2l1bS5zcGFjZXMuYm94lIwDQm94lJOUKYGUfZQojAVkdHlwZZSMBW51bXB5lIwFZHR5cGWUk5SMAmY0lImIh5RSlChLA4wBPJROTk5K/////0r/////SwB0lGKMDWJvdW5kZWRfYmVsb3eUjBJudW1weS5jb3JlLm51bWVyaWOUjAtfZnJvbWJ1ZmZlcpSTlCiWCAAAAAAAAAABAQEBAQEBAZRoCIwCYjGUiYiHlFKUKEsDjAF8lE5OTkr/////Sv////9LAHSUYksIhZSMAUOUdJRSlIwNYm91bmRlZF9hYm92ZZRoESiWCAAAAAAAAAABAQEBAQEBAZRoFUsIhZRoGXSUUpSMBl9zaGFwZZRLCIWUjANsb3eUaBEoliAAAAAAAAAAAAC0wgAAtMIAAKDAAACgwNsPScAAAKDAAAAAgAAAAICUaAtLCIWUaBl0lFKUjARoaWdolGgRKJYgAAAAAAAAAAAAtEIAALRCAACgQAAAoEDbD0lAAACgQAAAgD8AAIA/lGgLSwiFlGgZdJRSlIwIbG93X3JlcHKUjFtbLTkwLiAgICAgICAgLTkwLiAgICAgICAgIC01LiAgICAgICAgIC01LiAgICAgICAgIC0zLjE0MTU5MjcgIC01LgogIC0wLiAgICAgICAgIC0wLiAgICAgICBdlIwJaGlnaF9yZXBylIxTWzkwLiAgICAgICAgOTAuICAgICAgICAgNS4gICAgICAgICA1LiAgICAgICAgIDMuMTQxNTkyNyAgNS4KICAxLiAgICAgICAgIDEuICAgICAgIF2UjApfbnBfcmFuZG9tlE51Yi4=",
66
  "dtype": "float32",
67
  "bounded_below": "[ True True True True True True True True]",
68
  "bounded_above": "[ True True True True True True True True]",
@@ -77,7 +69,7 @@
77
  },
78
  "action_space": {
79
  ":type:": "<class 'gymnasium.spaces.discrete.Discrete'>",
80
- ":serialized:": "gAWV2wAAAAAAAACMGWd5bW5hc2l1bS5zcGFjZXMuZGlzY3JldGWUjAhEaXNjcmV0ZZSTlCmBlH2UKIwBbpSMFW51bXB5LmNvcmUubXVsdGlhcnJheZSMBnNjYWxhcpSTlIwFbnVtcHmUjAVkdHlwZZSTlIwCaTiUiYiHlFKUKEsDjAE8lE5OTkr/////Sv////9LAHSUYkMIBAAAAAAAAACUhpRSlIwFc3RhcnSUaAhoDkMIAAAAAAAAAACUhpRSlIwGX3NoYXBllCmMBWR0eXBllGgOjApfbnBfcmFuZG9tlE51Yi4=",
81
  "n": "4",
82
  "start": "0",
83
  "_shape": [],
@@ -85,23 +77,23 @@
85
  "_np_random": null
86
  },
87
  "n_envs": 16,
88
- "n_steps": 2048,
89
- "gamma": 0.99,
90
- "gae_lambda": 0.97,
91
- "ent_coef": 0.0005,
92
  "vf_coef": 0.5,
93
  "max_grad_norm": 0.5,
94
  "batch_size": 64,
95
- "n_epochs": 10,
96
  "clip_range": {
97
  ":type:": "<class 'function'>",
98
- ":serialized:": "gAWVvwIAAAAAAACMF2Nsb3VkcGlja2xlLmNsb3VkcGlja2xllIwOX21ha2VfZnVuY3Rpb26Uk5QoaACMDV9idWlsdGluX3R5cGWUk5SMCENvZGVUeXBllIWUUpQoSwFLAEsASwFLAUsTQwiVAZcAiQFTAJROhZQpjAFflIWUjE0vb3B0L2FuYWNvbmRhMy9saWIvcHl0aG9uMy4xMi9zaXRlLXBhY2thZ2VzL3N0YWJsZV9iYXNlbGluZXMzL2NvbW1vbi91dGlscy5weZSMBGZ1bmOUjBljb25zdGFudF9mbi48bG9jYWxzPi5mdW5jlEuEQwj4gADYDxKICpRDAJSMA3ZhbJSFlCl0lFKUfZQojAtfX3BhY2thZ2VfX5SMGHN0YWJsZV9iYXNlbGluZXMzLmNvbW1vbpSMCF9fbmFtZV9flIwec3RhYmxlX2Jhc2VsaW5lczMuY29tbW9uLnV0aWxzlIwIX19maWxlX1+UjE0vb3B0L2FuYWNvbmRhMy9saWIvcHl0aG9uMy4xMi9zaXRlLXBhY2thZ2VzL3N0YWJsZV9iYXNlbGluZXMzL2NvbW1vbi91dGlscy5weZR1Tk5oAIwQX21ha2VfZW1wdHlfY2VsbJSTlClSlIWUdJRSlGgAjBJfZnVuY3Rpb25fc2V0c3RhdGWUk5RoIX2UfZQoaBhoDYwMX19xdWFsbmFtZV9flGgOjA9fX2Fubm90YXRpb25zX1+UfZSMDl9fa3dkZWZhdWx0c19flE6MDF9fZGVmYXVsdHNfX5ROjApfX21vZHVsZV9flGgZjAdfX2RvY19flE6MC19fY2xvc3VyZV9flGgAjApfbWFrZV9jZWxslJOURz/JmZmZmZmahZRSlIWUjBdfY2xvdWRwaWNrbGVfc3VibW9kdWxlc5RdlIwLX19nbG9iYWxzX1+UfZR1hpSGUjAu"
99
  },
100
  "clip_range_vf": null,
101
  "normalize_advantage": true,
102
  "target_kl": null,
103
  "lr_schedule": {
104
  ":type:": "<class 'function'>",
105
- ":serialized:": "gAWV+QEAAAAAAACMF2Nsb3VkcGlja2xlLmNsb3VkcGlja2xllIwOX21ha2VfZnVuY3Rpb26Uk5QoaACMDV9idWlsdGluX3R5cGWUk5SMCENvZGVUeXBllIWUUpQoSwFLAEsASwFLA0sDQxKXAGQBZAJ8AHoKAAB6BQAAUwCUTkc/Gjbi6xxDLUsBh5QpjAFflIWUjE4vdmFyL2ZvbGRlcnMva2wveTE3cGtxNG4zeHoycXk3YnZyYmRwaHFjMDAwMGduL1QvaXB5a2VybmVsXzU1NDM4LzM5Mzg1NjQwMjkucHmUjAg8bGFtYmRhPpRoDUsTQw6AAJhEoEGoAaFFmU6AAJRDAJQpKXSUUpR9lCiMC19fcGFja2FnZV9flE6MCF9fbmFtZV9flIwIX19tYWluX1+UdU5OTnSUUpRoAIwSX2Z1bmN0aW9uX3NldHN0YXRllJOUaBd9lH2UKGgUaA2MDF9fcXVhbG5hbWVfX5RoDYwPX19hbm5vdGF0aW9uc19flH2UjA5fX2t3ZGVmYXVsdHNfX5ROjAxfX2RlZmF1bHRzX1+UTowKX19tb2R1bGVfX5RoFYwHX19kb2NfX5ROjAtfX2Nsb3N1cmVfX5ROjBdfY2xvdWRwaWNrbGVfc3VibW9kdWxlc5RdlIwLX19nbG9iYWxzX1+UfZR1hpSGUjAu"
106
  }
107
  }
 
4
  ":serialized:": "gAWVOwAAAAAAAACMIXN0YWJsZV9iYXNlbGluZXMzLmNvbW1vbi5wb2xpY2llc5SMEUFjdG9yQ3JpdGljUG9saWN5lJOULg==",
5
  "__module__": "stable_baselines3.common.policies",
6
  "__doc__": "\n Policy class for actor-critic algorithms (has both policy and value prediction).\n Used by A2C, PPO and the likes.\n\n :param observation_space: Observation space\n :param action_space: Action space\n :param lr_schedule: Learning rate schedule (could be constant)\n :param net_arch: The specification of the policy and value networks.\n :param activation_fn: Activation function\n :param ortho_init: Whether to use or not orthogonal initialization\n :param use_sde: Whether to use State Dependent Exploration or not\n :param log_std_init: Initial value for the log standard deviation\n :param full_std: Whether to use (n_features x n_actions) parameters\n for the std instead of only (n_features,) when using gSDE\n :param use_expln: Use ``expln()`` function instead of ``exp()`` to ensure\n a positive standard deviation (cf paper). It allows to keep variance\n above zero and prevent it from growing too fast. In practice, ``exp()`` is usually enough.\n :param squash_output: Whether to squash the output using a tanh function,\n this allows to ensure boundaries when using gSDE.\n :param features_extractor_class: Features extractor to use.\n :param features_extractor_kwargs: Keyword arguments\n to pass to the features extractor.\n :param share_features_extractor: If True, the features extractor is shared between the policy and value networks.\n :param normalize_images: Whether to normalize images or not,\n dividing by 255.0 (True by default)\n :param optimizer_class: The optimizer to use,\n ``th.optim.Adam`` by default\n :param optimizer_kwargs: Additional keyword arguments,\n excluding the learning rate, to pass to the optimizer\n ",
7
+ "__init__": "<function ActorCriticPolicy.__init__ at 0x79dd3027fce0>",
8
+ "_get_constructor_parameters": "<function ActorCriticPolicy._get_constructor_parameters at 0x79dd3027fd80>",
9
+ "reset_noise": "<function ActorCriticPolicy.reset_noise at 0x79dd3027fe20>",
10
+ "_build_mlp_extractor": "<function ActorCriticPolicy._build_mlp_extractor at 0x79dd3027fec0>",
11
+ "_build": "<function ActorCriticPolicy._build at 0x79dd3027ff60>",
12
+ "forward": "<function ActorCriticPolicy.forward at 0x79dd30280040>",
13
+ "extract_features": "<function ActorCriticPolicy.extract_features at 0x79dd302800e0>",
14
+ "_get_action_dist_from_latent": "<function ActorCriticPolicy._get_action_dist_from_latent at 0x79dd30280180>",
15
+ "_predict": "<function ActorCriticPolicy._predict at 0x79dd30280220>",
16
+ "evaluate_actions": "<function ActorCriticPolicy.evaluate_actions at 0x79dd302802c0>",
17
+ "get_distribution": "<function ActorCriticPolicy.get_distribution at 0x79dd30280360>",
18
+ "predict_values": "<function ActorCriticPolicy.predict_values at 0x79dd30280400>",
19
  "__abstractmethods__": "frozenset()",
20
+ "_abc_impl": "<_abc._abc_data object at 0x79dd303e7780>"
21
  },
22
  "verbose": 1,
23
+ "policy_kwargs": {},
 
 
 
 
 
24
  "num_timesteps": 1507328,
25
  "_total_timesteps": 1500000,
26
  "_num_timesteps_at_start": 0,
27
  "seed": null,
28
  "action_noise": null,
29
+ "start_time": 1765473389146329985,
30
+ "learning_rate": 0.0003,
 
 
 
31
  "tensorboard_log": null,
32
  "_last_obs": {
33
  ":type:": "<class 'numpy.ndarray'>",
34
+ ":serialized:": "gAWVdgIAAAAAAACME251bXB5Ll9jb3JlLm51bWVyaWOUjAtfZnJvbWJ1ZmZlcpSTlCiWAAIAAAAAAACm/7K9gueQPui4oT50P8y+ocIePj+5HT4AAAAAAAAAAM0oUTzL7K8935JHvgV4Ub6Hs7i9MaLGPAAAAAAAAAAAM/nMPLs0qrwGokC8xIhzPe0bmz01ebW8AACAPwAAgD/mbSA9CCOfPZNnYL0/JVa+2c6HPLLKpTwAAAAAAAAAAACfQj1k3vQ+JuEEvYKDlL7q/gE9jk98OAAAAAAAAAAAM0epO08rWj336BG+V9SBvuyZNbzeEZy9AAAAAAAAAABtrkQ+DVn1Pp7Eg72d4qG+JtGGPfZHRj0AAAAAAAAAABqfST0VRTA/znaivUaDt75Zfek8QOUavQAAAAAAAAAAmtuYvMEy8T2pXwK9ooGMvjJgrTygj808AAAAAAAAAADtHAm+2xC1PzpoF7+taoW+ddIWvr2El74AAAAAAAAAAICY4r2h1bY946USPjmhlL7adWw9lpmJPAAAAAAAAAAAM7PevGxr1LuBHjE+K1zpO9YmJ72Wj9E8AACAPwAAgD/I1Ya+UPCJP0eYnr47ReO+Bs7EvsIBLr0AAAAAAAAAAEAQtL16bI8/ghKlvZHI574zth6+/UjavAAAAAAAAAAAsw+NvVs9bz/abrO9ZmHOvnrU/r0uOHq8AAAAAAAAAAAQxqE+VEVePwLtmb0M9ae+S7xqPrfGtr0AAAAAAAAAAJSMBW51bXB5lIwFZHR5cGWUk5SMAmY0lImIh5RSlChLA4wBPJROTk5K/////0r/////SwB0lGJLEEsIhpSMAUOUdJRSlC4="
35
  },
36
  "_last_episode_starts": {
37
  ":type:": "<class 'numpy.ndarray'>",
38
+ ":serialized:": "gAWVhAAAAAAAAACME251bXB5Ll9jb3JlLm51bWVyaWOUjAtfZnJvbWJ1ZmZlcpSTlCiWEAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAlIwFbnVtcHmUjAVkdHlwZZSTlIwCYjGUiYiHlFKUKEsDjAF8lE5OTkr/////Sv////9LAHSUYksQhZSMAUOUdJRSlC4="
39
  },
40
  "_last_original_obs": null,
41
  "_episode_num": 0,
 
45
  "_stats_window_size": 100,
46
  "ep_info_buffer": {
47
  ":type:": "<class 'collections.deque'>",
48
+ ":serialized:": "gAWVFQwAAAAAAACMC2NvbGxlY3Rpb25zlIwFZGVxdWWUk5QpS2SGlFKUKH2UKIwBcpRHQHEFle4TbnKMAWyUS+OMAXSUR0CYamL876pHdX2UKGgGR0Bxcvvx6OYIaAdL6mgIR0CYard5IH1OdX2UKGgGR0BzFQRSP2f1aAdNLwFoCEdAmGrWrfcesHV9lChoBkdAcdasOoYNzGgHTQMBaAhHQJhrIdU83dd1fZQoaAZHQHB8Ey+HrQhoB00rAWgIR0CYa4VEd/8VdX2UKGgGR0BwcwqAjIJaaAdNMwFoCEdAmGuS79Q40nV9lChoBkdAcQQmU4aP0mgHS/ZoCEdAmG3GUfPom3V9lChoBkdAcTpmtyPuHGgHS+VoCEdAmG4Mhs67unV9lChoBkdAcP3k9ECvHWgHTRMBaAhHQJhuWI1tO211fZQoaAZHQHGN3gP3BYVoB0vjaAhHQJhu7lRxcVx1fZQoaAZHQHCzEadc0LtoB0v0aAhHQJhvOnivPkd1fZQoaAZHQHEom8yvcJtoB00LAWgIR0CYb9Qw9JSSdX2UKGgGR0Bv+gsZpBX0aAdNFAFoCEdAmG//Qv6CUXV9lChoBkdAcS/xzaK1omgHS+1oCEdAmHAZSzgMt3V9lChoBkdAbp9ijL0SRWgHS+loCEdAmHCUtNBWxXV9lChoBkdAcCiMPSUkfWgHS/loCEdAmHCmPYFqz3V9lChoBkdAbbgDRtxdZGgHTQABaAhHQJhyM8r7O3V1fZQoaAZHQHAzWf5DZ15oB00SAWgIR0CYcjtPHktFdX2UKGgGR0BxKz9XLeQ/aAdNKAFoCEdAmHJ8/+sHSnV9lChoBkdAcEvxKg7HQ2gHTSUBaAhHQJhzPdoFmnR1fZQoaAZHQHIbrU1AJLNoB00dAmgIR0CYc8byH2ytdX2UKGgGR0BxSukTHsC1aAdNAwFoCEdAmHURTfixV3V9lChoBkdAcYoEg4ffXWgHS+NoCEdAmHV3qzJIUnV9lChoBkdAcptUvf0mMWgHS/9oCEdAmHX8CYCyQnV9lChoBkdAcmU9kBjnWGgHTTMBaAhHQJh2TbblA/t1fZQoaAZHQHI1V2aDwphoB0v0aAhHQJh22s6q8151fZQoaAZHQHGT5e/pMYdoB0v3aAhHQJh3NM7EHdJ1fZQoaAZHQHNU41k1/DtoB01RAWgIR0CYeFyd4FA3dX2UKGgGR0BxHTZmI0qIaAdNFwFoCEdAmHih8pkPMHV9lChoBkdAc2NoS+QEIWgHTR0BaAhHQJh5pgeA/cF1fZQoaAZHQG5X1vVEuxtoB00DAWgIR0CYerdhiLEUdX2UKGgGR0BvDuxY7q6faAdL+WgIR0CYerhBZ6lddX2UKGgGR0ByiIbZOBUaaAdNBwFoCEdAmHrjlxOtXHV9lChoBkdAbHWKF7D2rWgHS+xoCEdAmHwWe18b73V9lChoBkdAcXkkDZDiO2gHTQwBaAhHQJh8iZPVNHp1fZQoaAZHQHJ3AU1yeZpoB0vbaAhHQJh92PS2H+J1fZQoaAZHQHElczyjHn5oB0vnaAhHQJh+zI+4b0h1fZQoaAZHQG73KgyuZCxoB00GAWgIR0CYftxvNu+AdX2UKGgGR0BvxqKYRdyDaAdL6WgIR0CYki5P/JeWdX2UKGgGR0Bw2vXxvvSdaAdNAQFoCEdAmJKPyXlbNnV9lChoBkdAcFaQ79ycTmgHS+poCEdAmJOFWCEpRXV9lChoBkdAcejsLv1DjWgHTRABaAhHQJiTlGSZBs11fZQoaAZHQHAuB6v7m+1oB0v2aAhHQJiUojX4CZF1fZQoaAZHQG4jWhh6SkloB00jAWgIR0CYlPZbILgGdX2UKGgGR0BuY+38XN1RaAdL6WgIR0CYlRnUUfxMdX2UKGgGR0Bw0wDklu3uaAdNAAFoCEdAmJW6QJXyRXV9lChoBkdActhT3qRlpWgHTQsBaAhHQJiWJVWCEpR1fZQoaAZHQEpwSyMUAT9oB0vPaAhHQJiXbWxyGSJ1fZQoaAZHQHLzxzaK1ohoB00nAWgIR0CYl/MHKOktdX2UKGgGR0BxBc/iYLLIaAdNBwFoCEdAmJg/n0TURXV9lChoBkdAcsK3Sro4dmgHS/NoCEdAmJiDguRLb3V9lChoBkdAcMO72tdRi2gHTTgBaAhHQJiYzVPN3W51fZQoaAZHQGQ0VWCEpRZoB03oA2gIR0CYmachkiD/dX2UKGgGR0BwANSHdoFnaAdNAwFoCEdAmJnlqN6w+3V9lChoBkdAcaLWGATZhGgHTQ4BaAhHQJiZ5hx5s0p1fZQoaAZHQEy9G8VYZEVoB0vraAhHQJiaNnM+u/11fZQoaAZHQHLGc3uNPxhoB00BAWgIR0CYmrq0MPSVdX2UKGgGR0ByDFCUornUaAdL5WgIR0CYm0lTFVDKdX2UKGgGR0BxPrcYZVGTaAdNAwFoCEdAmJvdETg2qHV9lChoBkdAbhokTpPhymgHS+loCEdAmJw1TR6WxHV9lChoBkdAbvBRaX8fm2gHS9toCEdAmJxCFPBSDXV9lChoBkdAcWwSAYpDu2gHTSwBaAhHQJidUxVQyh11fZQoaAZHQHKzCyyD7IloB0vcaAhHQJidbLV4HHF1fZQoaAZHQHHTt+CsfaJoB0vtaAhHQJieggkka/B1fZQoaAZHQHBJQpF1B+poB0v9aAhHQJieuIdlum91fZQoaAZHQHDrPIbOu7poB00WAWgIR0CYoGOJ+DvmdX2UKGgGR0ByXUN4JNTMaAdL8WgIR0CYoIedTYNBdX2UKGgGR0BxjCqU/wAmaAdNKAFoCEdAmKCnXd0q6XV9lChoBkdAZkPr2QGOdWgHTegDaAhHQJihvaL4vex1fZQoaAZHQHDbx/qgRK9oB00bAWgIR0CYoc5jYqXodX2UKGgGR0By+GmelKsdaAdNJgFoCEdAmKHb5IpYtHV9lChoBkdAcxw0SRKYiWgHS9ZoCEdAmKHvu1F6RnV9lChoBkdAbjyK8cuJ12gHS/BoCEdAmKIdWdVebHV9lChoBkdAcO8XiBGx2WgHTQwBaAhHQJiiQrmQr+Z1fZQoaAZHQHFGYbn5i3JoB00qAWgIR0CYonqS5iEydX2UKGgGR0BwrsNQTEiuaAdL42gIR0CYo5gAp8WsdX2UKGgGR0Bw/+KdhAnlaAdL42gIR0CYo7JO32EkdX2UKGgGR0A5cRP420iRaAdLemgIR0CYo7fKp1ifdX2UKGgGR0BxTs+RoysTaAdNHQFoCEdAmKP3qmj0tnV9lChoBkdAbe8er+5vtWgHTSQBaAhHQJikFESdvsJ1fZQoaAZHQHLKjFZPl+5oB00CAWgIR0CYpUY/3WWhdX2UKGgGR0BxvZYigTRIaAdL/mgIR0CYpVmzByjpdX2UKGgGR0Bw/VFEy+HraAdL0mgIR0CYpY8a4tpVdX2UKGgGR0BxCGvmozeoaAdL7GgIR0CYpqTHKfWddX2UKGgGR0BzDUOlO45MaAdL2WgIR0CYqIiOearndX2UKGgGR0BwYF1dPci4aAdNBAFoCEdAmKkZNj9XLnV9lChoBkdAbYTFglWwNmgHS/FoCEdAmKkliz9jw3V9lChoBkdAc07p84Pwu2gHTRQBaAhHQJip5YFJQLx1fZQoaAZHQHJZIkVvddpoB00XAWgIR0CYql9bX6IndX2UKGgGR0BxYzkkrwvyaAdNKAFoCEdAmKqOUD+zdHV9lChoBkdAcN/lOoHcDmgHTSwBaAhHQJiq23b212J1fZQoaAZHQHNM4d+5OJtoB0vwaAhHQJirR13dKul1fZQoaAZHQG4TivPkaMtoB0v6aAhHQJirgIv8IiV1fZQoaAZHQHLutM0xdptoB0v1aAhHQJirgUFjd591fZQoaAZHQHN/zSLIgeRoB00CAWgIR0CYrGQxN7BwdX2UKGgGR0Bvwc+u/1xsaAdNHQFoCEdAmK0kfozN2XV9lChoBkdAcelEIgNgB2gHS/xoCEdAmK4zoMa0hXV9lChoBkdAcO55WRzRyGgHS/RoCEdAmK467EpAlnV9lChoBkdAb6RdAxBVuWgHTQMBaAhHQJiuTFUADJV1fZQoaAZHQHMPE/GEPDpoB0vqaAhHQJiuudZq20B1ZS4="
49
  },
50
  "ep_success_buffer": {
51
  ":type:": "<class 'collections.deque'>",
52
  ":serialized:": "gAWVIAAAAAAAAACMC2NvbGxlY3Rpb25zlIwFZGVxdWWUk5QpS2SGlFKULg=="
53
  },
54
+ "_n_updates": 368,
55
  "observation_space": {
56
  ":type:": "<class 'gymnasium.spaces.box.Box'>",
57
+ ":serialized:": "gAWVdwIAAAAAAACMFGd5bW5hc2l1bS5zcGFjZXMuYm94lIwDQm94lJOUKYGUfZQojAVkdHlwZZSMBW51bXB5lIwFZHR5cGWUk5SMAmY0lImIh5RSlChLA4wBPJROTk5K/////0r/////SwB0lGKMDWJvdW5kZWRfYmVsb3eUjBNudW1weS5fY29yZS5udW1lcmljlIwLX2Zyb21idWZmZXKUk5QolggAAAAAAAAAAQEBAQEBAQGUaAiMAmIxlImIh5RSlChLA4wBfJROTk5K/////0r/////SwB0lGJLCIWUjAFDlHSUUpSMDWJvdW5kZWRfYWJvdmWUaBEolggAAAAAAAAAAQEBAQEBAQGUaBVLCIWUaBl0lFKUjAZfc2hhcGWUSwiFlIwDbG93lGgRKJYgAAAAAAAAAAAAtMIAALTCAACgwAAAoMDbD0nAAACgwAAAAIAAAACAlGgLSwiFlGgZdJRSlIwEaGlnaJRoESiWIAAAAAAAAAAAALRCAAC0QgAAoEAAAKBA2w9JQAAAoEAAAIA/AACAP5RoC0sIhZRoGXSUUpSMCGxvd19yZXBylIxbWy05MC4gICAgICAgIC05MC4gICAgICAgICAtNS4gICAgICAgICAtNS4gICAgICAgICAtMy4xNDE1OTI3ICAtNS4KICAtMC4gICAgICAgICAtMC4gICAgICAgXZSMCWhpZ2hfcmVwcpSMU1s5MC4gICAgICAgIDkwLiAgICAgICAgIDUuICAgICAgICAgNS4gICAgICAgICAzLjE0MTU5MjcgIDUuCiAgMS4gICAgICAgICAxLiAgICAgICBdlIwKX25wX3JhbmRvbZROdWIu",
58
  "dtype": "float32",
59
  "bounded_below": "[ True True True True True True True True]",
60
  "bounded_above": "[ True True True True True True True True]",
 
69
  },
70
  "action_space": {
71
  ":type:": "<class 'gymnasium.spaces.discrete.Discrete'>",
72
+ ":serialized:": "gAWV3AAAAAAAAACMGWd5bW5hc2l1bS5zcGFjZXMuZGlzY3JldGWUjAhEaXNjcmV0ZZSTlCmBlH2UKIwBbpSMFm51bXB5Ll9jb3JlLm11bHRpYXJyYXmUjAZzY2FsYXKUk5SMBW51bXB5lIwFZHR5cGWUk5SMAmk4lImIh5RSlChLA4wBPJROTk5K/////0r/////SwB0lGJDCAQAAAAAAAAAlIaUUpSMBXN0YXJ0lGgIaA5DCAAAAAAAAAAAlIaUUpSMBl9zaGFwZZQpjAVkdHlwZZRoDowKX25wX3JhbmRvbZROdWIu",
73
  "n": "4",
74
  "start": "0",
75
  "_shape": [],
 
77
  "_np_random": null
78
  },
79
  "n_envs": 16,
80
+ "n_steps": 1024,
81
+ "gamma": 0.999,
82
+ "gae_lambda": 0.98,
83
+ "ent_coef": 0.01,
84
  "vf_coef": 0.5,
85
  "max_grad_norm": 0.5,
86
  "batch_size": 64,
87
+ "n_epochs": 4,
88
  "clip_range": {
89
  ":type:": "<class 'function'>",
90
+ ":serialized:": "gAWV1gIAAAAAAACMF2Nsb3VkcGlja2xlLmNsb3VkcGlja2xllIwOX21ha2VfZnVuY3Rpb26Uk5QoaACMDV9idWlsdGluX3R5cGWUk5SMCENvZGVUeXBllIWUUpQoSwFLAEsASwFLAUsTQwiVAZcAiQFTAJROhZQpjAFflIWUjEkvdXNyL2xvY2FsL2xpYi9weXRob24zLjEyL2Rpc3QtcGFja2FnZXMvc3RhYmxlX2Jhc2VsaW5lczMvY29tbW9uL3V0aWxzLnB5lIwEZnVuY5SMGWNvbnN0YW50X2ZuLjxsb2NhbHM+LmZ1bmOUS4RDCPiAANgPEogKlEMAlIwDdmFslIWUKXSUUpR9lCiMC19fcGFja2FnZV9flIwYc3RhYmxlX2Jhc2VsaW5lczMuY29tbW9ulIwIX19uYW1lX1+UjB5zdGFibGVfYmFzZWxpbmVzMy5jb21tb24udXRpbHOUjAhfX2ZpbGVfX5SMSS91c3IvbG9jYWwvbGliL3B5dGhvbjMuMTIvZGlzdC1wYWNrYWdlcy9zdGFibGVfYmFzZWxpbmVzMy9jb21tb24vdXRpbHMucHmUdU5OaACMEF9tYWtlX2VtcHR5X2NlbGyUk5QpUpSFlHSUUpRoAIwSX2Z1bmN0aW9uX3NldHN0YXRllJOUaCF9lH2UKGgYjARmdW5jlIwMX19xdWFsbmFtZV9flIwZY29uc3RhbnRfZm4uPGxvY2Fscz4uZnVuY5SMD19fYW5ub3RhdGlvbnNfX5R9lIwOX19rd2RlZmF1bHRzX1+UTowMX19kZWZhdWx0c19flE6MCl9fbW9kdWxlX1+UaBmMB19fZG9jX1+UTowLX19jbG9zdXJlX1+UaACMCl9tYWtlX2NlbGyUk5RHP8mZmZmZmZqFlFKUhZSMF19jbG91ZHBpY2tsZV9zdWJtb2R1bGVzlF2UjAtfX2dsb2JhbHNfX5R9lHWGlIZSMC4="
91
  },
92
  "clip_range_vf": null,
93
  "normalize_advantage": true,
94
  "target_kl": null,
95
  "lr_schedule": {
96
  ":type:": "<class 'function'>",
97
+ ":serialized:": "gAWV1gIAAAAAAACMF2Nsb3VkcGlja2xlLmNsb3VkcGlja2xllIwOX21ha2VfZnVuY3Rpb26Uk5QoaACMDV9idWlsdGluX3R5cGWUk5SMCENvZGVUeXBllIWUUpQoSwFLAEsASwFLAUsTQwiVAZcAiQFTAJROhZQpjAFflIWUjEkvdXNyL2xvY2FsL2xpYi9weXRob24zLjEyL2Rpc3QtcGFja2FnZXMvc3RhYmxlX2Jhc2VsaW5lczMvY29tbW9uL3V0aWxzLnB5lIwEZnVuY5SMGWNvbnN0YW50X2ZuLjxsb2NhbHM+LmZ1bmOUS4RDCPiAANgPEogKlEMAlIwDdmFslIWUKXSUUpR9lCiMC19fcGFja2FnZV9flIwYc3RhYmxlX2Jhc2VsaW5lczMuY29tbW9ulIwIX19uYW1lX1+UjB5zdGFibGVfYmFzZWxpbmVzMy5jb21tb24udXRpbHOUjAhfX2ZpbGVfX5SMSS91c3IvbG9jYWwvbGliL3B5dGhvbjMuMTIvZGlzdC1wYWNrYWdlcy9zdGFibGVfYmFzZWxpbmVzMy9jb21tb24vdXRpbHMucHmUdU5OaACMEF9tYWtlX2VtcHR5X2NlbGyUk5QpUpSFlHSUUpRoAIwSX2Z1bmN0aW9uX3NldHN0YXRllJOUaCF9lH2UKGgYjARmdW5jlIwMX19xdWFsbmFtZV9flIwZY29uc3RhbnRfZm4uPGxvY2Fscz4uZnVuY5SMD19fYW5ub3RhdGlvbnNfX5R9lIwOX19rd2RlZmF1bHRzX1+UTowMX19kZWZhdWx0c19flE6MCl9fbW9kdWxlX1+UaBmMB19fZG9jX1+UTowLX19jbG9zdXJlX1+UaACMCl9tYWtlX2NlbGyUk5RHPzOpKjBVMmGFlFKUhZSMF19jbG91ZHBpY2tsZV9zdWJtb2R1bGVzlF2UjAtfX2dsb2JhbHNfX5R9lHWGlIZSMC4="
98
  }
99
  }
ppo-LunarLander-v2/policy.optimizer.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:c06a7ab6ea3fed30c9a9f61907d4b6b3ee72609b49d1221997f6f27caaa49deb
3
- size 1109879
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e5a8b82a91cf3cdfe41aeafecbe0fc52038e1a3592406ead2b06fc4885244e91
3
+ size 88695
ppo-LunarLander-v2/policy.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:7c959e9ee9642c8106a515cb842eb5300661714ca187a127259fd13000ea373c
3
- size 554751
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:3b4220b30a703513238096fd1a75956ba205314d4dfe112638d0e2a007aeb647
3
+ size 44095
ppo-LunarLander-v2/pytorch_variables.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:7b6bbfc035aeac78f3ee425960893ff8bb7927d3cf3425470ac4b6c6ce280c5d
3
  size 1261
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:07c7431cf6005e7d8f367d79e995f63e2f9b981a37e3437b795d058f9af4308b
3
  size 1261
ppo-LunarLander-v2/system_info.txt CHANGED
@@ -1,9 +1,9 @@
1
- - OS: macOS-15.6.1-arm64-arm-64bit Darwin Kernel Version 24.6.0: Mon Jul 14 11:30:40 PDT 2025; root:xnu-11417.140.69~1/RELEASE_ARM64_T6041
2
- - Python: 3.12.2
3
  - Stable-Baselines3: 2.0.0a5
4
- - PyTorch: 2.7.0
5
- - GPU Enabled: False
6
- - Numpy: 1.26.4
7
- - Cloudpickle: 3.0.0
8
  - Gymnasium: 0.28.1
9
- - OpenAI Gym: 0.26.2
 
1
+ - OS: Linux-6.6.105+-x86_64-with-glibc2.35 # 1 SMP Thu Oct 2 10:42:05 UTC 2025
2
+ - Python: 3.12.12
3
  - Stable-Baselines3: 2.0.0a5
4
+ - PyTorch: 2.9.0+cu126
5
+ - GPU Enabled: True
6
+ - Numpy: 2.0.2
7
+ - Cloudpickle: 3.1.2
8
  - Gymnasium: 0.28.1
9
+ - OpenAI Gym: 0.25.2
replay.mp4 CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:b200c648224be4a8aeec3adf1e68c46878621354ab4c0f4b3ddde3d07aab0543
3
- size 164333
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:33c60f47cb8fc1d053f797569ccf8f41ced461123b4fa2a7becac136d21804f7
3
+ size 147427
results.json CHANGED
@@ -1 +1 @@
1
- {"mean_reward": 209.8153486915452, "std_reward": 73.31105441841818, "is_deterministic": true, "n_eval_episodes": 10, "eval_datetime": "2025-12-06T17:19:59.849254"}
 
1
+ {"mean_reward": 275.7800392308601, "std_reward": 17.288160639183115, "is_deterministic": true, "n_eval_episodes": 10, "eval_datetime": "2025-12-11T17:42:51.775045"}