reeeemo commited on
Commit
eb12ccd
·
verified ·
1 Parent(s): b405060

Upload PPO LunarLander-v2 trained agent

Browse files
README.md CHANGED
@@ -16,7 +16,7 @@ model-index:
16
  type: LunarLander-v2
17
  metrics:
18
  - type: mean_reward
19
- value: 258.08 +/- 11.55
20
  name: mean_reward
21
  verified: false
22
  ---
 
16
  type: LunarLander-v2
17
  metrics:
18
  - type: mean_reward
19
+ value: 279.70 +/- 18.00
20
  name: mean_reward
21
  verified: false
22
  ---
config.json CHANGED
@@ -1 +1 @@
1
- {"policy_class": {":type:": "<class 'abc.ABCMeta'>", ":serialized:": "gAWVOwAAAAAAAACMIXN0YWJsZV9iYXNlbGluZXMzLmNvbW1vbi5wb2xpY2llc5SMEUFjdG9yQ3JpdGljUG9saWN5lJOULg==", "__module__": "stable_baselines3.common.policies", "__doc__": "\n Policy class for actor-critic algorithms (has both policy and value prediction).\n Used by A2C, PPO and the likes.\n\n :param observation_space: Observation space\n :param action_space: Action space\n :param lr_schedule: Learning rate schedule (could be constant)\n :param net_arch: The specification of the policy and value networks.\n :param activation_fn: Activation function\n :param ortho_init: Whether to use or not orthogonal initialization\n :param use_sde: Whether to use State Dependent Exploration or not\n :param log_std_init: Initial value for the log standard deviation\n :param full_std: Whether to use (n_features x n_actions) parameters\n for the std instead of only (n_features,) when using gSDE\n :param use_expln: Use ``expln()`` function instead of ``exp()`` to ensure\n a positive standard deviation (cf paper). It allows to keep variance\n above zero and prevent it from growing too fast. In practice, ``exp()`` is usually enough.\n :param squash_output: Whether to squash the output using a tanh function,\n this allows to ensure boundaries when using gSDE.\n :param features_extractor_class: Features extractor to use.\n :param features_extractor_kwargs: Keyword arguments\n to pass to the features extractor.\n :param share_features_extractor: If True, the features extractor is shared between the policy and value networks.\n :param normalize_images: Whether to normalize images or not,\n dividing by 255.0 (True by default)\n :param optimizer_class: The optimizer to use,\n ``th.optim.Adam`` by default\n :param optimizer_kwargs: Additional keyword arguments,\n excluding the learning rate, to pass to the optimizer\n ", "__init__": "<function ActorCriticPolicy.__init__ at 0x79d6765153a0>", "_get_constructor_parameters": "<function ActorCriticPolicy._get_constructor_parameters at 0x79d676515440>", "reset_noise": "<function ActorCriticPolicy.reset_noise at 0x79d6765154e0>", "_build_mlp_extractor": "<function ActorCriticPolicy._build_mlp_extractor at 0x79d676515580>", "_build": "<function ActorCriticPolicy._build at 0x79d676515620>", "forward": "<function ActorCriticPolicy.forward at 0x79d6765156c0>", "extract_features": "<function ActorCriticPolicy.extract_features at 0x79d676515760>", "_get_action_dist_from_latent": "<function ActorCriticPolicy._get_action_dist_from_latent at 0x79d676515800>", "_predict": "<function ActorCriticPolicy._predict at 0x79d6765158a0>", "evaluate_actions": "<function ActorCriticPolicy.evaluate_actions at 0x79d676515940>", "get_distribution": "<function ActorCriticPolicy.get_distribution at 0x79d6765159e0>", "predict_values": "<function ActorCriticPolicy.predict_values at 0x79d676515a80>", "__abstractmethods__": "frozenset()", "_abc_impl": "<_abc._abc_data object at 0x79d6766a0780>"}, "verbose": 1, "policy_kwargs": {}, "num_timesteps": 1015808, "_total_timesteps": 1000000, "_num_timesteps_at_start": 0, "seed": null, "action_noise": null, "start_time": 1751586655091952105, "learning_rate": 0.0003, "tensorboard_log": null, "_last_obs": {":type:": "<class 'numpy.ndarray'>", ":serialized:": "gAWVdgIAAAAAAACME251bXB5Ll9jb3JlLm51bWVyaWOUjAtfZnJvbWJ1ZmZlcpSTlCiWAAIAAAAAAACmTSs+fMI3P+2WB76O/nO+2/xUPH7dAb0AAAAAAAAAAObAcD3DiU66PSddOCYblrUr0pU6sfGXtAAAgD8AAIA/M2+vvMNZJLqBTQM48coEM3PwujrFNxy3AACAPwAAgD/NRMk7VBvRPSlyC7wJMVO+LazOO99PgT0AAAAAAAAAAM2w9Tt7Rpa8fqx5Oyb7BT1nNMg9mGkcPQAAgD8AAIA/mg4fvcOdK7oAStI6DX26NRqsEjtzGfq5AACAPwAAgD/NHys9FaSKP9rGIT0PXI++TKCDPAs/+rsAAAAAAAAAAKbCxb28nM8+mqQ2O6rkVL51hXA9xOIsPQAAAAAAAAAAZsLROxRAhbovOMM6CUeZNcZturq2TOO5AACAPwAAgD+AF0u9XPNvugvp47YeicSxrxWsupvxBjYAAIA/AACAP81klrtUuLI/YtBovkl5rb587HQ73oapPAAAAAAAAAAAQKyyvR/NwLlyeNY4FgtRNMxsfjl+hgi4AACAPwAAgD+ApwM9SIOUukp16LvF8yA4XBYVuj8yIbcAAIA/AACAP81wdLw8mHQ/zvDIu6oWoL4/yCQ8yODPPAAAAAAAAAAAZnwjvCkMULoIsrc6RH2gtI8aqLs4ydS5AACAPwAAgD8Alpy8PaoZucLmR7nzW7q0FabqO3u5cDgAAIA/AACAP5SMBW51bXB5lIwFZHR5cGWUk5SMAmY0lImIh5RSlChLA4wBPJROTk5K/////0r/////SwB0lGJLEEsIhpSMAUOUdJRSlC4="}, "_last_episode_starts": {":type:": "<class 'numpy.ndarray'>", ":serialized:": "gAWVhAAAAAAAAACME251bXB5Ll9jb3JlLm51bWVyaWOUjAtfZnJvbWJ1ZmZlcpSTlCiWEAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAlIwFbnVtcHmUjAVkdHlwZZSTlIwCYjGUiYiHlFKUKEsDjAF8lE5OTkr/////Sv////9LAHSUYksQhZSMAUOUdJRSlC4="}, "_last_original_obs": null, "_episode_num": 0, "use_sde": false, "sde_sample_freq": -1, "_current_progress_remaining": -0.015808000000000044, "_stats_window_size": 100, "ep_info_buffer": {":type:": "<class 'collections.deque'>", ":serialized:": "gAWVRAwAAAAAAACMC2NvbGxlY3Rpb25zlIwFZGVxdWWUk5QpS2SGlFKUKH2UKIwBcpRHQGNGF6Z6UqyMAWyUTegDjAF0lEdAkJ7nrpqynnV9lChoBkdAZco1Aqur62gHTegDaAhHQJCiiUt7KJV1fZQoaAZHQGDft0eU6gdoB03oA2gIR0CQrI92X9iudX2UKGgGR0BlJ+eg+QlsaAdN6ANoCEdAkLMr/82rGXV9lChoBkdAYxzaakRBeGgHTegDaAhHQJC2Cj4593N1fZQoaAZHQGEk1oxpL29oB03oA2gIR0CQuYctXgccdX2UKGgGR0Bi9y9TP0I1aAdN6ANoCEdAkL4Wn4wh4nV9lChoBkdAYYZG+bmU4mgHTegDaAhHQJDDnKFIuoR1fZQoaAZHQF8MHrQgLZ1oB03oA2gIR0CQyJmnfl6rdX2UKGgGR0BfSupwS8J2aAdN6ANoCEdAkMipRjz7M3V9lChoBkdAZQWPmxMWXWgHTegDaAhHQJDJyprDZUV1fZQoaAZHQGLs5c1O0sxoB03oA2gIR0CQz/W/ag27dX2UKGgGR0Bgr+GKyfL+aAdN6ANoCEdAkND3VXmvGXV9lChoBkdAZaZCXyAhCGgHTegDaAhHQJDRJcTrVvx1fZQoaAZHQGc+sHryDqZoB03oA2gIR0CQ0g46wMYudX2UKGgGR0Bfdj3mFJxvaAdN6ANoCEdAkPBltfoicHV9lChoBkdAY/2A4n4O+mgHTegDaAhHQJDzM4WDYiB1fZQoaAZHQGDxl8G9pRJoB03oA2gIR0CQ9toYekpJdX2UKGgGR0BfxCx3V09yaAdN6ANoCEdAkQCg/s3Q2XV9lChoBkdAYH+DW9US7GgHTegDaAhHQJEHC9eyAx11fZQoaAZHQFt9xZuAI6doB03oA2gIR0CRCViVSn+AdX2UKGgGR0Bg/eTFERapaAdN6ANoCEdAkQwD/dZaFHV9lChoBkdAZnx47ihnJ2gHTegDaAhHQJEPbPeHi3p1fZQoaAZHQGc7orFwT/RoB03oA2gIR0CRFJdjoZAIdX2UKGgGR0BhYeloDgZTaAdN6ANoCEdAkRsVqi48U3V9lChoBkdAYzf9roGIK2gHTegDaAhHQJEbLG6wt8N1fZQoaAZHQGZyyLqD9O1oB03oA2gIR0CRHM6ab4JvdX2UKGgGR0BhuY86mwaBaAdN6ANoCEdAkSN6PGQ0XXV9lChoBkdAYHkn3L3bmGgHTegDaAhHQJEkd9ORDCx1fZQoaAZHQGajeY+jdpJoB03oA2gIR0CRJKSQYDT0dX2UKGgGR0BfKlHOKO1faAdN6ANoCEdAkSWMpXp4bHV9lChoBkdAYX0lQdjoZGgHTegDaAhHQJFDDaL4vex1fZQoaAZHQGC5CVB2OhloB03oA2gIR0CRRk3Sro4ddX2UKGgGR0BlFCHTI/7jaAdN6ANoCEdAkUuLdvbXYnV9lChoBkdAZZhyOJcgQ2gHTegDaAhHQJFWhkUbkwN1fZQoaAZHQGTfTzundftoB03oA2gIR0CRXXnTy8SPdX2UKGgGR0BjpgaDPGADaAdN6ANoCEdAkWAIvWYnfHV9lChoBkdAYbSVrylN12gHTegDaAhHQJFi2kBS1md1fZQoaAZHQFrJ9CNS619oB03oA2gIR0CRZrBsQ/X5dX2UKGgGR0BlJlm16Vt5aAdN6ANoCEdAkWxr9qDbrXV9lChoBkdAYt1vUjLSu2gHTegDaAhHQJFxfdbgTAZ1fZQoaAZHQF9LhnrY5DJoB03oA2gIR0CRcZCFsYVJdX2UKGgGR0BkXqvcJtzkaAdN6ANoCEdAkXLTxb0OE3V9lChoBkdAYOLGSZBsymgHTegDaAhHQJF54Mw1zhh1fZQoaAZHQF6xaCcwxnFoB03oA2gIR0CRexjgAIY4dX2UKGgGR0Be1Zhz/6wdaAdN6ANoCEdAkXtPv4M4LnV9lChoBkdAZR/zcRDkVGgHTegDaAhHQJF8fPomoit1fZQoaAZHQGQAZ9d/rjZoB03oA2gIR0CRma4REnb7dX2UKGgGR0BiuOLxZuAJaAdN6ANoCEdAkZx/uLJjlXV9lChoBkdAYuMsV+I/JWgHTegDaAhHQJGfzSOR1YB1fZQoaAZHQFurHc1wYLtoB03oA2gIR0CRqOWKMvRJdX2UKGgGR0BkiBdt2s7uaAdN6ANoCEdAkbDBusLfDXV9lChoBkdAZz2wXZXdTGgHTegDaAhHQJGy9wcYIjZ1fZQoaAZHQGO+hE8aGYdoB03oA2gIR0CRtT84PwuvdX2UKGgGR0Bip519v0iAaAdN6ANoCEdAkbh4nBtUGXV9lChoBkdAXqfF85S3s2gHTegDaAhHQJG9dshxHXp1fZQoaAZHQF/uedkJ8fFoB03oA2gIR0CRwj1F6RhddX2UKGgGR0BjQeZqmCRPaAdN6ANoCEdAkcJMVgx8D3V9lChoBkdAZxDuEVWS2mgHTegDaAhHQJHDejua4MF1fZQoaAZHQGGEyT6i0v5oB03oA2gIR0CRyZFrl/6PdX2UKGgGR0BjFb9qDbrUaAdN6ANoCEdAkcp3FLnLaHV9lChoBkdAYsDBSk0rLGgHTegDaAhHQJHKoxEfDDV1fZQoaAZHQF4ZzCUHIIZoB03oA2gIR0CRy36kIomYdX2UKGgGR0BMtcH4XXRPaAdNIAFoCEdAkc2NUGVzIXV9lChoBkdAZyV4nF5v+GgHTegDaAhHQJHpGb5M10l1fZQoaAZHQGOB0UGmk31oB03oA2gIR0CR67g+hXbNdX2UKGgGR0Bl+pMWXTmXaAdN6ANoCEdAke7f5tWMj3V9lChoBkdAYFzbItDlYGgHTegDaAhHQJH3E3sHB1t1fZQoaAZHQGLjPr4WUKRoB03oA2gIR0CR/Hcdo372dX2UKGgGR0BbFFopQUHqaAdN6ANoCEdAkf5P5gw483V9lChoBkdAYTVwYLsru2gHTegDaAhHQJIAfLTx5LR1fZQoaAZHQGJZtQj2SMdoB03oA2gIR0CSA375Ec81dX2UKGgGR0BkjLW07bL2aAdN6ANoCEdAkg5MXFcY7HV9lChoBkdAZPJmfXf642gHTegDaAhHQJIOYUvf0mN1fZQoaAZHQGIhEyk9ECxoB03oA2gIR0CSD/fRu0kXdX2UKGgGR0BaLcbFS88LaAdN6ANoCEdAkhfx9srNGHV9lChoBkdAZcPKtga3qmgHTegDaAhHQJIZJnBciW51fZQoaAZHQGN1O9vjwQVoB03oA2gIR0CSGV+8Gs3idX2UKGgGR0BhASB/ZuhsaAdN6ANoCEdAkhp4ikfs/3V9lChoBkdAZUmKD0163WgHTegDaAhHQJIcZ9Tgl4V1fZQoaAZHQFgkOObRWtFoB03oA2gIR0CSI4soDxLCdX2UKGgGR0Bix3xWkrPMaAdN6ANoCEdAkjeiu+yquXV9lChoBkdAYaYQNCqp+GgHTegDaAhHQJI6/seGO+91fZQoaAZHQHEqGnTAnD1oB03vAWgIR0CSPiXY150KdX2UKGgGR0ByMWWw/xDtaAdNrQFoCEdAkkOdTLns9nV9lChoBkdAZ/6LpiZv1mgHTegDaAhHQJJEwLb5/LF1fZQoaAZHQGbV6/Zdv89oB03oA2gIR0CSSaUKzAvddX2UKGgGR0BhhaEg4ffXaAdN6ANoCEdAkktnAh0QsnV9lChoBkdAZO7jy4FzMmgHTegDaAhHQJJNhXdTHbR1fZQoaAZHQGbg/PPcBU9oB03oA2gIR0CSUF2TPjXGdX2UKGgGR0BuxI5vLowFaAdNugJoCEdAklEhddE9dXV9lChoBkdAYfCGwiaAnWgHTegDaAhHQJJZauV5a/11fZQoaAZHQGFO1wgkkbBoB03oA2gIR0CSWoiM5wOwdX2UKGgGR0BlJYRRMvh7aAdN6ANoCEdAkmBHWz4UOHV9lChoBkdAZ6OepXIU8GgHTegDaAhHQJJiKyD7Ikt1fZQoaAZHQGQ/Dn/1g6VoB03oA2gIR0CSZFZIxxkvdX2UKGgGR0Bx1S2JBPbgaAdNBwNoCEdAkmfWjCYTkHV9lChoBkdAcgIY9gWrO2gHTd4CaAhHQJJq5jpcHGF1fZQoaAZHQHFE2/etSydoB03iA2gIR0CSa8K4hEBsdX2UKGgGR0Bi/ZOpKjBVaAdN6ANoCEdAkm83bh3qzXVlLg=="}, "ep_success_buffer": {":type:": "<class 'collections.deque'>", ":serialized:": "gAWVIAAAAAAAAACMC2NvbGxlY3Rpb25zlIwFZGVxdWWUk5QpS2SGlFKULg=="}, "_n_updates": 248, "observation_space": {":type:": "<class 'gymnasium.spaces.box.Box'>", ":serialized:": "gAWVdwIAAAAAAACMFGd5bW5hc2l1bS5zcGFjZXMuYm94lIwDQm94lJOUKYGUfZQojAVkdHlwZZSMBW51bXB5lIwFZHR5cGWUk5SMAmY0lImIh5RSlChLA4wBPJROTk5K/////0r/////SwB0lGKMDWJvdW5kZWRfYmVsb3eUjBNudW1weS5fY29yZS5udW1lcmljlIwLX2Zyb21idWZmZXKUk5QolggAAAAAAAAAAQEBAQEBAQGUaAiMAmIxlImIh5RSlChLA4wBfJROTk5K/////0r/////SwB0lGJLCIWUjAFDlHSUUpSMDWJvdW5kZWRfYWJvdmWUaBEolggAAAAAAAAAAQEBAQEBAQGUaBVLCIWUaBl0lFKUjAZfc2hhcGWUSwiFlIwDbG93lGgRKJYgAAAAAAAAAAAAtMIAALTCAACgwAAAoMDbD0nAAACgwAAAAIAAAACAlGgLSwiFlGgZdJRSlIwEaGlnaJRoESiWIAAAAAAAAAAAALRCAAC0QgAAoEAAAKBA2w9JQAAAoEAAAIA/AACAP5RoC0sIhZRoGXSUUpSMCGxvd19yZXBylIxbWy05MC4gICAgICAgIC05MC4gICAgICAgICAtNS4gICAgICAgICAtNS4gICAgICAgICAtMy4xNDE1OTI3ICAtNS4KICAtMC4gICAgICAgICAtMC4gICAgICAgXZSMCWhpZ2hfcmVwcpSMU1s5MC4gICAgICAgIDkwLiAgICAgICAgIDUuICAgICAgICAgNS4gICAgICAgICAzLjE0MTU5MjcgIDUuCiAgMS4gICAgICAgICAxLiAgICAgICBdlIwKX25wX3JhbmRvbZROdWIu", "dtype": "float32", "bounded_below": "[ True True True True True True True True]", "bounded_above": "[ True True True True True True True True]", "_shape": [8], "low": "[-90. -90. -5. -5. -3.1415927 -5.\n -0. -0. ]", "high": "[90. 90. 5. 5. 3.1415927 5.\n 1. 1. ]", "low_repr": "[-90. -90. -5. -5. -3.1415927 -5.\n -0. -0. ]", "high_repr": "[90. 90. 5. 5. 3.1415927 5.\n 1. 1. ]", "_np_random": null}, "action_space": {":type:": "<class 'gymnasium.spaces.discrete.Discrete'>", ":serialized:": "gAWV3AAAAAAAAACMGWd5bW5hc2l1bS5zcGFjZXMuZGlzY3JldGWUjAhEaXNjcmV0ZZSTlCmBlH2UKIwBbpSMFm51bXB5Ll9jb3JlLm11bHRpYXJyYXmUjAZzY2FsYXKUk5SMBW51bXB5lIwFZHR5cGWUk5SMAmk4lImIh5RSlChLA4wBPJROTk5K/////0r/////SwB0lGJDCAQAAAAAAAAAlIaUUpSMBXN0YXJ0lGgIaA5DCAAAAAAAAAAAlIaUUpSMBl9zaGFwZZQpjAVkdHlwZZRoDowKX25wX3JhbmRvbZROdWIu", "n": "4", "start": "0", "_shape": [], "dtype": "int64", "_np_random": null}, "n_envs": 16, "n_steps": 1024, "gamma": 0.999, "gae_lambda": 0.98, "ent_coef": 0.01, "vf_coef": 0.5, "max_grad_norm": 0.5, "batch_size": 64, "n_epochs": 4, "clip_range": {":type:": "<class 'function'>", ":serialized:": "gAWV1gIAAAAAAACMF2Nsb3VkcGlja2xlLmNsb3VkcGlja2xllIwOX21ha2VfZnVuY3Rpb26Uk5QoaACMDV9idWlsdGluX3R5cGWUk5SMCENvZGVUeXBllIWUUpQoSwFLAEsASwFLAUsTQwiVAZcAiQFTAJROhZQpjAFflIWUjEkvdXNyL2xvY2FsL2xpYi9weXRob24zLjExL2Rpc3QtcGFja2FnZXMvc3RhYmxlX2Jhc2VsaW5lczMvY29tbW9uL3V0aWxzLnB5lIwEZnVuY5SMGWNvbnN0YW50X2ZuLjxsb2NhbHM+LmZ1bmOUS4RDCPiAANgPEogKlEMAlIwDdmFslIWUKXSUUpR9lCiMC19fcGFja2FnZV9flIwYc3RhYmxlX2Jhc2VsaW5lczMuY29tbW9ulIwIX19uYW1lX1+UjB5zdGFibGVfYmFzZWxpbmVzMy5jb21tb24udXRpbHOUjAhfX2ZpbGVfX5SMSS91c3IvbG9jYWwvbGliL3B5dGhvbjMuMTEvZGlzdC1wYWNrYWdlcy9zdGFibGVfYmFzZWxpbmVzMy9jb21tb24vdXRpbHMucHmUdU5OaACMEF9tYWtlX2VtcHR5X2NlbGyUk5QpUpSFlHSUUpRoAIwSX2Z1bmN0aW9uX3NldHN0YXRllJOUaCF9lH2UKGgYjARmdW5jlIwMX19xdWFsbmFtZV9flIwZY29uc3RhbnRfZm4uPGxvY2Fscz4uZnVuY5SMD19fYW5ub3RhdGlvbnNfX5R9lIwOX19rd2RlZmF1bHRzX1+UTowMX19kZWZhdWx0c19flE6MCl9fbW9kdWxlX1+UaBmMB19fZG9jX1+UTowLX19jbG9zdXJlX1+UaACMCl9tYWtlX2NlbGyUk5RHP8mZmZmZmZqFlFKUhZSMF19jbG91ZHBpY2tsZV9zdWJtb2R1bGVzlF2UjAtfX2dsb2JhbHNfX5R9lHWGlIZSMC4="}, "clip_range_vf": null, "normalize_advantage": true, "target_kl": null, "lr_schedule": {":type:": "<class 'function'>", ":serialized:": "gAWV1gIAAAAAAACMF2Nsb3VkcGlja2xlLmNsb3VkcGlja2xllIwOX21ha2VfZnVuY3Rpb26Uk5QoaACMDV9idWlsdGluX3R5cGWUk5SMCENvZGVUeXBllIWUUpQoSwFLAEsASwFLAUsTQwiVAZcAiQFTAJROhZQpjAFflIWUjEkvdXNyL2xvY2FsL2xpYi9weXRob24zLjExL2Rpc3QtcGFja2FnZXMvc3RhYmxlX2Jhc2VsaW5lczMvY29tbW9uL3V0aWxzLnB5lIwEZnVuY5SMGWNvbnN0YW50X2ZuLjxsb2NhbHM+LmZ1bmOUS4RDCPiAANgPEogKlEMAlIwDdmFslIWUKXSUUpR9lCiMC19fcGFja2FnZV9flIwYc3RhYmxlX2Jhc2VsaW5lczMuY29tbW9ulIwIX19uYW1lX1+UjB5zdGFibGVfYmFzZWxpbmVzMy5jb21tb24udXRpbHOUjAhfX2ZpbGVfX5SMSS91c3IvbG9jYWwvbGliL3B5dGhvbjMuMTEvZGlzdC1wYWNrYWdlcy9zdGFibGVfYmFzZWxpbmVzMy9jb21tb24vdXRpbHMucHmUdU5OaACMEF9tYWtlX2VtcHR5X2NlbGyUk5QpUpSFlHSUUpRoAIwSX2Z1bmN0aW9uX3NldHN0YXRllJOUaCF9lH2UKGgYjARmdW5jlIwMX19xdWFsbmFtZV9flIwZY29uc3RhbnRfZm4uPGxvY2Fscz4uZnVuY5SMD19fYW5ub3RhdGlvbnNfX5R9lIwOX19rd2RlZmF1bHRzX1+UTowMX19kZWZhdWx0c19flE6MCl9fbW9kdWxlX1+UaBmMB19fZG9jX1+UTowLX19jbG9zdXJlX1+UaACMCl9tYWtlX2NlbGyUk5RHPzOpKjBVMmGFlFKUhZSMF19jbG91ZHBpY2tsZV9zdWJtb2R1bGVzlF2UjAtfX2dsb2JhbHNfX5R9lHWGlIZSMC4="}, "system_info": {"OS": "Linux-6.1.123+-x86_64-with-glibc2.35 # 1 SMP PREEMPT_DYNAMIC Sun Mar 30 16:01:29 UTC 2025", "Python": "3.11.13", "Stable-Baselines3": "2.0.0a5", "PyTorch": "2.6.0+cu124", "GPU Enabled": "True", "Numpy": "2.0.2", "Cloudpickle": "3.1.1", "Gymnasium": "0.28.1", "OpenAI Gym": "0.25.2"}}
 
1
+ {"policy_class": {":type:": "<class 'abc.ABCMeta'>", ":serialized:": "gAWVOwAAAAAAAACMIXN0YWJsZV9iYXNlbGluZXMzLmNvbW1vbi5wb2xpY2llc5SMEUFjdG9yQ3JpdGljUG9saWN5lJOULg==", "__module__": "stable_baselines3.common.policies", "__doc__": "\n Policy class for actor-critic algorithms (has both policy and value prediction).\n Used by A2C, PPO and the likes.\n\n :param observation_space: Observation space\n :param action_space: Action space\n :param lr_schedule: Learning rate schedule (could be constant)\n :param net_arch: The specification of the policy and value networks.\n :param activation_fn: Activation function\n :param ortho_init: Whether to use or not orthogonal initialization\n :param use_sde: Whether to use State Dependent Exploration or not\n :param log_std_init: Initial value for the log standard deviation\n :param full_std: Whether to use (n_features x n_actions) parameters\n for the std instead of only (n_features,) when using gSDE\n :param use_expln: Use ``expln()`` function instead of ``exp()`` to ensure\n a positive standard deviation (cf paper). It allows to keep variance\n above zero and prevent it from growing too fast. In practice, ``exp()`` is usually enough.\n :param squash_output: Whether to squash the output using a tanh function,\n this allows to ensure boundaries when using gSDE.\n :param features_extractor_class: Features extractor to use.\n :param features_extractor_kwargs: Keyword arguments\n to pass to the features extractor.\n :param share_features_extractor: If True, the features extractor is shared between the policy and value networks.\n :param normalize_images: Whether to normalize images or not,\n dividing by 255.0 (True by default)\n :param optimizer_class: The optimizer to use,\n ``th.optim.Adam`` by default\n :param optimizer_kwargs: Additional keyword arguments,\n excluding the learning rate, to pass to the optimizer\n ", "__init__": "<function ActorCriticPolicy.__init__ at 0x7c12f7f46a20>", "_get_constructor_parameters": "<function ActorCriticPolicy._get_constructor_parameters at 0x7c12f7f46ac0>", "reset_noise": "<function ActorCriticPolicy.reset_noise at 0x7c12f7f46b60>", "_build_mlp_extractor": "<function ActorCriticPolicy._build_mlp_extractor at 0x7c12f7f46c00>", "_build": "<function ActorCriticPolicy._build at 0x7c12f7f46ca0>", "forward": "<function ActorCriticPolicy.forward at 0x7c12f7f46d40>", "extract_features": "<function ActorCriticPolicy.extract_features at 0x7c12f7f46de0>", "_get_action_dist_from_latent": "<function ActorCriticPolicy._get_action_dist_from_latent at 0x7c12f7f46e80>", "_predict": "<function ActorCriticPolicy._predict at 0x7c12f7f46f20>", "evaluate_actions": "<function ActorCriticPolicy.evaluate_actions at 0x7c12f7f46fc0>", "get_distribution": "<function ActorCriticPolicy.get_distribution at 0x7c12f7f47060>", "predict_values": "<function ActorCriticPolicy.predict_values at 0x7c12f7f47100>", "__abstractmethods__": "frozenset()", "_abc_impl": "<_abc._abc_data object at 0x7c12f80a2b40>"}, "verbose": 1, "policy_kwargs": {":type:": "<class 'dict'>", ":serialized:": "gAWVaQAAAAAAAAB9lCiMCG5ldF9hcmNolH2UKIwCcGmUXZQoTQACTQACZYwCdmaUXZQoTQACTQACZXWMDWFjdGl2YXRpb25fZm6UjBt0b3JjaC5ubi5tb2R1bGVzLmFjdGl2YXRpb26UjARUYW5olJOUdS4=", "net_arch": {"pi": [512, 512], "vf": [512, 512]}, "activation_fn": "<class 'torch.nn.modules.activation.Tanh'>"}, "num_timesteps": 1001472, "_total_timesteps": 1000000, "_num_timesteps_at_start": 0, "seed": null, "action_noise": null, "start_time": 1766810274384480236, "learning_rate": 0.00038779746460731866, "tensorboard_log": null, "_last_obs": {":type:": "<class 'numpy.ndarray'>", ":serialized:": "gAWVlgAAAAAAAACME251bXB5Ll9jb3JlLm51bWVyaWOUjAtfZnJvbWJ1ZmZlcpSTlCiWIAAAAAAAAACARj09EQXtPYg6lb7aa2C+PTCfvRVogr0AAAAAAAAAAJSMBW51bXB5lIwFZHR5cGWUk5SMAmY0lImIh5RSlChLA4wBPJROTk5K/////0r/////SwB0lGJLAUsIhpSMAUOUdJRSlC4="}, "_last_episode_starts": {":type:": "<class 'numpy.ndarray'>", ":serialized:": "gAWVdQAAAAAAAACME251bXB5Ll9jb3JlLm51bWVyaWOUjAtfZnJvbWJ1ZmZlcpSTlCiWAQAAAAAAAAAAlIwFbnVtcHmUjAVkdHlwZZSTlIwCYjGUiYiHlFKUKEsDjAF8lE5OTkr/////Sv////9LAHSUYksBhZSMAUOUdJRSlC4="}, "_last_original_obs": null, "_episode_num": 0, "use_sde": false, "sde_sample_freq": -1, "_current_progress_remaining": -0.0014719999999999178, "_stats_window_size": 100, "ep_info_buffer": {":type:": "<class 'collections.deque'>", ":serialized:": "gAWVCwwAAAAAAACMC2NvbGxlY3Rpb25zlIwFZGVxdWWUk5QpS2SGlFKUKH2UKIwBcpRHQG+N6RZEDySMAWyUS/qMAXSUR0CsTEXGff4zdX2UKGgGR0Bwclbs4T9LaAdNFAFoCEdArE1vGOuJUHV9lChoBkdAcdzAo5PuX2gHS9doCEdArFR82eg+QnV9lChoBkdAcopbwSamXWgHTREBaAhHQKxVOKVpsXV1fZQoaAZHQG2WuinHeadoB00AAWgIR0CsVfCUPhAGdX2UKGgGR0BynFMPBi1BaAdL1mgIR0CsVn6Wom5UdX2UKGgGR0Bvl+QGOdXlaAdNFgFoCEdArFdHNA1NxnV9lChoBkdAcp4ZeRgZ0mgHS9xoCEdArFfvm1YyPHV9lChoBkdAcdTf2K2rn2gHS+VoCEdArFihB/qgRXV9lChoBkdAcckXS0BwM2gHS99oCEdArFk2+IuXeHV9lChoBkdAcMSH9WIXTGgHS/hoCEdArGCFFBppOHV9lChoBkdAcVaflZHNHGgHTRYBaAhHQKxhaxB3Roh1fZQoaAZHQEu5YhdMTOBoB0voaAhHQKxicMfigkF1fZQoaAZHQHEkI0/GEPFoB00bAWgIR0CsY6IcBEKFdX2UKGgGR0BzJYDLbHp9aAdL22gIR0CsZIluFYdRdX2UKGgGR0BtxRHkLhJiaAdL/GgIR0CsZZfnW8RMdX2UKGgGR0BzkVE4NqgzaAdL8WgIR0CsZmZ0r9VFdX2UKGgGR0BxwqGQCCBgaAdNEAFoCEdArGcZJwsGxHV9lChoBkdAYSRle4TbnGgHTegDaAhHQKxxdFfAsTZ1fZQoaAZHQHHGEdzXBgxoB00cAWgIR0CsclTfJmuldX2UKGgGR0BxeIC1Z1V6aAdL5GgIR0Cscv6H9FWodX2UKGgGR0BzQKUdJaq0aAdL62gIR0Csc5vN3W4FdX2UKGgGR0Bh2CEg4ffXaAdN6ANoCEdArH6iaiKziXV9lChoBkdAcSQ8m8dxQ2gHS/hoCEdArH9/CVKPGXV9lChoBkdAcbJIaLn9vWgHTQUBaAhHQKyAS7T2FnJ1fZQoaAZHQHE9YE8q4H5oB00FAWgIR0CsgQ8n/kvLdX2UKGgGR0BxZOTpxFRYaAdL72gIR0Csgc1IZqEfdX2UKGgGR0BubGtITXaraAdL/GgIR0CsgqBdt2s8dX2UKGgGR0BwI5djXnQqaAdNBgFoCEdArIN//echDHV9lChoBkdAcdylvIfbK2gHS/NoCEdArIqysS00FnV9lChoBkdAcSeNZvDP4WgHS+hoCEdArItJ6lchT3V9lChoBkdAcHQCqZML4WgHTQEBaAhHQKyMC1sLv1F1fZQoaAZHQHJFOjdpItloB0vnaAhHQKyMtrqMWGh1fZQoaAZHQHCCCVrylN1oB0v/aAhHQKyNiYeDFqB1fZQoaAZHQG+vmj0th/loB00DAWgIR0CsjlGcOLBLdX2UKGgGR0BwO9I5HVgAaAdL+WgIR0CsjwWyTpxFdX2UKGgGR0BthaKaXrt3aAdNQwFoCEdArJAIl8gIQnV9lChoBkdAba0BpYcNpmgHS/FoCEdArJiZYgaFVXV9lChoBkdAcq3I+nqFAWgHTQABaAhHQKyZTT1kDp11fZQoaAZHQHNJgi/wiJRoB00rAWgIR0CsmjdCmdiEdX2UKGgGR0BwSRggHNX6aAdNDQFoCEdArJr8vf0mMXV9lChoBkdAcwKaA4GUwGgHS/NoCEdArJufmFJxvXV9lChoBkdAbS9rX18LKGgHTRQBaAhHQKyccVj7Q9l1fZQoaAZHQHJjjk6tDD1oB00CAWgIR0CsnSNAcDKYdX2UKGgGR0BxFX5gw482aAdL22gIR0CsncISL61tdX2UKGgGR0BwItjAi3XqaAdL8mgIR0CspP4+B6KMdX2UKGgGR0ByWIVrRBu5aAdNFwFoCEdArKXI4Otnw3V9lChoBkdAbhZw7T2FnWgHS/hoCEdArKaDI/7iynV9lChoBkdAcDARKpT/AGgHS+loCEdArKctDOTq0XV9lChoBkdAb9QgQHzH0mgHS/ZoCEdArKfVklNUO3V9lChoBkdAcCA/Z/Tb4GgHS/JoCEdArKiZA8jiXXV9lChoBkdAb5U26TW5H2gHS+5oCEdArKk7MxGlRHV9lChoBkdAcG67QLNOd2gHS+toCEdArKnljRUm2XV9lChoBkdAcV+ypJf6XWgHS/doCEdArLKs3bVSXXV9lChoBkdAcSY8wYcebWgHS+1oCEdArLNSH6/IsHV9lChoBkdATGx2ZAprlGgHS4VoCEdArLOrGWD6FnV9lChoBkdAcLFIE8q4IGgHS+doCEdArLRPJT2nKnV9lChoBkdAcZ6lNDc/MWgHS+poCEdArLTsnPVurXV9lChoBkdAcSQzImw7kmgHTU0BaAhHQKy18+IuXeF1fZQoaAZHQHD0QuuieupoB00CAWgIR0Cstqmh/RVqdX2UKGgGR0ByCKE9Mbm2aAdNEQFoCEdArLd32ZiNKnV9lChoBkdAb/Um8/UvwmgHTRgBaAhHQKy+0p9ZzPt1fZQoaAZHQG8UbFjurp9oB0v8aAhHQKy/h5pJwsJ1fZQoaAZHQG994wIt16poB0voaAhHQKzAMzImw7l1fZQoaAZHQHK7/H1e0HBoB00tAWgIR0CswQrK3d9EdX2UKGgGR0BwUne7+T/yaAdL2WgIR0CswZdG7SRbdX2UKGgGR0BzV8iUxEfDaAdNGAFoCEdArMJxvFWGRHV9lChoBkdAchtTFl05l2gHTSoBaAhHQKzDPyuIRAd1fZQoaAZHQHLlD/MnqmloB00YAWgIR0CsxAGRvFWGdX2UKGgGR0ByPKGzru6VaAdNCAFoCEdArMzM1hsqKHV9lChoBkdAbq8PvKEFn2gHS/FoCEdArM1oISlFdHV9lChoBkdAcgdMLF4s3GgHTT0BaAhHQKzOa1IAfdR1fZQoaAZHQHLoT3mFJxxoB00bAWgIR0Cszy3d0q6OdX2UKGgGR0BzAtilSCOFaAdNDAFoCEdArNABYT0xunV9lChoBkdAQgkO09hZyWgHS61oCEdArNCK8xsVL3V9lChoBkdAby5oL5RCQmgHS/xoCEdArNExu89Oh3V9lChoBkdAcZrOLR8c/GgHTQsBaAhHQKzR8EM9bHJ1fZQoaAZHQHBTIiosI3RoB0v/aAhHQKzZFzGPxQV1fZQoaAZHQG/kms3hn8NoB0v1aAhHQKzZyOrhisp1fZQoaAZHQHK5Ot4iX6ZoB0vZaAhHQKzaW2y9mHx1fZQoaAZHQHAh8Z1mrbRoB0vvaAhHQKzbEINVinZ1fZQoaAZHQHG/6ODJ2dNoB00JAWgIR0Cs283enAIqdX2UKGgGR0ByIXHfdhy9aAdL+GgIR0Cs3IC4BmwrdX2UKGgGR0Bw41PhybQUaAdL6mgIR0Cs3STfrKNidX2UKGgGR0BvfBT4tYjjaAdL9WgIR0Cs3fFFlTWHdX2UKGgGR0By0cLux8lYaAdNBgFoCEdArOa4X0oSc3V9lChoBkdAcFt2OhkAgmgHTQEBaAhHQKznZ4sVclh1fZQoaAZHQG6OCtzS1E5oB0vtaAhHQKzoCza9K291fZQoaAZHQG5wgZ88cMpoB0v1aAhHQKzos8DB/I91fZQoaAZHQHJqOtwJgLJoB00MAWgIR0Cs6WzfrKNidX2UKGgGR0BxMWt5le4TaAdL6mgIR0Cs6hPeYUnHdX2UKGgGR0BtJVbA1vVFaAdNBQFoCEdArOrGVE/jbXV9lChoBkdAcv3jJ+2E02gHS/BoCEdArOth9d/rjnV9lChoBkdAcQMF36hxpGgHS/JoCEdArOwSW7e2u3V9lChoBkdAcmlEbYK6WmgHTYgCaAhHQKz1hfgrH2h1fZQoaAZHQHD2wVoHs1NoB0vzaAhHQKz2P0OmR/51fZQoaAZHQHKS5B1LamJoB0v/aAhHQKz3HJxNqQB1fZQoaAZHQHEFjnaFmFtoB0v5aAhHQKz4HOWSlnB1fZQoaAZHQHAuP6O5rgxoB00DAWgIR0Cs+RUbLlmwdX2UKGgGR0BtoufVZs9CaAdNFQFoCEdArPo349HMEHVlLg=="}, "ep_success_buffer": {":type:": "<class 'collections.deque'>", ":serialized:": "gAWVIAAAAAAAAACMC2NvbGxlY3Rpb25zlIwFZGVxdWWUk5QpS2SGlFKULg=="}, "_n_updates": 6357, "observation_space": {":type:": "<class 'gymnasium.spaces.box.Box'>", ":serialized:": "gAWVdwIAAAAAAACMFGd5bW5hc2l1bS5zcGFjZXMuYm94lIwDQm94lJOUKYGUfZQojAVkdHlwZZSMBW51bXB5lIwFZHR5cGWUk5SMAmY0lImIh5RSlChLA4wBPJROTk5K/////0r/////SwB0lGKMDWJvdW5kZWRfYmVsb3eUjBNudW1weS5fY29yZS5udW1lcmljlIwLX2Zyb21idWZmZXKUk5QolggAAAAAAAAAAQEBAQEBAQGUaAiMAmIxlImIh5RSlChLA4wBfJROTk5K/////0r/////SwB0lGJLCIWUjAFDlHSUUpSMDWJvdW5kZWRfYWJvdmWUaBEolggAAAAAAAAAAQEBAQEBAQGUaBVLCIWUaBl0lFKUjAZfc2hhcGWUSwiFlIwDbG93lGgRKJYgAAAAAAAAAAAAtMIAALTCAACgwAAAoMDbD0nAAACgwAAAAIAAAACAlGgLSwiFlGgZdJRSlIwEaGlnaJRoESiWIAAAAAAAAAAAALRCAAC0QgAAoEAAAKBA2w9JQAAAoEAAAIA/AACAP5RoC0sIhZRoGXSUUpSMCGxvd19yZXBylIxbWy05MC4gICAgICAgIC05MC4gICAgICAgICAtNS4gICAgICAgICAtNS4gICAgICAgICAtMy4xNDE1OTI3ICAtNS4KICAtMC4gICAgICAgICAtMC4gICAgICAgXZSMCWhpZ2hfcmVwcpSMU1s5MC4gICAgICAgIDkwLiAgICAgICAgIDUuICAgICAgICAgNS4gICAgICAgICAzLjE0MTU5MjcgIDUuCiAgMS4gICAgICAgICAxLiAgICAgICBdlIwKX25wX3JhbmRvbZROdWIu", "dtype": "float32", "bounded_below": "[ True True True True True True True True]", "bounded_above": "[ True True True True True True True True]", "_shape": [8], "low": "[-90. -90. -5. -5. -3.1415927 -5.\n -0. -0. ]", "high": "[90. 90. 5. 5. 3.1415927 5.\n 1. 1. ]", "low_repr": "[-90. -90. -5. -5. -3.1415927 -5.\n -0. -0. ]", "high_repr": "[90. 90. 5. 5. 3.1415927 5.\n 1. 1. ]", "_np_random": null}, "action_space": {":type:": "<class 'gymnasium.spaces.discrete.Discrete'>", ":serialized:": "gAWV3AAAAAAAAACMGWd5bW5hc2l1bS5zcGFjZXMuZGlzY3JldGWUjAhEaXNjcmV0ZZSTlCmBlH2UKIwBbpSMFm51bXB5Ll9jb3JlLm11bHRpYXJyYXmUjAZzY2FsYXKUk5SMBW51bXB5lIwFZHR5cGWUk5SMAmk4lImIh5RSlChLA4wBPJROTk5K/////0r/////SwB0lGJDCAQAAAAAAAAAlIaUUpSMBXN0YXJ0lGgIaA5DCAAAAAAAAAAAlIaUUpSMBl9zaGFwZZQpjAVkdHlwZZRoDowKX25wX3JhbmRvbZROdWIu", "n": "4", "start": "0", "_shape": [], "dtype": "int64", "_np_random": null}, "n_envs": 1, "n_steps": 2048, "gamma": 0.9927390555180292, "gae_lambda": 0.9353501463066322, "ent_coef": 0.007068533587811773, "vf_coef": 0.5, "max_grad_norm": 0.5, "batch_size": 128, "n_epochs": 13, "clip_range": {":type:": "<class 'function'>", ":serialized:": "gAWV1gIAAAAAAACMF2Nsb3VkcGlja2xlLmNsb3VkcGlja2xllIwOX21ha2VfZnVuY3Rpb26Uk5QoaACMDV9idWlsdGluX3R5cGWUk5SMCENvZGVUeXBllIWUUpQoSwFLAEsASwFLAUsTQwiVAZcAiQFTAJROhZQpjAFflIWUjEkvdXNyL2xvY2FsL2xpYi9weXRob24zLjEyL2Rpc3QtcGFja2FnZXMvc3RhYmxlX2Jhc2VsaW5lczMvY29tbW9uL3V0aWxzLnB5lIwEZnVuY5SMGWNvbnN0YW50X2ZuLjxsb2NhbHM+LmZ1bmOUS4RDCPiAANgPEogKlEMAlIwDdmFslIWUKXSUUpR9lCiMC19fcGFja2FnZV9flIwYc3RhYmxlX2Jhc2VsaW5lczMuY29tbW9ulIwIX19uYW1lX1+UjB5zdGFibGVfYmFzZWxpbmVzMy5jb21tb24udXRpbHOUjAhfX2ZpbGVfX5SMSS91c3IvbG9jYWwvbGliL3B5dGhvbjMuMTIvZGlzdC1wYWNrYWdlcy9zdGFibGVfYmFzZWxpbmVzMy9jb21tb24vdXRpbHMucHmUdU5OaACMEF9tYWtlX2VtcHR5X2NlbGyUk5QpUpSFlHSUUpRoAIwSX2Z1bmN0aW9uX3NldHN0YXRllJOUaCF9lH2UKGgYjARmdW5jlIwMX19xdWFsbmFtZV9flIwZY29uc3RhbnRfZm4uPGxvY2Fscz4uZnVuY5SMD19fYW5ub3RhdGlvbnNfX5R9lIwOX19rd2RlZmF1bHRzX1+UTowMX19kZWZhdWx0c19flE6MCl9fbW9kdWxlX1+UaBmMB19fZG9jX1+UTowLX19jbG9zdXJlX1+UaACMCl9tYWtlX2NlbGyUk5RHP8l7FFTLZMCFlFKUhZSMF19jbG91ZHBpY2tsZV9zdWJtb2R1bGVzlF2UjAtfX2dsb2JhbHNfX5R9lHWGlIZSMC4="}, "clip_range_vf": null, "normalize_advantage": true, "target_kl": null, "lr_schedule": {":type:": "<class 'function'>", ":serialized:": "gAWV1gIAAAAAAACMF2Nsb3VkcGlja2xlLmNsb3VkcGlja2xllIwOX21ha2VfZnVuY3Rpb26Uk5QoaACMDV9idWlsdGluX3R5cGWUk5SMCENvZGVUeXBllIWUUpQoSwFLAEsASwFLAUsTQwiVAZcAiQFTAJROhZQpjAFflIWUjEkvdXNyL2xvY2FsL2xpYi9weXRob24zLjEyL2Rpc3QtcGFja2FnZXMvc3RhYmxlX2Jhc2VsaW5lczMvY29tbW9uL3V0aWxzLnB5lIwEZnVuY5SMGWNvbnN0YW50X2ZuLjxsb2NhbHM+LmZ1bmOUS4RDCPiAANgPEogKlEMAlIwDdmFslIWUKXSUUpR9lCiMC19fcGFja2FnZV9flIwYc3RhYmxlX2Jhc2VsaW5lczMuY29tbW9ulIwIX19uYW1lX1+UjB5zdGFibGVfYmFzZWxpbmVzMy5jb21tb24udXRpbHOUjAhfX2ZpbGVfX5SMSS91c3IvbG9jYWwvbGliL3B5dGhvbjMuMTIvZGlzdC1wYWNrYWdlcy9zdGFibGVfYmFzZWxpbmVzMy9jb21tb24vdXRpbHMucHmUdU5OaACMEF9tYWtlX2VtcHR5X2NlbGyUk5QpUpSFlHSUUpRoAIwSX2Z1bmN0aW9uX3NldHN0YXRllJOUaCF9lH2UKGgYjARmdW5jlIwMX19xdWFsbmFtZV9flIwZY29uc3RhbnRfZm4uPGxvY2Fscz4uZnVuY5SMD19fYW5ub3RhdGlvbnNfX5R9lIwOX19rd2RlZmF1bHRzX1+UTowMX19kZWZhdWx0c19flE6MCl9fbW9kdWxlX1+UaBmMB19fZG9jX1+UTowLX19jbG9zdXJlX1+UaACMCl9tYWtlX2NlbGyUk5RHPzlqKW2Oy+WFlFKUhZSMF19jbG91ZHBpY2tsZV9zdWJtb2R1bGVzlF2UjAtfX2dsb2JhbHNfX5R9lHWGlIZSMC4="}, "system_info": {"OS": "Linux-6.6.105+-x86_64-with-glibc2.35 # 1 SMP Thu Oct 2 10:42:05 UTC 2025", "Python": "3.12.12", "Stable-Baselines3": "2.0.0a5", "PyTorch": "2.9.0+cpu", "GPU Enabled": "False", "Numpy": "2.0.2", "Cloudpickle": "3.1.2", "Gymnasium": "0.28.1", "OpenAI Gym": "0.25.2"}}
ppo-LunarLander-v2-optimized.zip ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:210f614038c4cce5455a3b1dc76807d30dfed19c96c3643218c692cdbc84d2e5
3
+ size 6476219
ppo-LunarLander-v2-optimized/_stable_baselines3_version ADDED
@@ -0,0 +1 @@
 
 
1
+ 2.0.0a5
ppo-LunarLander-v2-optimized/data ADDED
@@ -0,0 +1,113 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "policy_class": {
3
+ ":type:": "<class 'abc.ABCMeta'>",
4
+ ":serialized:": "gAWVOwAAAAAAAACMIXN0YWJsZV9iYXNlbGluZXMzLmNvbW1vbi5wb2xpY2llc5SMEUFjdG9yQ3JpdGljUG9saWN5lJOULg==",
5
+ "__module__": "stable_baselines3.common.policies",
6
+ "__doc__": "\n Policy class for actor-critic algorithms (has both policy and value prediction).\n Used by A2C, PPO and the likes.\n\n :param observation_space: Observation space\n :param action_space: Action space\n :param lr_schedule: Learning rate schedule (could be constant)\n :param net_arch: The specification of the policy and value networks.\n :param activation_fn: Activation function\n :param ortho_init: Whether to use or not orthogonal initialization\n :param use_sde: Whether to use State Dependent Exploration or not\n :param log_std_init: Initial value for the log standard deviation\n :param full_std: Whether to use (n_features x n_actions) parameters\n for the std instead of only (n_features,) when using gSDE\n :param use_expln: Use ``expln()`` function instead of ``exp()`` to ensure\n a positive standard deviation (cf paper). It allows to keep variance\n above zero and prevent it from growing too fast. In practice, ``exp()`` is usually enough.\n :param squash_output: Whether to squash the output using a tanh function,\n this allows to ensure boundaries when using gSDE.\n :param features_extractor_class: Features extractor to use.\n :param features_extractor_kwargs: Keyword arguments\n to pass to the features extractor.\n :param share_features_extractor: If True, the features extractor is shared between the policy and value networks.\n :param normalize_images: Whether to normalize images or not,\n dividing by 255.0 (True by default)\n :param optimizer_class: The optimizer to use,\n ``th.optim.Adam`` by default\n :param optimizer_kwargs: Additional keyword arguments,\n excluding the learning rate, to pass to the optimizer\n ",
7
+ "__init__": "<function ActorCriticPolicy.__init__ at 0x7c12f7f46a20>",
8
+ "_get_constructor_parameters": "<function ActorCriticPolicy._get_constructor_parameters at 0x7c12f7f46ac0>",
9
+ "reset_noise": "<function ActorCriticPolicy.reset_noise at 0x7c12f7f46b60>",
10
+ "_build_mlp_extractor": "<function ActorCriticPolicy._build_mlp_extractor at 0x7c12f7f46c00>",
11
+ "_build": "<function ActorCriticPolicy._build at 0x7c12f7f46ca0>",
12
+ "forward": "<function ActorCriticPolicy.forward at 0x7c12f7f46d40>",
13
+ "extract_features": "<function ActorCriticPolicy.extract_features at 0x7c12f7f46de0>",
14
+ "_get_action_dist_from_latent": "<function ActorCriticPolicy._get_action_dist_from_latent at 0x7c12f7f46e80>",
15
+ "_predict": "<function ActorCriticPolicy._predict at 0x7c12f7f46f20>",
16
+ "evaluate_actions": "<function ActorCriticPolicy.evaluate_actions at 0x7c12f7f46fc0>",
17
+ "get_distribution": "<function ActorCriticPolicy.get_distribution at 0x7c12f7f47060>",
18
+ "predict_values": "<function ActorCriticPolicy.predict_values at 0x7c12f7f47100>",
19
+ "__abstractmethods__": "frozenset()",
20
+ "_abc_impl": "<_abc._abc_data object at 0x7c12f80a2b40>"
21
+ },
22
+ "verbose": 1,
23
+ "policy_kwargs": {
24
+ ":type:": "<class 'dict'>",
25
+ ":serialized:": "gAWVaQAAAAAAAAB9lCiMCG5ldF9hcmNolH2UKIwCcGmUXZQoTQACTQACZYwCdmaUXZQoTQACTQACZXWMDWFjdGl2YXRpb25fZm6UjBt0b3JjaC5ubi5tb2R1bGVzLmFjdGl2YXRpb26UjARUYW5olJOUdS4=",
26
+ "net_arch": {
27
+ "pi": [
28
+ 512,
29
+ 512
30
+ ],
31
+ "vf": [
32
+ 512,
33
+ 512
34
+ ]
35
+ },
36
+ "activation_fn": "<class 'torch.nn.modules.activation.Tanh'>"
37
+ },
38
+ "num_timesteps": 1001472,
39
+ "_total_timesteps": 1000000,
40
+ "_num_timesteps_at_start": 0,
41
+ "seed": null,
42
+ "action_noise": null,
43
+ "start_time": 1766810274384480236,
44
+ "learning_rate": 0.00038779746460731866,
45
+ "tensorboard_log": null,
46
+ "_last_obs": {
47
+ ":type:": "<class 'numpy.ndarray'>",
48
+ ":serialized:": "gAWVlgAAAAAAAACME251bXB5Ll9jb3JlLm51bWVyaWOUjAtfZnJvbWJ1ZmZlcpSTlCiWIAAAAAAAAACARj09EQXtPYg6lb7aa2C+PTCfvRVogr0AAAAAAAAAAJSMBW51bXB5lIwFZHR5cGWUk5SMAmY0lImIh5RSlChLA4wBPJROTk5K/////0r/////SwB0lGJLAUsIhpSMAUOUdJRSlC4="
49
+ },
50
+ "_last_episode_starts": {
51
+ ":type:": "<class 'numpy.ndarray'>",
52
+ ":serialized:": "gAWVdQAAAAAAAACME251bXB5Ll9jb3JlLm51bWVyaWOUjAtfZnJvbWJ1ZmZlcpSTlCiWAQAAAAAAAAAAlIwFbnVtcHmUjAVkdHlwZZSTlIwCYjGUiYiHlFKUKEsDjAF8lE5OTkr/////Sv////9LAHSUYksBhZSMAUOUdJRSlC4="
53
+ },
54
+ "_last_original_obs": null,
55
+ "_episode_num": 0,
56
+ "use_sde": false,
57
+ "sde_sample_freq": -1,
58
+ "_current_progress_remaining": -0.0014719999999999178,
59
+ "_stats_window_size": 100,
60
+ "ep_info_buffer": {
61
+ ":type:": "<class 'collections.deque'>",
62
+ ":serialized:": "gAWVCwwAAAAAAACMC2NvbGxlY3Rpb25zlIwFZGVxdWWUk5QpS2SGlFKUKH2UKIwBcpRHQG+N6RZEDySMAWyUS/qMAXSUR0CsTEXGff4zdX2UKGgGR0Bwclbs4T9LaAdNFAFoCEdArE1vGOuJUHV9lChoBkdAcdzAo5PuX2gHS9doCEdArFR82eg+QnV9lChoBkdAcopbwSamXWgHTREBaAhHQKxVOKVpsXV1fZQoaAZHQG2WuinHeadoB00AAWgIR0CsVfCUPhAGdX2UKGgGR0BynFMPBi1BaAdL1mgIR0CsVn6Wom5UdX2UKGgGR0Bvl+QGOdXlaAdNFgFoCEdArFdHNA1NxnV9lChoBkdAcp4ZeRgZ0mgHS9xoCEdArFfvm1YyPHV9lChoBkdAcdTf2K2rn2gHS+VoCEdArFihB/qgRXV9lChoBkdAcckXS0BwM2gHS99oCEdArFk2+IuXeHV9lChoBkdAcMSH9WIXTGgHS/hoCEdArGCFFBppOHV9lChoBkdAcVaflZHNHGgHTRYBaAhHQKxhaxB3Roh1fZQoaAZHQEu5YhdMTOBoB0voaAhHQKxicMfigkF1fZQoaAZHQHEkI0/GEPFoB00bAWgIR0CsY6IcBEKFdX2UKGgGR0BzJYDLbHp9aAdL22gIR0CsZIluFYdRdX2UKGgGR0BtxRHkLhJiaAdL/GgIR0CsZZfnW8RMdX2UKGgGR0BzkVE4NqgzaAdL8WgIR0CsZmZ0r9VFdX2UKGgGR0BxwqGQCCBgaAdNEAFoCEdArGcZJwsGxHV9lChoBkdAYSRle4TbnGgHTegDaAhHQKxxdFfAsTZ1fZQoaAZHQHHGEdzXBgxoB00cAWgIR0CsclTfJmuldX2UKGgGR0BxeIC1Z1V6aAdL5GgIR0Cscv6H9FWodX2UKGgGR0BzQKUdJaq0aAdL62gIR0Csc5vN3W4FdX2UKGgGR0Bh2CEg4ffXaAdN6ANoCEdArH6iaiKziXV9lChoBkdAcSQ8m8dxQ2gHS/hoCEdArH9/CVKPGXV9lChoBkdAcbJIaLn9vWgHTQUBaAhHQKyAS7T2FnJ1fZQoaAZHQHE9YE8q4H5oB00FAWgIR0CsgQ8n/kvLdX2UKGgGR0BxZOTpxFRYaAdL72gIR0Csgc1IZqEfdX2UKGgGR0BubGtITXaraAdL/GgIR0CsgqBdt2s8dX2UKGgGR0BwI5djXnQqaAdNBgFoCEdArIN//echDHV9lChoBkdAcdylvIfbK2gHS/NoCEdArIqysS00FnV9lChoBkdAcSeNZvDP4WgHS+hoCEdArItJ6lchT3V9lChoBkdAcHQCqZML4WgHTQEBaAhHQKyMC1sLv1F1fZQoaAZHQHJFOjdpItloB0vnaAhHQKyMtrqMWGh1fZQoaAZHQHCCCVrylN1oB0v/aAhHQKyNiYeDFqB1fZQoaAZHQG+vmj0th/loB00DAWgIR0CsjlGcOLBLdX2UKGgGR0BwO9I5HVgAaAdL+WgIR0CsjwWyTpxFdX2UKGgGR0BthaKaXrt3aAdNQwFoCEdArJAIl8gIQnV9lChoBkdAba0BpYcNpmgHS/FoCEdArJiZYgaFVXV9lChoBkdAcq3I+nqFAWgHTQABaAhHQKyZTT1kDp11fZQoaAZHQHNJgi/wiJRoB00rAWgIR0CsmjdCmdiEdX2UKGgGR0BwSRggHNX6aAdNDQFoCEdArJr8vf0mMXV9lChoBkdAcwKaA4GUwGgHS/NoCEdArJufmFJxvXV9lChoBkdAbS9rX18LKGgHTRQBaAhHQKyccVj7Q9l1fZQoaAZHQHJjjk6tDD1oB00CAWgIR0CsnSNAcDKYdX2UKGgGR0BxFX5gw482aAdL22gIR0CsncISL61tdX2UKGgGR0BwItjAi3XqaAdL8mgIR0CspP4+B6KMdX2UKGgGR0ByWIVrRBu5aAdNFwFoCEdArKXI4Otnw3V9lChoBkdAbhZw7T2FnWgHS/hoCEdArKaDI/7iynV9lChoBkdAcDARKpT/AGgHS+loCEdArKctDOTq0XV9lChoBkdAb9QgQHzH0mgHS/ZoCEdArKfVklNUO3V9lChoBkdAcCA/Z/Tb4GgHS/JoCEdArKiZA8jiXXV9lChoBkdAb5U26TW5H2gHS+5oCEdArKk7MxGlRHV9lChoBkdAcG67QLNOd2gHS+toCEdArKnljRUm2XV9lChoBkdAcV+ypJf6XWgHS/doCEdArLKs3bVSXXV9lChoBkdAcSY8wYcebWgHS+1oCEdArLNSH6/IsHV9lChoBkdATGx2ZAprlGgHS4VoCEdArLOrGWD6FnV9lChoBkdAcLFIE8q4IGgHS+doCEdArLRPJT2nKnV9lChoBkdAcZ6lNDc/MWgHS+poCEdArLTsnPVurXV9lChoBkdAcSQzImw7kmgHTU0BaAhHQKy18+IuXeF1fZQoaAZHQHD0QuuieupoB00CAWgIR0Cstqmh/RVqdX2UKGgGR0ByCKE9Mbm2aAdNEQFoCEdArLd32ZiNKnV9lChoBkdAb/Um8/UvwmgHTRgBaAhHQKy+0p9ZzPt1fZQoaAZHQG8UbFjurp9oB0v8aAhHQKy/h5pJwsJ1fZQoaAZHQG994wIt16poB0voaAhHQKzAMzImw7l1fZQoaAZHQHK7/H1e0HBoB00tAWgIR0CswQrK3d9EdX2UKGgGR0BwUne7+T/yaAdL2WgIR0CswZdG7SRbdX2UKGgGR0BzV8iUxEfDaAdNGAFoCEdArMJxvFWGRHV9lChoBkdAchtTFl05l2gHTSoBaAhHQKzDPyuIRAd1fZQoaAZHQHLlD/MnqmloB00YAWgIR0CsxAGRvFWGdX2UKGgGR0ByPKGzru6VaAdNCAFoCEdArMzM1hsqKHV9lChoBkdAbq8PvKEFn2gHS/FoCEdArM1oISlFdHV9lChoBkdAcgdMLF4s3GgHTT0BaAhHQKzOa1IAfdR1fZQoaAZHQHLoT3mFJxxoB00bAWgIR0Cszy3d0q6OdX2UKGgGR0BzAtilSCOFaAdNDAFoCEdArNABYT0xunV9lChoBkdAQgkO09hZyWgHS61oCEdArNCK8xsVL3V9lChoBkdAby5oL5RCQmgHS/xoCEdArNExu89Oh3V9lChoBkdAcZrOLR8c/GgHTQsBaAhHQKzR8EM9bHJ1fZQoaAZHQHBTIiosI3RoB0v/aAhHQKzZFzGPxQV1fZQoaAZHQG/kms3hn8NoB0v1aAhHQKzZyOrhisp1fZQoaAZHQHK5Ot4iX6ZoB0vZaAhHQKzaW2y9mHx1fZQoaAZHQHAh8Z1mrbRoB0vvaAhHQKzbEINVinZ1fZQoaAZHQHG/6ODJ2dNoB00JAWgIR0Cs283enAIqdX2UKGgGR0ByIXHfdhy9aAdL+GgIR0Cs3IC4BmwrdX2UKGgGR0Bw41PhybQUaAdL6mgIR0Cs3STfrKNidX2UKGgGR0BvfBT4tYjjaAdL9WgIR0Cs3fFFlTWHdX2UKGgGR0By0cLux8lYaAdNBgFoCEdArOa4X0oSc3V9lChoBkdAcFt2OhkAgmgHTQEBaAhHQKznZ4sVclh1fZQoaAZHQG6OCtzS1E5oB0vtaAhHQKzoCza9K291fZQoaAZHQG5wgZ88cMpoB0v1aAhHQKzos8DB/I91fZQoaAZHQHJqOtwJgLJoB00MAWgIR0Cs6WzfrKNidX2UKGgGR0BxMWt5le4TaAdL6mgIR0Cs6hPeYUnHdX2UKGgGR0BtJVbA1vVFaAdNBQFoCEdArOrGVE/jbXV9lChoBkdAcv3jJ+2E02gHS/BoCEdArOth9d/rjnV9lChoBkdAcQMF36hxpGgHS/JoCEdArOwSW7e2u3V9lChoBkdAcmlEbYK6WmgHTYgCaAhHQKz1hfgrH2h1fZQoaAZHQHD2wVoHs1NoB0vzaAhHQKz2P0OmR/51fZQoaAZHQHKS5B1LamJoB0v/aAhHQKz3HJxNqQB1fZQoaAZHQHEFjnaFmFtoB0v5aAhHQKz4HOWSlnB1fZQoaAZHQHAuP6O5rgxoB00DAWgIR0Cs+RUbLlmwdX2UKGgGR0BtoufVZs9CaAdNFQFoCEdArPo349HMEHVlLg=="
63
+ },
64
+ "ep_success_buffer": {
65
+ ":type:": "<class 'collections.deque'>",
66
+ ":serialized:": "gAWVIAAAAAAAAACMC2NvbGxlY3Rpb25zlIwFZGVxdWWUk5QpS2SGlFKULg=="
67
+ },
68
+ "_n_updates": 6357,
69
+ "observation_space": {
70
+ ":type:": "<class 'gymnasium.spaces.box.Box'>",
71
+ ":serialized:": "gAWVdwIAAAAAAACMFGd5bW5hc2l1bS5zcGFjZXMuYm94lIwDQm94lJOUKYGUfZQojAVkdHlwZZSMBW51bXB5lIwFZHR5cGWUk5SMAmY0lImIh5RSlChLA4wBPJROTk5K/////0r/////SwB0lGKMDWJvdW5kZWRfYmVsb3eUjBNudW1weS5fY29yZS5udW1lcmljlIwLX2Zyb21idWZmZXKUk5QolggAAAAAAAAAAQEBAQEBAQGUaAiMAmIxlImIh5RSlChLA4wBfJROTk5K/////0r/////SwB0lGJLCIWUjAFDlHSUUpSMDWJvdW5kZWRfYWJvdmWUaBEolggAAAAAAAAAAQEBAQEBAQGUaBVLCIWUaBl0lFKUjAZfc2hhcGWUSwiFlIwDbG93lGgRKJYgAAAAAAAAAAAAtMIAALTCAACgwAAAoMDbD0nAAACgwAAAAIAAAACAlGgLSwiFlGgZdJRSlIwEaGlnaJRoESiWIAAAAAAAAAAAALRCAAC0QgAAoEAAAKBA2w9JQAAAoEAAAIA/AACAP5RoC0sIhZRoGXSUUpSMCGxvd19yZXBylIxbWy05MC4gICAgICAgIC05MC4gICAgICAgICAtNS4gICAgICAgICAtNS4gICAgICAgICAtMy4xNDE1OTI3ICAtNS4KICAtMC4gICAgICAgICAtMC4gICAgICAgXZSMCWhpZ2hfcmVwcpSMU1s5MC4gICAgICAgIDkwLiAgICAgICAgIDUuICAgICAgICAgNS4gICAgICAgICAzLjE0MTU5MjcgIDUuCiAgMS4gICAgICAgICAxLiAgICAgICBdlIwKX25wX3JhbmRvbZROdWIu",
72
+ "dtype": "float32",
73
+ "bounded_below": "[ True True True True True True True True]",
74
+ "bounded_above": "[ True True True True True True True True]",
75
+ "_shape": [
76
+ 8
77
+ ],
78
+ "low": "[-90. -90. -5. -5. -3.1415927 -5.\n -0. -0. ]",
79
+ "high": "[90. 90. 5. 5. 3.1415927 5.\n 1. 1. ]",
80
+ "low_repr": "[-90. -90. -5. -5. -3.1415927 -5.\n -0. -0. ]",
81
+ "high_repr": "[90. 90. 5. 5. 3.1415927 5.\n 1. 1. ]",
82
+ "_np_random": null
83
+ },
84
+ "action_space": {
85
+ ":type:": "<class 'gymnasium.spaces.discrete.Discrete'>",
86
+ ":serialized:": "gAWV3AAAAAAAAACMGWd5bW5hc2l1bS5zcGFjZXMuZGlzY3JldGWUjAhEaXNjcmV0ZZSTlCmBlH2UKIwBbpSMFm51bXB5Ll9jb3JlLm11bHRpYXJyYXmUjAZzY2FsYXKUk5SMBW51bXB5lIwFZHR5cGWUk5SMAmk4lImIh5RSlChLA4wBPJROTk5K/////0r/////SwB0lGJDCAQAAAAAAAAAlIaUUpSMBXN0YXJ0lGgIaA5DCAAAAAAAAAAAlIaUUpSMBl9zaGFwZZQpjAVkdHlwZZRoDowKX25wX3JhbmRvbZROdWIu",
87
+ "n": "4",
88
+ "start": "0",
89
+ "_shape": [],
90
+ "dtype": "int64",
91
+ "_np_random": null
92
+ },
93
+ "n_envs": 1,
94
+ "n_steps": 2048,
95
+ "gamma": 0.9927390555180292,
96
+ "gae_lambda": 0.9353501463066322,
97
+ "ent_coef": 0.007068533587811773,
98
+ "vf_coef": 0.5,
99
+ "max_grad_norm": 0.5,
100
+ "batch_size": 128,
101
+ "n_epochs": 13,
102
+ "clip_range": {
103
+ ":type:": "<class 'function'>",
104
+ ":serialized:": "gAWV1gIAAAAAAACMF2Nsb3VkcGlja2xlLmNsb3VkcGlja2xllIwOX21ha2VfZnVuY3Rpb26Uk5QoaACMDV9idWlsdGluX3R5cGWUk5SMCENvZGVUeXBllIWUUpQoSwFLAEsASwFLAUsTQwiVAZcAiQFTAJROhZQpjAFflIWUjEkvdXNyL2xvY2FsL2xpYi9weXRob24zLjEyL2Rpc3QtcGFja2FnZXMvc3RhYmxlX2Jhc2VsaW5lczMvY29tbW9uL3V0aWxzLnB5lIwEZnVuY5SMGWNvbnN0YW50X2ZuLjxsb2NhbHM+LmZ1bmOUS4RDCPiAANgPEogKlEMAlIwDdmFslIWUKXSUUpR9lCiMC19fcGFja2FnZV9flIwYc3RhYmxlX2Jhc2VsaW5lczMuY29tbW9ulIwIX19uYW1lX1+UjB5zdGFibGVfYmFzZWxpbmVzMy5jb21tb24udXRpbHOUjAhfX2ZpbGVfX5SMSS91c3IvbG9jYWwvbGliL3B5dGhvbjMuMTIvZGlzdC1wYWNrYWdlcy9zdGFibGVfYmFzZWxpbmVzMy9jb21tb24vdXRpbHMucHmUdU5OaACMEF9tYWtlX2VtcHR5X2NlbGyUk5QpUpSFlHSUUpRoAIwSX2Z1bmN0aW9uX3NldHN0YXRllJOUaCF9lH2UKGgYjARmdW5jlIwMX19xdWFsbmFtZV9flIwZY29uc3RhbnRfZm4uPGxvY2Fscz4uZnVuY5SMD19fYW5ub3RhdGlvbnNfX5R9lIwOX19rd2RlZmF1bHRzX1+UTowMX19kZWZhdWx0c19flE6MCl9fbW9kdWxlX1+UaBmMB19fZG9jX1+UTowLX19jbG9zdXJlX1+UaACMCl9tYWtlX2NlbGyUk5RHP8l7FFTLZMCFlFKUhZSMF19jbG91ZHBpY2tsZV9zdWJtb2R1bGVzlF2UjAtfX2dsb2JhbHNfX5R9lHWGlIZSMC4="
105
+ },
106
+ "clip_range_vf": null,
107
+ "normalize_advantage": true,
108
+ "target_kl": null,
109
+ "lr_schedule": {
110
+ ":type:": "<class 'function'>",
111
+ ":serialized:": "gAWV1gIAAAAAAACMF2Nsb3VkcGlja2xlLmNsb3VkcGlja2xllIwOX21ha2VfZnVuY3Rpb26Uk5QoaACMDV9idWlsdGluX3R5cGWUk5SMCENvZGVUeXBllIWUUpQoSwFLAEsASwFLAUsTQwiVAZcAiQFTAJROhZQpjAFflIWUjEkvdXNyL2xvY2FsL2xpYi9weXRob24zLjEyL2Rpc3QtcGFja2FnZXMvc3RhYmxlX2Jhc2VsaW5lczMvY29tbW9uL3V0aWxzLnB5lIwEZnVuY5SMGWNvbnN0YW50X2ZuLjxsb2NhbHM+LmZ1bmOUS4RDCPiAANgPEogKlEMAlIwDdmFslIWUKXSUUpR9lCiMC19fcGFja2FnZV9flIwYc3RhYmxlX2Jhc2VsaW5lczMuY29tbW9ulIwIX19uYW1lX1+UjB5zdGFibGVfYmFzZWxpbmVzMy5jb21tb24udXRpbHOUjAhfX2ZpbGVfX5SMSS91c3IvbG9jYWwvbGliL3B5dGhvbjMuMTIvZGlzdC1wYWNrYWdlcy9zdGFibGVfYmFzZWxpbmVzMy9jb21tb24vdXRpbHMucHmUdU5OaACMEF9tYWtlX2VtcHR5X2NlbGyUk5QpUpSFlHSUUpRoAIwSX2Z1bmN0aW9uX3NldHN0YXRllJOUaCF9lH2UKGgYjARmdW5jlIwMX19xdWFsbmFtZV9flIwZY29uc3RhbnRfZm4uPGxvY2Fscz4uZnVuY5SMD19fYW5ub3RhdGlvbnNfX5R9lIwOX19rd2RlZmF1bHRzX1+UTowMX19kZWZhdWx0c19flE6MCl9fbW9kdWxlX1+UaBmMB19fZG9jX1+UTowLX19jbG9zdXJlX1+UaACMCl9tYWtlX2NlbGyUk5RHPzlqKW2Oy+WFlFKUhZSMF19jbG91ZHBpY2tsZV9zdWJtb2R1bGVzlF2UjAtfX2dsb2JhbHNfX5R9lHWGlIZSMC4="
112
+ }
113
+ }
ppo-LunarLander-v2-optimized/policy.optimizer.pth ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:af9983e46f579c24e8d3b35f5aee22cc60f3f313251b8e6613d60ee7d427e359
3
+ size 4306807
ppo-LunarLander-v2-optimized/policy.pth ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:507e2ddb1f29e173c519cb2df8edfea5aaa0299b52efb4455abf4a5130ad48af
3
+ size 2153215
ppo-LunarLander-v2-optimized/pytorch_variables.pth ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:07c7431cf6005e7d8f367d79e995f63e2f9b981a37e3437b795d058f9af4308b
3
+ size 1261
ppo-LunarLander-v2-optimized/system_info.txt ADDED
@@ -0,0 +1,9 @@
 
 
 
 
 
 
 
 
 
 
1
+ - OS: Linux-6.6.105+-x86_64-with-glibc2.35 # 1 SMP Thu Oct 2 10:42:05 UTC 2025
2
+ - Python: 3.12.12
3
+ - Stable-Baselines3: 2.0.0a5
4
+ - PyTorch: 2.9.0+cpu
5
+ - GPU Enabled: False
6
+ - Numpy: 2.0.2
7
+ - Cloudpickle: 3.1.2
8
+ - Gymnasium: 0.28.1
9
+ - OpenAI Gym: 0.25.2
replay.mp4 CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:aeda352f9b225c52b903c725da21467ff6abfa988135b989edff7115efe29c23
3
- size 168986
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:45fd6866972822761e64c2dacb63508e92cd3f96ae2f7537b483dc40b601fe70
3
+ size 162350
results.json CHANGED
@@ -1 +1 @@
1
- {"mean_reward": 258.0804094, "std_reward": 11.551674245215613, "is_deterministic": true, "n_eval_episodes": 10, "eval_datetime": "2025-07-04T00:16:09.789130"}
 
1
+ {"mean_reward": 279.7000609, "std_reward": 18.00438714305934, "is_deterministic": true, "n_eval_episodes": 10, "eval_datetime": "2025-12-27T05:42:33.748193"}