Bavantha11 commited on
Commit
523d856
·
verified ·
1 Parent(s): b5b2aed

Upload PPO LunarLander-v2 trained agent

Browse files
README.md CHANGED
@@ -16,7 +16,7 @@ model-index:
16
  type: LunarLander-v2
17
  metrics:
18
  - type: mean_reward
19
- value: 260.80 +/- 19.08
20
  name: mean_reward
21
  verified: false
22
  ---
 
16
  type: LunarLander-v2
17
  metrics:
18
  - type: mean_reward
19
+ value: 276.30 +/- 15.52
20
  name: mean_reward
21
  verified: false
22
  ---
config.json CHANGED
@@ -1 +1 @@
1
- {"policy_class": {":type:": "<class 'abc.ABCMeta'>", ":serialized:": "gAWVOwAAAAAAAACMIXN0YWJsZV9iYXNlbGluZXMzLmNvbW1vbi5wb2xpY2llc5SMEUFjdG9yQ3JpdGljUG9saWN5lJOULg==", "__module__": "stable_baselines3.common.policies", "__doc__": "\n Policy class for actor-critic algorithms (has both policy and value prediction).\n Used by A2C, PPO and the likes.\n\n :param observation_space: Observation space\n :param action_space: Action space\n :param lr_schedule: Learning rate schedule (could be constant)\n :param net_arch: The specification of the policy and value networks.\n :param activation_fn: Activation function\n :param ortho_init: Whether to use or not orthogonal initialization\n :param use_sde: Whether to use State Dependent Exploration or not\n :param log_std_init: Initial value for the log standard deviation\n :param full_std: Whether to use (n_features x n_actions) parameters\n for the std instead of only (n_features,) when using gSDE\n :param use_expln: Use ``expln()`` function instead of ``exp()`` to ensure\n a positive standard deviation (cf paper). It allows to keep variance\n above zero and prevent it from growing too fast. In practice, ``exp()`` is usually enough.\n :param squash_output: Whether to squash the output using a tanh function,\n this allows to ensure boundaries when using gSDE.\n :param features_extractor_class: Features extractor to use.\n :param features_extractor_kwargs: Keyword arguments\n to pass to the features extractor.\n :param share_features_extractor: If True, the features extractor is shared between the policy and value networks.\n :param normalize_images: Whether to normalize images or not,\n dividing by 255.0 (True by default)\n :param optimizer_class: The optimizer to use,\n ``th.optim.Adam`` by default\n :param optimizer_kwargs: Additional keyword arguments,\n excluding the learning rate, to pass to the optimizer\n ", "__init__": "<function ActorCriticPolicy.__init__ at 0x7ce06a3e2660>", "_get_constructor_parameters": "<function ActorCriticPolicy._get_constructor_parameters at 0x7ce06a3e2700>", "reset_noise": "<function ActorCriticPolicy.reset_noise at 0x7ce06a3e27a0>", "_build_mlp_extractor": "<function ActorCriticPolicy._build_mlp_extractor at 0x7ce06a3e2840>", "_build": "<function ActorCriticPolicy._build at 0x7ce06a3e28e0>", "forward": "<function ActorCriticPolicy.forward at 0x7ce06a3e2980>", "extract_features": "<function ActorCriticPolicy.extract_features at 0x7ce06a3e2a20>", "_get_action_dist_from_latent": "<function ActorCriticPolicy._get_action_dist_from_latent at 0x7ce06a3e2ac0>", "_predict": "<function ActorCriticPolicy._predict at 0x7ce06a3e2b60>", "evaluate_actions": "<function ActorCriticPolicy.evaluate_actions at 0x7ce06a3e2c00>", "get_distribution": "<function ActorCriticPolicy.get_distribution at 0x7ce06a3e2ca0>", "predict_values": "<function ActorCriticPolicy.predict_values at 0x7ce06a3e2d40>", "__abstractmethods__": "frozenset()", "_abc_impl": "<_abc._abc_data object at 0x7ce06a3665c0>"}, "verbose": 1, "policy_kwargs": {}, "num_timesteps": 1294336, "_total_timesteps": 2000000, "_num_timesteps_at_start": 0, "seed": null, "action_noise": null, "start_time": 1757508119235870233, "learning_rate": {":type:": "<class 'function'>", ":serialized:": "gAWVYgIAAAAAAACMF2Nsb3VkcGlja2xlLmNsb3VkcGlja2xllIwOX21ha2VfZnVuY3Rpb26Uk5QoaACMDV9idWlsdGluX3R5cGWUk5SMCENvZGVUeXBllIWUUpQoSwFLAEsASwFLAksTQw6VAZcAfACJAXoFAABTAJROhZQpjBJwcm9ncmVzc19yZW1haW5pbmeUhZSMIC90bXAvaXB5dGhvbi1pbnB1dC0zMzE3MjIzNjg4LnB5lIwIPGxhbWJkYT6UjCFsaW5lYXJfc2NoZWR1bGUuPGxvY2Fscz4uPGxhbWJkYT6USwRDC/iAANAmOLg90iZIlEMAlIwNaW5pdGlhbF92YWx1ZZSFlCl0lFKUfZQojAtfX3BhY2thZ2VfX5ROjAhfX25hbWVfX5SMCF9fbWFpbl9flHVOTmgAjBBfbWFrZV9lbXB0eV9jZWxslJOUKVKUhZR0lFKUaACMEl9mdW5jdGlvbl9zZXRzdGF0ZZSTlGgefZR9lChoF4wIPGxhbWJkYT6UjAxfX3F1YWxuYW1lX1+UjCFsaW5lYXJfc2NoZWR1bGUuPGxvY2Fscz4uPGxhbWJkYT6UjA9fX2Fubm90YXRpb25zX1+UfZSMDl9fa3dkZWZhdWx0c19flE6MDF9fZGVmYXVsdHNfX5ROjApfX21vZHVsZV9flGgYjAdfX2RvY19flE6MC19fY2xvc3VyZV9flGgAjApfbWFrZV9jZWxslJOURz8zqSowVTJhhZRSlIWUjBdfY2xvdWRwaWNrbGVfc3VibW9kdWxlc5RdlIwLX19nbG9iYWxzX1+UfZR1hpSGUjAu"}, "tensorboard_log": null, "_last_obs": {":type:": "<class 'numpy.ndarray'>", ":serialized:": "gAWVdgIAAAAAAACME251bXB5Ll9jb3JlLm51bWVyaWOUjAtfZnJvbWJ1ZmZlcpSTlCiWAAIAAAAAAACaJNO8GnTBP6znDb6leUg9WnMYPKNAMr0AAAAAAAAAAA0Llz0FPNq7TYyiu7oZzr2QSF29652vvgAAgD8AAIA/83CuPScEbz5GLFO+3s1VvtgHCL1W9Z69AAAAAAAAAAB6jzW+f9qjP87eF79CjtO+LmiKvv9dvL4AAAAAAAAAAJog6L0E/B4/KrWaParIqb7BoRC7MuuNPQAAAAAAAAAAM1eQPP38sT/w0ZE+Jedevjh8gLxTjMG7AAAAAAAAAABmI7u8oYIJP+vw1rsW4Ji+MFWCvNOOAD0AAAAAAAAAAM0yjzyFN8i7vpcrPKo9ljwv7BW9ooJ9PQAAgD8AAIA/k8oNPqlzArxrtqo8ao+ZPGzwYb3ySnw9AACAPwAAgD+aPQo8qp6PP4jksDwSe8i+2H4VPAU+Pj0AAAAAAAAAABoDQT1cJ2C6bmrItpFnITFfBpu7fWTpNQAAgD8AAIA/M7MYObrzhD/aOEQ98IDhvr0uTbu0/8q8AAAAAAAAAABmYTc9dn9dPXqg27wprnm+GNKfO53VAT0AAAAAAAAAANpDHz6dMmk+um+Hvq0Xbr7wumO9DhHHvQAAAAAAAAAAjWy/vf6K5T3TEw0+O050vg7ahD2u3aC9AAAAAAAAAAAzdSy9GCLBPzpGa74lsS49ZH3BPOXvS70AAAAAAAAAAJSMBW51bXB5lIwFZHR5cGWUk5SMAmY0lImIh5RSlChLA4wBPJROTk5K/////0r/////SwB0lGJLEEsIhpSMAUOUdJRSlC4="}, "_last_episode_starts": {":type:": "<class 'numpy.ndarray'>", ":serialized:": "gAWVhAAAAAAAAACME251bXB5Ll9jb3JlLm51bWVyaWOUjAtfZnJvbWJ1ZmZlcpSTlCiWEAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAlIwFbnVtcHmUjAVkdHlwZZSTlIwCYjGUiYiHlFKUKEsDjAF8lE5OTkr/////Sv////9LAHSUYksQhZSMAUOUdJRSlC4="}, "_last_original_obs": null, "_episode_num": 0, "use_sde": false, "sde_sample_freq": -1, "_current_progress_remaining": 0.35283200000000003, "_stats_window_size": 100, "ep_info_buffer": {":type:": "<class 'collections.deque'>", ":serialized:": "gAWVOAwAAAAAAACMC2NvbGxlY3Rpb25zlIwFZGVxdWWUk5QpS2SGlFKUKH2UKIwBcpRHQHEckWAPNFCMAWyUTTQBjAF0lEdAlTbPy08eS3V9lChoBkdAbpK4RVZLZmgHTTMBaAhHQJU3WXVsk6d1fZQoaAZHQHI0X9m6GxloB00cAWgIR0CVN4cT8HfNdX2UKGgGR0Bw0GGfwqiHaAdNAwFoCEdAlThGgnMMZ3V9lChoBkdAccq5mRNh3WgHTQYBaAhHQJU4zkdV/+d1fZQoaAZHQEREqBmPHT9oB0v3aAhHQJU5OzPa+N91fZQoaAZHQHE6Am/nGKhoB00pAWgIR0CVOYsq8UVSdX2UKGgGR0BwRwXN1QqJaAdNOQFoCEdAlTqC5/b0v3V9lChoBkdAcE8ckMTewmgHTQEBaAhHQJU6gUFjd591fZQoaAZHQHGtfrWy1NRoB00SAWgIR0CVOwXvphWpdX2UKGgGR0Bxb41dgOSXaAdNWAFoCEdAlTsbHyVfNXV9lChoBkdAck94Ju2qk2gHTQQBaAhHQJU7dmBe5Wl1fZQoaAZHQG95oBRyfcxoB00RAWgIR0CVPBf5k9U0dX2UKGgGR0Bvobnq3VkMaAdNDwFoCEdAlTyzVx0dR3V9lChoBkdAcF+pOvdM02gHTTcBaAhHQJU9lpVS4vx1fZQoaAZHQHDsfh/Aj6hoB00OAWgIR0CVPpfYjB2wdX2UKGgGR0BxlKGahHskaAdNGAFoCEdAlT+BdIGyHHV9lChoBkdAcFYAeq7yx2gHTRABaAhHQJVAiBz3h4t1fZQoaAZHQHEYHmmtQsRoB00GAWgIR0CVQJ8qFyq/dX2UKGgGR0Bt80384xUOaAdNEAFoCEdAlUE4ppeu3nV9lChoBkdAb6XTkQwsXmgHTTkBaAhHQJVBSpOvdM11fZQoaAZHQG/xTDwYtQNoB00WAWgIR0CVQkpKBd2QdX2UKGgGR0Bu42V1Oj7AaAdNMgFoCEdAlUMbxAjY7XV9lChoBkdAcPMy1NQCS2gHTRABaAhHQJVDJGoaUA11fZQoaAZHQHB7ALiMo+hoB00iAWgIR0CVQyzSkTHsdX2UKGgGR0BvS2d07r9maAdNNAFoCEdAlUOzrJKaonV9lChoBkdAb+dahYeT3mgHTQEBaAhHQJVD9V+7UXp1fZQoaAZHQHKoVKTSssBoB00jAWgIR0CVRDajvd/KdX2UKGgGR0Btwq4jKPn0aAdNKwFoCEdAlUXQVCXyAnV9lChoBkdAcRH6wt8NQWgHTQ0BaAhHQJVG7MQmNR51fZQoaAZHQFFIKaG5+YtoB0vZaAhHQJVHFbVz6rN1fZQoaAZHQHDInI6r/85oB00LAWgIR0CVR90OEug6dX2UKGgGR0BzZEnv2GqQaAdNOQFoCEdAlUkhq9GqgnV9lChoBkdAcMh3iaRZEGgHTS8BaAhHQJVJfNB4Uvh1fZQoaAZHQG/5V+AmReVoB0vzaAhHQJVJp7v5P/J1fZQoaAZHQGXT6qbSZ0FoB03oA2gIR0CVSn4wRGtqdX2UKGgGR0BtG6w6hg3MaAdNGAFoCEdAlUqlvybx3HV9lChoBkdAcP2R3NcGDGgHTcABaAhHQJVLDUZvUBp1fZQoaAZHQHIDBSUC7shoB00cAWgIR0CVS1rD63y7dX2UKGgGR0BxREkPczqKaAdNPAFoCEdAlUubLhaTwHV9lChoBkdAcJmDO1OTJWgHTSkBaAhHQJVL9AX2ugZ1fZQoaAZHQG9gt8eCCjFoB01rAWgIR0CVTBGO+7DmdX2UKGgGR0By4G+7Dl5oaAdNRwFoCEdAlUzl7+kxh3V9lChoBkdAcD0ApKBd2WgHTQkBaAhHQJVhz0I1LrZ1fZQoaAZHQEfgxoqTbFloB0vTaAhHQJViToicG1R1fZQoaAZHQHA0cejmCAdoB00xAWgIR0CVYsDPWxyGdX2UKGgGR0BxQMyXUpd9aAdNXQFoCEdAlWLd4mkWRHV9lChoBkdAcb4FlTWGy2gHTToBaAhHQJVj7Ah0Qsh1fZQoaAZHQG+5jghr30xoB00UAWgIR0CVZGv8IiTudX2UKGgGR0BxK7ObAk9maAdNIwFoCEdAlWUI/eLvTnV9lChoBkdAcRTD/2kBS2gHTQwBaAhHQJVlO7wrlNl1fZQoaAZHQG9Or56+nIhoB00TAWgIR0CVZgojOcDsdX2UKGgGR0BwUaunuRcNaAdNJgFoCEdAlWYlIy0rsnV9lChoBkdAcB7tY0VJtmgHTRgBaAhHQJVmgYl6Z6V1fZQoaAZHQGZDDM/yGztoB03oA2gIR0CVZrQ2dd3TdX2UKGgGR0BwomcbzbvgaAdNDAFoCEdAlWbuUY8+zXV9lChoBkdAcMd1qnFYMmgHTTwBaAhHQJVnuz8gpz91fZQoaAZHQHBV/6XSjQBoB01CAWgIR0CVaEA9mpVCdX2UKGgGR0BwViOYIBzWaAdNJAFoCEdAlWiIQFs54nV9lChoBkdAcLTGs3hn8WgHS/doCEdAlWmAWFev6nV9lChoBkdAcONmbsniN2gHTSkBaAhHQJVp8fxMFll1fZQoaAZHQHIZwTAWSEFoB0vpaAhHQJVqURkEs8R1fZQoaAZHQHAqaOgg5ipoB00rAWgIR0CVanxcE/0NdX2UKGgGR0BwIbW6K+BZaAdNIwFoCEdAlWrLt/nW8XV9lChoBkdAbyTohY/3WWgHS/ZoCEdAlWuqGDcuanV9lChoBkdAcorcpLEk0WgHS/9oCEdAlW0LEtNBW3V9lChoBkdAc2Z4ubqhUWgHTSsBaAhHQJVtcCtA9mp1fZQoaAZHQHBhXnU2DQJoB01YAWgIR0CVbfpcophGdX2UKGgGR0BykIHRkVesaAdNEgFoCEdAlW4HFo+OfnV9lChoBkdAbjXrvb48EGgHTUMBaAhHQJVu6gctGut1fZQoaAZHQHKIJsXSBshoB007AWgIR0CVb2RF7UobdX2UKGgGR0ByjhXko4MnaAdNRAFoCEdAlW/sAmzBynV9lChoBkdAcRhZ0Syt3mgHTRYBaAhHQJVwA0HhS+B1fZQoaAZHQHA6+TeO4oZoB001AWgIR0CVcFD+irT6dX2UKGgGR0BzSs0rK/21aAdNMQFoCEdAlXD+kDZDiXV9lChoBkdAcfFPbfxc3WgHTQoBaAhHQJVxYY64lQd1fZQoaAZHQHBtXogV45doB00hAWgIR0CVclVG0/nodX2UKGgGR0BzbKAPNFBqaAdNRwFoCEdAlXKO8TSLInV9lChoBkdAcZBkSmIj4mgHTTQBaAhHQJVzAT7EYO51fZQoaAZHQHBF/yf+S8toB00tAWgIR0CVcyYChew+dX2UKGgGR0BvgM1VHWjHaAdNGwFoCEdAlXOOii7Ci3V9lChoBkdAcdnKSxJNCmgHS/xoCEdAlXRGKVII4XV9lChoBkdAcQM9C/oJRmgHTQUBaAhHQJV1Cr/82rJ1fZQoaAZHQHBitYwIt19oB00sAWgIR0CVdT5GjKxLdX2UKGgGR0BvyyfHxSYPaAdNGAFoCEdAlXWCgPEsKHV9lChoBkdAcOY1ZkkKNWgHTQYBaAhHQJV2U7/4qPR1fZQoaAZHQHAci3b212JoB0v4aAhHQJV2bHCGetl1fZQoaAZHQHCq8X7+DOFoB00bAWgIR0CVdnNh3JPqdX2UKGgGR0Bxtv5gw482aAdL9mgIR0CVd2N6gM+edX2UKGgGR0BwTnoHLRrraAdNLwFoCEdAlXfsU/OdG3V9lChoBkdATzwAS39aU2gHS9VoCEdAlXfozWPLgXV9lChoBkdAb6f2h7E5yWgHTTUBaAhHQJV4V6cAiml1fZQoaAZHQG/VRZuAI6doB00yAWgIR0CVeUtxdY4idX2UKGgGR0Bw5ug6EJ0GaAdNGAFoCEdAlXnHz6JqI3V9lChoBkdAb2pctXgccWgHTQ0BaAhHQJV6dF1B+nZ1fZQoaAZHQHMyByn1nNBoB001AWgIR0CVewWJ79hrdX2UKGgGR0BwqV7/n4fwaAdNTQFoCEdAlXvuMyad+XV9lChoBkdAcRDK3/givGgHTQ8BaAhHQJV8N2hZha11fZQoaAZHQHKClAVwgkloB00HAWgIR0CVfDEXcgyNdX2UKGgGR0BwrmgrYoRaaAdNNgFoCEdAlXx/5DZ13nVlLg=="}, "ep_success_buffer": {":type:": "<class 'collections.deque'>", ":serialized:": "gAWVIAAAAAAAAACMC2NvbGxlY3Rpb25zlIwFZGVxdWWUk5QpS2SGlFKULg=="}, "_n_updates": 561, "observation_space": {":type:": "<class 'gymnasium.spaces.box.Box'>", ":serialized:": "gAWVdwIAAAAAAACMFGd5bW5hc2l1bS5zcGFjZXMuYm94lIwDQm94lJOUKYGUfZQojAVkdHlwZZSMBW51bXB5lIwFZHR5cGWUk5SMAmY0lImIh5RSlChLA4wBPJROTk5K/////0r/////SwB0lGKMDWJvdW5kZWRfYmVsb3eUjBNudW1weS5fY29yZS5udW1lcmljlIwLX2Zyb21idWZmZXKUk5QolggAAAAAAAAAAQEBAQEBAQGUaAiMAmIxlImIh5RSlChLA4wBfJROTk5K/////0r/////SwB0lGJLCIWUjAFDlHSUUpSMDWJvdW5kZWRfYWJvdmWUaBEolggAAAAAAAAAAQEBAQEBAQGUaBVLCIWUaBl0lFKUjAZfc2hhcGWUSwiFlIwDbG93lGgRKJYgAAAAAAAAAAAAtMIAALTCAACgwAAAoMDbD0nAAACgwAAAAIAAAACAlGgLSwiFlGgZdJRSlIwEaGlnaJRoESiWIAAAAAAAAAAAALRCAAC0QgAAoEAAAKBA2w9JQAAAoEAAAIA/AACAP5RoC0sIhZRoGXSUUpSMCGxvd19yZXBylIxbWy05MC4gICAgICAgIC05MC4gICAgICAgICAtNS4gICAgICAgICAtNS4gICAgICAgICAtMy4xNDE1OTI3ICAtNS4KICAtMC4gICAgICAgICAtMC4gICAgICAgXZSMCWhpZ2hfcmVwcpSMU1s5MC4gICAgICAgIDkwLiAgICAgICAgIDUuICAgICAgICAgNS4gICAgICAgICAzLjE0MTU5MjcgIDUuCiAgMS4gICAgICAgICAxLiAgICAgICBdlIwKX25wX3JhbmRvbZROdWIu", "dtype": "float32", "bounded_below": "[ True True True True True True True True]", "bounded_above": "[ True True True True True True True True]", "_shape": [8], "low": "[-90. -90. -5. -5. -3.1415927 -5.\n -0. -0. ]", "high": "[90. 90. 5. 5. 3.1415927 5.\n 1. 1. ]", "low_repr": "[-90. -90. -5. -5. -3.1415927 -5.\n -0. -0. ]", "high_repr": "[90. 90. 5. 5. 3.1415927 5.\n 1. 1. ]", "_np_random": null}, "action_space": {":type:": "<class 'gymnasium.spaces.discrete.Discrete'>", ":serialized:": "gAWV/gAAAAAAAACMGWd5bW5hc2l1bS5zcGFjZXMuZGlzY3JldGWUjAhEaXNjcmV0ZZSTlCmBlH2UKIwBbpSMFm51bXB5Ll9jb3JlLm11bHRpYXJyYXmUjAZzY2FsYXKUk5SMBW51bXB5lIwFZHR5cGWUk5SMAmk4lImIh5RSlChLA4wBPJROTk5K/////0r/////SwB0lGJDCAQAAAAAAAAAlIaUUpSMBXN0YXJ0lGgIaA5DCAAAAAAAAAAAlIaUUpSMBl9zaGFwZZQpjAVkdHlwZZRoC4wCaTiUiYiHlFKUKEsDaA9OTk5K/////0r/////SwB0lGKMCl9ucF9yYW5kb22UTnViLg==", "n": "4", "start": "0", "_shape": [], "dtype": "int64", "_np_random": null}, "n_envs": 16, "n_steps": 1024, "gamma": 0.999, "gae_lambda": 0.98, "ent_coef": 0.01, "vf_coef": 0.5, "max_grad_norm": 0.5, "batch_size": 64, "n_epochs": 4, "clip_range": {":type:": "<class 'function'>", ":serialized:": "gAWV1gIAAAAAAACMF2Nsb3VkcGlja2xlLmNsb3VkcGlja2xllIwOX21ha2VfZnVuY3Rpb26Uk5QoaACMDV9idWlsdGluX3R5cGWUk5SMCENvZGVUeXBllIWUUpQoSwFLAEsASwFLAUsTQwiVAZcAiQFTAJROhZQpjAFflIWUjEkvdXNyL2xvY2FsL2xpYi9weXRob24zLjEyL2Rpc3QtcGFja2FnZXMvc3RhYmxlX2Jhc2VsaW5lczMvY29tbW9uL3V0aWxzLnB5lIwEZnVuY5SMGWNvbnN0YW50X2ZuLjxsb2NhbHM+LmZ1bmOUS4RDCPiAANgPEogKlEMAlIwDdmFslIWUKXSUUpR9lCiMC19fcGFja2FnZV9flIwYc3RhYmxlX2Jhc2VsaW5lczMuY29tbW9ulIwIX19uYW1lX1+UjB5zdGFibGVfYmFzZWxpbmVzMy5jb21tb24udXRpbHOUjAhfX2ZpbGVfX5SMSS91c3IvbG9jYWwvbGliL3B5dGhvbjMuMTIvZGlzdC1wYWNrYWdlcy9zdGFibGVfYmFzZWxpbmVzMy9jb21tb24vdXRpbHMucHmUdU5OaACMEF9tYWtlX2VtcHR5X2NlbGyUk5QpUpSFlHSUUpRoAIwSX2Z1bmN0aW9uX3NldHN0YXRllJOUaCF9lH2UKGgYjARmdW5jlIwMX19xdWFsbmFtZV9flIwZY29uc3RhbnRfZm4uPGxvY2Fscz4uZnVuY5SMD19fYW5ub3RhdGlvbnNfX5R9lIwOX19rd2RlZmF1bHRzX1+UTowMX19kZWZhdWx0c19flE6MCl9fbW9kdWxlX1+UaBmMB19fZG9jX1+UTowLX19jbG9zdXJlX1+UaACMCl9tYWtlX2NlbGyUk5RHP8mZmZmZmZqFlFKUhZSMF19jbG91ZHBpY2tsZV9zdWJtb2R1bGVzlF2UjAtfX2dsb2JhbHNfX5R9lHWGlIZSMC4="}, "clip_range_vf": null, "normalize_advantage": true, "target_kl": null, "lr_schedule": {":type:": "<class 'function'>", ":serialized:": "gAWV1gIAAAAAAACMF2Nsb3VkcGlja2xlLmNsb3VkcGlja2xllIwOX21ha2VfZnVuY3Rpb26Uk5QoaACMDV9idWlsdGluX3R5cGWUk5SMCENvZGVUeXBllIWUUpQoSwFLAEsASwFLAUsTQwiVAZcAiQFTAJROhZQpjAFflIWUjEkvdXNyL2xvY2FsL2xpYi9weXRob24zLjEyL2Rpc3QtcGFja2FnZXMvc3RhYmxlX2Jhc2VsaW5lczMvY29tbW9uL3V0aWxzLnB5lIwEZnVuY5SMGWNvbnN0YW50X2ZuLjxsb2NhbHM+LmZ1bmOUS4RDCPiAANgPEogKlEMAlIwDdmFslIWUKXSUUpR9lCiMC19fcGFja2FnZV9flIwYc3RhYmxlX2Jhc2VsaW5lczMuY29tbW9ulIwIX19uYW1lX1+UjB5zdGFibGVfYmFzZWxpbmVzMy5jb21tb24udXRpbHOUjAhfX2ZpbGVfX5SMSS91c3IvbG9jYWwvbGliL3B5dGhvbjMuMTIvZGlzdC1wYWNrYWdlcy9zdGFibGVfYmFzZWxpbmVzMy9jb21tb24vdXRpbHMucHmUdU5OaACMEF9tYWtlX2VtcHR5X2NlbGyUk5QpUpSFlHSUUpRoAIwSX2Z1bmN0aW9uX3NldHN0YXRllJOUaCF9lH2UKGgYjARmdW5jlIwMX19xdWFsbmFtZV9flIwZY29uc3RhbnRfZm4uPGxvY2Fscz4uZnVuY5SMD19fYW5ub3RhdGlvbnNfX5R9lIwOX19rd2RlZmF1bHRzX1+UTowMX19kZWZhdWx0c19flE6MCl9fbW9kdWxlX1+UaBmMB19fZG9jX1+UTowLX19jbG9zdXJlX1+UaACMCl9tYWtlX2NlbGyUk5RHPxo24uscQy2FlFKUhZSMF19jbG91ZHBpY2tsZV9zdWJtb2R1bGVzlF2UjAtfX2dsb2JhbHNfX5R9lHWGlIZSMC4="}, "system_info": {"OS": "Linux-6.1.123+-x86_64-with-glibc2.35 # 1 SMP PREEMPT_DYNAMIC Sun Mar 30 16:01:29 UTC 2025", "Python": "3.12.11", "Stable-Baselines3": "2.0.0a5", "PyTorch": "2.8.0+cu126", "GPU Enabled": "True", "Numpy": "2.0.2", "Cloudpickle": "3.1.1", "Gymnasium": "0.28.1", "OpenAI Gym": "0.25.2"}}
 
1
+ {"policy_class": {":type:": "<class 'abc.ABCMeta'>", ":serialized:": "gAWVOwAAAAAAAACMIXN0YWJsZV9iYXNlbGluZXMzLmNvbW1vbi5wb2xpY2llc5SMEUFjdG9yQ3JpdGljUG9saWN5lJOULg==", "__module__": "stable_baselines3.common.policies", "__doc__": "\n Policy class for actor-critic algorithms (has both policy and value prediction).\n Used by A2C, PPO and the likes.\n\n :param observation_space: Observation space\n :param action_space: Action space\n :param lr_schedule: Learning rate schedule (could be constant)\n :param net_arch: The specification of the policy and value networks.\n :param activation_fn: Activation function\n :param ortho_init: Whether to use or not orthogonal initialization\n :param use_sde: Whether to use State Dependent Exploration or not\n :param log_std_init: Initial value for the log standard deviation\n :param full_std: Whether to use (n_features x n_actions) parameters\n for the std instead of only (n_features,) when using gSDE\n :param use_expln: Use ``expln()`` function instead of ``exp()`` to ensure\n a positive standard deviation (cf paper). It allows to keep variance\n above zero and prevent it from growing too fast. In practice, ``exp()`` is usually enough.\n :param squash_output: Whether to squash the output using a tanh function,\n this allows to ensure boundaries when using gSDE.\n :param features_extractor_class: Features extractor to use.\n :param features_extractor_kwargs: Keyword arguments\n to pass to the features extractor.\n :param share_features_extractor: If True, the features extractor is shared between the policy and value networks.\n :param normalize_images: Whether to normalize images or not,\n dividing by 255.0 (True by default)\n :param optimizer_class: The optimizer to use,\n ``th.optim.Adam`` by default\n :param optimizer_kwargs: Additional keyword arguments,\n excluding the learning rate, to pass to the optimizer\n ", "__init__": "<function ActorCriticPolicy.__init__ at 0x7f9b1752caf0>", "_get_constructor_parameters": "<function ActorCriticPolicy._get_constructor_parameters at 0x7f9b1752cb80>", "reset_noise": "<function ActorCriticPolicy.reset_noise at 0x7f9b1752cc10>", "_build_mlp_extractor": "<function ActorCriticPolicy._build_mlp_extractor at 0x7f9b1752cca0>", "_build": "<function ActorCriticPolicy._build at 0x7f9b1752cd30>", "forward": "<function ActorCriticPolicy.forward at 0x7f9b1752cdc0>", "extract_features": "<function ActorCriticPolicy.extract_features at 0x7f9b1752ce50>", "_get_action_dist_from_latent": "<function ActorCriticPolicy._get_action_dist_from_latent at 0x7f9b1752cee0>", "_predict": "<function ActorCriticPolicy._predict at 0x7f9b1752cf70>", "evaluate_actions": "<function ActorCriticPolicy.evaluate_actions at 0x7f9b1752d000>", "get_distribution": "<function ActorCriticPolicy.get_distribution at 0x7f9b1752d090>", "predict_values": "<function ActorCriticPolicy.predict_values at 0x7f9b1752d120>", "__abstractmethods__": "frozenset()", "_abc_impl": "<_abc._abc_data object at 0x7f9b17529440>"}, "verbose": 1, "policy_kwargs": {}, "num_timesteps": 1212416, "_total_timesteps": 2000000, "_num_timesteps_at_start": 0, "seed": null, "action_noise": null, "start_time": 1758012501621178721, "learning_rate": {":type:": "<class 'function'>", ":serialized:": "gAWVMAIAAAAAAACMF2Nsb3VkcGlja2xlLmNsb3VkcGlja2xllIwOX21ha2VfZnVuY3Rpb26Uk5QoaACMDV9idWlsdGluX3R5cGWUk5SMCENvZGVUeXBllIWUUpQoSwFLAEsASwFLAksTQwh8AIgAFABTAJROhZQpjBJwcm9ncmVzc19yZW1haW5pbmeUhZSMJC90bXAvaXB5a2VybmVsXzE0NjExOTQvMzMxNzIyMzY4OC5weZSMCDxsYW1iZGE+lEsEQwIIAJSMDWluaXRpYWxfdmFsdWWUhZQpdJRSlH2UKIwLX19wYWNrYWdlX1+UTowIX19uYW1lX1+UjAhfX21haW5fX5R1Tk5oAIwQX21ha2VfZW1wdHlfY2VsbJSTlClSlIWUdJRSlGgAjBJfZnVuY3Rpb25fc2V0c3RhdGWUk5RoHH2UfZQoaBWMCDxsYW1iZGE+lIwMX19xdWFsbmFtZV9flIwhbGluZWFyX3NjaGVkdWxlLjxsb2NhbHM+LjxsYW1iZGE+lIwPX19hbm5vdGF0aW9uc19flH2UjA5fX2t3ZGVmYXVsdHNfX5ROjAxfX2RlZmF1bHRzX1+UTowKX19tb2R1bGVfX5RoFowHX19kb2NfX5ROjAtfX2Nsb3N1cmVfX5RoAIwKX21ha2VfY2VsbJSTlEc/M6kqMFUyYYWUUpSFlIwXX2Nsb3VkcGlja2xlX3N1Ym1vZHVsZXOUXZSMC19fZ2xvYmFsc19flH2UdYaUhlIwLg=="}, "tensorboard_log": null, "_last_obs": {":type:": "<class 'numpy.ndarray'>", ":serialized:": "gAWVdgIAAAAAAACME251bXB5Ll9jb3JlLm51bWVyaWOUjAtfZnJvbWJ1ZmZlcpSTlCiWAAIAAAAAAADNFGC8CuNgu4+FjTu0QoI81vmMvGvNYD0AAIA/AACAP7P3H73h8J+6bPEcPG4SFz2uYlm7yaiNtwAAgD8AAIA/wGmTPVK15buVfoW7EkRnPASjQT391kS9AACAPwAAgD8AXZU8yIC3P1LPuT6AJBg+I22OvPLoRL0AAAAAAAAAAI0ugT243aS7Opz3OGVrej3E9vu82nv9OwAAgD8AAIA/mhnIPD2iA7vDcGO6n5w3PM7eOTxpDiO9AACAPwAAgD/N9So9EgihPNTRxrx3zni+Y1lwPWsDFb0AAAAAAAAAAIDVRz1+Xqg+Lau2PEWtq77Hbdm8zok/PQAAAAAAAAAAYOAVPo8VxD4tjAi+dV6LviLGyzyCQmC9AAAAAAAAAACa+rQ9EdXjPfmxQ7zGzpO+se2KPZW4Zj0AAAAAAAAAAM29aT0pSDi6Q15NNt6bZjF409m6EvJ8tQAAgD8AAIA/2gCfPfYENbr8Gws6Rir0NEreTzqj+CS5AACAPwAAAAAm1rc9YFN9P+3kQT5ltvW+qelfPUB3oD0AAAAAAAAAACBqUT4B2Q4/DmuAPAKX974h+2E+oa7DvQAAAAAAAAAAgMfLPYcjRz6IA++9JX6nvnaNlryR5qS9AAAAAAAAAABmR2U94J66P3PVoj4D5Li9V7OOuy6iJz0AAAAAAAAAAJSMBW51bXB5lIwFZHR5cGWUk5SMAmY0lImIh5RSlChLA4wBPJROTk5K/////0r/////SwB0lGJLEEsIhpSMAUOUdJRSlC4="}, "_last_episode_starts": {":type:": "<class 'numpy.ndarray'>", ":serialized:": "gAWVhAAAAAAAAACME251bXB5Ll9jb3JlLm51bWVyaWOUjAtfZnJvbWJ1ZmZlcpSTlCiWEAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAlIwFbnVtcHmUjAVkdHlwZZSTlIwCYjGUiYiHlFKUKEsDjAF8lE5OTkr/////Sv////9LAHSUYksQhZSMAUOUdJRSlC4="}, "_last_original_obs": null, "_episode_num": 0, "use_sde": false, "sde_sample_freq": -1, "_current_progress_remaining": 0.39379200000000003, "_stats_window_size": 100, "ep_info_buffer": {":type:": "<class 'collections.deque'>", ":serialized:": "gAWV+AsAAAAAAACMC2NvbGxlY3Rpb25zlIwFZGVxdWWUk5QpS2SGlFKUKH2UKIwBcpRHQHJU/5ULlV+MAWyUTQEBjAF0lEdAkbD51ie/YnV9lChoBkdAb37OdoWYW2gHS+NoCEdAkbGmCuloDnV9lChoBkdAc5YBAv+OwWgHTRgBaAhHQJGx0YR/ViF1fZQoaAZHQHHffZdv865oB0vmaAhHQJGyBfWtlqd1fZQoaAZHQHJD/dEb5uZoB00OAWgIR0CRsiSsKb8WdX2UKGgGR0Bwc3p0OmSAaAdNjgJoCEdAkbKOS0Sh8XV9lChoBkdAclAlbeMyamgHS/RoCEdAkbLYC+10DHV9lChoBkdAcpI9S/CZW2gHS89oCEdAkbNiEYfnwHV9lChoBkdAcvYMLncL0GgHS/NoCEdAkbQ+GO+7DnV9lChoBkdAclRdH2AXmGgHS9doCEdAkbSaRQrMDHV9lChoBkdAb/DDn/1g6WgHS9loCEdAkbUSHEdeY3V9lChoBkdAcXqksSTQmmgHS+FoCEdAkbVlY6nzhHV9lChoBkdAc3pfu1F6RmgHS8RoCEdAkbWvqHGjsXV9lChoBkdAUYYkMTewcGgHS7poCEdAkbW8OoYNzHV9lChoBkdAcRCnJT2nKmgHTQEBaAhHQJG2czN2TxJ1fZQoaAZHQHPxI/7iyY5oB0vJaAhHQJG2+lpGnXN1fZQoaAZHQHGQEL2HtWxoB0veaAhHQJG3Ls0HhS91fZQoaAZHQHBnigwoLG9oB0vtaAhHQJG4ArhBJI11fZQoaAZHQG7qkjgQ6IZoB0vcaAhHQJG4BObiIcl1fZQoaAZHQHLGryYoiLVoB00CAWgIR0CRuD+dK/VRdX2UKGgGR0BykGlgtvn9aAdL0GgIR0CRuYce8wpOdX2UKGgGR0BxlGBreqJeaAdNCQFoCEdAkboqZYxL03V9lChoBkdAYhRvAoG6gGgHTegDaAhHQJG60gU1yeZ1fZQoaAZHQG0VZcC5mRNoB0v7aAhHQJG7HCpFTeh1fZQoaAZHQHNKKGtZFG5oB033AmgIR0CRu3CQ9zOpdX2UKGgGR0BxQ7s/pt78aAdL8mgIR0CRu6njABT5dX2UKGgGR0ByaMfq5byIaAdL62gIR0CRu8dxQzk7dX2UKGgGR0BxsCS8rZrYaAdNBAFoCEdAkbvIKtxMnXV9lChoBkdAbhJ5P/JeV2gHS/VoCEdAkbwMw1zhgnV9lChoBkdAcJ9FjNIK+mgHS95oCEdAkbzbr5ZbIXV9lChoBkdAc0TpCKJl8WgHS8ZoCEdAkb0Na+vhZXV9lChoBkdAcdV9RJmNBGgHS/BoCEdAkb0XlbNbDHV9lChoBkdAcXG+QlruY2gHTQcBaAhHQJG9IjVx0dR1fZQoaAZHQHJf1HrhR65oB0vyaAhHQJHm+2SdOIt1fZQoaAZHQHDlCEg4ffZoB00FAWgIR0CR5zghr30xdX2UKGgGR0B0Kld2Pkq+aAdL+GgIR0CR6NaouPFOdX2UKGgGR0Bw6xx//echaAdNHwJoCEdAkekFGgBcRnV9lChoBkdAcGWkK/mDDmgHS+xoCEdAkekfJA+pwXV9lChoBkdAcv6nXumaY2gHS+RoCEdAkekzurp7kXV9lChoBkdAcaMiobXHzmgHTR8BaAhHQJHpPrE9+w11fZQoaAZHQG8aL876pHZoB0vbaAhHQJHpS2a2F391fZQoaAZHQHB1BwVCXyBoB0vWaAhHQJHpe9kBjnV1fZQoaAZHQHByMvqTr3VoB0v5aAhHQJHqGLMs6JZ1fZQoaAZHQHGltcOby6NoB0vHaAhHQJHqJovi97F1fZQoaAZHQHFjvBBRhttoB0v+aAhHQJHqTBGhEjR1fZQoaAZHQHMTpXdTHbRoB0vNaAhHQJHqdapxWDJ1fZQoaAZHQG8us1baAWloB0vraAhHQJHrFNHpbEB1fZQoaAZHQHIu/fKp1ihoB00DAWgIR0CR634O+ZgHdX2UKGgGR0BuUBEv0yxiaAdNTQFoCEdAkewc7yQPqnV9lChoBkdAcesFBY3eemgHS+1oCEdAkewjposZpHV9lChoBkdAbRUgmJFb3WgHS/RoCEdAkex6ABkqc3V9lChoBkdAcqGO3UhFE2gHS8poCEdAkez686FM7HV9lChoBkdAQdIHgP3BYWgHS79oCEdAke1X1FpfyHV9lChoBkdAchVNo8IRiGgHS8xoCEdAke1rFXJYDHV9lChoBkdAcu6t8NQTEmgHS+RoCEdAke2ugg5imXV9lChoBkdAbj+4ecQRPGgHS+1oCEdAke4Ia99MK3V9lChoBkdAcvsA5Jbt7mgHS9loCEdAke6cK1G9YnV9lChoBkdAckurC3w1BWgHS9toCEdAke6aePJaJXV9lChoBkdAb6HSVnmJWWgHTQkBaAhHQJHusg+yJKt1fZQoaAZHQHDKKYVqN6xoB00TAWgIR0CR7smQ8wHrdX2UKGgGR0Bydh8XvYvnaAdLyWgIR0CR7z/NZ/0/dX2UKGgGR0BwVcBFNL13aAdL+GgIR0CR75GEPDpDdX2UKGgGR0Bw5vROUMXraAdNDgFoCEdAke/X7Hhjv3V9lChoBkdAc2G3PAwfyWgHS8JoCEdAkfAgtFrmAHV9lChoBkdAcpvzImw7kmgHS85oCEdAkfFDM7lq8HV9lChoBkdAcsNxiG34K2gHS/loCEdAkfFKpgkTpXV9lChoBkdAcUId4mkWRGgHS+toCEdAkfFbaufVZ3V9lChoBkdAckLD7Ikqt2gHS9BoCEdAkfHB/Aj6e3V9lChoBkdAb8DNJOFg2WgHS+9oCEdAkfJizLOiWXV9lChoBkdAUbWJ3xFy72gHS4hoCEdAkfLCkGiYcHV9lChoBkdAbrU4bS7XhGgHTV8BaAhHQJHy5UyYXwd1fZQoaAZHQHCOafBeok1oB0vRaAhHQJHzIDwH7gt1fZQoaAZHQHFvyFsYVItoB0vgaAhHQJHzYDbJwKl1fZQoaAZHQHEiNFKCg9NoB00bAWgIR0CR87zv7WNFdX2UKGgGR0BwQOiN83MqaAdL8WgIR0CR871pj+aSdX2UKGgGR0BwDWQ4jrzHaAdNDwFoCEdAkfPVct5D7nV9lChoBkdAcd3ez2OAAmgHS+9oCEdAkfPfsRg7YHV9lChoBkdAbSfeDWbw0GgHS91oCEdAkfQ9c0Ltu3V9lChoBkdAcjZ6reZXuGgHS+5oCEdAkfRGOU+s5nV9lChoBkdAcAt+Q2dd3WgHS8toCEdAkfWAIMSbpnV9lChoBkdAcGgZ9NN8E2gHTQUBaAhHQJH1invUjLV1fZQoaAZHQHMCsR6F/QVoB0vQaAhHQJH1lV81Gb11fZQoaAZHQG1jIVM23rloB0vvaAhHQJH2R0GNaQp1fZQoaAZHQHE5frKNhmZoB0vzaAhHQJH2xmf5DZ11fZQoaAZHQHCWLH2h7E5oB0viaAhHQJH3Amu1WsB1fZQoaAZHQG5LjOTq0MRoB0vhaAhHQJH3W5e7cwh1fZQoaAZHQG/c+1KGtZFoB0vaaAhHQJH3ktDlYEJ1fZQoaAZHQHJqNCE6DGtoB0vOaAhHQJH3j+FUQ051fZQoaAZHQG7Mz3AVO9FoB0vnaAhHQJH3ocghbGF1fZQoaAZHQHOU0Ao5PuZoB0vHaAhHQJH32SdOIqN1fZQoaAZHQG/7OZb6guhoB0vRaAhHQJH39NdqtYB1fZQoaAZHQHE9CLVFx4poB0vTaAhHQJH4iRB/qgR1fZQoaAZHQHDlNKmKqGVoB0voaAhHQJH4jVawD/51fZQoaAZHQFRHuuzQeFNoB0uTaAhHQJH4nwb2lEZ1fZQoaAZHQGwOY1YQrc1oB0vfaAhHQJH4yu6mO2l1fZQoaAZHQHFL/8ZUDMhoB00LAWgIR0CR+Qlf7aZhdX2UKGgGR0BzZFDb8FY/aAdL42gIR0CR+g4z7/GVdX2UKGgGR0Bwk5gqmTC+aAdL22gIR0CR+p+mFajfdX2UKGgGR0Bw61pItlI3aAdL4mgIR0CR+01FYuCgdX2UKGgGR0BxEC04R28qaAdL5WgIR0CR+5zSkTHsdWUu"}, "ep_success_buffer": {":type:": "<class 'collections.deque'>", ":serialized:": "gAWVIAAAAAAAAACMC2NvbGxlY3Rpb25zlIwFZGVxdWWUk5QpS2SGlFKULg=="}, "_n_updates": 853, "observation_space": {":type:": "<class 'gymnasium.spaces.box.Box'>", ":serialized:": "gAWVdwIAAAAAAACMFGd5bW5hc2l1bS5zcGFjZXMuYm94lIwDQm94lJOUKYGUfZQojAVkdHlwZZSMBW51bXB5lIwFZHR5cGWUk5SMAmY0lImIh5RSlChLA4wBPJROTk5K/////0r/////SwB0lGKMDWJvdW5kZWRfYmVsb3eUjBNudW1weS5fY29yZS5udW1lcmljlIwLX2Zyb21idWZmZXKUk5QolggAAAAAAAAAAQEBAQEBAQGUaAiMAmIxlImIh5RSlChLA4wBfJROTk5K/////0r/////SwB0lGJLCIWUjAFDlHSUUpSMDWJvdW5kZWRfYWJvdmWUaBEolggAAAAAAAAAAQEBAQEBAQGUaBVLCIWUaBl0lFKUjAZfc2hhcGWUSwiFlIwDbG93lGgRKJYgAAAAAAAAAAAAtMIAALTCAACgwAAAoMDbD0nAAACgwAAAAIAAAACAlGgLSwiFlGgZdJRSlIwEaGlnaJRoESiWIAAAAAAAAAAAALRCAAC0QgAAoEAAAKBA2w9JQAAAoEAAAIA/AACAP5RoC0sIhZRoGXSUUpSMCGxvd19yZXBylIxbWy05MC4gICAgICAgIC05MC4gICAgICAgICAtNS4gICAgICAgICAtNS4gICAgICAgICAtMy4xNDE1OTI3ICAtNS4KICAtMC4gICAgICAgICAtMC4gICAgICAgXZSMCWhpZ2hfcmVwcpSMU1s5MC4gICAgICAgIDkwLiAgICAgICAgIDUuICAgICAgICAgNS4gICAgICAgICAzLjE0MTU5MjcgIDUuCiAgMS4gICAgICAgICAxLiAgICAgICBdlIwKX25wX3JhbmRvbZROdWIu", "dtype": "float32", "bounded_below": "[ True True True True True True True True]", "bounded_above": "[ True True True True True True True True]", "_shape": [8], "low": "[-90. -90. -5. -5. -3.1415927 -5.\n -0. -0. ]", "high": "[90. 90. 5. 5. 3.1415927 5.\n 1. 1. ]", "low_repr": "[-90. -90. -5. -5. -3.1415927 -5.\n -0. -0. ]", "high_repr": "[90. 90. 5. 5. 3.1415927 5.\n 1. 1. ]", "_np_random": null}, "action_space": {":type:": "<class 'gymnasium.spaces.discrete.Discrete'>", ":serialized:": "gAWV/gAAAAAAAACMGWd5bW5hc2l1bS5zcGFjZXMuZGlzY3JldGWUjAhEaXNjcmV0ZZSTlCmBlH2UKIwBbpSMFm51bXB5Ll9jb3JlLm11bHRpYXJyYXmUjAZzY2FsYXKUk5SMBW51bXB5lIwFZHR5cGWUk5SMAmk4lImIh5RSlChLA4wBPJROTk5K/////0r/////SwB0lGJDCAQAAAAAAAAAlIaUUpSMBXN0YXJ0lGgIaA5DCAAAAAAAAAAAlIaUUpSMBl9zaGFwZZQpjAVkdHlwZZRoC4wCaTiUiYiHlFKUKEsDaA9OTk5K/////0r/////SwB0lGKMCl9ucF9yYW5kb22UTnViLg==", "n": "4", "start": "0", "_shape": [], "dtype": "int64", "_np_random": null}, "n_envs": 16, "n_steps": 1024, "gamma": 0.999, "gae_lambda": 0.98, "ent_coef": 0.01, "vf_coef": 0.5, "max_grad_norm": 0.5, "batch_size": 64, "n_epochs": 4, "clip_range": {":type:": "<class 'function'>", ":serialized:": "gAWV1wIAAAAAAACMF2Nsb3VkcGlja2xlLmNsb3VkcGlja2xllIwOX21ha2VfZnVuY3Rpb26Uk5QoaACMDV9idWlsdGluX3R5cGWUk5SMCENvZGVUeXBllIWUUpQoSwFLAEsASwFLAUsTQwSIAFMAlE6FlCmMAV+UhZSMXi9ob21lL3VkdWdhbWF2aXRoYW5hZ2JsdS8ubG9jYWwvbGliL3B5dGhvbjMuMTAvc2l0ZS1wYWNrYWdlcy9zdGFibGVfYmFzZWxpbmVzMy9jb21tb24vdXRpbHMucHmUjARmdW5jlEuEQwIEAZSMA3ZhbJSFlCl0lFKUfZQojAtfX3BhY2thZ2VfX5SMGHN0YWJsZV9iYXNlbGluZXMzLmNvbW1vbpSMCF9fbmFtZV9flIwec3RhYmxlX2Jhc2VsaW5lczMuY29tbW9uLnV0aWxzlIwIX19maWxlX1+UjF4vaG9tZS91ZHVnYW1hdml0aGFuYWdibHUvLmxvY2FsL2xpYi9weXRob24zLjEwL3NpdGUtcGFja2FnZXMvc3RhYmxlX2Jhc2VsaW5lczMvY29tbW9uL3V0aWxzLnB5lHVOTmgAjBBfbWFrZV9lbXB0eV9jZWxslJOUKVKUhZR0lFKUaACMEl9mdW5jdGlvbl9zZXRzdGF0ZZSTlGgffZR9lChoFowEZnVuY5SMDF9fcXVhbG5hbWVfX5SMGWNvbnN0YW50X2ZuLjxsb2NhbHM+LmZ1bmOUjA9fX2Fubm90YXRpb25zX1+UfZSMDl9fa3dkZWZhdWx0c19flE6MDF9fZGVmYXVsdHNfX5ROjApfX21vZHVsZV9flGgXjAdfX2RvY19flE6MC19fY2xvc3VyZV9flGgAjApfbWFrZV9jZWxslJOURz/JmZmZmZmahZRSlIWUjBdfY2xvdWRwaWNrbGVfc3VibW9kdWxlc5RdlIwLX19nbG9iYWxzX1+UfZR1hpSGUjAu"}, "clip_range_vf": null, "normalize_advantage": true, "target_kl": null, "lr_schedule": {":type:": "<class 'function'>", ":serialized:": "gAWV1wIAAAAAAACMF2Nsb3VkcGlja2xlLmNsb3VkcGlja2xllIwOX21ha2VfZnVuY3Rpb26Uk5QoaACMDV9idWlsdGluX3R5cGWUk5SMCENvZGVUeXBllIWUUpQoSwFLAEsASwFLAUsTQwSIAFMAlE6FlCmMAV+UhZSMXi9ob21lL3VkdWdhbWF2aXRoYW5hZ2JsdS8ubG9jYWwvbGliL3B5dGhvbjMuMTAvc2l0ZS1wYWNrYWdlcy9zdGFibGVfYmFzZWxpbmVzMy9jb21tb24vdXRpbHMucHmUjARmdW5jlEuEQwIEAZSMA3ZhbJSFlCl0lFKUfZQojAtfX3BhY2thZ2VfX5SMGHN0YWJsZV9iYXNlbGluZXMzLmNvbW1vbpSMCF9fbmFtZV9flIwec3RhYmxlX2Jhc2VsaW5lczMuY29tbW9uLnV0aWxzlIwIX19maWxlX1+UjF4vaG9tZS91ZHVnYW1hdml0aGFuYWdibHUvLmxvY2FsL2xpYi9weXRob24zLjEwL3NpdGUtcGFja2FnZXMvc3RhYmxlX2Jhc2VsaW5lczMvY29tbW9uL3V0aWxzLnB5lHVOTmgAjBBfbWFrZV9lbXB0eV9jZWxslJOUKVKUhZR0lFKUaACMEl9mdW5jdGlvbl9zZXRzdGF0ZZSTlGgffZR9lChoFowEZnVuY5SMDF9fcXVhbG5hbWVfX5SMGWNvbnN0YW50X2ZuLjxsb2NhbHM+LmZ1bmOUjA9fX2Fubm90YXRpb25zX1+UfZSMDl9fa3dkZWZhdWx0c19flE6MDF9fZGVmYXVsdHNfX5ROjApfX21vZHVsZV9flGgXjAdfX2RvY19flE6MC19fY2xvc3VyZV9flGgAjApfbWFrZV9jZWxslJOURz8zqSowVTJhhZRSlIWUjBdfY2xvdWRwaWNrbGVfc3VibW9kdWxlc5RdlIwLX19nbG9iYWxzX1+UfZR1hpSGUjAu"}, "system_info": {"OS": "Linux-5.15.0-136-generic-x86_64-with-glibc2.35 # 147-Ubuntu SMP Sat Mar 15 15:53:30 UTC 2025", "Python": "3.10.12", "Stable-Baselines3": "2.0.0a5", "PyTorch": "2.8.0+cu128", "GPU Enabled": "True", "Numpy": "2.2.6", "Cloudpickle": "3.1.1", "Gymnasium": "0.28.1"}}
ppo-LunarLander-v2.zip CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:2dc8ef7b113f8d5bb8413e51b4cbc85676c8753401ce90cb612d4bb93ce1e8dc
3
- size 150317
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ec4d61725f5120240c7e754b98e9f8be3d205e69e997aed52d1435a73e4150cd
3
+ size 150147
ppo-LunarLander-v2/data CHANGED
@@ -4,37 +4,37 @@
4
  ":serialized:": "gAWVOwAAAAAAAACMIXN0YWJsZV9iYXNlbGluZXMzLmNvbW1vbi5wb2xpY2llc5SMEUFjdG9yQ3JpdGljUG9saWN5lJOULg==",
5
  "__module__": "stable_baselines3.common.policies",
6
  "__doc__": "\n Policy class for actor-critic algorithms (has both policy and value prediction).\n Used by A2C, PPO and the likes.\n\n :param observation_space: Observation space\n :param action_space: Action space\n :param lr_schedule: Learning rate schedule (could be constant)\n :param net_arch: The specification of the policy and value networks.\n :param activation_fn: Activation function\n :param ortho_init: Whether to use or not orthogonal initialization\n :param use_sde: Whether to use State Dependent Exploration or not\n :param log_std_init: Initial value for the log standard deviation\n :param full_std: Whether to use (n_features x n_actions) parameters\n for the std instead of only (n_features,) when using gSDE\n :param use_expln: Use ``expln()`` function instead of ``exp()`` to ensure\n a positive standard deviation (cf paper). It allows to keep variance\n above zero and prevent it from growing too fast. In practice, ``exp()`` is usually enough.\n :param squash_output: Whether to squash the output using a tanh function,\n this allows to ensure boundaries when using gSDE.\n :param features_extractor_class: Features extractor to use.\n :param features_extractor_kwargs: Keyword arguments\n to pass to the features extractor.\n :param share_features_extractor: If True, the features extractor is shared between the policy and value networks.\n :param normalize_images: Whether to normalize images or not,\n dividing by 255.0 (True by default)\n :param optimizer_class: The optimizer to use,\n ``th.optim.Adam`` by default\n :param optimizer_kwargs: Additional keyword arguments,\n excluding the learning rate, to pass to the optimizer\n ",
7
- "__init__": "<function ActorCriticPolicy.__init__ at 0x7ce06a3e2660>",
8
- "_get_constructor_parameters": "<function ActorCriticPolicy._get_constructor_parameters at 0x7ce06a3e2700>",
9
- "reset_noise": "<function ActorCriticPolicy.reset_noise at 0x7ce06a3e27a0>",
10
- "_build_mlp_extractor": "<function ActorCriticPolicy._build_mlp_extractor at 0x7ce06a3e2840>",
11
- "_build": "<function ActorCriticPolicy._build at 0x7ce06a3e28e0>",
12
- "forward": "<function ActorCriticPolicy.forward at 0x7ce06a3e2980>",
13
- "extract_features": "<function ActorCriticPolicy.extract_features at 0x7ce06a3e2a20>",
14
- "_get_action_dist_from_latent": "<function ActorCriticPolicy._get_action_dist_from_latent at 0x7ce06a3e2ac0>",
15
- "_predict": "<function ActorCriticPolicy._predict at 0x7ce06a3e2b60>",
16
- "evaluate_actions": "<function ActorCriticPolicy.evaluate_actions at 0x7ce06a3e2c00>",
17
- "get_distribution": "<function ActorCriticPolicy.get_distribution at 0x7ce06a3e2ca0>",
18
- "predict_values": "<function ActorCriticPolicy.predict_values at 0x7ce06a3e2d40>",
19
  "__abstractmethods__": "frozenset()",
20
- "_abc_impl": "<_abc._abc_data object at 0x7ce06a3665c0>"
21
  },
22
  "verbose": 1,
23
  "policy_kwargs": {},
24
- "num_timesteps": 1294336,
25
  "_total_timesteps": 2000000,
26
  "_num_timesteps_at_start": 0,
27
  "seed": null,
28
  "action_noise": null,
29
- "start_time": 1757508119235870233,
30
  "learning_rate": {
31
  ":type:": "<class 'function'>",
32
- ":serialized:": "gAWVYgIAAAAAAACMF2Nsb3VkcGlja2xlLmNsb3VkcGlja2xllIwOX21ha2VfZnVuY3Rpb26Uk5QoaACMDV9idWlsdGluX3R5cGWUk5SMCENvZGVUeXBllIWUUpQoSwFLAEsASwFLAksTQw6VAZcAfACJAXoFAABTAJROhZQpjBJwcm9ncmVzc19yZW1haW5pbmeUhZSMIC90bXAvaXB5dGhvbi1pbnB1dC0zMzE3MjIzNjg4LnB5lIwIPGxhbWJkYT6UjCFsaW5lYXJfc2NoZWR1bGUuPGxvY2Fscz4uPGxhbWJkYT6USwRDC/iAANAmOLg90iZIlEMAlIwNaW5pdGlhbF92YWx1ZZSFlCl0lFKUfZQojAtfX3BhY2thZ2VfX5ROjAhfX25hbWVfX5SMCF9fbWFpbl9flHVOTmgAjBBfbWFrZV9lbXB0eV9jZWxslJOUKVKUhZR0lFKUaACMEl9mdW5jdGlvbl9zZXRzdGF0ZZSTlGgefZR9lChoF4wIPGxhbWJkYT6UjAxfX3F1YWxuYW1lX1+UjCFsaW5lYXJfc2NoZWR1bGUuPGxvY2Fscz4uPGxhbWJkYT6UjA9fX2Fubm90YXRpb25zX1+UfZSMDl9fa3dkZWZhdWx0c19flE6MDF9fZGVmYXVsdHNfX5ROjApfX21vZHVsZV9flGgYjAdfX2RvY19flE6MC19fY2xvc3VyZV9flGgAjApfbWFrZV9jZWxslJOURz8zqSowVTJhhZRSlIWUjBdfY2xvdWRwaWNrbGVfc3VibW9kdWxlc5RdlIwLX19nbG9iYWxzX1+UfZR1hpSGUjAu"
33
  },
34
  "tensorboard_log": null,
35
  "_last_obs": {
36
  ":type:": "<class 'numpy.ndarray'>",
37
- ":serialized:": "gAWVdgIAAAAAAACME251bXB5Ll9jb3JlLm51bWVyaWOUjAtfZnJvbWJ1ZmZlcpSTlCiWAAIAAAAAAACaJNO8GnTBP6znDb6leUg9WnMYPKNAMr0AAAAAAAAAAA0Llz0FPNq7TYyiu7oZzr2QSF29652vvgAAgD8AAIA/83CuPScEbz5GLFO+3s1VvtgHCL1W9Z69AAAAAAAAAAB6jzW+f9qjP87eF79CjtO+LmiKvv9dvL4AAAAAAAAAAJog6L0E/B4/KrWaParIqb7BoRC7MuuNPQAAAAAAAAAAM1eQPP38sT/w0ZE+Jedevjh8gLxTjMG7AAAAAAAAAABmI7u8oYIJP+vw1rsW4Ji+MFWCvNOOAD0AAAAAAAAAAM0yjzyFN8i7vpcrPKo9ljwv7BW9ooJ9PQAAgD8AAIA/k8oNPqlzArxrtqo8ao+ZPGzwYb3ySnw9AACAPwAAgD+aPQo8qp6PP4jksDwSe8i+2H4VPAU+Pj0AAAAAAAAAABoDQT1cJ2C6bmrItpFnITFfBpu7fWTpNQAAgD8AAIA/M7MYObrzhD/aOEQ98IDhvr0uTbu0/8q8AAAAAAAAAABmYTc9dn9dPXqg27wprnm+GNKfO53VAT0AAAAAAAAAANpDHz6dMmk+um+Hvq0Xbr7wumO9DhHHvQAAAAAAAAAAjWy/vf6K5T3TEw0+O050vg7ahD2u3aC9AAAAAAAAAAAzdSy9GCLBPzpGa74lsS49ZH3BPOXvS70AAAAAAAAAAJSMBW51bXB5lIwFZHR5cGWUk5SMAmY0lImIh5RSlChLA4wBPJROTk5K/////0r/////SwB0lGJLEEsIhpSMAUOUdJRSlC4="
38
  },
39
  "_last_episode_starts": {
40
  ":type:": "<class 'numpy.ndarray'>",
@@ -44,17 +44,17 @@
44
  "_episode_num": 0,
45
  "use_sde": false,
46
  "sde_sample_freq": -1,
47
- "_current_progress_remaining": 0.35283200000000003,
48
  "_stats_window_size": 100,
49
  "ep_info_buffer": {
50
  ":type:": "<class 'collections.deque'>",
51
- ":serialized:": "gAWVOAwAAAAAAACMC2NvbGxlY3Rpb25zlIwFZGVxdWWUk5QpS2SGlFKUKH2UKIwBcpRHQHEckWAPNFCMAWyUTTQBjAF0lEdAlTbPy08eS3V9lChoBkdAbpK4RVZLZmgHTTMBaAhHQJU3WXVsk6d1fZQoaAZHQHI0X9m6GxloB00cAWgIR0CVN4cT8HfNdX2UKGgGR0Bw0GGfwqiHaAdNAwFoCEdAlThGgnMMZ3V9lChoBkdAccq5mRNh3WgHTQYBaAhHQJU4zkdV/+d1fZQoaAZHQEREqBmPHT9oB0v3aAhHQJU5OzPa+N91fZQoaAZHQHE6Am/nGKhoB00pAWgIR0CVOYsq8UVSdX2UKGgGR0BwRwXN1QqJaAdNOQFoCEdAlTqC5/b0v3V9lChoBkdAcE8ckMTewmgHTQEBaAhHQJU6gUFjd591fZQoaAZHQHGtfrWy1NRoB00SAWgIR0CVOwXvphWpdX2UKGgGR0Bxb41dgOSXaAdNWAFoCEdAlTsbHyVfNXV9lChoBkdAck94Ju2qk2gHTQQBaAhHQJU7dmBe5Wl1fZQoaAZHQG95oBRyfcxoB00RAWgIR0CVPBf5k9U0dX2UKGgGR0Bvobnq3VkMaAdNDwFoCEdAlTyzVx0dR3V9lChoBkdAcF+pOvdM02gHTTcBaAhHQJU9lpVS4vx1fZQoaAZHQHDsfh/Aj6hoB00OAWgIR0CVPpfYjB2wdX2UKGgGR0BxlKGahHskaAdNGAFoCEdAlT+BdIGyHHV9lChoBkdAcFYAeq7yx2gHTRABaAhHQJVAiBz3h4t1fZQoaAZHQHEYHmmtQsRoB00GAWgIR0CVQJ8qFyq/dX2UKGgGR0Bt80384xUOaAdNEAFoCEdAlUE4ppeu3nV9lChoBkdAb6XTkQwsXmgHTTkBaAhHQJVBSpOvdM11fZQoaAZHQG/xTDwYtQNoB00WAWgIR0CVQkpKBd2QdX2UKGgGR0Bu42V1Oj7AaAdNMgFoCEdAlUMbxAjY7XV9lChoBkdAcPMy1NQCS2gHTRABaAhHQJVDJGoaUA11fZQoaAZHQHB7ALiMo+hoB00iAWgIR0CVQyzSkTHsdX2UKGgGR0BvS2d07r9maAdNNAFoCEdAlUOzrJKaonV9lChoBkdAb+dahYeT3mgHTQEBaAhHQJVD9V+7UXp1fZQoaAZHQHKoVKTSssBoB00jAWgIR0CVRDajvd/KdX2UKGgGR0Btwq4jKPn0aAdNKwFoCEdAlUXQVCXyAnV9lChoBkdAcRH6wt8NQWgHTQ0BaAhHQJVG7MQmNR51fZQoaAZHQFFIKaG5+YtoB0vZaAhHQJVHFbVz6rN1fZQoaAZHQHDInI6r/85oB00LAWgIR0CVR90OEug6dX2UKGgGR0BzZEnv2GqQaAdNOQFoCEdAlUkhq9GqgnV9lChoBkdAcMh3iaRZEGgHTS8BaAhHQJVJfNB4Uvh1fZQoaAZHQG/5V+AmReVoB0vzaAhHQJVJp7v5P/J1fZQoaAZHQGXT6qbSZ0FoB03oA2gIR0CVSn4wRGtqdX2UKGgGR0BtG6w6hg3MaAdNGAFoCEdAlUqlvybx3HV9lChoBkdAcP2R3NcGDGgHTcABaAhHQJVLDUZvUBp1fZQoaAZHQHIDBSUC7shoB00cAWgIR0CVS1rD63y7dX2UKGgGR0BxREkPczqKaAdNPAFoCEdAlUubLhaTwHV9lChoBkdAcJmDO1OTJWgHTSkBaAhHQJVL9AX2ugZ1fZQoaAZHQG9gt8eCCjFoB01rAWgIR0CVTBGO+7DmdX2UKGgGR0By4G+7Dl5oaAdNRwFoCEdAlUzl7+kxh3V9lChoBkdAcD0ApKBd2WgHTQkBaAhHQJVhz0I1LrZ1fZQoaAZHQEfgxoqTbFloB0vTaAhHQJViToicG1R1fZQoaAZHQHA0cejmCAdoB00xAWgIR0CVYsDPWxyGdX2UKGgGR0BxQMyXUpd9aAdNXQFoCEdAlWLd4mkWRHV9lChoBkdAcb4FlTWGy2gHTToBaAhHQJVj7Ah0Qsh1fZQoaAZHQG+5jghr30xoB00UAWgIR0CVZGv8IiTudX2UKGgGR0BxK7ObAk9maAdNIwFoCEdAlWUI/eLvTnV9lChoBkdAcRTD/2kBS2gHTQwBaAhHQJVlO7wrlNl1fZQoaAZHQG9Or56+nIhoB00TAWgIR0CVZgojOcDsdX2UKGgGR0BwUaunuRcNaAdNJgFoCEdAlWYlIy0rsnV9lChoBkdAcB7tY0VJtmgHTRgBaAhHQJVmgYl6Z6V1fZQoaAZHQGZDDM/yGztoB03oA2gIR0CVZrQ2dd3TdX2UKGgGR0BwomcbzbvgaAdNDAFoCEdAlWbuUY8+zXV9lChoBkdAcMd1qnFYMmgHTTwBaAhHQJVnuz8gpz91fZQoaAZHQHBV/6XSjQBoB01CAWgIR0CVaEA9mpVCdX2UKGgGR0BwViOYIBzWaAdNJAFoCEdAlWiIQFs54nV9lChoBkdAcLTGs3hn8WgHS/doCEdAlWmAWFev6nV9lChoBkdAcONmbsniN2gHTSkBaAhHQJVp8fxMFll1fZQoaAZHQHIZwTAWSEFoB0vpaAhHQJVqURkEs8R1fZQoaAZHQHAqaOgg5ipoB00rAWgIR0CVanxcE/0NdX2UKGgGR0BwIbW6K+BZaAdNIwFoCEdAlWrLt/nW8XV9lChoBkdAbyTohY/3WWgHS/ZoCEdAlWuqGDcuanV9lChoBkdAcorcpLEk0WgHS/9oCEdAlW0LEtNBW3V9lChoBkdAc2Z4ubqhUWgHTSsBaAhHQJVtcCtA9mp1fZQoaAZHQHBhXnU2DQJoB01YAWgIR0CVbfpcophGdX2UKGgGR0BykIHRkVesaAdNEgFoCEdAlW4HFo+OfnV9lChoBkdAbjXrvb48EGgHTUMBaAhHQJVu6gctGut1fZQoaAZHQHKIJsXSBshoB007AWgIR0CVb2RF7UobdX2UKGgGR0ByjhXko4MnaAdNRAFoCEdAlW/sAmzBynV9lChoBkdAcRhZ0Syt3mgHTRYBaAhHQJVwA0HhS+B1fZQoaAZHQHA6+TeO4oZoB001AWgIR0CVcFD+irT6dX2UKGgGR0BzSs0rK/21aAdNMQFoCEdAlXD+kDZDiXV9lChoBkdAcfFPbfxc3WgHTQoBaAhHQJVxYY64lQd1fZQoaAZHQHBtXogV45doB00hAWgIR0CVclVG0/nodX2UKGgGR0BzbKAPNFBqaAdNRwFoCEdAlXKO8TSLInV9lChoBkdAcZBkSmIj4mgHTTQBaAhHQJVzAT7EYO51fZQoaAZHQHBF/yf+S8toB00tAWgIR0CVcyYChew+dX2UKGgGR0BvgM1VHWjHaAdNGwFoCEdAlXOOii7Ci3V9lChoBkdAcdnKSxJNCmgHS/xoCEdAlXRGKVII4XV9lChoBkdAcQM9C/oJRmgHTQUBaAhHQJV1Cr/82rJ1fZQoaAZHQHBitYwIt19oB00sAWgIR0CVdT5GjKxLdX2UKGgGR0BvyyfHxSYPaAdNGAFoCEdAlXWCgPEsKHV9lChoBkdAcOY1ZkkKNWgHTQYBaAhHQJV2U7/4qPR1fZQoaAZHQHAci3b212JoB0v4aAhHQJV2bHCGetl1fZQoaAZHQHCq8X7+DOFoB00bAWgIR0CVdnNh3JPqdX2UKGgGR0Bxtv5gw482aAdL9mgIR0CVd2N6gM+edX2UKGgGR0BwTnoHLRrraAdNLwFoCEdAlXfsU/OdG3V9lChoBkdATzwAS39aU2gHS9VoCEdAlXfozWPLgXV9lChoBkdAb6f2h7E5yWgHTTUBaAhHQJV4V6cAiml1fZQoaAZHQG/VRZuAI6doB00yAWgIR0CVeUtxdY4idX2UKGgGR0Bw5ug6EJ0GaAdNGAFoCEdAlXnHz6JqI3V9lChoBkdAb2pctXgccWgHTQ0BaAhHQJV6dF1B+nZ1fZQoaAZHQHMyByn1nNBoB001AWgIR0CVewWJ79hrdX2UKGgGR0BwqV7/n4fwaAdNTQFoCEdAlXvuMyad+XV9lChoBkdAcRDK3/givGgHTQ8BaAhHQJV8N2hZha11fZQoaAZHQHKClAVwgkloB00HAWgIR0CVfDEXcgyNdX2UKGgGR0BwrmgrYoRaaAdNNgFoCEdAlXx/5DZ13nVlLg=="
52
  },
53
  "ep_success_buffer": {
54
  ":type:": "<class 'collections.deque'>",
55
  ":serialized:": "gAWVIAAAAAAAAACMC2NvbGxlY3Rpb25zlIwFZGVxdWWUk5QpS2SGlFKULg=="
56
  },
57
- "_n_updates": 561,
58
  "observation_space": {
59
  ":type:": "<class 'gymnasium.spaces.box.Box'>",
60
  ":serialized:": "gAWVdwIAAAAAAACMFGd5bW5hc2l1bS5zcGFjZXMuYm94lIwDQm94lJOUKYGUfZQojAVkdHlwZZSMBW51bXB5lIwFZHR5cGWUk5SMAmY0lImIh5RSlChLA4wBPJROTk5K/////0r/////SwB0lGKMDWJvdW5kZWRfYmVsb3eUjBNudW1weS5fY29yZS5udW1lcmljlIwLX2Zyb21idWZmZXKUk5QolggAAAAAAAAAAQEBAQEBAQGUaAiMAmIxlImIh5RSlChLA4wBfJROTk5K/////0r/////SwB0lGJLCIWUjAFDlHSUUpSMDWJvdW5kZWRfYWJvdmWUaBEolggAAAAAAAAAAQEBAQEBAQGUaBVLCIWUaBl0lFKUjAZfc2hhcGWUSwiFlIwDbG93lGgRKJYgAAAAAAAAAAAAtMIAALTCAACgwAAAoMDbD0nAAACgwAAAAIAAAACAlGgLSwiFlGgZdJRSlIwEaGlnaJRoESiWIAAAAAAAAAAAALRCAAC0QgAAoEAAAKBA2w9JQAAAoEAAAIA/AACAP5RoC0sIhZRoGXSUUpSMCGxvd19yZXBylIxbWy05MC4gICAgICAgIC05MC4gICAgICAgICAtNS4gICAgICAgICAtNS4gICAgICAgICAtMy4xNDE1OTI3ICAtNS4KICAtMC4gICAgICAgICAtMC4gICAgICAgXZSMCWhpZ2hfcmVwcpSMU1s5MC4gICAgICAgIDkwLiAgICAgICAgIDUuICAgICAgICAgNS4gICAgICAgICAzLjE0MTU5MjcgIDUuCiAgMS4gICAgICAgICAxLiAgICAgICBdlIwKX25wX3JhbmRvbZROdWIu",
@@ -90,13 +90,13 @@
90
  "n_epochs": 4,
91
  "clip_range": {
92
  ":type:": "<class 'function'>",
93
- ":serialized:": "gAWV1gIAAAAAAACMF2Nsb3VkcGlja2xlLmNsb3VkcGlja2xllIwOX21ha2VfZnVuY3Rpb26Uk5QoaACMDV9idWlsdGluX3R5cGWUk5SMCENvZGVUeXBllIWUUpQoSwFLAEsASwFLAUsTQwiVAZcAiQFTAJROhZQpjAFflIWUjEkvdXNyL2xvY2FsL2xpYi9weXRob24zLjEyL2Rpc3QtcGFja2FnZXMvc3RhYmxlX2Jhc2VsaW5lczMvY29tbW9uL3V0aWxzLnB5lIwEZnVuY5SMGWNvbnN0YW50X2ZuLjxsb2NhbHM+LmZ1bmOUS4RDCPiAANgPEogKlEMAlIwDdmFslIWUKXSUUpR9lCiMC19fcGFja2FnZV9flIwYc3RhYmxlX2Jhc2VsaW5lczMuY29tbW9ulIwIX19uYW1lX1+UjB5zdGFibGVfYmFzZWxpbmVzMy5jb21tb24udXRpbHOUjAhfX2ZpbGVfX5SMSS91c3IvbG9jYWwvbGliL3B5dGhvbjMuMTIvZGlzdC1wYWNrYWdlcy9zdGFibGVfYmFzZWxpbmVzMy9jb21tb24vdXRpbHMucHmUdU5OaACMEF9tYWtlX2VtcHR5X2NlbGyUk5QpUpSFlHSUUpRoAIwSX2Z1bmN0aW9uX3NldHN0YXRllJOUaCF9lH2UKGgYjARmdW5jlIwMX19xdWFsbmFtZV9flIwZY29uc3RhbnRfZm4uPGxvY2Fscz4uZnVuY5SMD19fYW5ub3RhdGlvbnNfX5R9lIwOX19rd2RlZmF1bHRzX1+UTowMX19kZWZhdWx0c19flE6MCl9fbW9kdWxlX1+UaBmMB19fZG9jX1+UTowLX19jbG9zdXJlX1+UaACMCl9tYWtlX2NlbGyUk5RHP8mZmZmZmZqFlFKUhZSMF19jbG91ZHBpY2tsZV9zdWJtb2R1bGVzlF2UjAtfX2dsb2JhbHNfX5R9lHWGlIZSMC4="
94
  },
95
  "clip_range_vf": null,
96
  "normalize_advantage": true,
97
  "target_kl": null,
98
  "lr_schedule": {
99
  ":type:": "<class 'function'>",
100
- ":serialized:": "gAWV1gIAAAAAAACMF2Nsb3VkcGlja2xlLmNsb3VkcGlja2xllIwOX21ha2VfZnVuY3Rpb26Uk5QoaACMDV9idWlsdGluX3R5cGWUk5SMCENvZGVUeXBllIWUUpQoSwFLAEsASwFLAUsTQwiVAZcAiQFTAJROhZQpjAFflIWUjEkvdXNyL2xvY2FsL2xpYi9weXRob24zLjEyL2Rpc3QtcGFja2FnZXMvc3RhYmxlX2Jhc2VsaW5lczMvY29tbW9uL3V0aWxzLnB5lIwEZnVuY5SMGWNvbnN0YW50X2ZuLjxsb2NhbHM+LmZ1bmOUS4RDCPiAANgPEogKlEMAlIwDdmFslIWUKXSUUpR9lCiMC19fcGFja2FnZV9flIwYc3RhYmxlX2Jhc2VsaW5lczMuY29tbW9ulIwIX19uYW1lX1+UjB5zdGFibGVfYmFzZWxpbmVzMy5jb21tb24udXRpbHOUjAhfX2ZpbGVfX5SMSS91c3IvbG9jYWwvbGliL3B5dGhvbjMuMTIvZGlzdC1wYWNrYWdlcy9zdGFibGVfYmFzZWxpbmVzMy9jb21tb24vdXRpbHMucHmUdU5OaACMEF9tYWtlX2VtcHR5X2NlbGyUk5QpUpSFlHSUUpRoAIwSX2Z1bmN0aW9uX3NldHN0YXRllJOUaCF9lH2UKGgYjARmdW5jlIwMX19xdWFsbmFtZV9flIwZY29uc3RhbnRfZm4uPGxvY2Fscz4uZnVuY5SMD19fYW5ub3RhdGlvbnNfX5R9lIwOX19rd2RlZmF1bHRzX1+UTowMX19kZWZhdWx0c19flE6MCl9fbW9kdWxlX1+UaBmMB19fZG9jX1+UTowLX19jbG9zdXJlX1+UaACMCl9tYWtlX2NlbGyUk5RHPxo24uscQy2FlFKUhZSMF19jbG91ZHBpY2tsZV9zdWJtb2R1bGVzlF2UjAtfX2dsb2JhbHNfX5R9lHWGlIZSMC4="
101
  }
102
  }
 
4
  ":serialized:": "gAWVOwAAAAAAAACMIXN0YWJsZV9iYXNlbGluZXMzLmNvbW1vbi5wb2xpY2llc5SMEUFjdG9yQ3JpdGljUG9saWN5lJOULg==",
5
  "__module__": "stable_baselines3.common.policies",
6
  "__doc__": "\n Policy class for actor-critic algorithms (has both policy and value prediction).\n Used by A2C, PPO and the likes.\n\n :param observation_space: Observation space\n :param action_space: Action space\n :param lr_schedule: Learning rate schedule (could be constant)\n :param net_arch: The specification of the policy and value networks.\n :param activation_fn: Activation function\n :param ortho_init: Whether to use or not orthogonal initialization\n :param use_sde: Whether to use State Dependent Exploration or not\n :param log_std_init: Initial value for the log standard deviation\n :param full_std: Whether to use (n_features x n_actions) parameters\n for the std instead of only (n_features,) when using gSDE\n :param use_expln: Use ``expln()`` function instead of ``exp()`` to ensure\n a positive standard deviation (cf paper). It allows to keep variance\n above zero and prevent it from growing too fast. In practice, ``exp()`` is usually enough.\n :param squash_output: Whether to squash the output using a tanh function,\n this allows to ensure boundaries when using gSDE.\n :param features_extractor_class: Features extractor to use.\n :param features_extractor_kwargs: Keyword arguments\n to pass to the features extractor.\n :param share_features_extractor: If True, the features extractor is shared between the policy and value networks.\n :param normalize_images: Whether to normalize images or not,\n dividing by 255.0 (True by default)\n :param optimizer_class: The optimizer to use,\n ``th.optim.Adam`` by default\n :param optimizer_kwargs: Additional keyword arguments,\n excluding the learning rate, to pass to the optimizer\n ",
7
+ "__init__": "<function ActorCriticPolicy.__init__ at 0x7f9b1752caf0>",
8
+ "_get_constructor_parameters": "<function ActorCriticPolicy._get_constructor_parameters at 0x7f9b1752cb80>",
9
+ "reset_noise": "<function ActorCriticPolicy.reset_noise at 0x7f9b1752cc10>",
10
+ "_build_mlp_extractor": "<function ActorCriticPolicy._build_mlp_extractor at 0x7f9b1752cca0>",
11
+ "_build": "<function ActorCriticPolicy._build at 0x7f9b1752cd30>",
12
+ "forward": "<function ActorCriticPolicy.forward at 0x7f9b1752cdc0>",
13
+ "extract_features": "<function ActorCriticPolicy.extract_features at 0x7f9b1752ce50>",
14
+ "_get_action_dist_from_latent": "<function ActorCriticPolicy._get_action_dist_from_latent at 0x7f9b1752cee0>",
15
+ "_predict": "<function ActorCriticPolicy._predict at 0x7f9b1752cf70>",
16
+ "evaluate_actions": "<function ActorCriticPolicy.evaluate_actions at 0x7f9b1752d000>",
17
+ "get_distribution": "<function ActorCriticPolicy.get_distribution at 0x7f9b1752d090>",
18
+ "predict_values": "<function ActorCriticPolicy.predict_values at 0x7f9b1752d120>",
19
  "__abstractmethods__": "frozenset()",
20
+ "_abc_impl": "<_abc._abc_data object at 0x7f9b17529440>"
21
  },
22
  "verbose": 1,
23
  "policy_kwargs": {},
24
+ "num_timesteps": 1212416,
25
  "_total_timesteps": 2000000,
26
  "_num_timesteps_at_start": 0,
27
  "seed": null,
28
  "action_noise": null,
29
+ "start_time": 1758012501621178721,
30
  "learning_rate": {
31
  ":type:": "<class 'function'>",
32
+ ":serialized:": "gAWVMAIAAAAAAACMF2Nsb3VkcGlja2xlLmNsb3VkcGlja2xllIwOX21ha2VfZnVuY3Rpb26Uk5QoaACMDV9idWlsdGluX3R5cGWUk5SMCENvZGVUeXBllIWUUpQoSwFLAEsASwFLAksTQwh8AIgAFABTAJROhZQpjBJwcm9ncmVzc19yZW1haW5pbmeUhZSMJC90bXAvaXB5a2VybmVsXzE0NjExOTQvMzMxNzIyMzY4OC5weZSMCDxsYW1iZGE+lEsEQwIIAJSMDWluaXRpYWxfdmFsdWWUhZQpdJRSlH2UKIwLX19wYWNrYWdlX1+UTowIX19uYW1lX1+UjAhfX21haW5fX5R1Tk5oAIwQX21ha2VfZW1wdHlfY2VsbJSTlClSlIWUdJRSlGgAjBJfZnVuY3Rpb25fc2V0c3RhdGWUk5RoHH2UfZQoaBWMCDxsYW1iZGE+lIwMX19xdWFsbmFtZV9flIwhbGluZWFyX3NjaGVkdWxlLjxsb2NhbHM+LjxsYW1iZGE+lIwPX19hbm5vdGF0aW9uc19flH2UjA5fX2t3ZGVmYXVsdHNfX5ROjAxfX2RlZmF1bHRzX1+UTowKX19tb2R1bGVfX5RoFowHX19kb2NfX5ROjAtfX2Nsb3N1cmVfX5RoAIwKX21ha2VfY2VsbJSTlEc/M6kqMFUyYYWUUpSFlIwXX2Nsb3VkcGlja2xlX3N1Ym1vZHVsZXOUXZSMC19fZ2xvYmFsc19flH2UdYaUhlIwLg=="
33
  },
34
  "tensorboard_log": null,
35
  "_last_obs": {
36
  ":type:": "<class 'numpy.ndarray'>",
37
+ ":serialized:": "gAWVdgIAAAAAAACME251bXB5Ll9jb3JlLm51bWVyaWOUjAtfZnJvbWJ1ZmZlcpSTlCiWAAIAAAAAAADNFGC8CuNgu4+FjTu0QoI81vmMvGvNYD0AAIA/AACAP7P3H73h8J+6bPEcPG4SFz2uYlm7yaiNtwAAgD8AAIA/wGmTPVK15buVfoW7EkRnPASjQT391kS9AACAPwAAgD8AXZU8yIC3P1LPuT6AJBg+I22OvPLoRL0AAAAAAAAAAI0ugT243aS7Opz3OGVrej3E9vu82nv9OwAAgD8AAIA/mhnIPD2iA7vDcGO6n5w3PM7eOTxpDiO9AACAPwAAgD/N9So9EgihPNTRxrx3zni+Y1lwPWsDFb0AAAAAAAAAAIDVRz1+Xqg+Lau2PEWtq77Hbdm8zok/PQAAAAAAAAAAYOAVPo8VxD4tjAi+dV6LviLGyzyCQmC9AAAAAAAAAACa+rQ9EdXjPfmxQ7zGzpO+se2KPZW4Zj0AAAAAAAAAAM29aT0pSDi6Q15NNt6bZjF409m6EvJ8tQAAgD8AAIA/2gCfPfYENbr8Gws6Rir0NEreTzqj+CS5AACAPwAAAAAm1rc9YFN9P+3kQT5ltvW+qelfPUB3oD0AAAAAAAAAACBqUT4B2Q4/DmuAPAKX974h+2E+oa7DvQAAAAAAAAAAgMfLPYcjRz6IA++9JX6nvnaNlryR5qS9AAAAAAAAAABmR2U94J66P3PVoj4D5Li9V7OOuy6iJz0AAAAAAAAAAJSMBW51bXB5lIwFZHR5cGWUk5SMAmY0lImIh5RSlChLA4wBPJROTk5K/////0r/////SwB0lGJLEEsIhpSMAUOUdJRSlC4="
38
  },
39
  "_last_episode_starts": {
40
  ":type:": "<class 'numpy.ndarray'>",
 
44
  "_episode_num": 0,
45
  "use_sde": false,
46
  "sde_sample_freq": -1,
47
+ "_current_progress_remaining": 0.39379200000000003,
48
  "_stats_window_size": 100,
49
  "ep_info_buffer": {
50
  ":type:": "<class 'collections.deque'>",
51
+ ":serialized:": "gAWV+AsAAAAAAACMC2NvbGxlY3Rpb25zlIwFZGVxdWWUk5QpS2SGlFKUKH2UKIwBcpRHQHJU/5ULlV+MAWyUTQEBjAF0lEdAkbD51ie/YnV9lChoBkdAb37OdoWYW2gHS+NoCEdAkbGmCuloDnV9lChoBkdAc5YBAv+OwWgHTRgBaAhHQJGx0YR/ViF1fZQoaAZHQHHffZdv865oB0vmaAhHQJGyBfWtlqd1fZQoaAZHQHJD/dEb5uZoB00OAWgIR0CRsiSsKb8WdX2UKGgGR0Bwc3p0OmSAaAdNjgJoCEdAkbKOS0Sh8XV9lChoBkdAclAlbeMyamgHS/RoCEdAkbLYC+10DHV9lChoBkdAcpI9S/CZW2gHS89oCEdAkbNiEYfnwHV9lChoBkdAcvYMLncL0GgHS/NoCEdAkbQ+GO+7DnV9lChoBkdAclRdH2AXmGgHS9doCEdAkbSaRQrMDHV9lChoBkdAb/DDn/1g6WgHS9loCEdAkbUSHEdeY3V9lChoBkdAcXqksSTQmmgHS+FoCEdAkbVlY6nzhHV9lChoBkdAc3pfu1F6RmgHS8RoCEdAkbWvqHGjsXV9lChoBkdAUYYkMTewcGgHS7poCEdAkbW8OoYNzHV9lChoBkdAcRCnJT2nKmgHTQEBaAhHQJG2czN2TxJ1fZQoaAZHQHPxI/7iyY5oB0vJaAhHQJG2+lpGnXN1fZQoaAZHQHGQEL2HtWxoB0veaAhHQJG3Ls0HhS91fZQoaAZHQHBnigwoLG9oB0vtaAhHQJG4ArhBJI11fZQoaAZHQG7qkjgQ6IZoB0vcaAhHQJG4BObiIcl1fZQoaAZHQHLGryYoiLVoB00CAWgIR0CRuD+dK/VRdX2UKGgGR0BykGlgtvn9aAdL0GgIR0CRuYce8wpOdX2UKGgGR0BxlGBreqJeaAdNCQFoCEdAkboqZYxL03V9lChoBkdAYhRvAoG6gGgHTegDaAhHQJG60gU1yeZ1fZQoaAZHQG0VZcC5mRNoB0v7aAhHQJG7HCpFTeh1fZQoaAZHQHNKKGtZFG5oB033AmgIR0CRu3CQ9zOpdX2UKGgGR0BxQ7s/pt78aAdL8mgIR0CRu6njABT5dX2UKGgGR0ByaMfq5byIaAdL62gIR0CRu8dxQzk7dX2UKGgGR0BxsCS8rZrYaAdNBAFoCEdAkbvIKtxMnXV9lChoBkdAbhJ5P/JeV2gHS/VoCEdAkbwMw1zhgnV9lChoBkdAcJ9FjNIK+mgHS95oCEdAkbzbr5ZbIXV9lChoBkdAc0TpCKJl8WgHS8ZoCEdAkb0Na+vhZXV9lChoBkdAcdV9RJmNBGgHS/BoCEdAkb0XlbNbDHV9lChoBkdAcXG+QlruY2gHTQcBaAhHQJG9IjVx0dR1fZQoaAZHQHJf1HrhR65oB0vyaAhHQJHm+2SdOIt1fZQoaAZHQHDlCEg4ffZoB00FAWgIR0CR5zghr30xdX2UKGgGR0B0Kld2Pkq+aAdL+GgIR0CR6NaouPFOdX2UKGgGR0Bw6xx//echaAdNHwJoCEdAkekFGgBcRnV9lChoBkdAcGWkK/mDDmgHS+xoCEdAkekfJA+pwXV9lChoBkdAcv6nXumaY2gHS+RoCEdAkekzurp7kXV9lChoBkdAcaMiobXHzmgHTR8BaAhHQJHpPrE9+w11fZQoaAZHQG8aL876pHZoB0vbaAhHQJHpS2a2F391fZQoaAZHQHB1BwVCXyBoB0vWaAhHQJHpe9kBjnV1fZQoaAZHQHByMvqTr3VoB0v5aAhHQJHqGLMs6JZ1fZQoaAZHQHGltcOby6NoB0vHaAhHQJHqJovi97F1fZQoaAZHQHFjvBBRhttoB0v+aAhHQJHqTBGhEjR1fZQoaAZHQHMTpXdTHbRoB0vNaAhHQJHqdapxWDJ1fZQoaAZHQG8us1baAWloB0vraAhHQJHrFNHpbEB1fZQoaAZHQHIu/fKp1ihoB00DAWgIR0CR634O+ZgHdX2UKGgGR0BuUBEv0yxiaAdNTQFoCEdAkewc7yQPqnV9lChoBkdAcesFBY3eemgHS+1oCEdAkewjposZpHV9lChoBkdAbRUgmJFb3WgHS/RoCEdAkex6ABkqc3V9lChoBkdAcqGO3UhFE2gHS8poCEdAkez686FM7HV9lChoBkdAQdIHgP3BYWgHS79oCEdAke1X1FpfyHV9lChoBkdAchVNo8IRiGgHS8xoCEdAke1rFXJYDHV9lChoBkdAcu6t8NQTEmgHS+RoCEdAke2ugg5imXV9lChoBkdAbj+4ecQRPGgHS+1oCEdAke4Ia99MK3V9lChoBkdAcvsA5Jbt7mgHS9loCEdAke6cK1G9YnV9lChoBkdAckurC3w1BWgHS9toCEdAke6aePJaJXV9lChoBkdAb6HSVnmJWWgHTQkBaAhHQJHusg+yJKt1fZQoaAZHQHDKKYVqN6xoB00TAWgIR0CR7smQ8wHrdX2UKGgGR0Bydh8XvYvnaAdLyWgIR0CR7z/NZ/0/dX2UKGgGR0BwVcBFNL13aAdL+GgIR0CR75GEPDpDdX2UKGgGR0Bw5vROUMXraAdNDgFoCEdAke/X7Hhjv3V9lChoBkdAc2G3PAwfyWgHS8JoCEdAkfAgtFrmAHV9lChoBkdAcpvzImw7kmgHS85oCEdAkfFDM7lq8HV9lChoBkdAcsNxiG34K2gHS/loCEdAkfFKpgkTpXV9lChoBkdAcUId4mkWRGgHS+toCEdAkfFbaufVZ3V9lChoBkdAckLD7Ikqt2gHS9BoCEdAkfHB/Aj6e3V9lChoBkdAb8DNJOFg2WgHS+9oCEdAkfJizLOiWXV9lChoBkdAUbWJ3xFy72gHS4hoCEdAkfLCkGiYcHV9lChoBkdAbrU4bS7XhGgHTV8BaAhHQJHy5UyYXwd1fZQoaAZHQHCOafBeok1oB0vRaAhHQJHzIDwH7gt1fZQoaAZHQHFvyFsYVItoB0vgaAhHQJHzYDbJwKl1fZQoaAZHQHEiNFKCg9NoB00bAWgIR0CR87zv7WNFdX2UKGgGR0BwQOiN83MqaAdL8WgIR0CR871pj+aSdX2UKGgGR0BwDWQ4jrzHaAdNDwFoCEdAkfPVct5D7nV9lChoBkdAcd3ez2OAAmgHS+9oCEdAkfPfsRg7YHV9lChoBkdAbSfeDWbw0GgHS91oCEdAkfQ9c0Ltu3V9lChoBkdAcjZ6reZXuGgHS+5oCEdAkfRGOU+s5nV9lChoBkdAcAt+Q2dd3WgHS8toCEdAkfWAIMSbpnV9lChoBkdAcGgZ9NN8E2gHTQUBaAhHQJH1invUjLV1fZQoaAZHQHMCsR6F/QVoB0vQaAhHQJH1lV81Gb11fZQoaAZHQG1jIVM23rloB0vvaAhHQJH2R0GNaQp1fZQoaAZHQHE5frKNhmZoB0vzaAhHQJH2xmf5DZ11fZQoaAZHQHCWLH2h7E5oB0viaAhHQJH3Amu1WsB1fZQoaAZHQG5LjOTq0MRoB0vhaAhHQJH3W5e7cwh1fZQoaAZHQG/c+1KGtZFoB0vaaAhHQJH3ktDlYEJ1fZQoaAZHQHJqNCE6DGtoB0vOaAhHQJH3j+FUQ051fZQoaAZHQG7Mz3AVO9FoB0vnaAhHQJH3ocghbGF1fZQoaAZHQHOU0Ao5PuZoB0vHaAhHQJH32SdOIqN1fZQoaAZHQG/7OZb6guhoB0vRaAhHQJH39NdqtYB1fZQoaAZHQHE9CLVFx4poB0vTaAhHQJH4iRB/qgR1fZQoaAZHQHDlNKmKqGVoB0voaAhHQJH4jVawD/51fZQoaAZHQFRHuuzQeFNoB0uTaAhHQJH4nwb2lEZ1fZQoaAZHQGwOY1YQrc1oB0vfaAhHQJH4yu6mO2l1fZQoaAZHQHFL/8ZUDMhoB00LAWgIR0CR+Qlf7aZhdX2UKGgGR0BzZFDb8FY/aAdL42gIR0CR+g4z7/GVdX2UKGgGR0Bwk5gqmTC+aAdL22gIR0CR+p+mFajfdX2UKGgGR0Bw61pItlI3aAdL4mgIR0CR+01FYuCgdX2UKGgGR0BxEC04R28qaAdL5WgIR0CR+5zSkTHsdWUu"
52
  },
53
  "ep_success_buffer": {
54
  ":type:": "<class 'collections.deque'>",
55
  ":serialized:": "gAWVIAAAAAAAAACMC2NvbGxlY3Rpb25zlIwFZGVxdWWUk5QpS2SGlFKULg=="
56
  },
57
+ "_n_updates": 853,
58
  "observation_space": {
59
  ":type:": "<class 'gymnasium.spaces.box.Box'>",
60
  ":serialized:": "gAWVdwIAAAAAAACMFGd5bW5hc2l1bS5zcGFjZXMuYm94lIwDQm94lJOUKYGUfZQojAVkdHlwZZSMBW51bXB5lIwFZHR5cGWUk5SMAmY0lImIh5RSlChLA4wBPJROTk5K/////0r/////SwB0lGKMDWJvdW5kZWRfYmVsb3eUjBNudW1weS5fY29yZS5udW1lcmljlIwLX2Zyb21idWZmZXKUk5QolggAAAAAAAAAAQEBAQEBAQGUaAiMAmIxlImIh5RSlChLA4wBfJROTk5K/////0r/////SwB0lGJLCIWUjAFDlHSUUpSMDWJvdW5kZWRfYWJvdmWUaBEolggAAAAAAAAAAQEBAQEBAQGUaBVLCIWUaBl0lFKUjAZfc2hhcGWUSwiFlIwDbG93lGgRKJYgAAAAAAAAAAAAtMIAALTCAACgwAAAoMDbD0nAAACgwAAAAIAAAACAlGgLSwiFlGgZdJRSlIwEaGlnaJRoESiWIAAAAAAAAAAAALRCAAC0QgAAoEAAAKBA2w9JQAAAoEAAAIA/AACAP5RoC0sIhZRoGXSUUpSMCGxvd19yZXBylIxbWy05MC4gICAgICAgIC05MC4gICAgICAgICAtNS4gICAgICAgICAtNS4gICAgICAgICAtMy4xNDE1OTI3ICAtNS4KICAtMC4gICAgICAgICAtMC4gICAgICAgXZSMCWhpZ2hfcmVwcpSMU1s5MC4gICAgICAgIDkwLiAgICAgICAgIDUuICAgICAgICAgNS4gICAgICAgICAzLjE0MTU5MjcgIDUuCiAgMS4gICAgICAgICAxLiAgICAgICBdlIwKX25wX3JhbmRvbZROdWIu",
 
90
  "n_epochs": 4,
91
  "clip_range": {
92
  ":type:": "<class 'function'>",
93
+ ":serialized:": "gAWV1wIAAAAAAACMF2Nsb3VkcGlja2xlLmNsb3VkcGlja2xllIwOX21ha2VfZnVuY3Rpb26Uk5QoaACMDV9idWlsdGluX3R5cGWUk5SMCENvZGVUeXBllIWUUpQoSwFLAEsASwFLAUsTQwSIAFMAlE6FlCmMAV+UhZSMXi9ob21lL3VkdWdhbWF2aXRoYW5hZ2JsdS8ubG9jYWwvbGliL3B5dGhvbjMuMTAvc2l0ZS1wYWNrYWdlcy9zdGFibGVfYmFzZWxpbmVzMy9jb21tb24vdXRpbHMucHmUjARmdW5jlEuEQwIEAZSMA3ZhbJSFlCl0lFKUfZQojAtfX3BhY2thZ2VfX5SMGHN0YWJsZV9iYXNlbGluZXMzLmNvbW1vbpSMCF9fbmFtZV9flIwec3RhYmxlX2Jhc2VsaW5lczMuY29tbW9uLnV0aWxzlIwIX19maWxlX1+UjF4vaG9tZS91ZHVnYW1hdml0aGFuYWdibHUvLmxvY2FsL2xpYi9weXRob24zLjEwL3NpdGUtcGFja2FnZXMvc3RhYmxlX2Jhc2VsaW5lczMvY29tbW9uL3V0aWxzLnB5lHVOTmgAjBBfbWFrZV9lbXB0eV9jZWxslJOUKVKUhZR0lFKUaACMEl9mdW5jdGlvbl9zZXRzdGF0ZZSTlGgffZR9lChoFowEZnVuY5SMDF9fcXVhbG5hbWVfX5SMGWNvbnN0YW50X2ZuLjxsb2NhbHM+LmZ1bmOUjA9fX2Fubm90YXRpb25zX1+UfZSMDl9fa3dkZWZhdWx0c19flE6MDF9fZGVmYXVsdHNfX5ROjApfX21vZHVsZV9flGgXjAdfX2RvY19flE6MC19fY2xvc3VyZV9flGgAjApfbWFrZV9jZWxslJOURz/JmZmZmZmahZRSlIWUjBdfY2xvdWRwaWNrbGVfc3VibW9kdWxlc5RdlIwLX19nbG9iYWxzX1+UfZR1hpSGUjAu"
94
  },
95
  "clip_range_vf": null,
96
  "normalize_advantage": true,
97
  "target_kl": null,
98
  "lr_schedule": {
99
  ":type:": "<class 'function'>",
100
+ ":serialized:": "gAWV1wIAAAAAAACMF2Nsb3VkcGlja2xlLmNsb3VkcGlja2xllIwOX21ha2VfZnVuY3Rpb26Uk5QoaACMDV9idWlsdGluX3R5cGWUk5SMCENvZGVUeXBllIWUUpQoSwFLAEsASwFLAUsTQwSIAFMAlE6FlCmMAV+UhZSMXi9ob21lL3VkdWdhbWF2aXRoYW5hZ2JsdS8ubG9jYWwvbGliL3B5dGhvbjMuMTAvc2l0ZS1wYWNrYWdlcy9zdGFibGVfYmFzZWxpbmVzMy9jb21tb24vdXRpbHMucHmUjARmdW5jlEuEQwIEAZSMA3ZhbJSFlCl0lFKUfZQojAtfX3BhY2thZ2VfX5SMGHN0YWJsZV9iYXNlbGluZXMzLmNvbW1vbpSMCF9fbmFtZV9flIwec3RhYmxlX2Jhc2VsaW5lczMuY29tbW9uLnV0aWxzlIwIX19maWxlX1+UjF4vaG9tZS91ZHVnYW1hdml0aGFuYWdibHUvLmxvY2FsL2xpYi9weXRob24zLjEwL3NpdGUtcGFja2FnZXMvc3RhYmxlX2Jhc2VsaW5lczMvY29tbW9uL3V0aWxzLnB5lHVOTmgAjBBfbWFrZV9lbXB0eV9jZWxslJOUKVKUhZR0lFKUaACMEl9mdW5jdGlvbl9zZXRzdGF0ZZSTlGgffZR9lChoFowEZnVuY5SMDF9fcXVhbG5hbWVfX5SMGWNvbnN0YW50X2ZuLjxsb2NhbHM+LmZ1bmOUjA9fX2Fubm90YXRpb25zX1+UfZSMDl9fa3dkZWZhdWx0c19flE6MDF9fZGVmYXVsdHNfX5ROjApfX21vZHVsZV9flGgXjAdfX2RvY19flE6MC19fY2xvc3VyZV9flGgAjApfbWFrZV9jZWxslJOURz8zqSowVTJhhZRSlIWUjBdfY2xvdWRwaWNrbGVfc3VibW9kdWxlc5RdlIwLX19nbG9iYWxzX1+UfZR1hpSGUjAu"
101
  }
102
  }
ppo-LunarLander-v2/policy.optimizer.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:667c1e66d9303d1f30409f9391d1f75582ea8289602a950d3373f0929f692111
3
  size 88887
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e9ecbf804f43494b877aa0f95b650004712f84e981740932805386549532e20e
3
  size 88887
ppo-LunarLander-v2/policy.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:7d3064d30b04745477cf03f29481c873c1e6d5b8778daf238b8ca4f2d25fd97c
3
  size 44095
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e4865e32ecfbfdc6e007a787ba0cb6e50932fd71b8259dbd1e1240441abb497b
3
  size 44095
ppo-LunarLander-v2/system_info.txt CHANGED
@@ -1,9 +1,8 @@
1
- - OS: Linux-6.1.123+-x86_64-with-glibc2.35 # 1 SMP PREEMPT_DYNAMIC Sun Mar 30 16:01:29 UTC 2025
2
- - Python: 3.12.11
3
  - Stable-Baselines3: 2.0.0a5
4
- - PyTorch: 2.8.0+cu126
5
  - GPU Enabled: True
6
- - Numpy: 2.0.2
7
  - Cloudpickle: 3.1.1
8
  - Gymnasium: 0.28.1
9
- - OpenAI Gym: 0.25.2
 
1
+ - OS: Linux-5.15.0-136-generic-x86_64-with-glibc2.35 # 147-Ubuntu SMP Sat Mar 15 15:53:30 UTC 2025
2
+ - Python: 3.10.12
3
  - Stable-Baselines3: 2.0.0a5
4
+ - PyTorch: 2.8.0+cu128
5
  - GPU Enabled: True
6
+ - Numpy: 2.2.6
7
  - Cloudpickle: 3.1.1
8
  - Gymnasium: 0.28.1
 
replay.mp4 CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:90db9de583e2f129bf15a26884629b07a02206009a347ca97b22f6ddde363740
3
- size 148508
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:7d1e78b98c561ae4d53c00ed455d190253617243077dde948ccc9a2902e5c796
3
+ size 143978
results.json CHANGED
@@ -1 +1 @@
1
- {"mean_reward": 260.8037887, "std_reward": 19.080430760396418, "is_deterministic": true, "n_eval_episodes": 10, "eval_datetime": "2025-09-10T13:05:56.265281"}
 
1
+ {"mean_reward": 276.29566489999996, "std_reward": 15.517366313599448, "is_deterministic": true, "n_eval_episodes": 10, "eval_datetime": "2025-09-16T11:09:56.452508"}