DumbleDuck commited on
Commit
9e9dfcf
·
verified ·
1 Parent(s): e9a97e2
README.md CHANGED
@@ -16,7 +16,7 @@ model-index:
16
  type: LunarLander-v2
17
  metrics:
18
  - type: mean_reward
19
- value: 259.71 +/- 23.20
20
  name: mean_reward
21
  verified: false
22
  ---
 
16
  type: LunarLander-v2
17
  metrics:
18
  - type: mean_reward
19
+ value: 271.31 +/- 18.36
20
  name: mean_reward
21
  verified: false
22
  ---
config.json CHANGED
@@ -1 +1 @@
1
- {"policy_class": {":type:": "<class 'abc.ABCMeta'>", ":serialized:": "gAWVOwAAAAAAAACMIXN0YWJsZV9iYXNlbGluZXMzLmNvbW1vbi5wb2xpY2llc5SMEUFjdG9yQ3JpdGljUG9saWN5lJOULg==", "__module__": "stable_baselines3.common.policies", "__doc__": "\n Policy class for actor-critic algorithms (has both policy and value prediction).\n Used by A2C, PPO and the likes.\n\n :param observation_space: Observation space\n :param action_space: Action space\n :param lr_schedule: Learning rate schedule (could be constant)\n :param net_arch: The specification of the policy and value networks.\n :param activation_fn: Activation function\n :param ortho_init: Whether to use or not orthogonal initialization\n :param use_sde: Whether to use State Dependent Exploration or not\n :param log_std_init: Initial value for the log standard deviation\n :param full_std: Whether to use (n_features x n_actions) parameters\n for the std instead of only (n_features,) when using gSDE\n :param use_expln: Use ``expln()`` function instead of ``exp()`` to ensure\n a positive standard deviation (cf paper). It allows to keep variance\n above zero and prevent it from growing too fast. In practice, ``exp()`` is usually enough.\n :param squash_output: Whether to squash the output using a tanh function,\n this allows to ensure boundaries when using gSDE.\n :param features_extractor_class: Features extractor to use.\n :param features_extractor_kwargs: Keyword arguments\n to pass to the features extractor.\n :param share_features_extractor: If True, the features extractor is shared between the policy and value networks.\n :param normalize_images: Whether to normalize images or not,\n dividing by 255.0 (True by default)\n :param optimizer_class: The optimizer to use,\n ``th.optim.Adam`` by default\n :param optimizer_kwargs: Additional keyword arguments,\n excluding the learning rate, to pass to the optimizer\n ", "__init__": "<function ActorCriticPolicy.__init__ at 0x7e632f3bfe20>", "_get_constructor_parameters": "<function ActorCriticPolicy._get_constructor_parameters at 0x7e632f3bfec0>", "reset_noise": "<function ActorCriticPolicy.reset_noise at 0x7e632f3bff60>", "_build_mlp_extractor": "<function ActorCriticPolicy._build_mlp_extractor at 0x7e632f3c4040>", "_build": "<function ActorCriticPolicy._build at 0x7e632f3c40e0>", "forward": "<function ActorCriticPolicy.forward at 0x7e632f3c4180>", "extract_features": "<function ActorCriticPolicy.extract_features at 0x7e632f3c4220>", "_get_action_dist_from_latent": "<function ActorCriticPolicy._get_action_dist_from_latent at 0x7e632f3c42c0>", "_predict": "<function ActorCriticPolicy._predict at 0x7e632f3c4360>", "evaluate_actions": "<function ActorCriticPolicy.evaluate_actions at 0x7e632f3c4400>", "get_distribution": "<function ActorCriticPolicy.get_distribution at 0x7e632f3c44a0>", "predict_values": "<function ActorCriticPolicy.predict_values at 0x7e632f3c4540>", "__abstractmethods__": "frozenset()", "_abc_impl": "<_abc._abc_data object at 0x7e632f32cdc0>"}, "verbose": 1, "policy_kwargs": {}, "num_timesteps": 1015808, "_total_timesteps": 1000000, "_num_timesteps_at_start": 0, "seed": null, "action_noise": null, "start_time": 1744928601912979673, "learning_rate": 0.0003, "tensorboard_log": null, "_last_obs": {":type:": "<class 'numpy.ndarray'>", ":serialized:": "gAWVdgIAAAAAAACME251bXB5Ll9jb3JlLm51bWVyaWOUjAtfZnJvbWJ1ZmZlcpSTlCiWAAIAAAAAAACy/aq+Tg+sPkJL8T12/4S+9xGFOsbmHTwAAAAAAAAAABp2Kz6P8nS87huOuZCTDTg9cte9sci7OAAAgD8AAIA/GrJKvbtr9T3tIAw93zjqvcF/OLyLYku9AAAAAAAAAABFqLK+1sssP2jwdjqSba2+G64hvkvejDwAAAAAAAAAAFqEFT6s/io+9o5Wvi0jZL7o+TO9LC4PvQAAAAAAAAAAmuaJPAc8tT961w0/u5FCPavhTrxNnhu9AAAAAAAAAADA71a+xUurPAoAAzuPVYK5OcQ5vjKMLroAAIA/AACAP6Asj76B+bw+Xi9JPqxTj74Hkho8+rQPvQAAAAAAAAAAzcCdvdLA9zy+S/A9b8TtvYWq/zxdxde7AAAAAAAAAABacpG97grcPYWGvz0JJ0i+NA8yPe0NWrwAAAAAAAAAAJp7lD2GiEQ/dF6APVQYC7+Kp649VVFaPAAAAAAAAAAA5kDxvXtc+LpgjC27iVOduEgc6Tv4EW06AACAPwAAAADasdm9TWAKPp7RK72KsFS+zk9MvVacqj0AAAAAAAAAAA1Ujb1yOAA/FahlPWHSvL7dxgU9kAH0vAAAAAAAAAAACsSVPtKeGz7N3IS+SyBSvsCYFryOjq68AAAAAAAAAAAaaya+z8xjvGYCvbuaZja6W1bEPf3qEzsAAIA/AACAP5SMBW51bXB5lIwFZHR5cGWUk5SMAmY0lImIh5RSlChLA4wBPJROTk5K/////0r/////SwB0lGJLEEsIhpSMAUOUdJRSlC4="}, "_last_episode_starts": {":type:": "<class 'numpy.ndarray'>", ":serialized:": "gAWVhAAAAAAAAACME251bXB5Ll9jb3JlLm51bWVyaWOUjAtfZnJvbWJ1ZmZlcpSTlCiWEAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAlIwFbnVtcHmUjAVkdHlwZZSTlIwCYjGUiYiHlFKUKEsDjAF8lE5OTkr/////Sv////9LAHSUYksQhZSMAUOUdJRSlC4="}, "_last_original_obs": null, "_episode_num": 0, "use_sde": false, "sde_sample_freq": -1, "_current_progress_remaining": -0.015808000000000044, "_stats_window_size": 100, "ep_info_buffer": {":type:": "<class 'collections.deque'>", ":serialized:": "gAWVCgwAAAAAAACMC2NvbGxlY3Rpb25zlIwFZGVxdWWUk5QpS2SGlFKUKH2UKIwBcpRHQHAqbJOnEVGMAWyUTWQBjAF0lEdAniXF8b70nXV9lChoBkdAcGhBf8dgfGgHS/NoCEdAniY5C4SYgXV9lChoBkdAcCaOVgQYk2gHS/poCEdAniZEi+tbLXV9lChoBkdAb3Py+Yc/+2gHS/BoCEdAnigGi5/b03V9lChoBkdAYK/4etCAtmgHTegDaAhHQJ4osawUxmF1fZQoaAZHQHFwrPIGQjloB0v1aAhHQJ4pB2OhkAh1fZQoaAZHQDrn5XU6PsBoB0vKaAhHQJ4ppHG0eEJ1fZQoaAZHQHGI9/nW8RNoB0vfaAhHQJ4q5v2oNut1fZQoaAZHQGEMgjps41hoB03oA2gIR0CeKwYFaB7NdX2UKGgGR0BvxdEuxrzoaAdL42gIR0CeK7xZdOZcdX2UKGgGR0BtttY4hllLaAdL72gIR0CeK8nRb8m8dX2UKGgGR0Bw6AX+ERJ3aAdL/WgIR0CeK/N9ph4MdX2UKGgGR0BuhBVENOM3aAdL82gIR0CeLAnPmgandX2UKGgGR0Bic7Z6D5CXaAdN6ANoCEdAniwvLHMlknV9lChoBkdAcVxX2M85j2gHTXQBaAhHQJ4sWiO/+Kl1fZQoaAZHQHFBXFDOTq1oB0voaAhHQJ4uTbN8ma91fZQoaAZHQHDDp+c6Nl1oB00FAWgIR0CeLvrQw9JSdX2UKGgGR0BvV0oQWepXaAdL22gIR0CeL/E87p3YdX2UKGgGR0Bw9urilzltaAdL5GgIR0CeMJ1q33HrdX2UKGgGR0BzSbUsnRb9aAdNcgFoCEdAnjD1h9b5dnV9lChoBkdAckvFDOTq0WgHTVIBaAhHQJ4xpZ1V5rx1fZQoaAZHQGy5GB4D9wZoB0vxaAhHQJ4x5NHpbEB1fZQoaAZHQHDcV8G9pRJoB00kAWgIR0CeMggRbr1NdX2UKGgGR0Bw5CQRwqAjaAdL2GgIR0CeMhVB2OhkdX2UKGgGR0BwiBiCrcTKaAdL+WgIR0CeMima6STydX2UKGgGR0BwXmPDHfdiaAdL8WgIR0CeMmsY2sJZdX2UKGgGR0BwxdEw35vcaAdL9WgIR0CeMrcW0qpcdX2UKGgGR0BxEAudwvQGaAdL+GgIR0CeMwuUliSadX2UKGgGR0Bw5HwVj7Q+aAdNAAFoCEdAnjNjVtoBaXV9lChoBkdAcjEnYQJ5V2gHTS4BaAhHQJ4z5VR1oxp1fZQoaAZHQG5/MySFGodoB0vzaAhHQJ41sqDsdDJ1fZQoaAZHQHBehNRFZxJoB00XAWgIR0CeNh8IAwPAdX2UKGgGR0BwEmBg/keZaAdL92gIR0CeNrjMFEApdX2UKGgGR0Bu91xwQ176aAdL2GgIR0CeOFZU1hsqdX2UKGgGR0BwOLEXLvCuaAdL7mgIR0CeOGcriEQHdX2UKGgGR0ByAtCngpBpaAdNAQFoCEdAnjjDtG/etXV9lChoBkdAa7+1ejVQRGgHTSABaAhHQJ45ETlDF611fZQoaAZHQHE+CGrS3LFoB00DAWgIR0CeOTtzS1E3dX2UKGgGR0BwnqOdXko4aAdL6mgIR0CeOUsBQvYfdX2UKGgGR0BscsCYCyQgaAdL2mgIR0CeOaouf29MdX2UKGgGR0BwxWmtQsPKaAdL7mgIR0CeOdpaA4GVdX2UKGgGR0ByGIYP5HmSaAdNIAFoCEdAnjoxfShJy3V9lChoBkdAbWs6V+qioWgHS+loCEdAnjqpI+W4VnV9lChoBkdAcN1ITXarWGgHS+poCEdAnjz6nFYMfHV9lChoBkdAcCWgg5imVWgHS/5oCEdAnj0i1E3KjnV9lChoBkdAcNXHRCx/u2gHS/BoCEdAnj+mxt52QnV9lChoBkdAcXBqp97Wu2gHTQQBaAhHQJ5A0Cih37l1fZQoaAZHQG5qKq4pc5doB0v8aAhHQJ5A2jrRjSZ1fZQoaAZHQG6DcohIOH5oB0vlaAhHQJ5A+MaS9uh1fZQoaAZHQG9VUhvBJqZoB0vdaAhHQJ5BLLowEhd1fZQoaAZHQHD1x9gF5fNoB00AAWgIR0CeQUVbA1vVdX2UKGgGR0BroEjAzpHJaAdNCAFoCEdAnkF5dOZb6nV9lChoBkdAb8KOwxFiKGgHS+9oCEdAnkJZX2dupHV9lChoBkdAcSjQAuIykGgHTRwBaAhHQJ5CldMTN+t1fZQoaAZHQHHcSNn5BTpoB0v3aAhHQJ5FNS88La51fZQoaAZHQG/x4ptrKvFoB0v1aAhHQJ5FT4Kx9oh1fZQoaAZHQGTYILPUrkNoB03oA2gIR0CeRwr7wazedX2UKGgGR0BxoBsi0OVgaAdL6WgIR0CeSMXCTEBKdX2UKGgGR0ByEXbRF7UoaAdL5WgIR0CeSQbIcR16dX2UKGgGR0BxePFXJYDDaAdL9mgIR0CeSVMo+fRNdX2UKGgGR0BxkqnaWX1KaAdL8WgIR0CeSZpKzzErdX2UKGgGR0Bywna11GLDaAdNIgFoCEdAnknFMmF8HHV9lChoBkdARWkmplz2e2gHS9NoCEdAnkoBt52Qn3V9lChoBkdAcHO08NhE0GgHS/BoCEdAnkrFPrOZ9nV9lChoBkdAcGFh2GIsRWgHTQ8BaAhHQJ5K5sCT2WZ1fZQoaAZHQHGOVBMSK3xoB00TAWgIR0CeT6SNfgJkdX2UKGgGR0Bs+pfKISDiaAdL7WgIR0CeUBn752yLdX2UKGgGR0BjiKgdwNsnaAdN6ANoCEdAnlE23nZCfHV9lChoBkdAcBgVRDTjN2gHS9xoCEdAnlFMQ2/BWXV9lChoBkdAZL+OHWSU1WgHTegDaAhHQJ5TPGDL8rJ1fZQoaAZHQG81f16E8JVoB0v8aAhHQJ5TiM6zVtp1fZQoaAZHQHIHepCKJl9oB00gAWgIR0CeVKbhFVkudX2UKGgGR0ByuRZkkKNRaAdNOwFoCEdAnldQUYbbUXV9lChoBkdAcnz5UtI07GgHTSQBaAhHQJ5XifukUK11fZQoaAZHQG2ZvN3W4ExoB00+AWgIR0CeV8aYeDFqdX2UKGgGR0Bxh/QTmGM5aAdNOgFoCEdAnljPFWGRFXV9lChoBkdAYSTV4oqkM2gHTegDaAhHQJ5c1xbSqlx1fZQoaAZHQHFMfllsguBoB0v8aAhHQJ5c2AtnPE91fZQoaAZHQHA3QKv3ai9oB00QAWgIR0CeXSyzXz19dX2UKGgGR0BwOaMglnh9aAdL+GgIR0CeXbEcsDnvdX2UKGgGR0BtAp84PwuvaAdNQAJoCEdAnl4TshPj43V9lChoBkdAYkhX6InBtWgHTegDaAhHQJ5ekBPsRg91fZQoaAZHQG/ugTh5xBFoB0vmaAhHQJ5emMbWEsd1fZQoaAZHQG5X8/lhgE5oB0vpaAhHQJ5e9EpiI+J1fZQoaAZHQHGkjMibDuVoB00FAWgIR0CeYG0WM0gsdX2UKGgGR0Bwo++SKWLQaAdNBwFoCEdAnmIDBRAKOXV9lChoBkdAcamS4OMER2gHS/1oCEdAnmKvV3EAHXV9lChoBkdAcNqaF23az2gHTRYBaAhHQJ5i1AJLM9t1fZQoaAZHQHCAWPo3aSNoB0vbaAhHQJ5k+P7vXsh1fZQoaAZHQHElDQzDXOJoB00KAWgIR0CeZeZGKAJ+dX2UKGgGR0BwTcxJul41aAdL4WgIR0CeZkpNbkfcdX2UKGgGR0BxFBKAavRraAdL6GgIR0CeZofzjFQ3dX2UKGgGR0BtuzbBXS0CaAdL/GgIR0CeZrKnvUjLdX2UKGgGR0BwKup++dsjaAdNGQFoCEdAnmbQKKHfuXV9lChoBkdAcEeLUTcqOWgHS+VoCEdAnmbYTPBzm3V9lChoBkdAbpydhiLEUGgHTSgBaAhHQJ5nA5zYEnt1fZQoaAZHQF3IeFcpsoFoB03oA2gIR0CeZ/Syt3fRdX2UKGgGR0Bxm0OI68xsaAdL6WgIR0CeaGmvGIbgdX2UKGgGR0BwTC6+WWyDaAdL4WgIR0CeaY2t+1BudX2UKGgGR0BzCL0se4kNaAdL+mgIR0CeawO0LMLXdWUu"}, "ep_success_buffer": {":type:": "<class 'collections.deque'>", ":serialized:": "gAWVIAAAAAAAAACMC2NvbGxlY3Rpb25zlIwFZGVxdWWUk5QpS2SGlFKULg=="}, "_n_updates": 310, "observation_space": {":type:": "<class 'gymnasium.spaces.box.Box'>", ":serialized:": "gAWVdwIAAAAAAACMFGd5bW5hc2l1bS5zcGFjZXMuYm94lIwDQm94lJOUKYGUfZQojAVkdHlwZZSMBW51bXB5lIwFZHR5cGWUk5SMAmY0lImIh5RSlChLA4wBPJROTk5K/////0r/////SwB0lGKMDWJvdW5kZWRfYmVsb3eUjBNudW1weS5fY29yZS5udW1lcmljlIwLX2Zyb21idWZmZXKUk5QolggAAAAAAAAAAQEBAQEBAQGUaAiMAmIxlImIh5RSlChLA4wBfJROTk5K/////0r/////SwB0lGJLCIWUjAFDlHSUUpSMDWJvdW5kZWRfYWJvdmWUaBEolggAAAAAAAAAAQEBAQEBAQGUaBVLCIWUaBl0lFKUjAZfc2hhcGWUSwiFlIwDbG93lGgRKJYgAAAAAAAAAAAAtMIAALTCAACgwAAAoMDbD0nAAACgwAAAAIAAAACAlGgLSwiFlGgZdJRSlIwEaGlnaJRoESiWIAAAAAAAAAAAALRCAAC0QgAAoEAAAKBA2w9JQAAAoEAAAIA/AACAP5RoC0sIhZRoGXSUUpSMCGxvd19yZXBylIxbWy05MC4gICAgICAgIC05MC4gICAgICAgICAtNS4gICAgICAgICAtNS4gICAgICAgICAtMy4xNDE1OTI3ICAtNS4KICAtMC4gICAgICAgICAtMC4gICAgICAgXZSMCWhpZ2hfcmVwcpSMU1s5MC4gICAgICAgIDkwLiAgICAgICAgIDUuICAgICAgICAgNS4gICAgICAgICAzLjE0MTU5MjcgIDUuCiAgMS4gICAgICAgICAxLiAgICAgICBdlIwKX25wX3JhbmRvbZROdWIu", "dtype": "float32", "bounded_below": "[ True True True True True True True True]", "bounded_above": "[ True True True True True True True True]", "_shape": [8], "low": "[-90. -90. -5. -5. -3.1415927 -5.\n -0. -0. ]", "high": "[90. 90. 5. 5. 3.1415927 5.\n 1. 1. ]", "low_repr": "[-90. -90. -5. -5. -3.1415927 -5.\n -0. -0. ]", "high_repr": "[90. 90. 5. 5. 3.1415927 5.\n 1. 1. ]", "_np_random": null}, "action_space": {":type:": "<class 'gymnasium.spaces.discrete.Discrete'>", ":serialized:": "gAWV3AAAAAAAAACMGWd5bW5hc2l1bS5zcGFjZXMuZGlzY3JldGWUjAhEaXNjcmV0ZZSTlCmBlH2UKIwBbpSMFm51bXB5Ll9jb3JlLm11bHRpYXJyYXmUjAZzY2FsYXKUk5SMBW51bXB5lIwFZHR5cGWUk5SMAmk4lImIh5RSlChLA4wBPJROTk5K/////0r/////SwB0lGJDCAQAAAAAAAAAlIaUUpSMBXN0YXJ0lGgIaA5DCAAAAAAAAAAAlIaUUpSMBl9zaGFwZZQpjAVkdHlwZZRoDowKX25wX3JhbmRvbZROdWIu", "n": "4", "start": "0", "_shape": [], "dtype": "int64", "_np_random": null}, "n_envs": 16, "n_steps": 2048, "gamma": 0.99, "gae_lambda": 0.95, "ent_coef": 0.0, "vf_coef": 0.5, "max_grad_norm": 0.5, "batch_size": 64, "n_epochs": 10, "clip_range": {":type:": "<class 'function'>", ":serialized:": "gAWV1gIAAAAAAACMF2Nsb3VkcGlja2xlLmNsb3VkcGlja2xllIwOX21ha2VfZnVuY3Rpb26Uk5QoaACMDV9idWlsdGluX3R5cGWUk5SMCENvZGVUeXBllIWUUpQoSwFLAEsASwFLAUsTQwiVAZcAiQFTAJROhZQpjAFflIWUjEkvdXNyL2xvY2FsL2xpYi9weXRob24zLjExL2Rpc3QtcGFja2FnZXMvc3RhYmxlX2Jhc2VsaW5lczMvY29tbW9uL3V0aWxzLnB5lIwEZnVuY5SMGWNvbnN0YW50X2ZuLjxsb2NhbHM+LmZ1bmOUS4RDCPiAANgPEogKlEMAlIwDdmFslIWUKXSUUpR9lCiMC19fcGFja2FnZV9flIwYc3RhYmxlX2Jhc2VsaW5lczMuY29tbW9ulIwIX19uYW1lX1+UjB5zdGFibGVfYmFzZWxpbmVzMy5jb21tb24udXRpbHOUjAhfX2ZpbGVfX5SMSS91c3IvbG9jYWwvbGliL3B5dGhvbjMuMTEvZGlzdC1wYWNrYWdlcy9zdGFibGVfYmFzZWxpbmVzMy9jb21tb24vdXRpbHMucHmUdU5OaACMEF9tYWtlX2VtcHR5X2NlbGyUk5QpUpSFlHSUUpRoAIwSX2Z1bmN0aW9uX3NldHN0YXRllJOUaCF9lH2UKGgYjARmdW5jlIwMX19xdWFsbmFtZV9flIwZY29uc3RhbnRfZm4uPGxvY2Fscz4uZnVuY5SMD19fYW5ub3RhdGlvbnNfX5R9lIwOX19rd2RlZmF1bHRzX1+UTowMX19kZWZhdWx0c19flE6MCl9fbW9kdWxlX1+UaBmMB19fZG9jX1+UTowLX19jbG9zdXJlX1+UaACMCl9tYWtlX2NlbGyUk5RHP8mZmZmZmZqFlFKUhZSMF19jbG91ZHBpY2tsZV9zdWJtb2R1bGVzlF2UjAtfX2dsb2JhbHNfX5R9lHWGlIZSMC4="}, "clip_range_vf": null, "normalize_advantage": true, "target_kl": null, "lr_schedule": {":type:": "<class 'function'>", ":serialized:": "gAWV1gIAAAAAAACMF2Nsb3VkcGlja2xlLmNsb3VkcGlja2xllIwOX21ha2VfZnVuY3Rpb26Uk5QoaACMDV9idWlsdGluX3R5cGWUk5SMCENvZGVUeXBllIWUUpQoSwFLAEsASwFLAUsTQwiVAZcAiQFTAJROhZQpjAFflIWUjEkvdXNyL2xvY2FsL2xpYi9weXRob24zLjExL2Rpc3QtcGFja2FnZXMvc3RhYmxlX2Jhc2VsaW5lczMvY29tbW9uL3V0aWxzLnB5lIwEZnVuY5SMGWNvbnN0YW50X2ZuLjxsb2NhbHM+LmZ1bmOUS4RDCPiAANgPEogKlEMAlIwDdmFslIWUKXSUUpR9lCiMC19fcGFja2FnZV9flIwYc3RhYmxlX2Jhc2VsaW5lczMuY29tbW9ulIwIX19uYW1lX1+UjB5zdGFibGVfYmFzZWxpbmVzMy5jb21tb24udXRpbHOUjAhfX2ZpbGVfX5SMSS91c3IvbG9jYWwvbGliL3B5dGhvbjMuMTEvZGlzdC1wYWNrYWdlcy9zdGFibGVfYmFzZWxpbmVzMy9jb21tb24vdXRpbHMucHmUdU5OaACMEF9tYWtlX2VtcHR5X2NlbGyUk5QpUpSFlHSUUpRoAIwSX2Z1bmN0aW9uX3NldHN0YXRllJOUaCF9lH2UKGgYjARmdW5jlIwMX19xdWFsbmFtZV9flIwZY29uc3RhbnRfZm4uPGxvY2Fscz4uZnVuY5SMD19fYW5ub3RhdGlvbnNfX5R9lIwOX19rd2RlZmF1bHRzX1+UTowMX19kZWZhdWx0c19flE6MCl9fbW9kdWxlX1+UaBmMB19fZG9jX1+UTowLX19jbG9zdXJlX1+UaACMCl9tYWtlX2NlbGyUk5RHPzOpKjBVMmGFlFKUhZSMF19jbG91ZHBpY2tsZV9zdWJtb2R1bGVzlF2UjAtfX2dsb2JhbHNfX5R9lHWGlIZSMC4="}, "system_info": {"OS": "Linux-6.1.123+-x86_64-with-glibc2.35 # 1 SMP PREEMPT_DYNAMIC Sun Mar 30 16:01:29 UTC 2025", "Python": "3.11.12", "Stable-Baselines3": "2.0.0a5", "PyTorch": "2.6.0+cu124", "GPU Enabled": "True", "Numpy": "2.0.2", "Cloudpickle": "3.1.1", "Gymnasium": "0.28.1", "OpenAI Gym": "0.25.2"}}
 
1
+ {"policy_class": {":type:": "<class 'abc.ABCMeta'>", ":serialized:": "gAWVOwAAAAAAAACMIXN0YWJsZV9iYXNlbGluZXMzLmNvbW1vbi5wb2xpY2llc5SMEUFjdG9yQ3JpdGljUG9saWN5lJOULg==", "__module__": "stable_baselines3.common.policies", "__doc__": "\n Policy class for actor-critic algorithms (has both policy and value prediction).\n Used by A2C, PPO and the likes.\n\n :param observation_space: Observation space\n :param action_space: Action space\n :param lr_schedule: Learning rate schedule (could be constant)\n :param net_arch: The specification of the policy and value networks.\n :param activation_fn: Activation function\n :param ortho_init: Whether to use or not orthogonal initialization\n :param use_sde: Whether to use State Dependent Exploration or not\n :param log_std_init: Initial value for the log standard deviation\n :param full_std: Whether to use (n_features x n_actions) parameters\n for the std instead of only (n_features,) when using gSDE\n :param use_expln: Use ``expln()`` function instead of ``exp()`` to ensure\n a positive standard deviation (cf paper). It allows to keep variance\n above zero and prevent it from growing too fast. In practice, ``exp()`` is usually enough.\n :param squash_output: Whether to squash the output using a tanh function,\n this allows to ensure boundaries when using gSDE.\n :param features_extractor_class: Features extractor to use.\n :param features_extractor_kwargs: Keyword arguments\n to pass to the features extractor.\n :param share_features_extractor: If True, the features extractor is shared between the policy and value networks.\n :param normalize_images: Whether to normalize images or not,\n dividing by 255.0 (True by default)\n :param optimizer_class: The optimizer to use,\n ``th.optim.Adam`` by default\n :param optimizer_kwargs: Additional keyword arguments,\n excluding the learning rate, to pass to the optimizer\n ", "__init__": "<function ActorCriticPolicy.__init__ at 0x7e6e8ed8d6c0>", "_get_constructor_parameters": "<function ActorCriticPolicy._get_constructor_parameters at 0x7e6e8ed8d760>", "reset_noise": "<function ActorCriticPolicy.reset_noise at 0x7e6e8ed8d800>", "_build_mlp_extractor": "<function ActorCriticPolicy._build_mlp_extractor at 0x7e6e8ed8d8a0>", "_build": "<function ActorCriticPolicy._build at 0x7e6e8ed8d940>", "forward": "<function ActorCriticPolicy.forward at 0x7e6e8ed8d9e0>", "extract_features": "<function ActorCriticPolicy.extract_features at 0x7e6e8ed8da80>", "_get_action_dist_from_latent": "<function ActorCriticPolicy._get_action_dist_from_latent at 0x7e6e8ed8db20>", "_predict": "<function ActorCriticPolicy._predict at 0x7e6e8ed8dbc0>", "evaluate_actions": "<function ActorCriticPolicy.evaluate_actions at 0x7e6e8ed8dc60>", "get_distribution": "<function ActorCriticPolicy.get_distribution at 0x7e6e8ed8dd00>", "predict_values": "<function ActorCriticPolicy.predict_values at 0x7e6e8ed8dda0>", "__abstractmethods__": "frozenset()", "_abc_impl": "<_abc._abc_data object at 0x7e6e8f1cf9c0>"}, "verbose": 1, "policy_kwargs": {}, "num_timesteps": 1015808, "_total_timesteps": 1000000, "_num_timesteps_at_start": 0, "seed": null, "action_noise": null, "start_time": 1744934599250485401, "learning_rate": 0.0003, "tensorboard_log": null, "_last_obs": {":type:": "<class 'numpy.ndarray'>", ":serialized:": "gAWVdgIAAAAAAACME251bXB5Ll9jb3JlLm51bWVyaWOUjAtfZnJvbWJ1ZmZlcpSTlCiWAAIAAAAAAAB6uxs+tkBXvGoHDjuz2dS5xNrFvUOVkboAAIA/AACAPwY+RL6PWX28Ox77upLKGbkXLts9c4ocOgAAgD8AAIA/esxAPvbwUbzynZw6TRKTuHeetL2jI7+5AACAPwAAgD8Nh7I9kqOUPiJSGDxGS7W+PPVKPe4tjzsAAAAAAAAAAHPHyb1cY126ILrsuc+9ALgh55K6KRgOOQAAgD8AAIA/gIiyPb6Nqz/8Ogw/PYLKvk1NLrwwLPs9AAAAAAAAAAAWHJM+0y8GPwmItr0rkvK+XpkUPsw+hr0AAAAAAAAAAGar870ePMA943FfPsmFVb78HIY9vlRYvAAAAAAAAAAAZoPdPaDS1D5v8YS9eX4IvyAsSD2p1oy8AAAAAAAAAABaQoE+VYBaPsbB672Vona+5mJzPW5bIr0AAAAAAAAAAACcxT1yXpc/RosUPqD1Qb+fZRg9OkERvQAAAAAAAAAAAiegvqfP3z6byY29vgHxvrUbd75yYRM+AAAAAAAAAABaxm0+lM38PmN8nD3pgAW/SL8rPnr7g7wAAAAAAAAAADNBIDxpK3E/9uILPDMNL7+pTCg8v/isuwAAAAAAAAAAIDMovi7ugbzisRs7ByVhOaqJ7z3jcVO6AACAPwAAgD/NYnk8KYehPx5zBT5Rniy/heUpPGifcT0AAAAAAAAAAJSMBW51bXB5lIwFZHR5cGWUk5SMAmY0lImIh5RSlChLA4wBPJROTk5K/////0r/////SwB0lGJLEEsIhpSMAUOUdJRSlC4="}, "_last_episode_starts": {":type:": "<class 'numpy.ndarray'>", ":serialized:": "gAWVhAAAAAAAAACME251bXB5Ll9jb3JlLm51bWVyaWOUjAtfZnJvbWJ1ZmZlcpSTlCiWEAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAlIwFbnVtcHmUjAVkdHlwZZSTlIwCYjGUiYiHlFKUKEsDjAF8lE5OTkr/////Sv////9LAHSUYksQhZSMAUOUdJRSlC4="}, "_last_original_obs": null, "_episode_num": 0, "use_sde": false, "sde_sample_freq": -1, "_current_progress_remaining": -0.015808000000000044, "_stats_window_size": 100, "ep_info_buffer": {":type:": "<class 'collections.deque'>", ":serialized:": "gAWV/AsAAAAAAACMC2NvbGxlY3Rpb25zlIwFZGVxdWWUk5QpS2SGlFKUKH2UKIwBcpRHQHHP/1+RYA+MAWyUS+2MAXSUR0CZ4G2LYPGydX2UKGgGR0BLJeUhV2idaAdLr2gIR0CZ4Oai9IwudX2UKGgGR0BxZnZqVQhwaAdL8mgIR0CZ4g3gDRtxdX2UKGgGR0BxvB8+iaiLaAdLrGgIR0CZ4g1s+FDfdX2UKGgGR0ByYds0pEx7aAdL/GgIR0CZ4kSJj2BbdX2UKGgGR0Bx0gcOskpraAdL6mgIR0CZ5eYDklu4dX2UKGgGR0BvOUuctoSMaAdL4GgIR0CZ5sE+gUUPdX2UKGgGR0Bxmwxzq8lHaAdL82gIR0CZ5sAMUh3adX2UKGgGR0Bw9/t8eCCjaAdL5mgIR0CZ6NH2RJVbdX2UKGgGR0BxUTW1+iJwaAdLsWgIR0CZ6OtEXtSidX2UKGgGR0BwMX9rGipOaAdL3GgIR0CZ6Q12q1gIdX2UKGgGR0Bhtb3XZoPDaAdN6ANoCEdAmenLi6xxDXV9lChoBkdAbXTQswtap2gHTU4BaAhHQJnqHKlpGnZ1fZQoaAZHQHJCmH1vl2hoB00qAWgIR0CZ6kg0j1PFdX2UKGgGR0BwHbanJkoXaAdL6WgIR0CZ6rfCyhSMdX2UKGgGR0Bxg8jps41haAdNBwFoCEdAmevdnCfpU3V9lChoBkdAYH8ZlWfbsWgHTegDaAhHQJntKiQDFId1fZQoaAZHQHF9g3T/hl1oB0vmaAhHQJnuL7/GVA11fZQoaAZHQGJ4qsdT5whoB03oA2gIR0CZ7rULUkOadX2UKGgGR0BwWupwS8J2aAdNAAFoCEdAme78PJ7swHV9lChoBkdAcxpo/RmbsmgHS8loCEdAme8w8OkLyHV9lChoBkdAYxabjLjgh2gHTegDaAhHQJnviaTfR/p1fZQoaAZHQHBqomPYFq1oB0vWaAhHQJnvoiKR+0B1fZQoaAZHQHIRPEwWWQhoB0vAaAhHQJnv+lvZRKp1fZQoaAZHwC+l7x/d69loB0uYaAhHQJnwewFC9h91fZQoaAZHQHAPzYAbQ1JoB0v8aAhHQJnwwdlum791fZQoaAZHQHDWjJp35etoB0vgaAhHQJnw/H3lCC11fZQoaAZHQG/kHryDqW1oB0vCaAhHQJnymG34Kx91fZQoaAZHQHGV/epGWldoB005AWgIR0CZ8uBCUorndX2UKGgGR0Bwxbww0wajaAdLsGgIR0CZ82xs2vSudX2UKGgGR0BxaUbuMMqjaAdLzmgIR0CZ88yQxN7CdX2UKGgGR0BxuovduYQbaAdLwmgIR0CZ9FhS9/SZdX2UKGgGR0BG5wIUrTYvaAdLwmgIR0CZ9LnIQvpRdX2UKGgGR0BwiVYmsvIwaAdL82gIR0CZ9ojc2zfKdX2UKGgGR0Bvtk2P1ct5aAdL7mgIR0CZ9un7YTTOdX2UKGgGR0BsmYUvf0mMaAdL3WgIR0CZ9vzpHI6sdX2UKGgGR0BwRpmWdEsraAdL2WgIR0CZ9zdcjZ+QdX2UKGgGR0BvUDxgAp8XaAdL1WgIR0CZ92exfOUudX2UKGgGR0Bue+vECNjtaAdLxWgIR0CZ+TYJE6T4dX2UKGgGR0Bx1iKaXrt3aAdL5GgIR0CZ+8OrQw9JdX2UKGgGR0BuLrDuSfUXaAdL1WgIR0CZ/KWBjFyadX2UKGgGR0ByRUl8gIQfaAdNEAFoCEdAmfzxaC+UQnV9lChoBkdAZR9bdJrckGgHTegDaAhHQJn8/RSgoPV1fZQoaAZHQHDz5rYXfqJoB00BAWgIR0CZ/bnlGPPtdX2UKGgGR0BwrOfkFOfvaAdLr2gIR0CZ/kMewLVndX2UKGgGR0BxhyWX1J18aAdLymgIR0CZ/wgNPP9ldX2UKGgGR0BuoKLIgeRxaAdLwWgIR0CZ/yj+aScLdX2UKGgGR0BzBOWTot+TaAdNGwFoCEdAmf+Wt6ol2XV9lChoBkdAYLG8Gs3hoGgHTegDaAhHQJn/qUliSaF1fZQoaAZHQHGUqnaWX1JoB0vaaAhHQJn/tFI/Z/V1fZQoaAZHwDE7ABT4tYloB0uHaAhHQJoAdQsPJ7t1fZQoaAZHQG5D5k078vVoB0vVaAhHQJoDXNpudf91fZQoaAZHQG4ODCP6sQxoB0vVaAhHQJoDiyUs4DN1fZQoaAZHQHCQm9DhLoRoB0viaAhHQJoD/7Kq4pd1fZQoaAZHQHA3u+M6zVtoB0vSaAhHQJoECdQO4G51fZQoaAZHQHHdl7MPjGVoB01dAWgIR0CaBTJIUahpdX2UKGgGR0BuViB/ZuhsaAdL02gIR0CaBX8NQTEjdX2UKGgGR0BwyFkGzKLbaAdL72gIR0CaBkz2exwAdX2UKGgGR0BlyP5i3G4raAdN6ANoCEdAmgZqR2bG3nV9lChoBkdAch6PykKu0WgHS99oCEdAmgaJ0bLlm3V9lChoBkdAcK4W6bvw3GgHS+BoCEdAmgaIDs+mnHV9lChoBkdAclkjX4CZGGgHS+loCEdAmgatgBtDUnV9lChoBkdAcgqJ6po9LmgHTRoBaAhHQJoGyh11W811fZQoaAZHQHGQjundfsxoB00BAWgIR0CaCBSfDk2hdX2UKGgGR0BxCKup0fYBaAdLqWgIR0CaCeDPnjhldX2UKGgGR0BzUytJWeYlaAdL5WgIR0CaCf7eVLSNdX2UKGgGR0BxRzag2606aAdL2GgIR0CaCjXCj1wpdX2UKGgGR0Biug2uPmxMaAdN6ANoCEdAmgpFlkH2RXV9lChoBkdAcNspmEoOQWgHS+1oCEdAmgrNvKlpGnV9lChoBkdAcgxsOoYNzGgHTQgBaAhHQJoLHm2b5M11fZQoaAZHQHHpkeIVM25oB0u2aAhHQJoLN+c6Nl11fZQoaAZHQHDcU2pAD7toB0vEaAhHQJoLs32mHgx1fZQoaAZHQHDojUVi4KBoB0vSaAhHQJoMPgccU/R1fZQoaAZHQHB9BeC04R5oB0v7aAhHQJoMUfgaWHF1fZQoaAZHQHGKeDjBEa5oB0voaAhHQJoMcBltj1B1fZQoaAZHQHLZnDziCJ5oB00EAWgIR0CaDZLcbiqAdX2UKGgGR0ByH/987ZFoaAdL1mgIR0CaDdGgSOBEdX2UKGgGR0BhJhmZmZmaaAdN6ANoCEdAmg3QUUO/cnV9lChoBkdAb1X1SwW30GgHS8BoCEdAmg74+bExZnV9lChoBkdAcKlJuVHFxWgHS8BoCEdAmg9CaJAMUnV9lChoBkdAb09rGipNsWgHS8ZoCEdAmg/62KEWZnV9lChoBkdAcwMRgJC0GGgHTXYBaAhHQJoQWGqPwNN1fZQoaAZHQHFtCBbwBo5oB0v3aAhHQJoQsh5gPVd1fZQoaAZHQHIieGfwqiJoB00LAWgIR0CaEO2n889wdX2UKGgGR0BvQedXko4NaAdLxGgIR0CaEYqnWJ7+dX2UKGgGR0BzBis4ku6FaAdL82gIR0CaEhlO45LidX2UKGgGR0ByK9tgrpaBaAdL4GgIR0CaEh9QoCuEdX2UKGgGR0BySDPqs2ehaAdNFgFoCEdAmhKDnmq5snV9lChoBkdAcX2r4nF5wGgHS71oCEdAmhQn9aUzK3V9lChoBkdAcTtIvJzT4WgHS/ZoCEdAmhR6W9lEqnV9lChoBkdAYch2alUIcGgHTegDaAhHQJoVCrp7kXF1fZQoaAZHQHEyV/x2B8RoB00cAWgIR0CaFWJ1aGHpdX2UKGgGR0Bw/Yqur6tUaAdLyGgIR0CaFZASnLq2dX2UKGgGR0BuKlAgPmPpaAdLxGgIR0CaFde5WilBdX2UKGgGR0BwjC0w8GLUaAdL8GgIR0CaFf7bcoH+dX2UKGgGR0By8dNg0CRwaAdNMgFoCEdAmhZGF8G9pXV9lChoBkdAcF/IQvpQlGgHS8xoCEdAmhatGViWmnV9lChoBkdAcZgM23rleWgHS9xoCEdAmhbXtfG+9XV9lChoBkdAcWaITGo73mgHS8xoCEdAmhfUPMB6r3V9lChoBkdAcITCvHLidmgHS79oCEdAmhfkqUeMh3VlLg=="}, "ep_success_buffer": {":type:": "<class 'collections.deque'>", ":serialized:": "gAWVIAAAAAAAAACMC2NvbGxlY3Rpb25zlIwFZGVxdWWUk5QpS2SGlFKULg=="}, "_n_updates": 310, "observation_space": {":type:": "<class 'gymnasium.spaces.box.Box'>", ":serialized:": "gAWVdwIAAAAAAACMFGd5bW5hc2l1bS5zcGFjZXMuYm94lIwDQm94lJOUKYGUfZQojAVkdHlwZZSMBW51bXB5lIwFZHR5cGWUk5SMAmY0lImIh5RSlChLA4wBPJROTk5K/////0r/////SwB0lGKMDWJvdW5kZWRfYmVsb3eUjBNudW1weS5fY29yZS5udW1lcmljlIwLX2Zyb21idWZmZXKUk5QolggAAAAAAAAAAQEBAQEBAQGUaAiMAmIxlImIh5RSlChLA4wBfJROTk5K/////0r/////SwB0lGJLCIWUjAFDlHSUUpSMDWJvdW5kZWRfYWJvdmWUaBEolggAAAAAAAAAAQEBAQEBAQGUaBVLCIWUaBl0lFKUjAZfc2hhcGWUSwiFlIwDbG93lGgRKJYgAAAAAAAAAAAAtMIAALTCAACgwAAAoMDbD0nAAACgwAAAAIAAAACAlGgLSwiFlGgZdJRSlIwEaGlnaJRoESiWIAAAAAAAAAAAALRCAAC0QgAAoEAAAKBA2w9JQAAAoEAAAIA/AACAP5RoC0sIhZRoGXSUUpSMCGxvd19yZXBylIxbWy05MC4gICAgICAgIC05MC4gICAgICAgICAtNS4gICAgICAgICAtNS4gICAgICAgICAtMy4xNDE1OTI3ICAtNS4KICAtMC4gICAgICAgICAtMC4gICAgICAgXZSMCWhpZ2hfcmVwcpSMU1s5MC4gICAgICAgIDkwLiAgICAgICAgIDUuICAgICAgICAgNS4gICAgICAgICAzLjE0MTU5MjcgIDUuCiAgMS4gICAgICAgICAxLiAgICAgICBdlIwKX25wX3JhbmRvbZROdWIu", "dtype": "float32", "bounded_below": "[ True True True True True True True True]", "bounded_above": "[ True True True True True True True True]", "_shape": [8], "low": "[-90. -90. -5. -5. -3.1415927 -5.\n -0. -0. ]", "high": "[90. 90. 5. 5. 3.1415927 5.\n 1. 1. ]", "low_repr": "[-90. -90. -5. -5. -3.1415927 -5.\n -0. -0. ]", "high_repr": "[90. 90. 5. 5. 3.1415927 5.\n 1. 1. ]", "_np_random": null}, "action_space": {":type:": "<class 'gymnasium.spaces.discrete.Discrete'>", ":serialized:": "gAWV3AAAAAAAAACMGWd5bW5hc2l1bS5zcGFjZXMuZGlzY3JldGWUjAhEaXNjcmV0ZZSTlCmBlH2UKIwBbpSMFm51bXB5Ll9jb3JlLm11bHRpYXJyYXmUjAZzY2FsYXKUk5SMBW51bXB5lIwFZHR5cGWUk5SMAmk4lImIh5RSlChLA4wBPJROTk5K/////0r/////SwB0lGJDCAQAAAAAAAAAlIaUUpSMBXN0YXJ0lGgIaA5DCAAAAAAAAAAAlIaUUpSMBl9zaGFwZZQpjAVkdHlwZZRoDowKX25wX3JhbmRvbZROdWIu", "n": "4", "start": "0", "_shape": [], "dtype": "int64", "_np_random": null}, "n_envs": 16, "n_steps": 2048, "gamma": 0.99, "gae_lambda": 0.95, "ent_coef": 0.015, "vf_coef": 0.5, "max_grad_norm": 0.5, "batch_size": 64, "n_epochs": 10, "clip_range": {":type:": "<class 'function'>", ":serialized:": "gAWV1gIAAAAAAACMF2Nsb3VkcGlja2xlLmNsb3VkcGlja2xllIwOX21ha2VfZnVuY3Rpb26Uk5QoaACMDV9idWlsdGluX3R5cGWUk5SMCENvZGVUeXBllIWUUpQoSwFLAEsASwFLAUsTQwiVAZcAiQFTAJROhZQpjAFflIWUjEkvdXNyL2xvY2FsL2xpYi9weXRob24zLjExL2Rpc3QtcGFja2FnZXMvc3RhYmxlX2Jhc2VsaW5lczMvY29tbW9uL3V0aWxzLnB5lIwEZnVuY5SMGWNvbnN0YW50X2ZuLjxsb2NhbHM+LmZ1bmOUS4RDCPiAANgPEogKlEMAlIwDdmFslIWUKXSUUpR9lCiMC19fcGFja2FnZV9flIwYc3RhYmxlX2Jhc2VsaW5lczMuY29tbW9ulIwIX19uYW1lX1+UjB5zdGFibGVfYmFzZWxpbmVzMy5jb21tb24udXRpbHOUjAhfX2ZpbGVfX5SMSS91c3IvbG9jYWwvbGliL3B5dGhvbjMuMTEvZGlzdC1wYWNrYWdlcy9zdGFibGVfYmFzZWxpbmVzMy9jb21tb24vdXRpbHMucHmUdU5OaACMEF9tYWtlX2VtcHR5X2NlbGyUk5QpUpSFlHSUUpRoAIwSX2Z1bmN0aW9uX3NldHN0YXRllJOUaCF9lH2UKGgYjARmdW5jlIwMX19xdWFsbmFtZV9flIwZY29uc3RhbnRfZm4uPGxvY2Fscz4uZnVuY5SMD19fYW5ub3RhdGlvbnNfX5R9lIwOX19rd2RlZmF1bHRzX1+UTowMX19kZWZhdWx0c19flE6MCl9fbW9kdWxlX1+UaBmMB19fZG9jX1+UTowLX19jbG9zdXJlX1+UaACMCl9tYWtlX2NlbGyUk5RHP8mZmZmZmZqFlFKUhZSMF19jbG91ZHBpY2tsZV9zdWJtb2R1bGVzlF2UjAtfX2dsb2JhbHNfX5R9lHWGlIZSMC4="}, "clip_range_vf": null, "normalize_advantage": true, "target_kl": null, "lr_schedule": {":type:": "<class 'function'>", ":serialized:": "gAWV1gIAAAAAAACMF2Nsb3VkcGlja2xlLmNsb3VkcGlja2xllIwOX21ha2VfZnVuY3Rpb26Uk5QoaACMDV9idWlsdGluX3R5cGWUk5SMCENvZGVUeXBllIWUUpQoSwFLAEsASwFLAUsTQwiVAZcAiQFTAJROhZQpjAFflIWUjEkvdXNyL2xvY2FsL2xpYi9weXRob24zLjExL2Rpc3QtcGFja2FnZXMvc3RhYmxlX2Jhc2VsaW5lczMvY29tbW9uL3V0aWxzLnB5lIwEZnVuY5SMGWNvbnN0YW50X2ZuLjxsb2NhbHM+LmZ1bmOUS4RDCPiAANgPEogKlEMAlIwDdmFslIWUKXSUUpR9lCiMC19fcGFja2FnZV9flIwYc3RhYmxlX2Jhc2VsaW5lczMuY29tbW9ulIwIX19uYW1lX1+UjB5zdGFibGVfYmFzZWxpbmVzMy5jb21tb24udXRpbHOUjAhfX2ZpbGVfX5SMSS91c3IvbG9jYWwvbGliL3B5dGhvbjMuMTEvZGlzdC1wYWNrYWdlcy9zdGFibGVfYmFzZWxpbmVzMy9jb21tb24vdXRpbHMucHmUdU5OaACMEF9tYWtlX2VtcHR5X2NlbGyUk5QpUpSFlHSUUpRoAIwSX2Z1bmN0aW9uX3NldHN0YXRllJOUaCF9lH2UKGgYjARmdW5jlIwMX19xdWFsbmFtZV9flIwZY29uc3RhbnRfZm4uPGxvY2Fscz4uZnVuY5SMD19fYW5ub3RhdGlvbnNfX5R9lIwOX19rd2RlZmF1bHRzX1+UTowMX19kZWZhdWx0c19flE6MCl9fbW9kdWxlX1+UaBmMB19fZG9jX1+UTowLX19jbG9zdXJlX1+UaACMCl9tYWtlX2NlbGyUk5RHPzOpKjBVMmGFlFKUhZSMF19jbG91ZHBpY2tsZV9zdWJtb2R1bGVzlF2UjAtfX2dsb2JhbHNfX5R9lHWGlIZSMC4="}, "system_info": {"OS": "Linux-6.1.123+-x86_64-with-glibc2.35 # 1 SMP PREEMPT_DYNAMIC Sun Mar 30 16:01:29 UTC 2025", "Python": "3.11.12", "Stable-Baselines3": "2.0.0a5", "PyTorch": "2.6.0+cu124", "GPU Enabled": "True", "Numpy": "2.0.2", "Cloudpickle": "3.1.1", "Gymnasium": "0.28.1", "OpenAI Gym": "0.25.2"}}
ppo-LunarLander-v2.zip CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:f1dfcd7833e791e9d63fbd905d84b0dbf17144a7b44b2fc2f2c2d817262c616e
3
- size 148055
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:9ebdcdee26b73e0c5cdba478998addf2d19b5b87d5a4ef1df33171953768d342
3
+ size 148041
ppo-LunarLander-v2/data CHANGED
@@ -4,20 +4,20 @@
4
  ":serialized:": "gAWVOwAAAAAAAACMIXN0YWJsZV9iYXNlbGluZXMzLmNvbW1vbi5wb2xpY2llc5SMEUFjdG9yQ3JpdGljUG9saWN5lJOULg==",
5
  "__module__": "stable_baselines3.common.policies",
6
  "__doc__": "\n Policy class for actor-critic algorithms (has both policy and value prediction).\n Used by A2C, PPO and the likes.\n\n :param observation_space: Observation space\n :param action_space: Action space\n :param lr_schedule: Learning rate schedule (could be constant)\n :param net_arch: The specification of the policy and value networks.\n :param activation_fn: Activation function\n :param ortho_init: Whether to use or not orthogonal initialization\n :param use_sde: Whether to use State Dependent Exploration or not\n :param log_std_init: Initial value for the log standard deviation\n :param full_std: Whether to use (n_features x n_actions) parameters\n for the std instead of only (n_features,) when using gSDE\n :param use_expln: Use ``expln()`` function instead of ``exp()`` to ensure\n a positive standard deviation (cf paper). It allows to keep variance\n above zero and prevent it from growing too fast. In practice, ``exp()`` is usually enough.\n :param squash_output: Whether to squash the output using a tanh function,\n this allows to ensure boundaries when using gSDE.\n :param features_extractor_class: Features extractor to use.\n :param features_extractor_kwargs: Keyword arguments\n to pass to the features extractor.\n :param share_features_extractor: If True, the features extractor is shared between the policy and value networks.\n :param normalize_images: Whether to normalize images or not,\n dividing by 255.0 (True by default)\n :param optimizer_class: The optimizer to use,\n ``th.optim.Adam`` by default\n :param optimizer_kwargs: Additional keyword arguments,\n excluding the learning rate, to pass to the optimizer\n ",
7
- "__init__": "<function ActorCriticPolicy.__init__ at 0x7e632f3bfe20>",
8
- "_get_constructor_parameters": "<function ActorCriticPolicy._get_constructor_parameters at 0x7e632f3bfec0>",
9
- "reset_noise": "<function ActorCriticPolicy.reset_noise at 0x7e632f3bff60>",
10
- "_build_mlp_extractor": "<function ActorCriticPolicy._build_mlp_extractor at 0x7e632f3c4040>",
11
- "_build": "<function ActorCriticPolicy._build at 0x7e632f3c40e0>",
12
- "forward": "<function ActorCriticPolicy.forward at 0x7e632f3c4180>",
13
- "extract_features": "<function ActorCriticPolicy.extract_features at 0x7e632f3c4220>",
14
- "_get_action_dist_from_latent": "<function ActorCriticPolicy._get_action_dist_from_latent at 0x7e632f3c42c0>",
15
- "_predict": "<function ActorCriticPolicy._predict at 0x7e632f3c4360>",
16
- "evaluate_actions": "<function ActorCriticPolicy.evaluate_actions at 0x7e632f3c4400>",
17
- "get_distribution": "<function ActorCriticPolicy.get_distribution at 0x7e632f3c44a0>",
18
- "predict_values": "<function ActorCriticPolicy.predict_values at 0x7e632f3c4540>",
19
  "__abstractmethods__": "frozenset()",
20
- "_abc_impl": "<_abc._abc_data object at 0x7e632f32cdc0>"
21
  },
22
  "verbose": 1,
23
  "policy_kwargs": {},
@@ -26,12 +26,12 @@
26
  "_num_timesteps_at_start": 0,
27
  "seed": null,
28
  "action_noise": null,
29
- "start_time": 1744928601912979673,
30
  "learning_rate": 0.0003,
31
  "tensorboard_log": null,
32
  "_last_obs": {
33
  ":type:": "<class 'numpy.ndarray'>",
34
- ":serialized:": "gAWVdgIAAAAAAACME251bXB5Ll9jb3JlLm51bWVyaWOUjAtfZnJvbWJ1ZmZlcpSTlCiWAAIAAAAAAACy/aq+Tg+sPkJL8T12/4S+9xGFOsbmHTwAAAAAAAAAABp2Kz6P8nS87huOuZCTDTg9cte9sci7OAAAgD8AAIA/GrJKvbtr9T3tIAw93zjqvcF/OLyLYku9AAAAAAAAAABFqLK+1sssP2jwdjqSba2+G64hvkvejDwAAAAAAAAAAFqEFT6s/io+9o5Wvi0jZL7o+TO9LC4PvQAAAAAAAAAAmuaJPAc8tT961w0/u5FCPavhTrxNnhu9AAAAAAAAAADA71a+xUurPAoAAzuPVYK5OcQ5vjKMLroAAIA/AACAP6Asj76B+bw+Xi9JPqxTj74Hkho8+rQPvQAAAAAAAAAAzcCdvdLA9zy+S/A9b8TtvYWq/zxdxde7AAAAAAAAAABacpG97grcPYWGvz0JJ0i+NA8yPe0NWrwAAAAAAAAAAJp7lD2GiEQ/dF6APVQYC7+Kp649VVFaPAAAAAAAAAAA5kDxvXtc+LpgjC27iVOduEgc6Tv4EW06AACAPwAAAADasdm9TWAKPp7RK72KsFS+zk9MvVacqj0AAAAAAAAAAA1Ujb1yOAA/FahlPWHSvL7dxgU9kAH0vAAAAAAAAAAACsSVPtKeGz7N3IS+SyBSvsCYFryOjq68AAAAAAAAAAAaaya+z8xjvGYCvbuaZja6W1bEPf3qEzsAAIA/AACAP5SMBW51bXB5lIwFZHR5cGWUk5SMAmY0lImIh5RSlChLA4wBPJROTk5K/////0r/////SwB0lGJLEEsIhpSMAUOUdJRSlC4="
35
  },
36
  "_last_episode_starts": {
37
  ":type:": "<class 'numpy.ndarray'>",
@@ -45,7 +45,7 @@
45
  "_stats_window_size": 100,
46
  "ep_info_buffer": {
47
  ":type:": "<class 'collections.deque'>",
48
- ":serialized:": "gAWVCgwAAAAAAACMC2NvbGxlY3Rpb25zlIwFZGVxdWWUk5QpS2SGlFKUKH2UKIwBcpRHQHAqbJOnEVGMAWyUTWQBjAF0lEdAniXF8b70nXV9lChoBkdAcGhBf8dgfGgHS/NoCEdAniY5C4SYgXV9lChoBkdAcCaOVgQYk2gHS/poCEdAniZEi+tbLXV9lChoBkdAb3Py+Yc/+2gHS/BoCEdAnigGi5/b03V9lChoBkdAYK/4etCAtmgHTegDaAhHQJ4osawUxmF1fZQoaAZHQHFwrPIGQjloB0v1aAhHQJ4pB2OhkAh1fZQoaAZHQDrn5XU6PsBoB0vKaAhHQJ4ppHG0eEJ1fZQoaAZHQHGI9/nW8RNoB0vfaAhHQJ4q5v2oNut1fZQoaAZHQGEMgjps41hoB03oA2gIR0CeKwYFaB7NdX2UKGgGR0BvxdEuxrzoaAdL42gIR0CeK7xZdOZcdX2UKGgGR0BtttY4hllLaAdL72gIR0CeK8nRb8m8dX2UKGgGR0Bw6AX+ERJ3aAdL/WgIR0CeK/N9ph4MdX2UKGgGR0BuhBVENOM3aAdL82gIR0CeLAnPmgandX2UKGgGR0Bic7Z6D5CXaAdN6ANoCEdAniwvLHMlknV9lChoBkdAcVxX2M85j2gHTXQBaAhHQJ4sWiO/+Kl1fZQoaAZHQHFBXFDOTq1oB0voaAhHQJ4uTbN8ma91fZQoaAZHQHDDp+c6Nl1oB00FAWgIR0CeLvrQw9JSdX2UKGgGR0BvV0oQWepXaAdL22gIR0CeL/E87p3YdX2UKGgGR0Bw9urilzltaAdL5GgIR0CeMJ1q33HrdX2UKGgGR0BzSbUsnRb9aAdNcgFoCEdAnjD1h9b5dnV9lChoBkdAckvFDOTq0WgHTVIBaAhHQJ4xpZ1V5rx1fZQoaAZHQGy5GB4D9wZoB0vxaAhHQJ4x5NHpbEB1fZQoaAZHQHDcV8G9pRJoB00kAWgIR0CeMggRbr1NdX2UKGgGR0Bw5CQRwqAjaAdL2GgIR0CeMhVB2OhkdX2UKGgGR0BwiBiCrcTKaAdL+WgIR0CeMima6STydX2UKGgGR0BwXmPDHfdiaAdL8WgIR0CeMmsY2sJZdX2UKGgGR0BwxdEw35vcaAdL9WgIR0CeMrcW0qpcdX2UKGgGR0BxEAudwvQGaAdL+GgIR0CeMwuUliSadX2UKGgGR0Bw5HwVj7Q+aAdNAAFoCEdAnjNjVtoBaXV9lChoBkdAcjEnYQJ5V2gHTS4BaAhHQJ4z5VR1oxp1fZQoaAZHQG5/MySFGodoB0vzaAhHQJ41sqDsdDJ1fZQoaAZHQHBehNRFZxJoB00XAWgIR0CeNh8IAwPAdX2UKGgGR0BwEmBg/keZaAdL92gIR0CeNrjMFEApdX2UKGgGR0Bu91xwQ176aAdL2GgIR0CeOFZU1hsqdX2UKGgGR0BwOLEXLvCuaAdL7mgIR0CeOGcriEQHdX2UKGgGR0ByAtCngpBpaAdNAQFoCEdAnjjDtG/etXV9lChoBkdAa7+1ejVQRGgHTSABaAhHQJ45ETlDF611fZQoaAZHQHE+CGrS3LFoB00DAWgIR0CeOTtzS1E3dX2UKGgGR0BwnqOdXko4aAdL6mgIR0CeOUsBQvYfdX2UKGgGR0BscsCYCyQgaAdL2mgIR0CeOaouf29MdX2UKGgGR0BwxWmtQsPKaAdL7mgIR0CeOdpaA4GVdX2UKGgGR0ByGIYP5HmSaAdNIAFoCEdAnjoxfShJy3V9lChoBkdAbWs6V+qioWgHS+loCEdAnjqpI+W4VnV9lChoBkdAcN1ITXarWGgHS+poCEdAnjz6nFYMfHV9lChoBkdAcCWgg5imVWgHS/5oCEdAnj0i1E3KjnV9lChoBkdAcNXHRCx/u2gHS/BoCEdAnj+mxt52QnV9lChoBkdAcXBqp97Wu2gHTQQBaAhHQJ5A0Cih37l1fZQoaAZHQG5qKq4pc5doB0v8aAhHQJ5A2jrRjSZ1fZQoaAZHQG6DcohIOH5oB0vlaAhHQJ5A+MaS9uh1fZQoaAZHQG9VUhvBJqZoB0vdaAhHQJ5BLLowEhd1fZQoaAZHQHD1x9gF5fNoB00AAWgIR0CeQUVbA1vVdX2UKGgGR0BroEjAzpHJaAdNCAFoCEdAnkF5dOZb6nV9lChoBkdAb8KOwxFiKGgHS+9oCEdAnkJZX2dupHV9lChoBkdAcSjQAuIykGgHTRwBaAhHQJ5CldMTN+t1fZQoaAZHQHHcSNn5BTpoB0v3aAhHQJ5FNS88La51fZQoaAZHQG/x4ptrKvFoB0v1aAhHQJ5FT4Kx9oh1fZQoaAZHQGTYILPUrkNoB03oA2gIR0CeRwr7wazedX2UKGgGR0BxoBsi0OVgaAdL6WgIR0CeSMXCTEBKdX2UKGgGR0ByEXbRF7UoaAdL5WgIR0CeSQbIcR16dX2UKGgGR0BxePFXJYDDaAdL9mgIR0CeSVMo+fRNdX2UKGgGR0BxkqnaWX1KaAdL8WgIR0CeSZpKzzErdX2UKGgGR0Bywna11GLDaAdNIgFoCEdAnknFMmF8HHV9lChoBkdARWkmplz2e2gHS9NoCEdAnkoBt52Qn3V9lChoBkdAcHO08NhE0GgHS/BoCEdAnkrFPrOZ9nV9lChoBkdAcGFh2GIsRWgHTQ8BaAhHQJ5K5sCT2WZ1fZQoaAZHQHGOVBMSK3xoB00TAWgIR0CeT6SNfgJkdX2UKGgGR0Bs+pfKISDiaAdL7WgIR0CeUBn752yLdX2UKGgGR0BjiKgdwNsnaAdN6ANoCEdAnlE23nZCfHV9lChoBkdAcBgVRDTjN2gHS9xoCEdAnlFMQ2/BWXV9lChoBkdAZL+OHWSU1WgHTegDaAhHQJ5TPGDL8rJ1fZQoaAZHQG81f16E8JVoB0v8aAhHQJ5TiM6zVtp1fZQoaAZHQHIHepCKJl9oB00gAWgIR0CeVKbhFVkudX2UKGgGR0ByuRZkkKNRaAdNOwFoCEdAnldQUYbbUXV9lChoBkdAcnz5UtI07GgHTSQBaAhHQJ5XifukUK11fZQoaAZHQG2ZvN3W4ExoB00+AWgIR0CeV8aYeDFqdX2UKGgGR0Bxh/QTmGM5aAdNOgFoCEdAnljPFWGRFXV9lChoBkdAYSTV4oqkM2gHTegDaAhHQJ5c1xbSqlx1fZQoaAZHQHFMfllsguBoB0v8aAhHQJ5c2AtnPE91fZQoaAZHQHA3QKv3ai9oB00QAWgIR0CeXSyzXz19dX2UKGgGR0BwOaMglnh9aAdL+GgIR0CeXbEcsDnvdX2UKGgGR0BtAp84PwuvaAdNQAJoCEdAnl4TshPj43V9lChoBkdAYkhX6InBtWgHTegDaAhHQJ5ekBPsRg91fZQoaAZHQG/ugTh5xBFoB0vmaAhHQJ5emMbWEsd1fZQoaAZHQG5X8/lhgE5oB0vpaAhHQJ5e9EpiI+J1fZQoaAZHQHGkjMibDuVoB00FAWgIR0CeYG0WM0gsdX2UKGgGR0Bwo++SKWLQaAdNBwFoCEdAnmIDBRAKOXV9lChoBkdAcamS4OMER2gHS/1oCEdAnmKvV3EAHXV9lChoBkdAcNqaF23az2gHTRYBaAhHQJ5i1AJLM9t1fZQoaAZHQHCAWPo3aSNoB0vbaAhHQJ5k+P7vXsh1fZQoaAZHQHElDQzDXOJoB00KAWgIR0CeZeZGKAJ+dX2UKGgGR0BwTcxJul41aAdL4WgIR0CeZkpNbkfcdX2UKGgGR0BxFBKAavRraAdL6GgIR0CeZofzjFQ3dX2UKGgGR0BtuzbBXS0CaAdL/GgIR0CeZrKnvUjLdX2UKGgGR0BwKup++dsjaAdNGQFoCEdAnmbQKKHfuXV9lChoBkdAcEeLUTcqOWgHS+VoCEdAnmbYTPBzm3V9lChoBkdAbpydhiLEUGgHTSgBaAhHQJ5nA5zYEnt1fZQoaAZHQF3IeFcpsoFoB03oA2gIR0CeZ/Syt3fRdX2UKGgGR0Bxm0OI68xsaAdL6WgIR0CeaGmvGIbgdX2UKGgGR0BwTC6+WWyDaAdL4WgIR0CeaY2t+1BudX2UKGgGR0BzCL0se4kNaAdL+mgIR0CeawO0LMLXdWUu"
49
  },
50
  "ep_success_buffer": {
51
  ":type:": "<class 'collections.deque'>",
@@ -80,7 +80,7 @@
80
  "n_steps": 2048,
81
  "gamma": 0.99,
82
  "gae_lambda": 0.95,
83
- "ent_coef": 0.0,
84
  "vf_coef": 0.5,
85
  "max_grad_norm": 0.5,
86
  "batch_size": 64,
 
4
  ":serialized:": "gAWVOwAAAAAAAACMIXN0YWJsZV9iYXNlbGluZXMzLmNvbW1vbi5wb2xpY2llc5SMEUFjdG9yQ3JpdGljUG9saWN5lJOULg==",
5
  "__module__": "stable_baselines3.common.policies",
6
  "__doc__": "\n Policy class for actor-critic algorithms (has both policy and value prediction).\n Used by A2C, PPO and the likes.\n\n :param observation_space: Observation space\n :param action_space: Action space\n :param lr_schedule: Learning rate schedule (could be constant)\n :param net_arch: The specification of the policy and value networks.\n :param activation_fn: Activation function\n :param ortho_init: Whether to use or not orthogonal initialization\n :param use_sde: Whether to use State Dependent Exploration or not\n :param log_std_init: Initial value for the log standard deviation\n :param full_std: Whether to use (n_features x n_actions) parameters\n for the std instead of only (n_features,) when using gSDE\n :param use_expln: Use ``expln()`` function instead of ``exp()`` to ensure\n a positive standard deviation (cf paper). It allows to keep variance\n above zero and prevent it from growing too fast. In practice, ``exp()`` is usually enough.\n :param squash_output: Whether to squash the output using a tanh function,\n this allows to ensure boundaries when using gSDE.\n :param features_extractor_class: Features extractor to use.\n :param features_extractor_kwargs: Keyword arguments\n to pass to the features extractor.\n :param share_features_extractor: If True, the features extractor is shared between the policy and value networks.\n :param normalize_images: Whether to normalize images or not,\n dividing by 255.0 (True by default)\n :param optimizer_class: The optimizer to use,\n ``th.optim.Adam`` by default\n :param optimizer_kwargs: Additional keyword arguments,\n excluding the learning rate, to pass to the optimizer\n ",
7
+ "__init__": "<function ActorCriticPolicy.__init__ at 0x7e6e8ed8d6c0>",
8
+ "_get_constructor_parameters": "<function ActorCriticPolicy._get_constructor_parameters at 0x7e6e8ed8d760>",
9
+ "reset_noise": "<function ActorCriticPolicy.reset_noise at 0x7e6e8ed8d800>",
10
+ "_build_mlp_extractor": "<function ActorCriticPolicy._build_mlp_extractor at 0x7e6e8ed8d8a0>",
11
+ "_build": "<function ActorCriticPolicy._build at 0x7e6e8ed8d940>",
12
+ "forward": "<function ActorCriticPolicy.forward at 0x7e6e8ed8d9e0>",
13
+ "extract_features": "<function ActorCriticPolicy.extract_features at 0x7e6e8ed8da80>",
14
+ "_get_action_dist_from_latent": "<function ActorCriticPolicy._get_action_dist_from_latent at 0x7e6e8ed8db20>",
15
+ "_predict": "<function ActorCriticPolicy._predict at 0x7e6e8ed8dbc0>",
16
+ "evaluate_actions": "<function ActorCriticPolicy.evaluate_actions at 0x7e6e8ed8dc60>",
17
+ "get_distribution": "<function ActorCriticPolicy.get_distribution at 0x7e6e8ed8dd00>",
18
+ "predict_values": "<function ActorCriticPolicy.predict_values at 0x7e6e8ed8dda0>",
19
  "__abstractmethods__": "frozenset()",
20
+ "_abc_impl": "<_abc._abc_data object at 0x7e6e8f1cf9c0>"
21
  },
22
  "verbose": 1,
23
  "policy_kwargs": {},
 
26
  "_num_timesteps_at_start": 0,
27
  "seed": null,
28
  "action_noise": null,
29
+ "start_time": 1744934599250485401,
30
  "learning_rate": 0.0003,
31
  "tensorboard_log": null,
32
  "_last_obs": {
33
  ":type:": "<class 'numpy.ndarray'>",
34
+ ":serialized:": "gAWVdgIAAAAAAACME251bXB5Ll9jb3JlLm51bWVyaWOUjAtfZnJvbWJ1ZmZlcpSTlCiWAAIAAAAAAAB6uxs+tkBXvGoHDjuz2dS5xNrFvUOVkboAAIA/AACAPwY+RL6PWX28Ox77upLKGbkXLts9c4ocOgAAgD8AAIA/esxAPvbwUbzynZw6TRKTuHeetL2jI7+5AACAPwAAgD8Nh7I9kqOUPiJSGDxGS7W+PPVKPe4tjzsAAAAAAAAAAHPHyb1cY126ILrsuc+9ALgh55K6KRgOOQAAgD8AAIA/gIiyPb6Nqz/8Ogw/PYLKvk1NLrwwLPs9AAAAAAAAAAAWHJM+0y8GPwmItr0rkvK+XpkUPsw+hr0AAAAAAAAAAGar870ePMA943FfPsmFVb78HIY9vlRYvAAAAAAAAAAAZoPdPaDS1D5v8YS9eX4IvyAsSD2p1oy8AAAAAAAAAABaQoE+VYBaPsbB672Vona+5mJzPW5bIr0AAAAAAAAAAACcxT1yXpc/RosUPqD1Qb+fZRg9OkERvQAAAAAAAAAAAiegvqfP3z6byY29vgHxvrUbd75yYRM+AAAAAAAAAABaxm0+lM38PmN8nD3pgAW/SL8rPnr7g7wAAAAAAAAAADNBIDxpK3E/9uILPDMNL7+pTCg8v/isuwAAAAAAAAAAIDMovi7ugbzisRs7ByVhOaqJ7z3jcVO6AACAPwAAgD/NYnk8KYehPx5zBT5Rniy/heUpPGifcT0AAAAAAAAAAJSMBW51bXB5lIwFZHR5cGWUk5SMAmY0lImIh5RSlChLA4wBPJROTk5K/////0r/////SwB0lGJLEEsIhpSMAUOUdJRSlC4="
35
  },
36
  "_last_episode_starts": {
37
  ":type:": "<class 'numpy.ndarray'>",
 
45
  "_stats_window_size": 100,
46
  "ep_info_buffer": {
47
  ":type:": "<class 'collections.deque'>",
48
+ ":serialized:": "gAWV/AsAAAAAAACMC2NvbGxlY3Rpb25zlIwFZGVxdWWUk5QpS2SGlFKUKH2UKIwBcpRHQHHP/1+RYA+MAWyUS+2MAXSUR0CZ4G2LYPGydX2UKGgGR0BLJeUhV2idaAdLr2gIR0CZ4Oai9IwudX2UKGgGR0BxZnZqVQhwaAdL8mgIR0CZ4g3gDRtxdX2UKGgGR0BxvB8+iaiLaAdLrGgIR0CZ4g1s+FDfdX2UKGgGR0ByYds0pEx7aAdL/GgIR0CZ4kSJj2BbdX2UKGgGR0Bx0gcOskpraAdL6mgIR0CZ5eYDklu4dX2UKGgGR0BvOUuctoSMaAdL4GgIR0CZ5sE+gUUPdX2UKGgGR0Bxmwxzq8lHaAdL82gIR0CZ5sAMUh3adX2UKGgGR0Bw9/t8eCCjaAdL5mgIR0CZ6NH2RJVbdX2UKGgGR0BxUTW1+iJwaAdLsWgIR0CZ6OtEXtSidX2UKGgGR0BwMX9rGipOaAdL3GgIR0CZ6Q12q1gIdX2UKGgGR0Bhtb3XZoPDaAdN6ANoCEdAmenLi6xxDXV9lChoBkdAbXTQswtap2gHTU4BaAhHQJnqHKlpGnZ1fZQoaAZHQHJCmH1vl2hoB00qAWgIR0CZ6kg0j1PFdX2UKGgGR0BwHbanJkoXaAdL6WgIR0CZ6rfCyhSMdX2UKGgGR0Bxg8jps41haAdNBwFoCEdAmevdnCfpU3V9lChoBkdAYH8ZlWfbsWgHTegDaAhHQJntKiQDFId1fZQoaAZHQHF9g3T/hl1oB0vmaAhHQJnuL7/GVA11fZQoaAZHQGJ4qsdT5whoB03oA2gIR0CZ7rULUkOadX2UKGgGR0BwWupwS8J2aAdNAAFoCEdAme78PJ7swHV9lChoBkdAcxpo/RmbsmgHS8loCEdAme8w8OkLyHV9lChoBkdAYxabjLjgh2gHTegDaAhHQJnviaTfR/p1fZQoaAZHQHBqomPYFq1oB0vWaAhHQJnvoiKR+0B1fZQoaAZHQHIRPEwWWQhoB0vAaAhHQJnv+lvZRKp1fZQoaAZHwC+l7x/d69loB0uYaAhHQJnwewFC9h91fZQoaAZHQHAPzYAbQ1JoB0v8aAhHQJnwwdlum791fZQoaAZHQHDWjJp35etoB0vgaAhHQJnw/H3lCC11fZQoaAZHQG/kHryDqW1oB0vCaAhHQJnymG34Kx91fZQoaAZHQHGV/epGWldoB005AWgIR0CZ8uBCUorndX2UKGgGR0Bwxbww0wajaAdLsGgIR0CZ82xs2vSudX2UKGgGR0BxaUbuMMqjaAdLzmgIR0CZ88yQxN7CdX2UKGgGR0BxuovduYQbaAdLwmgIR0CZ9FhS9/SZdX2UKGgGR0BG5wIUrTYvaAdLwmgIR0CZ9LnIQvpRdX2UKGgGR0BwiVYmsvIwaAdL82gIR0CZ9ojc2zfKdX2UKGgGR0Bvtk2P1ct5aAdL7mgIR0CZ9un7YTTOdX2UKGgGR0BsmYUvf0mMaAdL3WgIR0CZ9vzpHI6sdX2UKGgGR0BwRpmWdEsraAdL2WgIR0CZ9zdcjZ+QdX2UKGgGR0BvUDxgAp8XaAdL1WgIR0CZ92exfOUudX2UKGgGR0Bue+vECNjtaAdLxWgIR0CZ+TYJE6T4dX2UKGgGR0Bx1iKaXrt3aAdL5GgIR0CZ+8OrQw9JdX2UKGgGR0BuLrDuSfUXaAdL1WgIR0CZ/KWBjFyadX2UKGgGR0ByRUl8gIQfaAdNEAFoCEdAmfzxaC+UQnV9lChoBkdAZR9bdJrckGgHTegDaAhHQJn8/RSgoPV1fZQoaAZHQHDz5rYXfqJoB00BAWgIR0CZ/bnlGPPtdX2UKGgGR0BwrOfkFOfvaAdLr2gIR0CZ/kMewLVndX2UKGgGR0BxhyWX1J18aAdLymgIR0CZ/wgNPP9ldX2UKGgGR0BuoKLIgeRxaAdLwWgIR0CZ/yj+aScLdX2UKGgGR0BzBOWTot+TaAdNGwFoCEdAmf+Wt6ol2XV9lChoBkdAYLG8Gs3hoGgHTegDaAhHQJn/qUliSaF1fZQoaAZHQHGUqnaWX1JoB0vaaAhHQJn/tFI/Z/V1fZQoaAZHwDE7ABT4tYloB0uHaAhHQJoAdQsPJ7t1fZQoaAZHQG5D5k078vVoB0vVaAhHQJoDXNpudf91fZQoaAZHQG4ODCP6sQxoB0vVaAhHQJoDiyUs4DN1fZQoaAZHQHCQm9DhLoRoB0viaAhHQJoD/7Kq4pd1fZQoaAZHQHA3u+M6zVtoB0vSaAhHQJoECdQO4G51fZQoaAZHQHHdl7MPjGVoB01dAWgIR0CaBTJIUahpdX2UKGgGR0BuViB/ZuhsaAdL02gIR0CaBX8NQTEjdX2UKGgGR0BwyFkGzKLbaAdL72gIR0CaBkz2exwAdX2UKGgGR0BlyP5i3G4raAdN6ANoCEdAmgZqR2bG3nV9lChoBkdAch6PykKu0WgHS99oCEdAmgaJ0bLlm3V9lChoBkdAcK4W6bvw3GgHS+BoCEdAmgaIDs+mnHV9lChoBkdAclkjX4CZGGgHS+loCEdAmgatgBtDUnV9lChoBkdAcgqJ6po9LmgHTRoBaAhHQJoGyh11W811fZQoaAZHQHGQjundfsxoB00BAWgIR0CaCBSfDk2hdX2UKGgGR0BxCKup0fYBaAdLqWgIR0CaCeDPnjhldX2UKGgGR0BzUytJWeYlaAdL5WgIR0CaCf7eVLSNdX2UKGgGR0BxRzag2606aAdL2GgIR0CaCjXCj1wpdX2UKGgGR0Biug2uPmxMaAdN6ANoCEdAmgpFlkH2RXV9lChoBkdAcNspmEoOQWgHS+1oCEdAmgrNvKlpGnV9lChoBkdAcgxsOoYNzGgHTQgBaAhHQJoLHm2b5M11fZQoaAZHQHHpkeIVM25oB0u2aAhHQJoLN+c6Nl11fZQoaAZHQHDcU2pAD7toB0vEaAhHQJoLs32mHgx1fZQoaAZHQHDojUVi4KBoB0vSaAhHQJoMPgccU/R1fZQoaAZHQHB9BeC04R5oB0v7aAhHQJoMUfgaWHF1fZQoaAZHQHGKeDjBEa5oB0voaAhHQJoMcBltj1B1fZQoaAZHQHLZnDziCJ5oB00EAWgIR0CaDZLcbiqAdX2UKGgGR0ByH/987ZFoaAdL1mgIR0CaDdGgSOBEdX2UKGgGR0BhJhmZmZmaaAdN6ANoCEdAmg3QUUO/cnV9lChoBkdAb1X1SwW30GgHS8BoCEdAmg74+bExZnV9lChoBkdAcKlJuVHFxWgHS8BoCEdAmg9CaJAMUnV9lChoBkdAb09rGipNsWgHS8ZoCEdAmg/62KEWZnV9lChoBkdAcwMRgJC0GGgHTXYBaAhHQJoQWGqPwNN1fZQoaAZHQHFtCBbwBo5oB0v3aAhHQJoQsh5gPVd1fZQoaAZHQHIieGfwqiJoB00LAWgIR0CaEO2n889wdX2UKGgGR0BvQedXko4NaAdLxGgIR0CaEYqnWJ7+dX2UKGgGR0BzBis4ku6FaAdL82gIR0CaEhlO45LidX2UKGgGR0ByK9tgrpaBaAdL4GgIR0CaEh9QoCuEdX2UKGgGR0BySDPqs2ehaAdNFgFoCEdAmhKDnmq5snV9lChoBkdAcX2r4nF5wGgHS71oCEdAmhQn9aUzK3V9lChoBkdAcTtIvJzT4WgHS/ZoCEdAmhR6W9lEqnV9lChoBkdAYch2alUIcGgHTegDaAhHQJoVCrp7kXF1fZQoaAZHQHEyV/x2B8RoB00cAWgIR0CaFWJ1aGHpdX2UKGgGR0Bw/Yqur6tUaAdLyGgIR0CaFZASnLq2dX2UKGgGR0BuKlAgPmPpaAdLxGgIR0CaFde5WilBdX2UKGgGR0BwjC0w8GLUaAdL8GgIR0CaFf7bcoH+dX2UKGgGR0By8dNg0CRwaAdNMgFoCEdAmhZGF8G9pXV9lChoBkdAcF/IQvpQlGgHS8xoCEdAmhatGViWmnV9lChoBkdAcZgM23rleWgHS9xoCEdAmhbXtfG+9XV9lChoBkdAcWaITGo73mgHS8xoCEdAmhfUPMB6r3V9lChoBkdAcITCvHLidmgHS79oCEdAmhfkqUeMh3VlLg=="
49
  },
50
  "ep_success_buffer": {
51
  ":type:": "<class 'collections.deque'>",
 
80
  "n_steps": 2048,
81
  "gamma": 0.99,
82
  "gae_lambda": 0.95,
83
+ "ent_coef": 0.015,
84
  "vf_coef": 0.5,
85
  "max_grad_norm": 0.5,
86
  "batch_size": 64,
ppo-LunarLander-v2/policy.optimizer.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:08979682af18c3b1ececb955b9f47c4828d3201fe1aef565557f8f8ec940ecd0
3
  size 88362
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:9b84b0bddc54bf042fc7217a53e97ddbf53d11e30598faaf77fe8cf065594d72
3
  size 88362
ppo-LunarLander-v2/policy.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:cb8f716db32cd071fe3e5a2cd63d41ca5d1d39f4c9e0d8fe9df9b5b46b28513b
3
  size 43762
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c53cc5018d122e95d44f908510dfa67ae5a054d81e30087c2a9935e535b517ad
3
  size 43762
replay.mp4 CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:1120cb703de81e293912d5814df03c4c72dba2e89b742ca23a231e7e29015789
3
- size 155191
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:1cfe9d1e148854eda9cd5811600f7bdc59c031584a76f689d2ffb91c73d8f9ef
3
+ size 124578
results.json CHANGED
@@ -1 +1 @@
1
- {"mean_reward": 259.70984710000005, "std_reward": 23.204909559512487, "is_deterministic": true, "n_eval_episodes": 10, "eval_datetime": "2025-04-17T23:39:14.321794"}
 
1
+ {"mean_reward": 271.308085, "std_reward": 18.357892429701838, "is_deterministic": true, "n_eval_episodes": 10, "eval_datetime": "2025-04-18T00:31:50.731080"}