AllIllusion commited on
Commit
ae0d26e
·
verified ·
1 Parent(s): 9699326

Upload PPO LunarLander-v2 LunarLander-v2_PPO_ne16_ns1024_b64_e4_cpu_TotalStep14000K.zip

Browse files
LunarLander-v2_PPO_ne16_ns1024_b64_e4_cpu_TotalStep14000K.zip CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:bf56cabf46c175b2fdf2f10107c487906f0c34c73de32003e310015eb3a935d1
3
  size 147519
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2559e780e6b972805bd6fb72d69c2de52fb3b2d3c7e45d670f69401d0f22d036
3
  size 147519
LunarLander-v2_PPO_ne16_ns1024_b64_e4_cpu_TotalStep14000K/data CHANGED
@@ -4,20 +4,20 @@
4
  ":serialized:": "gAWVOwAAAAAAAACMIXN0YWJsZV9iYXNlbGluZXMzLmNvbW1vbi5wb2xpY2llc5SMEUFjdG9yQ3JpdGljUG9saWN5lJOULg==",
5
  "__module__": "stable_baselines3.common.policies",
6
  "__doc__": "\n Policy class for actor-critic algorithms (has both policy and value prediction).\n Used by A2C, PPO and the likes.\n\n :param observation_space: Observation space\n :param action_space: Action space\n :param lr_schedule: Learning rate schedule (could be constant)\n :param net_arch: The specification of the policy and value networks.\n :param activation_fn: Activation function\n :param ortho_init: Whether to use or not orthogonal initialization\n :param use_sde: Whether to use State Dependent Exploration or not\n :param log_std_init: Initial value for the log standard deviation\n :param full_std: Whether to use (n_features x n_actions) parameters\n for the std instead of only (n_features,) when using gSDE\n :param use_expln: Use ``expln()`` function instead of ``exp()`` to ensure\n a positive standard deviation (cf paper). It allows to keep variance\n above zero and prevent it from growing too fast. In practice, ``exp()`` is usually enough.\n :param squash_output: Whether to squash the output using a tanh function,\n this allows to ensure boundaries when using gSDE.\n :param features_extractor_class: Features extractor to use.\n :param features_extractor_kwargs: Keyword arguments\n to pass to the features extractor.\n :param share_features_extractor: If True, the features extractor is shared between the policy and value networks.\n :param normalize_images: Whether to normalize images or not,\n dividing by 255.0 (True by default)\n :param optimizer_class: The optimizer to use,\n ``th.optim.Adam`` by default\n :param optimizer_kwargs: Additional keyword arguments,\n excluding the learning rate, to pass to the optimizer\n ",
7
- "__init__": "<function ActorCriticPolicy.__init__ at 0x7ff7606941f0>",
8
- "_get_constructor_parameters": "<function ActorCriticPolicy._get_constructor_parameters at 0x7ff760694280>",
9
- "reset_noise": "<function ActorCriticPolicy.reset_noise at 0x7ff760694310>",
10
- "_build_mlp_extractor": "<function ActorCriticPolicy._build_mlp_extractor at 0x7ff7606943a0>",
11
- "_build": "<function ActorCriticPolicy._build at 0x7ff760694430>",
12
- "forward": "<function ActorCriticPolicy.forward at 0x7ff7606944c0>",
13
- "extract_features": "<function ActorCriticPolicy.extract_features at 0x7ff760694550>",
14
- "_get_action_dist_from_latent": "<function ActorCriticPolicy._get_action_dist_from_latent at 0x7ff7606945e0>",
15
- "_predict": "<function ActorCriticPolicy._predict at 0x7ff760694670>",
16
- "evaluate_actions": "<function ActorCriticPolicy.evaluate_actions at 0x7ff760694700>",
17
- "get_distribution": "<function ActorCriticPolicy.get_distribution at 0x7ff760694790>",
18
- "predict_values": "<function ActorCriticPolicy.predict_values at 0x7ff760694820>",
19
  "__abstractmethods__": "frozenset()",
20
- "_abc_impl": "<_abc_data object at 0x7ff7606f3d20>"
21
  },
22
  "verbose": 0,
23
  "policy_kwargs": {},
@@ -26,12 +26,12 @@
26
  "_num_timesteps_at_start": 0,
27
  "seed": null,
28
  "action_noise": null,
29
- "start_time": 1744199644083624492,
30
  "learning_rate": 0.0003,
31
  "tensorboard_log": null,
32
  "_last_obs": {
33
  ":type:": "<class 'numpy.ndarray'>",
34
- ":serialized:": "gAWVdQIAAAAAAACMEm51bXB5LmNvcmUubnVtZXJpY5SMC19mcm9tYnVmZmVylJOUKJYAAgAAAAAAAI20bD66G8o+WEDzvnURTr+Oqq4+3SUCvwAAAAAAAAAA5i2cvVP3Rz+v8IW9qreAvzN2Pb4jJfY7AAAAAAAAAAAN7UA+gw2aP9RVnD4TD+S+pQYGP5jEBT8AAAAAAAAAAIBbD71I+4u6ImdCskf1O7Edd4Y6+gyQMgAAgD8AAIA/mjmKvIUar7uCW988t5uaPOT6nzxIr4u7AACAPwAAgD/NF20+Y+2mP2qDyD5WChe/YfFNP5c/mD4AAAAAAAAAAEidqr5qaHo/dVFGvYoEN7+AXjy/1j0QPgAAAAAAAAAAALpYvCE2jbz4fag821yFPWdozj260eW6AACAPwAAgD9m1my8v497Pl+QpL25KCa/mnv4O1J/db0AAAAAAAAAAGYGxroF/9272/uVvDlP0DwgfTa9BXysPQAAgD8AAIA/mlW8u+EMnLogBoAyFETcsJOs57kL0OiyAACAPwAAgD+tTFQ+ZecxP9rv2L3A+0+/EpgFPw05s74AAAAAAAAAAJrnGzy8Bho9tlg6vjZl1r74FGO+o6yjvgAAAAAAAAAAM9ErPcTurj8SGhM/hpy4vi3QX7wibos9AAAAAAAAAABNfrM92rtHP2MIFD6/kmO/dnekPhtFcD0AAAAAAAAAADP1lbwF7tO7bfYcvAF6rzwOoSC9DqeSPQAAgD8AAIA/lIwFbnVtcHmUjAVkdHlwZZSTlIwCZjSUiYiHlFKUKEsDjAE8lE5OTkr/////Sv////9LAHSUYksQSwiGlIwBQ5R0lFKULg=="
35
  },
36
  "_last_episode_starts": {
37
  ":type:": "<class 'numpy.ndarray'>",
@@ -45,7 +45,7 @@
45
  "_stats_window_size": 100,
46
  "ep_info_buffer": {
47
  ":type:": "<class 'collections.deque'>",
48
- ":serialized:": "gAWV4gsAAAAAAACMC2NvbGxlY3Rpb25zlIwFZGVxdWWUk5QpS2SGlFKUKH2UKIwBcpRHQHB7mnCO3lWMAWyUS6yMAXSUR0DuoUaY1He8dX2UKGgGR0BzC7jIaLn+aAdLk2gIR0DuoUePFvQ4dX2UKGgGR0BwPkUM5OrRaAdLmGgIR0DuoUullbu/dX2UKGgGR0BxqBlxwQ18aAdLsWgIR0DuoU2wW3z+dX2UKGgGR0Bwc6cRUWEcaAdLlGgIR0DuoVBwCr93dX2UKGgGR0Bx2H127nPnaAdLn2gIR0DuocdNVR1pdX2UKGgGR0Bzl7mZE2HdaAdLuWgIR0DuocfEhq0udX2UKGgGR0B0DAVHnU2DaAdLtGgIR0DuochAbhm5dX2UKGgGR0BzNmu8scyWaAdLkWgIR0Duocj6fra/dX2UKGgGR0BypWw3YL9daAdLtGgIR0Duoc8qlxffdX2UKGgGR0BzA7gUDdP+aAdLwGgIR0DuodAFfzBidX2UKGgGR0B0G7fHggoxaAdLrGgIR0Duoc/idat+dX2UKGgGR0BylPJQtSQ6aAdLnmgIR0DuodE+8Gs4dX2UKGgGR0Bx7/IMjNY9aAdLnGgIR0DuodHG9YfXdX2UKGgGR0BxsKS8rZrYaAdLpWgIR0DuodJedkJ8dX2UKGgGR0Bz03jZL7GeaAdLtWgIR0DuodPr3TNMdX2UKGgGR0BwV/WEsasIaAdLk2gIR0DuodUBmwqzdX2UKGgGR0B0DRQ66reZaAdLt2gIR0DuodcSwGGEdX2UKGgGR0BwQYWfseGPaAdLmGgIR0Duodm/7iyZdX2UKGgGR0BwWnTspoboaAdLqWgIR0DuodpwsGxEdX2UKGgGR0ByOtoqTbFkaAdLpGgIR0DuoeWBsANodX2UKGgGR0BzyF7E5yU+aAdLomgIR0Duoed3EAHWdX2UKGgGR0BxEhwPy08eaAdLqmgIR0DuoeiblzU7dX2UKGgGR0Byc1+NLlFMaAdLuWgIR0Duoet7dBSldX2UKGgGR0BwC/zjFQ2uaAdLiWgIR0Duoevlg+hXdX2UKGgGR0BwX5iRW912aAdLlWgIR0DuofDHIZIhdX2UKGgGR0ByQtP1tfoiaAdLoWgIR0DuofLzwtrcdX2UKGgGR0Bxqk/iYLLIaAdLlmgIR0DuofP9b5dodX2UKGgGR0ByL+OinHeaaAdLrGgIR0DuofQAWBSUdX2UKGgGR0Byc4w8GLUDaAdLsGgIR0DuofQBwuM/dX2UKGgGR0Bz0IIfKZDzaAdLnGgIR0DuofanwXqJdX2UKGgGR0ByQpeRgZ0kaAdLvGgIR0DuogFbqQiidX2UKGgGR0Bz/huGbkOqaAdL5WgIR0DuogRKMefadX2UKGgGR0BxjCt5le4TaAdLuGgIR0DuogVOqNp/dX2UKGgGR0Bx1HCiyprDaAdLhmgIR0DuogcoKlYVdX2UKGgGR0Bzijghr30xaAdLyWgIR0DuogicnVoYdX2UKGgGR0ByRGO6unuRaAdLp2gIR0Duog1p+MIedX2UKGgGR0Bxfbx5LRKIaAdLomgIR0Duog8GTs6adX2UKGgGR0Bv14O8TSLJaAdLoWgIR0DuohG88La3dX2UKGgGR0B0BNwDNhVmaAdLq2gIR0DuohSSAYpEdX2UKGgGR0BxWh5s0pEyaAdLjWgIR0DuohicoYvWdX2UKGgGR0BxmgpWmxdIaAdLoWgIR0Duohpyy2QXdX2UKGgGR0BxIfVjI7vHaAdLpGgIR0Duohsom5UcdX2UKGgGR0BzcM1n/T9baAdLp2gIR0Duohvo+wC9dX2UKGgGR0Bz5uqn3ta7aAdLsGgIR0Duoh0X1J18dX2UKGgGR0ByyG4qgAZLaAdLg2gIR0DuoiV2U0N0dX2UKGgGR0By6d3NcGC7aAdLs2gIR0Duoi6q5LAYdX2UKGgGR0BGo8dgfEGaaAdLWGgIR0Duoi/a24NJdX2UKGgGR0ByPeDBdld1aAdLqmgIR0DuojJ6AOJ+dX2UKGgGR0BygsHX2/SIaAdLuGgIR0DuojNG+bmVdX2UKGgGR0B0HonE2pAEaAdLqGgIR0DuojOaR6njdX2UKGgGR0Byhg+lj3EiaAdLj2gIR0DuojQYwZfldX2UKGgGR0BvjotnPE88aAdLp2gIR0DuojhwvQF+dX2UKGgGR0Bx7VKRMewLaAdLj2gIR0Duoj8IX0oSdX2UKGgGR0BzKV7VrhzeaAdLrGgIR0Duoj+9AX2vdX2UKGgGR0BxDGNaQmu1aAdLx2gIR0DuokLkoWpIdX2UKGgGR0BwK/cynDR/aAdLomgIR0DuokQsg+yJdX2UKGgGR0BzVe9du5z6aAdLr2gIR0DuokY5ZKWcdX2UKGgGR0BznlUHY6GQaAdLsGgIR0DuokgXqqwRdX2UKGgGR0B0AQbzbvgFaAdLrWgIR0Duok80TDfndX2UKGgGR0BwiONMoMKDaAdLlWgIR0DuolFHWBjGdX2UKGgGR0BygHAM2FWXaAdNlQNoCEdA7qJT4FRpDnV9lChoBkdAcqUBw++ueWgHS6hoCEdA7qJWWLHdXXV9lChoBkdAcC9XIlt0m2gHS6VoCEdA7qJYTNMXanV9lChoBkdAcsWuFHrhSGgHS65oCEdA7qJZkEkjYHV9lChoBkdAcnbMVk+X7mgHS4FoCEdA7qJbX6Q/5nV9lChoBkdAcjMFAVwgkmgHS7JoCEdA7qJbMRpUP3V9lChoBkdAcpEU3n6l+GgHS7RoCEdA7qJb5qM3qHV9lChoBkdAdH7/J/5Ly2gHS7NoCEdA7qJfIe5nUXV9lChoBkdAcmRLux8lX2gHS5FoCEdA7qJlmkFfRnV9lChoBkdAc7y+pOvdM2gHS6doCEdA7qJm+hGpdnV9lChoBkdAcZwuoP07KmgHS6loCEdA7qJovIfbK3V9lChoBkdAclVBO58Sf2gHS8BoCEdA7qJpB9b5dnV9lChoBkdAcVwVurIYFmgHS69oCEdA7qJt7349HXV9lChoBkdAcq/FSKm8/WgHS6poCEdA7qJy6Kk2xnV9lChoBkdAcw8B1cMVlGgHS5NoCEdA7qJ1CqZMMHV9lChoBkdAct7NRFZxJmgHS7BoCEdA7qJ5FTNt7HV9lChoBkdAcMUZha1Ti2gHS59oCEdA7qJ50C7sfXV9lChoBkdAc/4UJOWSlmgHS79oCEdA7qJ5sTFl1HV9lChoBkdAclZRr8BMjGgHS5JoCEdA7qJ57LdN4HV9lChoBkdAcPi4AS39aWgHS5VoCEdA7qJ61mz0H3V9lChoBkdAcbIbMHKOk2gHS6VoCEdA7qJ7pGFzuHV9lChoBkdAckVkWRA8jmgHTV8CaAhHQO6ifD1Iy0t1fZQoaAZHQHKCQpON5t5oB0uVaAhHQO6ifYJNTLp1fZQoaAZHQHNYCpR4yGloB0u6aAhHQO6igF58jRl1fZQoaAZHQHOh5aJQ+EBoB0uXaAhHQO6igpV0cOt1fZQoaAZHQHMSR+OOsDJoB0uqaAhHQO6iiKoS+QF1fZQoaAZHQHORyzsyBTZoB0uvaAhHQO6ii2f7Jnx1fZQoaAZHQHKcZZ8rqdJoB0u2aAhHQO6ijIG2TgV1fZQoaAZHQHKNQrQPZqVoB0ukaAhHQO6ijaZML4N1fZQoaAZHQHBEtXtBv75oB0uUaAhHQO6ij1US7Gx1fZQoaAZHQHNc8XFcY65oB0uaaAhHQO6ikqBPKuB1fZQoaAZHQHGbuQZGax5oB0uRaAhHQO6ilRPwd811fZQoaAZHQG/kQXIlt0poB0uYaAhHQO6ile/tY0V1fZQoaAZHQHIY88DB/I9oB0uVaAhHQO6ilkypJf91fZQoaAZHQHIALKzRhMJoB0uaaAhHQO6ilzr3TNN1fZQoaAZHQHIys4PwuuloB0ueaAhHQO6imoqslsx1fZQoaAZHQHHpzQE6kqNoB0uraAhHQO6inDp5eJJ1fZQoaAZHQHENwSvkilloB0ufaAhHQO6inTpJPIp1fZQoaAZHQHQLWRmseXBoB0u+aAhHQO6ioi9ytFN1ZS4="
49
  },
50
  "ep_success_buffer": {
51
  ":type:": "<class 'collections.deque'>",
 
4
  ":serialized:": "gAWVOwAAAAAAAACMIXN0YWJsZV9iYXNlbGluZXMzLmNvbW1vbi5wb2xpY2llc5SMEUFjdG9yQ3JpdGljUG9saWN5lJOULg==",
5
  "__module__": "stable_baselines3.common.policies",
6
  "__doc__": "\n Policy class for actor-critic algorithms (has both policy and value prediction).\n Used by A2C, PPO and the likes.\n\n :param observation_space: Observation space\n :param action_space: Action space\n :param lr_schedule: Learning rate schedule (could be constant)\n :param net_arch: The specification of the policy and value networks.\n :param activation_fn: Activation function\n :param ortho_init: Whether to use or not orthogonal initialization\n :param use_sde: Whether to use State Dependent Exploration or not\n :param log_std_init: Initial value for the log standard deviation\n :param full_std: Whether to use (n_features x n_actions) parameters\n for the std instead of only (n_features,) when using gSDE\n :param use_expln: Use ``expln()`` function instead of ``exp()`` to ensure\n a positive standard deviation (cf paper). It allows to keep variance\n above zero and prevent it from growing too fast. In practice, ``exp()`` is usually enough.\n :param squash_output: Whether to squash the output using a tanh function,\n this allows to ensure boundaries when using gSDE.\n :param features_extractor_class: Features extractor to use.\n :param features_extractor_kwargs: Keyword arguments\n to pass to the features extractor.\n :param share_features_extractor: If True, the features extractor is shared between the policy and value networks.\n :param normalize_images: Whether to normalize images or not,\n dividing by 255.0 (True by default)\n :param optimizer_class: The optimizer to use,\n ``th.optim.Adam`` by default\n :param optimizer_kwargs: Additional keyword arguments,\n excluding the learning rate, to pass to the optimizer\n ",
7
+ "__init__": "<function ActorCriticPolicy.__init__ at 0x7f2803f51160>",
8
+ "_get_constructor_parameters": "<function ActorCriticPolicy._get_constructor_parameters at 0x7f2803f511f0>",
9
+ "reset_noise": "<function ActorCriticPolicy.reset_noise at 0x7f2803f51280>",
10
+ "_build_mlp_extractor": "<function ActorCriticPolicy._build_mlp_extractor at 0x7f2803f51310>",
11
+ "_build": "<function ActorCriticPolicy._build at 0x7f2803f513a0>",
12
+ "forward": "<function ActorCriticPolicy.forward at 0x7f2803f51430>",
13
+ "extract_features": "<function ActorCriticPolicy.extract_features at 0x7f2803f514c0>",
14
+ "_get_action_dist_from_latent": "<function ActorCriticPolicy._get_action_dist_from_latent at 0x7f2803f51550>",
15
+ "_predict": "<function ActorCriticPolicy._predict at 0x7f2803f515e0>",
16
+ "evaluate_actions": "<function ActorCriticPolicy.evaluate_actions at 0x7f2803f51670>",
17
+ "get_distribution": "<function ActorCriticPolicy.get_distribution at 0x7f2803f51700>",
18
+ "predict_values": "<function ActorCriticPolicy.predict_values at 0x7f2803f51790>",
19
  "__abstractmethods__": "frozenset()",
20
+ "_abc_impl": "<_abc_data object at 0x7f2803fb2d20>"
21
  },
22
  "verbose": 0,
23
  "policy_kwargs": {},
 
26
  "_num_timesteps_at_start": 0,
27
  "seed": null,
28
  "action_noise": null,
29
+ "start_time": 1744204003805074415,
30
  "learning_rate": 0.0003,
31
  "tensorboard_log": null,
32
  "_last_obs": {
33
  ":type:": "<class 'numpy.ndarray'>",
34
+ ":serialized:": "gAWVdQIAAAAAAACMEm51bXB5LmNvcmUubnVtZXJpY5SMC19mcm9tYnVmZmVylJOUKJYAAgAAAAAAAGbOHzuu9bG6U1fyOI1Z1zOa2nu5p4MKuAAAgD8AAIA/AFiPO+E6gLryTAw8Fz2itbjkejuQ3520AACAPwAAgD+aI3E9+9H9O4hp4L7OE4O+GYJ0voi4OT8AAIA/AAAAAGZEhLxtMAY/VrKwPG4MXb94W3C9ZkPCPAAAAAAAAAAAZkaGu1yjYrrIJGM88UfPuB8UiLraRsq3AACAPwAAgD/TLm4+au2tP+fuCD8dBha/g1EAP2hJzD4AAAAAAAAAAGZmiDnSxam7FHKhPM5dhDyZ6+s8gmRivQAAgD8AAIA/zRS0u72Wfjy+TIM9AP2xvvRzqT2vMLA9AAAAAAAAAAAaLhy+IWR5PqnmvD4lMSm/jUofvjHPoT4AAAAAAAAAAL0ipz5Ir1o/fuUnvWycUr/wLyw/+ElUvgAAAAAAAAAAyphcvpF9hT8DUU2+0oBQv3lRJL+vToy7AAAAAAAAAAAz/y+80qXzu4qzUDyyv6E8XyM+PSISh70AAIA/AACAP4COB73LQpI/HKCkvaMfWr/PlQi+lZ6ivAAAAAAAAAAAZjxnPPmxsj9iIjU/ssSvvm5FaLxuFfS9AAAAAAAAAACaPcy7duMGvKgqoL2nocQ8MLjmuz3HjDsAAIA/AACAP5rl0rtIaZO64n4aODM3CTPtP+06zvcytwAAgD8AAIA/lIwFbnVtcHmUjAVkdHlwZZSTlIwCZjSUiYiHlFKUKEsDjAE8lE5OTkr/////Sv////9LAHSUYksQSwiGlIwBQ5R0lFKULg=="
35
  },
36
  "_last_episode_starts": {
37
  ":type:": "<class 'numpy.ndarray'>",
 
45
  "_stats_window_size": 100,
46
  "ep_info_buffer": {
47
  ":type:": "<class 'collections.deque'>",
48
+ ":serialized:": "gAWV4QsAAAAAAACMC2NvbGxlY3Rpb25zlIwFZGVxdWWUk5QpS2SGlFKUKH2UKIwBcpRHQHSYG3BpHqiMAWyUS8mMAXSUR0DxDX5Xe3x4dX2UKGgGR0Bx/qsPrfLtaAdLqGgIR0DxDYAwljVhdX2UKGgGR0BxIf4IrvsraAdLo2gIR0DxDcBgte2NdX2UKGgGR0BxhzQZ4wAVaAdLmWgIR0DxDcEmnO0LdX2UKGgGR0ByPl/Ue+23aAdLoGgIR0DxDcFPl+3IdX2UKGgGR0Byb1w1ivxIaAdLkmgIR0DxDcHYYBNmdX2UKGgGR0BzByp71Iy1aAdLv2gIR0DxDcJnV5KOdX2UKGgGR0Bz9b7vXsgMaAdLwWgIR0DxDcLOinHedX2UKGgGR0BySv3fyf+TaAdLq2gIR0DxDcPYLLIQdX2UKGgGR0Bx2RQSBbwCaAdLqWgIR0DxDcP5JsfrdX2UKGgGR0ByvvjDKoycaAdLkmgIR0DxDcQVzIV/dX2UKGgGR0Bzbjh1klNUaAdLpWgIR0DxDcdUkfLcdX2UKGgGR0ByGITh5xBFaAdLxmgIR0DxDcgIOH32dX2UKGgGR0BxHWDzyz5XaAdLn2gIR0DxDcg8Hv+gdX2UKGgGR0ByBWynk1dgaAdLl2gIR0DxDciq4YrKdX2UKGgGR0BxPfDfm9xqaAdLoWgIR0DxDckTCLuQdX2UKGgGR0BxqiSRr8BNaAdLk2gIR0DxDcmV81GcdX2UKGgGR0BLIYbjtG/faAdLa2gIR0DxDcuQQ+UydX2UKGgGR0BxrZjtoi9qaAdLqmgIR0DxDc1sTnJUdX2UKGgGR0BxGNC7btZ3aAdLlGgIR0DxDc72ys0YdX2UKGgGR0Bz/NYJVsDXaAdLsWgIR0DxDc/xCIDYdX2UKGgGR0Bvzq9/SYw7aAdLpWgIR0DxDdACJoCddX2UKGgGR0BwoyIsRQJpaAdLlWgIR0DxDdB3W4EwdX2UKGgGR0Bxa17eEZivaAdLtGgIR0DxDdE3eenRdX2UKGgGR0BwYbyf+S8raAdLlWgIR0DxDdHmMOwxdX2UKGgGR0BTiiblRxcWaAdLgGgIR0DxDdWwfQrudX2UKGgGR0Byy/dWQwK0aAdLvmgIR0DxDdaVsUItdX2UKGgGR0BxsKfRNRFaaAdLxGgIR0DxDddwAU+LdX2UKGgGR0ByAarMkhRqaAdLnmgIR0DxDden0TURdX2UKGgGR0ByVCjynUDuaAdLlmgIR0DxDdihs67vdX2UKGgGR0By5tXo1UEQaAdLmWgIR0DxDdl8K5TZdX2UKGgGR0BzvsG0NSZSaAdLrGgIR0DxDdnrMTvidX2UKGgGR0BD2RGlQ/HHaAdLamgIR0DxDdpYpDu0dX2UKGgGR0ByBEg2ZRbbaAdLu2gIR0DxDduM72csdX2UKGgGR0B0S6fEn9ehaAdLtGgIR0DxDd41IiC8dX2UKGgGR0BwF1LM9r44aAdLi2gIR0DxDd5tNzsAdX2UKGgGR0BxdC1twaR7aAdLkmgIR0DxDd9A2hqTdX2UKGgGR0Bz7ufBeokzaAdLxmgIR0DxDeJLJSzgdX2UKGgGR0BwAe6g/TsqaAdLo2gIR0DxDeJ+uNgjdX2UKGgGR0BzqnN7jT8YaAdLpWgIR0DxDeNgZTAGdX2UKGgGR0BzAA+wC8vmaAdLuWgIR0DxDeQCFbmmdX2UKGgGR0BwWYmhM8HOaAdLkGgIR0DxDeTUyHmBdX2UKGgGR0BxfgWnCO3laAdLiWgIR0DxDeWV0Lc9dX2UKGgGR0Byuavs7dSEaAdLmWgIR0DxDehUmlZYdX2UKGgGR0Bzsi8AaNuMaAdLsWgIR0DxDejliBoVdX2UKGgGR0Bxh/LowEhaaAdLqmgIR0DxDek8kD6ndX2UKGgGR0BwPcg+yJKraAdLnmgIR0DxDem/T9bYdX2UKGgGR0Bw5cZNwiqyaAdLomgIR0DxDeqCBf8edX2UKGgGR0BzfjqPfbblaAdLnWgIR0DxDep36Q/5dX2UKGgGR0BN4jIzWPLgaAdLgGgIR0DxDeyOearndX2UKGgGR0Bzg4cPvrnlaAdLpWgIR0DxDe+NhVlxdX2UKGgGR0B0F6QV9F4LaAdLxGgIR0DxDfAL7oB8dX2UKGgGR0BxqQwnH/96aAdLmWgIR0DxDfKndfsvdX2UKGgGR0B0LZ/iHZbqaAdLxmgIR0DxDfOW7OE/dX2UKGgGR0BxdzMdLg4waAdLpWgIR0DxDfT64UeudX2UKGgGR0Bx51n003wTaAdLo2gIR0DxDfVgi/widX2UKGgGR0BzMzVH4GliaAdLuWgIR0DxDfYDU3GXdX2UKGgGR0Bxx7HcUM5PaAdLqmgIR0DxDffQbMoudX2UKGgGR0Byk+fSQYDUaAdLs2gIR0DxDffw4sErdX2UKGgGR0ByugsI3R5UaAdLkWgIR0DxDfgASWZ7dX2UKGgGR0BxxkcFQl8gaAdLiGgIR0DxDfkpe/pMdX2UKGgGR0BwXaPPszEaaAdLpWgIR0DxDfqVcUuddX2UKGgGR0Bvnac7QswtaAdLmmgIR0DxDfsJqIrOdX2UKGgGR0BzMEsAeaKDaAdLqmgIR0DxDfvsTFl1dX2UKGgGR0B0MjUmUnogaAdLvmgIR0DxDf1y0rsjdX2UKGgGR0BwUwMOPNmlaAdLiGgIR0DxDf4QYk3TdX2UKGgGR0BxOAp4KQaKaAdLmGgIR0DxDgA0QK8ddX2UKGgGR0BwtBTJhfBvaAdLm2gIR0DxDgNZLIxQdX2UKGgGR0BxDsVIqbz9aAdLl2gIR0DxDgaohY/3dX2UKGgGR0ByBJSxZ+x4aAdLimgIR0DxDgqsunMudX2UKGgGR0BzS89Oh0yQaAdLu2gIR0DxDgqJaJQ+dX2UKGgGR0BznFStNi6QaAdLxGgIR0DxDgs69CeFdX2UKGgGR0BxnrLU1AJLaAdLnWgIR0DxDgt4W1twdX2UKGgGR0Bx5t7hNucdaAdLrWgIR0DxDgvgsbvPdX2UKGgGR0BxqeAe7tiQaAdLsGgIR0DxDgxUj9n9dX2UKGgGR0BwwCQLeANHaAdLuWgIR0DxDg0v+OwQdX2UKGgGR0BwXulrM1TBaAdLkGgIR0DxDg0eOn2qdX2UKGgGR0BzuyoKlYU4aAdL5GgIR0DxDg2ImPYGdX2UKGgGR0BzUulGgBcSaAdLvGgIR0DxDhES1maqdX2UKGgGR0BzIwhFEy+IaAdLrGgIR0DxDhKsRQJpdX2UKGgGR0BzPPiS7oStaAdLtmgIR0DxDhMi9qUNdX2UKGgGR0BzfHslb/wRaAdLpWgIR0DxDhQ+F10UdX2UKGgGR0BwHAUuctoSaAdLoGgIR0DxDhbI9TxYdX2UKGgGR0BwwW1eBxxUaAdLn2gIR0DxDhnSQYDUdX2UKGgGR0BzLT/xUedTaAdLkmgIR0DxDhwANG3GdX2UKGgGR0ByxHrB0p3HaAdLjWgIR0DxDhyGn4widX2UKGgGR0BxbpelbeMyaAdLkWgIR0DxDh1uTRpldX2UKGgGR0Bym5Uo8ZDRaAdLnWgIR0DxDh3GNrCWdX2UKGgGR0BwNmhew9q2aAdLpmgIR0DxDh5MVUModX2UKGgGR0ByW6N4qwyJaAdLoGgIR0DxDh5ppvgndX2UKGgGR0By+myv9tMxaAdLlmgIR0DxDh7QN0/4dX2UKGgGR0ByUoIkZ75VaAdLmWgIR0DxDh81jy4GdX2UKGgGR0BwCxorWiDeaAdLnWgIR0DxDh//keZHdX2UKGgGR0BxqZ16mfoSaAdLkmgIR0DxDiOf1pTNdX2UKGgGR0Bx0tTXJ5miaAdLmGgIR0DxDiTKA8SxdX2UKGgGR0BxnRbdJrckaAdLmmgIR0DxDiYC+De1dX2UKGgGR0Bz2Wtnwob5aAdLt2gIR0DxDiZdnTRZdX2UKGgGR0BzfgBtDUmVaAdNBQJoCEdA8Q4nviDM/3V9lChoBkdAcsZqBmPHUGgHS5loCEdA8Q4oaBNEgHV9lChoBkdAdBeMtsenymgHS6VoCEdA8Q4sMPnSv3VlLg=="
49
  },
50
  "ep_success_buffer": {
51
  ":type:": "<class 'collections.deque'>",
LunarLander-v2_PPO_ne16_ns1024_b64_e4_cpu_TotalStep14000K/policy.optimizer.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:96701d427799c8d221e681918bc0b9e28b5af865015ac58b5c09cf6761518bd6
3
  size 87978
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:849d3d12b2304968fd58d6e3950def05e2d14ceb3e014ee795632767cd1fafb5
3
  size 87978
LunarLander-v2_PPO_ne16_ns1024_b64_e4_cpu_TotalStep14000K/policy.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:610748244e800929ead5cf251778f2f7119de772e8e99053b20cecb08b66f2a6
3
  size 43634
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:7a41a488dada2cff72a430207c0333d6e4272b7f34ae63c390ea85aefc8b8b1d
3
  size 43634
README.md CHANGED
@@ -16,7 +16,7 @@ model-index:
16
  type: LunarLander-v2
17
  metrics:
18
  - type: mean_reward
19
- value: 298.45 +/- 18.92
20
  name: mean_reward
21
  verified: false
22
  ---
 
16
  type: LunarLander-v2
17
  metrics:
18
  - type: mean_reward
19
+ value: 288.93 +/- 18.53
20
  name: mean_reward
21
  verified: false
22
  ---
config.json CHANGED
@@ -1 +1 @@
1
- {"policy_class": {":type:": "<class 'abc.ABCMeta'>", ":serialized:": "gAWVOwAAAAAAAACMIXN0YWJsZV9iYXNlbGluZXMzLmNvbW1vbi5wb2xpY2llc5SMEUFjdG9yQ3JpdGljUG9saWN5lJOULg==", "__module__": "stable_baselines3.common.policies", "__doc__": "\n Policy class for actor-critic algorithms (has both policy and value prediction).\n Used by A2C, PPO and the likes.\n\n :param observation_space: Observation space\n :param action_space: Action space\n :param lr_schedule: Learning rate schedule (could be constant)\n :param net_arch: The specification of the policy and value networks.\n :param activation_fn: Activation function\n :param ortho_init: Whether to use or not orthogonal initialization\n :param use_sde: Whether to use State Dependent Exploration or not\n :param log_std_init: Initial value for the log standard deviation\n :param full_std: Whether to use (n_features x n_actions) parameters\n for the std instead of only (n_features,) when using gSDE\n :param use_expln: Use ``expln()`` function instead of ``exp()`` to ensure\n a positive standard deviation (cf paper). It allows to keep variance\n above zero and prevent it from growing too fast. In practice, ``exp()`` is usually enough.\n :param squash_output: Whether to squash the output using a tanh function,\n this allows to ensure boundaries when using gSDE.\n :param features_extractor_class: Features extractor to use.\n :param features_extractor_kwargs: Keyword arguments\n to pass to the features extractor.\n :param share_features_extractor: If True, the features extractor is shared between the policy and value networks.\n :param normalize_images: Whether to normalize images or not,\n dividing by 255.0 (True by default)\n :param optimizer_class: The optimizer to use,\n ``th.optim.Adam`` by default\n :param optimizer_kwargs: Additional keyword arguments,\n excluding the learning rate, to pass to the optimizer\n ", "__init__": "<function ActorCriticPolicy.__init__ at 0x7ff7606941f0>", "_get_constructor_parameters": "<function ActorCriticPolicy._get_constructor_parameters at 0x7ff760694280>", "reset_noise": "<function ActorCriticPolicy.reset_noise at 0x7ff760694310>", "_build_mlp_extractor": "<function ActorCriticPolicy._build_mlp_extractor at 0x7ff7606943a0>", "_build": "<function ActorCriticPolicy._build at 0x7ff760694430>", "forward": "<function ActorCriticPolicy.forward at 0x7ff7606944c0>", "extract_features": "<function ActorCriticPolicy.extract_features at 0x7ff760694550>", "_get_action_dist_from_latent": "<function ActorCriticPolicy._get_action_dist_from_latent at 0x7ff7606945e0>", "_predict": "<function ActorCriticPolicy._predict at 0x7ff760694670>", "evaluate_actions": "<function ActorCriticPolicy.evaluate_actions at 0x7ff760694700>", "get_distribution": "<function ActorCriticPolicy.get_distribution at 0x7ff760694790>", "predict_values": "<function ActorCriticPolicy.predict_values at 0x7ff760694820>", "__abstractmethods__": "frozenset()", "_abc_impl": "<_abc_data object at 0x7ff7606f3d20>"}, "verbose": 0, "policy_kwargs": {}, "num_timesteps": 14008320, "_total_timesteps": 14000000, "_num_timesteps_at_start": 0, "seed": null, "action_noise": null, "start_time": 1744199644083624492, "learning_rate": 0.0003, "tensorboard_log": null, "_last_obs": {":type:": "<class 'numpy.ndarray'>", ":serialized:": "gAWVdQIAAAAAAACMEm51bXB5LmNvcmUubnVtZXJpY5SMC19mcm9tYnVmZmVylJOUKJYAAgAAAAAAAI20bD66G8o+WEDzvnURTr+Oqq4+3SUCvwAAAAAAAAAA5i2cvVP3Rz+v8IW9qreAvzN2Pb4jJfY7AAAAAAAAAAAN7UA+gw2aP9RVnD4TD+S+pQYGP5jEBT8AAAAAAAAAAIBbD71I+4u6ImdCskf1O7Edd4Y6+gyQMgAAgD8AAIA/mjmKvIUar7uCW988t5uaPOT6nzxIr4u7AACAPwAAgD/NF20+Y+2mP2qDyD5WChe/YfFNP5c/mD4AAAAAAAAAAEidqr5qaHo/dVFGvYoEN7+AXjy/1j0QPgAAAAAAAAAAALpYvCE2jbz4fag821yFPWdozj260eW6AACAPwAAgD9m1my8v497Pl+QpL25KCa/mnv4O1J/db0AAAAAAAAAAGYGxroF/9272/uVvDlP0DwgfTa9BXysPQAAgD8AAIA/mlW8u+EMnLogBoAyFETcsJOs57kL0OiyAACAPwAAgD+tTFQ+ZecxP9rv2L3A+0+/EpgFPw05s74AAAAAAAAAAJrnGzy8Bho9tlg6vjZl1r74FGO+o6yjvgAAAAAAAAAAM9ErPcTurj8SGhM/hpy4vi3QX7wibos9AAAAAAAAAABNfrM92rtHP2MIFD6/kmO/dnekPhtFcD0AAAAAAAAAADP1lbwF7tO7bfYcvAF6rzwOoSC9DqeSPQAAgD8AAIA/lIwFbnVtcHmUjAVkdHlwZZSTlIwCZjSUiYiHlFKUKEsDjAE8lE5OTkr/////Sv////9LAHSUYksQSwiGlIwBQ5R0lFKULg=="}, "_last_episode_starts": {":type:": "<class 'numpy.ndarray'>", ":serialized:": "gAWVgwAAAAAAAACMEm51bXB5LmNvcmUubnVtZXJpY5SMC19mcm9tYnVmZmVylJOUKJYQAAAAAAAAAAAAAAAAAAAAAAAAAAAAAACUjAVudW1weZSMBWR0eXBllJOUjAJiMZSJiIeUUpQoSwOMAXyUTk5OSv////9K/////0sAdJRiSxCFlIwBQ5R0lFKULg=="}, "_last_original_obs": null, "_episode_num": 0, "use_sde": false, "sde_sample_freq": -1, "_current_progress_remaining": -0.0005942857142857694, "_stats_window_size": 100, "ep_info_buffer": {":type:": "<class 'collections.deque'>", ":serialized:": "gAWV4gsAAAAAAACMC2NvbGxlY3Rpb25zlIwFZGVxdWWUk5QpS2SGlFKUKH2UKIwBcpRHQHB7mnCO3lWMAWyUS6yMAXSUR0DuoUaY1He8dX2UKGgGR0BzC7jIaLn+aAdLk2gIR0DuoUePFvQ4dX2UKGgGR0BwPkUM5OrRaAdLmGgIR0DuoUullbu/dX2UKGgGR0BxqBlxwQ18aAdLsWgIR0DuoU2wW3z+dX2UKGgGR0Bwc6cRUWEcaAdLlGgIR0DuoVBwCr93dX2UKGgGR0Bx2H127nPnaAdLn2gIR0DuocdNVR1pdX2UKGgGR0Bzl7mZE2HdaAdLuWgIR0DuocfEhq0udX2UKGgGR0B0DAVHnU2DaAdLtGgIR0DuochAbhm5dX2UKGgGR0BzNmu8scyWaAdLkWgIR0Duocj6fra/dX2UKGgGR0BypWw3YL9daAdLtGgIR0Duoc8qlxffdX2UKGgGR0BzA7gUDdP+aAdLwGgIR0DuodAFfzBidX2UKGgGR0B0G7fHggoxaAdLrGgIR0Duoc/idat+dX2UKGgGR0BylPJQtSQ6aAdLnmgIR0DuodE+8Gs4dX2UKGgGR0Bx7/IMjNY9aAdLnGgIR0DuodHG9YfXdX2UKGgGR0BxsKS8rZrYaAdLpWgIR0DuodJedkJ8dX2UKGgGR0Bz03jZL7GeaAdLtWgIR0DuodPr3TNMdX2UKGgGR0BwV/WEsasIaAdLk2gIR0DuodUBmwqzdX2UKGgGR0B0DRQ66reZaAdLt2gIR0DuodcSwGGEdX2UKGgGR0BwQYWfseGPaAdLmGgIR0Duodm/7iyZdX2UKGgGR0BwWnTspoboaAdLqWgIR0DuodpwsGxEdX2UKGgGR0ByOtoqTbFkaAdLpGgIR0DuoeWBsANodX2UKGgGR0BzyF7E5yU+aAdLomgIR0Duoed3EAHWdX2UKGgGR0BxEhwPy08eaAdLqmgIR0DuoeiblzU7dX2UKGgGR0Byc1+NLlFMaAdLuWgIR0Duoet7dBSldX2UKGgGR0BwC/zjFQ2uaAdLiWgIR0Duoevlg+hXdX2UKGgGR0BwX5iRW912aAdLlWgIR0DuofDHIZIhdX2UKGgGR0ByQtP1tfoiaAdLoWgIR0DuofLzwtrcdX2UKGgGR0Bxqk/iYLLIaAdLlmgIR0DuofP9b5dodX2UKGgGR0ByL+OinHeaaAdLrGgIR0DuofQAWBSUdX2UKGgGR0Byc4w8GLUDaAdLsGgIR0DuofQBwuM/dX2UKGgGR0Bz0IIfKZDzaAdLnGgIR0DuofanwXqJdX2UKGgGR0ByQpeRgZ0kaAdLvGgIR0DuogFbqQiidX2UKGgGR0Bz/huGbkOqaAdL5WgIR0DuogRKMefadX2UKGgGR0BxjCt5le4TaAdLuGgIR0DuogVOqNp/dX2UKGgGR0Bx1HCiyprDaAdLhmgIR0DuogcoKlYVdX2UKGgGR0Bzijghr30xaAdLyWgIR0DuogicnVoYdX2UKGgGR0ByRGO6unuRaAdLp2gIR0Duog1p+MIedX2UKGgGR0Bxfbx5LRKIaAdLomgIR0Duog8GTs6adX2UKGgGR0Bv14O8TSLJaAdLoWgIR0DuohG88La3dX2UKGgGR0B0BNwDNhVmaAdLq2gIR0DuohSSAYpEdX2UKGgGR0BxWh5s0pEyaAdLjWgIR0DuohicoYvWdX2UKGgGR0BxmgpWmxdIaAdLoWgIR0Duohpyy2QXdX2UKGgGR0BxIfVjI7vHaAdLpGgIR0Duohsom5UcdX2UKGgGR0BzcM1n/T9baAdLp2gIR0Duohvo+wC9dX2UKGgGR0Bz5uqn3ta7aAdLsGgIR0Duoh0X1J18dX2UKGgGR0ByyG4qgAZLaAdLg2gIR0DuoiV2U0N0dX2UKGgGR0By6d3NcGC7aAdLs2gIR0Duoi6q5LAYdX2UKGgGR0BGo8dgfEGaaAdLWGgIR0Duoi/a24NJdX2UKGgGR0ByPeDBdld1aAdLqmgIR0DuojJ6AOJ+dX2UKGgGR0BygsHX2/SIaAdLuGgIR0DuojNG+bmVdX2UKGgGR0B0HonE2pAEaAdLqGgIR0DuojOaR6njdX2UKGgGR0Byhg+lj3EiaAdLj2gIR0DuojQYwZfldX2UKGgGR0BvjotnPE88aAdLp2gIR0DuojhwvQF+dX2UKGgGR0Bx7VKRMewLaAdLj2gIR0Duoj8IX0oSdX2UKGgGR0BzKV7VrhzeaAdLrGgIR0Duoj+9AX2vdX2UKGgGR0BxDGNaQmu1aAdLx2gIR0DuokLkoWpIdX2UKGgGR0BwK/cynDR/aAdLomgIR0DuokQsg+yJdX2UKGgGR0BzVe9du5z6aAdLr2gIR0DuokY5ZKWcdX2UKGgGR0BznlUHY6GQaAdLsGgIR0DuokgXqqwRdX2UKGgGR0B0AQbzbvgFaAdLrWgIR0Duok80TDfndX2UKGgGR0BwiONMoMKDaAdLlWgIR0DuolFHWBjGdX2UKGgGR0BygHAM2FWXaAdNlQNoCEdA7qJT4FRpDnV9lChoBkdAcqUBw++ueWgHS6hoCEdA7qJWWLHdXXV9lChoBkdAcC9XIlt0m2gHS6VoCEdA7qJYTNMXanV9lChoBkdAcsWuFHrhSGgHS65oCEdA7qJZkEkjYHV9lChoBkdAcnbMVk+X7mgHS4FoCEdA7qJbX6Q/5nV9lChoBkdAcjMFAVwgkmgHS7JoCEdA7qJbMRpUP3V9lChoBkdAcpEU3n6l+GgHS7RoCEdA7qJb5qM3qHV9lChoBkdAdH7/J/5Ly2gHS7NoCEdA7qJfIe5nUXV9lChoBkdAcmRLux8lX2gHS5FoCEdA7qJlmkFfRnV9lChoBkdAc7y+pOvdM2gHS6doCEdA7qJm+hGpdnV9lChoBkdAcZwuoP07KmgHS6loCEdA7qJovIfbK3V9lChoBkdAclVBO58Sf2gHS8BoCEdA7qJpB9b5dnV9lChoBkdAcVwVurIYFmgHS69oCEdA7qJt7349HXV9lChoBkdAcq/FSKm8/WgHS6poCEdA7qJy6Kk2xnV9lChoBkdAcw8B1cMVlGgHS5NoCEdA7qJ1CqZMMHV9lChoBkdAct7NRFZxJmgHS7BoCEdA7qJ5FTNt7HV9lChoBkdAcMUZha1Ti2gHS59oCEdA7qJ50C7sfXV9lChoBkdAc/4UJOWSlmgHS79oCEdA7qJ5sTFl1HV9lChoBkdAclZRr8BMjGgHS5JoCEdA7qJ57LdN4HV9lChoBkdAcPi4AS39aWgHS5VoCEdA7qJ61mz0H3V9lChoBkdAcbIbMHKOk2gHS6VoCEdA7qJ7pGFzuHV9lChoBkdAckVkWRA8jmgHTV8CaAhHQO6ifD1Iy0t1fZQoaAZHQHKCQpON5t5oB0uVaAhHQO6ifYJNTLp1fZQoaAZHQHNYCpR4yGloB0u6aAhHQO6igF58jRl1fZQoaAZHQHOh5aJQ+EBoB0uXaAhHQO6igpV0cOt1fZQoaAZHQHMSR+OOsDJoB0uqaAhHQO6iiKoS+QF1fZQoaAZHQHORyzsyBTZoB0uvaAhHQO6ii2f7Jnx1fZQoaAZHQHKcZZ8rqdJoB0u2aAhHQO6ijIG2TgV1fZQoaAZHQHKNQrQPZqVoB0ukaAhHQO6ijaZML4N1fZQoaAZHQHBEtXtBv75oB0uUaAhHQO6ij1US7Gx1fZQoaAZHQHNc8XFcY65oB0uaaAhHQO6ikqBPKuB1fZQoaAZHQHGbuQZGax5oB0uRaAhHQO6ilRPwd811fZQoaAZHQG/kQXIlt0poB0uYaAhHQO6ile/tY0V1fZQoaAZHQHIY88DB/I9oB0uVaAhHQO6ilkypJf91fZQoaAZHQHIALKzRhMJoB0uaaAhHQO6ilzr3TNN1fZQoaAZHQHIys4PwuuloB0ueaAhHQO6imoqslsx1fZQoaAZHQHHpzQE6kqNoB0uraAhHQO6inDp5eJJ1fZQoaAZHQHENwSvkilloB0ufaAhHQO6inTpJPIp1fZQoaAZHQHQLWRmseXBoB0u+aAhHQO6ioi9ytFN1ZS4="}, "ep_success_buffer": {":type:": "<class 'collections.deque'>", ":serialized:": "gAWVIAAAAAAAAACMC2NvbGxlY3Rpb25zlIwFZGVxdWWUk5QpS2SGlFKULg=="}, "_n_updates": 25676, "observation_space": {":type:": "<class 'gymnasium.spaces.box.Box'>", ":serialized:": "gAWVcAIAAAAAAACMFGd5bW5hc2l1bS5zcGFjZXMuYm94lIwDQm94lJOUKYGUfZQojAVkdHlwZZSMBW51bXB5lGgFk5SMAmY0lImIh5RSlChLA4wBPJROTk5K/////0r/////SwB0lGKMDWJvdW5kZWRfYmVsb3eUjBJudW1weS5jb3JlLm51bWVyaWOUjAtfZnJvbWJ1ZmZlcpSTlCiWCAAAAAAAAAABAQEBAQEBAZRoB4wCYjGUiYiHlFKUKEsDjAF8lE5OTkr/////Sv////9LAHSUYksIhZSMAUOUdJRSlIwNYm91bmRlZF9hYm92ZZRoECiWCAAAAAAAAAABAQEBAQEBAZRoFEsIhZRoGHSUUpSMBl9zaGFwZZRLCIWUjANsb3eUaBAoliAAAAAAAAAAAAC0wgAAtMIAAKDAAACgwNsPScAAAKDAAAAAgAAAAICUaApLCIWUaBh0lFKUjARoaWdolGgQKJYgAAAAAAAAAAAAtEIAALRCAACgQAAAoEDbD0lAAACgQAAAgD8AAIA/lGgKSwiFlGgYdJRSlIwIbG93X3JlcHKUjFtbLTkwLiAgICAgICAgLTkwLiAgICAgICAgIC01LiAgICAgICAgIC01LiAgICAgICAgIC0zLjE0MTU5MjcgIC01LgogIC0wLiAgICAgICAgIC0wLiAgICAgICBdlIwJaGlnaF9yZXBylIxTWzkwLiAgICAgICAgOTAuICAgICAgICAgNS4gICAgICAgICA1LiAgICAgICAgIDMuMTQxNTkyNyAgNS4KICAxLiAgICAgICAgIDEuICAgICAgIF2UjApfbnBfcmFuZG9tlE51Yi4=", "dtype": "float32", "bounded_below": "[ True True True True True True True True]", "bounded_above": "[ True True True True True True True True]", "_shape": [8], "low": "[-90. -90. -5. -5. -3.1415927 -5.\n -0. -0. ]", "high": "[90. 90. 5. 5. 3.1415927 5.\n 1. 1. ]", "low_repr": "[-90. -90. -5. -5. -3.1415927 -5.\n -0. -0. ]", "high_repr": "[90. 90. 5. 5. 3.1415927 5.\n 1. 1. ]", "_np_random": null}, "action_space": {":type:": "<class 'gymnasium.spaces.discrete.Discrete'>", ":serialized:": "gAWV1QAAAAAAAACMGWd5bW5hc2l1bS5zcGFjZXMuZGlzY3JldGWUjAhEaXNjcmV0ZZSTlCmBlH2UKIwBbpSMFW51bXB5LmNvcmUubXVsdGlhcnJheZSMBnNjYWxhcpSTlIwFbnVtcHmUjAVkdHlwZZSTlIwCaTiUiYiHlFKUKEsDjAE8lE5OTkr/////Sv////9LAHSUYkMIBAAAAAAAAACUhpRSlIwFc3RhcnSUaAhoDkMIAAAAAAAAAACUhpRSlIwGX3NoYXBllCloCmgOjApfbnBfcmFuZG9tlE51Yi4=", "n": "4", "start": "0", "_shape": [], "dtype": "int64", "_np_random": null}, "n_envs": 16, "n_steps": 1024, "gamma": 0.999, "gae_lambda": 0.98, "ent_coef": 0.01, "vf_coef": 0.5, "max_grad_norm": 0.5, "batch_size": 64, "n_epochs": 4, "clip_range": {":type:": "<class 'function'>", ":serialized:": "gAWV5QIAAAAAAACMF2Nsb3VkcGlja2xlLmNsb3VkcGlja2xllIwOX21ha2VfZnVuY3Rpb26Uk5QoaACMDV9idWlsdGluX3R5cGWUk5SMCENvZGVUeXBllIWUUpQoSwFLAEsASwFLAUsTQwSIAFMAlE6FlCmMAV+UhZSMZS9ob21lL3NlbmxpLy5jb25kYS9lbnZzL3NlbmxpX1B5dGhvbjMuOC9saWIvcHl0aG9uMy44L3NpdGUtcGFja2FnZXMvc3RhYmxlX2Jhc2VsaW5lczMvY29tbW9uL3V0aWxzLnB5lIwEZnVuY5RLhEMCAAGUjAN2YWyUhZQpdJRSlH2UKIwLX19wYWNrYWdlX1+UjBhzdGFibGVfYmFzZWxpbmVzMy5jb21tb26UjAhfX25hbWVfX5SMHnN0YWJsZV9iYXNlbGluZXMzLmNvbW1vbi51dGlsc5SMCF9fZmlsZV9flIxlL2hvbWUvc2VubGkvLmNvbmRhL2VudnMvc2VubGlfUHl0aG9uMy44L2xpYi9weXRob24zLjgvc2l0ZS1wYWNrYWdlcy9zdGFibGVfYmFzZWxpbmVzMy9jb21tb24vdXRpbHMucHmUdU5OaACMEF9tYWtlX2VtcHR5X2NlbGyUk5QpUpSFlHSUUpRoAIwSX2Z1bmN0aW9uX3NldHN0YXRllJOUaB99lH2UKGgWjARmdW5jlIwMX19xdWFsbmFtZV9flIwZY29uc3RhbnRfZm4uPGxvY2Fscz4uZnVuY5SMD19fYW5ub3RhdGlvbnNfX5R9lIwOX19rd2RlZmF1bHRzX1+UTowMX19kZWZhdWx0c19flE6MCl9fbW9kdWxlX1+UaBeMB19fZG9jX1+UTowLX19jbG9zdXJlX1+UaACMCl9tYWtlX2NlbGyUk5RHP8mZmZmZmZqFlFKUhZSMF19jbG91ZHBpY2tsZV9zdWJtb2R1bGVzlF2UjAtfX2dsb2JhbHNfX5R9lHWGlIZSMC4="}, "clip_range_vf": null, "normalize_advantage": true, "target_kl": null, "lr_schedule": {":type:": "<class 'function'>", ":serialized:": "gAWV5QIAAAAAAACMF2Nsb3VkcGlja2xlLmNsb3VkcGlja2xllIwOX21ha2VfZnVuY3Rpb26Uk5QoaACMDV9idWlsdGluX3R5cGWUk5SMCENvZGVUeXBllIWUUpQoSwFLAEsASwFLAUsTQwSIAFMAlE6FlCmMAV+UhZSMZS9ob21lL3NlbmxpLy5jb25kYS9lbnZzL3NlbmxpX1B5dGhvbjMuOC9saWIvcHl0aG9uMy44L3NpdGUtcGFja2FnZXMvc3RhYmxlX2Jhc2VsaW5lczMvY29tbW9uL3V0aWxzLnB5lIwEZnVuY5RLhEMCAAGUjAN2YWyUhZQpdJRSlH2UKIwLX19wYWNrYWdlX1+UjBhzdGFibGVfYmFzZWxpbmVzMy5jb21tb26UjAhfX25hbWVfX5SMHnN0YWJsZV9iYXNlbGluZXMzLmNvbW1vbi51dGlsc5SMCF9fZmlsZV9flIxlL2hvbWUvc2VubGkvLmNvbmRhL2VudnMvc2VubGlfUHl0aG9uMy44L2xpYi9weXRob24zLjgvc2l0ZS1wYWNrYWdlcy9zdGFibGVfYmFzZWxpbmVzMy9jb21tb24vdXRpbHMucHmUdU5OaACMEF9tYWtlX2VtcHR5X2NlbGyUk5QpUpSFlHSUUpRoAIwSX2Z1bmN0aW9uX3NldHN0YXRllJOUaB99lH2UKGgWjARmdW5jlIwMX19xdWFsbmFtZV9flIwZY29uc3RhbnRfZm4uPGxvY2Fscz4uZnVuY5SMD19fYW5ub3RhdGlvbnNfX5R9lIwOX19rd2RlZmF1bHRzX1+UTowMX19kZWZhdWx0c19flE6MCl9fbW9kdWxlX1+UaBeMB19fZG9jX1+UTowLX19jbG9zdXJlX1+UaACMCl9tYWtlX2NlbGyUk5RHPzOpKjBVMmGFlFKUhZSMF19jbG91ZHBpY2tsZV9zdWJtb2R1bGVzlF2UjAtfX2dsb2JhbHNfX5R9lHWGlIZSMC4="}, "system_info": {"OS": "Linux-5.15.0-134-generic-x86_64-with-glibc2.17 # 145-Ubuntu SMP Wed Feb 12 20:08:39 UTC 2025", "Python": "3.8.20", "Stable-Baselines3": "2.0.0a5", "PyTorch": "2.4.1+cu121", "GPU Enabled": "True", "Numpy": "1.24.4", "Cloudpickle": "3.1.1", "Gymnasium": "0.28.1", "OpenAI Gym": "0.26.2"}}
 
1
+ {"policy_class": {":type:": "<class 'abc.ABCMeta'>", ":serialized:": "gAWVOwAAAAAAAACMIXN0YWJsZV9iYXNlbGluZXMzLmNvbW1vbi5wb2xpY2llc5SMEUFjdG9yQ3JpdGljUG9saWN5lJOULg==", "__module__": "stable_baselines3.common.policies", "__doc__": "\n Policy class for actor-critic algorithms (has both policy and value prediction).\n Used by A2C, PPO and the likes.\n\n :param observation_space: Observation space\n :param action_space: Action space\n :param lr_schedule: Learning rate schedule (could be constant)\n :param net_arch: The specification of the policy and value networks.\n :param activation_fn: Activation function\n :param ortho_init: Whether to use or not orthogonal initialization\n :param use_sde: Whether to use State Dependent Exploration or not\n :param log_std_init: Initial value for the log standard deviation\n :param full_std: Whether to use (n_features x n_actions) parameters\n for the std instead of only (n_features,) when using gSDE\n :param use_expln: Use ``expln()`` function instead of ``exp()`` to ensure\n a positive standard deviation (cf paper). It allows to keep variance\n above zero and prevent it from growing too fast. In practice, ``exp()`` is usually enough.\n :param squash_output: Whether to squash the output using a tanh function,\n this allows to ensure boundaries when using gSDE.\n :param features_extractor_class: Features extractor to use.\n :param features_extractor_kwargs: Keyword arguments\n to pass to the features extractor.\n :param share_features_extractor: If True, the features extractor is shared between the policy and value networks.\n :param normalize_images: Whether to normalize images or not,\n dividing by 255.0 (True by default)\n :param optimizer_class: The optimizer to use,\n ``th.optim.Adam`` by default\n :param optimizer_kwargs: Additional keyword arguments,\n excluding the learning rate, to pass to the optimizer\n ", "__init__": "<function ActorCriticPolicy.__init__ at 0x7f2803f51160>", "_get_constructor_parameters": "<function ActorCriticPolicy._get_constructor_parameters at 0x7f2803f511f0>", "reset_noise": "<function ActorCriticPolicy.reset_noise at 0x7f2803f51280>", "_build_mlp_extractor": "<function ActorCriticPolicy._build_mlp_extractor at 0x7f2803f51310>", "_build": "<function ActorCriticPolicy._build at 0x7f2803f513a0>", "forward": "<function ActorCriticPolicy.forward at 0x7f2803f51430>", "extract_features": "<function ActorCriticPolicy.extract_features at 0x7f2803f514c0>", "_get_action_dist_from_latent": "<function ActorCriticPolicy._get_action_dist_from_latent at 0x7f2803f51550>", "_predict": "<function ActorCriticPolicy._predict at 0x7f2803f515e0>", "evaluate_actions": "<function ActorCriticPolicy.evaluate_actions at 0x7f2803f51670>", "get_distribution": "<function ActorCriticPolicy.get_distribution at 0x7f2803f51700>", "predict_values": "<function ActorCriticPolicy.predict_values at 0x7f2803f51790>", "__abstractmethods__": "frozenset()", "_abc_impl": "<_abc_data object at 0x7f2803fb2d20>"}, "verbose": 0, "policy_kwargs": {}, "num_timesteps": 14008320, "_total_timesteps": 14000000, "_num_timesteps_at_start": 0, "seed": null, "action_noise": null, "start_time": 1744204003805074415, "learning_rate": 0.0003, "tensorboard_log": null, "_last_obs": {":type:": "<class 'numpy.ndarray'>", ":serialized:": "gAWVdQIAAAAAAACMEm51bXB5LmNvcmUubnVtZXJpY5SMC19mcm9tYnVmZmVylJOUKJYAAgAAAAAAAGbOHzuu9bG6U1fyOI1Z1zOa2nu5p4MKuAAAgD8AAIA/AFiPO+E6gLryTAw8Fz2itbjkejuQ3520AACAPwAAgD+aI3E9+9H9O4hp4L7OE4O+GYJ0voi4OT8AAIA/AAAAAGZEhLxtMAY/VrKwPG4MXb94W3C9ZkPCPAAAAAAAAAAAZkaGu1yjYrrIJGM88UfPuB8UiLraRsq3AACAPwAAgD/TLm4+au2tP+fuCD8dBha/g1EAP2hJzD4AAAAAAAAAAGZmiDnSxam7FHKhPM5dhDyZ6+s8gmRivQAAgD8AAIA/zRS0u72Wfjy+TIM9AP2xvvRzqT2vMLA9AAAAAAAAAAAaLhy+IWR5PqnmvD4lMSm/jUofvjHPoT4AAAAAAAAAAL0ipz5Ir1o/fuUnvWycUr/wLyw/+ElUvgAAAAAAAAAAyphcvpF9hT8DUU2+0oBQv3lRJL+vToy7AAAAAAAAAAAz/y+80qXzu4qzUDyyv6E8XyM+PSISh70AAIA/AACAP4COB73LQpI/HKCkvaMfWr/PlQi+lZ6ivAAAAAAAAAAAZjxnPPmxsj9iIjU/ssSvvm5FaLxuFfS9AAAAAAAAAACaPcy7duMGvKgqoL2nocQ8MLjmuz3HjDsAAIA/AACAP5rl0rtIaZO64n4aODM3CTPtP+06zvcytwAAgD8AAIA/lIwFbnVtcHmUjAVkdHlwZZSTlIwCZjSUiYiHlFKUKEsDjAE8lE5OTkr/////Sv////9LAHSUYksQSwiGlIwBQ5R0lFKULg=="}, "_last_episode_starts": {":type:": "<class 'numpy.ndarray'>", ":serialized:": "gAWVgwAAAAAAAACMEm51bXB5LmNvcmUubnVtZXJpY5SMC19mcm9tYnVmZmVylJOUKJYQAAAAAAAAAAAAAAAAAAAAAAAAAAAAAACUjAVudW1weZSMBWR0eXBllJOUjAJiMZSJiIeUUpQoSwOMAXyUTk5OSv////9K/////0sAdJRiSxCFlIwBQ5R0lFKULg=="}, "_last_original_obs": null, "_episode_num": 0, "use_sde": false, "sde_sample_freq": -1, "_current_progress_remaining": -0.0005942857142857694, "_stats_window_size": 100, "ep_info_buffer": {":type:": "<class 'collections.deque'>", ":serialized:": "gAWV4QsAAAAAAACMC2NvbGxlY3Rpb25zlIwFZGVxdWWUk5QpS2SGlFKUKH2UKIwBcpRHQHSYG3BpHqiMAWyUS8mMAXSUR0DxDX5Xe3x4dX2UKGgGR0Bx/qsPrfLtaAdLqGgIR0DxDYAwljVhdX2UKGgGR0BxIf4IrvsraAdLo2gIR0DxDcBgte2NdX2UKGgGR0BxhzQZ4wAVaAdLmWgIR0DxDcEmnO0LdX2UKGgGR0ByPl/Ue+23aAdLoGgIR0DxDcFPl+3IdX2UKGgGR0Byb1w1ivxIaAdLkmgIR0DxDcHYYBNmdX2UKGgGR0BzByp71Iy1aAdLv2gIR0DxDcJnV5KOdX2UKGgGR0Bz9b7vXsgMaAdLwWgIR0DxDcLOinHedX2UKGgGR0BySv3fyf+TaAdLq2gIR0DxDcPYLLIQdX2UKGgGR0Bx2RQSBbwCaAdLqWgIR0DxDcP5JsfrdX2UKGgGR0ByvvjDKoycaAdLkmgIR0DxDcQVzIV/dX2UKGgGR0Bzbjh1klNUaAdLpWgIR0DxDcdUkfLcdX2UKGgGR0ByGITh5xBFaAdLxmgIR0DxDcgIOH32dX2UKGgGR0BxHWDzyz5XaAdLn2gIR0DxDcg8Hv+gdX2UKGgGR0ByBWynk1dgaAdLl2gIR0DxDciq4YrKdX2UKGgGR0BxPfDfm9xqaAdLoWgIR0DxDckTCLuQdX2UKGgGR0BxqiSRr8BNaAdLk2gIR0DxDcmV81GcdX2UKGgGR0BLIYbjtG/faAdLa2gIR0DxDcuQQ+UydX2UKGgGR0BxrZjtoi9qaAdLqmgIR0DxDc1sTnJUdX2UKGgGR0BxGNC7btZ3aAdLlGgIR0DxDc72ys0YdX2UKGgGR0Bz/NYJVsDXaAdLsWgIR0DxDc/xCIDYdX2UKGgGR0Bvzq9/SYw7aAdLpWgIR0DxDdACJoCddX2UKGgGR0BwoyIsRQJpaAdLlWgIR0DxDdB3W4EwdX2UKGgGR0Bxa17eEZivaAdLtGgIR0DxDdE3eenRdX2UKGgGR0BwYbyf+S8raAdLlWgIR0DxDdHmMOwxdX2UKGgGR0BTiiblRxcWaAdLgGgIR0DxDdWwfQrudX2UKGgGR0Byy/dWQwK0aAdLvmgIR0DxDdaVsUItdX2UKGgGR0BxsKfRNRFaaAdLxGgIR0DxDddwAU+LdX2UKGgGR0ByAarMkhRqaAdLnmgIR0DxDden0TURdX2UKGgGR0ByVCjynUDuaAdLlmgIR0DxDdihs67vdX2UKGgGR0By5tXo1UEQaAdLmWgIR0DxDdl8K5TZdX2UKGgGR0BzvsG0NSZSaAdLrGgIR0DxDdnrMTvidX2UKGgGR0BD2RGlQ/HHaAdLamgIR0DxDdpYpDu0dX2UKGgGR0ByBEg2ZRbbaAdLu2gIR0DxDduM72csdX2UKGgGR0B0S6fEn9ehaAdLtGgIR0DxDd41IiC8dX2UKGgGR0BwF1LM9r44aAdLi2gIR0DxDd5tNzsAdX2UKGgGR0BxdC1twaR7aAdLkmgIR0DxDd9A2hqTdX2UKGgGR0Bz7ufBeokzaAdLxmgIR0DxDeJLJSzgdX2UKGgGR0BwAe6g/TsqaAdLo2gIR0DxDeJ+uNgjdX2UKGgGR0BzqnN7jT8YaAdLpWgIR0DxDeNgZTAGdX2UKGgGR0BzAA+wC8vmaAdLuWgIR0DxDeQCFbmmdX2UKGgGR0BwWYmhM8HOaAdLkGgIR0DxDeTUyHmBdX2UKGgGR0BxfgWnCO3laAdLiWgIR0DxDeWV0Lc9dX2UKGgGR0Byuavs7dSEaAdLmWgIR0DxDehUmlZYdX2UKGgGR0Bzsi8AaNuMaAdLsWgIR0DxDejliBoVdX2UKGgGR0Bxh/LowEhaaAdLqmgIR0DxDek8kD6ndX2UKGgGR0BwPcg+yJKraAdLnmgIR0DxDem/T9bYdX2UKGgGR0Bw5cZNwiqyaAdLomgIR0DxDeqCBf8edX2UKGgGR0BzfjqPfbblaAdLnWgIR0DxDep36Q/5dX2UKGgGR0BN4jIzWPLgaAdLgGgIR0DxDeyOearndX2UKGgGR0Bzg4cPvrnlaAdLpWgIR0DxDe+NhVlxdX2UKGgGR0B0F6QV9F4LaAdLxGgIR0DxDfAL7oB8dX2UKGgGR0BxqQwnH/96aAdLmWgIR0DxDfKndfsvdX2UKGgGR0B0LZ/iHZbqaAdLxmgIR0DxDfOW7OE/dX2UKGgGR0BxdzMdLg4waAdLpWgIR0DxDfT64UeudX2UKGgGR0Bx51n003wTaAdLo2gIR0DxDfVgi/widX2UKGgGR0BzMzVH4GliaAdLuWgIR0DxDfYDU3GXdX2UKGgGR0Bxx7HcUM5PaAdLqmgIR0DxDffQbMoudX2UKGgGR0Byk+fSQYDUaAdLs2gIR0DxDffw4sErdX2UKGgGR0ByugsI3R5UaAdLkWgIR0DxDfgASWZ7dX2UKGgGR0BxxkcFQl8gaAdLiGgIR0DxDfkpe/pMdX2UKGgGR0BwXaPPszEaaAdLpWgIR0DxDfqVcUuddX2UKGgGR0Bvnac7QswtaAdLmmgIR0DxDfsJqIrOdX2UKGgGR0BzMEsAeaKDaAdLqmgIR0DxDfvsTFl1dX2UKGgGR0B0MjUmUnogaAdLvmgIR0DxDf1y0rsjdX2UKGgGR0BwUwMOPNmlaAdLiGgIR0DxDf4QYk3TdX2UKGgGR0BxOAp4KQaKaAdLmGgIR0DxDgA0QK8ddX2UKGgGR0BwtBTJhfBvaAdLm2gIR0DxDgNZLIxQdX2UKGgGR0BxDsVIqbz9aAdLl2gIR0DxDgaohY/3dX2UKGgGR0ByBJSxZ+x4aAdLimgIR0DxDgqsunMudX2UKGgGR0BzS89Oh0yQaAdLu2gIR0DxDgqJaJQ+dX2UKGgGR0BznFStNi6QaAdLxGgIR0DxDgs69CeFdX2UKGgGR0BxnrLU1AJLaAdLnWgIR0DxDgt4W1twdX2UKGgGR0Bx5t7hNucdaAdLrWgIR0DxDgvgsbvPdX2UKGgGR0BxqeAe7tiQaAdLsGgIR0DxDgxUj9n9dX2UKGgGR0BwwCQLeANHaAdLuWgIR0DxDg0v+OwQdX2UKGgGR0BwXulrM1TBaAdLkGgIR0DxDg0eOn2qdX2UKGgGR0BzuyoKlYU4aAdL5GgIR0DxDg2ImPYGdX2UKGgGR0BzUulGgBcSaAdLvGgIR0DxDhES1maqdX2UKGgGR0BzIwhFEy+IaAdLrGgIR0DxDhKsRQJpdX2UKGgGR0BzPPiS7oStaAdLtmgIR0DxDhMi9qUNdX2UKGgGR0BzfHslb/wRaAdLpWgIR0DxDhQ+F10UdX2UKGgGR0BwHAUuctoSaAdLoGgIR0DxDhbI9TxYdX2UKGgGR0BwwW1eBxxUaAdLn2gIR0DxDhnSQYDUdX2UKGgGR0BzLT/xUedTaAdLkmgIR0DxDhwANG3GdX2UKGgGR0ByxHrB0p3HaAdLjWgIR0DxDhyGn4widX2UKGgGR0BxbpelbeMyaAdLkWgIR0DxDh1uTRpldX2UKGgGR0Bym5Uo8ZDRaAdLnWgIR0DxDh3GNrCWdX2UKGgGR0BwNmhew9q2aAdLpmgIR0DxDh5MVUModX2UKGgGR0ByW6N4qwyJaAdLoGgIR0DxDh5ppvgndX2UKGgGR0By+myv9tMxaAdLlmgIR0DxDh7QN0/4dX2UKGgGR0ByUoIkZ75VaAdLmWgIR0DxDh81jy4GdX2UKGgGR0BwCxorWiDeaAdLnWgIR0DxDh//keZHdX2UKGgGR0BxqZ16mfoSaAdLkmgIR0DxDiOf1pTNdX2UKGgGR0Bx0tTXJ5miaAdLmGgIR0DxDiTKA8SxdX2UKGgGR0BxnRbdJrckaAdLmmgIR0DxDiYC+De1dX2UKGgGR0Bz2Wtnwob5aAdLt2gIR0DxDiZdnTRZdX2UKGgGR0BzfgBtDUmVaAdNBQJoCEdA8Q4nviDM/3V9lChoBkdAcsZqBmPHUGgHS5loCEdA8Q4oaBNEgHV9lChoBkdAdBeMtsenymgHS6VoCEdA8Q4sMPnSv3VlLg=="}, "ep_success_buffer": {":type:": "<class 'collections.deque'>", ":serialized:": "gAWVIAAAAAAAAACMC2NvbGxlY3Rpb25zlIwFZGVxdWWUk5QpS2SGlFKULg=="}, "_n_updates": 25676, "observation_space": {":type:": "<class 'gymnasium.spaces.box.Box'>", ":serialized:": "gAWVcAIAAAAAAACMFGd5bW5hc2l1bS5zcGFjZXMuYm94lIwDQm94lJOUKYGUfZQojAVkdHlwZZSMBW51bXB5lGgFk5SMAmY0lImIh5RSlChLA4wBPJROTk5K/////0r/////SwB0lGKMDWJvdW5kZWRfYmVsb3eUjBJudW1weS5jb3JlLm51bWVyaWOUjAtfZnJvbWJ1ZmZlcpSTlCiWCAAAAAAAAAABAQEBAQEBAZRoB4wCYjGUiYiHlFKUKEsDjAF8lE5OTkr/////Sv////9LAHSUYksIhZSMAUOUdJRSlIwNYm91bmRlZF9hYm92ZZRoECiWCAAAAAAAAAABAQEBAQEBAZRoFEsIhZRoGHSUUpSMBl9zaGFwZZRLCIWUjANsb3eUaBAoliAAAAAAAAAAAAC0wgAAtMIAAKDAAACgwNsPScAAAKDAAAAAgAAAAICUaApLCIWUaBh0lFKUjARoaWdolGgQKJYgAAAAAAAAAAAAtEIAALRCAACgQAAAoEDbD0lAAACgQAAAgD8AAIA/lGgKSwiFlGgYdJRSlIwIbG93X3JlcHKUjFtbLTkwLiAgICAgICAgLTkwLiAgICAgICAgIC01LiAgICAgICAgIC01LiAgICAgICAgIC0zLjE0MTU5MjcgIC01LgogIC0wLiAgICAgICAgIC0wLiAgICAgICBdlIwJaGlnaF9yZXBylIxTWzkwLiAgICAgICAgOTAuICAgICAgICAgNS4gICAgICAgICA1LiAgICAgICAgIDMuMTQxNTkyNyAgNS4KICAxLiAgICAgICAgIDEuICAgICAgIF2UjApfbnBfcmFuZG9tlE51Yi4=", "dtype": "float32", "bounded_below": "[ True True True True True True True True]", "bounded_above": "[ True True True True True True True True]", "_shape": [8], "low": "[-90. -90. -5. -5. -3.1415927 -5.\n -0. -0. ]", "high": "[90. 90. 5. 5. 3.1415927 5.\n 1. 1. ]", "low_repr": "[-90. -90. -5. -5. -3.1415927 -5.\n -0. -0. ]", "high_repr": "[90. 90. 5. 5. 3.1415927 5.\n 1. 1. ]", "_np_random": null}, "action_space": {":type:": "<class 'gymnasium.spaces.discrete.Discrete'>", ":serialized:": "gAWV1QAAAAAAAACMGWd5bW5hc2l1bS5zcGFjZXMuZGlzY3JldGWUjAhEaXNjcmV0ZZSTlCmBlH2UKIwBbpSMFW51bXB5LmNvcmUubXVsdGlhcnJheZSMBnNjYWxhcpSTlIwFbnVtcHmUjAVkdHlwZZSTlIwCaTiUiYiHlFKUKEsDjAE8lE5OTkr/////Sv////9LAHSUYkMIBAAAAAAAAACUhpRSlIwFc3RhcnSUaAhoDkMIAAAAAAAAAACUhpRSlIwGX3NoYXBllCloCmgOjApfbnBfcmFuZG9tlE51Yi4=", "n": "4", "start": "0", "_shape": [], "dtype": "int64", "_np_random": null}, "n_envs": 16, "n_steps": 1024, "gamma": 0.999, "gae_lambda": 0.98, "ent_coef": 0.01, "vf_coef": 0.5, "max_grad_norm": 0.5, "batch_size": 64, "n_epochs": 4, "clip_range": {":type:": "<class 'function'>", ":serialized:": "gAWV5QIAAAAAAACMF2Nsb3VkcGlja2xlLmNsb3VkcGlja2xllIwOX21ha2VfZnVuY3Rpb26Uk5QoaACMDV9idWlsdGluX3R5cGWUk5SMCENvZGVUeXBllIWUUpQoSwFLAEsASwFLAUsTQwSIAFMAlE6FlCmMAV+UhZSMZS9ob21lL3NlbmxpLy5jb25kYS9lbnZzL3NlbmxpX1B5dGhvbjMuOC9saWIvcHl0aG9uMy44L3NpdGUtcGFja2FnZXMvc3RhYmxlX2Jhc2VsaW5lczMvY29tbW9uL3V0aWxzLnB5lIwEZnVuY5RLhEMCAAGUjAN2YWyUhZQpdJRSlH2UKIwLX19wYWNrYWdlX1+UjBhzdGFibGVfYmFzZWxpbmVzMy5jb21tb26UjAhfX25hbWVfX5SMHnN0YWJsZV9iYXNlbGluZXMzLmNvbW1vbi51dGlsc5SMCF9fZmlsZV9flIxlL2hvbWUvc2VubGkvLmNvbmRhL2VudnMvc2VubGlfUHl0aG9uMy44L2xpYi9weXRob24zLjgvc2l0ZS1wYWNrYWdlcy9zdGFibGVfYmFzZWxpbmVzMy9jb21tb24vdXRpbHMucHmUdU5OaACMEF9tYWtlX2VtcHR5X2NlbGyUk5QpUpSFlHSUUpRoAIwSX2Z1bmN0aW9uX3NldHN0YXRllJOUaB99lH2UKGgWjARmdW5jlIwMX19xdWFsbmFtZV9flIwZY29uc3RhbnRfZm4uPGxvY2Fscz4uZnVuY5SMD19fYW5ub3RhdGlvbnNfX5R9lIwOX19rd2RlZmF1bHRzX1+UTowMX19kZWZhdWx0c19flE6MCl9fbW9kdWxlX1+UaBeMB19fZG9jX1+UTowLX19jbG9zdXJlX1+UaACMCl9tYWtlX2NlbGyUk5RHP8mZmZmZmZqFlFKUhZSMF19jbG91ZHBpY2tsZV9zdWJtb2R1bGVzlF2UjAtfX2dsb2JhbHNfX5R9lHWGlIZSMC4="}, "clip_range_vf": null, "normalize_advantage": true, "target_kl": null, "lr_schedule": {":type:": "<class 'function'>", ":serialized:": "gAWV5QIAAAAAAACMF2Nsb3VkcGlja2xlLmNsb3VkcGlja2xllIwOX21ha2VfZnVuY3Rpb26Uk5QoaACMDV9idWlsdGluX3R5cGWUk5SMCENvZGVUeXBllIWUUpQoSwFLAEsASwFLAUsTQwSIAFMAlE6FlCmMAV+UhZSMZS9ob21lL3NlbmxpLy5jb25kYS9lbnZzL3NlbmxpX1B5dGhvbjMuOC9saWIvcHl0aG9uMy44L3NpdGUtcGFja2FnZXMvc3RhYmxlX2Jhc2VsaW5lczMvY29tbW9uL3V0aWxzLnB5lIwEZnVuY5RLhEMCAAGUjAN2YWyUhZQpdJRSlH2UKIwLX19wYWNrYWdlX1+UjBhzdGFibGVfYmFzZWxpbmVzMy5jb21tb26UjAhfX25hbWVfX5SMHnN0YWJsZV9iYXNlbGluZXMzLmNvbW1vbi51dGlsc5SMCF9fZmlsZV9flIxlL2hvbWUvc2VubGkvLmNvbmRhL2VudnMvc2VubGlfUHl0aG9uMy44L2xpYi9weXRob24zLjgvc2l0ZS1wYWNrYWdlcy9zdGFibGVfYmFzZWxpbmVzMy9jb21tb24vdXRpbHMucHmUdU5OaACMEF9tYWtlX2VtcHR5X2NlbGyUk5QpUpSFlHSUUpRoAIwSX2Z1bmN0aW9uX3NldHN0YXRllJOUaB99lH2UKGgWjARmdW5jlIwMX19xdWFsbmFtZV9flIwZY29uc3RhbnRfZm4uPGxvY2Fscz4uZnVuY5SMD19fYW5ub3RhdGlvbnNfX5R9lIwOX19rd2RlZmF1bHRzX1+UTowMX19kZWZhdWx0c19flE6MCl9fbW9kdWxlX1+UaBeMB19fZG9jX1+UTowLX19jbG9zdXJlX1+UaACMCl9tYWtlX2NlbGyUk5RHPzOpKjBVMmGFlFKUhZSMF19jbG91ZHBpY2tsZV9zdWJtb2R1bGVzlF2UjAtfX2dsb2JhbHNfX5R9lHWGlIZSMC4="}, "system_info": {"OS": "Linux-5.15.0-134-generic-x86_64-with-glibc2.17 # 145-Ubuntu SMP Wed Feb 12 20:08:39 UTC 2025", "Python": "3.8.20", "Stable-Baselines3": "2.0.0a5", "PyTorch": "2.4.1+cu121", "GPU Enabled": "True", "Numpy": "1.24.4", "Cloudpickle": "3.1.1", "Gymnasium": "0.28.1", "OpenAI Gym": "0.26.2"}}
replay.mp4 CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:63cde384c248a8902d3c3bbbb7ac40632d48023c8dc9908fc3d8dc432c07aee1
3
- size 162590
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:66632549a98444f6dc92b9323a11c86e50ce07ab796e82a4d9bc84b6f65ec46a
3
+ size 158465
results.json CHANGED
@@ -1 +1 @@
1
- {"mean_reward": 298.4455764, "std_reward": 18.91756831948335, "is_deterministic": true, "n_eval_episodes": 10, "eval_datetime": "2025-04-09T14:04:14.867966"}
 
1
+ {"mean_reward": 288.9304148, "std_reward": 18.526441769155003, "is_deterministic": true, "n_eval_episodes": 10, "eval_datetime": "2025-04-09T15:52:03.252837"}