CoderMan-O commited on
Commit
36dc6b3
·
verified ·
1 Parent(s): 3134c0d

Upload PPO BipedalWalker-v3 trained agent

Browse files
BipedalWalker-v3.zip CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:7a4d0702e184611e78cf370b25feca519e76c33fb3cb25161cf994050f776ad6
3
- size 173325
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:7f32267edd904b8cab23930eb85c7f3af605e7a4477e8d9fd2bdce341c41cce4
3
+ size 176431
BipedalWalker-v3/data CHANGED
@@ -4,34 +4,34 @@
4
  ":serialized:": "gAWVOwAAAAAAAACMIXN0YWJsZV9iYXNlbGluZXMzLmNvbW1vbi5wb2xpY2llc5SMEUFjdG9yQ3JpdGljUG9saWN5lJOULg==",
5
  "__module__": "stable_baselines3.common.policies",
6
  "__doc__": "\n Policy class for actor-critic algorithms (has both policy and value prediction).\n Used by A2C, PPO and the likes.\n\n :param observation_space: Observation space\n :param action_space: Action space\n :param lr_schedule: Learning rate schedule (could be constant)\n :param net_arch: The specification of the policy and value networks.\n :param activation_fn: Activation function\n :param ortho_init: Whether to use or not orthogonal initialization\n :param use_sde: Whether to use State Dependent Exploration or not\n :param log_std_init: Initial value for the log standard deviation\n :param full_std: Whether to use (n_features x n_actions) parameters\n for the std instead of only (n_features,) when using gSDE\n :param use_expln: Use ``expln()`` function instead of ``exp()`` to ensure\n a positive standard deviation (cf paper). It allows to keep variance\n above zero and prevent it from growing too fast. In practice, ``exp()`` is usually enough.\n :param squash_output: Whether to squash the output using a tanh function,\n this allows to ensure boundaries when using gSDE.\n :param features_extractor_class: Features extractor to use.\n :param features_extractor_kwargs: Keyword arguments\n to pass to the features extractor.\n :param share_features_extractor: If True, the features extractor is shared between the policy and value networks.\n :param normalize_images: Whether to normalize images or not,\n dividing by 255.0 (True by default)\n :param optimizer_class: The optimizer to use,\n ``th.optim.Adam`` by default\n :param optimizer_kwargs: Additional keyword arguments,\n excluding the learning rate, to pass to the optimizer\n ",
7
- "__init__": "<function ActorCriticPolicy.__init__ at 0x783b7dbb27a0>",
8
- "_get_constructor_parameters": "<function ActorCriticPolicy._get_constructor_parameters at 0x783b7dbb2830>",
9
- "reset_noise": "<function ActorCriticPolicy.reset_noise at 0x783b7dbb28c0>",
10
- "_build_mlp_extractor": "<function ActorCriticPolicy._build_mlp_extractor at 0x783b7dbb2950>",
11
- "_build": "<function ActorCriticPolicy._build at 0x783b7dbb29e0>",
12
- "forward": "<function ActorCriticPolicy.forward at 0x783b7dbb2a70>",
13
- "extract_features": "<function ActorCriticPolicy.extract_features at 0x783b7dbb2b00>",
14
- "_get_action_dist_from_latent": "<function ActorCriticPolicy._get_action_dist_from_latent at 0x783b7dbb2b90>",
15
- "_predict": "<function ActorCriticPolicy._predict at 0x783b7dbb2c20>",
16
- "evaluate_actions": "<function ActorCriticPolicy.evaluate_actions at 0x783b7dbb2cb0>",
17
- "get_distribution": "<function ActorCriticPolicy.get_distribution at 0x783b7dbb2d40>",
18
- "predict_values": "<function ActorCriticPolicy.predict_values at 0x783b7dbb2dd0>",
19
  "__abstractmethods__": "frozenset()",
20
- "_abc_impl": "<_abc._abc_data object at 0x783b7db57600>"
21
  },
22
  "verbose": 1,
23
  "policy_kwargs": {},
24
- "num_timesteps": 4800,
25
- "_total_timesteps": 2000,
26
  "_num_timesteps_at_start": 0,
27
  "seed": null,
28
  "action_noise": null,
29
- "start_time": 1714022747756011012,
30
  "learning_rate": 0.0003,
31
  "tensorboard_log": null,
32
  "_last_obs": {
33
  ":type:": "<class 'numpy.ndarray'>",
34
- ":serialized:": "gAWVdQYAAAAAAACMEm51bXB5LmNvcmUubnVtZXJpY5SMC19mcm9tYnVmZmVylJOUKJYABgAAAAAAAJfx1T0yGOw6RPSNvXNMwrztv40/yB5tP6YuTD/9/3+/AACAPyio775VwQ+/LE6svv3/fz8AAAAAuySQPsvHkT7m4ZY+dRSgPvilrj5GAMU+KePnPt7YED+K5UY/AACAP9pWkj6E//i8kj8nPUEONbwRhVa/QDIdOwA1X764fn8/AACAPxpflT88IYA/Ui4yP1XXf78AAAAAOR58PjL7fj7W84M+/f6LPpe8mD73SKw+XsvKPktZ/T5a8S0/AACAP/2niT8WpqC9L8NePRYJ1Dyr42c+HrGnPvB/Cb4A+2W8AACAP5sRSb82WeU+YNgiv8W84rsAAIA/SFybPvUfnT6zn6I+fImsPjk9vD7TVNQ+su75PnAeHD/bX1Y/AACAP+KZij5DS2w9jmmHvKi3KjzfL4U/Hby3vljLLD+UYE+9AACAP+ymV7+cSQO/+m0mvwEAgL8AAAAAmI2DPg4MhT4UtIk++RiSPrpknz41y7M+BKLTPv8xBD8XhjU/AACAPxHApD/Akd492si4PCgoC7od4le+4MLKvSihMr/9/3+/AAAAAL3bV78AAIC/TIkiv5Xjvj4AAAAAox6oPmgHqj7D+q8+97S6PtWyyz71xOU+rzoHP73wKD+pVWg/AACAP4RRwT4Pvow9Vrb9Ozov7jrDxD0+gDVeuzAVOT77/38/AAAAANuAEr9QpVu/HVZvPwAAAAAAAAAAd2DyPh4h9T5Vtf0+QZYGP9jVEj/boCU/fPVCP12Pcz8AAIA/AACAPzs3kD42UZW7lHLpvNvR2jzv0YI/bE47Pdr7OD8BAIC/AAAAAN8MT796YT4+IIaRvp0lWr4AAAAAm4CEPtMBhj5zsoo+2iaTPiuLoD5VF7U+9SjVPjImBT9p1TY/AACAPxBbjz9OXFg9LwSWvX2csDzG8Ls9/P9/vz5DC7+0WOE+AAAAABzo3r7vdrG+zIocv8kW+D0AAIA/E7uqPm+rrD5ztrI+Tpu9Prvczj6DVuk+WlQJP3CQKz9JlWs/AACAP+UlrD521fy6bI+QvEEUj72Cf5A/BOJSP5w5ND8AAIC/AAAAANlmT78AAAAAPOsBv/j/fz8AAAAA9lCGPnTXhz6EmIw+jCqVPsu9oj74kbc++hPYPtH4Bj/mFDY/AACAP2tNKz74gRs8eyEMvQTcNzy9G1e/AAqKOYBlsTuJAIC/AAAAAKTcgD8MHKC90GBvP1UN7DgAAIA/3xhpPou+az6s/nM+I2+BPqs2jT59SZ8+pX67Piw86j7b0SA/AACAP24v9b7XoAW9GvYGPn1+N71JZ+M+AgCAP4Bwyb6P16W/AAAAABbjSD/kfVK+jt0rv/3/f78AAIA/TJ6vPt6csT4s1Lc+3QjDPr/I1D6PBPA+yUINP8V5MD8GIHI/AACAPzXP4D2EuMo9OaMePNvCWjyoCVK/AACAs7DT+T0AAIC/AAAAAAwukT8AAAAAjmFDPxl5ab8AAIA/iT9uPi/0cD78Ynk+XUuEPolVkD6azqI+VKO/PkZp7z6jXyQ/AACAP7z4gD40zne8YZtmPWWflLxShos/zZipvZzJVj+tAIA/AAAAAHKgVb8AABw1APQ6vZS9ej0AAIA/IAqCPi+Egz5+Hog+qmqQPkKPnT6nubE+rzLRPqOsAj9xbzM/AACAP/mGoT4kxgu99x4JvWigmzxi8Y4/AACAsnR6nD77/38/AACAP9YyQr/27fY9gGZfvv3/fz8AAAAAB3GLPmwGjT7s9ZE+rNuaPojzqD4rk74+u1LgPkofDD+caEA/AACAP6sNuD9MZ9g8FIEEPCVUWDujOFy/8Gp1v07QGL8AAAAAAACAPx5igD7Jpz++yIwivwAAgLEAAAAAjjCiPhUIpD61xak+DB+0PnuDxD4xqt0+mHUCPz77Ij83zF8/AACAPxoEQT3xaqu8aYQmPr29GLyjqgq//xKPvnCHm76jDYA/AAAAAIfadL4k9MI8qrEOv4DVf78AAIA/wvKQPimYkj6PuZc+Q/mgPpmfrz7aGcY+mi7pPuenET/UAUg/AACAP5SMBW51bXB5lIwFZHR5cGWUk5SMAmY0lImIh5RSlChLA4wBPJROTk5K/////0r/////SwB0lGJLEEsYhpSMAUOUdJRSlC4="
35
  },
36
  "_last_episode_starts": {
37
  ":type:": "<class 'numpy.ndarray'>",
@@ -41,17 +41,17 @@
41
  "_episode_num": 0,
42
  "use_sde": false,
43
  "sde_sample_freq": -1,
44
- "_current_progress_remaining": -1.4,
45
  "_stats_window_size": 100,
46
  "ep_info_buffer": {
47
  ":type:": "<class 'collections.deque'>",
48
- ":serialized:": "gAWV+AIAAAAAAACMC2NvbGxlY3Rpb25zlIwFZGVxdWWUk5QpS2SGlFKUKH2UKIwBcpRHwFtsxpcophGMAWyUSzCMAXSUR0AVHjrAxi5NdX2UKGgGR8BcyqAnUlRhaAdLM2gIR0AVOGetjkMkdX2UKGgGR8BdgXX7Lt/naAdLP2gIR0AVfcIqslsxdX2UKGgGR8BZnbzkIX0oaAdLQWgIR0AVk7fYSQHSdX2UKGgGR8BaxrhegL7XaAdLQ2gIR0AVp5HEuQIVdX2UKGgGR8BdnFO9FnZkaAdLRGgIR0AVqneizsyBdX2UKGgGR8BanrpRoAXEaAdLRmgIR0AVu9g4OtnxdX2UKGgGR8BZtIQSSNfgaAdLVGgIR0AWDZcs189fdX2UKGgGR8BZwIkqtozvaAdLN2gIR0AWfrJKaodddX2UKGgGR8Bb1nFglWwNaAdLPGgIR0AWtBJI1+AmdX2UKGgGR8BbrTv/io87aAdLNGgIR0AWzTkQwsXjdX2UKGgGR8BcvF5WzWwvaAdLemgIR0AW/guRLbpNdX2UKGgGR8Bb4Cr5qM3qaAdLPWgIR0AXLEFW4mTldX2UKGgGR8BbLQc94eLfaAdLQGgIR0AXNg1FYuCgdX2UKGgGR8BfLF5v99+gaAdLYmgIR0AYAre67NB4dX2UKGgGR8BcWyWmgrYoaAdLOGgIR0AYYXVLBbfQdX2UKGgGR8BaszMA3kxRaAdLRmgIR0AYdfLLZBcBdX2UKGgGR8BZn/va11GLaAdLXmgIR0AY2kFfReC1dX2UKGgGR8BfNT7ZWaMKaAdLeGgIR0AZBPVNHpbEdX2UKGgGR8BbjXRkVeruaAdLK2gIR0AZfzbvgFX8dX2UKGgGR8BaJRPj4pMIaAdLSGgIR0AZygSOBDohdX2UKGgGR8BcKyntOVPfaAdLOWgIR0AaMxzq8lHCdX2UKGgGR8Ba8uDe0ojOaAdLOGgIR0AaWasp5NXYdX2UKGgGR8BZG5JwsGxEaAdLQWgIR0AbDl+3H7xedWUu"
49
  },
50
  "ep_success_buffer": {
51
  ":type:": "<class 'collections.deque'>",
52
  ":serialized:": "gAWVIAAAAAAAAACMC2NvbGxlY3Rpb25zlIwFZGVxdWWUk5QpS2SGlFKULg=="
53
  },
54
- "_n_updates": 4,
55
  "observation_space": {
56
  ":type:": "<class 'gymnasium.spaces.box.Box'>",
57
  ":serialized:": "gAWVTAQAAAAAAACMFGd5bW5hc2l1bS5zcGFjZXMuYm94lIwDQm94lJOUKYGUfZQojAVkdHlwZZSMBW51bXB5lIwFZHR5cGWUk5SMAmY0lImIh5RSlChLA4wBPJROTk5K/////0r/////SwB0lGKMDWJvdW5kZWRfYmVsb3eUjBJudW1weS5jb3JlLm51bWVyaWOUjAtfZnJvbWJ1ZmZlcpSTlCiWGAAAAAAAAAABAQEBAQEBAQEBAQEBAQEBAQEBAQEBAQGUaAiMAmIxlImIh5RSlChLA4wBfJROTk5K/////0r/////SwB0lGJLGIWUjAFDlHSUUpSMDWJvdW5kZWRfYWJvdmWUaBEolhgAAAAAAAAAAQEBAQEBAQEBAQEBAQEBAQEBAQEBAQEBlGgVSxiFlGgZdJRSlIwGX3NoYXBllEsYhZSMA2xvd5RoESiWYAAAAAAAAADbD0nAAACgwAAAoMAAAKDA2w9JwAAAoMDbD0nAAACgwAAAAIDbD0nAAACgwNsPScAAAKDAAAAAgAAAgL8AAIC/AACAvwAAgL8AAIC/AACAvwAAgL8AAIC/AACAvwAAgL+UaAtLGIWUaBl0lFKUjARoaWdolGgRKJZgAAAAAAAAANsPSUAAAKBAAACgQAAAoEDbD0lAAACgQNsPSUAAAKBAAACgQNsPSUAAAKBA2w9JQAAAoEAAAKBAAACAPwAAgD8AAIA/AACAPwAAgD8AAIA/AACAPwAAgD8AAIA/AACAP5RoC0sYhZRoGXSUUpSMCGxvd19yZXBylIz+Wy0zLjE0MTU5MjcgLTUuICAgICAgICAtNS4gICAgICAgIC01LiAgICAgICAgLTMuMTQxNTkyNyAtNS4KIC0zLjE0MTU5MjcgLTUuICAgICAgICAtMC4gICAgICAgIC0zLjE0MTU5MjcgLTUuICAgICAgICAtMy4xNDE1OTI3CiAtNS4gICAgICAgIC0wLiAgICAgICAgLTEuICAgICAgICAtMS4gICAgICAgIC0xLiAgICAgICAgLTEuCiAtMS4gICAgICAgIC0xLiAgICAgICAgLTEuICAgICAgICAtMS4gICAgICAgIC0xLiAgICAgICAgLTEuICAgICAgIF2UjAloaWdoX3JlcHKUjOZbMy4xNDE1OTI3IDUuICAgICAgICA1LiAgICAgICAgNS4gICAgICAgIDMuMTQxNTkyNyA1LiAgICAgICAgMy4xNDE1OTI3CiA1LiAgICAgICAgNS4gICAgICAgIDMuMTQxNTkyNyA1LiAgICAgICAgMy4xNDE1OTI3IDUuICAgICAgICA1LgogMS4gICAgICAgIDEuICAgICAgICAxLiAgICAgICAgMS4gICAgICAgIDEuICAgICAgICAxLiAgICAgICAgMS4KIDEuICAgICAgICAxLiAgICAgICAgMS4gICAgICAgXZSMCl9ucF9yYW5kb22UTnViLg==",
@@ -83,7 +83,7 @@
83
  "_np_random": null
84
  },
85
  "n_envs": 16,
86
- "n_steps": 300,
87
  "gamma": 0.999,
88
  "gae_lambda": 0.98,
89
  "ent_coef": 0.01,
 
4
  ":serialized:": "gAWVOwAAAAAAAACMIXN0YWJsZV9iYXNlbGluZXMzLmNvbW1vbi5wb2xpY2llc5SMEUFjdG9yQ3JpdGljUG9saWN5lJOULg==",
5
  "__module__": "stable_baselines3.common.policies",
6
  "__doc__": "\n Policy class for actor-critic algorithms (has both policy and value prediction).\n Used by A2C, PPO and the likes.\n\n :param observation_space: Observation space\n :param action_space: Action space\n :param lr_schedule: Learning rate schedule (could be constant)\n :param net_arch: The specification of the policy and value networks.\n :param activation_fn: Activation function\n :param ortho_init: Whether to use or not orthogonal initialization\n :param use_sde: Whether to use State Dependent Exploration or not\n :param log_std_init: Initial value for the log standard deviation\n :param full_std: Whether to use (n_features x n_actions) parameters\n for the std instead of only (n_features,) when using gSDE\n :param use_expln: Use ``expln()`` function instead of ``exp()`` to ensure\n a positive standard deviation (cf paper). It allows to keep variance\n above zero and prevent it from growing too fast. In practice, ``exp()`` is usually enough.\n :param squash_output: Whether to squash the output using a tanh function,\n this allows to ensure boundaries when using gSDE.\n :param features_extractor_class: Features extractor to use.\n :param features_extractor_kwargs: Keyword arguments\n to pass to the features extractor.\n :param share_features_extractor: If True, the features extractor is shared between the policy and value networks.\n :param normalize_images: Whether to normalize images or not,\n dividing by 255.0 (True by default)\n :param optimizer_class: The optimizer to use,\n ``th.optim.Adam`` by default\n :param optimizer_kwargs: Additional keyword arguments,\n excluding the learning rate, to pass to the optimizer\n ",
7
+ "__init__": "<function ActorCriticPolicy.__init__ at 0x7e38025c36d0>",
8
+ "_get_constructor_parameters": "<function ActorCriticPolicy._get_constructor_parameters at 0x7e38025c3760>",
9
+ "reset_noise": "<function ActorCriticPolicy.reset_noise at 0x7e38025c37f0>",
10
+ "_build_mlp_extractor": "<function ActorCriticPolicy._build_mlp_extractor at 0x7e38025c3880>",
11
+ "_build": "<function ActorCriticPolicy._build at 0x7e38025c3910>",
12
+ "forward": "<function ActorCriticPolicy.forward at 0x7e38025c39a0>",
13
+ "extract_features": "<function ActorCriticPolicy.extract_features at 0x7e38025c3a30>",
14
+ "_get_action_dist_from_latent": "<function ActorCriticPolicy._get_action_dist_from_latent at 0x7e38025c3ac0>",
15
+ "_predict": "<function ActorCriticPolicy._predict at 0x7e38025c3b50>",
16
+ "evaluate_actions": "<function ActorCriticPolicy.evaluate_actions at 0x7e38025c3be0>",
17
+ "get_distribution": "<function ActorCriticPolicy.get_distribution at 0x7e38025c3c70>",
18
+ "predict_values": "<function ActorCriticPolicy.predict_values at 0x7e38025c3d00>",
19
  "__abstractmethods__": "frozenset()",
20
+ "_abc_impl": "<_abc._abc_data object at 0x7e380255dec0>"
21
  },
22
  "verbose": 1,
23
  "policy_kwargs": {},
24
+ "num_timesteps": 104000,
25
+ "_total_timesteps": 100000,
26
  "_num_timesteps_at_start": 0,
27
  "seed": null,
28
  "action_noise": null,
29
+ "start_time": 1714106227409224375,
30
  "learning_rate": 0.0003,
31
  "tensorboard_log": null,
32
  "_last_obs": {
33
  ":type:": "<class 'numpy.ndarray'>",
34
+ ":serialized:": "gAWVdQYAAAAAAACMEm51bXB5LmNvcmUubnVtZXJpY5SMC19mcm9tYnVmZmVylJOUKJYABgAAAAAAAMIJBD7QzQA8/lIjPIr3Ozwlf0S/ZFonPyCr0z1ZNBG/AAAAAIDelD///38/dDIuPzXnv78AAIA/X6ltPkHdbz4rsHc+73WDPhLvjz6efqE+iyy8Pm8l6z78Tx8/AACAP+cNzj1Xxws9sPoiPdpdXzyrhJA/9OLwPsRlSj/7/3+/AACAPyBUKr/OdBS+mM/CvjzweL8AAAAAKQKKPimAiz7+/Y8+c7CYPpxKqD6B6L0+DtvePrGeCz9Vazc/AACAPwFr3j06IKk7hADePFKH/Dyq/FK/AAAAM0BfX70FAIA/AAAAAEVzjT8AAAAA/OdaP58z5b0AAIA/8apnPnVMaj6if3I+8aOAPvxYjD5uT54+TVi6PnTM6D4BbCc/AACAP02wXL9IhsC91PaauwWHCb4P5uQ+udGMPiKjKD/9/38/AAAAAMFbET6ADOQ7bH4uPyVWer8AAAAAzbvdPnBA4D6aGeg+lD/2PlFUBj+UhRc/sloyP+fQXj8AAIA/AACAP1FCXz0Nkq485H3nPGFe6Dwg4hq/XCtbvVg4Nr5W0oC/AAAAAB1ekD8ANH85KlxbP9Isgb4AAIA/Z8l/PnDegT7liYY+67SOPptsmj46B6w+/X3KPndk8z7MRho/ErN3P75zTD5loAS9am7ZO2ZovTyfRJE/AGYqOzRcRT+5CIA/AAAAAG8NSr++ZpE+MLz6vnXck74AAIA/BEODPlHxhT6T8Ys+j3yUPin9oT6tuLY+0qDUPjce/z4fjys/AACAP+T92z2vjgG8DkKVPOofAj2DU1W/oI7QuqhGcT6zH+o9AAAAABjijD8AJJo4SEZsP0t0VjsAAIA/qZZsPnxGbz4/pnc+dm6DPnF5jz7zYJ8+NBO3Plqq3z4FtSI/AACAP5Lp1D0bL4A9de3yutODfrxG91K/SDwAPSxbCD4AAIC/AAAAALa2jj8AAAAAvCtOP/gBB78AAIA/Z9ptPueNcD7cwXc+I7KCPq46jz6HOaM+15nAPhHL8T4AEC0/AACAP/6rFj6e/IC8sJELPt+B87xRz1G/YGc8OwBOfL6FbIC/AAAAAKREkT8AEJy3gG9NPw0RgD8AAAAAJvJrPhygbj4M+nY+0POCPiIWjj7kJJ8+JYW5Pk7Z7j5UDSU/AACAP1Wxvj3kamC87DYLPfSuMD0tvVG/ANSeuITBaz7bEzI+AACAP5dMjj8AgF42QlxbP7HS+zwAAIA/KZ1qPj5HbT4dlXU+v0aCPuYhjj7TUqA++La8PkLh7T5h0SY/AACAP4L+gj2d7KI7+D1mvHY8Nj3AbDy/OEsoPkDDcL3dt3+/AAAAAB26jT/M2qm+4jdZPzC6qT4AAIA/lw9sPjfrbj6ShXc+Hn+DPh7Ljz6PZaM+sQXEPtT0/j6Fxi0/AACAP7W/Kj5I7YQ9DJsTPYU44byRuo8/eLYMvvafTz8AAIC/AAAAALl4UL8e5oi/WIm0PcmcIj8AAIA/aUKFPtXFhj5RfYs+Ff6TPnsqoT7wrrU+DNTYPgRbCT/hVTk/AACAP210S74hahy9tmTAvZfGvb2Gd4++L9TRPgtWbz8AAAAAAAAAAG57Jj9HQaQ/qJ1GPwAAgL8AAAAA9pDoPhg16z5pcPM+qyMBP1bkDD+e7B4/UxE7P5mzaT8AAIA/AACAPzEroz07oOq82P3EPHj3Ar2x41K/AABAM+g2dz4CAIA/AAAAAD1wkD8w+Ps+Qo5sPwAAAAAAAIA/qRdtPvPIbz5HLXg+EqeDPkqijz5k76A+r8O5PlC44T6cdyA/AACAP8VD/T3m9fU7w6yYvEHqCLk6OE6/ZnWXPaT9jb4RCxa+AAAAANhRiD/WPTm/CMR8PwAAgD8AAIA/O9BnPjrnaD56O24+fk15Pjkihj6HI5U+lIuuPnfj2T4j0Rg/AACAP8gmvD2j9Xm7OqM7PSmmvb0Q0U6/AADAsuCUkj5QuRS+AACAP4wZkD8AAAAAUhxCP/z/f78AAAAAS4R5PrRZfD5Ol4I+No2KPikplz7mgao+uLPIPnEL+T5Ebiw/AACAP5SMBW51bXB5lIwFZHR5cGWUk5SMAmY0lImIh5RSlChLA4wBPJROTk5K/////0r/////SwB0lGJLEEsYhpSMAUOUdJRSlC4="
35
  },
36
  "_last_episode_starts": {
37
  ":type:": "<class 'numpy.ndarray'>",
 
41
  "_episode_num": 0,
42
  "use_sde": false,
43
  "sde_sample_freq": -1,
44
+ "_current_progress_remaining": -0.040000000000000036,
45
  "_stats_window_size": 100,
46
  "ep_info_buffer": {
47
  ":type:": "<class 'collections.deque'>",
48
+ ":serialized:": "gAWVAQwAAAAAAACMC2NvbGxlY3Rpb25zlIwFZGVxdWWUk5QpS2SGlFKUKH2UKIwBcpRHwF24MBp5/sqMAWyUS1iMAXSUR0Btyv7+DOC5dX2UKGgGR8BaevKdQO4HaAdLOWgIR0Bt24V/MGHIdX2UKGgGR8Ba06MNtqHoaAdLS2gIR0BuM2gOBlMAdX2UKGgGR8BcJc4T9KmLaAdLR2gIR0BuTNjEvTPTdX2UKGgGR8BhJ5NwiqyXaAdLo2gIR0Buc/lOoHcDdX2UKGgGR8Bcl9L127nQaAdLNGgIR0Bufvcxj8UFdX2UKGgGR8BbUWpVCHARaAdLPmgIR0BujQAEMb3odX2UKGgGR8BdfvRqoIfKaAdLV2gIR0BuoSynk1dgdX2UKGgGR8BZd4TfzjFRaAdNQAZoCEdAbtwzMzMzM3V9lChoBkfAX1hOIqLCN2gHS1ZoCEdAbt3QcghbGHV9lChoBkfAWy3yd4FA3WgHSzhoCEdAbupeVLSNO3V9lChoBkfAWYU5R0lqrWgHS0FoCEdAbusIxgy/K3V9lChoBkfAXBYG+sYEXGgHS0doCEdAbvqBU70WdnV9lChoBkfAXDxZ+x4Y8GgHS1BoCEdAbvwP7N0NjXV9lChoBkfAWcVMURFqjGgHTUAGaAhHQG8CvwEyLyd1fZQoaAZHwFnrKq4pc5doB01ABmgIR0BvApgogFHKdX2UKGgGR8Bb2C+cpb2UaAdNQAZoCEdAbwK2gFotc3V9lChoBkfAWMz7ALy+YmgHTUAGaAhHQG8Cwpe/pMZ1fZQoaAZHwFtQXeWOZLJoB01ABmgIR0BvAtPxhDw6dX2UKGgGR8BaHWsA/9pAaAdLN2gIR0BvCDHyVfNSdX2UKGgGR8BXUlZDArQPaAdNQAZoCEdAbxOSpR4yGnV9lChoBkfAWuNN7BwdbWgHS0doCEdAbxNVIZqEe3V9lChoBkfAWNWOPvKEFmgHTUAGaAhHQG8Teb/ffoB1fZQoaAZHwFlT3RG+bmVoB0tIaAhHQG8Ub961LJ11fZQoaAZHwF5LImw7kn1oB0tJaAhHQG8URe1KGtZ1fZQoaAZHwFn5uMdcSoRoB0tOaAhHQG8V/zJ6po91fZQoaAZHwFv4pY9xIatoB0thaAhHQG8aE6DGtIV1fZQoaAZHwFyR/LDAJsxoB0uOaAhHQG8cFev6j351fZQoaAZHwFromfGuLaVoB0tkaAhHQG8gZc1O0sx1fZQoaAZHwFy3Btk4FRpoB0s3aAhHQG8mGSpzcRF1fZQoaAZHwF4d8eS0Sh9oB0tzaAhHQG8t62WpqAV1fZQoaAZHwFn+KzRhMJxoB01ABmgIR0BvMTbi6xxDdX2UKGgGR8BbctugpSaWaAdNQAZoCEdAbzKenyd4FHV9lChoBkfAWWphDw6QvGgHSz9oCEdAbzVND+irUHV9lChoBkfAW4K3WnTAnGgHS1hoCEdAb0KtUXHim3V9lChoBkfAXCxgWrOqvWgHS05oCEdAb0Pc+qzZ6HV9lChoBkfAWaBkH2RJVmgHTUAGaAhHQG9FqTr3TNN1fZQoaAZHwGHAtQbdadNoB0v0aAhHQG93yXUpd8l1fZQoaAZHwFi9QJ5VwP1oB01ABmgIR0BveBzHS4OMdX2UKGgGR8BcAvsRg7YDaAdLNWgIR0Bvfa5LAYYSdX2UKGgGR8BcknF98Z1naAdLS2gIR0BvgCgZjx0/dX2UKGgGR8BZIBMWXTmXaAdLWGgIR0BvhApjMFEBdX2UKGgGR8BcmP7WNFSbaAdLUmgIR0BviwYLsruqdX2UKGgGR8BcorhvR7Z4aAdLMWgIR0Bvi5YmsvIwdX2UKGgGR8BYzWoJiRW+aAdNQAZoCEdAb5E8EFGG23V9lChoBkfAWUpK02LpA2gHS1loCEdAb5NaIvalDXV9lChoBkfAWfnaTOgQH2gHS0BoCEdAb50jcEeQuHV9lChoBkfAWcCtJWeYlmgHS09oCEdAb6MREF4cFXV9lChoBkfAWNHlp48lomgHTUAGaAhHQG+kTxXnyNJ1fZQoaAZHwFoYRChN/ONoB0t+aAhHQG+o/p2U0N11fZQoaAZHwFsGBi1AqutoB01ABmgIR0Bvsz850bLmdX2UKGgGR8BcWZ8jRlYmaAdLOWgIR0BvxkebNKRMdX2UKGgGR8BeVdUKiO/+aAdLZ2gIR0BvzQRGtp22dX2UKGgGR8Be72g3974SaAdLe2gIR0Bv0CrtE5QxdX2UKGgGR8Bb+USqU/wBaAdLOWgIR0Bv4kZJkGzKdX2UKGgGR8BZS0AggX/HaAdLWGgIR0Bv5zWPLgXNdX2UKGgGR8BbdoiX6ZYxaAdLU2gIR0Bv7acslLOBdX2UKGgGR8BbKbhaTwDvaAdLNmgIR0Bv+atHQQcxdX2UKGgGR8BaYZzLfUF0aAdLUmgIR0BwBM4PwuuidX2UKGgGR8Bb2OLR8c+8aAdNQAZoCEdAcJSvEjxCpnV9lChoBkfAV/n/xUedTmgHTUAGaAhHQHCU8UEgW8B1fZQoaAZHwFiJJF9a2WpoB01ABmgIR0BwlN6AvtdBdX2UKGgGR8BZyZKODJ2daAdNQAZoCEdAcJWmXgLqlnV9lChoBkfAWizJvHcUNGgHTUAGaAhHQHCY1LvkRz11fZQoaAZHwFkaCFsYVItoB01ABmgIR0Bwmy+fywwCdX2UKGgGR8BaSLyUcGTtaAdLRWgIR0BwnQu8K5TZdX2UKGgGR8Bal8kdFOO9aAdLL2gIR0BwnhQsPJ7tdX2UKGgGR8BfY2yHEdeZaAdLU2gIR0BwnwyN4qwydX2UKGgGR8BZQ8PBi1AraAdLLWgIR0BwofZ+QU5/dX2UKGgGR8Bbc0n5SFXaaAdNQAZoCEdAcLtbmEGqxXV9lChoBkfAWidowmE5AGgHSy9oCEdAcLwajN6gNHV9lChoBkfAWGRWJaaCtmgHTUAGaAhHQHC9VHSWqtJ1fZQoaAZHwFmA287IT5BoB0tdaAhHQHC90xASnLt1fZQoaAZHwFlPKkVN5+poB0tWaAhHQHDBSprDZUV1fZQoaAZHwFyuXhfjS5RoB0tIaAhHQHDFTAeq7yx1fZQoaAZHwFlm8scyWRloB0s4aAhHQHDMDch1Tzd1fZQoaAZHwFnZMqz7di5oB0tmaAhHQHDOqqXF98Z1fZQoaAZHwFgRsMRYigVoB01ABmgIR0Bw0DiT+vQodX2UKGgGR8BfNTeTFERbaAdLZWgIR0Bw0KBEroW6dX2UKGgGR8BaaAam4y44aAdLLGgIR0Bw2GafBeoldX2UKGgGR8BW/T101ZTyaAdNQAZoCEdAcOKNlRP423V9lChoBkfAWv2RLbpNbmgHTUAGaAhHQHDkDGYKIBR1fZQoaAZHwF0RCaqjrRloB01ABmgIR0Bw6f8/D+BIdX2UKGgGR8BXqFqagElmaAdNQAZoCEdAcO1PdVNpNHV9lChoBkfAWgIhGH58B2gHSzloCEdAcO7a1Cw8n3V9lChoBkfAXHzXiBGx2WgHSz9oCEdAcPNqqfe1r3V9lChoBkfAWyzbi6xxDWgHSzBoCEdAcPSxYJVsDXV9lChoBkfAXNqdvsJID2gHS0loCEdAcPchUBGQS3V9lChoBkfAWcLD50r9VGgHS1hoCEdAcP98ejmCAnV9lChoBkfAXSUqmTC+DmgHS0xoCEdAcQBFXq7iAHV9lChoBkfAVyVfgJkXlGgHTUAGaAhHQHEDlcY64lR1fZQoaAZHwFanqYJE6T5oB01ABmgIR0BxH1C2MKkVdX2UKGgGR8BfBPmcOLBLaAdLb2gIR0BxI7bJwKjSdX2UKGgGR8BaS91hb4ahaAdNQAZoCEdAcSQvLowEhnV9lChoBkfAXVCF+NLlFWgHS0BoCEdAcSYDGLk0anV9lChoBkfAWjyHvc8DCGgHS0JoCEdAcSrBacI7eXV9lChoBkfAWuFhG6PKdWgHS1toCEdAcTUJu2qkunV9lChoBkfAWzYk8ifQKWgHSy5oCEdAcTqz90ihWnV9lChoBkfAWC825xzaK2gHTUAGaAhHQHGvNWQwK0F1fZQoaAZHwFm8e4kNWlxoB01ABmgIR0Bxr43WFvhqdWUu"
49
  },
50
  "ep_success_buffer": {
51
  ":type:": "<class 'collections.deque'>",
52
  ":serialized:": "gAWVIAAAAAAAAACMC2NvbGxlY3Rpb25zlIwFZGVxdWWUk5QpS2SGlFKULg=="
53
  },
54
+ "_n_updates": 52,
55
  "observation_space": {
56
  ":type:": "<class 'gymnasium.spaces.box.Box'>",
57
  ":serialized:": "gAWVTAQAAAAAAACMFGd5bW5hc2l1bS5zcGFjZXMuYm94lIwDQm94lJOUKYGUfZQojAVkdHlwZZSMBW51bXB5lIwFZHR5cGWUk5SMAmY0lImIh5RSlChLA4wBPJROTk5K/////0r/////SwB0lGKMDWJvdW5kZWRfYmVsb3eUjBJudW1weS5jb3JlLm51bWVyaWOUjAtfZnJvbWJ1ZmZlcpSTlCiWGAAAAAAAAAABAQEBAQEBAQEBAQEBAQEBAQEBAQEBAQGUaAiMAmIxlImIh5RSlChLA4wBfJROTk5K/////0r/////SwB0lGJLGIWUjAFDlHSUUpSMDWJvdW5kZWRfYWJvdmWUaBEolhgAAAAAAAAAAQEBAQEBAQEBAQEBAQEBAQEBAQEBAQEBlGgVSxiFlGgZdJRSlIwGX3NoYXBllEsYhZSMA2xvd5RoESiWYAAAAAAAAADbD0nAAACgwAAAoMAAAKDA2w9JwAAAoMDbD0nAAACgwAAAAIDbD0nAAACgwNsPScAAAKDAAAAAgAAAgL8AAIC/AACAvwAAgL8AAIC/AACAvwAAgL8AAIC/AACAvwAAgL+UaAtLGIWUaBl0lFKUjARoaWdolGgRKJZgAAAAAAAAANsPSUAAAKBAAACgQAAAoEDbD0lAAACgQNsPSUAAAKBAAACgQNsPSUAAAKBA2w9JQAAAoEAAAKBAAACAPwAAgD8AAIA/AACAPwAAgD8AAIA/AACAPwAAgD8AAIA/AACAP5RoC0sYhZRoGXSUUpSMCGxvd19yZXBylIz+Wy0zLjE0MTU5MjcgLTUuICAgICAgICAtNS4gICAgICAgIC01LiAgICAgICAgLTMuMTQxNTkyNyAtNS4KIC0zLjE0MTU5MjcgLTUuICAgICAgICAtMC4gICAgICAgIC0zLjE0MTU5MjcgLTUuICAgICAgICAtMy4xNDE1OTI3CiAtNS4gICAgICAgIC0wLiAgICAgICAgLTEuICAgICAgICAtMS4gICAgICAgIC0xLiAgICAgICAgLTEuCiAtMS4gICAgICAgIC0xLiAgICAgICAgLTEuICAgICAgICAtMS4gICAgICAgIC0xLiAgICAgICAgLTEuICAgICAgIF2UjAloaWdoX3JlcHKUjOZbMy4xNDE1OTI3IDUuICAgICAgICA1LiAgICAgICAgNS4gICAgICAgIDMuMTQxNTkyNyA1LiAgICAgICAgMy4xNDE1OTI3CiA1LiAgICAgICAgNS4gICAgICAgIDMuMTQxNTkyNyA1LiAgICAgICAgMy4xNDE1OTI3IDUuICAgICAgICA1LgogMS4gICAgICAgIDEuICAgICAgICAxLiAgICAgICAgMS4gICAgICAgIDEuICAgICAgICAxLiAgICAgICAgMS4KIDEuICAgICAgICAxLiAgICAgICAgMS4gICAgICAgXZSMCl9ucF9yYW5kb22UTnViLg==",
 
83
  "_np_random": null
84
  },
85
  "n_envs": 16,
86
+ "n_steps": 500,
87
  "gamma": 0.999,
88
  "gae_lambda": 0.98,
89
  "ent_coef": 0.01,
BipedalWalker-v3/policy.optimizer.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:8a7e8bc42784ccbfbcd118cea6311c7f9413a5d53c79ef8a9e01efad2594f102
3
  size 105121
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:fe480b1affd3f12c7bdbfa38d90e0efaa46541ee8bdb46a0ccd1a14548f3760f
3
  size 105121
BipedalWalker-v3/policy.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:5c895e264373f2e0d208fde78d2d1d6fff3d16e098516f71b641048a8b8ced28
3
  size 52143
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2cd9fbe0b5642c693800623b3c04934011be739d37d15f644055770befea5a76
3
  size 52143
README.md CHANGED
@@ -16,7 +16,7 @@ model-index:
16
  type: BipedalWalker-v3
17
  metrics:
18
  - type: mean_reward
19
- value: -92.28 +/- 0.07
20
  name: mean_reward
21
  verified: false
22
  ---
 
16
  type: BipedalWalker-v3
17
  metrics:
18
  - type: mean_reward
19
+ value: -56.38 +/- 0.22
20
  name: mean_reward
21
  verified: false
22
  ---
config.json CHANGED
@@ -1 +1 @@
1
- {"policy_class": {":type:": "<class 'abc.ABCMeta'>", ":serialized:": "gAWVOwAAAAAAAACMIXN0YWJsZV9iYXNlbGluZXMzLmNvbW1vbi5wb2xpY2llc5SMEUFjdG9yQ3JpdGljUG9saWN5lJOULg==", "__module__": "stable_baselines3.common.policies", "__doc__": "\n Policy class for actor-critic algorithms (has both policy and value prediction).\n Used by A2C, PPO and the likes.\n\n :param observation_space: Observation space\n :param action_space: Action space\n :param lr_schedule: Learning rate schedule (could be constant)\n :param net_arch: The specification of the policy and value networks.\n :param activation_fn: Activation function\n :param ortho_init: Whether to use or not orthogonal initialization\n :param use_sde: Whether to use State Dependent Exploration or not\n :param log_std_init: Initial value for the log standard deviation\n :param full_std: Whether to use (n_features x n_actions) parameters\n for the std instead of only (n_features,) when using gSDE\n :param use_expln: Use ``expln()`` function instead of ``exp()`` to ensure\n a positive standard deviation (cf paper). It allows to keep variance\n above zero and prevent it from growing too fast. In practice, ``exp()`` is usually enough.\n :param squash_output: Whether to squash the output using a tanh function,\n this allows to ensure boundaries when using gSDE.\n :param features_extractor_class: Features extractor to use.\n :param features_extractor_kwargs: Keyword arguments\n to pass to the features extractor.\n :param share_features_extractor: If True, the features extractor is shared between the policy and value networks.\n :param normalize_images: Whether to normalize images or not,\n dividing by 255.0 (True by default)\n :param optimizer_class: The optimizer to use,\n ``th.optim.Adam`` by default\n :param optimizer_kwargs: Additional keyword arguments,\n excluding the learning rate, to pass to the optimizer\n ", "__init__": "<function ActorCriticPolicy.__init__ at 0x783b7dbb27a0>", "_get_constructor_parameters": "<function ActorCriticPolicy._get_constructor_parameters at 0x783b7dbb2830>", "reset_noise": "<function ActorCriticPolicy.reset_noise at 0x783b7dbb28c0>", "_build_mlp_extractor": "<function ActorCriticPolicy._build_mlp_extractor at 0x783b7dbb2950>", "_build": "<function ActorCriticPolicy._build at 0x783b7dbb29e0>", "forward": "<function ActorCriticPolicy.forward at 0x783b7dbb2a70>", "extract_features": "<function ActorCriticPolicy.extract_features at 0x783b7dbb2b00>", "_get_action_dist_from_latent": "<function ActorCriticPolicy._get_action_dist_from_latent at 0x783b7dbb2b90>", "_predict": "<function ActorCriticPolicy._predict at 0x783b7dbb2c20>", "evaluate_actions": "<function ActorCriticPolicy.evaluate_actions at 0x783b7dbb2cb0>", "get_distribution": "<function ActorCriticPolicy.get_distribution at 0x783b7dbb2d40>", "predict_values": "<function ActorCriticPolicy.predict_values at 0x783b7dbb2dd0>", "__abstractmethods__": "frozenset()", "_abc_impl": "<_abc._abc_data object at 0x783b7db57600>"}, "verbose": 1, "policy_kwargs": {}, "num_timesteps": 4800, "_total_timesteps": 2000, "_num_timesteps_at_start": 0, "seed": null, "action_noise": null, "start_time": 1714022747756011012, "learning_rate": 0.0003, "tensorboard_log": null, "_last_obs": {":type:": "<class 'numpy.ndarray'>", ":serialized:": "gAWVdQYAAAAAAACMEm51bXB5LmNvcmUubnVtZXJpY5SMC19mcm9tYnVmZmVylJOUKJYABgAAAAAAAJfx1T0yGOw6RPSNvXNMwrztv40/yB5tP6YuTD/9/3+/AACAPyio775VwQ+/LE6svv3/fz8AAAAAuySQPsvHkT7m4ZY+dRSgPvilrj5GAMU+KePnPt7YED+K5UY/AACAP9pWkj6E//i8kj8nPUEONbwRhVa/QDIdOwA1X764fn8/AACAPxpflT88IYA/Ui4yP1XXf78AAAAAOR58PjL7fj7W84M+/f6LPpe8mD73SKw+XsvKPktZ/T5a8S0/AACAP/2niT8WpqC9L8NePRYJ1Dyr42c+HrGnPvB/Cb4A+2W8AACAP5sRSb82WeU+YNgiv8W84rsAAIA/SFybPvUfnT6zn6I+fImsPjk9vD7TVNQ+su75PnAeHD/bX1Y/AACAP+KZij5DS2w9jmmHvKi3KjzfL4U/Hby3vljLLD+UYE+9AACAP+ymV7+cSQO/+m0mvwEAgL8AAAAAmI2DPg4MhT4UtIk++RiSPrpknz41y7M+BKLTPv8xBD8XhjU/AACAPxHApD/Akd492si4PCgoC7od4le+4MLKvSihMr/9/3+/AAAAAL3bV78AAIC/TIkiv5Xjvj4AAAAAox6oPmgHqj7D+q8+97S6PtWyyz71xOU+rzoHP73wKD+pVWg/AACAP4RRwT4Pvow9Vrb9Ozov7jrDxD0+gDVeuzAVOT77/38/AAAAANuAEr9QpVu/HVZvPwAAAAAAAAAAd2DyPh4h9T5Vtf0+QZYGP9jVEj/boCU/fPVCP12Pcz8AAIA/AACAPzs3kD42UZW7lHLpvNvR2jzv0YI/bE47Pdr7OD8BAIC/AAAAAN8MT796YT4+IIaRvp0lWr4AAAAAm4CEPtMBhj5zsoo+2iaTPiuLoD5VF7U+9SjVPjImBT9p1TY/AACAPxBbjz9OXFg9LwSWvX2csDzG8Ls9/P9/vz5DC7+0WOE+AAAAABzo3r7vdrG+zIocv8kW+D0AAIA/E7uqPm+rrD5ztrI+Tpu9Prvczj6DVuk+WlQJP3CQKz9JlWs/AACAP+UlrD521fy6bI+QvEEUj72Cf5A/BOJSP5w5ND8AAIC/AAAAANlmT78AAAAAPOsBv/j/fz8AAAAA9lCGPnTXhz6EmIw+jCqVPsu9oj74kbc++hPYPtH4Bj/mFDY/AACAP2tNKz74gRs8eyEMvQTcNzy9G1e/AAqKOYBlsTuJAIC/AAAAAKTcgD8MHKC90GBvP1UN7DgAAIA/3xhpPou+az6s/nM+I2+BPqs2jT59SZ8+pX67Piw86j7b0SA/AACAP24v9b7XoAW9GvYGPn1+N71JZ+M+AgCAP4Bwyb6P16W/AAAAABbjSD/kfVK+jt0rv/3/f78AAIA/TJ6vPt6csT4s1Lc+3QjDPr/I1D6PBPA+yUINP8V5MD8GIHI/AACAPzXP4D2EuMo9OaMePNvCWjyoCVK/AACAs7DT+T0AAIC/AAAAAAwukT8AAAAAjmFDPxl5ab8AAIA/iT9uPi/0cD78Ynk+XUuEPolVkD6azqI+VKO/PkZp7z6jXyQ/AACAP7z4gD40zne8YZtmPWWflLxShos/zZipvZzJVj+tAIA/AAAAAHKgVb8AABw1APQ6vZS9ej0AAIA/IAqCPi+Egz5+Hog+qmqQPkKPnT6nubE+rzLRPqOsAj9xbzM/AACAP/mGoT4kxgu99x4JvWigmzxi8Y4/AACAsnR6nD77/38/AACAP9YyQr/27fY9gGZfvv3/fz8AAAAAB3GLPmwGjT7s9ZE+rNuaPojzqD4rk74+u1LgPkofDD+caEA/AACAP6sNuD9MZ9g8FIEEPCVUWDujOFy/8Gp1v07QGL8AAAAAAACAPx5igD7Jpz++yIwivwAAgLEAAAAAjjCiPhUIpD61xak+DB+0PnuDxD4xqt0+mHUCPz77Ij83zF8/AACAPxoEQT3xaqu8aYQmPr29GLyjqgq//xKPvnCHm76jDYA/AAAAAIfadL4k9MI8qrEOv4DVf78AAIA/wvKQPimYkj6PuZc+Q/mgPpmfrz7aGcY+mi7pPuenET/UAUg/AACAP5SMBW51bXB5lIwFZHR5cGWUk5SMAmY0lImIh5RSlChLA4wBPJROTk5K/////0r/////SwB0lGJLEEsYhpSMAUOUdJRSlC4="}, "_last_episode_starts": {":type:": "<class 'numpy.ndarray'>", ":serialized:": "gAWVgwAAAAAAAACMEm51bXB5LmNvcmUubnVtZXJpY5SMC19mcm9tYnVmZmVylJOUKJYQAAAAAAAAAAAAAAAAAAAAAAAAAAAAAACUjAVudW1weZSMBWR0eXBllJOUjAJiMZSJiIeUUpQoSwOMAXyUTk5OSv////9K/////0sAdJRiSxCFlIwBQ5R0lFKULg=="}, "_last_original_obs": null, "_episode_num": 0, "use_sde": false, "sde_sample_freq": -1, "_current_progress_remaining": -1.4, "_stats_window_size": 100, "ep_info_buffer": {":type:": "<class 'collections.deque'>", ":serialized:": "gAWV+AIAAAAAAACMC2NvbGxlY3Rpb25zlIwFZGVxdWWUk5QpS2SGlFKUKH2UKIwBcpRHwFtsxpcophGMAWyUSzCMAXSUR0AVHjrAxi5NdX2UKGgGR8BcyqAnUlRhaAdLM2gIR0AVOGetjkMkdX2UKGgGR8BdgXX7Lt/naAdLP2gIR0AVfcIqslsxdX2UKGgGR8BZnbzkIX0oaAdLQWgIR0AVk7fYSQHSdX2UKGgGR8BaxrhegL7XaAdLQ2gIR0AVp5HEuQIVdX2UKGgGR8BdnFO9FnZkaAdLRGgIR0AVqneizsyBdX2UKGgGR8BanrpRoAXEaAdLRmgIR0AVu9g4OtnxdX2UKGgGR8BZtIQSSNfgaAdLVGgIR0AWDZcs189fdX2UKGgGR8BZwIkqtozvaAdLN2gIR0AWfrJKaodddX2UKGgGR8Bb1nFglWwNaAdLPGgIR0AWtBJI1+AmdX2UKGgGR8BbrTv/io87aAdLNGgIR0AWzTkQwsXjdX2UKGgGR8BcvF5WzWwvaAdLemgIR0AW/guRLbpNdX2UKGgGR8Bb4Cr5qM3qaAdLPWgIR0AXLEFW4mTldX2UKGgGR8BbLQc94eLfaAdLQGgIR0AXNg1FYuCgdX2UKGgGR8BfLF5v99+gaAdLYmgIR0AYAre67NB4dX2UKGgGR8BcWyWmgrYoaAdLOGgIR0AYYXVLBbfQdX2UKGgGR8BaszMA3kxRaAdLRmgIR0AYdfLLZBcBdX2UKGgGR8BZn/va11GLaAdLXmgIR0AY2kFfReC1dX2UKGgGR8BfNT7ZWaMKaAdLeGgIR0AZBPVNHpbEdX2UKGgGR8BbjXRkVeruaAdLK2gIR0AZfzbvgFX8dX2UKGgGR8BaJRPj4pMIaAdLSGgIR0AZygSOBDohdX2UKGgGR8BcKyntOVPfaAdLOWgIR0AaMxzq8lHCdX2UKGgGR8Ba8uDe0ojOaAdLOGgIR0AaWasp5NXYdX2UKGgGR8BZG5JwsGxEaAdLQWgIR0AbDl+3H7xedWUu"}, "ep_success_buffer": {":type:": "<class 'collections.deque'>", ":serialized:": "gAWVIAAAAAAAAACMC2NvbGxlY3Rpb25zlIwFZGVxdWWUk5QpS2SGlFKULg=="}, "_n_updates": 4, "observation_space": {":type:": "<class 'gymnasium.spaces.box.Box'>", ":serialized:": "gAWVTAQAAAAAAACMFGd5bW5hc2l1bS5zcGFjZXMuYm94lIwDQm94lJOUKYGUfZQojAVkdHlwZZSMBW51bXB5lIwFZHR5cGWUk5SMAmY0lImIh5RSlChLA4wBPJROTk5K/////0r/////SwB0lGKMDWJvdW5kZWRfYmVsb3eUjBJudW1weS5jb3JlLm51bWVyaWOUjAtfZnJvbWJ1ZmZlcpSTlCiWGAAAAAAAAAABAQEBAQEBAQEBAQEBAQEBAQEBAQEBAQGUaAiMAmIxlImIh5RSlChLA4wBfJROTk5K/////0r/////SwB0lGJLGIWUjAFDlHSUUpSMDWJvdW5kZWRfYWJvdmWUaBEolhgAAAAAAAAAAQEBAQEBAQEBAQEBAQEBAQEBAQEBAQEBlGgVSxiFlGgZdJRSlIwGX3NoYXBllEsYhZSMA2xvd5RoESiWYAAAAAAAAADbD0nAAACgwAAAoMAAAKDA2w9JwAAAoMDbD0nAAACgwAAAAIDbD0nAAACgwNsPScAAAKDAAAAAgAAAgL8AAIC/AACAvwAAgL8AAIC/AACAvwAAgL8AAIC/AACAvwAAgL+UaAtLGIWUaBl0lFKUjARoaWdolGgRKJZgAAAAAAAAANsPSUAAAKBAAACgQAAAoEDbD0lAAACgQNsPSUAAAKBAAACgQNsPSUAAAKBA2w9JQAAAoEAAAKBAAACAPwAAgD8AAIA/AACAPwAAgD8AAIA/AACAPwAAgD8AAIA/AACAP5RoC0sYhZRoGXSUUpSMCGxvd19yZXBylIz+Wy0zLjE0MTU5MjcgLTUuICAgICAgICAtNS4gICAgICAgIC01LiAgICAgICAgLTMuMTQxNTkyNyAtNS4KIC0zLjE0MTU5MjcgLTUuICAgICAgICAtMC4gICAgICAgIC0zLjE0MTU5MjcgLTUuICAgICAgICAtMy4xNDE1OTI3CiAtNS4gICAgICAgIC0wLiAgICAgICAgLTEuICAgICAgICAtMS4gICAgICAgIC0xLiAgICAgICAgLTEuCiAtMS4gICAgICAgIC0xLiAgICAgICAgLTEuICAgICAgICAtMS4gICAgICAgIC0xLiAgICAgICAgLTEuICAgICAgIF2UjAloaWdoX3JlcHKUjOZbMy4xNDE1OTI3IDUuICAgICAgICA1LiAgICAgICAgNS4gICAgICAgIDMuMTQxNTkyNyA1LiAgICAgICAgMy4xNDE1OTI3CiA1LiAgICAgICAgNS4gICAgICAgIDMuMTQxNTkyNyA1LiAgICAgICAgMy4xNDE1OTI3IDUuICAgICAgICA1LgogMS4gICAgICAgIDEuICAgICAgICAxLiAgICAgICAgMS4gICAgICAgIDEuICAgICAgICAxLiAgICAgICAgMS4KIDEuICAgICAgICAxLiAgICAgICAgMS4gICAgICAgXZSMCl9ucF9yYW5kb22UTnViLg==", "dtype": "float32", "bounded_below": "[ True True True True True True True True True True True True\n True True True True True True True True True True True True]", "bounded_above": "[ True True True True True True True True True True True True\n True True True True True True True True True True True True]", "_shape": [24], "low": "[-3.1415927 -5. -5. -5. -3.1415927 -5.\n -3.1415927 -5. -0. -3.1415927 -5. -3.1415927\n -5. -0. -1. -1. -1. -1.\n -1. -1. -1. -1. -1. -1. ]", "high": "[3.1415927 5. 5. 5. 3.1415927 5. 3.1415927\n 5. 5. 3.1415927 5. 3.1415927 5. 5.\n 1. 1. 1. 1. 1. 1. 1.\n 1. 1. 1. ]", "low_repr": "[-3.1415927 -5. -5. -5. -3.1415927 -5.\n -3.1415927 -5. -0. -3.1415927 -5. -3.1415927\n -5. -0. -1. -1. -1. -1.\n -1. -1. -1. -1. -1. -1. ]", "high_repr": "[3.1415927 5. 5. 5. 3.1415927 5. 3.1415927\n 5. 5. 3.1415927 5. 3.1415927 5. 5.\n 1. 1. 1. 1. 1. 1. 1.\n 1. 1. 1. ]", "_np_random": null}, "action_space": {":type:": "<class 'gymnasium.spaces.box.Box'>", ":serialized:": "gAWVpwEAAAAAAACMFGd5bW5hc2l1bS5zcGFjZXMuYm94lIwDQm94lJOUKYGUfZQojAVkdHlwZZSMBW51bXB5lIwFZHR5cGWUk5SMAmY0lImIh5RSlChLA4wBPJROTk5K/////0r/////SwB0lGKMDWJvdW5kZWRfYmVsb3eUjBJudW1weS5jb3JlLm51bWVyaWOUjAtfZnJvbWJ1ZmZlcpSTlCiWBAAAAAAAAAABAQEBlGgIjAJiMZSJiIeUUpQoSwOMAXyUTk5OSv////9K/////0sAdJRiSwSFlIwBQ5R0lFKUjA1ib3VuZGVkX2Fib3ZllGgRKJYEAAAAAAAAAAEBAQGUaBVLBIWUaBl0lFKUjAZfc2hhcGWUSwSFlIwDbG93lGgRKJYQAAAAAAAAAAAAgL8AAIC/AACAvwAAgL+UaAtLBIWUaBl0lFKUjARoaWdolGgRKJYQAAAAAAAAAAAAgD8AAIA/AACAPwAAgD+UaAtLBIWUaBl0lFKUjAhsb3dfcmVwcpSMBC0xLjCUjAloaWdoX3JlcHKUjAMxLjCUjApfbnBfcmFuZG9tlE51Yi4=", "dtype": "float32", "bounded_below": "[ True True True True]", "bounded_above": "[ True True True True]", "_shape": [4], "low": "[-1. -1. -1. -1.]", "high": "[1. 1. 1. 1.]", "low_repr": "-1.0", "high_repr": "1.0", "_np_random": null}, "n_envs": 16, "n_steps": 300, "gamma": 0.999, "gae_lambda": 0.98, "ent_coef": 0.01, "vf_coef": 0.5, "max_grad_norm": 0.5, "batch_size": 128, "n_epochs": 4, "clip_range": {":type:": "<class 'function'>", ":serialized:": "gAWVxQIAAAAAAACMF2Nsb3VkcGlja2xlLmNsb3VkcGlja2xllIwOX21ha2VfZnVuY3Rpb26Uk5QoaACMDV9idWlsdGluX3R5cGWUk5SMCENvZGVUeXBllIWUUpQoSwFLAEsASwFLAUsTQwSIAFMAlE6FlCmMAV+UhZSMSS91c3IvbG9jYWwvbGliL3B5dGhvbjMuMTAvZGlzdC1wYWNrYWdlcy9zdGFibGVfYmFzZWxpbmVzMy9jb21tb24vdXRpbHMucHmUjARmdW5jlEuEQwIEAZSMA3ZhbJSFlCl0lFKUfZQojAtfX3BhY2thZ2VfX5SMGHN0YWJsZV9iYXNlbGluZXMzLmNvbW1vbpSMCF9fbmFtZV9flIwec3RhYmxlX2Jhc2VsaW5lczMuY29tbW9uLnV0aWxzlIwIX19maWxlX1+UjEkvdXNyL2xvY2FsL2xpYi9weXRob24zLjEwL2Rpc3QtcGFja2FnZXMvc3RhYmxlX2Jhc2VsaW5lczMvY29tbW9uL3V0aWxzLnB5lHVOTmgAjBBfbWFrZV9lbXB0eV9jZWxslJOUKVKUhZR0lFKUjBxjbG91ZHBpY2tsZS5jbG91ZHBpY2tsZV9mYXN0lIwSX2Z1bmN0aW9uX3NldHN0YXRllJOUaB99lH2UKGgWaA2MDF9fcXVhbG5hbWVfX5SMGWNvbnN0YW50X2ZuLjxsb2NhbHM+LmZ1bmOUjA9fX2Fubm90YXRpb25zX1+UfZSMDl9fa3dkZWZhdWx0c19flE6MDF9fZGVmYXVsdHNfX5ROjApfX21vZHVsZV9flGgXjAdfX2RvY19flE6MC19fY2xvc3VyZV9flGgAjApfbWFrZV9jZWxslJOURz/JmZmZmZmahZRSlIWUjBdfY2xvdWRwaWNrbGVfc3VibW9kdWxlc5RdlIwLX19nbG9iYWxzX1+UfZR1hpSGUjAu"}, "clip_range_vf": null, "normalize_advantage": true, "target_kl": null, "lr_schedule": {":type:": "<class 'function'>", ":serialized:": "gAWVxQIAAAAAAACMF2Nsb3VkcGlja2xlLmNsb3VkcGlja2xllIwOX21ha2VfZnVuY3Rpb26Uk5QoaACMDV9idWlsdGluX3R5cGWUk5SMCENvZGVUeXBllIWUUpQoSwFLAEsASwFLAUsTQwSIAFMAlE6FlCmMAV+UhZSMSS91c3IvbG9jYWwvbGliL3B5dGhvbjMuMTAvZGlzdC1wYWNrYWdlcy9zdGFibGVfYmFzZWxpbmVzMy9jb21tb24vdXRpbHMucHmUjARmdW5jlEuEQwIEAZSMA3ZhbJSFlCl0lFKUfZQojAtfX3BhY2thZ2VfX5SMGHN0YWJsZV9iYXNlbGluZXMzLmNvbW1vbpSMCF9fbmFtZV9flIwec3RhYmxlX2Jhc2VsaW5lczMuY29tbW9uLnV0aWxzlIwIX19maWxlX1+UjEkvdXNyL2xvY2FsL2xpYi9weXRob24zLjEwL2Rpc3QtcGFja2FnZXMvc3RhYmxlX2Jhc2VsaW5lczMvY29tbW9uL3V0aWxzLnB5lHVOTmgAjBBfbWFrZV9lbXB0eV9jZWxslJOUKVKUhZR0lFKUjBxjbG91ZHBpY2tsZS5jbG91ZHBpY2tsZV9mYXN0lIwSX2Z1bmN0aW9uX3NldHN0YXRllJOUaB99lH2UKGgWaA2MDF9fcXVhbG5hbWVfX5SMGWNvbnN0YW50X2ZuLjxsb2NhbHM+LmZ1bmOUjA9fX2Fubm90YXRpb25zX1+UfZSMDl9fa3dkZWZhdWx0c19flE6MDF9fZGVmYXVsdHNfX5ROjApfX21vZHVsZV9flGgXjAdfX2RvY19flE6MC19fY2xvc3VyZV9flGgAjApfbWFrZV9jZWxslJOURz8zqSowVTJhhZRSlIWUjBdfY2xvdWRwaWNrbGVfc3VibW9kdWxlc5RdlIwLX19nbG9iYWxzX1+UfZR1hpSGUjAu"}, "system_info": {"OS": "Linux-6.1.58+-x86_64-with-glibc2.35 # 1 SMP PREEMPT_DYNAMIC Sat Nov 18 15:31:17 UTC 2023", "Python": "3.10.12", "Stable-Baselines3": "2.0.0a5", "PyTorch": "2.2.1+cu121", "GPU Enabled": "False", "Numpy": "1.25.2", "Cloudpickle": "2.2.1", "Gymnasium": "0.28.1", "OpenAI Gym": "0.25.2"}}
 
1
+ {"policy_class": {":type:": "<class 'abc.ABCMeta'>", ":serialized:": "gAWVOwAAAAAAAACMIXN0YWJsZV9iYXNlbGluZXMzLmNvbW1vbi5wb2xpY2llc5SMEUFjdG9yQ3JpdGljUG9saWN5lJOULg==", "__module__": "stable_baselines3.common.policies", "__doc__": "\n Policy class for actor-critic algorithms (has both policy and value prediction).\n Used by A2C, PPO and the likes.\n\n :param observation_space: Observation space\n :param action_space: Action space\n :param lr_schedule: Learning rate schedule (could be constant)\n :param net_arch: The specification of the policy and value networks.\n :param activation_fn: Activation function\n :param ortho_init: Whether to use or not orthogonal initialization\n :param use_sde: Whether to use State Dependent Exploration or not\n :param log_std_init: Initial value for the log standard deviation\n :param full_std: Whether to use (n_features x n_actions) parameters\n for the std instead of only (n_features,) when using gSDE\n :param use_expln: Use ``expln()`` function instead of ``exp()`` to ensure\n a positive standard deviation (cf paper). It allows to keep variance\n above zero and prevent it from growing too fast. In practice, ``exp()`` is usually enough.\n :param squash_output: Whether to squash the output using a tanh function,\n this allows to ensure boundaries when using gSDE.\n :param features_extractor_class: Features extractor to use.\n :param features_extractor_kwargs: Keyword arguments\n to pass to the features extractor.\n :param share_features_extractor: If True, the features extractor is shared between the policy and value networks.\n :param normalize_images: Whether to normalize images or not,\n dividing by 255.0 (True by default)\n :param optimizer_class: The optimizer to use,\n ``th.optim.Adam`` by default\n :param optimizer_kwargs: Additional keyword arguments,\n excluding the learning rate, to pass to the optimizer\n ", "__init__": "<function ActorCriticPolicy.__init__ at 0x7e38025c36d0>", "_get_constructor_parameters": "<function ActorCriticPolicy._get_constructor_parameters at 0x7e38025c3760>", "reset_noise": "<function ActorCriticPolicy.reset_noise at 0x7e38025c37f0>", "_build_mlp_extractor": "<function ActorCriticPolicy._build_mlp_extractor at 0x7e38025c3880>", "_build": "<function ActorCriticPolicy._build at 0x7e38025c3910>", "forward": "<function ActorCriticPolicy.forward at 0x7e38025c39a0>", "extract_features": "<function ActorCriticPolicy.extract_features at 0x7e38025c3a30>", "_get_action_dist_from_latent": "<function ActorCriticPolicy._get_action_dist_from_latent at 0x7e38025c3ac0>", "_predict": "<function ActorCriticPolicy._predict at 0x7e38025c3b50>", "evaluate_actions": "<function ActorCriticPolicy.evaluate_actions at 0x7e38025c3be0>", "get_distribution": "<function ActorCriticPolicy.get_distribution at 0x7e38025c3c70>", "predict_values": "<function ActorCriticPolicy.predict_values at 0x7e38025c3d00>", "__abstractmethods__": "frozenset()", "_abc_impl": "<_abc._abc_data object at 0x7e380255dec0>"}, "verbose": 1, "policy_kwargs": {}, "num_timesteps": 104000, "_total_timesteps": 100000, "_num_timesteps_at_start": 0, "seed": null, "action_noise": null, "start_time": 1714106227409224375, "learning_rate": 0.0003, "tensorboard_log": null, "_last_obs": {":type:": "<class 'numpy.ndarray'>", ":serialized:": "gAWVdQYAAAAAAACMEm51bXB5LmNvcmUubnVtZXJpY5SMC19mcm9tYnVmZmVylJOUKJYABgAAAAAAAMIJBD7QzQA8/lIjPIr3Ozwlf0S/ZFonPyCr0z1ZNBG/AAAAAIDelD///38/dDIuPzXnv78AAIA/X6ltPkHdbz4rsHc+73WDPhLvjz6efqE+iyy8Pm8l6z78Tx8/AACAP+cNzj1Xxws9sPoiPdpdXzyrhJA/9OLwPsRlSj/7/3+/AACAPyBUKr/OdBS+mM/CvjzweL8AAAAAKQKKPimAiz7+/Y8+c7CYPpxKqD6B6L0+DtvePrGeCz9Vazc/AACAPwFr3j06IKk7hADePFKH/Dyq/FK/AAAAM0BfX70FAIA/AAAAAEVzjT8AAAAA/OdaP58z5b0AAIA/8apnPnVMaj6if3I+8aOAPvxYjD5uT54+TVi6PnTM6D4BbCc/AACAP02wXL9IhsC91PaauwWHCb4P5uQ+udGMPiKjKD/9/38/AAAAAMFbET6ADOQ7bH4uPyVWer8AAAAAzbvdPnBA4D6aGeg+lD/2PlFUBj+UhRc/sloyP+fQXj8AAIA/AACAP1FCXz0Nkq485H3nPGFe6Dwg4hq/XCtbvVg4Nr5W0oC/AAAAAB1ekD8ANH85KlxbP9Isgb4AAIA/Z8l/PnDegT7liYY+67SOPptsmj46B6w+/X3KPndk8z7MRho/ErN3P75zTD5loAS9am7ZO2ZovTyfRJE/AGYqOzRcRT+5CIA/AAAAAG8NSr++ZpE+MLz6vnXck74AAIA/BEODPlHxhT6T8Ys+j3yUPin9oT6tuLY+0qDUPjce/z4fjys/AACAP+T92z2vjgG8DkKVPOofAj2DU1W/oI7QuqhGcT6zH+o9AAAAABjijD8AJJo4SEZsP0t0VjsAAIA/qZZsPnxGbz4/pnc+dm6DPnF5jz7zYJ8+NBO3Plqq3z4FtSI/AACAP5Lp1D0bL4A9de3yutODfrxG91K/SDwAPSxbCD4AAIC/AAAAALa2jj8AAAAAvCtOP/gBB78AAIA/Z9ptPueNcD7cwXc+I7KCPq46jz6HOaM+15nAPhHL8T4AEC0/AACAP/6rFj6e/IC8sJELPt+B87xRz1G/YGc8OwBOfL6FbIC/AAAAAKREkT8AEJy3gG9NPw0RgD8AAAAAJvJrPhygbj4M+nY+0POCPiIWjj7kJJ8+JYW5Pk7Z7j5UDSU/AACAP1Wxvj3kamC87DYLPfSuMD0tvVG/ANSeuITBaz7bEzI+AACAP5dMjj8AgF42QlxbP7HS+zwAAIA/KZ1qPj5HbT4dlXU+v0aCPuYhjj7TUqA++La8PkLh7T5h0SY/AACAP4L+gj2d7KI7+D1mvHY8Nj3AbDy/OEsoPkDDcL3dt3+/AAAAAB26jT/M2qm+4jdZPzC6qT4AAIA/lw9sPjfrbj6ShXc+Hn+DPh7Ljz6PZaM+sQXEPtT0/j6Fxi0/AACAP7W/Kj5I7YQ9DJsTPYU44byRuo8/eLYMvvafTz8AAIC/AAAAALl4UL8e5oi/WIm0PcmcIj8AAIA/aUKFPtXFhj5RfYs+Ff6TPnsqoT7wrrU+DNTYPgRbCT/hVTk/AACAP210S74hahy9tmTAvZfGvb2Gd4++L9TRPgtWbz8AAAAAAAAAAG57Jj9HQaQ/qJ1GPwAAgL8AAAAA9pDoPhg16z5pcPM+qyMBP1bkDD+e7B4/UxE7P5mzaT8AAIA/AACAPzEroz07oOq82P3EPHj3Ar2x41K/AABAM+g2dz4CAIA/AAAAAD1wkD8w+Ps+Qo5sPwAAAAAAAIA/qRdtPvPIbz5HLXg+EqeDPkqijz5k76A+r8O5PlC44T6cdyA/AACAP8VD/T3m9fU7w6yYvEHqCLk6OE6/ZnWXPaT9jb4RCxa+AAAAANhRiD/WPTm/CMR8PwAAgD8AAIA/O9BnPjrnaD56O24+fk15Pjkihj6HI5U+lIuuPnfj2T4j0Rg/AACAP8gmvD2j9Xm7OqM7PSmmvb0Q0U6/AADAsuCUkj5QuRS+AACAP4wZkD8AAAAAUhxCP/z/f78AAAAAS4R5PrRZfD5Ol4I+No2KPikplz7mgao+uLPIPnEL+T5Ebiw/AACAP5SMBW51bXB5lIwFZHR5cGWUk5SMAmY0lImIh5RSlChLA4wBPJROTk5K/////0r/////SwB0lGJLEEsYhpSMAUOUdJRSlC4="}, "_last_episode_starts": {":type:": "<class 'numpy.ndarray'>", ":serialized:": "gAWVgwAAAAAAAACMEm51bXB5LmNvcmUubnVtZXJpY5SMC19mcm9tYnVmZmVylJOUKJYQAAAAAAAAAAAAAAAAAAAAAAAAAAAAAACUjAVudW1weZSMBWR0eXBllJOUjAJiMZSJiIeUUpQoSwOMAXyUTk5OSv////9K/////0sAdJRiSxCFlIwBQ5R0lFKULg=="}, "_last_original_obs": null, "_episode_num": 0, "use_sde": false, "sde_sample_freq": -1, "_current_progress_remaining": -0.040000000000000036, "_stats_window_size": 100, "ep_info_buffer": {":type:": "<class 'collections.deque'>", ":serialized:": "gAWVAQwAAAAAAACMC2NvbGxlY3Rpb25zlIwFZGVxdWWUk5QpS2SGlFKUKH2UKIwBcpRHwF24MBp5/sqMAWyUS1iMAXSUR0Btyv7+DOC5dX2UKGgGR8BaevKdQO4HaAdLOWgIR0Bt24V/MGHIdX2UKGgGR8Ba06MNtqHoaAdLS2gIR0BuM2gOBlMAdX2UKGgGR8BcJc4T9KmLaAdLR2gIR0BuTNjEvTPTdX2UKGgGR8BhJ5NwiqyXaAdLo2gIR0Buc/lOoHcDdX2UKGgGR8Bcl9L127nQaAdLNGgIR0Bufvcxj8UFdX2UKGgGR8BbUWpVCHARaAdLPmgIR0BujQAEMb3odX2UKGgGR8BdfvRqoIfKaAdLV2gIR0BuoSynk1dgdX2UKGgGR8BZd4TfzjFRaAdNQAZoCEdAbtwzMzMzM3V9lChoBkfAX1hOIqLCN2gHS1ZoCEdAbt3QcghbGHV9lChoBkfAWy3yd4FA3WgHSzhoCEdAbupeVLSNO3V9lChoBkfAWYU5R0lqrWgHS0FoCEdAbusIxgy/K3V9lChoBkfAXBYG+sYEXGgHS0doCEdAbvqBU70WdnV9lChoBkfAXDxZ+x4Y8GgHS1BoCEdAbvwP7N0NjXV9lChoBkfAWcVMURFqjGgHTUAGaAhHQG8CvwEyLyd1fZQoaAZHwFnrKq4pc5doB01ABmgIR0BvApgogFHKdX2UKGgGR8Bb2C+cpb2UaAdNQAZoCEdAbwK2gFotc3V9lChoBkfAWMz7ALy+YmgHTUAGaAhHQG8Cwpe/pMZ1fZQoaAZHwFtQXeWOZLJoB01ABmgIR0BvAtPxhDw6dX2UKGgGR8BaHWsA/9pAaAdLN2gIR0BvCDHyVfNSdX2UKGgGR8BXUlZDArQPaAdNQAZoCEdAbxOSpR4yGnV9lChoBkfAWuNN7BwdbWgHS0doCEdAbxNVIZqEe3V9lChoBkfAWNWOPvKEFmgHTUAGaAhHQG8Teb/ffoB1fZQoaAZHwFlT3RG+bmVoB0tIaAhHQG8Ub961LJ11fZQoaAZHwF5LImw7kn1oB0tJaAhHQG8URe1KGtZ1fZQoaAZHwFn5uMdcSoRoB0tOaAhHQG8V/zJ6po91fZQoaAZHwFv4pY9xIatoB0thaAhHQG8aE6DGtIV1fZQoaAZHwFyR/LDAJsxoB0uOaAhHQG8cFev6j351fZQoaAZHwFromfGuLaVoB0tkaAhHQG8gZc1O0sx1fZQoaAZHwFy3Btk4FRpoB0s3aAhHQG8mGSpzcRF1fZQoaAZHwF4d8eS0Sh9oB0tzaAhHQG8t62WpqAV1fZQoaAZHwFn+KzRhMJxoB01ABmgIR0BvMTbi6xxDdX2UKGgGR8BbctugpSaWaAdNQAZoCEdAbzKenyd4FHV9lChoBkfAWWphDw6QvGgHSz9oCEdAbzVND+irUHV9lChoBkfAW4K3WnTAnGgHS1hoCEdAb0KtUXHim3V9lChoBkfAXCxgWrOqvWgHS05oCEdAb0Pc+qzZ6HV9lChoBkfAWaBkH2RJVmgHTUAGaAhHQG9FqTr3TNN1fZQoaAZHwGHAtQbdadNoB0v0aAhHQG93yXUpd8l1fZQoaAZHwFi9QJ5VwP1oB01ABmgIR0BveBzHS4OMdX2UKGgGR8BcAvsRg7YDaAdLNWgIR0Bvfa5LAYYSdX2UKGgGR8BcknF98Z1naAdLS2gIR0BvgCgZjx0/dX2UKGgGR8BZIBMWXTmXaAdLWGgIR0BvhApjMFEBdX2UKGgGR8BcmP7WNFSbaAdLUmgIR0BviwYLsruqdX2UKGgGR8BcorhvR7Z4aAdLMWgIR0Bvi5YmsvIwdX2UKGgGR8BYzWoJiRW+aAdNQAZoCEdAb5E8EFGG23V9lChoBkfAWUpK02LpA2gHS1loCEdAb5NaIvalDXV9lChoBkfAWfnaTOgQH2gHS0BoCEdAb50jcEeQuHV9lChoBkfAWcCtJWeYlmgHS09oCEdAb6MREF4cFXV9lChoBkfAWNHlp48lomgHTUAGaAhHQG+kTxXnyNJ1fZQoaAZHwFoYRChN/ONoB0t+aAhHQG+o/p2U0N11fZQoaAZHwFsGBi1AqutoB01ABmgIR0Bvsz850bLmdX2UKGgGR8BcWZ8jRlYmaAdLOWgIR0BvxkebNKRMdX2UKGgGR8BeVdUKiO/+aAdLZ2gIR0BvzQRGtp22dX2UKGgGR8Be72g3974SaAdLe2gIR0Bv0CrtE5QxdX2UKGgGR8Bb+USqU/wBaAdLOWgIR0Bv4kZJkGzKdX2UKGgGR8BZS0AggX/HaAdLWGgIR0Bv5zWPLgXNdX2UKGgGR8BbdoiX6ZYxaAdLU2gIR0Bv7acslLOBdX2UKGgGR8BbKbhaTwDvaAdLNmgIR0Bv+atHQQcxdX2UKGgGR8BaYZzLfUF0aAdLUmgIR0BwBM4PwuuidX2UKGgGR8Bb2OLR8c+8aAdNQAZoCEdAcJSvEjxCpnV9lChoBkfAV/n/xUedTmgHTUAGaAhHQHCU8UEgW8B1fZQoaAZHwFiJJF9a2WpoB01ABmgIR0BwlN6AvtdBdX2UKGgGR8BZyZKODJ2daAdNQAZoCEdAcJWmXgLqlnV9lChoBkfAWizJvHcUNGgHTUAGaAhHQHCY1LvkRz11fZQoaAZHwFkaCFsYVItoB01ABmgIR0Bwmy+fywwCdX2UKGgGR8BaSLyUcGTtaAdLRWgIR0BwnQu8K5TZdX2UKGgGR8Bal8kdFOO9aAdLL2gIR0BwnhQsPJ7tdX2UKGgGR8BfY2yHEdeZaAdLU2gIR0BwnwyN4qwydX2UKGgGR8BZQ8PBi1AraAdLLWgIR0BwofZ+QU5/dX2UKGgGR8Bbc0n5SFXaaAdNQAZoCEdAcLtbmEGqxXV9lChoBkfAWidowmE5AGgHSy9oCEdAcLwajN6gNHV9lChoBkfAWGRWJaaCtmgHTUAGaAhHQHC9VHSWqtJ1fZQoaAZHwFmA287IT5BoB0tdaAhHQHC90xASnLt1fZQoaAZHwFlPKkVN5+poB0tWaAhHQHDBSprDZUV1fZQoaAZHwFyuXhfjS5RoB0tIaAhHQHDFTAeq7yx1fZQoaAZHwFlm8scyWRloB0s4aAhHQHDMDch1Tzd1fZQoaAZHwFnZMqz7di5oB0tmaAhHQHDOqqXF98Z1fZQoaAZHwFgRsMRYigVoB01ABmgIR0Bw0DiT+vQodX2UKGgGR8BfNTeTFERbaAdLZWgIR0Bw0KBEroW6dX2UKGgGR8BaaAam4y44aAdLLGgIR0Bw2GafBeoldX2UKGgGR8BW/T101ZTyaAdNQAZoCEdAcOKNlRP423V9lChoBkfAWv2RLbpNbmgHTUAGaAhHQHDkDGYKIBR1fZQoaAZHwF0RCaqjrRloB01ABmgIR0Bw6f8/D+BIdX2UKGgGR8BXqFqagElmaAdNQAZoCEdAcO1PdVNpNHV9lChoBkfAWgIhGH58B2gHSzloCEdAcO7a1Cw8n3V9lChoBkfAXHzXiBGx2WgHSz9oCEdAcPNqqfe1r3V9lChoBkfAWyzbi6xxDWgHSzBoCEdAcPSxYJVsDXV9lChoBkfAXNqdvsJID2gHS0loCEdAcPchUBGQS3V9lChoBkfAWcLD50r9VGgHS1hoCEdAcP98ejmCAnV9lChoBkfAXSUqmTC+DmgHS0xoCEdAcQBFXq7iAHV9lChoBkfAVyVfgJkXlGgHTUAGaAhHQHEDlcY64lR1fZQoaAZHwFanqYJE6T5oB01ABmgIR0BxH1C2MKkVdX2UKGgGR8BfBPmcOLBLaAdLb2gIR0BxI7bJwKjSdX2UKGgGR8BaS91hb4ahaAdNQAZoCEdAcSQvLowEhnV9lChoBkfAXVCF+NLlFWgHS0BoCEdAcSYDGLk0anV9lChoBkfAWjyHvc8DCGgHS0JoCEdAcSrBacI7eXV9lChoBkfAWuFhG6PKdWgHS1toCEdAcTUJu2qkunV9lChoBkfAWzYk8ifQKWgHSy5oCEdAcTqz90ihWnV9lChoBkfAWC825xzaK2gHTUAGaAhHQHGvNWQwK0F1fZQoaAZHwFm8e4kNWlxoB01ABmgIR0Bxr43WFvhqdWUu"}, "ep_success_buffer": {":type:": "<class 'collections.deque'>", ":serialized:": "gAWVIAAAAAAAAACMC2NvbGxlY3Rpb25zlIwFZGVxdWWUk5QpS2SGlFKULg=="}, "_n_updates": 52, "observation_space": {":type:": "<class 'gymnasium.spaces.box.Box'>", ":serialized:": "gAWVTAQAAAAAAACMFGd5bW5hc2l1bS5zcGFjZXMuYm94lIwDQm94lJOUKYGUfZQojAVkdHlwZZSMBW51bXB5lIwFZHR5cGWUk5SMAmY0lImIh5RSlChLA4wBPJROTk5K/////0r/////SwB0lGKMDWJvdW5kZWRfYmVsb3eUjBJudW1weS5jb3JlLm51bWVyaWOUjAtfZnJvbWJ1ZmZlcpSTlCiWGAAAAAAAAAABAQEBAQEBAQEBAQEBAQEBAQEBAQEBAQGUaAiMAmIxlImIh5RSlChLA4wBfJROTk5K/////0r/////SwB0lGJLGIWUjAFDlHSUUpSMDWJvdW5kZWRfYWJvdmWUaBEolhgAAAAAAAAAAQEBAQEBAQEBAQEBAQEBAQEBAQEBAQEBlGgVSxiFlGgZdJRSlIwGX3NoYXBllEsYhZSMA2xvd5RoESiWYAAAAAAAAADbD0nAAACgwAAAoMAAAKDA2w9JwAAAoMDbD0nAAACgwAAAAIDbD0nAAACgwNsPScAAAKDAAAAAgAAAgL8AAIC/AACAvwAAgL8AAIC/AACAvwAAgL8AAIC/AACAvwAAgL+UaAtLGIWUaBl0lFKUjARoaWdolGgRKJZgAAAAAAAAANsPSUAAAKBAAACgQAAAoEDbD0lAAACgQNsPSUAAAKBAAACgQNsPSUAAAKBA2w9JQAAAoEAAAKBAAACAPwAAgD8AAIA/AACAPwAAgD8AAIA/AACAPwAAgD8AAIA/AACAP5RoC0sYhZRoGXSUUpSMCGxvd19yZXBylIz+Wy0zLjE0MTU5MjcgLTUuICAgICAgICAtNS4gICAgICAgIC01LiAgICAgICAgLTMuMTQxNTkyNyAtNS4KIC0zLjE0MTU5MjcgLTUuICAgICAgICAtMC4gICAgICAgIC0zLjE0MTU5MjcgLTUuICAgICAgICAtMy4xNDE1OTI3CiAtNS4gICAgICAgIC0wLiAgICAgICAgLTEuICAgICAgICAtMS4gICAgICAgIC0xLiAgICAgICAgLTEuCiAtMS4gICAgICAgIC0xLiAgICAgICAgLTEuICAgICAgICAtMS4gICAgICAgIC0xLiAgICAgICAgLTEuICAgICAgIF2UjAloaWdoX3JlcHKUjOZbMy4xNDE1OTI3IDUuICAgICAgICA1LiAgICAgICAgNS4gICAgICAgIDMuMTQxNTkyNyA1LiAgICAgICAgMy4xNDE1OTI3CiA1LiAgICAgICAgNS4gICAgICAgIDMuMTQxNTkyNyA1LiAgICAgICAgMy4xNDE1OTI3IDUuICAgICAgICA1LgogMS4gICAgICAgIDEuICAgICAgICAxLiAgICAgICAgMS4gICAgICAgIDEuICAgICAgICAxLiAgICAgICAgMS4KIDEuICAgICAgICAxLiAgICAgICAgMS4gICAgICAgXZSMCl9ucF9yYW5kb22UTnViLg==", "dtype": "float32", "bounded_below": "[ True True True True True True True True True True True True\n True True True True True True True True True True True True]", "bounded_above": "[ True True True True True True True True True True True True\n True True True True True True True True True True True True]", "_shape": [24], "low": "[-3.1415927 -5. -5. -5. -3.1415927 -5.\n -3.1415927 -5. -0. -3.1415927 -5. -3.1415927\n -5. -0. -1. -1. -1. -1.\n -1. -1. -1. -1. -1. -1. ]", "high": "[3.1415927 5. 5. 5. 3.1415927 5. 3.1415927\n 5. 5. 3.1415927 5. 3.1415927 5. 5.\n 1. 1. 1. 1. 1. 1. 1.\n 1. 1. 1. ]", "low_repr": "[-3.1415927 -5. -5. -5. -3.1415927 -5.\n -3.1415927 -5. -0. -3.1415927 -5. -3.1415927\n -5. -0. -1. -1. -1. -1.\n -1. -1. -1. -1. -1. -1. ]", "high_repr": "[3.1415927 5. 5. 5. 3.1415927 5. 3.1415927\n 5. 5. 3.1415927 5. 3.1415927 5. 5.\n 1. 1. 1. 1. 1. 1. 1.\n 1. 1. 1. ]", "_np_random": null}, "action_space": {":type:": "<class 'gymnasium.spaces.box.Box'>", ":serialized:": "gAWVpwEAAAAAAACMFGd5bW5hc2l1bS5zcGFjZXMuYm94lIwDQm94lJOUKYGUfZQojAVkdHlwZZSMBW51bXB5lIwFZHR5cGWUk5SMAmY0lImIh5RSlChLA4wBPJROTk5K/////0r/////SwB0lGKMDWJvdW5kZWRfYmVsb3eUjBJudW1weS5jb3JlLm51bWVyaWOUjAtfZnJvbWJ1ZmZlcpSTlCiWBAAAAAAAAAABAQEBlGgIjAJiMZSJiIeUUpQoSwOMAXyUTk5OSv////9K/////0sAdJRiSwSFlIwBQ5R0lFKUjA1ib3VuZGVkX2Fib3ZllGgRKJYEAAAAAAAAAAEBAQGUaBVLBIWUaBl0lFKUjAZfc2hhcGWUSwSFlIwDbG93lGgRKJYQAAAAAAAAAAAAgL8AAIC/AACAvwAAgL+UaAtLBIWUaBl0lFKUjARoaWdolGgRKJYQAAAAAAAAAAAAgD8AAIA/AACAPwAAgD+UaAtLBIWUaBl0lFKUjAhsb3dfcmVwcpSMBC0xLjCUjAloaWdoX3JlcHKUjAMxLjCUjApfbnBfcmFuZG9tlE51Yi4=", "dtype": "float32", "bounded_below": "[ True True True True]", "bounded_above": "[ True True True True]", "_shape": [4], "low": "[-1. -1. -1. -1.]", "high": "[1. 1. 1. 1.]", "low_repr": "-1.0", "high_repr": "1.0", "_np_random": null}, "n_envs": 16, "n_steps": 500, "gamma": 0.999, "gae_lambda": 0.98, "ent_coef": 0.01, "vf_coef": 0.5, "max_grad_norm": 0.5, "batch_size": 128, "n_epochs": 4, "clip_range": {":type:": "<class 'function'>", ":serialized:": "gAWVxQIAAAAAAACMF2Nsb3VkcGlja2xlLmNsb3VkcGlja2xllIwOX21ha2VfZnVuY3Rpb26Uk5QoaACMDV9idWlsdGluX3R5cGWUk5SMCENvZGVUeXBllIWUUpQoSwFLAEsASwFLAUsTQwSIAFMAlE6FlCmMAV+UhZSMSS91c3IvbG9jYWwvbGliL3B5dGhvbjMuMTAvZGlzdC1wYWNrYWdlcy9zdGFibGVfYmFzZWxpbmVzMy9jb21tb24vdXRpbHMucHmUjARmdW5jlEuEQwIEAZSMA3ZhbJSFlCl0lFKUfZQojAtfX3BhY2thZ2VfX5SMGHN0YWJsZV9iYXNlbGluZXMzLmNvbW1vbpSMCF9fbmFtZV9flIwec3RhYmxlX2Jhc2VsaW5lczMuY29tbW9uLnV0aWxzlIwIX19maWxlX1+UjEkvdXNyL2xvY2FsL2xpYi9weXRob24zLjEwL2Rpc3QtcGFja2FnZXMvc3RhYmxlX2Jhc2VsaW5lczMvY29tbW9uL3V0aWxzLnB5lHVOTmgAjBBfbWFrZV9lbXB0eV9jZWxslJOUKVKUhZR0lFKUjBxjbG91ZHBpY2tsZS5jbG91ZHBpY2tsZV9mYXN0lIwSX2Z1bmN0aW9uX3NldHN0YXRllJOUaB99lH2UKGgWaA2MDF9fcXVhbG5hbWVfX5SMGWNvbnN0YW50X2ZuLjxsb2NhbHM+LmZ1bmOUjA9fX2Fubm90YXRpb25zX1+UfZSMDl9fa3dkZWZhdWx0c19flE6MDF9fZGVmYXVsdHNfX5ROjApfX21vZHVsZV9flGgXjAdfX2RvY19flE6MC19fY2xvc3VyZV9flGgAjApfbWFrZV9jZWxslJOURz/JmZmZmZmahZRSlIWUjBdfY2xvdWRwaWNrbGVfc3VibW9kdWxlc5RdlIwLX19nbG9iYWxzX1+UfZR1hpSGUjAu"}, "clip_range_vf": null, "normalize_advantage": true, "target_kl": null, "lr_schedule": {":type:": "<class 'function'>", ":serialized:": "gAWVxQIAAAAAAACMF2Nsb3VkcGlja2xlLmNsb3VkcGlja2xllIwOX21ha2VfZnVuY3Rpb26Uk5QoaACMDV9idWlsdGluX3R5cGWUk5SMCENvZGVUeXBllIWUUpQoSwFLAEsASwFLAUsTQwSIAFMAlE6FlCmMAV+UhZSMSS91c3IvbG9jYWwvbGliL3B5dGhvbjMuMTAvZGlzdC1wYWNrYWdlcy9zdGFibGVfYmFzZWxpbmVzMy9jb21tb24vdXRpbHMucHmUjARmdW5jlEuEQwIEAZSMA3ZhbJSFlCl0lFKUfZQojAtfX3BhY2thZ2VfX5SMGHN0YWJsZV9iYXNlbGluZXMzLmNvbW1vbpSMCF9fbmFtZV9flIwec3RhYmxlX2Jhc2VsaW5lczMuY29tbW9uLnV0aWxzlIwIX19maWxlX1+UjEkvdXNyL2xvY2FsL2xpYi9weXRob24zLjEwL2Rpc3QtcGFja2FnZXMvc3RhYmxlX2Jhc2VsaW5lczMvY29tbW9uL3V0aWxzLnB5lHVOTmgAjBBfbWFrZV9lbXB0eV9jZWxslJOUKVKUhZR0lFKUjBxjbG91ZHBpY2tsZS5jbG91ZHBpY2tsZV9mYXN0lIwSX2Z1bmN0aW9uX3NldHN0YXRllJOUaB99lH2UKGgWaA2MDF9fcXVhbG5hbWVfX5SMGWNvbnN0YW50X2ZuLjxsb2NhbHM+LmZ1bmOUjA9fX2Fubm90YXRpb25zX1+UfZSMDl9fa3dkZWZhdWx0c19flE6MDF9fZGVmYXVsdHNfX5ROjApfX21vZHVsZV9flGgXjAdfX2RvY19flE6MC19fY2xvc3VyZV9flGgAjApfbWFrZV9jZWxslJOURz8zqSowVTJhhZRSlIWUjBdfY2xvdWRwaWNrbGVfc3VibW9kdWxlc5RdlIwLX19nbG9iYWxzX1+UfZR1hpSGUjAu"}, "system_info": {"OS": "Linux-6.1.58+-x86_64-with-glibc2.35 # 1 SMP PREEMPT_DYNAMIC Sat Nov 18 15:31:17 UTC 2023", "Python": "3.10.12", "Stable-Baselines3": "2.0.0a5", "PyTorch": "2.2.1+cu121", "GPU Enabled": "False", "Numpy": "1.25.2", "Cloudpickle": "2.2.1", "Gymnasium": "0.28.1", "OpenAI Gym": "0.25.2"}}
replay.mp4 CHANGED
Binary files a/replay.mp4 and b/replay.mp4 differ
 
results.json CHANGED
@@ -1 +1 @@
1
- {"mean_reward": -92.28305220068141, "std_reward": 0.07317789411062775, "is_deterministic": true, "n_eval_episodes": 10, "eval_datetime": "2024-04-25T05:27:06.439335"}
 
1
+ {"mean_reward": -56.37531610364094, "std_reward": 0.21513498902641692, "is_deterministic": true, "n_eval_episodes": 10, "eval_datetime": "2024-04-26T04:40:03.821594"}