Augcos commited on
Commit
de4f73a
·
1 Parent(s): 21223c9

Initial commit

Browse files
.gitattributes CHANGED
@@ -32,3 +32,4 @@ saved_model/**/* filter=lfs diff=lfs merge=lfs -text
32
  *.zip filter=lfs diff=lfs merge=lfs -text
33
  *.zst filter=lfs diff=lfs merge=lfs -text
34
  *tfevents* filter=lfs diff=lfs merge=lfs -text
 
 
32
  *.zip filter=lfs diff=lfs merge=lfs -text
33
  *.zst filter=lfs diff=lfs merge=lfs -text
34
  *tfevents* filter=lfs diff=lfs merge=lfs -text
35
+ replay.mp4 filter=lfs diff=lfs merge=lfs -text
README.md CHANGED
@@ -16,7 +16,7 @@ model-index:
16
  type: AntBulletEnv-v0
17
  metrics:
18
  - type: mean_reward
19
- value: 715.21 +/- 332.84
20
  name: mean_reward
21
  verified: false
22
  ---
 
16
  type: AntBulletEnv-v0
17
  metrics:
18
  - type: mean_reward
19
+ value: 1893.63 +/- 99.91
20
  name: mean_reward
21
  verified: false
22
  ---
a2c-AntBulletEnv-v0.zip CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:048e824d59abcfb10689252f14993e201698bc3d3d07a1517cddcaf1ee2e4892
3
- size 129227
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:950a62b3c82cf4c40fc8bb8f49b92988fd05c199241f30722f436f16fd7c38cb
3
+ size 128975
a2c-AntBulletEnv-v0/data CHANGED
@@ -4,20 +4,20 @@
4
  ":serialized:": "gAWVOwAAAAAAAACMIXN0YWJsZV9iYXNlbGluZXMzLmNvbW1vbi5wb2xpY2llc5SMEUFjdG9yQ3JpdGljUG9saWN5lJOULg==",
5
  "__module__": "stable_baselines3.common.policies",
6
  "__doc__": "\n Policy class for actor-critic algorithms (has both policy and value prediction).\n Used by A2C, PPO and the likes.\n\n :param observation_space: Observation space\n :param action_space: Action space\n :param lr_schedule: Learning rate schedule (could be constant)\n :param net_arch: The specification of the policy and value networks.\n :param activation_fn: Activation function\n :param ortho_init: Whether to use or not orthogonal initialization\n :param use_sde: Whether to use State Dependent Exploration or not\n :param log_std_init: Initial value for the log standard deviation\n :param full_std: Whether to use (n_features x n_actions) parameters\n for the std instead of only (n_features,) when using gSDE\n :param use_expln: Use ``expln()`` function instead of ``exp()`` to ensure\n a positive standard deviation (cf paper). It allows to keep variance\n above zero and prevent it from growing too fast. In practice, ``exp()`` is usually enough.\n :param squash_output: Whether to squash the output using a tanh function,\n this allows to ensure boundaries when using gSDE.\n :param features_extractor_class: Features extractor to use.\n :param features_extractor_kwargs: Keyword arguments\n to pass to the features extractor.\n :param share_features_extractor: If True, the features extractor is shared between the policy and value networks.\n :param normalize_images: Whether to normalize images or not,\n dividing by 255.0 (True by default)\n :param optimizer_class: The optimizer to use,\n ``th.optim.Adam`` by default\n :param optimizer_kwargs: Additional keyword arguments,\n excluding the learning rate, to pass to the optimizer\n ",
7
- "__init__": "<function ActorCriticPolicy.__init__ at 0x7fec6ce7f280>",
8
- "_get_constructor_parameters": "<function ActorCriticPolicy._get_constructor_parameters at 0x7fec6ce7f310>",
9
- "reset_noise": "<function ActorCriticPolicy.reset_noise at 0x7fec6ce7f3a0>",
10
- "_build_mlp_extractor": "<function ActorCriticPolicy._build_mlp_extractor at 0x7fec6ce7f430>",
11
- "_build": "<function ActorCriticPolicy._build at 0x7fec6ce7f4c0>",
12
- "forward": "<function ActorCriticPolicy.forward at 0x7fec6ce7f550>",
13
- "extract_features": "<function ActorCriticPolicy.extract_features at 0x7fec6ce7f5e0>",
14
- "_get_action_dist_from_latent": "<function ActorCriticPolicy._get_action_dist_from_latent at 0x7fec6ce7f670>",
15
- "_predict": "<function ActorCriticPolicy._predict at 0x7fec6ce7f700>",
16
- "evaluate_actions": "<function ActorCriticPolicy.evaluate_actions at 0x7fec6ce7f790>",
17
- "get_distribution": "<function ActorCriticPolicy.get_distribution at 0x7fec6ce7f820>",
18
- "predict_values": "<function ActorCriticPolicy.predict_values at 0x7fec6ce7f8b0>",
19
  "__abstractmethods__": "frozenset()",
20
- "_abc_impl": "<_abc._abc_data object at 0x7fec6ce802c0>"
21
  },
22
  "verbose": 1,
23
  "policy_kwargs": {
@@ -37,16 +37,16 @@
37
  "_num_timesteps_at_start": 0,
38
  "seed": null,
39
  "action_noise": null,
40
- "start_time": 1681226124513463565,
41
- "learning_rate": 0.00096,
42
  "tensorboard_log": null,
43
  "lr_schedule": {
44
  ":type:": "<class 'function'>",
45
- ":serialized:": "gAWVwwIAAAAAAACMF2Nsb3VkcGlja2xlLmNsb3VkcGlja2xllIwOX21ha2VfZnVuY3Rpb26Uk5QoaACMDV9idWlsdGluX3R5cGWUk5SMCENvZGVUeXBllIWUUpQoSwFLAEsASwFLAUsTQwSIAFMAlE6FlCmMAV+UhZSMSC91c3IvbG9jYWwvbGliL3B5dGhvbjMuOS9kaXN0LXBhY2thZ2VzL3N0YWJsZV9iYXNlbGluZXMzL2NvbW1vbi91dGlscy5weZSMBGZ1bmOUS4JDAgABlIwDdmFslIWUKXSUUpR9lCiMC19fcGFja2FnZV9flIwYc3RhYmxlX2Jhc2VsaW5lczMuY29tbW9ulIwIX19uYW1lX1+UjB5zdGFibGVfYmFzZWxpbmVzMy5jb21tb24udXRpbHOUjAhfX2ZpbGVfX5SMSC91c3IvbG9jYWwvbGliL3B5dGhvbjMuOS9kaXN0LXBhY2thZ2VzL3N0YWJsZV9iYXNlbGluZXMzL2NvbW1vbi91dGlscy5weZR1Tk5oAIwQX21ha2VfZW1wdHlfY2VsbJSTlClSlIWUdJRSlIwcY2xvdWRwaWNrbGUuY2xvdWRwaWNrbGVfZmFzdJSMEl9mdW5jdGlvbl9zZXRzdGF0ZZSTlGgffZR9lChoFmgNjAxfX3F1YWxuYW1lX1+UjBljb25zdGFudF9mbi48bG9jYWxzPi5mdW5jlIwPX19hbm5vdGF0aW9uc19flH2UjA5fX2t3ZGVmYXVsdHNfX5ROjAxfX2RlZmF1bHRzX1+UTowKX19tb2R1bGVfX5RoF4wHX19kb2NfX5ROjAtfX2Nsb3N1cmVfX5RoAIwKX21ha2VfY2VsbJSTlEc/T3UQTVUdaYWUUpSFlIwXX2Nsb3VkcGlja2xlX3N1Ym1vZHVsZXOUXZSMC19fZ2xvYmFsc19flH2UdYaUhlIwLg=="
46
  },
47
  "_last_obs": {
48
  ":type:": "<class 'numpy.ndarray'>",
49
- ":serialized:": "gAWVNQIAAAAAAACMEm51bXB5LmNvcmUubnVtZXJpY5SMC19mcm9tYnVmZmVylJOUKJbAAQAAAAAAAGt/bj/eCna+Ea7xPolotr8G8Ng/G0EWP4+lA7841T299q1aPlcNA8CttWa/KWM3PH9UfL/46Zo+lKXEvVm2ML9G9Em+gCb4P8T92z4NTipAkxHEPQW6I78+sP0/Tk+5vuU2C8DaoZM+5tcJwImANj+Czpc/eOa+v6slOsBayAI/BfffPYtHwT2sjxo/TrL8vtKghL8mQYBACJIcQH1Pj0AiLEy/EAIjv+jKhb/gLDs/VRzUP/mwTL97IYy+SrPXvub86T/T4MQ9Tge9PwrpoT7lNgvA2qGTPhe47T6JgDY/Ip2BP/tuer9LuYi+/6kkP+O4UL+PKSa/rrNTP0lDc7+DRrI911UuwPhF9T9L51/Aq7pUvxwyuj8PHjy/mjGUv0q9vb/DCXU/lxwZP7/h3T+FBiI/VaZxvsoNpz8q1BI/5TYLwPn0XcAXuO0+iYA2P10C7j7jK7K/cVqcv8RiBL4jhyi+hMpkPUmRvj86/uC+KTHlvxpuID2rF0K/pC3HPzIq9L4QQCBAReqVvzFiFz+CPCQ/8GmBP3IthT9/meW+UDJdPybUAUDn1Yw9fDFpPuU2C8DaoZM+F7jtPomANj+UjAVudW1weZSMBWR0eXBllJOUjAJmNJSJiIeUUpQoSwOMATyUTk5OSv////9K/////0sAdJRiSwRLHIaUjAFDlHSUUpQu"
50
  },
51
  "_last_episode_starts": {
52
  ":type:": "<class 'numpy.ndarray'>",
@@ -54,7 +54,7 @@
54
  },
55
  "_last_original_obs": {
56
  ":type:": "<class 'numpy.ndarray'>",
57
- ":serialized:": "gAWVNQIAAAAAAACMEm51bXB5LmNvcmUubnVtZXJpY5SMC19mcm9tYnVmZmVylJOUKJbAAQAAAAAAAAAAAAAjRi62AACAPwAAAAAAAAAAAAAAAAAAAAAAAACA5m9dPQAAAACKDt2/AAAAAJWd1zwAAAAA+ovgPwAAAAB3Rxy8AAAAAIdl+z8AAAAA0kOZPQAAAACf5Om/AAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAzPPrNAAAgD8AAAAAAAAAAAAAAAAAAAAAAAAAgEvevr0AAAAASN3fvwAAAACc9Mq9AAAAAOU+/z8AAAAASfvtPQAAAAAQ+OM/AAAAAExuvD0AAAAAhfjqvwAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAM7MqTYAAIA/AAAAAAAAAAAAAAAAAAAAAAAAAIAq5G29AAAAAK9p/L8AAAAAf2jmPQAAAAAyt+U/AAAAAH/75T0AAAAAqQ3iPwAAAADgBoY9AAAAAF38678AAAAAAAAAAAAAAAAAAAAAAAAAAAAAAACftnO1AACAPwAAAAAAAAAAAAAAAAAAAAAAAACAD/4IPQAAAAAO1/W/AAAAAMQXuD0AAAAAG7zdPwAAAABReb48AAAAAHk//j8AAAAAXurvPQAAAAAzzey/AAAAAAAAAAAAAAAAAAAAAAAAAACUjAVudW1weZSMBWR0eXBllJOUjAJmNJSJiIeUUpQoSwOMATyUTk5OSv////9K/////0sAdJRiSwRLHIaUjAFDlHSUUpQu"
58
  },
59
  "_episode_num": 0,
60
  "use_sde": true,
@@ -63,7 +63,7 @@
63
  "_stats_window_size": 100,
64
  "ep_info_buffer": {
65
  ":type:": "<class 'collections.deque'>",
66
- ":serialized:": "gAWVQwwAAAAAAACMC2NvbGxlY3Rpb25zlIwFZGVxdWWUk5QpS2SGlFKUKH2UKIwBcpRHQJJn9z+3pfSMAWyUTegDjAF0lEdAq06n5N47inV9lChoBkdAkqeQwj+rEWgHTegDaAhHQKtSE72+PBB1fZQoaAZHQJKYLjENvwVoB03oA2gIR0CrWUSJTER8dX2UKGgGR0CQGj0PpY9xaAdN6ANoCEdAq1lxVsDW9XV9lChoBkdAkU2e3Ytg8mgHTegDaAhHQKta/ViF0xN1fZQoaAZHQIvtWIGhVVBoB03oA2gIR0CrXydPk7wKdX2UKGgGR0CSW1D6WPcSaAdN6ANoCEdAq2jxujynUHV9lChoBkdAkwq+k1uR92gHTegDaAhHQKtpHNB4Uvh1fZQoaAZHQJRWC/xlQMxoB03oA2gIR0Crap/i5uqFdX2UKGgGR0CR4bSk0rLAaAdN6ANoCEdAq23/rY5DJHV9lChoBkdAlUa7hrFfiWgHTegDaAhHQKt1DvrGBFx1fZQoaAZHQJZsZUzbeuVoB03oA2gIR0CrdTon0CiidX2UKGgGR0CT6jYzSCvpaAdN6ANoCEdAq3a8Fr2xp3V9lChoBkdAltQlyzXz2GgHTegDaAhHQKt6M3kPtlZ1fZQoaAZHQJX6TiZOSGJoB03oA2gIR0CrhH8TakAQdX2UKGgGR0CTvbA6Mir1aAdN6ANoCEdAq4TFz0Yj0XV9lChoBkdAlzqLmlqJuWgHTegDaAhHQKuGZTrE9+x1fZQoaAZHQJaqeWjXWe9oB03oA2gIR0CrifBbnoxIdX2UKGgGR0CWcB0Yj0L/aAdN6ANoCEdAq5DnSa3I/HV9lChoBkdAlhCKpgkTpWgHTegDaAhHQKuREMRYigV1fZQoaAZHQJV9WvwEyL1oB03oA2gIR0Crkqp2ECeVdX2UKGgGR0CWSf8Sf16FaAdN6ANoCEdAq5ZmALApKHV9lChoBkdAkjT6PKdQPGgHTegDaAhHQKufxBQemvZ1fZQoaAZHQIyOnGwRoRJoB03oA2gIR0CroA4IBzV+dX2UKGgGR0CVMVcG1QZXaAdN6ANoCEdAq6Jt/QSi/XV9lChoBkdAk7U7mMfigmgHTegDaAhHQKumFleWv8t1fZQoaAZHQJCH4qlP8AJoB03oA2gIR0CrrT7TUiIMdX2UKGgGR0CSLz3ueBhAaAdN6ANoCEdAq61rTBqKxnV9lChoBkdAkQeNAX2ugmgHTegDaAhHQKuu+pXIU8F1fZQoaAZHQJL7jsyBTXJoB03oA2gIR0Crsnei8FpxdX2UKGgGR0CR1fPFvQ4TaAdN6ANoCEdAq7qtTFVDKHV9lChoBkdAk+8YBvJiiWgHTegDaAhHQKu68JTl1bJ1fZQoaAZHQJOaPLfUF0RoB03oA2gIR0CrvVmK64DtdX2UKGgGR0CSf7SLZSNwaAdN6ANoCEdAq8IhTZQHiXV9lChoBkdAk5hwLRa5gGgHTegDaAhHQKvJW0CzTnd1fZQoaAZHQJPU0XyiEg5oB03oA2gIR0CryYd+XqqwdX2UKGgGR0CU5GMFlkH2aAdN6ANoCEdAq8sImCyyEHV9lChoBkdAYeQsQNCqqGgHS6poCEdAq8tvDUExI3V9lChoBkdAkVwkdzXBg2gHTegDaAhHQKvOcDsdDIB1fZQoaAZHQJVSmSX+l0poB03oA2gIR0Cr1n2nKnvVdX2UKGgGR0CSqgQxesxPaAdN6ANoCEdAq9ip+OOsDHV9lChoBkdAkifWuX/o7mgHTegDaAhHQKvZOD3/PxB1fZQoaAZHQJaD5VJcxCZoB03oA2gIR0Cr3gKubI91dX2UKGgGR0CUDEYAKfFraAdN6ANoCEdAq+W+ZgG8mXV9lChoBkdAlWld5Y5ksmgHTegDaAhHQKvnQgK4QSV1fZQoaAZHQIwT6qCHymRoB03oA2gIR0Cr56M8gZCOdX2UKGgGR0CVyC+GXXyzaAdN6ANoCEdAq+rBL/S6UnV9lChoBkdAlAzCHM2WIGgHTegDaAhHQKvx/sTFl051fZQoaAZHQJHf4S7GvOhoB03oA2gIR0Cr872BJ7LMdX2UKGgGR0CTDcTnJT2naAdN6ANoCEdAq/RPJPqLTHV9lChoBkdAlPICWeHzpWgHTegDaAhHQKv46aNMoMN1fZQoaAZHQI6HmjASFoNoB03oA2gIR0CsAdlN+LFXdX2UKGgGR0CQvyvB7/n4aAdN6ANoCEdArANi8lHBlHV9lChoBkdAkooJMxoIwGgHTegDaAhHQKwDxF0gbId1fZQoaAZHQJOUJZeRgZ1oB03oA2gIR0CsBtr9MsYmdX2UKGgGR0CBxGT4cm0FaAdN6ANoCEdArA46Ss8xK3V9lChoBkdAhLuOavzOHGgHTegDaAhHQKwPzKSxJNF1fZQoaAZHQI20l+CsfaJoB03oA2gIR0CsEC7zshPkdX2UKGgGR0CRp7JRwZO0aAdN6ANoCEdArBQsLa24NXV9lChoBkdAiKxkG7jDK2gHTegDaAhHQKwd8wWWQfZ1fZQoaAZHQJGUvo/zJ6poB03oA2gIR0CsH3yHM2WIdX2UKGgGR0CSv4B9Cu2aaAdN6ANoCEdArB/Zw++ueXV9lChoBkdAlDozxgAp8WgHTegDaAhHQKwi5pKSPlx1fZQoaAZHQJLvUnmaH9FoB03oA2gIR0CsKjFaKUFCdX2UKGgGR0CTRYOVgQYlaAdN6ANoCEdArCu4ZMtbtHV9lChoBkdAkdXt7SiM52gHTegDaAhHQKwsGX4TK1Z1fZQoaAZHQIIWrzPKMehoB03oA2gIR0CsLzV5jYqYdX2UKGgGR0CSUTqWTot+aAdN6ANoCEdArDoPvnbItHV9lChoBkdAi222vbGm12gHTegDaAhHQKw7kmj0tiB1fZQoaAZHQJLekyeqaPVoB03oA2gIR0CsO/me+VTrdX2UKGgGR0CHduw9JSR9aAdN6ANoCEdArD790A93bHV9lChoBkdAi8FZpi7TUmgHTegDaAhHQKxGGhY/3WZ1fZQoaAZHQJGMG25QP7NoB03oA2gIR0CsR5kQwsXjdX2UKGgGR0COOE0TDfm+aAdN6ANoCEdArEf/E87p3XV9lChoBkdAkHJ9To+wDGgHTegDaAhHQKxLKGHHmzV1fZQoaAZHQJGUdc3VColoB03oA2gIR0CsVQ6ttALRdX2UKGgGR0CQ6SL9MsYmaAdN6ANoCEdArFdZ9b5dnnV9lChoBkdAjqmaya/h2mgHTegDaAhHQKxXvBOYYzl1fZQoaAZHQI5l4llbu+hoB03oA2gIR0CsWs9QO4G2dX2UKGgGR0CLeUDbJwKjaAdN6ANoCEdArGIjKgZjx3V9lChoBkdAkKzjr/sE7mgHTegDaAhHQKxjqh8IAwR1fZQoaAZHQIQIllRP421oB03oA2gIR0CsZAoToMa1dX2UKGgGR0CQ69V/+bVjaAdN6ANoCEdArGcPDm8ujHV9lChoBkdAi1SbAckt3GgHTegDaAhHQKxvrzySV4Z1fZQoaAZHQI0u/5HmRvFoB03oA2gIR0Cscg7TlT3qdX2UKGgGR0CRlkYzSCvpaAdN6ANoCEdArHKpwOvt+nV9lChoBkdAjekEGqxTsWgHTegDaAhHQKx2vgzguRN1fZQoaAZHQIonmDcuandoB03oA2gIR0CsfkDAzpHJdX2UKGgGR0CMYcD9wWFfaAdN6ANoCEdArH/SAavRq3V9lChoBkdAgeiGhufmLmgHTegDaAhHQKyAOdMCcPR1fZQoaAZHQJL7WlchTwVoB03oA2gIR0Csg0ZB1LamdX2UKGgGR0CUDivVVghKaAdN6ANoCEdArIs+lGgBcXV9lChoBkdAkheBvm5lOGgHTegDaAhHQKyNb5ylvZR1fZQoaAZHQJNCHnq3VkNoB03oA2gIR0CsjgN+LFXJdX2UKGgGR0CRGjzsyBTXaAdN6ANoCEdArJLGrIYFaHV9lChoBkdAkv/eotL+P2gHTegDaAhHQKyaN6u4gA91fZQoaAZHQIrLhVp9JBhoB03oA2gIR0Csm8Cr92ovdX2UKGgGR0CL57b5dnkDaAdN6ANoCEdArJwnD3ueBnV9lChoBkdAkcCljZtelmgHTegDaAhHQKyfTyNn5BV1fZQoaAZHQIAQCfjCHh1oB027AmgIR0CsourCemNzdWUu"
67
  },
68
  "ep_success_buffer": {
69
  ":type:": "<class 'collections.deque'>",
 
4
  ":serialized:": "gAWVOwAAAAAAAACMIXN0YWJsZV9iYXNlbGluZXMzLmNvbW1vbi5wb2xpY2llc5SMEUFjdG9yQ3JpdGljUG9saWN5lJOULg==",
5
  "__module__": "stable_baselines3.common.policies",
6
  "__doc__": "\n Policy class for actor-critic algorithms (has both policy and value prediction).\n Used by A2C, PPO and the likes.\n\n :param observation_space: Observation space\n :param action_space: Action space\n :param lr_schedule: Learning rate schedule (could be constant)\n :param net_arch: The specification of the policy and value networks.\n :param activation_fn: Activation function\n :param ortho_init: Whether to use or not orthogonal initialization\n :param use_sde: Whether to use State Dependent Exploration or not\n :param log_std_init: Initial value for the log standard deviation\n :param full_std: Whether to use (n_features x n_actions) parameters\n for the std instead of only (n_features,) when using gSDE\n :param use_expln: Use ``expln()`` function instead of ``exp()`` to ensure\n a positive standard deviation (cf paper). It allows to keep variance\n above zero and prevent it from growing too fast. In practice, ``exp()`` is usually enough.\n :param squash_output: Whether to squash the output using a tanh function,\n this allows to ensure boundaries when using gSDE.\n :param features_extractor_class: Features extractor to use.\n :param features_extractor_kwargs: Keyword arguments\n to pass to the features extractor.\n :param share_features_extractor: If True, the features extractor is shared between the policy and value networks.\n :param normalize_images: Whether to normalize images or not,\n dividing by 255.0 (True by default)\n :param optimizer_class: The optimizer to use,\n ``th.optim.Adam`` by default\n :param optimizer_kwargs: Additional keyword arguments,\n excluding the learning rate, to pass to the optimizer\n ",
7
+ "__init__": "<function ActorCriticPolicy.__init__ at 0x7f51f005b1f0>",
8
+ "_get_constructor_parameters": "<function ActorCriticPolicy._get_constructor_parameters at 0x7f51f005b280>",
9
+ "reset_noise": "<function ActorCriticPolicy.reset_noise at 0x7f51f005b310>",
10
+ "_build_mlp_extractor": "<function ActorCriticPolicy._build_mlp_extractor at 0x7f51f005b3a0>",
11
+ "_build": "<function ActorCriticPolicy._build at 0x7f51f005b430>",
12
+ "forward": "<function ActorCriticPolicy.forward at 0x7f51f005b4c0>",
13
+ "extract_features": "<function ActorCriticPolicy.extract_features at 0x7f51f005b550>",
14
+ "_get_action_dist_from_latent": "<function ActorCriticPolicy._get_action_dist_from_latent at 0x7f51f005b5e0>",
15
+ "_predict": "<function ActorCriticPolicy._predict at 0x7f51f005b670>",
16
+ "evaluate_actions": "<function ActorCriticPolicy.evaluate_actions at 0x7f51f005b700>",
17
+ "get_distribution": "<function ActorCriticPolicy.get_distribution at 0x7f51f005b790>",
18
+ "predict_values": "<function ActorCriticPolicy.predict_values at 0x7f51f005b820>",
19
  "__abstractmethods__": "frozenset()",
20
+ "_abc_impl": "<_abc._abc_data object at 0x7f51f0059b00>"
21
  },
22
  "verbose": 1,
23
  "policy_kwargs": {
 
37
  "_num_timesteps_at_start": 0,
38
  "seed": null,
39
  "action_noise": null,
40
+ "start_time": 1681288652863329946,
41
+ "learning_rate": 0.0001,
42
  "tensorboard_log": null,
43
  "lr_schedule": {
44
  ":type:": "<class 'function'>",
45
+ ":serialized:": "gAWVwwIAAAAAAACMF2Nsb3VkcGlja2xlLmNsb3VkcGlja2xllIwOX21ha2VfZnVuY3Rpb26Uk5QoaACMDV9idWlsdGluX3R5cGWUk5SMCENvZGVUeXBllIWUUpQoSwFLAEsASwFLAUsTQwSIAFMAlE6FlCmMAV+UhZSMSC91c3IvbG9jYWwvbGliL3B5dGhvbjMuOS9kaXN0LXBhY2thZ2VzL3N0YWJsZV9iYXNlbGluZXMzL2NvbW1vbi91dGlscy5weZSMBGZ1bmOUS4JDAgABlIwDdmFslIWUKXSUUpR9lCiMC19fcGFja2FnZV9flIwYc3RhYmxlX2Jhc2VsaW5lczMuY29tbW9ulIwIX19uYW1lX1+UjB5zdGFibGVfYmFzZWxpbmVzMy5jb21tb24udXRpbHOUjAhfX2ZpbGVfX5SMSC91c3IvbG9jYWwvbGliL3B5dGhvbjMuOS9kaXN0LXBhY2thZ2VzL3N0YWJsZV9iYXNlbGluZXMzL2NvbW1vbi91dGlscy5weZR1Tk5oAIwQX21ha2VfZW1wdHlfY2VsbJSTlClSlIWUdJRSlIwcY2xvdWRwaWNrbGUuY2xvdWRwaWNrbGVfZmFzdJSMEl9mdW5jdGlvbl9zZXRzdGF0ZZSTlGgffZR9lChoFmgNjAxfX3F1YWxuYW1lX1+UjBljb25zdGFudF9mbi48bG9jYWxzPi5mdW5jlIwPX19hbm5vdGF0aW9uc19flH2UjA5fX2t3ZGVmYXVsdHNfX5ROjAxfX2RlZmF1bHRzX1+UTowKX19tb2R1bGVfX5RoF4wHX19kb2NfX5ROjAtfX2Nsb3N1cmVfX5RoAIwKX21ha2VfY2VsbJSTlEc/Gjbi6xxDLYWUUpSFlIwXX2Nsb3VkcGlja2xlX3N1Ym1vZHVsZXOUXZSMC19fZ2xvYmFsc19flH2UdYaUhlIwLg=="
46
  },
47
  "_last_obs": {
48
  ":type:": "<class 'numpy.ndarray'>",
49
+ ":serialized:": "gAWVNQIAAAAAAACMEm51bXB5LmNvcmUubnVtZXJpY5SMC19mcm9tYnVmZmVylJOUKJbAAQAAAAAAACakjz/Kkc8+UTAqP5bTUz+xgeM/Ryogv5sWpz5YAR8/Q7Z0v9cNiL1rmhs+q3q4v6yaRD+ASsY/YF3bv/1WUT8Ouc6+XZN+vmm9k79wnkjAoRXIvwwywzwI0DM/EiAdPW9XuL+kt8Q+lvP1PjbKXj9RuZI++BBiP7aJBj9CwZg9k7C9P/zmvT7v7JQ/T+xBPv9Nj78gT0A85Q6APutZer8UT+2/1IOEP6RL1b9tk9e9Dce6vTm6Zb2HHBE/KzGGPbVFRb7m55G/kLLxvkp9cz1vV7i/pLfEPpbz9T42yl4/oREPP+YlYr86dAq+1iB4v/nUFz9WsY+6QF3kProGBr1lh4c/5uBuPhHbwz/J4o28gXK0P+sXWj760Ku+jgUSPh0K5T6f4L893q+SPdaf/j2bK8Q/Tb1puv7dbD+p7wW8y8ExP6S3xD6W8/U+NspePxYXfD9+DHg/FonzPgOFwj8pLVc/7C0yPpKqpj+aIYg/slaSvw9/UL/y6kk/QONUP/qJGsAbbSU+1G3Bv8dV7r/joYm/mGQvPk4Zlr9xXKs/WuXCP+MDK7++vES/zIIFQMvBMT/zkibAlvP1Po0Uk7+UjAVudW1weZSMBWR0eXBllJOUjAJmNJSJiIeUUpQoSwOMATyUTk5OSv////9K/////0sAdJRiSwRLHIaUjAFDlHSUUpQu"
50
  },
51
  "_last_episode_starts": {
52
  ":type:": "<class 'numpy.ndarray'>",
 
54
  },
55
  "_last_original_obs": {
56
  ":type:": "<class 'numpy.ndarray'>",
57
+ ":serialized:": "gAWVNQIAAAAAAACMEm51bXB5LmNvcmUubnVtZXJpY5SMC19mcm9tYnVmZmVylJOUKJbAAQAAAAAAAAAAAACBcsi2AACAPwAAAAAAAAAAAAAAAAAAAAAAAACAv2AIvAAAAACfDNm/AAAAAE/8GL0AAAAAIxH6PwAAAAAlHfm9AAAAAGOQ3z8AAAAApx3kPQAAAAAPkeu/AAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAcQaHtgAAgD8AAAAAAAAAAAAAAAAAAAAAAAAAgKGBwD0AAAAAt5HlvwAAAAC6sq07AAAAANWZ6z8AAAAAaTo2vQAAAABvhQBAAAAAAKeMQD0AAAAAdfb+vwAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAFnP7DQAAIA/AAAAAAAAAAAAAAAAAAAAAAAAAIAMWJS7AAAAAGcu7L8AAAAAvT/lvQAAAACan+w/AAAAAIxUAz4AAAAA9e3pPwAAAABX6Oe6AAAAAKVI/r8AAAAAAAAAAAAAAAAAAAAAAAAAAAAAAADCL/41AACAPwAAAAAAAAAAAAAAAAAAAAAAAACAm0GSvQAAAAA+Oei/AAAAAC613rwAAAAAji/wPwAAAAAmw9Y9AAAAAMHR+D8AAAAAfvx1PQAAAAAu0vO/AAAAAAAAAAAAAAAAAAAAAAAAAACUjAVudW1weZSMBWR0eXBllJOUjAJmNJSJiIeUUpQoSwOMATyUTk5OSv////9K/////0sAdJRiSwRLHIaUjAFDlHSUUpQu"
58
  },
59
  "_episode_num": 0,
60
  "use_sde": true,
 
63
  "_stats_window_size": 100,
64
  "ep_info_buffer": {
65
  ":type:": "<class 'collections.deque'>",
66
+ ":serialized:": "gAWVRAwAAAAAAACMC2NvbGxlY3Rpb25zlIwFZGVxdWWUk5QpS2SGlFKUKH2UKIwBcpRHQJidmUs4DLeMAWyUTegDjAF0lEdAwgVsB8QZoHV9lChoBkdAlHO8Rcu8LGgHTegDaAhHQMIG6sJ6Y3N1fZQoaAZHQJfHA/qxC6ZoB03oA2gIR0DCBwzEvTPTdX2UKGgGR0CY9KS5AhStaAdN6ANoCEdAwgcS/M4cWHV9lChoBkdAlcHHPJJXhmgHTegDaAhHQMIJ5N+TeO51fZQoaAZHQJfWdZkkKNRoB03oA2gIR0DCCyL+WGATdX2UKGgGR0CYK/BOYYzjaAdN6ANoCEdAwgtdUjLSu3V9lChoBkdAl3hrVJ+UhWgHTegDaAhHQMILZvGp++d1fZQoaAZHQJV3Qlu3trtoB03oA2gIR0DCD3SnpB5YdX2UKGgGR0CZBhC53C9AaAdN6ANoCEdAwhDA+tbLU3V9lChoBkdAlcLPDxb0OGgHTegDaAhHQMIQ6Sr5qM51fZQoaAZHQJZZbOIInjRoB03oA2gIR0DCEO+mFajfdX2UKGgGR0CbScNVzZHvaAdN6ANoCEdAwhOYLkS26XV9lChoBkdAmAOTJ+2E02gHTegDaAhHQMIVd20zCUJ1fZQoaAZHQJS6gSYgJTloB03oA2gIR0DCFa7XnQpndX2UKGgGR0CWKX8rI5o5aAdN6ANoCEdAwhW46qbSZ3V9lChoBkdAlU9KVD8cdmgHTegDaAhHQMIY8U8NhE11fZQoaAZHQJYtLyrgflpoB03oA2gIR0DCGi18qnWKdX2UKGgGR0CWsKos7MgVaAdN6ANoCEdAwhpNcVxjrnV9lChoBkdAmWsmFzuF6GgHTegDaAhHQMIaU9DhLoR1fZQoaAZHQJe7dnBciW5oB03oA2gIR0DCHW0EJSiudX2UKGgGR0CXmfHP/rB1aAdN6ANoCEdAwh9qQz1scnV9lChoBkdAmFsAk9lmOGgHTegDaAhHQMIflrlmvnt1fZQoaAZHQJiGZlI3BHloB03oA2gIR0DCH51eUpuudX2UKGgGR0CXJF5XU6PsaAdN6ANoCEdAwiJ2lE7W/nV9lChoBkdAlJTgIUrTY2gHTegDaAhHQMIjvYKx9oh1fZQoaAZHQJZE6WjXWe9oB03oA2gIR0DCI+WLzf78dX2UKGgGR0CaUkAn2IweaAdN6ANoCEdAwiPsVzIV/XV9lChoBkdAla9c4o7V8WgHTegDaAhHQMIn3KJl8PZ1fZQoaAZHQJdKVWkrPMVoB03oA2gIR0DCKSBOLzf8dX2UKGgGR0CZW7KiwjdIaAdN6ANoCEdAwik+/zJ6p3V9lChoBkdAlcGvxUedTmgHTegDaAhHQMIpRYcvM8p1fZQoaAZHQJg3bxy4nWtoB03oA2gIR0DCK/17jT8YdX2UKGgGR0CWUQrZrYXgaAdN6ANoCEdAwi12AVfu1HV9lChoBkdAlSlLWmP5pWgHTegDaAhHQMItrEVnEl51fZQoaAZHQJhkDdnCfpVoB03oA2gIR0DCLbXn2ZiNdX2UKGgGR0CY71RkmQbNaAdN6ANoCEdAwjGTZQpF1HV9lChoBkdAm+YKUmlZYGgHTegDaAhHQMIy59/jKgZ1fZQoaAZHQJXNJIsiB5JoB03oA2gIR0DCMwoe3hGZdX2UKGgGR0CZTc/T9bX6aAdN6ANoCEdAwjMQmwaBJHV9lChoBkdAkm3ZQ+EAYGgHTegDaAhHQMI128dxQzl1fZQoaAZHQJhtd+z+m3xoB03oA2gIR0DCN+KobXHzdX2UKGgGR0CWcaq4pc5baAdN6ANoCEdAwjgec2BJ7XV9lChoBkdAmRDK5sj3VWgHTegDaAhHQMI4KNxdY4h1fZQoaAZHQJdY9Gqgh8poB03oA2gIR0DCO0WycCo1dX2UKGgGR0CWQHHVPN3XaAdN6ANoCEdAwjyo5paibnV9lChoBkdAl87JjlPrOmgHTegDaAhHQMI80QJPZZl1fZQoaAZHQJtjAuAZsKtoB03oA2gIR0DCPNeUfPondX2UKGgGR0CXWFRSxZ+yaAdN6ANoCEdAwkBfY+0PYnV9lChoBkdAmckZCngpB2gHTegDaAhHQMJCBrfk3jx1fZQoaAZHQJdlzWvr4WVoB03oA2gIR0DCQioLNOdodX2UKGgGR0CWfFXSjQAuaAdN6ANoCEdAwkIxUWEbpHV9lChoBkdAl/gE2pAD72gHTegDaAhHQMJEw5lvqC91fZQoaAZHQJao+9K28ZloB03oA2gIR0DCRf/gUDdQdX2UKGgGR0CbHnQWepXIaAdN6ANoCEdAwkYnP+n623V9lChoBkdAmN1BwVCXyGgHTegDaAhHQMJGLOkLx7R1fZQoaAZHQJWuaKAJ9iNoB03oA2gIR0DCSk3qTr3TdX2UKGgGR0CYcd4NqgyuaAdN6ANoCEdAwkuY/qxC6nV9lChoBkdAlx6QNwzch2gHTegDaAhHQMJLv1Muez51fZQoaAZHQJjAk2Hck+poB03oA2gIR0DCS8bm6oVEdX2UKGgGR0CZ+sqkdmxuaAdN6ANoCEdAwk6OpWFN+XV9lChoBkdAl4yo5ggHNWgHTegDaAhHQMJQJ2M85jp1fZQoaAZHQJU/t7AtWdVoB03oA2gIR0DCUFmr4nF6dX2UKGgGR0CaZUIkZ75VaAdN6ANoCEdAwlBihL5AQnV9lChoBkdAm3N4tQKrrGgHTegDaAhHQMJT96/h2nt1fZQoaAZHQJW4aDlHSWtoB03oA2gIR0DCVVfxSYPYdX2UKGgGR0CYc96Rhc7haAdN6ANoCEdAwlV8bAk9lnV9lChoBkdAmoRFJYkmhWgHTegDaAhHQMJVhDEvTPV1fZQoaAZHQJl2HwazeGhoB03oA2gIR0DCWNcbJfY0dX2UKGgGR0CXfyoIv8IiaAdN6ANoCEdAwlq8814xDnV9lChoBkdAk5ly5qdpZmgHTegDaAhHQMJa4fsNUfh1fZQoaAZHQJdxQxcmjTNoB03oA2gIR0DCWuiXlbNbdX2UKGgGR0CQ8ohoM8YAaAdN6ANoCEdAwl2OHoHLR3V9lChoBkdAlubBIre67WgHTegDaAhHQMJe434CZF51fZQoaAZHQJjotf1HvttoB03oA2gIR0DCXwh8IAwPdX2UKGgGR0CZsFIsiB5HaAdN6ANoCEdAwl8P5gPVeHV9lChoBkdAmOF20Re1KGgHTegDaAhHQMJi23Vsk6d1fZQoaAZHQJXsmydFvydoB03oA2gIR0DCZCPOObRXdX2UKGgGR0CZmlRg7YChaAdN6ANoCEdAwmRDqKP4mHV9lChoBkdAmE+w1rIo3WgHTegDaAhHQMJkSYKx9oh1fZQoaAZHQJYBi3XqZ+hoB03oA2gIR0DCZxunjyWidX2UKGgGR0CXHO3Ehq0uaAdN6ANoCEdAwmi3wd8zAXV9lChoBkdAl9eXY150KmgHTegDaAhHQMJo7nJ9y951fZQoaAZHQJiEnBj4HopoB03oA2gIR0DCaPeQMhHLdX2UKGgGR0CZVcRGc4HYaAdN6ANoCEdAwmy2r+YMOXV9lChoBkdAl2YcUAT7EmgHTegDaAhHQMJt6pm29ct1fZQoaAZHQJo0Q99tuUFoB03oA2gIR0DCbg6FEiMYdX2UKGgGR0CZgSEGqxTsaAdN6ANoCEdAwm4Vr6ciGHV9lChoBkdAmSVnPE87p2gHTegDaAhHQMJw6Z4W1tx1fZQoaAZHQJmDhLYf4h5oB03oA2gIR0DCcteu9vjwdX2UKGgGR0CXrzYQarFPaAdN6ANoCEdAwnMQRhc7hnV9lChoBkdAlrxx9b5dnmgHTegDaAhHQMJzGtTkyUN1fZQoaAZHQJYc2r8zhxZoB03oA2gIR0DCdiGcSXdCdX2UKGgGR0CYVeCa7VawaAdN6ANoCEdAwneEgIQe3nV9lChoBkdAmNflyeZof2gHTegDaAhHQMJ3pmvfTCt1fZQoaAZHQJkxH6eoUBZoB03oA2gIR0DCd60INVindX2UKGgGR0CZJXBUaQ3haAdN6ANoCEdAwntvYpUgjnV9lChoBkdAmU9/GlyimGgHTegDaAhHQMJ81gPNFBp1fZQoaAZHQJnwINKAavRoB03oA2gIR0DCfPpxBE8adX2UKGgGR0CYmfpobn5jaAdN6ANoCEdAwn0Bz8P4EnVlLg=="
67
  },
68
  "ep_success_buffer": {
69
  ":type:": "<class 'collections.deque'>",
a2c-AntBulletEnv-v0/policy.optimizer.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:b7ca5f3a3ab72fedf1fb5577af6a1c7ce42cc5bb6f6955c753f104efadad26b9
3
- size 56190
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b720c4c505ef920ccdb0804b474d841cf5119f56f904d2246ecba9f599f00f6f
3
+ size 56062
a2c-AntBulletEnv-v0/policy.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:8cad0be0ed2ce159114659003a0a61442abd5ba791c7bd54152133d194a7e7fe
3
- size 56894
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:7f60fb7bf909dab05e132f8b385afb808076ba13626ddb3138f70efb2fbebd19
3
+ size 56766
a2c-AntBulletEnv-v0/system_info.txt CHANGED
@@ -2,6 +2,6 @@
2
  - Python: 3.9.16
3
  - Stable-Baselines3: 1.8.0
4
  - PyTorch: 2.0.0+cu118
5
- - GPU Enabled: True
6
  - Numpy: 1.22.4
7
  - Gym: 0.21.0
 
2
  - Python: 3.9.16
3
  - Stable-Baselines3: 1.8.0
4
  - PyTorch: 2.0.0+cu118
5
+ - GPU Enabled: False
6
  - Numpy: 1.22.4
7
  - Gym: 0.21.0
config.json CHANGED
@@ -1 +1 @@
1
- {"policy_class": {":type:": "<class 'abc.ABCMeta'>", ":serialized:": "gAWVOwAAAAAAAACMIXN0YWJsZV9iYXNlbGluZXMzLmNvbW1vbi5wb2xpY2llc5SMEUFjdG9yQ3JpdGljUG9saWN5lJOULg==", "__module__": "stable_baselines3.common.policies", "__doc__": "\n Policy class for actor-critic algorithms (has both policy and value prediction).\n Used by A2C, PPO and the likes.\n\n :param observation_space: Observation space\n :param action_space: Action space\n :param lr_schedule: Learning rate schedule (could be constant)\n :param net_arch: The specification of the policy and value networks.\n :param activation_fn: Activation function\n :param ortho_init: Whether to use or not orthogonal initialization\n :param use_sde: Whether to use State Dependent Exploration or not\n :param log_std_init: Initial value for the log standard deviation\n :param full_std: Whether to use (n_features x n_actions) parameters\n for the std instead of only (n_features,) when using gSDE\n :param use_expln: Use ``expln()`` function instead of ``exp()`` to ensure\n a positive standard deviation (cf paper). It allows to keep variance\n above zero and prevent it from growing too fast. In practice, ``exp()`` is usually enough.\n :param squash_output: Whether to squash the output using a tanh function,\n this allows to ensure boundaries when using gSDE.\n :param features_extractor_class: Features extractor to use.\n :param features_extractor_kwargs: Keyword arguments\n to pass to the features extractor.\n :param share_features_extractor: If True, the features extractor is shared between the policy and value networks.\n :param normalize_images: Whether to normalize images or not,\n dividing by 255.0 (True by default)\n :param optimizer_class: The optimizer to use,\n ``th.optim.Adam`` by default\n :param optimizer_kwargs: Additional keyword arguments,\n excluding the learning rate, to pass to the optimizer\n ", "__init__": "<function ActorCriticPolicy.__init__ at 0x7fec6ce7f280>", "_get_constructor_parameters": "<function ActorCriticPolicy._get_constructor_parameters at 0x7fec6ce7f310>", "reset_noise": "<function ActorCriticPolicy.reset_noise at 0x7fec6ce7f3a0>", "_build_mlp_extractor": "<function ActorCriticPolicy._build_mlp_extractor at 0x7fec6ce7f430>", "_build": "<function ActorCriticPolicy._build at 0x7fec6ce7f4c0>", "forward": "<function ActorCriticPolicy.forward at 0x7fec6ce7f550>", "extract_features": "<function ActorCriticPolicy.extract_features at 0x7fec6ce7f5e0>", "_get_action_dist_from_latent": "<function ActorCriticPolicy._get_action_dist_from_latent at 0x7fec6ce7f670>", "_predict": "<function ActorCriticPolicy._predict at 0x7fec6ce7f700>", "evaluate_actions": "<function ActorCriticPolicy.evaluate_actions at 0x7fec6ce7f790>", "get_distribution": "<function ActorCriticPolicy.get_distribution at 0x7fec6ce7f820>", "predict_values": "<function ActorCriticPolicy.predict_values at 0x7fec6ce7f8b0>", "__abstractmethods__": "frozenset()", "_abc_impl": "<_abc._abc_data object at 0x7fec6ce802c0>"}, "verbose": 1, "policy_kwargs": {":type:": "<class 'dict'>", ":serialized:": "gAWVowAAAAAAAAB9lCiMDGxvZ19zdGRfaW5pdJRK/v///4wKb3J0aG9faW5pdJSJjA9vcHRpbWl6ZXJfY2xhc3OUjBN0b3JjaC5vcHRpbS5ybXNwcm9wlIwHUk1TcHJvcJSTlIwQb3B0aW1pemVyX2t3YXJnc5R9lCiMBWFscGhhlEc/764UeuFHrowDZXBzlEc+5Pi1iONo8YwMd2VpZ2h0X2RlY2F5lEsAdXUu", "log_std_init": -2, "ortho_init": false, "optimizer_class": "<class 'torch.optim.rmsprop.RMSprop'>", "optimizer_kwargs": {"alpha": 0.99, "eps": 1e-05, "weight_decay": 0}}, "num_timesteps": 2000000, "_total_timesteps": 2000000, "_num_timesteps_at_start": 0, "seed": null, "action_noise": null, "start_time": 1681226124513463565, "learning_rate": 0.00096, "tensorboard_log": null, "lr_schedule": {":type:": "<class 'function'>", ":serialized:": "gAWVwwIAAAAAAACMF2Nsb3VkcGlja2xlLmNsb3VkcGlja2xllIwOX21ha2VfZnVuY3Rpb26Uk5QoaACMDV9idWlsdGluX3R5cGWUk5SMCENvZGVUeXBllIWUUpQoSwFLAEsASwFLAUsTQwSIAFMAlE6FlCmMAV+UhZSMSC91c3IvbG9jYWwvbGliL3B5dGhvbjMuOS9kaXN0LXBhY2thZ2VzL3N0YWJsZV9iYXNlbGluZXMzL2NvbW1vbi91dGlscy5weZSMBGZ1bmOUS4JDAgABlIwDdmFslIWUKXSUUpR9lCiMC19fcGFja2FnZV9flIwYc3RhYmxlX2Jhc2VsaW5lczMuY29tbW9ulIwIX19uYW1lX1+UjB5zdGFibGVfYmFzZWxpbmVzMy5jb21tb24udXRpbHOUjAhfX2ZpbGVfX5SMSC91c3IvbG9jYWwvbGliL3B5dGhvbjMuOS9kaXN0LXBhY2thZ2VzL3N0YWJsZV9iYXNlbGluZXMzL2NvbW1vbi91dGlscy5weZR1Tk5oAIwQX21ha2VfZW1wdHlfY2VsbJSTlClSlIWUdJRSlIwcY2xvdWRwaWNrbGUuY2xvdWRwaWNrbGVfZmFzdJSMEl9mdW5jdGlvbl9zZXRzdGF0ZZSTlGgffZR9lChoFmgNjAxfX3F1YWxuYW1lX1+UjBljb25zdGFudF9mbi48bG9jYWxzPi5mdW5jlIwPX19hbm5vdGF0aW9uc19flH2UjA5fX2t3ZGVmYXVsdHNfX5ROjAxfX2RlZmF1bHRzX1+UTowKX19tb2R1bGVfX5RoF4wHX19kb2NfX5ROjAtfX2Nsb3N1cmVfX5RoAIwKX21ha2VfY2VsbJSTlEc/T3UQTVUdaYWUUpSFlIwXX2Nsb3VkcGlja2xlX3N1Ym1vZHVsZXOUXZSMC19fZ2xvYmFsc19flH2UdYaUhlIwLg=="}, "_last_obs": {":type:": "<class 'numpy.ndarray'>", ":serialized:": "gAWVNQIAAAAAAACMEm51bXB5LmNvcmUubnVtZXJpY5SMC19mcm9tYnVmZmVylJOUKJbAAQAAAAAAAGt/bj/eCna+Ea7xPolotr8G8Ng/G0EWP4+lA7841T299q1aPlcNA8CttWa/KWM3PH9UfL/46Zo+lKXEvVm2ML9G9Em+gCb4P8T92z4NTipAkxHEPQW6I78+sP0/Tk+5vuU2C8DaoZM+5tcJwImANj+Czpc/eOa+v6slOsBayAI/BfffPYtHwT2sjxo/TrL8vtKghL8mQYBACJIcQH1Pj0AiLEy/EAIjv+jKhb/gLDs/VRzUP/mwTL97IYy+SrPXvub86T/T4MQ9Tge9PwrpoT7lNgvA2qGTPhe47T6JgDY/Ip2BP/tuer9LuYi+/6kkP+O4UL+PKSa/rrNTP0lDc7+DRrI911UuwPhF9T9L51/Aq7pUvxwyuj8PHjy/mjGUv0q9vb/DCXU/lxwZP7/h3T+FBiI/VaZxvsoNpz8q1BI/5TYLwPn0XcAXuO0+iYA2P10C7j7jK7K/cVqcv8RiBL4jhyi+hMpkPUmRvj86/uC+KTHlvxpuID2rF0K/pC3HPzIq9L4QQCBAReqVvzFiFz+CPCQ/8GmBP3IthT9/meW+UDJdPybUAUDn1Yw9fDFpPuU2C8DaoZM+F7jtPomANj+UjAVudW1weZSMBWR0eXBllJOUjAJmNJSJiIeUUpQoSwOMATyUTk5OSv////9K/////0sAdJRiSwRLHIaUjAFDlHSUUpQu"}, "_last_episode_starts": {":type:": "<class 'numpy.ndarray'>", ":serialized:": "gAWVdwAAAAAAAACMEm51bXB5LmNvcmUubnVtZXJpY5SMC19mcm9tYnVmZmVylJOUKJYEAAAAAAAAAAAAAACUjAVudW1weZSMBWR0eXBllJOUjAJiMZSJiIeUUpQoSwOMAXyUTk5OSv////9K/////0sAdJRiSwSFlIwBQ5R0lFKULg=="}, "_last_original_obs": {":type:": "<class 'numpy.ndarray'>", ":serialized:": "gAWVNQIAAAAAAACMEm51bXB5LmNvcmUubnVtZXJpY5SMC19mcm9tYnVmZmVylJOUKJbAAQAAAAAAAAAAAAAjRi62AACAPwAAAAAAAAAAAAAAAAAAAAAAAACA5m9dPQAAAACKDt2/AAAAAJWd1zwAAAAA+ovgPwAAAAB3Rxy8AAAAAIdl+z8AAAAA0kOZPQAAAACf5Om/AAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAzPPrNAAAgD8AAAAAAAAAAAAAAAAAAAAAAAAAgEvevr0AAAAASN3fvwAAAACc9Mq9AAAAAOU+/z8AAAAASfvtPQAAAAAQ+OM/AAAAAExuvD0AAAAAhfjqvwAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAM7MqTYAAIA/AAAAAAAAAAAAAAAAAAAAAAAAAIAq5G29AAAAAK9p/L8AAAAAf2jmPQAAAAAyt+U/AAAAAH/75T0AAAAAqQ3iPwAAAADgBoY9AAAAAF38678AAAAAAAAAAAAAAAAAAAAAAAAAAAAAAACftnO1AACAPwAAAAAAAAAAAAAAAAAAAAAAAACAD/4IPQAAAAAO1/W/AAAAAMQXuD0AAAAAG7zdPwAAAABReb48AAAAAHk//j8AAAAAXurvPQAAAAAzzey/AAAAAAAAAAAAAAAAAAAAAAAAAACUjAVudW1weZSMBWR0eXBllJOUjAJmNJSJiIeUUpQoSwOMATyUTk5OSv////9K/////0sAdJRiSwRLHIaUjAFDlHSUUpQu"}, "_episode_num": 0, "use_sde": true, "sde_sample_freq": -1, "_current_progress_remaining": 0.0, "_stats_window_size": 100, "ep_info_buffer": {":type:": "<class 'collections.deque'>", ":serialized:": "gAWVQwwAAAAAAACMC2NvbGxlY3Rpb25zlIwFZGVxdWWUk5QpS2SGlFKUKH2UKIwBcpRHQJJn9z+3pfSMAWyUTegDjAF0lEdAq06n5N47inV9lChoBkdAkqeQwj+rEWgHTegDaAhHQKtSE72+PBB1fZQoaAZHQJKYLjENvwVoB03oA2gIR0CrWUSJTER8dX2UKGgGR0CQGj0PpY9xaAdN6ANoCEdAq1lxVsDW9XV9lChoBkdAkU2e3Ytg8mgHTegDaAhHQKta/ViF0xN1fZQoaAZHQIvtWIGhVVBoB03oA2gIR0CrXydPk7wKdX2UKGgGR0CSW1D6WPcSaAdN6ANoCEdAq2jxujynUHV9lChoBkdAkwq+k1uR92gHTegDaAhHQKtpHNB4Uvh1fZQoaAZHQJRWC/xlQMxoB03oA2gIR0Crap/i5uqFdX2UKGgGR0CR4bSk0rLAaAdN6ANoCEdAq23/rY5DJHV9lChoBkdAlUa7hrFfiWgHTegDaAhHQKt1DvrGBFx1fZQoaAZHQJZsZUzbeuVoB03oA2gIR0CrdTon0CiidX2UKGgGR0CT6jYzSCvpaAdN6ANoCEdAq3a8Fr2xp3V9lChoBkdAltQlyzXz2GgHTegDaAhHQKt6M3kPtlZ1fZQoaAZHQJX6TiZOSGJoB03oA2gIR0CrhH8TakAQdX2UKGgGR0CTvbA6Mir1aAdN6ANoCEdAq4TFz0Yj0XV9lChoBkdAlzqLmlqJuWgHTegDaAhHQKuGZTrE9+x1fZQoaAZHQJaqeWjXWe9oB03oA2gIR0CrifBbnoxIdX2UKGgGR0CWcB0Yj0L/aAdN6ANoCEdAq5DnSa3I/HV9lChoBkdAlhCKpgkTpWgHTegDaAhHQKuREMRYigV1fZQoaAZHQJV9WvwEyL1oB03oA2gIR0Crkqp2ECeVdX2UKGgGR0CWSf8Sf16FaAdN6ANoCEdAq5ZmALApKHV9lChoBkdAkjT6PKdQPGgHTegDaAhHQKufxBQemvZ1fZQoaAZHQIyOnGwRoRJoB03oA2gIR0CroA4IBzV+dX2UKGgGR0CVMVcG1QZXaAdN6ANoCEdAq6Jt/QSi/XV9lChoBkdAk7U7mMfigmgHTegDaAhHQKumFleWv8t1fZQoaAZHQJCH4qlP8AJoB03oA2gIR0CrrT7TUiIMdX2UKGgGR0CSLz3ueBhAaAdN6ANoCEdAq61rTBqKxnV9lChoBkdAkQeNAX2ugmgHTegDaAhHQKuu+pXIU8F1fZQoaAZHQJL7jsyBTXJoB03oA2gIR0Crsnei8FpxdX2UKGgGR0CR1fPFvQ4TaAdN6ANoCEdAq7qtTFVDKHV9lChoBkdAk+8YBvJiiWgHTegDaAhHQKu68JTl1bJ1fZQoaAZHQJOaPLfUF0RoB03oA2gIR0CrvVmK64DtdX2UKGgGR0CSf7SLZSNwaAdN6ANoCEdAq8IhTZQHiXV9lChoBkdAk5hwLRa5gGgHTegDaAhHQKvJW0CzTnd1fZQoaAZHQJPU0XyiEg5oB03oA2gIR0CryYd+XqqwdX2UKGgGR0CU5GMFlkH2aAdN6ANoCEdAq8sImCyyEHV9lChoBkdAYeQsQNCqqGgHS6poCEdAq8tvDUExI3V9lChoBkdAkVwkdzXBg2gHTegDaAhHQKvOcDsdDIB1fZQoaAZHQJVSmSX+l0poB03oA2gIR0Cr1n2nKnvVdX2UKGgGR0CSqgQxesxPaAdN6ANoCEdAq9ip+OOsDHV9lChoBkdAkifWuX/o7mgHTegDaAhHQKvZOD3/PxB1fZQoaAZHQJaD5VJcxCZoB03oA2gIR0Cr3gKubI91dX2UKGgGR0CUDEYAKfFraAdN6ANoCEdAq+W+ZgG8mXV9lChoBkdAlWld5Y5ksmgHTegDaAhHQKvnQgK4QSV1fZQoaAZHQIwT6qCHymRoB03oA2gIR0Cr56M8gZCOdX2UKGgGR0CVyC+GXXyzaAdN6ANoCEdAq+rBL/S6UnV9lChoBkdAlAzCHM2WIGgHTegDaAhHQKvx/sTFl051fZQoaAZHQJHf4S7GvOhoB03oA2gIR0Cr872BJ7LMdX2UKGgGR0CTDcTnJT2naAdN6ANoCEdAq/RPJPqLTHV9lChoBkdAlPICWeHzpWgHTegDaAhHQKv46aNMoMN1fZQoaAZHQI6HmjASFoNoB03oA2gIR0CsAdlN+LFXdX2UKGgGR0CQvyvB7/n4aAdN6ANoCEdArANi8lHBlHV9lChoBkdAkooJMxoIwGgHTegDaAhHQKwDxF0gbId1fZQoaAZHQJOUJZeRgZ1oB03oA2gIR0CsBtr9MsYmdX2UKGgGR0CBxGT4cm0FaAdN6ANoCEdArA46Ss8xK3V9lChoBkdAhLuOavzOHGgHTegDaAhHQKwPzKSxJNF1fZQoaAZHQI20l+CsfaJoB03oA2gIR0CsEC7zshPkdX2UKGgGR0CRp7JRwZO0aAdN6ANoCEdArBQsLa24NXV9lChoBkdAiKxkG7jDK2gHTegDaAhHQKwd8wWWQfZ1fZQoaAZHQJGUvo/zJ6poB03oA2gIR0CsH3yHM2WIdX2UKGgGR0CSv4B9Cu2aaAdN6ANoCEdArB/Zw++ueXV9lChoBkdAlDozxgAp8WgHTegDaAhHQKwi5pKSPlx1fZQoaAZHQJLvUnmaH9FoB03oA2gIR0CsKjFaKUFCdX2UKGgGR0CTRYOVgQYlaAdN6ANoCEdArCu4ZMtbtHV9lChoBkdAkdXt7SiM52gHTegDaAhHQKwsGX4TK1Z1fZQoaAZHQIIWrzPKMehoB03oA2gIR0CsLzV5jYqYdX2UKGgGR0CSUTqWTot+aAdN6ANoCEdArDoPvnbItHV9lChoBkdAi222vbGm12gHTegDaAhHQKw7kmj0tiB1fZQoaAZHQJLekyeqaPVoB03oA2gIR0CsO/me+VTrdX2UKGgGR0CHduw9JSR9aAdN6ANoCEdArD790A93bHV9lChoBkdAi8FZpi7TUmgHTegDaAhHQKxGGhY/3WZ1fZQoaAZHQJGMG25QP7NoB03oA2gIR0CsR5kQwsXjdX2UKGgGR0COOE0TDfm+aAdN6ANoCEdArEf/E87p3XV9lChoBkdAkHJ9To+wDGgHTegDaAhHQKxLKGHHmzV1fZQoaAZHQJGUdc3VColoB03oA2gIR0CsVQ6ttALRdX2UKGgGR0CQ6SL9MsYmaAdN6ANoCEdArFdZ9b5dnnV9lChoBkdAjqmaya/h2mgHTegDaAhHQKxXvBOYYzl1fZQoaAZHQI5l4llbu+hoB03oA2gIR0CsWs9QO4G2dX2UKGgGR0CLeUDbJwKjaAdN6ANoCEdArGIjKgZjx3V9lChoBkdAkKzjr/sE7mgHTegDaAhHQKxjqh8IAwR1fZQoaAZHQIQIllRP421oB03oA2gIR0CsZAoToMa1dX2UKGgGR0CQ69V/+bVjaAdN6ANoCEdArGcPDm8ujHV9lChoBkdAi1SbAckt3GgHTegDaAhHQKxvrzySV4Z1fZQoaAZHQI0u/5HmRvFoB03oA2gIR0Cscg7TlT3qdX2UKGgGR0CRlkYzSCvpaAdN6ANoCEdArHKpwOvt+nV9lChoBkdAjekEGqxTsWgHTegDaAhHQKx2vgzguRN1fZQoaAZHQIonmDcuandoB03oA2gIR0CsfkDAzpHJdX2UKGgGR0CMYcD9wWFfaAdN6ANoCEdArH/SAavRq3V9lChoBkdAgeiGhufmLmgHTegDaAhHQKyAOdMCcPR1fZQoaAZHQJL7WlchTwVoB03oA2gIR0Csg0ZB1LamdX2UKGgGR0CUDivVVghKaAdN6ANoCEdArIs+lGgBcXV9lChoBkdAkheBvm5lOGgHTegDaAhHQKyNb5ylvZR1fZQoaAZHQJNCHnq3VkNoB03oA2gIR0CsjgN+LFXJdX2UKGgGR0CRGjzsyBTXaAdN6ANoCEdArJLGrIYFaHV9lChoBkdAkv/eotL+P2gHTegDaAhHQKyaN6u4gA91fZQoaAZHQIrLhVp9JBhoB03oA2gIR0Csm8Cr92ovdX2UKGgGR0CL57b5dnkDaAdN6ANoCEdArJwnD3ueBnV9lChoBkdAkcCljZtelmgHTegDaAhHQKyfTyNn5BV1fZQoaAZHQIAQCfjCHh1oB027AmgIR0CsourCemNzdWUu"}, "ep_success_buffer": {":type:": "<class 'collections.deque'>", ":serialized:": "gAWVIAAAAAAAAACMC2NvbGxlY3Rpb25zlIwFZGVxdWWUk5QpS2SGlFKULg=="}, "_n_updates": 62500, "n_steps": 8, "gamma": 0.99, "gae_lambda": 0.9, "ent_coef": 0.0, "vf_coef": 0.4, "max_grad_norm": 0.5, "normalize_advantage": false, "observation_space": {":type:": "<class 'gym.spaces.box.Box'>", ":serialized:": "gAWVZwIAAAAAAACMDmd5bS5zcGFjZXMuYm94lIwDQm94lJOUKYGUfZQojAVkdHlwZZSMBW51bXB5lGgFk5SMAmY0lImIh5RSlChLA4wBPJROTk5K/////0r/////SwB0lGKMBl9zaGFwZZRLHIWUjANsb3eUjBJudW1weS5jb3JlLm51bWVyaWOUjAtfZnJvbWJ1ZmZlcpSTlCiWcAAAAAAAAAAAAID/AACA/wAAgP8AAID/AACA/wAAgP8AAID/AACA/wAAgP8AAID/AACA/wAAgP8AAID/AACA/wAAgP8AAID/AACA/wAAgP8AAID/AACA/wAAgP8AAID/AACA/wAAgP8AAID/AACA/wAAgP8AAID/lGgKSxyFlIwBQ5R0lFKUjARoaWdolGgSKJZwAAAAAAAAAAAAgH8AAIB/AACAfwAAgH8AAIB/AACAfwAAgH8AAIB/AACAfwAAgH8AAIB/AACAfwAAgH8AAIB/AACAfwAAgH8AAIB/AACAfwAAgH8AAIB/AACAfwAAgH8AAIB/AACAfwAAgH8AAIB/AACAfwAAgH+UaApLHIWUaBV0lFKUjA1ib3VuZGVkX2JlbG93lGgSKJYcAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAACUaAeMAmIxlImIh5RSlChLA4wBfJROTk5K/////0r/////SwB0lGJLHIWUaBV0lFKUjA1ib3VuZGVkX2Fib3ZllGgSKJYcAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAACUaCFLHIWUaBV0lFKUjApfbnBfcmFuZG9tlE51Yi4=", "dtype": "float32", "_shape": [28], "low": "[-inf -inf -inf -inf -inf -inf -inf -inf -inf -inf -inf -inf -inf -inf\n -inf -inf -inf -inf -inf -inf -inf -inf -inf -inf -inf -inf -inf -inf]", "high": "[inf inf inf inf inf inf inf inf inf inf inf inf inf inf inf inf inf inf\n inf inf inf inf inf inf inf inf inf inf]", "bounded_below": "[False False False False False False False False False False False False\n False False False False False False False False False False False False\n False False False False]", "bounded_above": "[False False False False False False False False False False False False\n False False False False False False False False False False False False\n False False False False]", "_np_random": null}, "action_space": {":type:": "<class 'gym.spaces.box.Box'>", ":serialized:": "gAWVnwEAAAAAAACMDmd5bS5zcGFjZXMuYm94lIwDQm94lJOUKYGUfZQojAVkdHlwZZSMBW51bXB5lGgFk5SMAmY0lImIh5RSlChLA4wBPJROTk5K/////0r/////SwB0lGKMBl9zaGFwZZRLCIWUjANsb3eUjBJudW1weS5jb3JlLm51bWVyaWOUjAtfZnJvbWJ1ZmZlcpSTlCiWIAAAAAAAAAAAAIC/AACAvwAAgL8AAIC/AACAvwAAgL8AAIC/AACAv5RoCksIhZSMAUOUdJRSlIwEaGlnaJRoEiiWIAAAAAAAAAAAAIA/AACAPwAAgD8AAIA/AACAPwAAgD8AAIA/AACAP5RoCksIhZRoFXSUUpSMDWJvdW5kZWRfYmVsb3eUaBIolggAAAAAAAAAAQEBAQEBAQGUaAeMAmIxlImIh5RSlChLA4wBfJROTk5K/////0r/////SwB0lGJLCIWUaBV0lFKUjA1ib3VuZGVkX2Fib3ZllGgSKJYIAAAAAAAAAAEBAQEBAQEBlGghSwiFlGgVdJRSlIwKX25wX3JhbmRvbZROdWIu", "dtype": "float32", "_shape": [8], "low": "[-1. -1. -1. -1. -1. -1. -1. -1.]", "high": "[1. 1. 1. 1. 1. 1. 1. 1.]", "bounded_below": "[ True True True True True True True True]", "bounded_above": "[ True True True True True True True True]", "_np_random": null}, "n_envs": 4, "system_info": {"OS": "Linux-5.10.147+-x86_64-with-glibc2.31 # 1 SMP Sat Dec 10 16:00:40 UTC 2022", "Python": "3.9.16", "Stable-Baselines3": "1.8.0", "PyTorch": "2.0.0+cu118", "GPU Enabled": "True", "Numpy": "1.22.4", "Gym": "0.21.0"}}
 
1
+ {"policy_class": {":type:": "<class 'abc.ABCMeta'>", ":serialized:": "gAWVOwAAAAAAAACMIXN0YWJsZV9iYXNlbGluZXMzLmNvbW1vbi5wb2xpY2llc5SMEUFjdG9yQ3JpdGljUG9saWN5lJOULg==", "__module__": "stable_baselines3.common.policies", "__doc__": "\n Policy class for actor-critic algorithms (has both policy and value prediction).\n Used by A2C, PPO and the likes.\n\n :param observation_space: Observation space\n :param action_space: Action space\n :param lr_schedule: Learning rate schedule (could be constant)\n :param net_arch: The specification of the policy and value networks.\n :param activation_fn: Activation function\n :param ortho_init: Whether to use or not orthogonal initialization\n :param use_sde: Whether to use State Dependent Exploration or not\n :param log_std_init: Initial value for the log standard deviation\n :param full_std: Whether to use (n_features x n_actions) parameters\n for the std instead of only (n_features,) when using gSDE\n :param use_expln: Use ``expln()`` function instead of ``exp()`` to ensure\n a positive standard deviation (cf paper). It allows to keep variance\n above zero and prevent it from growing too fast. In practice, ``exp()`` is usually enough.\n :param squash_output: Whether to squash the output using a tanh function,\n this allows to ensure boundaries when using gSDE.\n :param features_extractor_class: Features extractor to use.\n :param features_extractor_kwargs: Keyword arguments\n to pass to the features extractor.\n :param share_features_extractor: If True, the features extractor is shared between the policy and value networks.\n :param normalize_images: Whether to normalize images or not,\n dividing by 255.0 (True by default)\n :param optimizer_class: The optimizer to use,\n ``th.optim.Adam`` by default\n :param optimizer_kwargs: Additional keyword arguments,\n excluding the learning rate, to pass to the optimizer\n ", "__init__": "<function ActorCriticPolicy.__init__ at 0x7f51f005b1f0>", "_get_constructor_parameters": "<function ActorCriticPolicy._get_constructor_parameters at 0x7f51f005b280>", "reset_noise": "<function ActorCriticPolicy.reset_noise at 0x7f51f005b310>", "_build_mlp_extractor": "<function ActorCriticPolicy._build_mlp_extractor at 0x7f51f005b3a0>", "_build": "<function ActorCriticPolicy._build at 0x7f51f005b430>", "forward": "<function ActorCriticPolicy.forward at 0x7f51f005b4c0>", "extract_features": "<function ActorCriticPolicy.extract_features at 0x7f51f005b550>", "_get_action_dist_from_latent": "<function ActorCriticPolicy._get_action_dist_from_latent at 0x7f51f005b5e0>", "_predict": "<function ActorCriticPolicy._predict at 0x7f51f005b670>", "evaluate_actions": "<function ActorCriticPolicy.evaluate_actions at 0x7f51f005b700>", "get_distribution": "<function ActorCriticPolicy.get_distribution at 0x7f51f005b790>", "predict_values": "<function ActorCriticPolicy.predict_values at 0x7f51f005b820>", "__abstractmethods__": "frozenset()", "_abc_impl": "<_abc._abc_data object at 0x7f51f0059b00>"}, "verbose": 1, "policy_kwargs": {":type:": "<class 'dict'>", ":serialized:": "gAWVowAAAAAAAAB9lCiMDGxvZ19zdGRfaW5pdJRK/v///4wKb3J0aG9faW5pdJSJjA9vcHRpbWl6ZXJfY2xhc3OUjBN0b3JjaC5vcHRpbS5ybXNwcm9wlIwHUk1TcHJvcJSTlIwQb3B0aW1pemVyX2t3YXJnc5R9lCiMBWFscGhhlEc/764UeuFHrowDZXBzlEc+5Pi1iONo8YwMd2VpZ2h0X2RlY2F5lEsAdXUu", "log_std_init": -2, "ortho_init": false, "optimizer_class": "<class 'torch.optim.rmsprop.RMSprop'>", "optimizer_kwargs": {"alpha": 0.99, "eps": 1e-05, "weight_decay": 0}}, "num_timesteps": 2000000, "_total_timesteps": 2000000, "_num_timesteps_at_start": 0, "seed": null, "action_noise": null, "start_time": 1681288652863329946, "learning_rate": 0.0001, "tensorboard_log": null, "lr_schedule": {":type:": "<class 'function'>", ":serialized:": "gAWVwwIAAAAAAACMF2Nsb3VkcGlja2xlLmNsb3VkcGlja2xllIwOX21ha2VfZnVuY3Rpb26Uk5QoaACMDV9idWlsdGluX3R5cGWUk5SMCENvZGVUeXBllIWUUpQoSwFLAEsASwFLAUsTQwSIAFMAlE6FlCmMAV+UhZSMSC91c3IvbG9jYWwvbGliL3B5dGhvbjMuOS9kaXN0LXBhY2thZ2VzL3N0YWJsZV9iYXNlbGluZXMzL2NvbW1vbi91dGlscy5weZSMBGZ1bmOUS4JDAgABlIwDdmFslIWUKXSUUpR9lCiMC19fcGFja2FnZV9flIwYc3RhYmxlX2Jhc2VsaW5lczMuY29tbW9ulIwIX19uYW1lX1+UjB5zdGFibGVfYmFzZWxpbmVzMy5jb21tb24udXRpbHOUjAhfX2ZpbGVfX5SMSC91c3IvbG9jYWwvbGliL3B5dGhvbjMuOS9kaXN0LXBhY2thZ2VzL3N0YWJsZV9iYXNlbGluZXMzL2NvbW1vbi91dGlscy5weZR1Tk5oAIwQX21ha2VfZW1wdHlfY2VsbJSTlClSlIWUdJRSlIwcY2xvdWRwaWNrbGUuY2xvdWRwaWNrbGVfZmFzdJSMEl9mdW5jdGlvbl9zZXRzdGF0ZZSTlGgffZR9lChoFmgNjAxfX3F1YWxuYW1lX1+UjBljb25zdGFudF9mbi48bG9jYWxzPi5mdW5jlIwPX19hbm5vdGF0aW9uc19flH2UjA5fX2t3ZGVmYXVsdHNfX5ROjAxfX2RlZmF1bHRzX1+UTowKX19tb2R1bGVfX5RoF4wHX19kb2NfX5ROjAtfX2Nsb3N1cmVfX5RoAIwKX21ha2VfY2VsbJSTlEc/Gjbi6xxDLYWUUpSFlIwXX2Nsb3VkcGlja2xlX3N1Ym1vZHVsZXOUXZSMC19fZ2xvYmFsc19flH2UdYaUhlIwLg=="}, "_last_obs": {":type:": "<class 'numpy.ndarray'>", ":serialized:": "gAWVNQIAAAAAAACMEm51bXB5LmNvcmUubnVtZXJpY5SMC19mcm9tYnVmZmVylJOUKJbAAQAAAAAAACakjz/Kkc8+UTAqP5bTUz+xgeM/Ryogv5sWpz5YAR8/Q7Z0v9cNiL1rmhs+q3q4v6yaRD+ASsY/YF3bv/1WUT8Ouc6+XZN+vmm9k79wnkjAoRXIvwwywzwI0DM/EiAdPW9XuL+kt8Q+lvP1PjbKXj9RuZI++BBiP7aJBj9CwZg9k7C9P/zmvT7v7JQ/T+xBPv9Nj78gT0A85Q6APutZer8UT+2/1IOEP6RL1b9tk9e9Dce6vTm6Zb2HHBE/KzGGPbVFRb7m55G/kLLxvkp9cz1vV7i/pLfEPpbz9T42yl4/oREPP+YlYr86dAq+1iB4v/nUFz9WsY+6QF3kProGBr1lh4c/5uBuPhHbwz/J4o28gXK0P+sXWj760Ku+jgUSPh0K5T6f4L893q+SPdaf/j2bK8Q/Tb1puv7dbD+p7wW8y8ExP6S3xD6W8/U+NspePxYXfD9+DHg/FonzPgOFwj8pLVc/7C0yPpKqpj+aIYg/slaSvw9/UL/y6kk/QONUP/qJGsAbbSU+1G3Bv8dV7r/joYm/mGQvPk4Zlr9xXKs/WuXCP+MDK7++vES/zIIFQMvBMT/zkibAlvP1Po0Uk7+UjAVudW1weZSMBWR0eXBllJOUjAJmNJSJiIeUUpQoSwOMATyUTk5OSv////9K/////0sAdJRiSwRLHIaUjAFDlHSUUpQu"}, "_last_episode_starts": {":type:": "<class 'numpy.ndarray'>", ":serialized:": "gAWVdwAAAAAAAACMEm51bXB5LmNvcmUubnVtZXJpY5SMC19mcm9tYnVmZmVylJOUKJYEAAAAAAAAAAAAAACUjAVudW1weZSMBWR0eXBllJOUjAJiMZSJiIeUUpQoSwOMAXyUTk5OSv////9K/////0sAdJRiSwSFlIwBQ5R0lFKULg=="}, "_last_original_obs": {":type:": "<class 'numpy.ndarray'>", ":serialized:": "gAWVNQIAAAAAAACMEm51bXB5LmNvcmUubnVtZXJpY5SMC19mcm9tYnVmZmVylJOUKJbAAQAAAAAAAAAAAACBcsi2AACAPwAAAAAAAAAAAAAAAAAAAAAAAACAv2AIvAAAAACfDNm/AAAAAE/8GL0AAAAAIxH6PwAAAAAlHfm9AAAAAGOQ3z8AAAAApx3kPQAAAAAPkeu/AAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAcQaHtgAAgD8AAAAAAAAAAAAAAAAAAAAAAAAAgKGBwD0AAAAAt5HlvwAAAAC6sq07AAAAANWZ6z8AAAAAaTo2vQAAAABvhQBAAAAAAKeMQD0AAAAAdfb+vwAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAFnP7DQAAIA/AAAAAAAAAAAAAAAAAAAAAAAAAIAMWJS7AAAAAGcu7L8AAAAAvT/lvQAAAACan+w/AAAAAIxUAz4AAAAA9e3pPwAAAABX6Oe6AAAAAKVI/r8AAAAAAAAAAAAAAAAAAAAAAAAAAAAAAADCL/41AACAPwAAAAAAAAAAAAAAAAAAAAAAAACAm0GSvQAAAAA+Oei/AAAAAC613rwAAAAAji/wPwAAAAAmw9Y9AAAAAMHR+D8AAAAAfvx1PQAAAAAu0vO/AAAAAAAAAAAAAAAAAAAAAAAAAACUjAVudW1weZSMBWR0eXBllJOUjAJmNJSJiIeUUpQoSwOMATyUTk5OSv////9K/////0sAdJRiSwRLHIaUjAFDlHSUUpQu"}, "_episode_num": 0, "use_sde": true, "sde_sample_freq": -1, "_current_progress_remaining": 0.0, "_stats_window_size": 100, "ep_info_buffer": {":type:": "<class 'collections.deque'>", ":serialized:": "gAWVRAwAAAAAAACMC2NvbGxlY3Rpb25zlIwFZGVxdWWUk5QpS2SGlFKUKH2UKIwBcpRHQJidmUs4DLeMAWyUTegDjAF0lEdAwgVsB8QZoHV9lChoBkdAlHO8Rcu8LGgHTegDaAhHQMIG6sJ6Y3N1fZQoaAZHQJfHA/qxC6ZoB03oA2gIR0DCBwzEvTPTdX2UKGgGR0CY9KS5AhStaAdN6ANoCEdAwgcS/M4cWHV9lChoBkdAlcHHPJJXhmgHTegDaAhHQMIJ5N+TeO51fZQoaAZHQJfWdZkkKNRoB03oA2gIR0DCCyL+WGATdX2UKGgGR0CYK/BOYYzjaAdN6ANoCEdAwgtdUjLSu3V9lChoBkdAl3hrVJ+UhWgHTegDaAhHQMILZvGp++d1fZQoaAZHQJV3Qlu3trtoB03oA2gIR0DCD3SnpB5YdX2UKGgGR0CZBhC53C9AaAdN6ANoCEdAwhDA+tbLU3V9lChoBkdAlcLPDxb0OGgHTegDaAhHQMIQ6Sr5qM51fZQoaAZHQJZZbOIInjRoB03oA2gIR0DCEO+mFajfdX2UKGgGR0CbScNVzZHvaAdN6ANoCEdAwhOYLkS26XV9lChoBkdAmAOTJ+2E02gHTegDaAhHQMIVd20zCUJ1fZQoaAZHQJS6gSYgJTloB03oA2gIR0DCFa7XnQpndX2UKGgGR0CWKX8rI5o5aAdN6ANoCEdAwhW46qbSZ3V9lChoBkdAlU9KVD8cdmgHTegDaAhHQMIY8U8NhE11fZQoaAZHQJYtLyrgflpoB03oA2gIR0DCGi18qnWKdX2UKGgGR0CWsKos7MgVaAdN6ANoCEdAwhpNcVxjrnV9lChoBkdAmWsmFzuF6GgHTegDaAhHQMIaU9DhLoR1fZQoaAZHQJe7dnBciW5oB03oA2gIR0DCHW0EJSiudX2UKGgGR0CXmfHP/rB1aAdN6ANoCEdAwh9qQz1scnV9lChoBkdAmFsAk9lmOGgHTegDaAhHQMIflrlmvnt1fZQoaAZHQJiGZlI3BHloB03oA2gIR0DCH51eUpuudX2UKGgGR0CXJF5XU6PsaAdN6ANoCEdAwiJ2lE7W/nV9lChoBkdAlJTgIUrTY2gHTegDaAhHQMIjvYKx9oh1fZQoaAZHQJZE6WjXWe9oB03oA2gIR0DCI+WLzf78dX2UKGgGR0CaUkAn2IweaAdN6ANoCEdAwiPsVzIV/XV9lChoBkdAla9c4o7V8WgHTegDaAhHQMIn3KJl8PZ1fZQoaAZHQJdKVWkrPMVoB03oA2gIR0DCKSBOLzf8dX2UKGgGR0CZW7KiwjdIaAdN6ANoCEdAwik+/zJ6p3V9lChoBkdAlcGvxUedTmgHTegDaAhHQMIpRYcvM8p1fZQoaAZHQJg3bxy4nWtoB03oA2gIR0DCK/17jT8YdX2UKGgGR0CWUQrZrYXgaAdN6ANoCEdAwi12AVfu1HV9lChoBkdAlSlLWmP5pWgHTegDaAhHQMItrEVnEl51fZQoaAZHQJhkDdnCfpVoB03oA2gIR0DCLbXn2ZiNdX2UKGgGR0CY71RkmQbNaAdN6ANoCEdAwjGTZQpF1HV9lChoBkdAm+YKUmlZYGgHTegDaAhHQMIy59/jKgZ1fZQoaAZHQJXNJIsiB5JoB03oA2gIR0DCMwoe3hGZdX2UKGgGR0CZTc/T9bX6aAdN6ANoCEdAwjMQmwaBJHV9lChoBkdAkm3ZQ+EAYGgHTegDaAhHQMI128dxQzl1fZQoaAZHQJhtd+z+m3xoB03oA2gIR0DCN+KobXHzdX2UKGgGR0CWcaq4pc5baAdN6ANoCEdAwjgec2BJ7XV9lChoBkdAmRDK5sj3VWgHTegDaAhHQMI4KNxdY4h1fZQoaAZHQJdY9Gqgh8poB03oA2gIR0DCO0WycCo1dX2UKGgGR0CWQHHVPN3XaAdN6ANoCEdAwjyo5paibnV9lChoBkdAl87JjlPrOmgHTegDaAhHQMI80QJPZZl1fZQoaAZHQJtjAuAZsKtoB03oA2gIR0DCPNeUfPondX2UKGgGR0CXWFRSxZ+yaAdN6ANoCEdAwkBfY+0PYnV9lChoBkdAmckZCngpB2gHTegDaAhHQMJCBrfk3jx1fZQoaAZHQJdlzWvr4WVoB03oA2gIR0DCQioLNOdodX2UKGgGR0CWfFXSjQAuaAdN6ANoCEdAwkIxUWEbpHV9lChoBkdAl/gE2pAD72gHTegDaAhHQMJEw5lvqC91fZQoaAZHQJao+9K28ZloB03oA2gIR0DCRf/gUDdQdX2UKGgGR0CbHnQWepXIaAdN6ANoCEdAwkYnP+n623V9lChoBkdAmN1BwVCXyGgHTegDaAhHQMJGLOkLx7R1fZQoaAZHQJWuaKAJ9iNoB03oA2gIR0DCSk3qTr3TdX2UKGgGR0CYcd4NqgyuaAdN6ANoCEdAwkuY/qxC6nV9lChoBkdAlx6QNwzch2gHTegDaAhHQMJLv1Muez51fZQoaAZHQJjAk2Hck+poB03oA2gIR0DCS8bm6oVEdX2UKGgGR0CZ+sqkdmxuaAdN6ANoCEdAwk6OpWFN+XV9lChoBkdAl4yo5ggHNWgHTegDaAhHQMJQJ2M85jp1fZQoaAZHQJU/t7AtWdVoB03oA2gIR0DCUFmr4nF6dX2UKGgGR0CaZUIkZ75VaAdN6ANoCEdAwlBihL5AQnV9lChoBkdAm3N4tQKrrGgHTegDaAhHQMJT96/h2nt1fZQoaAZHQJW4aDlHSWtoB03oA2gIR0DCVVfxSYPYdX2UKGgGR0CYc96Rhc7haAdN6ANoCEdAwlV8bAk9lnV9lChoBkdAmoRFJYkmhWgHTegDaAhHQMJVhDEvTPV1fZQoaAZHQJl2HwazeGhoB03oA2gIR0DCWNcbJfY0dX2UKGgGR0CXfyoIv8IiaAdN6ANoCEdAwlq8814xDnV9lChoBkdAk5ly5qdpZmgHTegDaAhHQMJa4fsNUfh1fZQoaAZHQJdxQxcmjTNoB03oA2gIR0DCWuiXlbNbdX2UKGgGR0CQ8ohoM8YAaAdN6ANoCEdAwl2OHoHLR3V9lChoBkdAlubBIre67WgHTegDaAhHQMJe434CZF51fZQoaAZHQJjotf1HvttoB03oA2gIR0DCXwh8IAwPdX2UKGgGR0CZsFIsiB5HaAdN6ANoCEdAwl8P5gPVeHV9lChoBkdAmOF20Re1KGgHTegDaAhHQMJi23Vsk6d1fZQoaAZHQJXsmydFvydoB03oA2gIR0DCZCPOObRXdX2UKGgGR0CZmlRg7YChaAdN6ANoCEdAwmRDqKP4mHV9lChoBkdAmE+w1rIo3WgHTegDaAhHQMJkSYKx9oh1fZQoaAZHQJYBi3XqZ+hoB03oA2gIR0DCZxunjyWidX2UKGgGR0CXHO3Ehq0uaAdN6ANoCEdAwmi3wd8zAXV9lChoBkdAl9eXY150KmgHTegDaAhHQMJo7nJ9y951fZQoaAZHQJiEnBj4HopoB03oA2gIR0DCaPeQMhHLdX2UKGgGR0CZVcRGc4HYaAdN6ANoCEdAwmy2r+YMOXV9lChoBkdAl2YcUAT7EmgHTegDaAhHQMJt6pm29ct1fZQoaAZHQJo0Q99tuUFoB03oA2gIR0DCbg6FEiMYdX2UKGgGR0CZgSEGqxTsaAdN6ANoCEdAwm4Vr6ciGHV9lChoBkdAmSVnPE87p2gHTegDaAhHQMJw6Z4W1tx1fZQoaAZHQJmDhLYf4h5oB03oA2gIR0DCcteu9vjwdX2UKGgGR0CXrzYQarFPaAdN6ANoCEdAwnMQRhc7hnV9lChoBkdAlrxx9b5dnmgHTegDaAhHQMJzGtTkyUN1fZQoaAZHQJYc2r8zhxZoB03oA2gIR0DCdiGcSXdCdX2UKGgGR0CYVeCa7VawaAdN6ANoCEdAwneEgIQe3nV9lChoBkdAmNflyeZof2gHTegDaAhHQMJ3pmvfTCt1fZQoaAZHQJkxH6eoUBZoB03oA2gIR0DCd60INVindX2UKGgGR0CZJXBUaQ3haAdN6ANoCEdAwntvYpUgjnV9lChoBkdAmU9/GlyimGgHTegDaAhHQMJ81gPNFBp1fZQoaAZHQJnwINKAavRoB03oA2gIR0DCfPpxBE8adX2UKGgGR0CYmfpobn5jaAdN6ANoCEdAwn0Bz8P4EnVlLg=="}, "ep_success_buffer": {":type:": "<class 'collections.deque'>", ":serialized:": "gAWVIAAAAAAAAACMC2NvbGxlY3Rpb25zlIwFZGVxdWWUk5QpS2SGlFKULg=="}, "_n_updates": 62500, "n_steps": 8, "gamma": 0.99, "gae_lambda": 0.9, "ent_coef": 0.0, "vf_coef": 0.4, "max_grad_norm": 0.5, "normalize_advantage": false, "observation_space": {":type:": "<class 'gym.spaces.box.Box'>", ":serialized:": "gAWVZwIAAAAAAACMDmd5bS5zcGFjZXMuYm94lIwDQm94lJOUKYGUfZQojAVkdHlwZZSMBW51bXB5lGgFk5SMAmY0lImIh5RSlChLA4wBPJROTk5K/////0r/////SwB0lGKMBl9zaGFwZZRLHIWUjANsb3eUjBJudW1weS5jb3JlLm51bWVyaWOUjAtfZnJvbWJ1ZmZlcpSTlCiWcAAAAAAAAAAAAID/AACA/wAAgP8AAID/AACA/wAAgP8AAID/AACA/wAAgP8AAID/AACA/wAAgP8AAID/AACA/wAAgP8AAID/AACA/wAAgP8AAID/AACA/wAAgP8AAID/AACA/wAAgP8AAID/AACA/wAAgP8AAID/lGgKSxyFlIwBQ5R0lFKUjARoaWdolGgSKJZwAAAAAAAAAAAAgH8AAIB/AACAfwAAgH8AAIB/AACAfwAAgH8AAIB/AACAfwAAgH8AAIB/AACAfwAAgH8AAIB/AACAfwAAgH8AAIB/AACAfwAAgH8AAIB/AACAfwAAgH8AAIB/AACAfwAAgH8AAIB/AACAfwAAgH+UaApLHIWUaBV0lFKUjA1ib3VuZGVkX2JlbG93lGgSKJYcAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAACUaAeMAmIxlImIh5RSlChLA4wBfJROTk5K/////0r/////SwB0lGJLHIWUaBV0lFKUjA1ib3VuZGVkX2Fib3ZllGgSKJYcAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAACUaCFLHIWUaBV0lFKUjApfbnBfcmFuZG9tlE51Yi4=", "dtype": "float32", "_shape": [28], "low": "[-inf -inf -inf -inf -inf -inf -inf -inf -inf -inf -inf -inf -inf -inf\n -inf -inf -inf -inf -inf -inf -inf -inf -inf -inf -inf -inf -inf -inf]", "high": "[inf inf inf inf inf inf inf inf inf inf inf inf inf inf inf inf inf inf\n inf inf inf inf inf inf inf inf inf inf]", "bounded_below": "[False False False False False False False False False False False False\n False False False False False False False False False False False False\n False False False False]", "bounded_above": "[False False False False False False False False False False False False\n False False False False False False False False False False False False\n False False False False]", "_np_random": null}, "action_space": {":type:": "<class 'gym.spaces.box.Box'>", ":serialized:": "gAWVnwEAAAAAAACMDmd5bS5zcGFjZXMuYm94lIwDQm94lJOUKYGUfZQojAVkdHlwZZSMBW51bXB5lGgFk5SMAmY0lImIh5RSlChLA4wBPJROTk5K/////0r/////SwB0lGKMBl9zaGFwZZRLCIWUjANsb3eUjBJudW1weS5jb3JlLm51bWVyaWOUjAtfZnJvbWJ1ZmZlcpSTlCiWIAAAAAAAAAAAAIC/AACAvwAAgL8AAIC/AACAvwAAgL8AAIC/AACAv5RoCksIhZSMAUOUdJRSlIwEaGlnaJRoEiiWIAAAAAAAAAAAAIA/AACAPwAAgD8AAIA/AACAPwAAgD8AAIA/AACAP5RoCksIhZRoFXSUUpSMDWJvdW5kZWRfYmVsb3eUaBIolggAAAAAAAAAAQEBAQEBAQGUaAeMAmIxlImIh5RSlChLA4wBfJROTk5K/////0r/////SwB0lGJLCIWUaBV0lFKUjA1ib3VuZGVkX2Fib3ZllGgSKJYIAAAAAAAAAAEBAQEBAQEBlGghSwiFlGgVdJRSlIwKX25wX3JhbmRvbZROdWIu", "dtype": "float32", "_shape": [8], "low": "[-1. -1. -1. -1. -1. -1. -1. -1.]", "high": "[1. 1. 1. 1. 1. 1. 1. 1.]", "bounded_below": "[ True True True True True True True True]", "bounded_above": "[ True True True True True True True True]", "_np_random": null}, "n_envs": 4, "system_info": {"OS": "Linux-5.10.147+-x86_64-with-glibc2.31 # 1 SMP Sat Dec 10 16:00:40 UTC 2022", "Python": "3.9.16", "Stable-Baselines3": "1.8.0", "PyTorch": "2.0.0+cu118", "GPU Enabled": "False", "Numpy": "1.22.4", "Gym": "0.21.0"}}
replay.mp4 CHANGED
Binary files a/replay.mp4 and b/replay.mp4 differ
 
results.json CHANGED
@@ -1 +1 @@
1
- {"mean_reward": 715.2088370108715, "std_reward": 332.8427206422767, "is_deterministic": true, "n_eval_episodes": 10, "eval_datetime": "2023-04-11T16:20:30.456282"}
 
1
+ {"mean_reward": 1893.631191460346, "std_reward": 99.9121690982914, "is_deterministic": true, "n_eval_episodes": 10, "eval_datetime": "2023-04-12T09:52:14.240754"}
vec_normalize.pkl CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:1be7c943bb15b1c2f717d7902a806f8cf388a423a6f69107dbc14582f41040cd
3
  size 2170
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ba461503ff84349f653667005790706b9ff1b5bb8e46499a21c0973424e1d112
3
  size 2170