Commit ·
3256b29
1
Parent(s): dd5e69c
Initial commit
Browse files- README.md +1 -1
- a2c-PandaReachDense-v2.zip +2 -2
- a2c-PandaReachDense-v2/data +21 -21
- a2c-PandaReachDense-v2/policy.optimizer.pth +1 -1
- a2c-PandaReachDense-v2/policy.pth +1 -1
- config.json +1 -1
- replay.mp4 +0 -0
- results.json +1 -1
- vec_normalize.pkl +1 -1
README.md
CHANGED
|
@@ -16,7 +16,7 @@ model-index:
|
|
| 16 |
type: PandaReachDense-v2
|
| 17 |
metrics:
|
| 18 |
- type: mean_reward
|
| 19 |
-
value: -
|
| 20 |
name: mean_reward
|
| 21 |
verified: false
|
| 22 |
---
|
|
|
|
| 16 |
type: PandaReachDense-v2
|
| 17 |
metrics:
|
| 18 |
- type: mean_reward
|
| 19 |
+
value: -2.08 +/- 0.33
|
| 20 |
name: mean_reward
|
| 21 |
verified: false
|
| 22 |
---
|
a2c-PandaReachDense-v2.zip
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
-
size
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:ae7ab90ed082594578d08a1e42e0e2f3de194330571039b2c2fdfcd96ea583a0
|
| 3 |
+
size 108197
|
a2c-PandaReachDense-v2/data
CHANGED
|
@@ -4,9 +4,9 @@
|
|
| 4 |
":serialized:": "gAWVRQAAAAAAAACMIXN0YWJsZV9iYXNlbGluZXMzLmNvbW1vbi5wb2xpY2llc5SMG011bHRpSW5wdXRBY3RvckNyaXRpY1BvbGljeZSTlC4=",
|
| 5 |
"__module__": "stable_baselines3.common.policies",
|
| 6 |
"__doc__": "\n MultiInputActorClass policy class for actor-critic algorithms (has both policy and value prediction).\n Used by A2C, PPO and the likes.\n\n :param observation_space: Observation space (Tuple)\n :param action_space: Action space\n :param lr_schedule: Learning rate schedule (could be constant)\n :param net_arch: The specification of the policy and value networks.\n :param activation_fn: Activation function\n :param ortho_init: Whether to use or not orthogonal initialization\n :param use_sde: Whether to use State Dependent Exploration or not\n :param log_std_init: Initial value for the log standard deviation\n :param full_std: Whether to use (n_features x n_actions) parameters\n for the std instead of only (n_features,) when using gSDE\n :param use_expln: Use ``expln()`` function instead of ``exp()`` to ensure\n a positive standard deviation (cf paper). It allows to keep variance\n above zero and prevent it from growing too fast. In practice, ``exp()`` is usually enough.\n :param squash_output: Whether to squash the output using a tanh function,\n this allows to ensure boundaries when using gSDE.\n :param features_extractor_class: Uses the CombinedExtractor\n :param features_extractor_kwargs: Keyword arguments\n to pass to the features extractor.\n :param share_features_extractor: If True, the features extractor is shared between the policy and value networks.\n :param normalize_images: Whether to normalize images or not,\n dividing by 255.0 (True by default)\n :param optimizer_class: The optimizer to use,\n ``th.optim.Adam`` by default\n :param optimizer_kwargs: Additional keyword arguments,\n excluding the learning rate, to pass to the optimizer\n ",
|
| 7 |
-
"__init__": "<function MultiInputActorCriticPolicy.__init__ at
|
| 8 |
"__abstractmethods__": "frozenset()",
|
| 9 |
-
"_abc_impl": "<_abc._abc_data object at
|
| 10 |
},
|
| 11 |
"verbose": 1,
|
| 12 |
"policy_kwargs": {
|
|
@@ -41,24 +41,24 @@
|
|
| 41 |
"_np_random": null
|
| 42 |
},
|
| 43 |
"n_envs": 4,
|
| 44 |
-
"num_timesteps":
|
| 45 |
-
"_total_timesteps":
|
| 46 |
"_num_timesteps_at_start": 0,
|
| 47 |
"seed": null,
|
| 48 |
"action_noise": null,
|
| 49 |
-
"start_time":
|
| 50 |
-
"learning_rate": 0.
|
| 51 |
"tensorboard_log": null,
|
| 52 |
"lr_schedule": {
|
| 53 |
":type:": "<class 'function'>",
|
| 54 |
-
":serialized:": "gAWV7wIAAAAAAACMF2Nsb3VkcGlja2xlLmNsb3VkcGlja2xllIwOX21ha2VfZnVuY3Rpb26Uk5QoaACMDV9idWlsdGluX3R5cGWUk5SMCENvZGVUeXBllIWUUpQoSwFLAEsASwFLAUsTQwSIAFMAlE6FlCmMAV+UhZSMXi9yb290L21pbmljb25kYTMvZW52cy9kZWVwLXJsLWhmL2xpYi9weXRob24zLjkvc2l0ZS1wYWNrYWdlcy9zdGFibGVfYmFzZWxpbmVzMy9jb21tb24vdXRpbHMucHmUjARmdW5jlEuCQwIAAZSMA3ZhbJSFlCl0lFKUfZQojAtfX3BhY2thZ2VfX5SMGHN0YWJsZV9iYXNlbGluZXMzLmNvbW1vbpSMCF9fbmFtZV9flIwec3RhYmxlX2Jhc2VsaW5lczMuY29tbW9uLnV0aWxzlIwIX19maWxlX1+UjF4vcm9vdC9taW5pY29uZGEzL2VudnMvZGVlcC1ybC1oZi9saWIvcHl0aG9uMy45L3NpdGUtcGFja2FnZXMvc3RhYmxlX2Jhc2VsaW5lczMvY29tbW9uL3V0aWxzLnB5lHVOTmgAjBBfbWFrZV9lbXB0eV9jZWxslJOUKVKUhZR0lFKUjBxjbG91ZHBpY2tsZS5jbG91ZHBpY2tsZV9mYXN0lIwSX2Z1bmN0aW9uX3NldHN0YXRllJOUaB99lH2UKGgWaA2MDF9fcXVhbG5hbWVfX5SMGWNvbnN0YW50X2ZuLjxsb2NhbHM+LmZ1bmOUjA9fX2Fubm90YXRpb25zX1+
|
| 55 |
},
|
| 56 |
"_last_obs": {
|
| 57 |
":type:": "<class 'collections.OrderedDict'>",
|
| 58 |
-
":serialized:": "
|
| 59 |
-
"achieved_goal": "[[0.
|
| 60 |
-
"desired_goal": "[[
|
| 61 |
-
"observation": "[[
|
| 62 |
},
|
| 63 |
"_last_episode_starts": {
|
| 64 |
":type:": "<class 'numpy.ndarray'>",
|
|
@@ -66,9 +66,9 @@
|
|
| 66 |
},
|
| 67 |
"_last_original_obs": {
|
| 68 |
":type:": "<class 'collections.OrderedDict'>",
|
| 69 |
-
":serialized:": "gAWVuwEAAAAAAACMC2NvbGxlY3Rpb25zlIwLT3JkZXJlZERpY3SUk5QpUpQojA1hY2hpZXZlZF9nb2FslIwSbnVtcHkuY29yZS5udW1lcmljlIwLX2Zyb21idWZmZXKUk5QoljAAAAAAAAAA6nIdPRlsGqxDI0o+6nIdPRlsGqxDI0o+6nIdPRlsGqxDI0o+6nIdPRlsGqxDI0o+lIwFbnVtcHmUjAVkdHlwZZSTlIwCZjSUiYiHlFKUKEsDjAE8lE5OTkr/////Sv////
|
| 70 |
"achieved_goal": "[[ 3.8439669e-02 -2.1944723e-12 1.9740014e-01]\n [ 3.8439669e-02 -2.1944723e-12 1.9740014e-01]\n [ 3.8439669e-02 -2.1944723e-12 1.9740014e-01]\n [ 3.8439669e-02 -2.1944723e-12 1.9740014e-01]]",
|
| 71 |
-
"desired_goal": "[[-0.
|
| 72 |
"observation": "[[ 3.8439669e-02 -2.1944723e-12 1.9740014e-01 0.0000000e+00\n -0.0000000e+00 0.0000000e+00]\n [ 3.8439669e-02 -2.1944723e-12 1.9740014e-01 0.0000000e+00\n -0.0000000e+00 0.0000000e+00]\n [ 3.8439669e-02 -2.1944723e-12 1.9740014e-01 0.0000000e+00\n -0.0000000e+00 0.0000000e+00]\n [ 3.8439669e-02 -2.1944723e-12 1.9740014e-01 0.0000000e+00\n -0.0000000e+00 0.0000000e+00]]"
|
| 73 |
},
|
| 74 |
"_episode_num": 0,
|
|
@@ -77,18 +77,18 @@
|
|
| 77 |
"_current_progress_remaining": 0.0,
|
| 78 |
"ep_info_buffer": {
|
| 79 |
":type:": "<class 'collections.deque'>",
|
| 80 |
-
":serialized:": "gAWVHRAAAAAAAACMC2NvbGxlY3Rpb25zlIwFZGVxdWWUk5QpS2SGlFKUKH2UKIwBcpSMFW51bXB5LmNvcmUubXVsdGlhcnJheZSMBnNjYWxhcpSTlIwFbnVtcHmUjAVkdHlwZZSTlIwCZjiUiYiHlFKUKEsDjAE8lE5OTkr/////Sv////
|
| 81 |
},
|
| 82 |
"ep_success_buffer": {
|
| 83 |
":type:": "<class 'collections.deque'>",
|
| 84 |
":serialized:": "gAWVIAAAAAAAAACMC2NvbGxlY3Rpb25zlIwFZGVxdWWUk5QpS2SGlFKULg=="
|
| 85 |
},
|
| 86 |
-
"_n_updates":
|
| 87 |
-
"n_steps":
|
| 88 |
-
"gamma": 0.
|
| 89 |
-
"gae_lambda":
|
| 90 |
-
"ent_coef": 0.
|
| 91 |
-
"vf_coef": 0.
|
| 92 |
-
"max_grad_norm": 0.
|
| 93 |
"normalize_advantage": false
|
| 94 |
}
|
|
|
|
| 4 |
":serialized:": "gAWVRQAAAAAAAACMIXN0YWJsZV9iYXNlbGluZXMzLmNvbW1vbi5wb2xpY2llc5SMG011bHRpSW5wdXRBY3RvckNyaXRpY1BvbGljeZSTlC4=",
|
| 5 |
"__module__": "stable_baselines3.common.policies",
|
| 6 |
"__doc__": "\n MultiInputActorClass policy class for actor-critic algorithms (has both policy and value prediction).\n Used by A2C, PPO and the likes.\n\n :param observation_space: Observation space (Tuple)\n :param action_space: Action space\n :param lr_schedule: Learning rate schedule (could be constant)\n :param net_arch: The specification of the policy and value networks.\n :param activation_fn: Activation function\n :param ortho_init: Whether to use or not orthogonal initialization\n :param use_sde: Whether to use State Dependent Exploration or not\n :param log_std_init: Initial value for the log standard deviation\n :param full_std: Whether to use (n_features x n_actions) parameters\n for the std instead of only (n_features,) when using gSDE\n :param use_expln: Use ``expln()`` function instead of ``exp()`` to ensure\n a positive standard deviation (cf paper). It allows to keep variance\n above zero and prevent it from growing too fast. In practice, ``exp()`` is usually enough.\n :param squash_output: Whether to squash the output using a tanh function,\n this allows to ensure boundaries when using gSDE.\n :param features_extractor_class: Uses the CombinedExtractor\n :param features_extractor_kwargs: Keyword arguments\n to pass to the features extractor.\n :param share_features_extractor: If True, the features extractor is shared between the policy and value networks.\n :param normalize_images: Whether to normalize images or not,\n dividing by 255.0 (True by default)\n :param optimizer_class: The optimizer to use,\n ``th.optim.Adam`` by default\n :param optimizer_kwargs: Additional keyword arguments,\n excluding the learning rate, to pass to the optimizer\n ",
|
| 7 |
+
"__init__": "<function MultiInputActorCriticPolicy.__init__ at 0x7f7dec4bae50>",
|
| 8 |
"__abstractmethods__": "frozenset()",
|
| 9 |
+
"_abc_impl": "<_abc._abc_data object at 0x7f7dec4bbbc0>"
|
| 10 |
},
|
| 11 |
"verbose": 1,
|
| 12 |
"policy_kwargs": {
|
|
|
|
| 41 |
"_np_random": null
|
| 42 |
},
|
| 43 |
"n_envs": 4,
|
| 44 |
+
"num_timesteps": 1500000,
|
| 45 |
+
"_total_timesteps": 1500000,
|
| 46 |
"_num_timesteps_at_start": 0,
|
| 47 |
"seed": null,
|
| 48 |
"action_noise": null,
|
| 49 |
+
"start_time": 1677446129579181900,
|
| 50 |
+
"learning_rate": 0.00010679258738466367,
|
| 51 |
"tensorboard_log": null,
|
| 52 |
"lr_schedule": {
|
| 53 |
":type:": "<class 'function'>",
|
| 54 |
+
":serialized:": "gAWV7wIAAAAAAACMF2Nsb3VkcGlja2xlLmNsb3VkcGlja2xllIwOX21ha2VfZnVuY3Rpb26Uk5QoaACMDV9idWlsdGluX3R5cGWUk5SMCENvZGVUeXBllIWUUpQoSwFLAEsASwFLAUsTQwSIAFMAlE6FlCmMAV+UhZSMXi9yb290L21pbmljb25kYTMvZW52cy9kZWVwLXJsLWhmL2xpYi9weXRob24zLjkvc2l0ZS1wYWNrYWdlcy9zdGFibGVfYmFzZWxpbmVzMy9jb21tb24vdXRpbHMucHmUjARmdW5jlEuCQwIAAZSMA3ZhbJSFlCl0lFKUfZQojAtfX3BhY2thZ2VfX5SMGHN0YWJsZV9iYXNlbGluZXMzLmNvbW1vbpSMCF9fbmFtZV9flIwec3RhYmxlX2Jhc2VsaW5lczMuY29tbW9uLnV0aWxzlIwIX19maWxlX1+UjF4vcm9vdC9taW5pY29uZGEzL2VudnMvZGVlcC1ybC1oZi9saWIvcHl0aG9uMy45L3NpdGUtcGFja2FnZXMvc3RhYmxlX2Jhc2VsaW5lczMvY29tbW9uL3V0aWxzLnB5lHVOTmgAjBBfbWFrZV9lbXB0eV9jZWxslJOUKVKUhZR0lFKUjBxjbG91ZHBpY2tsZS5jbG91ZHBpY2tsZV9mYXN0lIwSX2Z1bmN0aW9uX3NldHN0YXRllJOUaB99lH2UKGgWaA2MDF9fcXVhbG5hbWVfX5SMGWNvbnN0YW50X2ZuLjxsb2NhbHM+LmZ1bmOUjA9fX2Fubm90YXRpb25zX1+UfZSMDl9fa3dkZWZhdWx0c19flE6MDF9fZGVmYXVsdHNfX5ROjApfX21vZHVsZV9flGgXjAdfX2RvY19flE6MC19fY2xvc3VyZV9flGgAjApfbWFrZV9jZWxslJOURz8b/rquW+AohZRSlIWUjBdfY2xvdWRwaWNrbGVfc3VibW9kdWxlc5RdlIwLX19nbG9iYWxzX1+UfZR1hpSGUjAu"
|
| 55 |
},
|
| 56 |
"_last_obs": {
|
| 57 |
":type:": "<class 'collections.OrderedDict'>",
|
| 58 |
+
":serialized:": "gAWVuwEAAAAAAACMC2NvbGxlY3Rpb25zlIwLT3JkZXJlZERpY3SUk5QpUpQojA1hY2hpZXZlZF9nb2FslIwSbnVtcHkuY29yZS5udW1lcmljlIwLX2Zyb21idWZmZXKUk5QoljAAAAAAAAAAcaPMPmTN17qrahY/caPMPmTN17qrahY/caPMPmTN17qrahY/caPMPmTN17qrahY/lIwFbnVtcHmUjAVkdHlwZZSTlIwCZjSUiYiHlFKUKEsDjAE8lE5OTkr/////Sv////9LAHSUYksESwOGlIwBQ5R0lFKUjAxkZXNpcmVkX2dvYWyUaAcoljAAAAAAAAAAvyTIP9v8Kb9rfEU/SsDZP+T9oD9fmzY+ZRHZPw/suD+vkRa/7EvRv5NunL4AsAe+lGgOSwRLA4aUaBJ0lFKUjAtvYnNlcnZhdGlvbpRoByiWYAAAAAAAAABxo8w+ZM3XuqtqFj83XcI7wMU3usGSOjxxo8w+ZM3XuqtqFj83XcI7wMU3usGSOjxxo8w+ZM3XuqtqFj83XcI7wMU3usGSOjxxo8w+ZM3XuqtqFj83XcI7wMU3usGSOjyUaA5LBEsGhpRoEnSUUpR1Lg==",
|
| 59 |
+
"achieved_goal": "[[ 0.39968446 -0.00164644 0.5875651 ]\n [ 0.39968446 -0.00164644 0.5875651 ]\n [ 0.39968446 -0.00164644 0.5875651 ]\n [ 0.39968446 -0.00164644 0.5875651 ]]",
|
| 60 |
+
"desired_goal": "[[ 1.5636214 -0.6640145 0.7714297 ]\n [ 1.7011807 1.2577481 0.17832707]\n [ 1.6958433 1.4447039 -0.58816046]\n [-1.6351295 -0.3055311 -0.13250732]]",
|
| 61 |
+
"observation": "[[ 0.39968446 -0.00164644 0.5875651 0.00593152 -0.00070104 0.01138753]\n [ 0.39968446 -0.00164644 0.5875651 0.00593152 -0.00070104 0.01138753]\n [ 0.39968446 -0.00164644 0.5875651 0.00593152 -0.00070104 0.01138753]\n [ 0.39968446 -0.00164644 0.5875651 0.00593152 -0.00070104 0.01138753]]"
|
| 62 |
},
|
| 63 |
"_last_episode_starts": {
|
| 64 |
":type:": "<class 'numpy.ndarray'>",
|
|
|
|
| 66 |
},
|
| 67 |
"_last_original_obs": {
|
| 68 |
":type:": "<class 'collections.OrderedDict'>",
|
| 69 |
+
":serialized:": "gAWVuwEAAAAAAACMC2NvbGxlY3Rpb25zlIwLT3JkZXJlZERpY3SUk5QpUpQojA1hY2hpZXZlZF9nb2FslIwSbnVtcHkuY29yZS5udW1lcmljlIwLX2Zyb21idWZmZXKUk5QoljAAAAAAAAAA6nIdPRlsGqxDI0o+6nIdPRlsGqxDI0o+6nIdPRlsGqxDI0o+6nIdPRlsGqxDI0o+lIwFbnVtcHmUjAVkdHlwZZSTlIwCZjSUiYiHlFKUKEsDjAE8lE5OTkr/////Sv////9LAHSUYksESwOGlIwBQ5R0lFKUjAxkZXNpcmVkX2dvYWyUaAcoljAAAAAAAAAARYrYveudy7x85Hg+sT+NvBKKkzyKUmM+tYl6vcolSzyWjAI+MVbYvU8KDT4wGhY9lGgOSwRLA4aUaBJ0lFKUjAtvYnNlcnZhdGlvbpRoByiWYAAAAAAAAADqch09GWwarEMjSj4AAAAAAAAAgAAAAADqch09GWwarEMjSj4AAAAAAAAAgAAAAADqch09GWwarEMjSj4AAAAAAAAAgAAAAADqch09GWwarEMjSj4AAAAAAAAAgAAAAACUaA5LBEsGhpRoEnSUUpR1Lg==",
|
| 70 |
"achieved_goal": "[[ 3.8439669e-02 -2.1944723e-12 1.9740014e-01]\n [ 3.8439669e-02 -2.1944723e-12 1.9740014e-01]\n [ 3.8439669e-02 -2.1944723e-12 1.9740014e-01]\n [ 3.8439669e-02 -2.1944723e-12 1.9740014e-01]]",
|
| 71 |
+
"desired_goal": "[[-0.10573248 -0.02485557 0.2430591 ]\n [-0.01724228 0.01801017 0.22199455]\n [-0.06116648 0.01239915 0.12748942]\n [-0.10563315 0.13773464 0.03664607]]",
|
| 72 |
"observation": "[[ 3.8439669e-02 -2.1944723e-12 1.9740014e-01 0.0000000e+00\n -0.0000000e+00 0.0000000e+00]\n [ 3.8439669e-02 -2.1944723e-12 1.9740014e-01 0.0000000e+00\n -0.0000000e+00 0.0000000e+00]\n [ 3.8439669e-02 -2.1944723e-12 1.9740014e-01 0.0000000e+00\n -0.0000000e+00 0.0000000e+00]\n [ 3.8439669e-02 -2.1944723e-12 1.9740014e-01 0.0000000e+00\n -0.0000000e+00 0.0000000e+00]]"
|
| 73 |
},
|
| 74 |
"_episode_num": 0,
|
|
|
|
| 77 |
"_current_progress_remaining": 0.0,
|
| 78 |
"ep_info_buffer": {
|
| 79 |
":type:": "<class 'collections.deque'>",
|
| 80 |
+
":serialized:": "gAWVHRAAAAAAAACMC2NvbGxlY3Rpb25zlIwFZGVxdWWUk5QpS2SGlFKUKH2UKIwBcpSMFW51bXB5LmNvcmUubXVsdGlhcnJheZSMBnNjYWxhcpSTlIwFbnVtcHmUjAVkdHlwZZSTlIwCZjiUiYiHlFKUKEsDjAE8lE5OTkr/////Sv////9LAHSUYkMIke18PzV+DMCUhpRSlIwBbJRLMowBdJRHQLAk4jtG/et1fZQoaAZoCWgPQwjU8ZiByngOwJSGlFKUaBVLMmgWR0CwI+Uiliz+dX2UKGgGaAloD0MIgCctXFYBCsCUhpRSlGgVSzJoFkdAsCL6p++dsnV9lChoBmgJaA9DCEbu6eqOBQ3AlIaUUpRoFUsyaBZHQLAh3OwgTyt1fZQoaAZoCWgPQwjRzf5AuW0RwJSGlFKUaBVLMmgWR0CwJWFUp/gBdX2UKGgGaAloD0MIyTocXaUbF8CUhpRSlGgVSzJoFkdAsCRkOuq3mXV9lChoBmgJaA9DCKuzWmCPKQ3AlIaUUpRoFUsyaBZHQLAjeb6guh91fZQoaAZoCWgPQwgGRl7WxHITwJSGlFKUaBVLMmgWR0CwIlv69CeFdX2UKGgGaAloD0MI6ITQQZcwEMCUhpRSlGgVSzJoFkdAsCXfVawD/3V9lChoBmgJaA9DCOLkfoeiwAnAlIaUUpRoFUsyaBZHQLAk4ixVyWB1fZQoaAZoCWgPQwgGEhQ/xpwNwJSGlFKUaBVLMmgWR0CwI/fIfbKzdX2UKGgGaAloD0MIlExO7QzjEcCUhpRSlGgVSzJoFkdAsCLaA2AG0XV9lChoBmgJaA9DCM8sCVBTSxvAlIaUUpRoFUsyaBZHQLAmXbQ1JlJ1fZQoaAZoCWgPQwgZjuczoE4RwJSGlFKUaBVLMmgWR0CwJWCJ9AoodX2UKGgGaAloD0MIp11MM93rDsCUhpRSlGgVSzJoFkdAsCR2HXVbzXV9lChoBmgJaA9DCC6rsBngohfAlIaUUpRoFUsyaBZHQLAjWFSsKb91fZQoaAZoCWgPQwijdOlfkroXwJSGlFKUaBVLMmgWR0CwJthX4j8ldX2UKGgGaAloD0MIqaJ4lbV9EMCUhpRSlGgVSzJoFkdAsCXbL8rI53V9lChoBmgJaA9DCNek2xK5MBLAlIaUUpRoFUsyaBZHQLAk8Lgn+hp1fZQoaAZoCWgPQwi++Q0TDUIQwJSGlFKUaBVLMmgWR0CwI9L0WdmQdX2UKGgGaAloD0MI86ykFd/QEsCUhpRSlGgVSzJoFkdAsCdhAWzninV9lChoBmgJaA9DCEyln3B2SxnAlIaUUpRoFUsyaBZHQLAmY9rGipN1fZQoaAZoCWgPQwhoz2VqEjwJwJSGlFKUaBVLMmgWR0CwJXldX1aodX2UKGgGaAloD0MIHjLlQ1BVE8CUhpRSlGgVSzJoFkdAsCRbnMdLhHV9lChoBmgJaA9DCNXQBmADUhbAlIaUUpRoFUsyaBZHQLAn266reZZ1fZQoaAZoCWgPQwh1djI4Sv4TwJSGlFKUaBVLMmgWR0CwJt6KxcFAdX2UKGgGaAloD0MIjbeVXpvtCcCUhpRSlGgVSzJoFkdAsCX0IsyzonV9lChoBmgJaA9DCO6wicxcwAXAlIaUUpRoFUsyaBZHQLAk1mMOwxF1fZQoaAZoCWgPQwjE0OrkDMULwJSGlFKUaBVLMmgWR0CwKGKS1Vo6dX2UKGgGaAloD0MIV7JjIxB/FMCUhpRSlGgVSzJoFkdAsCdlaePJaXV9lChoBmgJaA9DCGFUUiegmRrAlIaUUpRoFUsyaBZHQLAmeuctoSN1fZQoaAZoCWgPQwjkDwaee+8JwJSGlFKUaBVLMmgWR0CwJV0pqh11dX2UKGgGaAloD0MI7bsi+N8KBcCUhpRSlGgVSzJoFkdAsCje2c8Tz3V9lChoBmgJaA9DCCGRtvEnygnAlIaUUpRoFUsyaBZHQLAn4bYK6Wh1fZQoaAZoCWgPQwh/hcyVQdUGwJSGlFKUaBVLMmgWR0CwJvc+V1OkdX2UKGgGaAloD0MIRrJHqBkyC8CUhpRSlGgVSzJoFkdAsCXZkRSP2nV9lChoBmgJaA9DCHv3x3vVigzAlIaUUpRoFUsyaBZHQLApWz3AVO91fZQoaAZoCWgPQwgQlNv2PVoTwJSGlFKUaBVLMmgWR0CwKF4O6NEPdX2UKGgGaAloD0MIaww6IXQwB8CUhpRSlGgVSzJoFkdAsCdzrNW2gHV9lChoBmgJaA9DCBL6mXrdchPAlIaUUpRoFUsyaBZHQLAmVe67NB51fZQoaAZoCWgPQwhDyHn/HycIwJSGlFKUaBVLMmgWR0CwKdd8VpK0dX2UKGgGaAloD0MI2ZdsPNhCCsCUhpRSlGgVSzJoFkdAsCjaTHKfWnV9lChoBmgJaA9DCIcx6e+lsBDAlIaUUpRoFUsyaBZHQLAn78hs67x1fZQoaAZoCWgPQwjFdCFWf8QWwJSGlFKUaBVLMmgWR0CwJtIJiRW+dX2UKGgGaAloD0MIXFg33h35DcCUhpRSlGgVSzJoFkdAsCpmRxLkCHV9lChoBmgJaA9DCMgjuJGydRXAlIaUUpRoFUsyaBZHQLApaT4+KTB1fZQoaAZoCWgPQwhbfXVVoHYZwJSGlFKUaBVLMmgWR0CwKH7KFIuodX2UKGgGaAloD0MIbSBdbFpJC8CUhpRSlGgVSzJoFkdAsCdhDArQPnV9lChoBmgJaA9DCBqLprOTIRHAlIaUUpRoFUsyaBZHQLAq5No8IRh1fZQoaAZoCWgPQwiYMnBAS9cIwJSGlFKUaBVLMmgWR0CwKeeu/1xsdX2UKGgGaAloD0MIRn79EBt8EcCUhpRSlGgVSzJoFkdAsCj9N/OMVHV9lChoBmgJaA9DCBCtFW2OgxLAlIaUUpRoFUsyaBZHQLAn332mHgx1fZQoaAZoCWgPQwgBwocSLbkOwJSGlFKUaBVLMmgWR0CwK2HbmEGrdX2UKGgGaAloD0MIArfu5qlOFsCUhpRSlGgVSzJoFkdAsCpkrWiDd3V9lChoBmgJaA9DCD60jxX8hhbAlIaUUpRoFUsyaBZHQLApeigkC3h1fZQoaAZoCWgPQwhdv2A3bGsSwJSGlFKUaBVLMmgWR0CwKFxy8zyjdX2UKGgGaAloD0MIm1d1VgtMDsCUhpRSlGgVSzJoFkdAsCveYrrgO3V9lChoBmgJaA9DCAkbnl4pGxXAlIaUUpRoFUsyaBZHQLAq4T6zmfZ1fZQoaAZoCWgPQwiBI4EGm3oSwJSGlFKUaBVLMmgWR0CwKfa0D2aldX2UKGgGaAloD0MI7UW0HVO3BMCUhpRSlGgVSzJoFkdAsCjY8QqZt3V9lChoBmgJaA9DCNszSwLUtBHAlIaUUpRoFUsyaBZHQLAsWPS2H+J1fZQoaAZoCWgPQwiPpQ9dUN8OwJSGlFKUaBVLMmgWR0CwK1vJA+pwdX2UKGgGaAloD0MIP8dHizOGD8CUhpRSlGgVSzJoFkdAsCpxRMvh63V9lChoBmgJaA9DCMr6zcR0IQ3AlIaUUpRoFUsyaBZHQLApU4Pf8/F1fZQoaAZoCWgPQwgCYhIu5HEIwJSGlFKUaBVLMmgWR0CwLNr39JjEdX2UKGgGaAloD0MIHAdeLXcmCsCUhpRSlGgVSzJoFkdAsCvd4RmK7HV9lChoBmgJaA9DCHUCmggbDhLAlIaUUpRoFUsyaBZHQLAq811GLDR1fZQoaAZoCWgPQwhbecn/5C8JwJSGlFKUaBVLMmgWR0CwKdWyTpxFdX2UKGgGaAloD0MIiLzl6semCcCUhpRSlGgVSzJoFkdAsC1S1YyO73V9lChoBmgJaA9DCFyTbkvkAhLAlIaUUpRoFUsyaBZHQLAsVaXa8Hx1fZQoaAZoCWgPQwhLcyuE1YgRwJSGlFKUaBVLMmgWR0CwK2sjAzpHdX2UKGgGaAloD0MIw0Xu6epuDcCUhpRSlGgVSzJoFkdAsCpNZEDyOXV9lChoBmgJaA9DCPvqqkAtRhPAlIaUUpRoFUsyaBZHQLAt0Fkxyn11fZQoaAZoCWgPQwi1UZ0OZN0OwJSGlFKUaBVLMmgWR0CwLNMoc7yQdX2UKGgGaAloD0MI7rWg98awDMCUhpRSlGgVSzJoFkdAsCvoqMFUynV9lChoBmgJaA9DCEiHhzB++gXAlIaUUpRoFUsyaBZHQLAqyuh9LHx1fZQoaAZoCWgPQwhG7X4V4OsRwJSGlFKUaBVLMmgWR0CwLkutOmBOdX2UKGgGaAloD0MITU2CN6RxDcCUhpRSlGgVSzJoFkdAsC1OfRNRFnV9lChoBmgJaA9DCEimQ6fnjRXAlIaUUpRoFUsyaBZHQLAsY/wy6+Z1fZQoaAZoCWgPQwg+6Nms+rwMwJSGlFKUaBVLMmgWR0CwK0Y8U21ldX2UKGgGaAloD0MImpfD7jtmCcCUhpRSlGgVSzJoFkdAsC7KsRxtHnV9lChoBmgJaA9DCIeIm1PJgAvAlIaUUpRoFUsyaBZHQLAtzYpUgjh1fZQoaAZoCWgPQwhgIt46/7YJwJSGlFKUaBVLMmgWR0CwLOMGs3hodX2UKGgGaAloD0MITrNAu0MqCsCUhpRSlGgVSzJoFkdAsCvFP0qYq3V9lChoBmgJaA9DCO2BVmDIqhHAlIaUUpRoFUsyaBZHQLAvRhxo7FN1fZQoaAZoCWgPQwi1M0xtqcMOwJSGlFKUaBVLMmgWR0CwLkkDlo12dX2UKGgGaAloD0MIAcPy59vCEMCUhpRSlGgVSzJoFkdAsC1ef16E8XV9lChoBmgJaA9DCMOcoE0Ofw3AlIaUUpRoFUsyaBZHQLAsQNUwSJ11fZQoaAZoCWgPQwhNnx1wXdELwJSGlFKUaBVLMmgWR0CwL8LLdN34dX2UKGgGaAloD0MIiPNwAtMJHsCUhpRSlGgVSzJoFkdAsC7FpYcNpnV9lChoBmgJaA9DCIP4wI7/4gPAlIaUUpRoFUsyaBZHQLAt2zEaVD91fZQoaAZoCWgPQwit30xMF0IdwJSGlFKUaBVLMmgWR0CwLL2KuSwGdX2UKGgGaAloD0MIrVEP0ehuDsCUhpRSlGgVSzJoFkdAsDBBTn7pFHV9lChoBmgJaA9DCGrC9pMxBiDAlIaUUpRoFUsyaBZHQLAvRCMPz4F1fZQoaAZoCWgPQwhoQpPEkgITwJSGlFKUaBVLMmgWR0CwLlm3KB/adX2UKGgGaAloD0MIuk24V+atDsCUhpRSlGgVSzJoFkdAsC07/T9bYHV9lChoBmgJaA9DCMUe2scKPg/AlIaUUpRoFUsyaBZHQLAwwuVHFxZ1fZQoaAZoCWgPQwhkzjP2JdsOwJSGlFKUaBVLMmgWR0CwL8Wz0HyFdX2UKGgGaAloD0MILudSXFWWCsCUhpRSlGgVSzJoFkdAsC7bYRNAT3V9lChoBmgJaA9DCIgq/BnebArAlIaUUpRoFUsyaBZHQLAtveGwiaB1ZS4="
|
| 81 |
},
|
| 82 |
"ep_success_buffer": {
|
| 83 |
":type:": "<class 'collections.deque'>",
|
| 84 |
":serialized:": "gAWVIAAAAAAAAACMC2NvbGxlY3Rpb25zlIwFZGVxdWWUk5QpS2SGlFKULg=="
|
| 85 |
},
|
| 86 |
+
"_n_updates": 37500,
|
| 87 |
+
"n_steps": 10,
|
| 88 |
+
"gamma": 0.9005397464660235,
|
| 89 |
+
"gae_lambda": 0.8043567334308052,
|
| 90 |
+
"ent_coef": 0.0654376522770753,
|
| 91 |
+
"vf_coef": 0.3415400217360765,
|
| 92 |
+
"max_grad_norm": 0.472916136764715,
|
| 93 |
"normalize_advantage": false
|
| 94 |
}
|
a2c-PandaReachDense-v2/policy.optimizer.pth
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 44734
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:15d1f7b647bddddb13475ef63d82107ec7d143f789e6aa60712ac386aa18dfd8
|
| 3 |
size 44734
|
a2c-PandaReachDense-v2/policy.pth
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 46014
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:06e019b340fc87b8545ce808c2c2a57233deb05f9e5bda8493f6e10bec768a2b
|
| 3 |
size 46014
|
config.json
CHANGED
|
@@ -1 +1 @@
|
|
| 1 |
-
{"policy_class": {":type:": "<class 'abc.ABCMeta'>", ":serialized:": "gAWVRQAAAAAAAACMIXN0YWJsZV9iYXNlbGluZXMzLmNvbW1vbi5wb2xpY2llc5SMG011bHRpSW5wdXRBY3RvckNyaXRpY1BvbGljeZSTlC4=", "__module__": "stable_baselines3.common.policies", "__doc__": "\n MultiInputActorClass policy class for actor-critic algorithms (has both policy and value prediction).\n Used by A2C, PPO and the likes.\n\n :param observation_space: Observation space (Tuple)\n :param action_space: Action space\n :param lr_schedule: Learning rate schedule (could be constant)\n :param net_arch: The specification of the policy and value networks.\n :param activation_fn: Activation function\n :param ortho_init: Whether to use or not orthogonal initialization\n :param use_sde: Whether to use State Dependent Exploration or not\n :param log_std_init: Initial value for the log standard deviation\n :param full_std: Whether to use (n_features x n_actions) parameters\n for the std instead of only (n_features,) when using gSDE\n :param use_expln: Use ``expln()`` function instead of ``exp()`` to ensure\n a positive standard deviation (cf paper). It allows to keep variance\n above zero and prevent it from growing too fast. In practice, ``exp()`` is usually enough.\n :param squash_output: Whether to squash the output using a tanh function,\n this allows to ensure boundaries when using gSDE.\n :param features_extractor_class: Uses the CombinedExtractor\n :param features_extractor_kwargs: Keyword arguments\n to pass to the features extractor.\n :param share_features_extractor: If True, the features extractor is shared between the policy and value networks.\n :param normalize_images: Whether to normalize images or not,\n dividing by 255.0 (True by default)\n :param optimizer_class: The optimizer to use,\n ``th.optim.Adam`` by default\n :param optimizer_kwargs: Additional keyword arguments,\n excluding the learning rate, to pass to the optimizer\n ", "__init__": "<function MultiInputActorCriticPolicy.__init__ at 0x7fc761f10820>", "__abstractmethods__": "frozenset()", "_abc_impl": "<_abc._abc_data object at 0x7fc761f0ef40>"}, "verbose": 1, "policy_kwargs": {":type:": "<class 'dict'>", ":serialized:": "gAWVgQAAAAAAAAB9lCiMD29wdGltaXplcl9jbGFzc5SME3RvcmNoLm9wdGltLnJtc3Byb3CUjAdSTVNwcm9wlJOUjBBvcHRpbWl6ZXJfa3dhcmdzlH2UKIwFYWxwaGGURz/vrhR64UeujANlcHOURz7k+LWI42jxjAx3ZWlnaHRfZGVjYXmUSwB1dS4=", "optimizer_class": "<class 'torch.optim.rmsprop.RMSprop'>", "optimizer_kwargs": {"alpha": 0.99, "eps": 1e-05, "weight_decay": 0}}, "observation_space": {":type:": "<class 'gym.spaces.dict.Dict'>", ":serialized:": "gAWVUgMAAAAAAACMD2d5bS5zcGFjZXMuZGljdJSMBERpY3SUk5QpgZR9lCiMBnNwYWNlc5SMC2NvbGxlY3Rpb25zlIwLT3JkZXJlZERpY3SUk5QpUpQojA1hY2hpZXZlZF9nb2FslIwOZ3ltLnNwYWNlcy5ib3iUjANCb3iUk5QpgZR9lCiMBWR0eXBllIwFbnVtcHmUaBCTlIwCZjSUiYiHlFKUKEsDjAE8lE5OTkr/////Sv////9LAHSUYowGX3NoYXBllEsDhZSMA2xvd5SMEm51bXB5LmNvcmUubnVtZXJpY5SMC19mcm9tYnVmZmVylJOUKJYMAAAAAAAAAAAAIMEAACDBAAAgwZRoFUsDhZSMAUOUdJRSlIwEaGlnaJRoHSiWDAAAAAAAAAAAACBBAAAgQQAAIEGUaBVLA4WUaCB0lFKUjA1ib3VuZGVkX2JlbG93lGgdKJYDAAAAAAAAAAEBAZRoEowCYjGUiYiHlFKUKEsDjAF8lE5OTkr/////Sv////9LAHSUYksDhZRoIHSUUpSMDWJvdW5kZWRfYWJvdmWUaB0olgMAAAAAAAAAAQEBlGgsSwOFlGggdJRSlIwKX25wX3JhbmRvbZROdWKMDGRlc2lyZWRfZ29hbJRoDSmBlH2UKGgQaBVoGEsDhZRoGmgdKJYMAAAAAAAAAAAAIMEAACDBAAAgwZRoFUsDhZRoIHSUUpRoI2gdKJYMAAAAAAAAAAAAIEEAACBBAAAgQZRoFUsDhZRoIHSUUpRoKGgdKJYDAAAAAAAAAAEBAZRoLEsDhZRoIHSUUpRoMmgdKJYDAAAAAAAAAAEBAZRoLEsDhZRoIHSUUpRoN051YowLb2JzZXJ2YXRpb26UaA0pgZR9lChoEGgVaBhLBoWUaBpoHSiWGAAAAAAAAAAAACDBAAAgwQAAIMEAACDBAAAgwQAAIMGUaBVLBoWUaCB0lFKUaCNoHSiWGAAAAAAAAAAAACBBAAAgQQAAIEEAACBBAAAgQQAAIEGUaBVLBoWUaCB0lFKUaChoHSiWBgAAAAAAAAABAQEBAQGUaCxLBoWUaCB0lFKUaDJoHSiWBgAAAAAAAAABAQEBAQGUaCxLBoWUaCB0lFKUaDdOdWJ1aBhOaBBOaDdOdWIu", "spaces": "OrderedDict([('achieved_goal', Box([-10. -10. -10.], [10. 10. 10.], (3,), float32)), ('desired_goal', Box([-10. -10. -10.], [10. 10. 10.], (3,), float32)), ('observation', Box([-10. -10. -10. -10. -10. -10.], [10. 10. 10. 10. 10. 10.], (6,), float32))])", "_shape": null, "dtype": null, "_np_random": null}, "action_space": {":type:": "<class 'gym.spaces.box.Box'>", ":serialized:": "gAWVbQEAAAAAAACMDmd5bS5zcGFjZXMuYm94lIwDQm94lJOUKYGUfZQojAVkdHlwZZSMBW51bXB5lGgFk5SMAmY0lImIh5RSlChLA4wBPJROTk5K/////0r/////SwB0lGKMBl9zaGFwZZRLA4WUjANsb3eUjBJudW1weS5jb3JlLm51bWVyaWOUjAtfZnJvbWJ1ZmZlcpSTlCiWDAAAAAAAAAAAAIC/AACAvwAAgL+UaApLA4WUjAFDlHSUUpSMBGhpZ2iUaBIolgwAAAAAAAAAAACAPwAAgD8AAIA/lGgKSwOFlGgVdJRSlIwNYm91bmRlZF9iZWxvd5RoEiiWAwAAAAAAAAABAQGUaAeMAmIxlImIh5RSlChLA4wBfJROTk5K/////0r/////SwB0lGJLA4WUaBV0lFKUjA1ib3VuZGVkX2Fib3ZllGgSKJYDAAAAAAAAAAEBAZRoIUsDhZRoFXSUUpSMCl9ucF9yYW5kb22UTnViLg==", "dtype": "float32", "_shape": [3], "low": "[-1. -1. -1.]", "high": "[1. 1. 1.]", "bounded_below": "[ True True True]", "bounded_above": "[ True True True]", "_np_random": null}, "n_envs": 4, "num_timesteps": 1000000, "_total_timesteps": 1000000, "_num_timesteps_at_start": 0, "seed": null, "action_noise": null, "start_time": 1677353986590013500, "learning_rate": 0.0007, "tensorboard_log": null, "lr_schedule": {":type:": "<class 'function'>", ":serialized:": "gAWV7wIAAAAAAACMF2Nsb3VkcGlja2xlLmNsb3VkcGlja2xllIwOX21ha2VfZnVuY3Rpb26Uk5QoaACMDV9idWlsdGluX3R5cGWUk5SMCENvZGVUeXBllIWUUpQoSwFLAEsASwFLAUsTQwSIAFMAlE6FlCmMAV+UhZSMXi9yb290L21pbmljb25kYTMvZW52cy9kZWVwLXJsLWhmL2xpYi9weXRob24zLjkvc2l0ZS1wYWNrYWdlcy9zdGFibGVfYmFzZWxpbmVzMy9jb21tb24vdXRpbHMucHmUjARmdW5jlEuCQwIAAZSMA3ZhbJSFlCl0lFKUfZQojAtfX3BhY2thZ2VfX5SMGHN0YWJsZV9iYXNlbGluZXMzLmNvbW1vbpSMCF9fbmFtZV9flIwec3RhYmxlX2Jhc2VsaW5lczMuY29tbW9uLnV0aWxzlIwIX19maWxlX1+UjF4vcm9vdC9taW5pY29uZGEzL2VudnMvZGVlcC1ybC1oZi9saWIvcHl0aG9uMy45L3NpdGUtcGFja2FnZXMvc3RhYmxlX2Jhc2VsaW5lczMvY29tbW9uL3V0aWxzLnB5lHVOTmgAjBBfbWFrZV9lbXB0eV9jZWxslJOUKVKUhZR0lFKUjBxjbG91ZHBpY2tsZS5jbG91ZHBpY2tsZV9mYXN0lIwSX2Z1bmN0aW9uX3NldHN0YXRllJOUaB99lH2UKGgWaA2MDF9fcXVhbG5hbWVfX5SMGWNvbnN0YW50X2ZuLjxsb2NhbHM+LmZ1bmOUjA9fX2Fubm90YXRpb25zX1+UfZSMDl9fa3dkZWZhdWx0c19flE6MDF9fZGVmYXVsdHNfX5ROjApfX21vZHVsZV9flGgXjAdfX2RvY19flE6MC19fY2xvc3VyZV9flGgAjApfbWFrZV9jZWxslJOURz9G8AaNuLrHhZRSlIWUjBdfY2xvdWRwaWNrbGVfc3VibW9kdWxlc5RdlIwLX19nbG9iYWxzX1+UfZR1hpSGUjAu"}, "_last_obs": {":type:": "<class 'collections.OrderedDict'>", ":serialized:": "gAWVuwEAAAAAAACMC2NvbGxlY3Rpb25zlIwLT3JkZXJlZERpY3SUk5QpUpQojA1hY2hpZXZlZF9nb2FslIwSbnVtcHkuY29yZS5udW1lcmljlIwLX2Zyb21idWZmZXKUk5QoljAAAAAAAAAAShfQPjyUED10gxk/ShfQPjyUED10gxk/ShfQPjyUED10gxk/ShfQPjyUED10gxk/lIwFbnVtcHmUjAVkdHlwZZSTlIwCZjSUiYiHlFKUKEsDjAE8lE5OTkr/////Sv////9LAHSUYksESwOGlIwBQ5R0lFKUjAxkZXNpcmVkX2dvYWyUaAcoljAAAAAAAAAAtJYkPyhmQz/Sd6Q/wYBHv7Qpej/VkVC/dLK5v27qRr/b9Do/XLBXPb8dur9CqWc/lGgOSwRLA4aUaBJ0lFKUjAtvYnNlcnZhdGlvbpRoByiWYAAAAAAAAABKF9A+PJQQPXSDGT/fe4a5kWVrOX37f7tKF9A+PJQQPXSDGT/fe4a5kWVrOX37f7tKF9A+PJQQPXSDGT/fe4a5kWVrOX37f7tKF9A+PJQQPXSDGT/fe4a5kWVrOX37f7uUaA5LBEsGhpRoEnSUUpR1Lg==", "achieved_goal": "[[0.40642768 0.03529762 0.59966207]\n [0.40642768 0.03529762 0.59966207]\n [0.40642768 0.03529762 0.59966207]\n [0.40642768 0.03529762 0.59966207]]", "desired_goal": "[[ 0.64292455 0.76327753 1.2849066 ]\n [-0.7793084 0.97719884 -0.8147252 ]\n [-1.4507585 -0.7770146 0.7302987 ]\n [ 0.05265842 -1.4540328 0.9049264 ]]", "observation": "[[ 4.0642768e-01 3.5297617e-02 5.9966207e-01 -2.5650763e-04\n 2.2449183e-04 -3.9059811e-03]\n [ 4.0642768e-01 3.5297617e-02 5.9966207e-01 -2.5650763e-04\n 2.2449183e-04 -3.9059811e-03]\n [ 4.0642768e-01 3.5297617e-02 5.9966207e-01 -2.5650763e-04\n 2.2449183e-04 -3.9059811e-03]\n [ 4.0642768e-01 3.5297617e-02 5.9966207e-01 -2.5650763e-04\n 2.2449183e-04 -3.9059811e-03]]"}, "_last_episode_starts": {":type:": "<class 'numpy.ndarray'>", ":serialized:": "gAWVdwAAAAAAAACMEm51bXB5LmNvcmUubnVtZXJpY5SMC19mcm9tYnVmZmVylJOUKJYEAAAAAAAAAAEBAQGUjAVudW1weZSMBWR0eXBllJOUjAJiMZSJiIeUUpQoSwOMAXyUTk5OSv////9K/////0sAdJRiSwSFlIwBQ5R0lFKULg=="}, "_last_original_obs": {":type:": "<class 'collections.OrderedDict'>", ":serialized:": "gAWVuwEAAAAAAACMC2NvbGxlY3Rpb25zlIwLT3JkZXJlZERpY3SUk5QpUpQojA1hY2hpZXZlZF9nb2FslIwSbnVtcHkuY29yZS5udW1lcmljlIwLX2Zyb21idWZmZXKUk5QoljAAAAAAAAAA6nIdPRlsGqxDI0o+6nIdPRlsGqxDI0o+6nIdPRlsGqxDI0o+6nIdPRlsGqxDI0o+lIwFbnVtcHmUjAVkdHlwZZSTlIwCZjSUiYiHlFKUKEsDjAE8lE5OTkr/////Sv////9LAHSUYksESwOGlIwBQ5R0lFKUjAxkZXNpcmVkX2dvYWyUaAcoljAAAAAAAAAABTK/vZOHIzssK509p2jKPepE3z19mVw+gNwjPMH4zz0J/PE9x0+YvZkqAj78sAA+lGgOSwRLA4aUaBJ0lFKUjAtvYnNlcnZhdGlvbpRoByiWYAAAAAAAAADqch09GWwarEMjSj4AAAAAAAAAgAAAAADqch09GWwarEMjSj4AAAAAAAAAgAAAAADqch09GWwarEMjSj4AAAAAAAAAgAAAAADqch09GWwarEMjSj4AAAAAAAAAgAAAAACUaA5LBEsGhpRoEnSUUpR1Lg==", "achieved_goal": "[[ 3.8439669e-02 -2.1944723e-12 1.9740014e-01]\n [ 3.8439669e-02 -2.1944723e-12 1.9740014e-01]\n [ 3.8439669e-02 -2.1944723e-12 1.9740014e-01]\n [ 3.8439669e-02 -2.1944723e-12 1.9740014e-01]]", "desired_goal": "[[-0.09335712 0.00249526 0.0767425 ]\n [ 0.09883242 0.10901816 0.21542926]\n [ 0.0100013 0.10154868 0.1181565 ]\n [-0.07437091 0.12711562 0.12567514]]", "observation": "[[ 3.8439669e-02 -2.1944723e-12 1.9740014e-01 0.0000000e+00\n -0.0000000e+00 0.0000000e+00]\n [ 3.8439669e-02 -2.1944723e-12 1.9740014e-01 0.0000000e+00\n -0.0000000e+00 0.0000000e+00]\n [ 3.8439669e-02 -2.1944723e-12 1.9740014e-01 0.0000000e+00\n -0.0000000e+00 0.0000000e+00]\n [ 3.8439669e-02 -2.1944723e-12 1.9740014e-01 0.0000000e+00\n -0.0000000e+00 0.0000000e+00]]"}, "_episode_num": 0, "use_sde": false, "sde_sample_freq": -1, "_current_progress_remaining": 0.0, "ep_info_buffer": {":type:": "<class 'collections.deque'>", ":serialized:": "gAWVHRAAAAAAAACMC2NvbGxlY3Rpb25zlIwFZGVxdWWUk5QpS2SGlFKUKH2UKIwBcpSMFW51bXB5LmNvcmUubXVsdGlhcnJheZSMBnNjYWxhcpSTlIwFbnVtcHmUjAVkdHlwZZSTlIwCZjiUiYiHlFKUKEsDjAE8lE5OTkr/////Sv////9LAHSUYkMIzlFHx9WICMCUhpRSlIwBbJRLMowBdJRHQKbWD03fhuR1fZQoaAZoCWgPQwio4PCCiKQSwJSGlFKUaBVLMmgWR0Cm1d/iHZbqdX2UKGgGaAloD0MI+nspPGgWC8CUhpRSlGgVSzJoFkdAptWrDMvAXXV9lChoBmgJaA9DCOY/pN++fhHAlIaUUpRoFUsyaBZHQKbVep+c6Nl1fZQoaAZoCWgPQwiX4xWInvQNwJSGlFKUaBVLMmgWR0Cm1y/WtlqbdX2UKGgGaAloD0MI+zxGeeYlEMCUhpRSlGgVSzJoFkdAptcAZ0jkdXV9lChoBmgJaA9DCL5KPnYXOBDAlIaUUpRoFUsyaBZHQKbWy3solUp1fZQoaAZoCWgPQwj5SEp6GNoOwJSGlFKUaBVLMmgWR0Cm1ptATqSpdX2UKGgGaAloD0MIXWqEfqYuFsCUhpRSlGgVSzJoFkdAptheOQyRCHV9lChoBmgJaA9DCOup1VdXhRPAlIaUUpRoFUsyaBZHQKbYLsqJ/G51fZQoaAZoCWgPQwjBVZ5A2HkZwJSGlFKUaBVLMmgWR0Cm1/ocrAgxdX2UKGgGaAloD0MI8rVnlgRIDcCUhpRSlGgVSzJoFkdAptfJsZYPoXV9lChoBmgJaA9DCJIf8SvWsAvAlIaUUpRoFUsyaBZHQKbZfwR5C4V1fZQoaAZoCWgPQwjVWS2wx0QQwJSGlFKUaBVLMmgWR0Cm2U92Pkq+dX2UKGgGaAloD0MI8E+pEmUfFcCUhpRSlGgVSzJoFkdAptkamj0tiHV9lChoBmgJaA9DCNyfi4aMpw7AlIaUUpRoFUsyaBZHQKbY6rHU+cJ1fZQoaAZoCWgPQwgc7bjhdxMMwJSGlFKUaBVLMmgWR0Cm2pwRPGhmdX2UKGgGaAloD0MIdytLdJY5BsCUhpRSlGgVSzJoFkdAptpsuanaWXV9lChoBmgJaA9DCP4mFCLgcAvAlIaUUpRoFUsyaBZHQKbaOA7Pppx1fZQoaAZoCWgPQwg/jXvzG6YHwJSGlFKUaBVLMmgWR0Cm2geKTB69dX2UKGgGaAloD0MI29/ZHr0BDcCUhpRSlGgVSzJoFkdAptuxOpKjBXV9lChoBmgJaA9DCOOON/kteg3AlIaUUpRoFUsyaBZHQKbbgbQ1JlJ1fZQoaAZoCWgPQwjGTQ00n/MMwJSGlFKUaBVLMmgWR0Cm20zo2XLNdX2UKGgGaAloD0MIDAVsByM2BMCUhpRSlGgVSzJoFkdAptsckdFOPHV9lChoBmgJaA9DCOSG3023LBfAlIaUUpRoFUsyaBZHQKbc2vFFUhp1fZQoaAZoCWgPQwiMnfASnHoRwJSGlFKUaBVLMmgWR0Cm3KuiWVu8dX2UKGgGaAloD0MIB0Dc1asIFMCUhpRSlGgVSzJoFkdAptx22oegc3V9lChoBmgJaA9DCGCwG7YtyhDAlIaUUpRoFUsyaBZHQKbcRmOEM9d1fZQoaAZoCWgPQwgBwLFnz/UTwJSGlFKUaBVLMmgWR0Cm3gcPvrnldX2UKGgGaAloD0MI5SX/k7/bDMCUhpRSlGgVSzJoFkdApt3Xn8sMAnV9lChoBmgJaA9DCOz6Bbth+wrAlIaUUpRoFUsyaBZHQKbdoySmqHZ1fZQoaAZoCWgPQwiCV8udmYAKwJSGlFKUaBVLMmgWR0Cm3XKhcqvvdX2UKGgGaAloD0MIU3dlFwyOEsCUhpRSlGgVSzJoFkdApt8tanrIHXV9lChoBmgJaA9DCC5ZFeEmww3AlIaUUpRoFUsyaBZHQKbe/fAsTWZ1fZQoaAZoCWgPQwgY6xuY3GgLwJSGlFKUaBVLMmgWR0Cm3slVcUuddX2UKGgGaAloD0MIfvylRX3SCsCUhpRSlGgVSzJoFkdApt6Y5cTrV3V9lChoBmgJaA9DCEuTUtDtNRrAlIaUUpRoFUsyaBZHQKbgRy4nWrh1fZQoaAZoCWgPQwhoQpPEkoIRwJSGlFKUaBVLMmgWR0Cm4BfRNRFadX2UKGgGaAloD0MIh2wgXWy6EsCUhpRSlGgVSzJoFkdApt/i9mHxjXV9lChoBmgJaA9DCPgyUYTULRXAlIaUUpRoFUsyaBZHQKbfspEx7At1fZQoaAZoCWgPQwhd4PJYM7IIwJSGlFKUaBVLMmgWR0Cm4WNPP9k0dX2UKGgGaAloD0MIc4QM5NkFEsCUhpRSlGgVSzJoFkdApuE0IcBEKHV9lChoBmgJaA9DCIHtYMQ+oRjAlIaUUpRoFUsyaBZHQKbg/0KZ2IR1fZQoaAZoCWgPQwi6o//lWiQQwJSGlFKUaBVLMmgWR0Cm4M7kfcN6dX2UKGgGaAloD0MI9kIB28HoGsCUhpRSlGgVSzJoFkdApuKSfQKKHnV9lChoBmgJaA9DCLYuNUI/4xPAlIaUUpRoFUsyaBZHQKbiYwpON5t1fZQoaAZoCWgPQwjEP2zp0dQVwJSGlFKUaBVLMmgWR0Cm4i5HNHH4dX2UKGgGaAloD0MIFJSilXuxEcCUhpRSlGgVSzJoFkdApuH+NHYpUnV9lChoBmgJaA9DCJQT7SqkfBjAlIaUUpRoFUsyaBZHQKbjuRSxZ+x1fZQoaAZoCWgPQwjByTZwB2oOwJSGlFKUaBVLMmgWR0Cm44muTzNEdX2UKGgGaAloD0MIQu4iTFHuEsCUhpRSlGgVSzJoFkdApuNVeQdS23V9lChoBmgJaA9DCD7KiAtAUxjAlIaUUpRoFUsyaBZHQKbjJPLxI8R1fZQoaAZoCWgPQwj2mbM+5XgPwJSGlFKUaBVLMmgWR0Cm5Ply7wrldX2UKGgGaAloD0MIBAEydOygFMCUhpRSlGgVSzJoFkdApuTKkIomX3V9lChoBmgJaA9DCB1WuOUjqRHAlIaUUpRoFUsyaBZHQKbkldIGyHF1fZQoaAZoCWgPQwjImSZsPykVwJSGlFKUaBVLMmgWR0Cm5GWQOnVHdX2UKGgGaAloD0MIW5VE9kFGFMCUhpRSlGgVSzJoFkdApuYdeF+NLnV9lChoBmgJaA9DCEV/aObJNRjAlIaUUpRoFUsyaBZHQKbl7etSydF1fZQoaAZoCWgPQwhpjqz8MhgQwJSGlFKUaBVLMmgWR0Cm5bkOZssQdX2UKGgGaAloD0MIVvDbEON1DsCUhpRSlGgVSzJoFkdApuWIk9lmOHV9lChoBmgJaA9DCPmDgefeAxDAlIaUUpRoFUsyaBZHQKbnXyU9pyp1fZQoaAZoCWgPQwj3lJwTezgUwJSGlFKUaBVLMmgWR0Cm5y+vpyIYdX2UKGgGaAloD0MIYVW9/E4TDcCUhpRSlGgVSzJoFkdApub7HdXT3XV9lChoBmgJaA9DCEIKnkKu9A3AlIaUUpRoFUsyaBZHQKbmyq2jO9p1fZQoaAZoCWgPQwhk6NhBJX4TwJSGlFKUaBVLMmgWR0Cm6IfmDDjzdX2UKGgGaAloD0MIVft0PGYgFcCUhpRSlGgVSzJoFkdApuhYydnTRnV9lChoBmgJaA9DCDlE3JxKJgPAlIaUUpRoFUsyaBZHQKboI+9Jz1d1fZQoaAZoCWgPQwiDMSJRaDkRwJSGlFKUaBVLMmgWR0Cm5/NwJgLJdX2UKGgGaAloD0MIlX7C2a2VEcCUhpRSlGgVSzJoFkdApunMBS1ma3V9lChoBmgJaA9DCDIdOj3vJgrAlIaUUpRoFUsyaBZHQKbpnL5AQg91fZQoaAZoCWgPQwiKIqRuZy8UwJSGlFKUaBVLMmgWR0Cm6WgwoLG8dX2UKGgGaAloD0MI6Qq2EU82CsCUhpRSlGgVSzJoFkdApuk3uJDVpnV9lChoBmgJaA9DCGYQH9jx/w/AlIaUUpRoFUsyaBZHQKbq8/5+H8F1fZQoaAZoCWgPQwgfTfVk/jEMwJSGlFKUaBVLMmgWR0Cm6sTDn/1hdX2UKGgGaAloD0MInkSEfxHEEcCUhpRSlGgVSzJoFkdApuqP4dp7C3V9lChoBmgJaA9DCKQ4Rx0dVxHAlIaUUpRoFUsyaBZHQKbqX+jua4N1fZQoaAZoCWgPQwg5CaUvhMwRwJSGlFKUaBVLMmgWR0Cm7A6z/p+udX2UKGgGaAloD0MIiXssfegiGsCUhpRSlGgVSzJoFkdApuvfYQJ5V3V9lChoBmgJaA9DCDmaIyu/fBTAlIaUUpRoFUsyaBZHQKbrqrd30PJ1fZQoaAZoCWgPQwh/TGvT2O4QwJSGlFKUaBVLMmgWR0Cm63phF3INdX2UKGgGaAloD0MI/FI/byqSD8CUhpRSlGgVSzJoFkdApu0edf9gnnV9lChoBmgJaA9DCC82rRQCOQTAlIaUUpRoFUsyaBZHQKbs7uvUz9F1fZQoaAZoCWgPQwgkmdU73E4SwJSGlFKUaBVLMmgWR0Cm7LokAxSHdX2UKGgGaAloD0MIbeF5qdi4DcCUhpRSlGgVSzJoFkdApuyJnQID5nV9lChoBmgJaA9DCCbFxydkhxDAlIaUUpRoFUsyaBZHQKbuWLsKLKp1fZQoaAZoCWgPQwhXQKGePoIUwJSGlFKUaBVLMmgWR0Cm7ilrM1TBdX2UKGgGaAloD0MIeQPMfAd/EcCUhpRSlGgVSzJoFkdApu30pqh11XV9lChoBmgJaA9DCFMiiV5GURTAlIaUUpRoFUsyaBZHQKbtxDQZ4wB1fZQoaAZoCWgPQwgLYwtBDmoRwJSGlFKUaBVLMmgWR0Cm74DbBXS0dX2UKGgGaAloD0MIYYicvp5/EsCUhpRSlGgVSzJoFkdApu9RrHlwLnV9lChoBmgJaA9DCMvXZfhPZxXAlIaUUpRoFUsyaBZHQKbvHPFefI11fZQoaAZoCWgPQwjx2To42LsVwJSGlFKUaBVLMmgWR0Cm7uyYXwb3dX2UKGgGaAloD0MIYvcdw2NfDMCUhpRSlGgVSzJoFkdApvCu2TgVGnV9lChoBmgJaA9DCHkfR3NkhQ7AlIaUUpRoFUsyaBZHQKbwf1JUYKp1fZQoaAZoCWgPQwjb3JiesMQPwJSGlFKUaBVLMmgWR0Cm8Eqqfe1sdX2UKGgGaAloD0MIh086kWDaFsCUhpRSlGgVSzJoFkdApvAaSTyJ9HV9lChoBmgJaA9DCOFh2jf3NxDAlIaUUpRoFUsyaBZHQKbx7bBXS0B1fZQoaAZoCWgPQwhWDcLc7sUUwJSGlFKUaBVLMmgWR0Cm8b5k078vdX2UKGgGaAloD0MI8E3TZwf8EcCUhpRSlGgVSzJoFkdApvGJ26kIonV9lChoBmgJaA9DCKlr7X2q6hDAlIaUUpRoFUsyaBZHQKbxWdo371t1ZS4="}, "ep_success_buffer": {":type:": "<class 'collections.deque'>", ":serialized:": "gAWVIAAAAAAAAACMC2NvbGxlY3Rpb25zlIwFZGVxdWWUk5QpS2SGlFKULg=="}, "_n_updates": 50000, "n_steps": 5, "gamma": 0.99, "gae_lambda": 1.0, "ent_coef": 0.0, "vf_coef": 0.5, "max_grad_norm": 0.5, "normalize_advantage": false, "system_info": {"OS": "Linux-5.10.16.3-microsoft-standard-WSL2-x86_64-with-glibc2.31 # 1 SMP Fri Apr 2 22:23:49 UTC 2021", "Python": "3.9.16", "Stable-Baselines3": "1.7.0", "PyTorch": "1.13.1+cu117", "GPU Enabled": "True", "Numpy": "1.24.2", "Gym": "0.21.0"}}
|
|
|
|
| 1 |
+
{"policy_class": {":type:": "<class 'abc.ABCMeta'>", ":serialized:": "gAWVRQAAAAAAAACMIXN0YWJsZV9iYXNlbGluZXMzLmNvbW1vbi5wb2xpY2llc5SMG011bHRpSW5wdXRBY3RvckNyaXRpY1BvbGljeZSTlC4=", "__module__": "stable_baselines3.common.policies", "__doc__": "\n MultiInputActorClass policy class for actor-critic algorithms (has both policy and value prediction).\n Used by A2C, PPO and the likes.\n\n :param observation_space: Observation space (Tuple)\n :param action_space: Action space\n :param lr_schedule: Learning rate schedule (could be constant)\n :param net_arch: The specification of the policy and value networks.\n :param activation_fn: Activation function\n :param ortho_init: Whether to use or not orthogonal initialization\n :param use_sde: Whether to use State Dependent Exploration or not\n :param log_std_init: Initial value for the log standard deviation\n :param full_std: Whether to use (n_features x n_actions) parameters\n for the std instead of only (n_features,) when using gSDE\n :param use_expln: Use ``expln()`` function instead of ``exp()`` to ensure\n a positive standard deviation (cf paper). It allows to keep variance\n above zero and prevent it from growing too fast. In practice, ``exp()`` is usually enough.\n :param squash_output: Whether to squash the output using a tanh function,\n this allows to ensure boundaries when using gSDE.\n :param features_extractor_class: Uses the CombinedExtractor\n :param features_extractor_kwargs: Keyword arguments\n to pass to the features extractor.\n :param share_features_extractor: If True, the features extractor is shared between the policy and value networks.\n :param normalize_images: Whether to normalize images or not,\n dividing by 255.0 (True by default)\n :param optimizer_class: The optimizer to use,\n ``th.optim.Adam`` by default\n :param optimizer_kwargs: Additional keyword arguments,\n excluding the learning rate, to pass to the optimizer\n ", "__init__": "<function MultiInputActorCriticPolicy.__init__ at 0x7f7dec4bae50>", "__abstractmethods__": "frozenset()", "_abc_impl": "<_abc._abc_data object at 0x7f7dec4bbbc0>"}, "verbose": 1, "policy_kwargs": {":type:": "<class 'dict'>", ":serialized:": "gAWVgQAAAAAAAAB9lCiMD29wdGltaXplcl9jbGFzc5SME3RvcmNoLm9wdGltLnJtc3Byb3CUjAdSTVNwcm9wlJOUjBBvcHRpbWl6ZXJfa3dhcmdzlH2UKIwFYWxwaGGURz/vrhR64UeujANlcHOURz7k+LWI42jxjAx3ZWlnaHRfZGVjYXmUSwB1dS4=", "optimizer_class": "<class 'torch.optim.rmsprop.RMSprop'>", "optimizer_kwargs": {"alpha": 0.99, "eps": 1e-05, "weight_decay": 0}}, "observation_space": {":type:": "<class 'gym.spaces.dict.Dict'>", ":serialized:": "gAWVUgMAAAAAAACMD2d5bS5zcGFjZXMuZGljdJSMBERpY3SUk5QpgZR9lCiMBnNwYWNlc5SMC2NvbGxlY3Rpb25zlIwLT3JkZXJlZERpY3SUk5QpUpQojA1hY2hpZXZlZF9nb2FslIwOZ3ltLnNwYWNlcy5ib3iUjANCb3iUk5QpgZR9lCiMBWR0eXBllIwFbnVtcHmUaBCTlIwCZjSUiYiHlFKUKEsDjAE8lE5OTkr/////Sv////9LAHSUYowGX3NoYXBllEsDhZSMA2xvd5SMEm51bXB5LmNvcmUubnVtZXJpY5SMC19mcm9tYnVmZmVylJOUKJYMAAAAAAAAAAAAIMEAACDBAAAgwZRoFUsDhZSMAUOUdJRSlIwEaGlnaJRoHSiWDAAAAAAAAAAAACBBAAAgQQAAIEGUaBVLA4WUaCB0lFKUjA1ib3VuZGVkX2JlbG93lGgdKJYDAAAAAAAAAAEBAZRoEowCYjGUiYiHlFKUKEsDjAF8lE5OTkr/////Sv////9LAHSUYksDhZRoIHSUUpSMDWJvdW5kZWRfYWJvdmWUaB0olgMAAAAAAAAAAQEBlGgsSwOFlGggdJRSlIwKX25wX3JhbmRvbZROdWKMDGRlc2lyZWRfZ29hbJRoDSmBlH2UKGgQaBVoGEsDhZRoGmgdKJYMAAAAAAAAAAAAIMEAACDBAAAgwZRoFUsDhZRoIHSUUpRoI2gdKJYMAAAAAAAAAAAAIEEAACBBAAAgQZRoFUsDhZRoIHSUUpRoKGgdKJYDAAAAAAAAAAEBAZRoLEsDhZRoIHSUUpRoMmgdKJYDAAAAAAAAAAEBAZRoLEsDhZRoIHSUUpRoN051YowLb2JzZXJ2YXRpb26UaA0pgZR9lChoEGgVaBhLBoWUaBpoHSiWGAAAAAAAAAAAACDBAAAgwQAAIMEAACDBAAAgwQAAIMGUaBVLBoWUaCB0lFKUaCNoHSiWGAAAAAAAAAAAACBBAAAgQQAAIEEAACBBAAAgQQAAIEGUaBVLBoWUaCB0lFKUaChoHSiWBgAAAAAAAAABAQEBAQGUaCxLBoWUaCB0lFKUaDJoHSiWBgAAAAAAAAABAQEBAQGUaCxLBoWUaCB0lFKUaDdOdWJ1aBhOaBBOaDdOdWIu", "spaces": "OrderedDict([('achieved_goal', Box([-10. -10. -10.], [10. 10. 10.], (3,), float32)), ('desired_goal', Box([-10. -10. -10.], [10. 10. 10.], (3,), float32)), ('observation', Box([-10. -10. -10. -10. -10. -10.], [10. 10. 10. 10. 10. 10.], (6,), float32))])", "_shape": null, "dtype": null, "_np_random": null}, "action_space": {":type:": "<class 'gym.spaces.box.Box'>", ":serialized:": "gAWVbQEAAAAAAACMDmd5bS5zcGFjZXMuYm94lIwDQm94lJOUKYGUfZQojAVkdHlwZZSMBW51bXB5lGgFk5SMAmY0lImIh5RSlChLA4wBPJROTk5K/////0r/////SwB0lGKMBl9zaGFwZZRLA4WUjANsb3eUjBJudW1weS5jb3JlLm51bWVyaWOUjAtfZnJvbWJ1ZmZlcpSTlCiWDAAAAAAAAAAAAIC/AACAvwAAgL+UaApLA4WUjAFDlHSUUpSMBGhpZ2iUaBIolgwAAAAAAAAAAACAPwAAgD8AAIA/lGgKSwOFlGgVdJRSlIwNYm91bmRlZF9iZWxvd5RoEiiWAwAAAAAAAAABAQGUaAeMAmIxlImIh5RSlChLA4wBfJROTk5K/////0r/////SwB0lGJLA4WUaBV0lFKUjA1ib3VuZGVkX2Fib3ZllGgSKJYDAAAAAAAAAAEBAZRoIUsDhZRoFXSUUpSMCl9ucF9yYW5kb22UTnViLg==", "dtype": "float32", "_shape": [3], "low": "[-1. -1. -1.]", "high": "[1. 1. 1.]", "bounded_below": "[ True True True]", "bounded_above": "[ True True True]", "_np_random": null}, "n_envs": 4, "num_timesteps": 1500000, "_total_timesteps": 1500000, "_num_timesteps_at_start": 0, "seed": null, "action_noise": null, "start_time": 1677446129579181900, "learning_rate": 0.00010679258738466367, "tensorboard_log": null, "lr_schedule": {":type:": "<class 'function'>", ":serialized:": "gAWV7wIAAAAAAACMF2Nsb3VkcGlja2xlLmNsb3VkcGlja2xllIwOX21ha2VfZnVuY3Rpb26Uk5QoaACMDV9idWlsdGluX3R5cGWUk5SMCENvZGVUeXBllIWUUpQoSwFLAEsASwFLAUsTQwSIAFMAlE6FlCmMAV+UhZSMXi9yb290L21pbmljb25kYTMvZW52cy9kZWVwLXJsLWhmL2xpYi9weXRob24zLjkvc2l0ZS1wYWNrYWdlcy9zdGFibGVfYmFzZWxpbmVzMy9jb21tb24vdXRpbHMucHmUjARmdW5jlEuCQwIAAZSMA3ZhbJSFlCl0lFKUfZQojAtfX3BhY2thZ2VfX5SMGHN0YWJsZV9iYXNlbGluZXMzLmNvbW1vbpSMCF9fbmFtZV9flIwec3RhYmxlX2Jhc2VsaW5lczMuY29tbW9uLnV0aWxzlIwIX19maWxlX1+UjF4vcm9vdC9taW5pY29uZGEzL2VudnMvZGVlcC1ybC1oZi9saWIvcHl0aG9uMy45L3NpdGUtcGFja2FnZXMvc3RhYmxlX2Jhc2VsaW5lczMvY29tbW9uL3V0aWxzLnB5lHVOTmgAjBBfbWFrZV9lbXB0eV9jZWxslJOUKVKUhZR0lFKUjBxjbG91ZHBpY2tsZS5jbG91ZHBpY2tsZV9mYXN0lIwSX2Z1bmN0aW9uX3NldHN0YXRllJOUaB99lH2UKGgWaA2MDF9fcXVhbG5hbWVfX5SMGWNvbnN0YW50X2ZuLjxsb2NhbHM+LmZ1bmOUjA9fX2Fubm90YXRpb25zX1+UfZSMDl9fa3dkZWZhdWx0c19flE6MDF9fZGVmYXVsdHNfX5ROjApfX21vZHVsZV9flGgXjAdfX2RvY19flE6MC19fY2xvc3VyZV9flGgAjApfbWFrZV9jZWxslJOURz8b/rquW+AohZRSlIWUjBdfY2xvdWRwaWNrbGVfc3VibW9kdWxlc5RdlIwLX19nbG9iYWxzX1+UfZR1hpSGUjAu"}, "_last_obs": {":type:": "<class 'collections.OrderedDict'>", ":serialized:": "gAWVuwEAAAAAAACMC2NvbGxlY3Rpb25zlIwLT3JkZXJlZERpY3SUk5QpUpQojA1hY2hpZXZlZF9nb2FslIwSbnVtcHkuY29yZS5udW1lcmljlIwLX2Zyb21idWZmZXKUk5QoljAAAAAAAAAAcaPMPmTN17qrahY/caPMPmTN17qrahY/caPMPmTN17qrahY/caPMPmTN17qrahY/lIwFbnVtcHmUjAVkdHlwZZSTlIwCZjSUiYiHlFKUKEsDjAE8lE5OTkr/////Sv////9LAHSUYksESwOGlIwBQ5R0lFKUjAxkZXNpcmVkX2dvYWyUaAcoljAAAAAAAAAAvyTIP9v8Kb9rfEU/SsDZP+T9oD9fmzY+ZRHZPw/suD+vkRa/7EvRv5NunL4AsAe+lGgOSwRLA4aUaBJ0lFKUjAtvYnNlcnZhdGlvbpRoByiWYAAAAAAAAABxo8w+ZM3XuqtqFj83XcI7wMU3usGSOjxxo8w+ZM3XuqtqFj83XcI7wMU3usGSOjxxo8w+ZM3XuqtqFj83XcI7wMU3usGSOjxxo8w+ZM3XuqtqFj83XcI7wMU3usGSOjyUaA5LBEsGhpRoEnSUUpR1Lg==", "achieved_goal": "[[ 0.39968446 -0.00164644 0.5875651 ]\n [ 0.39968446 -0.00164644 0.5875651 ]\n [ 0.39968446 -0.00164644 0.5875651 ]\n [ 0.39968446 -0.00164644 0.5875651 ]]", "desired_goal": "[[ 1.5636214 -0.6640145 0.7714297 ]\n [ 1.7011807 1.2577481 0.17832707]\n [ 1.6958433 1.4447039 -0.58816046]\n [-1.6351295 -0.3055311 -0.13250732]]", "observation": "[[ 0.39968446 -0.00164644 0.5875651 0.00593152 -0.00070104 0.01138753]\n [ 0.39968446 -0.00164644 0.5875651 0.00593152 -0.00070104 0.01138753]\n [ 0.39968446 -0.00164644 0.5875651 0.00593152 -0.00070104 0.01138753]\n [ 0.39968446 -0.00164644 0.5875651 0.00593152 -0.00070104 0.01138753]]"}, "_last_episode_starts": {":type:": "<class 'numpy.ndarray'>", ":serialized:": "gAWVdwAAAAAAAACMEm51bXB5LmNvcmUubnVtZXJpY5SMC19mcm9tYnVmZmVylJOUKJYEAAAAAAAAAAEBAQGUjAVudW1weZSMBWR0eXBllJOUjAJiMZSJiIeUUpQoSwOMAXyUTk5OSv////9K/////0sAdJRiSwSFlIwBQ5R0lFKULg=="}, "_last_original_obs": {":type:": "<class 'collections.OrderedDict'>", ":serialized:": "gAWVuwEAAAAAAACMC2NvbGxlY3Rpb25zlIwLT3JkZXJlZERpY3SUk5QpUpQojA1hY2hpZXZlZF9nb2FslIwSbnVtcHkuY29yZS5udW1lcmljlIwLX2Zyb21idWZmZXKUk5QoljAAAAAAAAAA6nIdPRlsGqxDI0o+6nIdPRlsGqxDI0o+6nIdPRlsGqxDI0o+6nIdPRlsGqxDI0o+lIwFbnVtcHmUjAVkdHlwZZSTlIwCZjSUiYiHlFKUKEsDjAE8lE5OTkr/////Sv////9LAHSUYksESwOGlIwBQ5R0lFKUjAxkZXNpcmVkX2dvYWyUaAcoljAAAAAAAAAARYrYveudy7x85Hg+sT+NvBKKkzyKUmM+tYl6vcolSzyWjAI+MVbYvU8KDT4wGhY9lGgOSwRLA4aUaBJ0lFKUjAtvYnNlcnZhdGlvbpRoByiWYAAAAAAAAADqch09GWwarEMjSj4AAAAAAAAAgAAAAADqch09GWwarEMjSj4AAAAAAAAAgAAAAADqch09GWwarEMjSj4AAAAAAAAAgAAAAADqch09GWwarEMjSj4AAAAAAAAAgAAAAACUaA5LBEsGhpRoEnSUUpR1Lg==", "achieved_goal": "[[ 3.8439669e-02 -2.1944723e-12 1.9740014e-01]\n [ 3.8439669e-02 -2.1944723e-12 1.9740014e-01]\n [ 3.8439669e-02 -2.1944723e-12 1.9740014e-01]\n [ 3.8439669e-02 -2.1944723e-12 1.9740014e-01]]", "desired_goal": "[[-0.10573248 -0.02485557 0.2430591 ]\n [-0.01724228 0.01801017 0.22199455]\n [-0.06116648 0.01239915 0.12748942]\n [-0.10563315 0.13773464 0.03664607]]", "observation": "[[ 3.8439669e-02 -2.1944723e-12 1.9740014e-01 0.0000000e+00\n -0.0000000e+00 0.0000000e+00]\n [ 3.8439669e-02 -2.1944723e-12 1.9740014e-01 0.0000000e+00\n -0.0000000e+00 0.0000000e+00]\n [ 3.8439669e-02 -2.1944723e-12 1.9740014e-01 0.0000000e+00\n -0.0000000e+00 0.0000000e+00]\n [ 3.8439669e-02 -2.1944723e-12 1.9740014e-01 0.0000000e+00\n -0.0000000e+00 0.0000000e+00]]"}, "_episode_num": 0, "use_sde": false, "sde_sample_freq": -1, "_current_progress_remaining": 0.0, "ep_info_buffer": {":type:": "<class 'collections.deque'>", ":serialized:": "gAWVHRAAAAAAAACMC2NvbGxlY3Rpb25zlIwFZGVxdWWUk5QpS2SGlFKUKH2UKIwBcpSMFW51bXB5LmNvcmUubXVsdGlhcnJheZSMBnNjYWxhcpSTlIwFbnVtcHmUjAVkdHlwZZSTlIwCZjiUiYiHlFKUKEsDjAE8lE5OTkr/////Sv////9LAHSUYkMIke18PzV+DMCUhpRSlIwBbJRLMowBdJRHQLAk4jtG/et1fZQoaAZoCWgPQwjU8ZiByngOwJSGlFKUaBVLMmgWR0CwI+Uiliz+dX2UKGgGaAloD0MIgCctXFYBCsCUhpRSlGgVSzJoFkdAsCL6p++dsnV9lChoBmgJaA9DCEbu6eqOBQ3AlIaUUpRoFUsyaBZHQLAh3OwgTyt1fZQoaAZoCWgPQwjRzf5AuW0RwJSGlFKUaBVLMmgWR0CwJWFUp/gBdX2UKGgGaAloD0MIyTocXaUbF8CUhpRSlGgVSzJoFkdAsCRkOuq3mXV9lChoBmgJaA9DCKuzWmCPKQ3AlIaUUpRoFUsyaBZHQLAjeb6guh91fZQoaAZoCWgPQwgGRl7WxHITwJSGlFKUaBVLMmgWR0CwIlv69CeFdX2UKGgGaAloD0MI6ITQQZcwEMCUhpRSlGgVSzJoFkdAsCXfVawD/3V9lChoBmgJaA9DCOLkfoeiwAnAlIaUUpRoFUsyaBZHQLAk4ixVyWB1fZQoaAZoCWgPQwgGEhQ/xpwNwJSGlFKUaBVLMmgWR0CwI/fIfbKzdX2UKGgGaAloD0MIlExO7QzjEcCUhpRSlGgVSzJoFkdAsCLaA2AG0XV9lChoBmgJaA9DCM8sCVBTSxvAlIaUUpRoFUsyaBZHQLAmXbQ1JlJ1fZQoaAZoCWgPQwgZjuczoE4RwJSGlFKUaBVLMmgWR0CwJWCJ9AoodX2UKGgGaAloD0MIp11MM93rDsCUhpRSlGgVSzJoFkdAsCR2HXVbzXV9lChoBmgJaA9DCC6rsBngohfAlIaUUpRoFUsyaBZHQLAjWFSsKb91fZQoaAZoCWgPQwijdOlfkroXwJSGlFKUaBVLMmgWR0CwJthX4j8ldX2UKGgGaAloD0MIqaJ4lbV9EMCUhpRSlGgVSzJoFkdAsCXbL8rI53V9lChoBmgJaA9DCNek2xK5MBLAlIaUUpRoFUsyaBZHQLAk8Lgn+hp1fZQoaAZoCWgPQwi++Q0TDUIQwJSGlFKUaBVLMmgWR0CwI9L0WdmQdX2UKGgGaAloD0MI86ykFd/QEsCUhpRSlGgVSzJoFkdAsCdhAWzninV9lChoBmgJaA9DCEyln3B2SxnAlIaUUpRoFUsyaBZHQLAmY9rGipN1fZQoaAZoCWgPQwhoz2VqEjwJwJSGlFKUaBVLMmgWR0CwJXldX1aodX2UKGgGaAloD0MIHjLlQ1BVE8CUhpRSlGgVSzJoFkdAsCRbnMdLhHV9lChoBmgJaA9DCNXQBmADUhbAlIaUUpRoFUsyaBZHQLAn266reZZ1fZQoaAZoCWgPQwh1djI4Sv4TwJSGlFKUaBVLMmgWR0CwJt6KxcFAdX2UKGgGaAloD0MIjbeVXpvtCcCUhpRSlGgVSzJoFkdAsCX0IsyzonV9lChoBmgJaA9DCO6wicxcwAXAlIaUUpRoFUsyaBZHQLAk1mMOwxF1fZQoaAZoCWgPQwjE0OrkDMULwJSGlFKUaBVLMmgWR0CwKGKS1Vo6dX2UKGgGaAloD0MIV7JjIxB/FMCUhpRSlGgVSzJoFkdAsCdlaePJaXV9lChoBmgJaA9DCGFUUiegmRrAlIaUUpRoFUsyaBZHQLAmeuctoSN1fZQoaAZoCWgPQwjkDwaee+8JwJSGlFKUaBVLMmgWR0CwJV0pqh11dX2UKGgGaAloD0MI7bsi+N8KBcCUhpRSlGgVSzJoFkdAsCje2c8Tz3V9lChoBmgJaA9DCCGRtvEnygnAlIaUUpRoFUsyaBZHQLAn4bYK6Wh1fZQoaAZoCWgPQwh/hcyVQdUGwJSGlFKUaBVLMmgWR0CwJvc+V1OkdX2UKGgGaAloD0MIRrJHqBkyC8CUhpRSlGgVSzJoFkdAsCXZkRSP2nV9lChoBmgJaA9DCHv3x3vVigzAlIaUUpRoFUsyaBZHQLApWz3AVO91fZQoaAZoCWgPQwgQlNv2PVoTwJSGlFKUaBVLMmgWR0CwKF4O6NEPdX2UKGgGaAloD0MIaww6IXQwB8CUhpRSlGgVSzJoFkdAsCdzrNW2gHV9lChoBmgJaA9DCBL6mXrdchPAlIaUUpRoFUsyaBZHQLAmVe67NB51fZQoaAZoCWgPQwhDyHn/HycIwJSGlFKUaBVLMmgWR0CwKdd8VpK0dX2UKGgGaAloD0MI2ZdsPNhCCsCUhpRSlGgVSzJoFkdAsCjaTHKfWnV9lChoBmgJaA9DCIcx6e+lsBDAlIaUUpRoFUsyaBZHQLAn78hs67x1fZQoaAZoCWgPQwjFdCFWf8QWwJSGlFKUaBVLMmgWR0CwJtIJiRW+dX2UKGgGaAloD0MIXFg33h35DcCUhpRSlGgVSzJoFkdAsCpmRxLkCHV9lChoBmgJaA9DCMgjuJGydRXAlIaUUpRoFUsyaBZHQLApaT4+KTB1fZQoaAZoCWgPQwhbfXVVoHYZwJSGlFKUaBVLMmgWR0CwKH7KFIuodX2UKGgGaAloD0MIbSBdbFpJC8CUhpRSlGgVSzJoFkdAsCdhDArQPnV9lChoBmgJaA9DCBqLprOTIRHAlIaUUpRoFUsyaBZHQLAq5No8IRh1fZQoaAZoCWgPQwiYMnBAS9cIwJSGlFKUaBVLMmgWR0CwKeeu/1xsdX2UKGgGaAloD0MIRn79EBt8EcCUhpRSlGgVSzJoFkdAsCj9N/OMVHV9lChoBmgJaA9DCBCtFW2OgxLAlIaUUpRoFUsyaBZHQLAn332mHgx1fZQoaAZoCWgPQwgBwocSLbkOwJSGlFKUaBVLMmgWR0CwK2HbmEGrdX2UKGgGaAloD0MIArfu5qlOFsCUhpRSlGgVSzJoFkdAsCpkrWiDd3V9lChoBmgJaA9DCD60jxX8hhbAlIaUUpRoFUsyaBZHQLApeigkC3h1fZQoaAZoCWgPQwhdv2A3bGsSwJSGlFKUaBVLMmgWR0CwKFxy8zyjdX2UKGgGaAloD0MIm1d1VgtMDsCUhpRSlGgVSzJoFkdAsCveYrrgO3V9lChoBmgJaA9DCAkbnl4pGxXAlIaUUpRoFUsyaBZHQLAq4T6zmfZ1fZQoaAZoCWgPQwiBI4EGm3oSwJSGlFKUaBVLMmgWR0CwKfa0D2aldX2UKGgGaAloD0MI7UW0HVO3BMCUhpRSlGgVSzJoFkdAsCjY8QqZt3V9lChoBmgJaA9DCNszSwLUtBHAlIaUUpRoFUsyaBZHQLAsWPS2H+J1fZQoaAZoCWgPQwiPpQ9dUN8OwJSGlFKUaBVLMmgWR0CwK1vJA+pwdX2UKGgGaAloD0MIP8dHizOGD8CUhpRSlGgVSzJoFkdAsCpxRMvh63V9lChoBmgJaA9DCMr6zcR0IQ3AlIaUUpRoFUsyaBZHQLApU4Pf8/F1fZQoaAZoCWgPQwgCYhIu5HEIwJSGlFKUaBVLMmgWR0CwLNr39JjEdX2UKGgGaAloD0MIHAdeLXcmCsCUhpRSlGgVSzJoFkdAsCvd4RmK7HV9lChoBmgJaA9DCHUCmggbDhLAlIaUUpRoFUsyaBZHQLAq811GLDR1fZQoaAZoCWgPQwhbecn/5C8JwJSGlFKUaBVLMmgWR0CwKdWyTpxFdX2UKGgGaAloD0MIiLzl6semCcCUhpRSlGgVSzJoFkdAsC1S1YyO73V9lChoBmgJaA9DCFyTbkvkAhLAlIaUUpRoFUsyaBZHQLAsVaXa8Hx1fZQoaAZoCWgPQwhLcyuE1YgRwJSGlFKUaBVLMmgWR0CwK2sjAzpHdX2UKGgGaAloD0MIw0Xu6epuDcCUhpRSlGgVSzJoFkdAsCpNZEDyOXV9lChoBmgJaA9DCPvqqkAtRhPAlIaUUpRoFUsyaBZHQLAt0Fkxyn11fZQoaAZoCWgPQwi1UZ0OZN0OwJSGlFKUaBVLMmgWR0CwLNMoc7yQdX2UKGgGaAloD0MI7rWg98awDMCUhpRSlGgVSzJoFkdAsCvoqMFUynV9lChoBmgJaA9DCEiHhzB++gXAlIaUUpRoFUsyaBZHQLAqyuh9LHx1fZQoaAZoCWgPQwhG7X4V4OsRwJSGlFKUaBVLMmgWR0CwLkutOmBOdX2UKGgGaAloD0MITU2CN6RxDcCUhpRSlGgVSzJoFkdAsC1OfRNRFnV9lChoBmgJaA9DCEimQ6fnjRXAlIaUUpRoFUsyaBZHQLAsY/wy6+Z1fZQoaAZoCWgPQwg+6Nms+rwMwJSGlFKUaBVLMmgWR0CwK0Y8U21ldX2UKGgGaAloD0MImpfD7jtmCcCUhpRSlGgVSzJoFkdAsC7KsRxtHnV9lChoBmgJaA9DCIeIm1PJgAvAlIaUUpRoFUsyaBZHQLAtzYpUgjh1fZQoaAZoCWgPQwhgIt46/7YJwJSGlFKUaBVLMmgWR0CwLOMGs3hodX2UKGgGaAloD0MITrNAu0MqCsCUhpRSlGgVSzJoFkdAsCvFP0qYq3V9lChoBmgJaA9DCO2BVmDIqhHAlIaUUpRoFUsyaBZHQLAvRhxo7FN1fZQoaAZoCWgPQwi1M0xtqcMOwJSGlFKUaBVLMmgWR0CwLkkDlo12dX2UKGgGaAloD0MIAcPy59vCEMCUhpRSlGgVSzJoFkdAsC1ef16E8XV9lChoBmgJaA9DCMOcoE0Ofw3AlIaUUpRoFUsyaBZHQLAsQNUwSJ11fZQoaAZoCWgPQwhNnx1wXdELwJSGlFKUaBVLMmgWR0CwL8LLdN34dX2UKGgGaAloD0MIiPNwAtMJHsCUhpRSlGgVSzJoFkdAsC7FpYcNpnV9lChoBmgJaA9DCIP4wI7/4gPAlIaUUpRoFUsyaBZHQLAt2zEaVD91fZQoaAZoCWgPQwit30xMF0IdwJSGlFKUaBVLMmgWR0CwLL2KuSwGdX2UKGgGaAloD0MIrVEP0ehuDsCUhpRSlGgVSzJoFkdAsDBBTn7pFHV9lChoBmgJaA9DCGrC9pMxBiDAlIaUUpRoFUsyaBZHQLAvRCMPz4F1fZQoaAZoCWgPQwhoQpPEkgITwJSGlFKUaBVLMmgWR0CwLlm3KB/adX2UKGgGaAloD0MIuk24V+atDsCUhpRSlGgVSzJoFkdAsC07/T9bYHV9lChoBmgJaA9DCMUe2scKPg/AlIaUUpRoFUsyaBZHQLAwwuVHFxZ1fZQoaAZoCWgPQwhkzjP2JdsOwJSGlFKUaBVLMmgWR0CwL8Wz0HyFdX2UKGgGaAloD0MILudSXFWWCsCUhpRSlGgVSzJoFkdAsC7bYRNAT3V9lChoBmgJaA9DCIgq/BnebArAlIaUUpRoFUsyaBZHQLAtveGwiaB1ZS4="}, "ep_success_buffer": {":type:": "<class 'collections.deque'>", ":serialized:": "gAWVIAAAAAAAAACMC2NvbGxlY3Rpb25zlIwFZGVxdWWUk5QpS2SGlFKULg=="}, "_n_updates": 37500, "n_steps": 10, "gamma": 0.9005397464660235, "gae_lambda": 0.8043567334308052, "ent_coef": 0.0654376522770753, "vf_coef": 0.3415400217360765, "max_grad_norm": 0.472916136764715, "normalize_advantage": false, "system_info": {"OS": "Linux-5.10.16.3-microsoft-standard-WSL2-x86_64-with-glibc2.31 # 1 SMP Fri Apr 2 22:23:49 UTC 2021", "Python": "3.9.16", "Stable-Baselines3": "1.7.0", "PyTorch": "1.13.1+cu117", "GPU Enabled": "True", "Numpy": "1.24.2", "Gym": "0.21.0"}}
|
replay.mp4
CHANGED
|
Binary files a/replay.mp4 and b/replay.mp4 differ
|
|
|
results.json
CHANGED
|
@@ -1 +1 @@
|
|
| 1 |
-
{"mean_reward": -
|
|
|
|
| 1 |
+
{"mean_reward": -2.0801983545999976, "std_reward": 0.33162997076077927, "is_deterministic": true, "n_eval_episodes": 10, "eval_datetime": "2023-02-26T23:29:42.176945"}
|
vec_normalize.pkl
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 3056
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:fb5f6d5a9c66e3419b8fd1ee03768b09e0f1891ba33244869cbc6f9f2a50c449
|
| 3 |
size 3056
|