Initial commit
Browse files- README.md +1 -1
- a2c-PandaReachDense-v2.zip +2 -2
- a2c-PandaReachDense-v2/data +19 -19
- a2c-PandaReachDense-v2/policy.optimizer.pth +1 -1
- a2c-PandaReachDense-v2/policy.pth +1 -1
- config.json +1 -1
- replay.mp4 +0 -0
- results.json +1 -1
- vec_normalize.pkl +1 -1
README.md
CHANGED
|
@@ -16,7 +16,7 @@ model-index:
|
|
| 16 |
type: PandaReachDense-v2
|
| 17 |
metrics:
|
| 18 |
- type: mean_reward
|
| 19 |
-
value: -1.
|
| 20 |
name: mean_reward
|
| 21 |
verified: false
|
| 22 |
---
|
|
|
|
| 16 |
type: PandaReachDense-v2
|
| 17 |
metrics:
|
| 18 |
- type: mean_reward
|
| 19 |
+
value: -1.39 +/- 0.23
|
| 20 |
name: mean_reward
|
| 21 |
verified: false
|
| 22 |
---
|
a2c-PandaReachDense-v2.zip
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
-
size
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:de68a4be76b0ee109082f3d9389342d258ceaecb7435005d872e157f48d4294d
|
| 3 |
+
size 108198
|
a2c-PandaReachDense-v2/data
CHANGED
|
@@ -4,9 +4,9 @@
|
|
| 4 |
":serialized:": "gAWVRQAAAAAAAACMIXN0YWJsZV9iYXNlbGluZXMzLmNvbW1vbi5wb2xpY2llc5SMG011bHRpSW5wdXRBY3RvckNyaXRpY1BvbGljeZSTlC4=",
|
| 5 |
"__module__": "stable_baselines3.common.policies",
|
| 6 |
"__doc__": "\n MultiInputActorClass policy class for actor-critic algorithms (has both policy and value prediction).\n Used by A2C, PPO and the likes.\n\n :param observation_space: Observation space (Tuple)\n :param action_space: Action space\n :param lr_schedule: Learning rate schedule (could be constant)\n :param net_arch: The specification of the policy and value networks.\n :param activation_fn: Activation function\n :param ortho_init: Whether to use or not orthogonal initialization\n :param use_sde: Whether to use State Dependent Exploration or not\n :param log_std_init: Initial value for the log standard deviation\n :param full_std: Whether to use (n_features x n_actions) parameters\n for the std instead of only (n_features,) when using gSDE\n :param use_expln: Use ``expln()`` function instead of ``exp()`` to ensure\n a positive standard deviation (cf paper). It allows to keep variance\n above zero and prevent it from growing too fast. In practice, ``exp()`` is usually enough.\n :param squash_output: Whether to squash the output using a tanh function,\n this allows to ensure boundaries when using gSDE.\n :param features_extractor_class: Uses the CombinedExtractor\n :param features_extractor_kwargs: Keyword arguments\n to pass to the features extractor.\n :param share_features_extractor: If True, the features extractor is shared between the policy and value networks.\n :param normalize_images: Whether to normalize images or not,\n dividing by 255.0 (True by default)\n :param optimizer_class: The optimizer to use,\n ``th.optim.Adam`` by default\n :param optimizer_kwargs: Additional keyword arguments,\n excluding the learning rate, to pass to the optimizer\n ",
|
| 7 |
-
"__init__": "<function MultiInputActorCriticPolicy.__init__ at
|
| 8 |
"__abstractmethods__": "frozenset()",
|
| 9 |
-
"_abc_impl": "<_abc._abc_data object at
|
| 10 |
},
|
| 11 |
"verbose": 1,
|
| 12 |
"policy_kwargs": {
|
|
@@ -41,53 +41,53 @@
|
|
| 41 |
"_np_random": null
|
| 42 |
},
|
| 43 |
"n_envs": 4,
|
| 44 |
-
"num_timesteps":
|
| 45 |
"_total_timesteps": 1000000,
|
| 46 |
"_num_timesteps_at_start": 0,
|
| 47 |
"seed": null,
|
| 48 |
"action_noise": null,
|
| 49 |
-
"start_time":
|
| 50 |
-
"learning_rate": 0.
|
| 51 |
"tensorboard_log": null,
|
| 52 |
"lr_schedule": {
|
| 53 |
":type:": "<class 'function'>",
|
| 54 |
-
":serialized:": "gAWVAQMAAAAAAACMF2Nsb3VkcGlja2xlLmNsb3VkcGlja2xllIwOX21ha2VfZnVuY3Rpb26Uk5QoaACMDV9idWlsdGluX3R5cGWUk5SMCENvZGVUeXBllIWUUpQoSwFLAEsASwFLAUsTQwSIAFMAlE6FlCmMAV+UhZSMZy9ob21lL3UvbWluaWNvbmRhMy9lbnZzL2h1Z2dpbmdmYWNlLXVuaXQ2L2xpYi9weXRob24zLjkvc2l0ZS1wYWNrYWdlcy9zdGFibGVfYmFzZWxpbmVzMy9jb21tb24vdXRpbHMucHmUjARmdW5jlEuCQwIAAZSMA3ZhbJSFlCl0lFKUfZQojAtfX3BhY2thZ2VfX5SMGHN0YWJsZV9iYXNlbGluZXMzLmNvbW1vbpSMCF9fbmFtZV9flIwec3RhYmxlX2Jhc2VsaW5lczMuY29tbW9uLnV0aWxzlIwIX19maWxlX1+UjGcvaG9tZS91L21pbmljb25kYTMvZW52cy9odWdnaW5nZmFjZS11bml0Ni9saWIvcHl0aG9uMy45L3NpdGUtcGFja2FnZXMvc3RhYmxlX2Jhc2VsaW5lczMvY29tbW9uL3V0aWxzLnB5lHVOTmgAjBBfbWFrZV9lbXB0eV9jZWxslJOUKVKUhZR0lFKUjBxjbG91ZHBpY2tsZS5jbG91ZHBpY2tsZV9mYXN0lIwSX2Z1bmN0aW9uX3NldHN0YXRllJOUaB99lH2UKGgWaA2MDF9fcXVhbG5hbWVfX5SMGWNvbnN0YW50X2ZuLjxsb2NhbHM+LmZ1bmOUjA9fX2Fubm90YXRpb25zX1+
|
| 55 |
},
|
| 56 |
"_last_obs": {
|
| 57 |
":type:": "<class 'collections.OrderedDict'>",
|
| 58 |
-
":serialized:": "
|
| 59 |
-
"achieved_goal": "[[0.
|
| 60 |
-
"desired_goal": "[[
|
| 61 |
-
"observation": "[[
|
| 62 |
},
|
| 63 |
"_last_episode_starts": {
|
| 64 |
":type:": "<class 'numpy.ndarray'>",
|
| 65 |
-
":serialized:": "
|
| 66 |
},
|
| 67 |
"_last_original_obs": {
|
| 68 |
":type:": "<class 'collections.OrderedDict'>",
|
| 69 |
-
":serialized:": "gAWVuwEAAAAAAACMC2NvbGxlY3Rpb25zlIwLT3JkZXJlZERpY3SUk5QpUpQojA1hY2hpZXZlZF9nb2FslIwSbnVtcHkuY29yZS5udW1lcmljlIwLX2Zyb21idWZmZXKUk5QoljAAAAAAAAAA6nIdPRlsGqxDI0o+6nIdPRlsGqxDI0o+6nIdPRlsGqxDI0o+6nIdPRlsGqxDI0o+lIwFbnVtcHmUjAVkdHlwZZSTlIwCZjSUiYiHlFKUKEsDjAE8lE5OTkr/////Sv////
|
| 70 |
"achieved_goal": "[[ 3.8439669e-02 -2.1944723e-12 1.9740014e-01]\n [ 3.8439669e-02 -2.1944723e-12 1.9740014e-01]\n [ 3.8439669e-02 -2.1944723e-12 1.9740014e-01]\n [ 3.8439669e-02 -2.1944723e-12 1.9740014e-01]]",
|
| 71 |
-
"desired_goal": "[[ 0.
|
| 72 |
"observation": "[[ 3.8439669e-02 -2.1944723e-12 1.9740014e-01 0.0000000e+00\n -0.0000000e+00 0.0000000e+00]\n [ 3.8439669e-02 -2.1944723e-12 1.9740014e-01 0.0000000e+00\n -0.0000000e+00 0.0000000e+00]\n [ 3.8439669e-02 -2.1944723e-12 1.9740014e-01 0.0000000e+00\n -0.0000000e+00 0.0000000e+00]\n [ 3.8439669e-02 -2.1944723e-12 1.9740014e-01 0.0000000e+00\n -0.0000000e+00 0.0000000e+00]]"
|
| 73 |
},
|
| 74 |
"_episode_num": 0,
|
| 75 |
"use_sde": false,
|
| 76 |
"sde_sample_freq": -1,
|
| 77 |
-
"_current_progress_remaining": 0.
|
| 78 |
"ep_info_buffer": {
|
| 79 |
":type:": "<class 'collections.deque'>",
|
| 80 |
-
":serialized:": "gAWVHRAAAAAAAACMC2NvbGxlY3Rpb25zlIwFZGVxdWWUk5QpS2SGlFKUKH2UKIwBcpSMFW51bXB5LmNvcmUubXVsdGlhcnJheZSMBnNjYWxhcpSTlIwFbnVtcHmUjAVkdHlwZZSTlIwCZjiUiYiHlFKUKEsDjAE8lE5OTkr/////Sv////
|
| 81 |
},
|
| 82 |
"ep_success_buffer": {
|
| 83 |
":type:": "<class 'collections.deque'>",
|
| 84 |
":serialized:": "gAWVIAAAAAAAAACMC2NvbGxlY3Rpb25zlIwFZGVxdWWUk5QpS2SGlFKULg=="
|
| 85 |
},
|
| 86 |
-
"_n_updates":
|
| 87 |
-
"n_steps":
|
| 88 |
-
"gamma": 0.
|
| 89 |
"gae_lambda": 1.0,
|
| 90 |
-
"ent_coef": 0.
|
| 91 |
"vf_coef": 0.5,
|
| 92 |
"max_grad_norm": 0.5,
|
| 93 |
"normalize_advantage": false
|
|
|
|
| 4 |
":serialized:": "gAWVRQAAAAAAAACMIXN0YWJsZV9iYXNlbGluZXMzLmNvbW1vbi5wb2xpY2llc5SMG011bHRpSW5wdXRBY3RvckNyaXRpY1BvbGljeZSTlC4=",
|
| 5 |
"__module__": "stable_baselines3.common.policies",
|
| 6 |
"__doc__": "\n MultiInputActorClass policy class for actor-critic algorithms (has both policy and value prediction).\n Used by A2C, PPO and the likes.\n\n :param observation_space: Observation space (Tuple)\n :param action_space: Action space\n :param lr_schedule: Learning rate schedule (could be constant)\n :param net_arch: The specification of the policy and value networks.\n :param activation_fn: Activation function\n :param ortho_init: Whether to use or not orthogonal initialization\n :param use_sde: Whether to use State Dependent Exploration or not\n :param log_std_init: Initial value for the log standard deviation\n :param full_std: Whether to use (n_features x n_actions) parameters\n for the std instead of only (n_features,) when using gSDE\n :param use_expln: Use ``expln()`` function instead of ``exp()`` to ensure\n a positive standard deviation (cf paper). It allows to keep variance\n above zero and prevent it from growing too fast. In practice, ``exp()`` is usually enough.\n :param squash_output: Whether to squash the output using a tanh function,\n this allows to ensure boundaries when using gSDE.\n :param features_extractor_class: Uses the CombinedExtractor\n :param features_extractor_kwargs: Keyword arguments\n to pass to the features extractor.\n :param share_features_extractor: If True, the features extractor is shared between the policy and value networks.\n :param normalize_images: Whether to normalize images or not,\n dividing by 255.0 (True by default)\n :param optimizer_class: The optimizer to use,\n ``th.optim.Adam`` by default\n :param optimizer_kwargs: Additional keyword arguments,\n excluding the learning rate, to pass to the optimizer\n ",
|
| 7 |
+
"__init__": "<function MultiInputActorCriticPolicy.__init__ at 0x7fb0446b6f70>",
|
| 8 |
"__abstractmethods__": "frozenset()",
|
| 9 |
+
"_abc_impl": "<_abc._abc_data object at 0x7fb0446b5e80>"
|
| 10 |
},
|
| 11 |
"verbose": 1,
|
| 12 |
"policy_kwargs": {
|
|
|
|
| 41 |
"_np_random": null
|
| 42 |
},
|
| 43 |
"n_envs": 4,
|
| 44 |
+
"num_timesteps": 1001472,
|
| 45 |
"_total_timesteps": 1000000,
|
| 46 |
"_num_timesteps_at_start": 0,
|
| 47 |
"seed": null,
|
| 48 |
"action_noise": null,
|
| 49 |
+
"start_time": 1680377738771037922,
|
| 50 |
+
"learning_rate": 0.0014735441345589378,
|
| 51 |
"tensorboard_log": null,
|
| 52 |
"lr_schedule": {
|
| 53 |
":type:": "<class 'function'>",
|
| 54 |
+
":serialized:": "gAWVAQMAAAAAAACMF2Nsb3VkcGlja2xlLmNsb3VkcGlja2xllIwOX21ha2VfZnVuY3Rpb26Uk5QoaACMDV9idWlsdGluX3R5cGWUk5SMCENvZGVUeXBllIWUUpQoSwFLAEsASwFLAUsTQwSIAFMAlE6FlCmMAV+UhZSMZy9ob21lL3UvbWluaWNvbmRhMy9lbnZzL2h1Z2dpbmdmYWNlLXVuaXQ2L2xpYi9weXRob24zLjkvc2l0ZS1wYWNrYWdlcy9zdGFibGVfYmFzZWxpbmVzMy9jb21tb24vdXRpbHMucHmUjARmdW5jlEuCQwIAAZSMA3ZhbJSFlCl0lFKUfZQojAtfX3BhY2thZ2VfX5SMGHN0YWJsZV9iYXNlbGluZXMzLmNvbW1vbpSMCF9fbmFtZV9flIwec3RhYmxlX2Jhc2VsaW5lczMuY29tbW9uLnV0aWxzlIwIX19maWxlX1+UjGcvaG9tZS91L21pbmljb25kYTMvZW52cy9odWdnaW5nZmFjZS11bml0Ni9saWIvcHl0aG9uMy45L3NpdGUtcGFja2FnZXMvc3RhYmxlX2Jhc2VsaW5lczMvY29tbW9uL3V0aWxzLnB5lHVOTmgAjBBfbWFrZV9lbXB0eV9jZWxslJOUKVKUhZR0lFKUjBxjbG91ZHBpY2tsZS5jbG91ZHBpY2tsZV9mYXN0lIwSX2Z1bmN0aW9uX3NldHN0YXRllJOUaB99lH2UKGgWaA2MDF9fcXVhbG5hbWVfX5SMGWNvbnN0YW50X2ZuLjxsb2NhbHM+LmZ1bmOUjA9fX2Fubm90YXRpb25zX1+UfZSMDl9fa3dkZWZhdWx0c19flE6MDF9fZGVmYXVsdHNfX5ROjApfX21vZHVsZV9flGgXjAdfX2RvY19flE6MC19fY2xvc3VyZV9flGgAjApfbWFrZV9jZWxslJOURz9YJH33f0ZzhZRSlIWUjBdfY2xvdWRwaWNrbGVfc3VibW9kdWxlc5RdlIwLX19nbG9iYWxzX1+UfZR1hpSGUjAu"
|
| 55 |
},
|
| 56 |
"_last_obs": {
|
| 57 |
":type:": "<class 'collections.OrderedDict'>",
|
| 58 |
+
":serialized:": "gAWVuwEAAAAAAACMC2NvbGxlY3Rpb25zlIwLT3JkZXJlZERpY3SUk5QpUpQojA1hY2hpZXZlZF9nb2FslIwSbnVtcHkuY29yZS5udW1lcmljlIwLX2Zyb21idWZmZXKUk5QoljAAAAAAAAAA7/yPP5jVfb9HWig/HxRmP634zr9Hv2W//rTXP+kC3T767KW/doHHP+sxZb58/cw/lIwFbnVtcHmUjAVkdHlwZZSTlIwCZjSUiYiHlFKUKEsDjAE8lE5OTkr/////Sv////9LAHSUYksESwOGlIwBQ5R0lFKUjAxkZXNpcmVkX2dvYWyUaAcoljAAAAAAAAAABuaWP78aYb+JyR4/fpuFP5vvub9NOpy/s4LDP4o9tD5tDcK/2ciuP5+jsb5Ab9Y/lGgOSwRLA4aUaBJ0lFKUjAtvYnNlcnZhdGlvbpRoByiWYAAAAAAAAADv/I8/mNV9v0daKD8tfjq/ciuFvoj0w78fFGY/rfjOv0e/Zb8i8YC+zl1RPdQLE7/+tNc/6QLdPvrspb88gdg+R+c9PxUpez92gcc/6zFlvnz9zD8sj++8dqc0vxgeHz+UaA5LBEsGhpRoEnSUUpR1Lg==",
|
| 59 |
+
"achieved_goal": "[[ 1.1249064 -0.99154043 0.6576275 ]\n [ 0.8987445 -1.616964 -0.8974499 ]\n [ 1.685211 0.43166283 -1.2962945 ]\n [ 1.5586383 -0.22382323 1.6014857 ]]",
|
| 60 |
+
"desired_goal": "[[ 1.1788948 -0.87931436 0.6202627 ]\n [ 1.0438077 -1.4526247 -1.2205292 ]\n [ 1.5274261 0.352032 -1.5160347 ]\n [ 1.3655044 -0.34695145 1.6752701 ]]",
|
| 61 |
+
"observation": "[[ 1.1249064 -0.99154043 0.6576275 -0.7284878 -0.2600971 -1.5309 ]\n [ 0.8987445 -1.616964 -0.8974499 -0.2518397 0.05111485 -0.57439923]\n [ 1.685211 0.43166283 -1.2962945 0.42286098 0.74181026 0.9810956 ]\n [ 1.5586383 -0.22382323 1.6014857 -0.02924307 -0.70568025 0.62155294]]"
|
| 62 |
},
|
| 63 |
"_last_episode_starts": {
|
| 64 |
":type:": "<class 'numpy.ndarray'>",
|
| 65 |
+
":serialized:": "gAWVdwAAAAAAAACMEm51bXB5LmNvcmUubnVtZXJpY5SMC19mcm9tYnVmZmVylJOUKJYEAAAAAAAAAAAAAACUjAVudW1weZSMBWR0eXBllJOUjAJiMZSJiIeUUpQoSwOMAXyUTk5OSv////9K/////0sAdJRiSwSFlIwBQ5R0lFKULg=="
|
| 66 |
},
|
| 67 |
"_last_original_obs": {
|
| 68 |
":type:": "<class 'collections.OrderedDict'>",
|
| 69 |
+
":serialized:": "gAWVuwEAAAAAAACMC2NvbGxlY3Rpb25zlIwLT3JkZXJlZERpY3SUk5QpUpQojA1hY2hpZXZlZF9nb2FslIwSbnVtcHkuY29yZS5udW1lcmljlIwLX2Zyb21idWZmZXKUk5QoljAAAAAAAAAA6nIdPRlsGqxDI0o+6nIdPRlsGqxDI0o+6nIdPRlsGqxDI0o+6nIdPRlsGqxDI0o+lIwFbnVtcHmUjAVkdHlwZZSTlIwCZjSUiYiHlFKUKEsDjAE8lE5OTkr/////Sv////9LAHSUYksESwOGlIwBQ5R0lFKUjAxkZXNpcmVkX2dvYWyUaAcoljAAAAAAAAAAbiURPmePFb7Mst87sEALvj8BCr1jG8U8yXLQPZkLgb1fexI9bBv/PUu2E777TxE+lGgOSwRLA4aUaBJ0lFKUjAtvYnNlcnZhdGlvbpRoByiWYAAAAAAAAADqch09GWwarEMjSj4AAAAAAAAAgAAAAADqch09GWwarEMjSj4AAAAAAAAAgAAAAADqch09GWwarEMjSj4AAAAAAAAAgAAAAADqch09GWwarEMjSj4AAAAAAAAAgAAAAACUaA5LBEsGhpRoEnSUUpR1Lg==",
|
| 70 |
"achieved_goal": "[[ 3.8439669e-02 -2.1944723e-12 1.9740014e-01]\n [ 3.8439669e-02 -2.1944723e-12 1.9740014e-01]\n [ 3.8439669e-02 -2.1944723e-12 1.9740014e-01]\n [ 3.8439669e-02 -2.1944723e-12 1.9740014e-01]]",
|
| 71 |
+
"desired_goal": "[[ 0.14174435 -0.14605485 0.00682673]\n [-0.13598895 -0.03369259 0.02406091]\n [ 0.10178144 -0.0630104 0.03576219]\n [ 0.12456402 -0.14425008 0.14190666]]",
|
| 72 |
"observation": "[[ 3.8439669e-02 -2.1944723e-12 1.9740014e-01 0.0000000e+00\n -0.0000000e+00 0.0000000e+00]\n [ 3.8439669e-02 -2.1944723e-12 1.9740014e-01 0.0000000e+00\n -0.0000000e+00 0.0000000e+00]\n [ 3.8439669e-02 -2.1944723e-12 1.9740014e-01 0.0000000e+00\n -0.0000000e+00 0.0000000e+00]\n [ 3.8439669e-02 -2.1944723e-12 1.9740014e-01 0.0000000e+00\n -0.0000000e+00 0.0000000e+00]]"
|
| 73 |
},
|
| 74 |
"_episode_num": 0,
|
| 75 |
"use_sde": false,
|
| 76 |
"sde_sample_freq": -1,
|
| 77 |
+
"_current_progress_remaining": -0.0014719999999999178,
|
| 78 |
"ep_info_buffer": {
|
| 79 |
":type:": "<class 'collections.deque'>",
|
| 80 |
+
":serialized:": "gAWVHRAAAAAAAACMC2NvbGxlY3Rpb25zlIwFZGVxdWWUk5QpS2SGlFKUKH2UKIwBcpSMFW51bXB5LmNvcmUubXVsdGlhcnJheZSMBnNjYWxhcpSTlIwFbnVtcHmUjAVkdHlwZZSTlIwCZjiUiYiHlFKUKEsDjAE8lE5OTkr/////Sv////9LAHSUYkMI6+V3msw48b+UhpRSlIwBbJRLMowBdJRHQJcZN2St/4J1fZQoaAZoCWgPQwi8z/HR4oz4v5SGlFKUaBVLMmgWR0CXGOj7ALy+dX2UKGgGaAloD0MIOIO/X8wW+7+UhpRSlGgVSzJoFkdAlxipnlGPP3V9lChoBmgJaA9DCPUTzm4tk/i/lIaUUpRoFUsyaBZHQJcYUOby6MB1fZQoaAZoCWgPQwilhGBVvTz+v5SGlFKUaBVLMmgWR0CXGmajN6gNdX2UKGgGaAloD0MI/dmPFJGh9r+UhpRSlGgVSzJoFkdAlxoYXbdrPHV9lChoBmgJaA9DCO4E+69zk/2/lIaUUpRoFUsyaBZHQJcZ2TA31jB1fZQoaAZoCWgPQwhjmuleJzX4v5SGlFKUaBVLMmgWR0CXGYBC2MKkdX2UKGgGaAloD0MIlE4kmGom+r+UhpRSlGgVSzJoFkdAlxuTLwF1S3V9lChoBmgJaA9DCM3lBkMdFvi/lIaUUpRoFUsyaBZHQJcbRMdtEXt1fZQoaAZoCWgPQwiKWS+GciL+v5SGlFKUaBVLMmgWR0CXGwVhCtzTdX2UKGgGaAloD0MIPSr+74iK9b+UhpRSlGgVSzJoFkdAlxqschkiEHV9lChoBmgJaA9DCPgW1o13h/W/lIaUUpRoFUsyaBZHQJccueDnNgV1fZQoaAZoCWgPQwib5h2n6Ej1v5SGlFKUaBVLMmgWR0CXHGvaURnOdX2UKGgGaAloD0MIrdwLzArF+7+UhpRSlGgVSzJoFkdAlxwsl5WzW3V9lChoBmgJaA9DCNP6WwLwz/S/lIaUUpRoFUsyaBZHQJcb1BY3eep1fZQoaAZoCWgPQwhdxHdi1sv3v5SGlFKUaBVLMmgWR0CXHfVh1DBudX2UKGgGaAloD0MInZyhuOPN8r+UhpRSlGgVSzJoFkdAlx2m9+PRzHV9lChoBmgJaA9DCMnH7gIlRfq/lIaUUpRoFUsyaBZHQJcdZ6u4gA91fZQoaAZoCWgPQwimXrcIjLX7v5SGlFKUaBVLMmgWR0CXHQ619fCzdX2UKGgGaAloD0MIhq+vdamR+L+UhpRSlGgVSzJoFkdAlx8fIS13MnV9lChoBmgJaA9DCGkbf6KyYfq/lIaUUpRoFUsyaBZHQJce0LXtjTd1fZQoaAZoCWgPQwivzcZKzLP4v5SGlFKUaBVLMmgWR0CXHpFh5PdmdX2UKGgGaAloD0MIgbIpV3gX8r+UhpRSlGgVSzJoFkdAlx44ePq9oXV9lChoBmgJaA9DCJtattYXyfe/lIaUUpRoFUsyaBZHQJcgM1uR9w51fZQoaAZoCWgPQwg6rkZ2peX2v5SGlFKUaBVLMmgWR0CXH+T8YQ8PdX2UKGgGaAloD0MIJSL8i6Cx8r+UhpRSlGgVSzJoFkdAlx+lmOEM9nV9lChoBmgJaA9DCFvtYS8UcPq/lIaUUpRoFUsyaBZHQJcfTJ9y9251fZQoaAZoCWgPQwjylxb1Sa71v5SGlFKUaBVLMmgWR0CXIUT3qRlpdX2UKGgGaAloD0MIdO0L6IX7/r+UhpRSlGgVSzJoFkdAlyD2mP5pJ3V9lChoBmgJaA9DCEuuYvGbwva/lIaUUpRoFUsyaBZHQJcgt0ZFXq91fZQoaAZoCWgPQwg/rDdqhSn4v5SGlFKUaBVLMmgWR0CXIF5jpcHGdX2UKGgGaAloD0MI6ui4GtkV+L+UhpRSlGgVSzJoFkdAlyJpl8PWhHV9lChoBmgJaA9DCOOkMO9xpva/lIaUUpRoFUsyaBZHQJciG09hZyN1fZQoaAZoCWgPQwiMvKyJBf71v5SGlFKUaBVLMmgWR0CXIdv6j323dX2UKGgGaAloD0MI9WbUfJU8+b+UhpRSlGgVSzJoFkdAlyGDAaef7XV9lChoBmgJaA9DCBmveVVn9fe/lIaUUpRoFUsyaBZHQJcjlJI1+Ap1fZQoaAZoCWgPQwi0Hr5MFOH4v5SGlFKUaBVLMmgWR0CXI0YnOSntdX2UKGgGaAloD0MIrOC3IcZr+b+UhpRSlGgVSzJoFkdAlyMG1IAfdXV9lChoBmgJaA9DCL4uw3+6gfW/lIaUUpRoFUsyaBZHQJcireVLSNR1fZQoaAZoCWgPQwhqZ5jaUof1v5SGlFKUaBVLMmgWR0CXJL60pmVadX2UKGgGaAloD0MIn69ZLhsd+L+UhpRSlGgVSzJoFkdAlyRwX2ugYnV9lChoBmgJaA9DCMBfzJasiva/lIaUUpRoFUsyaBZHQJckMPpY9xJ1fZQoaAZoCWgPQwgtsp3vp8byv5SGlFKUaBVLMmgWR0CXI9gHu7YkdX2UKGgGaAloD0MIlC9oIQGj87+UhpRSlGgVSzJoFkdAlyXnIU8FIXV9lChoBmgJaA9DCNMSK6ORD/u/lIaUUpRoFUsyaBZHQJclmMXJo011fZQoaAZoCWgPQwgIc7uX+6T6v5SGlFKUaBVLMmgWR0CXJVlcyFfzdX2UKGgGaAloD0MIHNKowMn2+r+UhpRSlGgVSzJoFkdAlyUAaef7JnV9lChoBmgJaA9DCOmbNA2KZvu/lIaUUpRoFUsyaBZHQJcnFDPWxyJ1fZQoaAZoCWgPQwg7iQj/Iij3v5SGlFKUaBVLMmgWR0CXJsXKbKA8dX2UKGgGaAloD0MIMPKyJhb49r+UhpRSlGgVSzJoFkdAlyaGcnVoYnV9lChoBmgJaA9DCDRnfcoxmfq/lIaUUpRoFUsyaBZHQJcmLa24NI91fZQoaAZoCWgPQwgyPPazWIr4v5SGlFKUaBVLMmgWR0CXKDmAskIHdX2UKGgGaAloD0MIHaopyTrc+b+UhpRSlGgVSzJoFkdAlyfrGvOhTXV9lChoBmgJaA9DCN/7G7RX3/m/lIaUUpRoFUsyaBZHQJcnrB3zMA51fZQoaAZoCWgPQwi/tn76zxr5v5SGlFKUaBVLMmgWR0CXJ1McIZ62dX2UKGgGaAloD0MIQiJt40+U+7+UhpRSlGgVSzJoFkdAlylk1Muez3V9lChoBmgJaA9DCO6yX3e6s/m/lIaUUpRoFUsyaBZHQJcpFqfvnbJ1fZQoaAZoCWgPQwhZvi7Df3r4v5SGlFKUaBVLMmgWR0CXKNd7OVxCdX2UKGgGaAloD0MIkpVfBmOE+7+UhpRSlGgVSzJoFkdAlyh+zhP0qnV9lChoBmgJaA9DCMKFPIIbafi/lIaUUpRoFUsyaBZHQJcqm4Wk8A91fZQoaAZoCWgPQwijztxDwnf2v5SGlFKUaBVLMmgWR0CXKk0j1PFedX2UKGgGaAloD0MI9utOd544/7+UhpRSlGgVSzJoFkdAlyoOFQEZBXV9lChoBmgJaA9DCKD7cma7Qv2/lIaUUpRoFUsyaBZHQJcptXtBv751fZQoaAZoCWgPQwgaGeQuwtT8v5SGlFKUaBVLMmgWR0CXK8cYIjW1dX2UKGgGaAloD0MIQuvhy0QR+r+UhpRSlGgVSzJoFkdAlyt4sd1dPnV9lChoBmgJaA9DCN3T1R2LLfe/lIaUUpRoFUsyaBZHQJcrOU5dWyV1fZQoaAZoCWgPQwjOM/YlG8/1v5SGlFKUaBVLMmgWR0CXKuBN21UmdX2UKGgGaAloD0MIKUF/oUcM9r+UhpRSlGgVSzJoFkdAlyzx0lqrR3V9lChoBmgJaA9DCIV4JF6eTve/lIaUUpRoFUsyaBZHQJcso2vStvJ1fZQoaAZoCWgPQwgvaYzWUZX1v5SGlFKUaBVLMmgWR0CXLGQJokAxdX2UKGgGaAloD0MIqiwKuyh6+r+UhpRSlGgVSzJoFkdAlywLJOnEVHV9lChoBmgJaA9DCIMvTKYKhvi/lIaUUpRoFUsyaBZHQJcuHnNgSe11fZQoaAZoCWgPQwjWx0Pf3cr6v5SGlFKUaBVLMmgWR0CXLdALRa5gdX2UKGgGaAloD0MI6GZ/oNy29L+UhpRSlGgVSzJoFkdAly2QrUb1iHV9lChoBmgJaA9DCEW8df7tcvi/lIaUUpRoFUsyaBZHQJctN72L5yl1fZQoaAZoCWgPQwjItgw4S8n6v5SGlFKUaBVLMmgWR0CXL0gGr0aqdX2UKGgGaAloD0MIV0J3SZyV9L+UhpRSlGgVSzJoFkdAly75nctXgnV9lChoBmgJaA9DCB+7C5QUmPq/lIaUUpRoFUsyaBZHQJcuujqOcUd1fZQoaAZoCWgPQwjFAIkmUET0v5SGlFKUaBVLMmgWR0CXLmFId2gWdX2UKGgGaAloD0MILzTXaaRl9r+UhpRSlGgVSzJoFkdAlzBzT4L1EnV9lChoBmgJaA9DCJvkR/yKNfa/lIaUUpRoFUsyaBZHQJcwJRJmNBF1fZQoaAZoCWgPQwjWOnE5XsHyv5SGlFKUaBVLMmgWR0CXL+XZXdTHdX2UKGgGaAloD0MIKgDGM2jo+L+UhpRSlGgVSzJoFkdAly+M6vJRwnV9lChoBmgJaA9DCBk5C3va4fe/lIaUUpRoFUsyaBZHQJcxndLxqfx1fZQoaAZoCWgPQwj11VWBWsz4v5SGlFKUaBVLMmgWR0CXMU9vjwQUdX2UKGgGaAloD0MI5dL4hVcS+7+UhpRSlGgVSzJoFkdAlzEQOavzOHV9lChoBmgJaA9DCCOfVzz1SPi/lIaUUpRoFUsyaBZHQJcwtzvJA+p1fZQoaAZoCWgPQwjrNqj91o76v5SGlFKUaBVLMmgWR0CXMsrTpgTidX2UKGgGaAloD0MIfZI7bCIz+r+UhpRSlGgVSzJoFkdAlzJ8bFS88XV9lChoBmgJaA9DCDzbozfcB/e/lIaUUpRoFUsyaBZHQJcyPTTfBN51fZQoaAZoCWgPQwiWsgxxrAv6v5SGlFKUaBVLMmgWR0CXMeSaEzwddX2UKGgGaAloD0MIYRkbutkf+L+UhpRSlGgVSzJoFkdAlzP3r+o993V9lChoBmgJaA9DCKfNOA1RRfu/lIaUUpRoFUsyaBZHQJczqUJOWSl1fZQoaAZoCWgPQwj27SQi/Ev2v5SGlFKUaBVLMmgWR0CXM2nl4keIdX2UKGgGaAloD0MII9v5fmq89L+UhpRSlGgVSzJoFkdAlzMQ9FF2FHV9lChoBmgJaA9DCF+y8WCL3fe/lIaUUpRoFUsyaBZHQJc1JvtMPBl1fZQoaAZoCWgPQwgwL8A+OnX2v5SGlFKUaBVLMmgWR0CXNNiTMaCMdX2UKGgGaAloD0MIoOHNGrzv+b+UhpRSlGgVSzJoFkdAlzSZON5t33V9lChoBmgJaA9DCEt1AS8zbPe/lIaUUpRoFUsyaBZHQJc0QD0UXYV1ZS4="
|
| 81 |
},
|
| 82 |
"ep_success_buffer": {
|
| 83 |
":type:": "<class 'collections.deque'>",
|
| 84 |
":serialized:": "gAWVIAAAAAAAAACMC2NvbGxlY3Rpb25zlIwFZGVxdWWUk5QpS2SGlFKULg=="
|
| 85 |
},
|
| 86 |
+
"_n_updates": 489,
|
| 87 |
+
"n_steps": 512,
|
| 88 |
+
"gamma": 0.9546251877513446,
|
| 89 |
"gae_lambda": 1.0,
|
| 90 |
+
"ent_coef": 0.00012083804240540896,
|
| 91 |
"vf_coef": 0.5,
|
| 92 |
"max_grad_norm": 0.5,
|
| 93 |
"normalize_advantage": false
|
a2c-PandaReachDense-v2/policy.optimizer.pth
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 44734
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:f83726cdce6511fa20ebcc5902ad083ed5ca3f671ba7625140613f3b17261a17
|
| 3 |
size 44734
|
a2c-PandaReachDense-v2/policy.pth
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 46014
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:0b4161230e925be80cb72f48c15bd3a9d5c2deb15e2f609ce3cb52ebd3d9eedf
|
| 3 |
size 46014
|
config.json
CHANGED
|
@@ -1 +1 @@
|
|
| 1 |
-
{"policy_class": {":type:": "<class 'abc.ABCMeta'>", ":serialized:": "gAWVRQAAAAAAAACMIXN0YWJsZV9iYXNlbGluZXMzLmNvbW1vbi5wb2xpY2llc5SMG011bHRpSW5wdXRBY3RvckNyaXRpY1BvbGljeZSTlC4=", "__module__": "stable_baselines3.common.policies", "__doc__": "\n MultiInputActorClass policy class for actor-critic algorithms (has both policy and value prediction).\n Used by A2C, PPO and the likes.\n\n :param observation_space: Observation space (Tuple)\n :param action_space: Action space\n :param lr_schedule: Learning rate schedule (could be constant)\n :param net_arch: The specification of the policy and value networks.\n :param activation_fn: Activation function\n :param ortho_init: Whether to use or not orthogonal initialization\n :param use_sde: Whether to use State Dependent Exploration or not\n :param log_std_init: Initial value for the log standard deviation\n :param full_std: Whether to use (n_features x n_actions) parameters\n for the std instead of only (n_features,) when using gSDE\n :param use_expln: Use ``expln()`` function instead of ``exp()`` to ensure\n a positive standard deviation (cf paper). It allows to keep variance\n above zero and prevent it from growing too fast. In practice, ``exp()`` is usually enough.\n :param squash_output: Whether to squash the output using a tanh function,\n this allows to ensure boundaries when using gSDE.\n :param features_extractor_class: Uses the CombinedExtractor\n :param features_extractor_kwargs: Keyword arguments\n to pass to the features extractor.\n :param share_features_extractor: If True, the features extractor is shared between the policy and value networks.\n :param normalize_images: Whether to normalize images or not,\n dividing by 255.0 (True by default)\n :param optimizer_class: The optimizer to use,\n ``th.optim.Adam`` by default\n :param optimizer_kwargs: Additional keyword arguments,\n excluding the learning rate, to pass to the optimizer\n ", "__init__": "<function MultiInputActorCriticPolicy.__init__ at 0x7f413ff6eee0>", "__abstractmethods__": "frozenset()", "_abc_impl": "<_abc._abc_data object at 0x7f413ff708c0>"}, "verbose": 1, "policy_kwargs": {":type:": "<class 'dict'>", ":serialized:": "gAWVgQAAAAAAAAB9lCiMD29wdGltaXplcl9jbGFzc5SME3RvcmNoLm9wdGltLnJtc3Byb3CUjAdSTVNwcm9wlJOUjBBvcHRpbWl6ZXJfa3dhcmdzlH2UKIwFYWxwaGGURz/vrhR64UeujANlcHOURz7k+LWI42jxjAx3ZWlnaHRfZGVjYXmUSwB1dS4=", "optimizer_class": "<class 'torch.optim.rmsprop.RMSprop'>", "optimizer_kwargs": {"alpha": 0.99, "eps": 1e-05, "weight_decay": 0}}, "observation_space": {":type:": "<class 'gym.spaces.dict.Dict'>", ":serialized:": "gAWVUgMAAAAAAACMD2d5bS5zcGFjZXMuZGljdJSMBERpY3SUk5QpgZR9lCiMBnNwYWNlc5SMC2NvbGxlY3Rpb25zlIwLT3JkZXJlZERpY3SUk5QpUpQojA1hY2hpZXZlZF9nb2FslIwOZ3ltLnNwYWNlcy5ib3iUjANCb3iUk5QpgZR9lCiMBWR0eXBllIwFbnVtcHmUaBCTlIwCZjSUiYiHlFKUKEsDjAE8lE5OTkr/////Sv////9LAHSUYowGX3NoYXBllEsDhZSMA2xvd5SMEm51bXB5LmNvcmUubnVtZXJpY5SMC19mcm9tYnVmZmVylJOUKJYMAAAAAAAAAAAAIMEAACDBAAAgwZRoFUsDhZSMAUOUdJRSlIwEaGlnaJRoHSiWDAAAAAAAAAAAACBBAAAgQQAAIEGUaBVLA4WUaCB0lFKUjA1ib3VuZGVkX2JlbG93lGgdKJYDAAAAAAAAAAEBAZRoEowCYjGUiYiHlFKUKEsDjAF8lE5OTkr/////Sv////9LAHSUYksDhZRoIHSUUpSMDWJvdW5kZWRfYWJvdmWUaB0olgMAAAAAAAAAAQEBlGgsSwOFlGggdJRSlIwKX25wX3JhbmRvbZROdWKMDGRlc2lyZWRfZ29hbJRoDSmBlH2UKGgQaBVoGEsDhZRoGmgdKJYMAAAAAAAAAAAAIMEAACDBAAAgwZRoFUsDhZRoIHSUUpRoI2gdKJYMAAAAAAAAAAAAIEEAACBBAAAgQZRoFUsDhZRoIHSUUpRoKGgdKJYDAAAAAAAAAAEBAZRoLEsDhZRoIHSUUpRoMmgdKJYDAAAAAAAAAAEBAZRoLEsDhZRoIHSUUpRoN051YowLb2JzZXJ2YXRpb26UaA0pgZR9lChoEGgVaBhLBoWUaBpoHSiWGAAAAAAAAAAAACDBAAAgwQAAIMEAACDBAAAgwQAAIMGUaBVLBoWUaCB0lFKUaCNoHSiWGAAAAAAAAAAAACBBAAAgQQAAIEEAACBBAAAgQQAAIEGUaBVLBoWUaCB0lFKUaChoHSiWBgAAAAAAAAABAQEBAQGUaCxLBoWUaCB0lFKUaDJoHSiWBgAAAAAAAAABAQEBAQGUaCxLBoWUaCB0lFKUaDdOdWJ1aBhOaBBOaDdOdWIu", "spaces": "OrderedDict([('achieved_goal', Box([-10. -10. -10.], [10. 10. 10.], (3,), float32)), ('desired_goal', Box([-10. -10. -10.], [10. 10. 10.], (3,), float32)), ('observation', Box([-10. -10. -10. -10. -10. -10.], [10. 10. 10. 10. 10. 10.], (6,), float32))])", "_shape": null, "dtype": null, "_np_random": null}, "action_space": {":type:": "<class 'gym.spaces.box.Box'>", ":serialized:": "gAWVbQEAAAAAAACMDmd5bS5zcGFjZXMuYm94lIwDQm94lJOUKYGUfZQojAVkdHlwZZSMBW51bXB5lGgFk5SMAmY0lImIh5RSlChLA4wBPJROTk5K/////0r/////SwB0lGKMBl9zaGFwZZRLA4WUjANsb3eUjBJudW1weS5jb3JlLm51bWVyaWOUjAtfZnJvbWJ1ZmZlcpSTlCiWDAAAAAAAAAAAAIC/AACAvwAAgL+UaApLA4WUjAFDlHSUUpSMBGhpZ2iUaBIolgwAAAAAAAAAAACAPwAAgD8AAIA/lGgKSwOFlGgVdJRSlIwNYm91bmRlZF9iZWxvd5RoEiiWAwAAAAAAAAABAQGUaAeMAmIxlImIh5RSlChLA4wBfJROTk5K/////0r/////SwB0lGJLA4WUaBV0lFKUjA1ib3VuZGVkX2Fib3ZllGgSKJYDAAAAAAAAAAEBAZRoIUsDhZRoFXSUUpSMCl9ucF9yYW5kb22UTnViLg==", "dtype": "float32", "_shape": [3], "low": "[-1. -1. -1.]", "high": "[1. 1. 1.]", "bounded_below": "[ True True True]", "bounded_above": "[ True True True]", "_np_random": null}, "n_envs": 4, "num_timesteps": 1000000, "_total_timesteps": 1000000, "_num_timesteps_at_start": 0, "seed": null, "action_noise": null, "start_time": 1680364251981433255, "learning_rate": 0.0007, "tensorboard_log": null, "lr_schedule": {":type:": "<class 'function'>", ":serialized:": "gAWVAQMAAAAAAACMF2Nsb3VkcGlja2xlLmNsb3VkcGlja2xllIwOX21ha2VfZnVuY3Rpb26Uk5QoaACMDV9idWlsdGluX3R5cGWUk5SMCENvZGVUeXBllIWUUpQoSwFLAEsASwFLAUsTQwSIAFMAlE6FlCmMAV+UhZSMZy9ob21lL3UvbWluaWNvbmRhMy9lbnZzL2h1Z2dpbmdmYWNlLXVuaXQ2L2xpYi9weXRob24zLjkvc2l0ZS1wYWNrYWdlcy9zdGFibGVfYmFzZWxpbmVzMy9jb21tb24vdXRpbHMucHmUjARmdW5jlEuCQwIAAZSMA3ZhbJSFlCl0lFKUfZQojAtfX3BhY2thZ2VfX5SMGHN0YWJsZV9iYXNlbGluZXMzLmNvbW1vbpSMCF9fbmFtZV9flIwec3RhYmxlX2Jhc2VsaW5lczMuY29tbW9uLnV0aWxzlIwIX19maWxlX1+UjGcvaG9tZS91L21pbmljb25kYTMvZW52cy9odWdnaW5nZmFjZS11bml0Ni9saWIvcHl0aG9uMy45L3NpdGUtcGFja2FnZXMvc3RhYmxlX2Jhc2VsaW5lczMvY29tbW9uL3V0aWxzLnB5lHVOTmgAjBBfbWFrZV9lbXB0eV9jZWxslJOUKVKUhZR0lFKUjBxjbG91ZHBpY2tsZS5jbG91ZHBpY2tsZV9mYXN0lIwSX2Z1bmN0aW9uX3NldHN0YXRllJOUaB99lH2UKGgWaA2MDF9fcXVhbG5hbWVfX5SMGWNvbnN0YW50X2ZuLjxsb2NhbHM+LmZ1bmOUjA9fX2Fubm90YXRpb25zX1+UfZSMDl9fa3dkZWZhdWx0c19flE6MDF9fZGVmYXVsdHNfX5ROjApfX21vZHVsZV9flGgXjAdfX2RvY19flE6MC19fY2xvc3VyZV9flGgAjApfbWFrZV9jZWxslJOURz9G8AaNuLrHhZRSlIWUjBdfY2xvdWRwaWNrbGVfc3VibW9kdWxlc5RdlIwLX19nbG9iYWxzX1+UfZR1hpSGUjAu"}, "_last_obs": {":type:": "<class 'collections.OrderedDict'>", ":serialized:": "gAWVuwEAAAAAAACMC2NvbGxlY3Rpb25zlIwLT3JkZXJlZERpY3SUk5QpUpQojA1hY2hpZXZlZF9nb2FslIwSbnVtcHkuY29yZS5udW1lcmljlIwLX2Zyb21idWZmZXKUk5QoljAAAAAAAAAAz5W6PowegDuJMg0/z5W6PowegDuJMg0/z5W6PowegDuJMg0/z5W6PowegDuJMg0/lIwFbnVtcHmUjAVkdHlwZZSTlIwCZjSUiYiHlFKUKEsDjAE8lE5OTkr/////Sv////9LAHSUYksESwOGlIwBQ5R0lFKUjAxkZXNpcmVkX2dvYWyUaAcoljAAAAAAAAAAtqpEv4tZUj/O6ha9wdtVP0HYuj+uFI4/Jsd1vVM/3r4ZheM+tVF5P/iEGT/fuKi/lGgOSwRLA4aUaBJ0lFKUjAtvYnNlcnZhdGlvbpRoByiWYAAAAAAAAADPlbo+jB6AO4kyDT/sM1Y7tZl2ukgL87rPlbo+jB6AO4kyDT/sM1Y7tZl2ukgL87rPlbo+jB6AO4kyDT/sM1Y7tZl2ukgL87rPlbo+jB6AO4kyDT/sM1Y7tZl2ukgL87qUaA5LBEsGhpRoEnSUUpR1Lg==", "achieved_goal": "[[0.3644242 0.00390989 0.55155236]\n [0.3644242 0.00390989 0.55155236]\n [0.3644242 0.00390989 0.55155236]\n [0.3644242 0.00390989 0.55155236]]", "desired_goal": "[[-0.76822984 0.8216788 -0.03684502]\n [ 0.8353844 1.4597245 1.1100061 ]\n [-0.06000438 -0.43407688 0.44437483]\n [ 0.973903 0.5996852 -1.3181418 ]]", "observation": "[[ 0.3644242 0.00390989 0.55155236 0.00326848 -0.00094071 -0.00185428]\n [ 0.3644242 0.00390989 0.55155236 0.00326848 -0.00094071 -0.00185428]\n [ 0.3644242 0.00390989 0.55155236 0.00326848 -0.00094071 -0.00185428]\n [ 0.3644242 0.00390989 0.55155236 0.00326848 -0.00094071 -0.00185428]]"}, "_last_episode_starts": {":type:": "<class 'numpy.ndarray'>", ":serialized:": "gAWVdwAAAAAAAACMEm51bXB5LmNvcmUubnVtZXJpY5SMC19mcm9tYnVmZmVylJOUKJYEAAAAAAAAAAEBAQGUjAVudW1weZSMBWR0eXBllJOUjAJiMZSJiIeUUpQoSwOMAXyUTk5OSv////9K/////0sAdJRiSwSFlIwBQ5R0lFKULg=="}, "_last_original_obs": {":type:": "<class 'collections.OrderedDict'>", ":serialized:": "gAWVuwEAAAAAAACMC2NvbGxlY3Rpb25zlIwLT3JkZXJlZERpY3SUk5QpUpQojA1hY2hpZXZlZF9nb2FslIwSbnVtcHkuY29yZS5udW1lcmljlIwLX2Zyb21idWZmZXKUk5QoljAAAAAAAAAA6nIdPRlsGqxDI0o+6nIdPRlsGqxDI0o+6nIdPRlsGqxDI0o+6nIdPRlsGqxDI0o+lIwFbnVtcHmUjAVkdHlwZZSTlIwCZjSUiYiHlFKUKEsDjAE8lE5OTkr/////Sv////9LAHSUYksESwOGlIwBQ5R0lFKUjAxkZXNpcmVkX2dvYWyUaAcoljAAAAAAAAAA2lXNPa/10r3mIF0+mtHavY3QFr0Q6xA+VQ7HPAYM7b0jbGo+6wauPUXN0D0CjYk9lGgOSwRLA4aUaBJ0lFKUjAtvYnNlcnZhdGlvbpRoByiWYAAAAAAAAADqch09GWwarEMjSj4AAAAAAAAAgAAAAADqch09GWwarEMjSj4AAAAAAAAAgAAAAADqch09GWwarEMjSj4AAAAAAAAAgAAAAADqch09GWwarEMjSj4AAAAAAAAAgAAAAACUaA5LBEsGhpRoEnSUUpR1Lg==", "achieved_goal": "[[ 3.8439669e-02 -2.1944723e-12 1.9740014e-01]\n [ 3.8439669e-02 -2.1944723e-12 1.9740014e-01]\n [ 3.8439669e-02 -2.1944723e-12 1.9740014e-01]\n [ 3.8439669e-02 -2.1944723e-12 1.9740014e-01]]", "desired_goal": "[[ 0.10026141 -0.10300767 0.21594581]\n [-0.1068451 -0.03681998 0.14152169]\n [ 0.02429883 -0.11574559 0.22892813]\n [ 0.08497413 0.10195402 0.06716348]]", "observation": "[[ 3.8439669e-02 -2.1944723e-12 1.9740014e-01 0.0000000e+00\n -0.0000000e+00 0.0000000e+00]\n [ 3.8439669e-02 -2.1944723e-12 1.9740014e-01 0.0000000e+00\n -0.0000000e+00 0.0000000e+00]\n [ 3.8439669e-02 -2.1944723e-12 1.9740014e-01 0.0000000e+00\n -0.0000000e+00 0.0000000e+00]\n [ 3.8439669e-02 -2.1944723e-12 1.9740014e-01 0.0000000e+00\n -0.0000000e+00 0.0000000e+00]]"}, "_episode_num": 0, "use_sde": false, "sde_sample_freq": -1, "_current_progress_remaining": 0.0, "ep_info_buffer": {":type:": "<class 'collections.deque'>", ":serialized:": "gAWVHRAAAAAAAACMC2NvbGxlY3Rpb25zlIwFZGVxdWWUk5QpS2SGlFKUKH2UKIwBcpSMFW51bXB5LmNvcmUubXVsdGlhcnJheZSMBnNjYWxhcpSTlIwFbnVtcHmUjAVkdHlwZZSTlIwCZjiUiYiHlFKUKEsDjAE8lE5OTkr/////Sv////9LAHSUYkMIVACMZ9DQ7b+UhpRSlIwBbJRLMowBdJRHQJ9cp+nZTQ51fZQoaAZoCWgPQwha1Ce5wybwv5SGlFKUaBVLMmgWR0CfXG2USqVAdX2UKGgGaAloD0MIyqSGNgCb5b+UhpRSlGgVSzJoFkdAn1w0ug6EJ3V9lChoBmgJaA9DCHkEN1K2SOq/lIaUUpRoFUsyaBZHQJ9b/HlwLmZ1fZQoaAZoCWgPQwhDAdvBiD35v5SGlFKUaBVLMmgWR0CfXiTLns9kdX2UKGgGaAloD0MIUigLX19r+r+UhpRSlGgVSzJoFkdAn13qoIfKZHV9lChoBmgJaA9DCNSYEHNJFfG/lIaUUpRoFUsyaBZHQJ9dsaR6nix1fZQoaAZoCWgPQwgukKD4Meb3v5SGlFKUaBVLMmgWR0CfXXlZX+2mdX2UKGgGaAloD0MIT+eKUkKw3L+UhpRSlGgVSzJoFkdAn1/PdAPd23V9lChoBmgJaA9DCPSpY5XSc/+/lIaUUpRoFUsyaBZHQJ9fleNT9891fZQoaAZoCWgPQwjGGFjH8UPsv5SGlFKUaBVLMmgWR0CfX13A2ycDdX2UKGgGaAloD0MIt11ortNI4r+UhpRSlGgVSzJoFkdAn18mIsRQJ3V9lChoBmgJaA9DCN2XM9sVOva/lIaUUpRoFUsyaBZHQJ9hWwmmce91fZQoaAZoCWgPQwgna9RDNDrvv5SGlFKUaBVLMmgWR0CfYSD/2kBTdX2UKGgGaAloD0MIEALyJVSw9b+UhpRSlGgVSzJoFkdAn2DoVIqb0HV9lChoBmgJaA9DCGvylNV0/fK/lIaUUpRoFUsyaBZHQJ9gr80k4WF1fZQoaAZoCWgPQwjMYIxIFJr4v5SGlFKUaBVLMmgWR0CfYsrs0HhTdX2UKGgGaAloD0MIu2JGeHsQ7r+UhpRSlGgVSzJoFkdAn2KQhGH58HV9lChoBmgJaA9DCLh0zHnGfv2/lIaUUpRoFUsyaBZHQJ9iV9iMHbB1fZQoaAZoCWgPQwhh304iwv/zv5SGlFKUaBVLMmgWR0CfYh+PBBRidX2UKGgGaAloD0MIZED2eveH8r+UhpRSlGgVSzJoFkdAn2Q5VsDW9XV9lChoBmgJaA9DCDGXVG03wfi/lIaUUpRoFUsyaBZHQJ9j/s6aLGd1fZQoaAZoCWgPQwhMb38uGrLiv5SGlFKUaBVLMmgWR0CfY8Xg9/z8dX2UKGgGaAloD0MIQYLix5g76L+UhpRSlGgVSzJoFkdAn2ONcjZ+QXV9lChoBmgJaA9DCPDce7jkuPu/lIaUUpRoFUsyaBZHQJ9lnzDn/1h1fZQoaAZoCWgPQwjRXRJnRdQAwJSGlFKUaBVLMmgWR0CfZWT0QK8ddX2UKGgGaAloD0MIKdAn8iRp4r+UhpRSlGgVSzJoFkdAn2UsK1G9YnV9lChoBmgJaA9DCJ6ymq4nOui/lIaUUpRoFUsyaBZHQJ9k8/bCaZx1fZQoaAZoCWgPQwhLj6Z6Mn/6v5SGlFKUaBVLMmgWR0CfZxJ7LMcIdX2UKGgGaAloD0MI7lutE5fj+L+UhpRSlGgVSzJoFkdAn2bYCZF5OnV9lChoBmgJaA9DCBCyLJj4I+q/lIaUUpRoFUsyaBZHQJ9mn0Gu9vl1fZQoaAZoCWgPQwiyZmSQuwjyv5SGlFKUaBVLMmgWR0CfZma/yoXLdX2UKGgGaAloD0MI5dTOMLWl8b+UhpRSlGgVSzJoFkdAn2hctCiRGXV9lChoBmgJaA9DCHKG4o43ufa/lIaUUpRoFUsyaBZHQJ9oIjopx3p1fZQoaAZoCWgPQwhAFMyYgvXyv5SGlFKUaBVLMmgWR0CfZ+lNUOurdX2UKGgGaAloD0MIpmPOM/Yl9b+UhpRSlGgVSzJoFkdAn2ewymALA3V9lChoBmgJaA9DCCocQSrFTvu/lIaUUpRoFUsyaBZHQJ9pt+6RQrN1fZQoaAZoCWgPQwjDEDl9PV/tv5SGlFKUaBVLMmgWR0CfaX3N9ph4dX2UKGgGaAloD0MIPL69a9AX6L+UhpRSlGgVSzJoFkdAn2lFBppN9HV9lChoBmgJaA9DCNPB+j+H+eu/lIaUUpRoFUsyaBZHQJ9pDLowEhd1fZQoaAZoCWgPQwgZPEz75j78v5SGlFKUaBVLMmgWR0Cfaxw22oegdX2UKGgGaAloD0MIfO9v0F796r+UhpRSlGgVSzJoFkdAn2rh0yP+43V9lChoBmgJaA9DCBL27SQivPO/lIaUUpRoFUsyaBZHQJ9qqTGHYYl1fZQoaAZoCWgPQwja5Vsf1pvlv5SGlFKUaBVLMmgWR0CfanCpm29ddX2UKGgGaAloD0MIFQDjGTR077+UhpRSlGgVSzJoFkdAn2yHs5XEInV9lChoBmgJaA9DCBb59UNscP2/lIaUUpRoFUsyaBZHQJ9sTYSQHRl1fZQoaAZoCWgPQwgnhA66hMPvv5SGlFKUaBVLMmgWR0CfbBS39aUzdX2UKGgGaAloD0MI3nGKjuRy8b+UhpRSlGgVSzJoFkdAn2vcasIVunV9lChoBmgJaA9DCHO8AtGTsuq/lIaUUpRoFUsyaBZHQJ9t5orWiDd1fZQoaAZoCWgPQwhvDAHAsWfrv5SGlFKUaBVLMmgWR0Cfbaw482aVdX2UKGgGaAloD0MIw5/hzRq897+UhpRSlGgVSzJoFkdAn21zOHFglXV9lChoBmgJaA9DCANDVrd6DvW/lIaUUpRoFUsyaBZHQJ9tOxlg+hZ1fZQoaAZoCWgPQwgQJVryeJr0v5SGlFKUaBVLMmgWR0Cfb0ZVn27GdX2UKGgGaAloD0MIDwnf+xu08b+UhpRSlGgVSzJoFkdAn28MANoak3V9lChoBmgJaA9DCBmO5zOgXu+/lIaUUpRoFUsyaBZHQJ9u0wUQCjl1fZQoaAZoCWgPQwgQlrGhmz31v5SGlFKUaBVLMmgWR0Cfbpq4H5aedX2UKGgGaAloD0MIzm4tk+H487+UhpRSlGgVSzJoFkdAn3C0iMYMv3V9lChoBmgJaA9DCHpyTYHMTve/lIaUUpRoFUsyaBZHQJ9welWOp851fZQoaAZoCWgPQwjqJcYy/ZLjv5SGlFKUaBVLMmgWR0CfcEFyaNModX2UKGgGaAloD0MIoib6fJQR/L+UhpRSlGgVSzJoFkdAn3AI9ovi+HV9lChoBmgJaA9DCMnJxK2CGOW/lIaUUpRoFUsyaBZHQJ9zdQ66reZ1fZQoaAZoCWgPQwhivVErTB/8v5SGlFKUaBVLMmgWR0CfczqnWJ7+dX2UKGgGaAloD0MIeAyP/SyW8L+UhpRSlGgVSzJoFkdAn3MBqO938nV9lChoBmgJaA9DCHbj3ZGxWvO/lIaUUpRoFUsyaBZHQJ9yySX+l0p1fZQoaAZoCWgPQwhr09heC3r8v5SGlFKUaBVLMmgWR0CfdN4vexfOdX2UKGgGaAloD0MI1NUdi23S8r+UhpRSlGgVSzJoFkdAn3Sj+3pfQnV9lChoBmgJaA9DCLSqJR3l4O6/lIaUUpRoFUsyaBZHQJ90a0/nnuB1fZQoaAZoCWgPQwhPXI5XIPrtv5SGlFKUaBVLMmgWR0CfdDLvCuU2dX2UKGgGaAloD0MIKA6g3/fv8L+UhpRSlGgVSzJoFkdAn3ZVJHy3C3V9lChoBmgJaA9DCCWWlLvPMfG/lIaUUpRoFUsyaBZHQJ92GwgTyrh1fZQoaAZoCWgPQwhKlpNQ+sL1v5SGlFKUaBVLMmgWR0CfdeJfpljFdX2UKGgGaAloD0MIGsBbIEFx6b+UhpRSlGgVSzJoFkdAn3WqFM7EHnV9lChoBmgJaA9DCLdif9k9+fC/lIaUUpRoFUsyaBZHQJ94CT6i0v51fZQoaAZoCWgPQwgXKCmwACblv5SGlFKUaBVLMmgWR0Cfd88RL9MsdX2UKGgGaAloD0MIY0fjUL+L8L+UhpRSlGgVSzJoFkdAn3eWW2PT5XV9lChoBmgJaA9DCFkV4Sajyua/lIaUUpRoFUsyaBZHQJ93XivPkaN1fZQoaAZoCWgPQwjiy0QRUjfnv5SGlFKUaBVLMmgWR0CfeZcL0BfbdX2UKGgGaAloD0MI7niT36KT4b+UhpRSlGgVSzJoFkdAn3lc4gieNHV9lChoBmgJaA9DCCZSms3jsPC/lIaUUpRoFUsyaBZHQJ95JDTjNpx1fZQoaAZoCWgPQwiF0axsH3Ltv5SGlFKUaBVLMmgWR0CfeOv24/eMdX2UKGgGaAloD0MIZwqd19il6r+UhpRSlGgVSzJoFkdAn3soiHIp6XV9lChoBmgJaA9DCJ31Kcdkcee/lIaUUpRoFUsyaBZHQJ967kuHvc91fZQoaAZoCWgPQwjbF9ALd67zv5SGlFKUaBVLMmgWR0CferWpZOi4dX2UKGgGaAloD0MImIkipG7n7b+UhpRSlGgVSzJoFkdAn3p9Pci4a3V9lChoBmgJaA9DCPDce7jkePO/lIaUUpRoFUsyaBZHQJ98j5mAbyZ1fZQoaAZoCWgPQwjJrUm3JXLpv5SGlFKUaBVLMmgWR0CffFVktmL+dX2UKGgGaAloD0MI+1ksRfLV+L+UhpRSlGgVSzJoFkdAn3wcs189fXV9lChoBmgJaA9DCJKvBFJi1+y/lIaUUpRoFUsyaBZHQJ975HjIaLp1fZQoaAZoCWgPQwgOMPMd/MTmv5SGlFKUaBVLMmgWR0CffgTLW7OFdX2UKGgGaAloD0MIpUqUvaUc67+UhpRSlGgVSzJoFkdAn33KxLTQV3V9lChoBmgJaA9DCAWIghlT8PG/lIaUUpRoFUsyaBZHQJ99kfIS13N1fZQoaAZoCWgPQwh1WyIXnEH0v5SGlFKUaBVLMmgWR0CffVml67d0dX2UKGgGaAloD0MIJF6ezhWl5r+UhpRSlGgVSzJoFkdAn3+eMyad+XV9lChoBmgJaA9DCOm4GtmVFuG/lIaUUpRoFUsyaBZHQJ9/ZARkEs91fZQoaAZoCWgPQwh0le6usyHlv5SGlFKUaBVLMmgWR0CffytWuHN5dX2UKGgGaAloD0MIoZ3TLNCu9b+UhpRSlGgVSzJoFkdAn37y1y/9HnV9lChoBmgJaA9DCLow0ovaPfG/lIaUUpRoFUsyaBZHQJ+BaPS2H+J1fZQoaAZoCWgPQwgq5iDoaNXlv5SGlFKUaBVLMmgWR0CfgS7MgU1ydX2UKGgGaAloD0MIqUwxB0FH2r+UhpRSlGgVSzJoFkdAn4D2KVII4XV9lChoBmgJaA9DCCZV203wze2/lIaUUpRoFUsyaBZHQJ+AvaWX1J11ZS4="}, "ep_success_buffer": {":type:": "<class 'collections.deque'>", ":serialized:": "gAWVIAAAAAAAAACMC2NvbGxlY3Rpb25zlIwFZGVxdWWUk5QpS2SGlFKULg=="}, "_n_updates": 50000, "n_steps": 5, "gamma": 0.99, "gae_lambda": 1.0, "ent_coef": 0.0, "vf_coef": 0.5, "max_grad_norm": 0.5, "normalize_advantage": false, "system_info": {"OS": "Linux-5.15.90.1-microsoft-standard-WSL2-x86_64-with-glibc2.35 # 1 SMP Fri Jan 27 02:56:13 UTC 2023", "Python": "3.9.16", "Stable-Baselines3": "1.7.0", "PyTorch": "2.0.0+cu117", "GPU Enabled": "True", "Numpy": "1.24.2", "Gym": "0.21.0"}}
|
|
|
|
| 1 |
+
{"policy_class": {":type:": "<class 'abc.ABCMeta'>", ":serialized:": "gAWVRQAAAAAAAACMIXN0YWJsZV9iYXNlbGluZXMzLmNvbW1vbi5wb2xpY2llc5SMG011bHRpSW5wdXRBY3RvckNyaXRpY1BvbGljeZSTlC4=", "__module__": "stable_baselines3.common.policies", "__doc__": "\n MultiInputActorClass policy class for actor-critic algorithms (has both policy and value prediction).\n Used by A2C, PPO and the likes.\n\n :param observation_space: Observation space (Tuple)\n :param action_space: Action space\n :param lr_schedule: Learning rate schedule (could be constant)\n :param net_arch: The specification of the policy and value networks.\n :param activation_fn: Activation function\n :param ortho_init: Whether to use or not orthogonal initialization\n :param use_sde: Whether to use State Dependent Exploration or not\n :param log_std_init: Initial value for the log standard deviation\n :param full_std: Whether to use (n_features x n_actions) parameters\n for the std instead of only (n_features,) when using gSDE\n :param use_expln: Use ``expln()`` function instead of ``exp()`` to ensure\n a positive standard deviation (cf paper). It allows to keep variance\n above zero and prevent it from growing too fast. In practice, ``exp()`` is usually enough.\n :param squash_output: Whether to squash the output using a tanh function,\n this allows to ensure boundaries when using gSDE.\n :param features_extractor_class: Uses the CombinedExtractor\n :param features_extractor_kwargs: Keyword arguments\n to pass to the features extractor.\n :param share_features_extractor: If True, the features extractor is shared between the policy and value networks.\n :param normalize_images: Whether to normalize images or not,\n dividing by 255.0 (True by default)\n :param optimizer_class: The optimizer to use,\n ``th.optim.Adam`` by default\n :param optimizer_kwargs: Additional keyword arguments,\n excluding the learning rate, to pass to the optimizer\n ", "__init__": "<function MultiInputActorCriticPolicy.__init__ at 0x7fb0446b6f70>", "__abstractmethods__": "frozenset()", "_abc_impl": "<_abc._abc_data object at 0x7fb0446b5e80>"}, "verbose": 1, "policy_kwargs": {":type:": "<class 'dict'>", ":serialized:": "gAWVgQAAAAAAAAB9lCiMD29wdGltaXplcl9jbGFzc5SME3RvcmNoLm9wdGltLnJtc3Byb3CUjAdSTVNwcm9wlJOUjBBvcHRpbWl6ZXJfa3dhcmdzlH2UKIwFYWxwaGGURz/vrhR64UeujANlcHOURz7k+LWI42jxjAx3ZWlnaHRfZGVjYXmUSwB1dS4=", "optimizer_class": "<class 'torch.optim.rmsprop.RMSprop'>", "optimizer_kwargs": {"alpha": 0.99, "eps": 1e-05, "weight_decay": 0}}, "observation_space": {":type:": "<class 'gym.spaces.dict.Dict'>", ":serialized:": "gAWVUgMAAAAAAACMD2d5bS5zcGFjZXMuZGljdJSMBERpY3SUk5QpgZR9lCiMBnNwYWNlc5SMC2NvbGxlY3Rpb25zlIwLT3JkZXJlZERpY3SUk5QpUpQojA1hY2hpZXZlZF9nb2FslIwOZ3ltLnNwYWNlcy5ib3iUjANCb3iUk5QpgZR9lCiMBWR0eXBllIwFbnVtcHmUaBCTlIwCZjSUiYiHlFKUKEsDjAE8lE5OTkr/////Sv////9LAHSUYowGX3NoYXBllEsDhZSMA2xvd5SMEm51bXB5LmNvcmUubnVtZXJpY5SMC19mcm9tYnVmZmVylJOUKJYMAAAAAAAAAAAAIMEAACDBAAAgwZRoFUsDhZSMAUOUdJRSlIwEaGlnaJRoHSiWDAAAAAAAAAAAACBBAAAgQQAAIEGUaBVLA4WUaCB0lFKUjA1ib3VuZGVkX2JlbG93lGgdKJYDAAAAAAAAAAEBAZRoEowCYjGUiYiHlFKUKEsDjAF8lE5OTkr/////Sv////9LAHSUYksDhZRoIHSUUpSMDWJvdW5kZWRfYWJvdmWUaB0olgMAAAAAAAAAAQEBlGgsSwOFlGggdJRSlIwKX25wX3JhbmRvbZROdWKMDGRlc2lyZWRfZ29hbJRoDSmBlH2UKGgQaBVoGEsDhZRoGmgdKJYMAAAAAAAAAAAAIMEAACDBAAAgwZRoFUsDhZRoIHSUUpRoI2gdKJYMAAAAAAAAAAAAIEEAACBBAAAgQZRoFUsDhZRoIHSUUpRoKGgdKJYDAAAAAAAAAAEBAZRoLEsDhZRoIHSUUpRoMmgdKJYDAAAAAAAAAAEBAZRoLEsDhZRoIHSUUpRoN051YowLb2JzZXJ2YXRpb26UaA0pgZR9lChoEGgVaBhLBoWUaBpoHSiWGAAAAAAAAAAAACDBAAAgwQAAIMEAACDBAAAgwQAAIMGUaBVLBoWUaCB0lFKUaCNoHSiWGAAAAAAAAAAAACBBAAAgQQAAIEEAACBBAAAgQQAAIEGUaBVLBoWUaCB0lFKUaChoHSiWBgAAAAAAAAABAQEBAQGUaCxLBoWUaCB0lFKUaDJoHSiWBgAAAAAAAAABAQEBAQGUaCxLBoWUaCB0lFKUaDdOdWJ1aBhOaBBOaDdOdWIu", "spaces": "OrderedDict([('achieved_goal', Box([-10. -10. -10.], [10. 10. 10.], (3,), float32)), ('desired_goal', Box([-10. -10. -10.], [10. 10. 10.], (3,), float32)), ('observation', Box([-10. -10. -10. -10. -10. -10.], [10. 10. 10. 10. 10. 10.], (6,), float32))])", "_shape": null, "dtype": null, "_np_random": null}, "action_space": {":type:": "<class 'gym.spaces.box.Box'>", ":serialized:": "gAWVbQEAAAAAAACMDmd5bS5zcGFjZXMuYm94lIwDQm94lJOUKYGUfZQojAVkdHlwZZSMBW51bXB5lGgFk5SMAmY0lImIh5RSlChLA4wBPJROTk5K/////0r/////SwB0lGKMBl9zaGFwZZRLA4WUjANsb3eUjBJudW1weS5jb3JlLm51bWVyaWOUjAtfZnJvbWJ1ZmZlcpSTlCiWDAAAAAAAAAAAAIC/AACAvwAAgL+UaApLA4WUjAFDlHSUUpSMBGhpZ2iUaBIolgwAAAAAAAAAAACAPwAAgD8AAIA/lGgKSwOFlGgVdJRSlIwNYm91bmRlZF9iZWxvd5RoEiiWAwAAAAAAAAABAQGUaAeMAmIxlImIh5RSlChLA4wBfJROTk5K/////0r/////SwB0lGJLA4WUaBV0lFKUjA1ib3VuZGVkX2Fib3ZllGgSKJYDAAAAAAAAAAEBAZRoIUsDhZRoFXSUUpSMCl9ucF9yYW5kb22UTnViLg==", "dtype": "float32", "_shape": [3], "low": "[-1. -1. -1.]", "high": "[1. 1. 1.]", "bounded_below": "[ True True True]", "bounded_above": "[ True True True]", "_np_random": null}, "n_envs": 4, "num_timesteps": 1001472, "_total_timesteps": 1000000, "_num_timesteps_at_start": 0, "seed": null, "action_noise": null, "start_time": 1680377738771037922, "learning_rate": 0.0014735441345589378, "tensorboard_log": null, "lr_schedule": {":type:": "<class 'function'>", ":serialized:": "gAWVAQMAAAAAAACMF2Nsb3VkcGlja2xlLmNsb3VkcGlja2xllIwOX21ha2VfZnVuY3Rpb26Uk5QoaACMDV9idWlsdGluX3R5cGWUk5SMCENvZGVUeXBllIWUUpQoSwFLAEsASwFLAUsTQwSIAFMAlE6FlCmMAV+UhZSMZy9ob21lL3UvbWluaWNvbmRhMy9lbnZzL2h1Z2dpbmdmYWNlLXVuaXQ2L2xpYi9weXRob24zLjkvc2l0ZS1wYWNrYWdlcy9zdGFibGVfYmFzZWxpbmVzMy9jb21tb24vdXRpbHMucHmUjARmdW5jlEuCQwIAAZSMA3ZhbJSFlCl0lFKUfZQojAtfX3BhY2thZ2VfX5SMGHN0YWJsZV9iYXNlbGluZXMzLmNvbW1vbpSMCF9fbmFtZV9flIwec3RhYmxlX2Jhc2VsaW5lczMuY29tbW9uLnV0aWxzlIwIX19maWxlX1+UjGcvaG9tZS91L21pbmljb25kYTMvZW52cy9odWdnaW5nZmFjZS11bml0Ni9saWIvcHl0aG9uMy45L3NpdGUtcGFja2FnZXMvc3RhYmxlX2Jhc2VsaW5lczMvY29tbW9uL3V0aWxzLnB5lHVOTmgAjBBfbWFrZV9lbXB0eV9jZWxslJOUKVKUhZR0lFKUjBxjbG91ZHBpY2tsZS5jbG91ZHBpY2tsZV9mYXN0lIwSX2Z1bmN0aW9uX3NldHN0YXRllJOUaB99lH2UKGgWaA2MDF9fcXVhbG5hbWVfX5SMGWNvbnN0YW50X2ZuLjxsb2NhbHM+LmZ1bmOUjA9fX2Fubm90YXRpb25zX1+UfZSMDl9fa3dkZWZhdWx0c19flE6MDF9fZGVmYXVsdHNfX5ROjApfX21vZHVsZV9flGgXjAdfX2RvY19flE6MC19fY2xvc3VyZV9flGgAjApfbWFrZV9jZWxslJOURz9YJH33f0ZzhZRSlIWUjBdfY2xvdWRwaWNrbGVfc3VibW9kdWxlc5RdlIwLX19nbG9iYWxzX1+UfZR1hpSGUjAu"}, "_last_obs": {":type:": "<class 'collections.OrderedDict'>", ":serialized:": "gAWVuwEAAAAAAACMC2NvbGxlY3Rpb25zlIwLT3JkZXJlZERpY3SUk5QpUpQojA1hY2hpZXZlZF9nb2FslIwSbnVtcHkuY29yZS5udW1lcmljlIwLX2Zyb21idWZmZXKUk5QoljAAAAAAAAAA7/yPP5jVfb9HWig/HxRmP634zr9Hv2W//rTXP+kC3T767KW/doHHP+sxZb58/cw/lIwFbnVtcHmUjAVkdHlwZZSTlIwCZjSUiYiHlFKUKEsDjAE8lE5OTkr/////Sv////9LAHSUYksESwOGlIwBQ5R0lFKUjAxkZXNpcmVkX2dvYWyUaAcoljAAAAAAAAAABuaWP78aYb+JyR4/fpuFP5vvub9NOpy/s4LDP4o9tD5tDcK/2ciuP5+jsb5Ab9Y/lGgOSwRLA4aUaBJ0lFKUjAtvYnNlcnZhdGlvbpRoByiWYAAAAAAAAADv/I8/mNV9v0daKD8tfjq/ciuFvoj0w78fFGY/rfjOv0e/Zb8i8YC+zl1RPdQLE7/+tNc/6QLdPvrspb88gdg+R+c9PxUpez92gcc/6zFlvnz9zD8sj++8dqc0vxgeHz+UaA5LBEsGhpRoEnSUUpR1Lg==", "achieved_goal": "[[ 1.1249064 -0.99154043 0.6576275 ]\n [ 0.8987445 -1.616964 -0.8974499 ]\n [ 1.685211 0.43166283 -1.2962945 ]\n [ 1.5586383 -0.22382323 1.6014857 ]]", "desired_goal": "[[ 1.1788948 -0.87931436 0.6202627 ]\n [ 1.0438077 -1.4526247 -1.2205292 ]\n [ 1.5274261 0.352032 -1.5160347 ]\n [ 1.3655044 -0.34695145 1.6752701 ]]", "observation": "[[ 1.1249064 -0.99154043 0.6576275 -0.7284878 -0.2600971 -1.5309 ]\n [ 0.8987445 -1.616964 -0.8974499 -0.2518397 0.05111485 -0.57439923]\n [ 1.685211 0.43166283 -1.2962945 0.42286098 0.74181026 0.9810956 ]\n [ 1.5586383 -0.22382323 1.6014857 -0.02924307 -0.70568025 0.62155294]]"}, "_last_episode_starts": {":type:": "<class 'numpy.ndarray'>", ":serialized:": "gAWVdwAAAAAAAACMEm51bXB5LmNvcmUubnVtZXJpY5SMC19mcm9tYnVmZmVylJOUKJYEAAAAAAAAAAAAAACUjAVudW1weZSMBWR0eXBllJOUjAJiMZSJiIeUUpQoSwOMAXyUTk5OSv////9K/////0sAdJRiSwSFlIwBQ5R0lFKULg=="}, "_last_original_obs": {":type:": "<class 'collections.OrderedDict'>", ":serialized:": "gAWVuwEAAAAAAACMC2NvbGxlY3Rpb25zlIwLT3JkZXJlZERpY3SUk5QpUpQojA1hY2hpZXZlZF9nb2FslIwSbnVtcHkuY29yZS5udW1lcmljlIwLX2Zyb21idWZmZXKUk5QoljAAAAAAAAAA6nIdPRlsGqxDI0o+6nIdPRlsGqxDI0o+6nIdPRlsGqxDI0o+6nIdPRlsGqxDI0o+lIwFbnVtcHmUjAVkdHlwZZSTlIwCZjSUiYiHlFKUKEsDjAE8lE5OTkr/////Sv////9LAHSUYksESwOGlIwBQ5R0lFKUjAxkZXNpcmVkX2dvYWyUaAcoljAAAAAAAAAAbiURPmePFb7Mst87sEALvj8BCr1jG8U8yXLQPZkLgb1fexI9bBv/PUu2E777TxE+lGgOSwRLA4aUaBJ0lFKUjAtvYnNlcnZhdGlvbpRoByiWYAAAAAAAAADqch09GWwarEMjSj4AAAAAAAAAgAAAAADqch09GWwarEMjSj4AAAAAAAAAgAAAAADqch09GWwarEMjSj4AAAAAAAAAgAAAAADqch09GWwarEMjSj4AAAAAAAAAgAAAAACUaA5LBEsGhpRoEnSUUpR1Lg==", "achieved_goal": "[[ 3.8439669e-02 -2.1944723e-12 1.9740014e-01]\n [ 3.8439669e-02 -2.1944723e-12 1.9740014e-01]\n [ 3.8439669e-02 -2.1944723e-12 1.9740014e-01]\n [ 3.8439669e-02 -2.1944723e-12 1.9740014e-01]]", "desired_goal": "[[ 0.14174435 -0.14605485 0.00682673]\n [-0.13598895 -0.03369259 0.02406091]\n [ 0.10178144 -0.0630104 0.03576219]\n [ 0.12456402 -0.14425008 0.14190666]]", "observation": "[[ 3.8439669e-02 -2.1944723e-12 1.9740014e-01 0.0000000e+00\n -0.0000000e+00 0.0000000e+00]\n [ 3.8439669e-02 -2.1944723e-12 1.9740014e-01 0.0000000e+00\n -0.0000000e+00 0.0000000e+00]\n [ 3.8439669e-02 -2.1944723e-12 1.9740014e-01 0.0000000e+00\n -0.0000000e+00 0.0000000e+00]\n [ 3.8439669e-02 -2.1944723e-12 1.9740014e-01 0.0000000e+00\n -0.0000000e+00 0.0000000e+00]]"}, "_episode_num": 0, "use_sde": false, "sde_sample_freq": -1, "_current_progress_remaining": -0.0014719999999999178, "ep_info_buffer": {":type:": "<class 'collections.deque'>", ":serialized:": "gAWVHRAAAAAAAACMC2NvbGxlY3Rpb25zlIwFZGVxdWWUk5QpS2SGlFKUKH2UKIwBcpSMFW51bXB5LmNvcmUubXVsdGlhcnJheZSMBnNjYWxhcpSTlIwFbnVtcHmUjAVkdHlwZZSTlIwCZjiUiYiHlFKUKEsDjAE8lE5OTkr/////Sv////9LAHSUYkMI6+V3msw48b+UhpRSlIwBbJRLMowBdJRHQJcZN2St/4J1fZQoaAZoCWgPQwi8z/HR4oz4v5SGlFKUaBVLMmgWR0CXGOj7ALy+dX2UKGgGaAloD0MIOIO/X8wW+7+UhpRSlGgVSzJoFkdAlxipnlGPP3V9lChoBmgJaA9DCPUTzm4tk/i/lIaUUpRoFUsyaBZHQJcYUOby6MB1fZQoaAZoCWgPQwilhGBVvTz+v5SGlFKUaBVLMmgWR0CXGmajN6gNdX2UKGgGaAloD0MI/dmPFJGh9r+UhpRSlGgVSzJoFkdAlxoYXbdrPHV9lChoBmgJaA9DCO4E+69zk/2/lIaUUpRoFUsyaBZHQJcZ2TA31jB1fZQoaAZoCWgPQwhjmuleJzX4v5SGlFKUaBVLMmgWR0CXGYBC2MKkdX2UKGgGaAloD0MIlE4kmGom+r+UhpRSlGgVSzJoFkdAlxuTLwF1S3V9lChoBmgJaA9DCM3lBkMdFvi/lIaUUpRoFUsyaBZHQJcbRMdtEXt1fZQoaAZoCWgPQwiKWS+GciL+v5SGlFKUaBVLMmgWR0CXGwVhCtzTdX2UKGgGaAloD0MIPSr+74iK9b+UhpRSlGgVSzJoFkdAlxqschkiEHV9lChoBmgJaA9DCPgW1o13h/W/lIaUUpRoFUsyaBZHQJccueDnNgV1fZQoaAZoCWgPQwib5h2n6Ej1v5SGlFKUaBVLMmgWR0CXHGvaURnOdX2UKGgGaAloD0MIrdwLzArF+7+UhpRSlGgVSzJoFkdAlxwsl5WzW3V9lChoBmgJaA9DCNP6WwLwz/S/lIaUUpRoFUsyaBZHQJcb1BY3eep1fZQoaAZoCWgPQwhdxHdi1sv3v5SGlFKUaBVLMmgWR0CXHfVh1DBudX2UKGgGaAloD0MInZyhuOPN8r+UhpRSlGgVSzJoFkdAlx2m9+PRzHV9lChoBmgJaA9DCMnH7gIlRfq/lIaUUpRoFUsyaBZHQJcdZ6u4gA91fZQoaAZoCWgPQwimXrcIjLX7v5SGlFKUaBVLMmgWR0CXHQ619fCzdX2UKGgGaAloD0MIhq+vdamR+L+UhpRSlGgVSzJoFkdAlx8fIS13MnV9lChoBmgJaA9DCGkbf6KyYfq/lIaUUpRoFUsyaBZHQJce0LXtjTd1fZQoaAZoCWgPQwivzcZKzLP4v5SGlFKUaBVLMmgWR0CXHpFh5PdmdX2UKGgGaAloD0MIgbIpV3gX8r+UhpRSlGgVSzJoFkdAlx44ePq9oXV9lChoBmgJaA9DCJtattYXyfe/lIaUUpRoFUsyaBZHQJcgM1uR9w51fZQoaAZoCWgPQwg6rkZ2peX2v5SGlFKUaBVLMmgWR0CXH+T8YQ8PdX2UKGgGaAloD0MIJSL8i6Cx8r+UhpRSlGgVSzJoFkdAlx+lmOEM9nV9lChoBmgJaA9DCFvtYS8UcPq/lIaUUpRoFUsyaBZHQJcfTJ9y9251fZQoaAZoCWgPQwjylxb1Sa71v5SGlFKUaBVLMmgWR0CXIUT3qRlpdX2UKGgGaAloD0MIdO0L6IX7/r+UhpRSlGgVSzJoFkdAlyD2mP5pJ3V9lChoBmgJaA9DCEuuYvGbwva/lIaUUpRoFUsyaBZHQJcgt0ZFXq91fZQoaAZoCWgPQwg/rDdqhSn4v5SGlFKUaBVLMmgWR0CXIF5jpcHGdX2UKGgGaAloD0MI6ui4GtkV+L+UhpRSlGgVSzJoFkdAlyJpl8PWhHV9lChoBmgJaA9DCOOkMO9xpva/lIaUUpRoFUsyaBZHQJciG09hZyN1fZQoaAZoCWgPQwiMvKyJBf71v5SGlFKUaBVLMmgWR0CXIdv6j323dX2UKGgGaAloD0MI9WbUfJU8+b+UhpRSlGgVSzJoFkdAlyGDAaef7XV9lChoBmgJaA9DCBmveVVn9fe/lIaUUpRoFUsyaBZHQJcjlJI1+Ap1fZQoaAZoCWgPQwi0Hr5MFOH4v5SGlFKUaBVLMmgWR0CXI0YnOSntdX2UKGgGaAloD0MIrOC3IcZr+b+UhpRSlGgVSzJoFkdAlyMG1IAfdXV9lChoBmgJaA9DCL4uw3+6gfW/lIaUUpRoFUsyaBZHQJcireVLSNR1fZQoaAZoCWgPQwhqZ5jaUof1v5SGlFKUaBVLMmgWR0CXJL60pmVadX2UKGgGaAloD0MIn69ZLhsd+L+UhpRSlGgVSzJoFkdAlyRwX2ugYnV9lChoBmgJaA9DCMBfzJasiva/lIaUUpRoFUsyaBZHQJckMPpY9xJ1fZQoaAZoCWgPQwgtsp3vp8byv5SGlFKUaBVLMmgWR0CXI9gHu7YkdX2UKGgGaAloD0MIlC9oIQGj87+UhpRSlGgVSzJoFkdAlyXnIU8FIXV9lChoBmgJaA9DCNMSK6ORD/u/lIaUUpRoFUsyaBZHQJclmMXJo011fZQoaAZoCWgPQwgIc7uX+6T6v5SGlFKUaBVLMmgWR0CXJVlcyFfzdX2UKGgGaAloD0MIHNKowMn2+r+UhpRSlGgVSzJoFkdAlyUAaef7JnV9lChoBmgJaA9DCOmbNA2KZvu/lIaUUpRoFUsyaBZHQJcnFDPWxyJ1fZQoaAZoCWgPQwg7iQj/Iij3v5SGlFKUaBVLMmgWR0CXJsXKbKA8dX2UKGgGaAloD0MIMPKyJhb49r+UhpRSlGgVSzJoFkdAlyaGcnVoYnV9lChoBmgJaA9DCDRnfcoxmfq/lIaUUpRoFUsyaBZHQJcmLa24NI91fZQoaAZoCWgPQwgyPPazWIr4v5SGlFKUaBVLMmgWR0CXKDmAskIHdX2UKGgGaAloD0MIHaopyTrc+b+UhpRSlGgVSzJoFkdAlyfrGvOhTXV9lChoBmgJaA9DCN/7G7RX3/m/lIaUUpRoFUsyaBZHQJcnrB3zMA51fZQoaAZoCWgPQwi/tn76zxr5v5SGlFKUaBVLMmgWR0CXJ1McIZ62dX2UKGgGaAloD0MIQiJt40+U+7+UhpRSlGgVSzJoFkdAlylk1Muez3V9lChoBmgJaA9DCO6yX3e6s/m/lIaUUpRoFUsyaBZHQJcpFqfvnbJ1fZQoaAZoCWgPQwhZvi7Df3r4v5SGlFKUaBVLMmgWR0CXKNd7OVxCdX2UKGgGaAloD0MIkpVfBmOE+7+UhpRSlGgVSzJoFkdAlyh+zhP0qnV9lChoBmgJaA9DCMKFPIIbafi/lIaUUpRoFUsyaBZHQJcqm4Wk8A91fZQoaAZoCWgPQwijztxDwnf2v5SGlFKUaBVLMmgWR0CXKk0j1PFedX2UKGgGaAloD0MI9utOd544/7+UhpRSlGgVSzJoFkdAlyoOFQEZBXV9lChoBmgJaA9DCKD7cma7Qv2/lIaUUpRoFUsyaBZHQJcptXtBv751fZQoaAZoCWgPQwgaGeQuwtT8v5SGlFKUaBVLMmgWR0CXK8cYIjW1dX2UKGgGaAloD0MIQuvhy0QR+r+UhpRSlGgVSzJoFkdAlyt4sd1dPnV9lChoBmgJaA9DCN3T1R2LLfe/lIaUUpRoFUsyaBZHQJcrOU5dWyV1fZQoaAZoCWgPQwjOM/YlG8/1v5SGlFKUaBVLMmgWR0CXKuBN21UmdX2UKGgGaAloD0MIKUF/oUcM9r+UhpRSlGgVSzJoFkdAlyzx0lqrR3V9lChoBmgJaA9DCIV4JF6eTve/lIaUUpRoFUsyaBZHQJcso2vStvJ1fZQoaAZoCWgPQwgvaYzWUZX1v5SGlFKUaBVLMmgWR0CXLGQJokAxdX2UKGgGaAloD0MIqiwKuyh6+r+UhpRSlGgVSzJoFkdAlywLJOnEVHV9lChoBmgJaA9DCIMvTKYKhvi/lIaUUpRoFUsyaBZHQJcuHnNgSe11fZQoaAZoCWgPQwjWx0Pf3cr6v5SGlFKUaBVLMmgWR0CXLdALRa5gdX2UKGgGaAloD0MI6GZ/oNy29L+UhpRSlGgVSzJoFkdAly2QrUb1iHV9lChoBmgJaA9DCEW8df7tcvi/lIaUUpRoFUsyaBZHQJctN72L5yl1fZQoaAZoCWgPQwjItgw4S8n6v5SGlFKUaBVLMmgWR0CXL0gGr0aqdX2UKGgGaAloD0MIV0J3SZyV9L+UhpRSlGgVSzJoFkdAly75nctXgnV9lChoBmgJaA9DCB+7C5QUmPq/lIaUUpRoFUsyaBZHQJcuujqOcUd1fZQoaAZoCWgPQwjFAIkmUET0v5SGlFKUaBVLMmgWR0CXLmFId2gWdX2UKGgGaAloD0MILzTXaaRl9r+UhpRSlGgVSzJoFkdAlzBzT4L1EnV9lChoBmgJaA9DCJvkR/yKNfa/lIaUUpRoFUsyaBZHQJcwJRJmNBF1fZQoaAZoCWgPQwjWOnE5XsHyv5SGlFKUaBVLMmgWR0CXL+XZXdTHdX2UKGgGaAloD0MIKgDGM2jo+L+UhpRSlGgVSzJoFkdAly+M6vJRwnV9lChoBmgJaA9DCBk5C3va4fe/lIaUUpRoFUsyaBZHQJcxndLxqfx1fZQoaAZoCWgPQwj11VWBWsz4v5SGlFKUaBVLMmgWR0CXMU9vjwQUdX2UKGgGaAloD0MI5dL4hVcS+7+UhpRSlGgVSzJoFkdAlzEQOavzOHV9lChoBmgJaA9DCCOfVzz1SPi/lIaUUpRoFUsyaBZHQJcwtzvJA+p1fZQoaAZoCWgPQwjrNqj91o76v5SGlFKUaBVLMmgWR0CXMsrTpgTidX2UKGgGaAloD0MIfZI7bCIz+r+UhpRSlGgVSzJoFkdAlzJ8bFS88XV9lChoBmgJaA9DCDzbozfcB/e/lIaUUpRoFUsyaBZHQJcyPTTfBN51fZQoaAZoCWgPQwiWsgxxrAv6v5SGlFKUaBVLMmgWR0CXMeSaEzwddX2UKGgGaAloD0MIYRkbutkf+L+UhpRSlGgVSzJoFkdAlzP3r+o993V9lChoBmgJaA9DCKfNOA1RRfu/lIaUUpRoFUsyaBZHQJczqUJOWSl1fZQoaAZoCWgPQwj27SQi/Ev2v5SGlFKUaBVLMmgWR0CXM2nl4keIdX2UKGgGaAloD0MII9v5fmq89L+UhpRSlGgVSzJoFkdAlzMQ9FF2FHV9lChoBmgJaA9DCF+y8WCL3fe/lIaUUpRoFUsyaBZHQJc1JvtMPBl1fZQoaAZoCWgPQwgwL8A+OnX2v5SGlFKUaBVLMmgWR0CXNNiTMaCMdX2UKGgGaAloD0MIoOHNGrzv+b+UhpRSlGgVSzJoFkdAlzSZON5t33V9lChoBmgJaA9DCEt1AS8zbPe/lIaUUpRoFUsyaBZHQJc0QD0UXYV1ZS4="}, "ep_success_buffer": {":type:": "<class 'collections.deque'>", ":serialized:": "gAWVIAAAAAAAAACMC2NvbGxlY3Rpb25zlIwFZGVxdWWUk5QpS2SGlFKULg=="}, "_n_updates": 489, "n_steps": 512, "gamma": 0.9546251877513446, "gae_lambda": 1.0, "ent_coef": 0.00012083804240540896, "vf_coef": 0.5, "max_grad_norm": 0.5, "normalize_advantage": false, "system_info": {"OS": "Linux-5.15.90.1-microsoft-standard-WSL2-x86_64-with-glibc2.35 # 1 SMP Fri Jan 27 02:56:13 UTC 2023", "Python": "3.9.16", "Stable-Baselines3": "1.7.0", "PyTorch": "2.0.0+cu117", "GPU Enabled": "True", "Numpy": "1.24.2", "Gym": "0.21.0"}}
|
replay.mp4
CHANGED
|
Binary files a/replay.mp4 and b/replay.mp4 differ
|
|
|
results.json
CHANGED
|
@@ -1 +1 @@
|
|
| 1 |
-
{"mean_reward": -1.
|
|
|
|
| 1 |
+
{"mean_reward": -1.3912288814783096, "std_reward": 0.2311080100563121, "is_deterministic": true, "n_eval_episodes": 10, "eval_datetime": "2023-04-02T06:09:35.884482"}
|
vec_normalize.pkl
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 3056
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:7c516a5d23b7e6246b45fb4515c5f783afab6d41970c317a7e14555d336e4906
|
| 3 |
size 3056
|