commit with 1 000 000 iterations, but without discount (gamma 1) from unit1 notebook from local jupyterhub
Browse files- README.md +1 -1
- config.json +1 -1
- ppo-LunarLander-g1.zip +2 -2
- ppo-LunarLander-g1/data +4 -4
- ppo-LunarLander-g1/policy.optimizer.pth +1 -1
- ppo-LunarLander-g1/policy.pth +1 -1
- replay.mp4 +0 -0
- results.json +1 -1
README.md
CHANGED
|
@@ -16,7 +16,7 @@ model-index:
|
|
| 16 |
type: LunarLander-v2
|
| 17 |
metrics:
|
| 18 |
- type: mean_reward
|
| 19 |
-
value:
|
| 20 |
name: mean_reward
|
| 21 |
verified: false
|
| 22 |
---
|
|
|
|
| 16 |
type: LunarLander-v2
|
| 17 |
metrics:
|
| 18 |
- type: mean_reward
|
| 19 |
+
value: 284.65 +/- 12.11
|
| 20 |
name: mean_reward
|
| 21 |
verified: false
|
| 22 |
---
|
config.json
CHANGED
|
@@ -1 +1 @@
|
|
| 1 |
-
{"policy_class": {":type:": "<class 'abc.ABCMeta'>", ":serialized:": "gAWVOwAAAAAAAACMIXN0YWJsZV9iYXNlbGluZXMzLmNvbW1vbi5wb2xpY2llc5SMEUFjdG9yQ3JpdGljUG9saWN5lJOULg==", "__module__": "stable_baselines3.common.policies", "__doc__": "\n Policy class for actor-critic algorithms (has both policy and value prediction).\n Used by A2C, PPO and the likes.\n\n :param observation_space: Observation space\n :param action_space: Action space\n :param lr_schedule: Learning rate schedule (could be constant)\n :param net_arch: The specification of the policy and value networks.\n :param activation_fn: Activation function\n :param ortho_init: Whether to use or not orthogonal initialization\n :param use_sde: Whether to use State Dependent Exploration or not\n :param log_std_init: Initial value for the log standard deviation\n :param full_std: Whether to use (n_features x n_actions) parameters\n for the std instead of only (n_features,) when using gSDE\n :param use_expln: Use ``expln()`` function instead of ``exp()`` to ensure\n a positive standard deviation (cf paper). It allows to keep variance\n above zero and prevent it from growing too fast. In practice, ``exp()`` is usually enough.\n :param squash_output: Whether to squash the output using a tanh function,\n this allows to ensure boundaries when using gSDE.\n :param features_extractor_class: Features extractor to use.\n :param features_extractor_kwargs: Keyword arguments\n to pass to the features extractor.\n :param share_features_extractor: If True, the features extractor is shared between the policy and value networks.\n :param normalize_images: Whether to normalize images or not,\n dividing by 255.0 (True by default)\n :param optimizer_class: The optimizer to use,\n ``th.optim.Adam`` by default\n :param optimizer_kwargs: Additional keyword arguments,\n excluding the learning rate, to pass to the optimizer\n ", "__init__": "<function ActorCriticPolicy.__init__ at 0x7fcef6216d30>", "_get_constructor_parameters": "<function ActorCriticPolicy._get_constructor_parameters at 0x7fcef6216dc0>", "reset_noise": "<function ActorCriticPolicy.reset_noise at 0x7fcef6216e50>", "_build_mlp_extractor": "<function ActorCriticPolicy._build_mlp_extractor at 0x7fcef6216ee0>", "_build": "<function ActorCriticPolicy._build at 0x7fcef6216f70>", "forward": "<function ActorCriticPolicy.forward at 0x7fcef621b040>", "extract_features": "<function ActorCriticPolicy.extract_features at 0x7fcef621b0d0>", "_get_action_dist_from_latent": "<function ActorCriticPolicy._get_action_dist_from_latent at 0x7fcef621b160>", "_predict": "<function ActorCriticPolicy._predict at 0x7fcef621b1f0>", "evaluate_actions": "<function ActorCriticPolicy.evaluate_actions at 0x7fcef621b280>", "get_distribution": "<function ActorCriticPolicy.get_distribution at 0x7fcef621b310>", "predict_values": "<function ActorCriticPolicy.predict_values at 0x7fcef621b3a0>", "__abstractmethods__": "frozenset()", "_abc_impl": "<_abc._abc_data object at 0x7fcef62198c0>"}, "verbose": 1, "policy_kwargs": {}, "observation_space": {":type:": "<class 'gym.spaces.box.Box'>", ":serialized:": "gAWVnwEAAAAAAACMDmd5bS5zcGFjZXMuYm94lIwDQm94lJOUKYGUfZQojAVkdHlwZZSMBW51bXB5lGgFk5SMAmY0lImIh5RSlChLA4wBPJROTk5K/////0r/////SwB0lGKMBl9zaGFwZZRLCIWUjANsb3eUjBJudW1weS5jb3JlLm51bWVyaWOUjAtfZnJvbWJ1ZmZlcpSTlCiWIAAAAAAAAAAAAID/AACA/wAAgP8AAID/AACA/wAAgP8AAID/AACA/5RoCksIhZSMAUOUdJRSlIwEaGlnaJRoEiiWIAAAAAAAAAAAAIB/AACAfwAAgH8AAIB/AACAfwAAgH8AAIB/AACAf5RoCksIhZRoFXSUUpSMDWJvdW5kZWRfYmVsb3eUaBIolggAAAAAAAAAAAAAAAAAAACUaAeMAmIxlImIh5RSlChLA4wBfJROTk5K/////0r/////SwB0lGJLCIWUaBV0lFKUjA1ib3VuZGVkX2Fib3ZllGgSKJYIAAAAAAAAAAAAAAAAAAAAlGghSwiFlGgVdJRSlIwKX25wX3JhbmRvbZROdWIu", "dtype": "float32", "_shape": [8], "low": "[-inf -inf -inf -inf -inf -inf -inf -inf]", "high": "[inf inf inf inf inf inf inf inf]", "bounded_below": "[False False False False False False False False]", "bounded_above": "[False False False False False False False False]", "_np_random": null}, "action_space": {":type:": "<class 'gym.spaces.discrete.Discrete'>", ":serialized:": "gAWViAAAAAAAAACME2d5bS5zcGFjZXMuZGlzY3JldGWUjAhEaXNjcmV0ZZSTlCmBlH2UKIwBbpRLBIwGX3NoYXBllCmMBWR0eXBllIwFbnVtcHmUjAVkdHlwZZSTlIwCaTiUiYiHlFKUKEsDjAE8lE5OTkr/////Sv////9LAHSUYowKX25wX3JhbmRvbZROdWIu", "n": 4, "_shape": [], "dtype": "int64", "_np_random": null}, "n_envs": 16, "num_timesteps": 1015808, "_total_timesteps": 1000000, "_num_timesteps_at_start": 0, "seed": null, "action_noise": null, "start_time": 1680080295490888383, "learning_rate": 0.0003, "tensorboard_log": null, "lr_schedule": {":type:": "<class 'function'>", ":serialized:": "gAWV0QIAAAAAAACMF2Nsb3VkcGlja2xlLmNsb3VkcGlja2xllIwOX21ha2VfZnVuY3Rpb26Uk5QoaACMDV9idWlsdGluX3R5cGWUk5SMCENvZGVUeXBllIWUUpQoSwFLAEsASwFLAUsTQwSIAFMAlE6FlCmMAV+UhZSMTy9ob21lL21pa2kvLmxvY2FsL2xpYi9weXRob24zLjkvc2l0ZS1wYWNrYWdlcy9zdGFibGVfYmFzZWxpbmVzMy9jb21tb24vdXRpbHMucHmUjARmdW5jlEuCQwIAAZSMA3ZhbJSFlCl0lFKUfZQojAtfX3BhY2thZ2VfX5SMGHN0YWJsZV9iYXNlbGluZXMzLmNvbW1vbpSMCF9fbmFtZV9flIwec3RhYmxlX2Jhc2VsaW5lczMuY29tbW9uLnV0aWxzlIwIX19maWxlX1+UjE8vaG9tZS9taWtpLy5sb2NhbC9saWIvcHl0aG9uMy45L3NpdGUtcGFja2FnZXMvc3RhYmxlX2Jhc2VsaW5lczMvY29tbW9uL3V0aWxzLnB5lHVOTmgAjBBfbWFrZV9lbXB0eV9jZWxslJOUKVKUhZR0lFKUjBxjbG91ZHBpY2tsZS5jbG91ZHBpY2tsZV9mYXN0lIwSX2Z1bmN0aW9uX3NldHN0YXRllJOUaB99lH2UKGgWaA2MDF9fcXVhbG5hbWVfX5SMGWNvbnN0YW50X2ZuLjxsb2NhbHM+LmZ1bmOUjA9fX2Fubm90YXRpb25zX1+UfZSMDl9fa3dkZWZhdWx0c19flE6MDF9fZGVmYXVsdHNfX5ROjApfX21vZHVsZV9flGgXjAdfX2RvY19flE6MC19fY2xvc3VyZV9flGgAjApfbWFrZV9jZWxslJOURz8zqSowVTJhhZRSlIWUjBdfY2xvdWRwaWNrbGVfc3VibW9kdWxlc5RdlIwLX19nbG9iYWxzX1+UfZR1hpSGUjAu"}, "_last_obs": {":type:": "<class 'numpy.ndarray'>", ":serialized:": "gAWVdQIAAAAAAACMEm51bXB5LmNvcmUubnVtZXJpY5SMC19mcm9tYnVmZmVylJOUKJYAAgAAAAAAAOAyE76ICAE/bjo4PizAAb8/P1y+oI/sPQAAAAAAAAAADRCDPY8KRbos0Ag5Q3CitY38BLumGKK0AACAPwAAgD8ztYM89uBGuixit7Zcycax8t//uv5z3DUAAIA/AACAP5olXD2FEKG7BDqMvDPstjyRXeC8huyZPQAAgD8AAIA/OttyPq+LOD81XYy+I+r2vh+qqD4+ya2+AAAAAAAAAAAAtfw8O1iCvAGshT5LZ5E86sOKPPtZ1D0AAIA/AACAP83gNjwfzYq5xDi0OzLC3zfcnso6s4hjtQAAgD8AAIA/5oZcPRXRsT/z+M0+lDZpvuxffT0tJok+AAAAAAAAAACmsLg9Upi0uaK9hzgt+Mszuz99O21lorcAAIA/AAAAAM0g4DtoM5q83fayPYpbf71hzuI92oENPgAAgD8AAIA/gEbbvir3ZD+rJo2+p6FAv7QAI7/NdOG9AAAAAAAAAACAeM89XMt5uv6lhrszu1M1HhdDu8aHvLQAAAAAAAAAAHPOhT1NGJ8/HqgTPg3qFr9xf2Q+lrR8vAAAAAAAAAAAAI/wPFwbe7q/A6a6vIyotVA/kDq+wcE5AACAPwAAgD8ATG49KeA5um7DiTmaQX40IO1eulZNo7gAAIA/AACAP5pRFjtc4xC6Th2hNYn3CS9/6LC4fj6wtAAAgD8AAIA/lIwFbnVtcHmUjAVkdHlwZZSTlIwCZjSUiYiHlFKUKEsDjAE8lE5OTkr/////Sv////9LAHSUYksQSwiGlIwBQ5R0lFKULg=="}, "_last_episode_starts": {":type:": "<class 'numpy.ndarray'>", ":serialized:": "gAWVgwAAAAAAAACMEm51bXB5LmNvcmUubnVtZXJpY5SMC19mcm9tYnVmZmVylJOUKJYQAAAAAAAAAAAAAAAAAAAAAAAAAAAAAACUjAVudW1weZSMBWR0eXBllJOUjAJiMZSJiIeUUpQoSwOMAXyUTk5OSv////9K/////0sAdJRiSxCFlIwBQ5R0lFKULg=="}, "_last_original_obs": null, "_episode_num": 0, "use_sde": false, "sde_sample_freq": -1, "_current_progress_remaining": -0.015808000000000044, "ep_info_buffer": {":type:": "<class 'collections.deque'>", ":serialized:": "gAWVaBAAAAAAAACMC2NvbGxlY3Rpb25zlIwFZGVxdWWUk5QpS2SGlFKUKH2UKIwBcpSMFW51bXB5LmNvcmUubXVsdGlhcnJheZSMBnNjYWxhcpSTlIwFbnVtcHmUjAVkdHlwZZSTlIwCZjiUiYiHlFKUKEsDjAE8lE5OTkr/////Sv////9LAHSUYkMId76fGm9XckCUhpRSlIwBbJRNCwGMAXSUR0DAzZv4IrvtdX2UKGgGaAloD0MIH/KWq1+sckCUhpRSlGgVTbgBaBZHQMDNpLYoRZl1fZQoaAZoCWgPQwibjZWYZ2FyQJSGlFKUaBVL7WgWR0DAzb/HFPzndX2UKGgGaAloD0MIobskzsrYckCUhpRSlGgVTRoDaBZHQMDN010T1011fZQoaAZoCWgPQwg+JlKazYhQQJSGlFKUaBVLuGgWR0DAzdQmgJ1JdX2UKGgGaAloD0MIg7709ufLY0CUhpRSlGgVTegDaBZHQMDN5pVsDW91fZQoaAZoCWgPQwhJ8lzfh09yQJSGlFKUaBVNdgFoFkdAwM4FIpYs/nV9lChoBmgJaA9DCLtCHyyja3BAlIaUUpRoFU1pAWgWR0DAzgvRsuWbdX2UKGgGaAloD0MI3T8WokOBckCUhpRSlGgVTQwCaBZHQMDOKWXsw+N1fZQoaAZoCWgPQwgxfa8heBdyQJSGlFKUaBVNPwFoFkdAwM5P1XeWOnV9lChoBmgJaA9DCCzzVl1HOXNAlIaUUpRoFU3AAWgWR0DAzmeAf+0gdX2UKGgGaAloD0MIQNtq1tkIckCUhpRSlGgVS+5oFkdAwM50zv7WNHV9lChoBmgJaA9DCOf+6nFfxm5AlIaUUpRoFU05AWgWR0DAzpWPaL4vdX2UKGgGaAloD0MI2PM1y6U+cUCUhpRSlGgVTZoBaBZHQMDOtXTuv2Z1fZQoaAZoCWgPQwiKAKd3cYdnQJSGlFKUaBVN6ANoFkdAwM67rj5sTHV9lChoBmgJaA9DCPLrh9hgLXFAlIaUUpRoFU0sAWgWR0DAzr7NfPX1dX2UKGgGaAloD0MIABqlSz9FcECUhpRSlGgVTRkCaBZHQMDXuwb+98J1fZQoaAZoCWgPQwhUOe0peVlwQJSGlFKUaBVL52gWR0DA18LSE12rdX2UKGgGaAloD0MI7IoZ4a1+cECUhpRSlGgVTWUCaBZHQMDX3SrHU+d1fZQoaAZoCWgPQwjjxFc7ivByQJSGlFKUaBVNTwFoFkdAwNfv8a4tpXV9lChoBmgJaA9DCICBIEDGqnFAlIaUUpRoFU2eAWgWR0DA2A597WupdX2UKGgGaAloD0MIrMd9q7XmckCUhpRSlGgVTU0BaBZHQMDYPSlN1yN1fZQoaAZoCWgPQwhGs7J9yExxQJSGlFKUaBVNKQFoFkdAwNg/opx3mnV9lChoBmgJaA9DCMnk1M6wT25AlIaUUpRoFU0cAWgWR0DA2FsZ75VPdX2UKGgGaAloD0MIZ3+g3LbucUCUhpRSlGgVTVMBaBZHQMDYfdlum791fZQoaAZoCWgPQwiv0XKgB5BxQJSGlFKUaBVL/WgWR0DA2I/oLXtjdX2UKGgGaAloD0MIwhVQqCeOcECUhpRSlGgVTccBaBZHQMDYj/YBeX11fZQoaAZoCWgPQwgEq+rld/5zQJSGlFKUaBVNZAFoFkdAwNiQwbEP2HV9lChoBmgJaA9DCMR6o1YYM3FAlIaUUpRoFU0YAWgWR0DA2JzoIOYqdX2UKGgGaAloD0MIzczMzIwtcUCUhpRSlGgVTcsCaBZHQMDYvhClabF1fZQoaAZoCWgPQwhyUMJMG65zQJSGlFKUaBVNHwFoFkdAwNi/Bl+VknV9lChoBmgJaA9DCFteud6283BAlIaUUpRoFU3pAmgWR0DA2OdQbdaddX2UKGgGaAloD0MI5zbhXtlncUCUhpRSlGgVTUQBaBZHQMDZC2GRFJB1fZQoaAZoCWgPQwhuT5DYbtNnQJSGlFKUaBVN6ANoFkdAwNkzlI3BHnV9lChoBmgJaA9DCHnpJjHI4HBAlIaUUpRoFU1KAWgWR0DA2T//JeVtdX2UKGgGaAloD0MIpaDbS5r1cECUhpRSlGgVS/NoFkdAwNlQX1J173V9lChoBmgJaA9DCDcclgZ+AHFAlIaUUpRoFUv9aBZHQMDZWgXdj5N1fZQoaAZoCWgPQwjXE10XvjFyQJSGlFKUaBVNGAFoFkdAwNlcjvd/KHV9lChoBmgJaA9DCA2qDU7ECmNAlIaUUpRoFU3oA2gWR0DA2WwkRjBmdX2UKGgGaAloD0MICDpa1ZK2cUCUhpRSlGgVS/loFkdAwNmKynDR+nV9lChoBmgJaA9DCEp/L4WHmnBAlIaUUpRoFU1EAWgWR0DA2ZFb9qDcdX2UKGgGaAloD0MIeSKI87C4ckCUhpRSlGgVTV0BaBZHQMDZsqzqrzZ1fZQoaAZoCWgPQwgKZeHrK4RxQJSGlFKUaBVNUQFoFkdAwNnPDv3JxXV9lChoBmgJaA9DCOrOE8/Zg2NAlIaUUpRoFU3oA2gWR0DA2dqKLsKLdX2UKGgGaAloD0MICoZzDXONcECUhpRSlGgVS89oFkdAwNnbfb9IgHV9lChoBmgJaA9DCNQnucOmQ3FAlIaUUpRoFU1nAmgWR0DA2dtsenyedX2UKGgGaAloD0MIeedQhqqkN0CUhpRSlGgVS6toFkdAwNnvd30PH3V9lChoBmgJaA9DCPrRcMrch21AlIaUUpRoFU0+AWgWR0DA2gi0v4/NdX2UKGgGaAloD0MIUU1J1uH1cUCUhpRSlGgVTYYBaBZHQMDaHarFOwh1fZQoaAZoCWgPQwgnvW987UBwQJSGlFKUaBVL7WgWR0DA2kXJxNqQdX2UKGgGaAloD0MIZhah2Ao2VUCUhpRSlGgVS5VoFkdAwNpJpudf9nV9lChoBmgJaA9DCOKsiJoovHBAlIaUUpRoFUvGaBZHQMDacAc1fmd1fZQoaAZoCWgPQwio4PCCCF5vQJSGlFKUaBVNhAFoFkdAwNqKn752yXV9lChoBmgJaA9DCO87hsf+8XJAlIaUUpRoFUvaaBZHQMDaufVAiV11fZQoaAZoCWgPQwjvy5ntysVyQJSGlFKUaBVN7gFoFkdAwNrLM+NcW3V9lChoBmgJaA9DCElIpG08T3BAlIaUUpRoFUvRaBZHQMDbANMfzSV1fZQoaAZoCWgPQwh9CRUc3ulvQJSGlFKUaBVNhwFoFkdAwNsSW3z+WHV9lChoBmgJaA9DCOfkRSag2HFAlIaUUpRoFU3fAWgWR0DA2xNYW+GodX2UKGgGaAloD0MI28AdqFOuckCUhpRSlGgVTYUBaBZHQMDbHaHCXQd1fZQoaAZoCWgPQwjEPgEU4zRzQJSGlFKUaBVNAAFoFkdAwNtSs/6frnV9lChoBmgJaA9DCJlKP+HszGRAlIaUUpRoFU3oA2gWR0DA22oQHzH0dX2UKGgGaAloD0MIMnGrIIYackCUhpRSlGgVTYUBaBZHQMDbawr1/Uh1fZQoaAZoCWgPQwgUCaaa2RZzQJSGlFKUaBVNjQJoFkdAwNtxpDeCTXV9lChoBmgJaA9DCFx0stR66nJAlIaUUpRoFUvSaBZHQMDbgJxeb/h1fZQoaAZoCWgPQwgQI4RHG+NjQJSGlFKUaBVN6ANoFkdAwNuD+WGATnV9lChoBmgJaA9DCHDSNCganHJAlIaUUpRoFU0UAmgWR0DA26LEWIoFdX2UKGgGaAloD0MIvFtZonMGckCUhpRSlGgVTWYCaBZHQMDbpE5p8F91fZQoaAZoCWgPQwgxCoLHN6ZuQJSGlFKUaBVN+QJoFkdAwNux+lTFVHV9lChoBmgJaA9DCAg8MIAwsnJAlIaUUpRoFU19AWgWR0DA278Jx//edX2UKGgGaAloD0MIHCWvzrGOckCUhpRSlGgVTR0BaBZHQMDb4GuDBdl1fZQoaAZoCWgPQwgsnKT5I/lxQJSGlFKUaBVNlAFoFkdAwNvv5sTFl3V9lChoBmgJaA9DCJvkR/wKBXJAlIaUUpRoFUvkaBZHQMDb/rTYukF1fZQoaAZoCWgPQwjUX6+wIIBxQJSGlFKUaBVNWwJoFkdAwNwaxrSE13V9lChoBmgJaA9DCMed0sF6lXJAlIaUUpRoFU19AWgWR0DA3CKZF5OadX2UKGgGaAloD0MIC/FIvHw1c0CUhpRSlGgVTRkBaBZHQMDcJl9KEnN1fZQoaAZoCWgPQwjT+fAsQdttQJSGlFKUaBVNIQFoFkdAwNxGoLG7z3V9lChoBmgJaA9DCNXsgVagunFAlIaUUpRoFUvWaBZHQMDcVIkJKJ51fZQoaAZoCWgPQwhjfJi9bBlzQJSGlFKUaBVNwwFoFkdAwNxhiDujRHV9lChoBmgJaA9DCOoFn+YkN3JAlIaUUpRoFU0YAWgWR0DA3GSYw7DEdX2UKGgGaAloD0MIUDdQ4J3TcECUhpRSlGgVTQsBaBZHQMDca2gezUt1fZQoaAZoCWgPQwhDO6dZIBBwQJSGlFKUaBVN+QFoFkdAwNxx+CsfaHV9lChoBmgJaA9DCPyohv3ehHJAlIaUUpRoFUvPaBZHQMDcddORDCx1fZQoaAZoCWgPQwhdiUD1D49yQJSGlFKUaBVNQQFoFkdAwNx+xxDLKXV9lChoBmgJaA9DCCyC/63koHNAlIaUUpRoFUvIaBZHQMDcgG6oVEd1fZQoaAZoCWgPQwi5cYv5+dVwQJSGlFKUaBVNhAFoFkdAwNyHtIkJKXV9lChoBmgJaA9DCHjy6bHtKHBAlIaUUpRoFU3kAWgWR0DA3JvMt9QXdX2UKGgGaAloD0MIUDqRYCrZcECUhpRSlGgVS8toFkdAwNzGYdhiLHV9lChoBmgJaA9DCP1pozod/nFAlIaUUpRoFU0aAWgWR0DA3Nz8YQ8PdX2UKGgGaAloD0MI1LfM6TK/c0CUhpRSlGgVS/poFkdAwNz3lDneSHV9lChoBmgJaA9DCB3MJsAwnG5AlIaUUpRoFUvGaBZHQMDdAM6ij+J1fZQoaAZoCWgPQwiiuONNfrZuQJSGlFKUaBVL42gWR0DA3RWnuRcNdX2UKGgGaAloD0MIz6Chf8INcUCUhpRSlGgVTYQBaBZHQMDdKjp9qlB1fZQoaAZoCWgPQwgjE/BrJLlxQJSGlFKUaBVNHgFoFkdAwN0uBYFJQXV9lChoBmgJaA9DCB9I3jmUz3FAlIaUUpRoFU2AAWgWR0DA3TJdOZb7dX2UKGgGaAloD0MIY7Mj1Xekb0CUhpRSlGgVTdsBaBZHQMDdS4QJ5Vx1fZQoaAZoCWgPQwh32ERmrkdwQJSGlFKUaBVNeQFoFkdAwN10wY+B6XV9lChoBmgJaA9DCKuuQzVleHJAlIaUUpRoFU1ZAWgWR0DA3XeHLzPKdX2UKGgGaAloD0MI1eqrq4JXbkCUhpRSlGgVTZkBaBZHQMDdfeXJHRV1fZQoaAZoCWgPQwj1Lt6PG4hwQJSGlFKUaBVL8mgWR0DA3ZCG+K0ldX2UKGgGaAloD0MIaOif4GIVckCUhpRSlGgVTXMBaBZHQMDdo4e9zwN1ZS4="}, "ep_success_buffer": {":type:": "<class 'collections.deque'>", ":serialized:": "gAWVIAAAAAAAAACMC2NvbGxlY3Rpb25zlIwFZGVxdWWUk5QpS2SGlFKULg=="}, "_n_updates": 1240, "n_steps": 2048, "gamma": 1, "gae_lambda": 0.98, "ent_coef": 0.01, "vf_coef": 0.5, "max_grad_norm": 0.5, "batch_size": 64, "n_epochs": 8, "clip_range": {":type:": "<class 'function'>", ":serialized:": "gAWV0QIAAAAAAACMF2Nsb3VkcGlja2xlLmNsb3VkcGlja2xllIwOX21ha2VfZnVuY3Rpb26Uk5QoaACMDV9idWlsdGluX3R5cGWUk5SMCENvZGVUeXBllIWUUpQoSwFLAEsASwFLAUsTQwSIAFMAlE6FlCmMAV+UhZSMTy9ob21lL21pa2kvLmxvY2FsL2xpYi9weXRob24zLjkvc2l0ZS1wYWNrYWdlcy9zdGFibGVfYmFzZWxpbmVzMy9jb21tb24vdXRpbHMucHmUjARmdW5jlEuCQwIAAZSMA3ZhbJSFlCl0lFKUfZQojAtfX3BhY2thZ2VfX5SMGHN0YWJsZV9iYXNlbGluZXMzLmNvbW1vbpSMCF9fbmFtZV9flIwec3RhYmxlX2Jhc2VsaW5lczMuY29tbW9uLnV0aWxzlIwIX19maWxlX1+UjE8vaG9tZS9taWtpLy5sb2NhbC9saWIvcHl0aG9uMy45L3NpdGUtcGFja2FnZXMvc3RhYmxlX2Jhc2VsaW5lczMvY29tbW9uL3V0aWxzLnB5lHVOTmgAjBBfbWFrZV9lbXB0eV9jZWxslJOUKVKUhZR0lFKUjBxjbG91ZHBpY2tsZS5jbG91ZHBpY2tsZV9mYXN0lIwSX2Z1bmN0aW9uX3NldHN0YXRllJOUaB99lH2UKGgWaA2MDF9fcXVhbG5hbWVfX5SMGWNvbnN0YW50X2ZuLjxsb2NhbHM+LmZ1bmOUjA9fX2Fubm90YXRpb25zX1+UfZSMDl9fa3dkZWZhdWx0c19flE6MDF9fZGVmYXVsdHNfX5ROjApfX21vZHVsZV9flGgXjAdfX2RvY19flE6MC19fY2xvc3VyZV9flGgAjApfbWFrZV9jZWxslJOURz/JmZmZmZmahZRSlIWUjBdfY2xvdWRwaWNrbGVfc3VibW9kdWxlc5RdlIwLX19nbG9iYWxzX1+UfZR1hpSGUjAu"}, "clip_range_vf": null, "normalize_advantage": true, "target_kl": null, "system_info": {"OS": "Linux-5.14.0-239.el9.x86_64-x86_64-with-glibc2.34 # 1 SMP PREEMPT_DYNAMIC Thu Jan 19 14:14:19 UTC 2023", "Python": "3.9.16", "Stable-Baselines3": "1.7.0", "PyTorch": "1.13.1+cu117", "GPU Enabled": "True", "Numpy": "1.24.1", "Gym": "0.21.0"}}
|
|
|
|
| 1 |
+
{"policy_class": {":type:": "<class 'abc.ABCMeta'>", ":serialized:": "gAWVOwAAAAAAAACMIXN0YWJsZV9iYXNlbGluZXMzLmNvbW1vbi5wb2xpY2llc5SMEUFjdG9yQ3JpdGljUG9saWN5lJOULg==", "__module__": "stable_baselines3.common.policies", "__doc__": "\n Policy class for actor-critic algorithms (has both policy and value prediction).\n Used by A2C, PPO and the likes.\n\n :param observation_space: Observation space\n :param action_space: Action space\n :param lr_schedule: Learning rate schedule (could be constant)\n :param net_arch: The specification of the policy and value networks.\n :param activation_fn: Activation function\n :param ortho_init: Whether to use or not orthogonal initialization\n :param use_sde: Whether to use State Dependent Exploration or not\n :param log_std_init: Initial value for the log standard deviation\n :param full_std: Whether to use (n_features x n_actions) parameters\n for the std instead of only (n_features,) when using gSDE\n :param use_expln: Use ``expln()`` function instead of ``exp()`` to ensure\n a positive standard deviation (cf paper). It allows to keep variance\n above zero and prevent it from growing too fast. In practice, ``exp()`` is usually enough.\n :param squash_output: Whether to squash the output using a tanh function,\n this allows to ensure boundaries when using gSDE.\n :param features_extractor_class: Features extractor to use.\n :param features_extractor_kwargs: Keyword arguments\n to pass to the features extractor.\n :param share_features_extractor: If True, the features extractor is shared between the policy and value networks.\n :param normalize_images: Whether to normalize images or not,\n dividing by 255.0 (True by default)\n :param optimizer_class: The optimizer to use,\n ``th.optim.Adam`` by default\n :param optimizer_kwargs: Additional keyword arguments,\n excluding the learning rate, to pass to the optimizer\n ", "__init__": "<function ActorCriticPolicy.__init__ at 0x7fcef6216d30>", "_get_constructor_parameters": "<function ActorCriticPolicy._get_constructor_parameters at 0x7fcef6216dc0>", "reset_noise": "<function ActorCriticPolicy.reset_noise at 0x7fcef6216e50>", "_build_mlp_extractor": "<function ActorCriticPolicy._build_mlp_extractor at 0x7fcef6216ee0>", "_build": "<function ActorCriticPolicy._build at 0x7fcef6216f70>", "forward": "<function ActorCriticPolicy.forward at 0x7fcef621b040>", "extract_features": "<function ActorCriticPolicy.extract_features at 0x7fcef621b0d0>", "_get_action_dist_from_latent": "<function ActorCriticPolicy._get_action_dist_from_latent at 0x7fcef621b160>", "_predict": "<function ActorCriticPolicy._predict at 0x7fcef621b1f0>", "evaluate_actions": "<function ActorCriticPolicy.evaluate_actions at 0x7fcef621b280>", "get_distribution": "<function ActorCriticPolicy.get_distribution at 0x7fcef621b310>", "predict_values": "<function ActorCriticPolicy.predict_values at 0x7fcef621b3a0>", "__abstractmethods__": "frozenset()", "_abc_impl": "<_abc._abc_data object at 0x7fcef62198c0>"}, "verbose": 1, "policy_kwargs": {}, "observation_space": {":type:": "<class 'gym.spaces.box.Box'>", ":serialized:": "gAWVnwEAAAAAAACMDmd5bS5zcGFjZXMuYm94lIwDQm94lJOUKYGUfZQojAVkdHlwZZSMBW51bXB5lGgFk5SMAmY0lImIh5RSlChLA4wBPJROTk5K/////0r/////SwB0lGKMBl9zaGFwZZRLCIWUjANsb3eUjBJudW1weS5jb3JlLm51bWVyaWOUjAtfZnJvbWJ1ZmZlcpSTlCiWIAAAAAAAAAAAAID/AACA/wAAgP8AAID/AACA/wAAgP8AAID/AACA/5RoCksIhZSMAUOUdJRSlIwEaGlnaJRoEiiWIAAAAAAAAAAAAIB/AACAfwAAgH8AAIB/AACAfwAAgH8AAIB/AACAf5RoCksIhZRoFXSUUpSMDWJvdW5kZWRfYmVsb3eUaBIolggAAAAAAAAAAAAAAAAAAACUaAeMAmIxlImIh5RSlChLA4wBfJROTk5K/////0r/////SwB0lGJLCIWUaBV0lFKUjA1ib3VuZGVkX2Fib3ZllGgSKJYIAAAAAAAAAAAAAAAAAAAAlGghSwiFlGgVdJRSlIwKX25wX3JhbmRvbZROdWIu", "dtype": "float32", "_shape": [8], "low": "[-inf -inf -inf -inf -inf -inf -inf -inf]", "high": "[inf inf inf inf inf inf inf inf]", "bounded_below": "[False False False False False False False False]", "bounded_above": "[False False False False False False False False]", "_np_random": null}, "action_space": {":type:": "<class 'gym.spaces.discrete.Discrete'>", ":serialized:": "gAWViAAAAAAAAACME2d5bS5zcGFjZXMuZGlzY3JldGWUjAhEaXNjcmV0ZZSTlCmBlH2UKIwBbpRLBIwGX3NoYXBllCmMBWR0eXBllIwFbnVtcHmUjAVkdHlwZZSTlIwCaTiUiYiHlFKUKEsDjAE8lE5OTkr/////Sv////9LAHSUYowKX25wX3JhbmRvbZROdWIu", "n": 4, "_shape": [], "dtype": "int64", "_np_random": null}, "n_envs": 16, "num_timesteps": 1015808, "_total_timesteps": 1000000, "_num_timesteps_at_start": 0, "seed": null, "action_noise": null, "start_time": 1680082258915377443, "learning_rate": 0.0003, "tensorboard_log": null, "lr_schedule": {":type:": "<class 'function'>", ":serialized:": "gAWV0QIAAAAAAACMF2Nsb3VkcGlja2xlLmNsb3VkcGlja2xllIwOX21ha2VfZnVuY3Rpb26Uk5QoaACMDV9idWlsdGluX3R5cGWUk5SMCENvZGVUeXBllIWUUpQoSwFLAEsASwFLAUsTQwSIAFMAlE6FlCmMAV+UhZSMTy9ob21lL21pa2kvLmxvY2FsL2xpYi9weXRob24zLjkvc2l0ZS1wYWNrYWdlcy9zdGFibGVfYmFzZWxpbmVzMy9jb21tb24vdXRpbHMucHmUjARmdW5jlEuCQwIAAZSMA3ZhbJSFlCl0lFKUfZQojAtfX3BhY2thZ2VfX5SMGHN0YWJsZV9iYXNlbGluZXMzLmNvbW1vbpSMCF9fbmFtZV9flIwec3RhYmxlX2Jhc2VsaW5lczMuY29tbW9uLnV0aWxzlIwIX19maWxlX1+UjE8vaG9tZS9taWtpLy5sb2NhbC9saWIvcHl0aG9uMy45L3NpdGUtcGFja2FnZXMvc3RhYmxlX2Jhc2VsaW5lczMvY29tbW9uL3V0aWxzLnB5lHVOTmgAjBBfbWFrZV9lbXB0eV9jZWxslJOUKVKUhZR0lFKUjBxjbG91ZHBpY2tsZS5jbG91ZHBpY2tsZV9mYXN0lIwSX2Z1bmN0aW9uX3NldHN0YXRllJOUaB99lH2UKGgWaA2MDF9fcXVhbG5hbWVfX5SMGWNvbnN0YW50X2ZuLjxsb2NhbHM+LmZ1bmOUjA9fX2Fubm90YXRpb25zX1+UfZSMDl9fa3dkZWZhdWx0c19flE6MDF9fZGVmYXVsdHNfX5ROjApfX21vZHVsZV9flGgXjAdfX2RvY19flE6MC19fY2xvc3VyZV9flGgAjApfbWFrZV9jZWxslJOURz8zqSowVTJhhZRSlIWUjBdfY2xvdWRwaWNrbGVfc3VibW9kdWxlc5RdlIwLX19nbG9iYWxzX1+UfZR1hpSGUjAu"}, "_last_obs": {":type:": "<class 'numpy.ndarray'>", ":serialized:": "gAWVdQIAAAAAAACMEm51bXB5LmNvcmUubnVtZXJpY5SMC19mcm9tYnVmZmVylJOUKJYAAgAAAAAAAAA42zuBbn4+zf6NPQfRxr7/GSE7rTKPPAAAAAAAAAAAACAMO/bkXbp9+kC5lSE1tCWx0LrwBGM4AACAPwAAgD+apBi9SEHWuJAn/jhvwFU2tQZEumZZGbgAAIA/AACAPzNfJz3DwUO6m6oyutXr97QNakk7TW9ROQAAgD8AAIA/zdjfO8OJe7ra3Uw7cxfgNT/Ogrp2V2+6AACAPwAAgD8mk1c+8pAJP0B+ib6WyMm+3c8OPui6Ir4AAAAAAAAAAGaS/7xIP5O6uvn7O0EitzYnzsi5reatNQAAgD8AAIA/mnn/Oq59kLoGDgM51tYANEUikDiZ2Be4AACAPwAAgD+aWaw59uwiukSxQjuhQs027RvgOtgMzDUAAIA/AACAP5qPPj1c6qs/ZDgKP3Sd8L4f+hc8Fgc+PgAAAAAAAAAAmlkkOq5Blro6eB+64J94tjIqrjrQrTg5AACAPwAAgD+ax3W9XNtXulhr4TQ9VhIwRxhruknnM7QAAIA/AACAPzO+ijzhgoC6RZNDuloFQbU4auY6fmRkOQAAgD8AAIA/zcpMPJzjRbw4Ue093BF+vTb6Qb1f67K6AACAPwAAgD8A0j69FKaFul5GiTuRafA19i4lO+D95jQAAIA/AACAP2ZySLxca1K6RmldOrpqTjXNLEE6SpaCuQAAgD8AAIA/lIwFbnVtcHmUjAVkdHlwZZSTlIwCZjSUiYiHlFKUKEsDjAE8lE5OTkr/////Sv////9LAHSUYksQSwiGlIwBQ5R0lFKULg=="}, "_last_episode_starts": {":type:": "<class 'numpy.ndarray'>", ":serialized:": "gAWVgwAAAAAAAACMEm51bXB5LmNvcmUubnVtZXJpY5SMC19mcm9tYnVmZmVylJOUKJYQAAAAAAAAAAAAAAAAAAAAAAAAAAAAAACUjAVudW1weZSMBWR0eXBllJOUjAJiMZSJiIeUUpQoSwOMAXyUTk5OSv////9K/////0sAdJRiSxCFlIwBQ5R0lFKULg=="}, "_last_original_obs": null, "_episode_num": 0, "use_sde": false, "sde_sample_freq": -1, "_current_progress_remaining": -0.015808000000000044, "ep_info_buffer": {":type:": "<class 'collections.deque'>", ":serialized:": "gAWVdRAAAAAAAACMC2NvbGxlY3Rpb25zlIwFZGVxdWWUk5QpS2SGlFKUKH2UKIwBcpSMFW51bXB5LmNvcmUubXVsdGlhcnJheZSMBnNjYWxhcpSTlIwFbnVtcHmUjAVkdHlwZZSTlIwCZjiUiYiHlFKUKEsDjAE8lE5OTkr/////Sv////9LAHSUYkMIijpzD8micUCUhpRSlIwBbJRL5owBdJRHQMSYVlwkxAV1fZQoaAZoCWgPQwhzS6shcSdzQJSGlFKUaBVNlwFoFkdAxJiAS5AhS3V9lChoBmgJaA9DCMmP+BXrXHFAlIaUUpRoFU2DAmgWR0DEmLDdSEUTdX2UKGgGaAloD0MIZOjYQaVbcECUhpRSlGgVTWsBaBZHQMSZAGZeAut1fZQoaAZoCWgPQwhUq6+uCn5zQJSGlFKUaBVL1WgWR0DEmQl6/qPfdX2UKGgGaAloD0MIwY7/AoFvckCUhpRSlGgVTfICaBZHQMSZGNwaR6p1fZQoaAZoCWgPQwhkd4GSQrhxQJSGlFKUaBVNUgFoFkdAxKG27iADrHV9lChoBmgJaA9DCFVLOsrBzmRAlIaUUpRoFU3oA2gWR0DEofPBnBcidX2UKGgGaAloD0MID5nyISg0ZUCUhpRSlGgVTegDaBZHQMSiDbNB4Ux1fZQoaAZoCWgPQwiQZcHEn1llQJSGlFKUaBVN6ANoFkdAxKI7aIN3GHV9lChoBmgJaA9DCJ8AipEldGhAlIaUUpRoFU3oA2gWR0DEokm98JD3dX2UKGgGaAloD0MIJGJKJNEuZECUhpRSlGgVTegDaBZHQMSib2YfGMp1fZQoaAZoCWgPQwi+ZrlsdNZwQJSGlFKUaBVNEgJoFkdAxKJ6JhvzfHV9lChoBmgJaA9DCCrj32dc0m9AlIaUUpRoFU3UAmgWR0DEooNbiZOSdX2UKGgGaAloD0MIlnmrrkM7UkCUhpRSlGgVS4VoFkdAxKKoEidJ8XV9lChoBmgJaA9DCGe610l9i2hAlIaUUpRoFU3oA2gWR0DEovgw/PgOdX2UKGgGaAloD0MIMBNFSF18cECUhpRSlGgVS/xoFkdAxKOZPhybQXV9lChoBmgJaA9DCK1M+KW+X3JAlIaUUpRoFU1JAWgWR0DEo7np8neBdX2UKGgGaAloD0MI1CtlGWLzZUCUhpRSlGgVTegDaBZHQMSjzJDNQj51fZQoaAZoCWgPQwheonpr4EtzQJSGlFKUaBVN6AJoFkdAxKPTEpAlfXV9lChoBmgJaA9DCJm36jqUHXJAlIaUUpRoFU3IAWgWR0DEpBpq46OpdX2UKGgGaAloD0MIZjOHpJbJakCUhpRSlGgVTegDaBZHQMSkP01ZTyd1fZQoaAZoCWgPQwjgDtQpj6pnQJSGlFKUaBVN6ANoFkdAxKSEFs54nnV9lChoBmgJaA9DCHnNqzrrvnBAlIaUUpRoFUvQaBZHQMSkjyeZof11fZQoaAZoCWgPQwjHm/wWnfltQJSGlFKUaBVNhQNoFkdAxKTM0vXbunV9lChoBmgJaA9DCGajc34KSnJAlIaUUpRoFU2CA2gWR0DEpOBXKbKBdX2UKGgGaAloD0MI8x5nmjA1c0CUhpRSlGgVTbwCaBZHQMSk/ytV7yB1fZQoaAZoCWgPQwhJ10y+WZdhQJSGlFKUaBVN6ANoFkdAxKUKQnx8UnV9lChoBmgJaA9DCJ/HKM+8rmVAlIaUUpRoFU3oA2gWR0DEpRLJQtSRdX2UKGgGaAloD0MI2o6puzLjZECUhpRSlGgVTegDaBZHQMSlcpFCswN1fZQoaAZoCWgPQwj+RGXDmpJkQJSGlFKUaBVN6ANoFkdAxKWMIt16mnV9lChoBmgJaA9DCHZSX5Z2DGlAlIaUUpRoFU3oA2gWR0DEpcoQHzH0dX2UKGgGaAloD0MIEw69xQO6ckCUhpRSlGgVS/FoFkdAxKXUhBZ6lnV9lChoBmgJaA9DCHI1sist6W9AlIaUUpRoFU2EAWgWR0DEpinkHUtqdX2UKGgGaAloD0MIDt3sD1Qjc0CUhpRSlGgVTecBaBZHQMSmMSCFsYV1fZQoaAZoCWgPQwhOYhBYOY1xQJSGlFKUaBVNRgNoFkdAxKZ84ku6E3V9lChoBmgJaA9DCPbv+sxZwWJAlIaUUpRoFU3oA2gWR0DEpn3FefI0dX2UKGgGaAloD0MIwqbOo+JlcUCUhpRSlGgVTVEBaBZHQMSmsD7Ikqt1fZQoaAZoCWgPQwj68ZcWtU5zQJSGlFKUaBVNlwNoFkdAxKbgLx7RfHV9lChoBmgJaA9DCNzwu+mWRXJAlIaUUpRoFU0mA2gWR0DEpvrdFfAsdX2UKGgGaAloD0MIZ/LNNjfZc0CUhpRSlGgVTVECaBZHQMSm/iT+vQp1fZQoaAZoCWgPQwjRArStZnVmQJSGlFKUaBVN6ANoFkdAxKc2q6OHWXV9lChoBmgJaA9DCKCobFiTKXJAlIaUUpRoFUvUaBZHQMSnN5pSJj51fZQoaAZoCWgPQwgbDeAtkMNmQJSGlFKUaBVN6ANoFkdAxKd/jLB9C3V9lChoBmgJaA9DCJq2f2Wl53FAlIaUUpRoFUvZaBZHQMSnvuUUwi91fZQoaAZoCWgPQwh5zas6K85pQJSGlFKUaBVN6ANoFkdAxKfwoWpIc3V9lChoBmgJaA9DCDj1geRdT3JAlIaUUpRoFU1TA2gWR0DEp/tt8/lidX2UKGgGaAloD0MIVmXfFQFHckCUhpRSlGgVTa0CaBZHQMSoKqYAsCl1fZQoaAZoCWgPQwhqFf2hGYJoQJSGlFKUaBVN6ANoFkdAxKg4WsRxtHV9lChoBmgJaA9DCBBbejRVD3NAlIaUUpRoFU0uA2gWR0DEqD96C17ZdX2UKGgGaAloD0MIUBvV6UCZckCUhpRSlGgVTb4BaBZHQMSoP3++/QB1fZQoaAZoCWgPQwgwYwrWuOVvQJSGlFKUaBVN4QJoFkdAxKiysny/bnV9lChoBmgJaA9DCO9yEd8J/nFAlIaUUpRoFU0hAWgWR0DEqLt9c8kldX2UKGgGaAloD0MIFVRU/QqpcUCUhpRSlGgVTYEDaBZHQMSxveB6KLt1fZQoaAZoCWgPQwinr+drFqVxQJSGlFKUaBVNUgFoFkdAxLHpedCmdnV9lChoBmgJaA9DCKLrwg/OPHNAlIaUUpRoFU05AWgWR0DEsgvdO6/ZdX2UKGgGaAloD0MItDo5Q7FOdECUhpRSlGgVTUUCaBZHQMSyDL4vexh1fZQoaAZoCWgPQwj6sx8pospvQJSGlFKUaBVNVQJoFkdAxLIbDSgGr3V9lChoBmgJaA9DCAJhp1g1oHFAlIaUUpRoFU2QAWgWR0DEsmujO9nLdX2UKGgGaAloD0MItYe9UEApZkCUhpRSlGgVTegDaBZHQMSydKaw2VF1fZQoaAZoCWgPQwiSIjKsImRwQJSGlFKUaBVNMgNoFkdAxLKDOu7pV3V9lChoBmgJaA9DCNRDNLqDXWRAlIaUUpRoFU3oA2gWR0DEsr32kBS2dX2UKGgGaAloD0MIVn+EYQCJc0CUhpRSlGgVTV4BaBZHQMSzHc5S3sp1fZQoaAZoCWgPQwim1vuNdl1tQJSGlFKUaBVNMwNoFkdAxLMo1uR9w3V9lChoBmgJaA9DCPm84qmHqXFAlIaUUpRoFUvbaBZHQMSzOT3yqdZ1fZQoaAZoCWgPQwjqQUEpWhBkQJSGlFKUaBVN6ANoFkdAxLNBe2uxKXV9lChoBmgJaA9DCCtPIOzULXFAlIaUUpRoFU3TAWgWR0DEs1ka86FNdX2UKGgGaAloD0MIOQ1Rhb+5cECUhpRSlGgVTSUDaBZHQMSzjIrvsqt1fZQoaAZoCWgPQwgUev1JvKNzQJSGlFKUaBVNbwJoFkdAxLOyq2Bre3V9lChoBmgJaA9DCAJlU64w0HNAlIaUUpRoFU2YAmgWR0DEs88IomXxdX2UKGgGaAloD0MI/wjDgKUAcECUhpRSlGgVTUUDaBZHQMSz7j3VTaV1fZQoaAZoCWgPQwh79fHQ93RyQJSGlFKUaBVNOwJoFkdAxLRuGdqcmXV9lChoBmgJaA9DCHtNDwpKMT5AlIaUUpRoFUuLaBZHQMS0crPldTp1fZQoaAZoCWgPQwjdW5GYIM5mQJSGlFKUaBVN6ANoFkdAxLSBI5o4/HV9lChoBmgJaA9DCPT6k/jcR3FAlIaUUpRoFU24AmgWR0DEtIvVTaTPdX2UKGgGaAloD0MIw2fr4ODNcUCUhpRSlGgVTQEBaBZHQMS1d9CE6DJ1fZQoaAZoCWgPQwi1FmahndNoQJSGlFKUaBVN6ANoFkdAxLW01BMSK3V9lChoBmgJaA9DCLcKYqDr02dAlIaUUpRoFU3oA2gWR0DEtbYPCl7/dX2UKGgGaAloD0MIVU/mH/0ScUCUhpRSlGgVTTwDaBZHQMS12NZmqYJ1fZQoaAZoCWgPQwhPPdLg9pN0QJSGlFKUaBVNbAFoFkdAxLX2tp22X3V9lChoBmgJaA9DCFDFjVvMqnFAlIaUUpRoFU3oA2gWR0DEtjfIfbKzdX2UKGgGaAloD0MIRwTj4BLYcUCUhpRSlGgVTf0BaBZHQMS2Z0AT7EZ1fZQoaAZoCWgPQwivtIzUO9dxQJSGlFKUaBVN3wJoFkdAxLacZn+Q2nV9lChoBmgJaA9DCIUmiSXlyXBAlIaUUpRoFU2lA2gWR0DEtrOGKyfMdX2UKGgGaAloD0MIol9bP/0aZkCUhpRSlGgVTegDaBZHQMS21Ofdykt1fZQoaAZoCWgPQwjbUgd5vS1lQJSGlFKUaBVN6ANoFkdAxLbfXz19OXV9lChoBmgJaA9DCL6ECg4v8WdAlIaUUpRoFU3oA2gWR0DEtvdOmBOIdX2UKGgGaAloD0MIoz8082SXakCUhpRSlGgVTegDaBZHQMS3DqQ7tAt1fZQoaAZoCWgPQwjekhywq4JpQJSGlFKUaBVN6ANoFkdAxLdDUNKAa3V9lChoBmgJaA9DCJxNRwA3rG9AlIaUUpRoFU03AWgWR0DEt0u4LCvYdX2UKGgGaAloD0MIJTyh1x/nZECUhpRSlGgVTegDaBZHQMS3ZcFyJbd1fZQoaAZoCWgPQwjhlo+kpFtVQJSGlFKUaBVLmmgWR0DEt80XSBsidX2UKGgGaAloD0MIzv5AuW0Lc0CUhpRSlGgVTTwBaBZHQMS34l6Avtd1fZQoaAZoCWgPQwhGCfoLfXBxQJSGlFKUaBVNCQFoFkdAxLfx5aePJnV9lChoBmgJaA9DCNLEO8BTknJAlIaUUpRoFU1IAWgWR0DEuBDMqz7edX2UKGgGaAloD0MIFHmSdM1CZ0CUhpRSlGgVTegDaBZHQMS4LsniNsF1fZQoaAZoCWgPQwhHyhZJe25yQJSGlFKUaBVNKAFoFkdAxLhlqv/za3V9lChoBmgJaA9DCMtHUtJDAHJAlIaUUpRoFU1jA2gWR0DEuIEzAN5MdX2UKGgGaAloD0MIUaG6ufiwcUCUhpRSlGgVTT0CaBZHQMS4iag/Tsp1fZQoaAZoCWgPQwiXcr7YOwVxQJSGlFKUaBVL5WgWR0DEuM5R8+ibdWUu"}, "ep_success_buffer": {":type:": "<class 'collections.deque'>", ":serialized:": "gAWVIAAAAAAAAACMC2NvbGxlY3Rpb25zlIwFZGVxdWWUk5QpS2SGlFKULg=="}, "_n_updates": 1488, "n_steps": 2048, "gamma": 1, "gae_lambda": 0.98, "ent_coef": 0.01, "vf_coef": 0.5, "max_grad_norm": 0.5, "batch_size": 64, "n_epochs": 8, "clip_range": {":type:": "<class 'function'>", ":serialized:": "gAWV0QIAAAAAAACMF2Nsb3VkcGlja2xlLmNsb3VkcGlja2xllIwOX21ha2VfZnVuY3Rpb26Uk5QoaACMDV9idWlsdGluX3R5cGWUk5SMCENvZGVUeXBllIWUUpQoSwFLAEsASwFLAUsTQwSIAFMAlE6FlCmMAV+UhZSMTy9ob21lL21pa2kvLmxvY2FsL2xpYi9weXRob24zLjkvc2l0ZS1wYWNrYWdlcy9zdGFibGVfYmFzZWxpbmVzMy9jb21tb24vdXRpbHMucHmUjARmdW5jlEuCQwIAAZSMA3ZhbJSFlCl0lFKUfZQojAtfX3BhY2thZ2VfX5SMGHN0YWJsZV9iYXNlbGluZXMzLmNvbW1vbpSMCF9fbmFtZV9flIwec3RhYmxlX2Jhc2VsaW5lczMuY29tbW9uLnV0aWxzlIwIX19maWxlX1+UjE8vaG9tZS9taWtpLy5sb2NhbC9saWIvcHl0aG9uMy45L3NpdGUtcGFja2FnZXMvc3RhYmxlX2Jhc2VsaW5lczMvY29tbW9uL3V0aWxzLnB5lHVOTmgAjBBfbWFrZV9lbXB0eV9jZWxslJOUKVKUhZR0lFKUjBxjbG91ZHBpY2tsZS5jbG91ZHBpY2tsZV9mYXN0lIwSX2Z1bmN0aW9uX3NldHN0YXRllJOUaB99lH2UKGgWaA2MDF9fcXVhbG5hbWVfX5SMGWNvbnN0YW50X2ZuLjxsb2NhbHM+LmZ1bmOUjA9fX2Fubm90YXRpb25zX1+UfZSMDl9fa3dkZWZhdWx0c19flE6MDF9fZGVmYXVsdHNfX5ROjApfX21vZHVsZV9flGgXjAdfX2RvY19flE6MC19fY2xvc3VyZV9flGgAjApfbWFrZV9jZWxslJOURz/JmZmZmZmahZRSlIWUjBdfY2xvdWRwaWNrbGVfc3VibW9kdWxlc5RdlIwLX19nbG9iYWxzX1+UfZR1hpSGUjAu"}, "clip_range_vf": null, "normalize_advantage": true, "target_kl": null, "system_info": {"OS": "Linux-5.14.0-239.el9.x86_64-x86_64-with-glibc2.34 # 1 SMP PREEMPT_DYNAMIC Thu Jan 19 14:14:19 UTC 2023", "Python": "3.9.16", "Stable-Baselines3": "1.7.0", "PyTorch": "1.13.1+cu117", "GPU Enabled": "True", "Numpy": "1.24.1", "Gym": "0.21.0"}}
|
ppo-LunarLander-g1.zip
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
-
size
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:243292c7a1cdf4845bece26ace647d6b28aaeb118fbff51d3c0b8ed6a6daabac
|
| 3 |
+
size 147478
|
ppo-LunarLander-g1/data
CHANGED
|
@@ -48,7 +48,7 @@
|
|
| 48 |
"_num_timesteps_at_start": 0,
|
| 49 |
"seed": null,
|
| 50 |
"action_noise": null,
|
| 51 |
-
"start_time":
|
| 52 |
"learning_rate": 0.0003,
|
| 53 |
"tensorboard_log": null,
|
| 54 |
"lr_schedule": {
|
|
@@ -57,7 +57,7 @@
|
|
| 57 |
},
|
| 58 |
"_last_obs": {
|
| 59 |
":type:": "<class 'numpy.ndarray'>",
|
| 60 |
-
":serialized:": "
|
| 61 |
},
|
| 62 |
"_last_episode_starts": {
|
| 63 |
":type:": "<class 'numpy.ndarray'>",
|
|
@@ -70,13 +70,13 @@
|
|
| 70 |
"_current_progress_remaining": -0.015808000000000044,
|
| 71 |
"ep_info_buffer": {
|
| 72 |
":type:": "<class 'collections.deque'>",
|
| 73 |
-
":serialized:": "
|
| 74 |
},
|
| 75 |
"ep_success_buffer": {
|
| 76 |
":type:": "<class 'collections.deque'>",
|
| 77 |
":serialized:": "gAWVIAAAAAAAAACMC2NvbGxlY3Rpb25zlIwFZGVxdWWUk5QpS2SGlFKULg=="
|
| 78 |
},
|
| 79 |
-
"_n_updates":
|
| 80 |
"n_steps": 2048,
|
| 81 |
"gamma": 1,
|
| 82 |
"gae_lambda": 0.98,
|
|
|
|
| 48 |
"_num_timesteps_at_start": 0,
|
| 49 |
"seed": null,
|
| 50 |
"action_noise": null,
|
| 51 |
+
"start_time": 1680082258915377443,
|
| 52 |
"learning_rate": 0.0003,
|
| 53 |
"tensorboard_log": null,
|
| 54 |
"lr_schedule": {
|
|
|
|
| 57 |
},
|
| 58 |
"_last_obs": {
|
| 59 |
":type:": "<class 'numpy.ndarray'>",
|
| 60 |
+
":serialized:": "gAWVdQIAAAAAAACMEm51bXB5LmNvcmUubnVtZXJpY5SMC19mcm9tYnVmZmVylJOUKJYAAgAAAAAAAAA42zuBbn4+zf6NPQfRxr7/GSE7rTKPPAAAAAAAAAAAACAMO/bkXbp9+kC5lSE1tCWx0LrwBGM4AACAPwAAgD+apBi9SEHWuJAn/jhvwFU2tQZEumZZGbgAAIA/AACAPzNfJz3DwUO6m6oyutXr97QNakk7TW9ROQAAgD8AAIA/zdjfO8OJe7ra3Uw7cxfgNT/Ogrp2V2+6AACAPwAAgD8mk1c+8pAJP0B+ib6WyMm+3c8OPui6Ir4AAAAAAAAAAGaS/7xIP5O6uvn7O0EitzYnzsi5reatNQAAgD8AAIA/mnn/Oq59kLoGDgM51tYANEUikDiZ2Be4AACAPwAAgD+aWaw59uwiukSxQjuhQs027RvgOtgMzDUAAIA/AACAP5qPPj1c6qs/ZDgKP3Sd8L4f+hc8Fgc+PgAAAAAAAAAAmlkkOq5Blro6eB+64J94tjIqrjrQrTg5AACAPwAAgD+ax3W9XNtXulhr4TQ9VhIwRxhruknnM7QAAIA/AACAPzO+ijzhgoC6RZNDuloFQbU4auY6fmRkOQAAgD8AAIA/zcpMPJzjRbw4Ue093BF+vTb6Qb1f67K6AACAPwAAgD8A0j69FKaFul5GiTuRafA19i4lO+D95jQAAIA/AACAP2ZySLxca1K6RmldOrpqTjXNLEE6SpaCuQAAgD8AAIA/lIwFbnVtcHmUjAVkdHlwZZSTlIwCZjSUiYiHlFKUKEsDjAE8lE5OTkr/////Sv////9LAHSUYksQSwiGlIwBQ5R0lFKULg=="
|
| 61 |
},
|
| 62 |
"_last_episode_starts": {
|
| 63 |
":type:": "<class 'numpy.ndarray'>",
|
|
|
|
| 70 |
"_current_progress_remaining": -0.015808000000000044,
|
| 71 |
"ep_info_buffer": {
|
| 72 |
":type:": "<class 'collections.deque'>",
|
| 73 |
+
":serialized:": "gAWVdRAAAAAAAACMC2NvbGxlY3Rpb25zlIwFZGVxdWWUk5QpS2SGlFKUKH2UKIwBcpSMFW51bXB5LmNvcmUubXVsdGlhcnJheZSMBnNjYWxhcpSTlIwFbnVtcHmUjAVkdHlwZZSTlIwCZjiUiYiHlFKUKEsDjAE8lE5OTkr/////Sv////9LAHSUYkMIijpzD8micUCUhpRSlIwBbJRL5owBdJRHQMSYVlwkxAV1fZQoaAZoCWgPQwhzS6shcSdzQJSGlFKUaBVNlwFoFkdAxJiAS5AhS3V9lChoBmgJaA9DCMmP+BXrXHFAlIaUUpRoFU2DAmgWR0DEmLDdSEUTdX2UKGgGaAloD0MIZOjYQaVbcECUhpRSlGgVTWsBaBZHQMSZAGZeAut1fZQoaAZoCWgPQwhUq6+uCn5zQJSGlFKUaBVL1WgWR0DEmQl6/qPfdX2UKGgGaAloD0MIwY7/AoFvckCUhpRSlGgVTfICaBZHQMSZGNwaR6p1fZQoaAZoCWgPQwhkd4GSQrhxQJSGlFKUaBVNUgFoFkdAxKG27iADrHV9lChoBmgJaA9DCFVLOsrBzmRAlIaUUpRoFU3oA2gWR0DEofPBnBcidX2UKGgGaAloD0MID5nyISg0ZUCUhpRSlGgVTegDaBZHQMSiDbNB4Ux1fZQoaAZoCWgPQwiQZcHEn1llQJSGlFKUaBVN6ANoFkdAxKI7aIN3GHV9lChoBmgJaA9DCJ8AipEldGhAlIaUUpRoFU3oA2gWR0DEokm98JD3dX2UKGgGaAloD0MIJGJKJNEuZECUhpRSlGgVTegDaBZHQMSib2YfGMp1fZQoaAZoCWgPQwi+ZrlsdNZwQJSGlFKUaBVNEgJoFkdAxKJ6JhvzfHV9lChoBmgJaA9DCCrj32dc0m9AlIaUUpRoFU3UAmgWR0DEooNbiZOSdX2UKGgGaAloD0MIlnmrrkM7UkCUhpRSlGgVS4VoFkdAxKKoEidJ8XV9lChoBmgJaA9DCGe610l9i2hAlIaUUpRoFU3oA2gWR0DEovgw/PgOdX2UKGgGaAloD0MIMBNFSF18cECUhpRSlGgVS/xoFkdAxKOZPhybQXV9lChoBmgJaA9DCK1M+KW+X3JAlIaUUpRoFU1JAWgWR0DEo7np8neBdX2UKGgGaAloD0MI1CtlGWLzZUCUhpRSlGgVTegDaBZHQMSjzJDNQj51fZQoaAZoCWgPQwheonpr4EtzQJSGlFKUaBVN6AJoFkdAxKPTEpAlfXV9lChoBmgJaA9DCJm36jqUHXJAlIaUUpRoFU3IAWgWR0DEpBpq46OpdX2UKGgGaAloD0MIZjOHpJbJakCUhpRSlGgVTegDaBZHQMSkP01ZTyd1fZQoaAZoCWgPQwjgDtQpj6pnQJSGlFKUaBVN6ANoFkdAxKSEFs54nnV9lChoBmgJaA9DCHnNqzrrvnBAlIaUUpRoFUvQaBZHQMSkjyeZof11fZQoaAZoCWgPQwjHm/wWnfltQJSGlFKUaBVNhQNoFkdAxKTM0vXbunV9lChoBmgJaA9DCGajc34KSnJAlIaUUpRoFU2CA2gWR0DEpOBXKbKBdX2UKGgGaAloD0MI8x5nmjA1c0CUhpRSlGgVTbwCaBZHQMSk/ytV7yB1fZQoaAZoCWgPQwhJ10y+WZdhQJSGlFKUaBVN6ANoFkdAxKUKQnx8UnV9lChoBmgJaA9DCJ/HKM+8rmVAlIaUUpRoFU3oA2gWR0DEpRLJQtSRdX2UKGgGaAloD0MI2o6puzLjZECUhpRSlGgVTegDaBZHQMSlcpFCswN1fZQoaAZoCWgPQwj+RGXDmpJkQJSGlFKUaBVN6ANoFkdAxKWMIt16mnV9lChoBmgJaA9DCHZSX5Z2DGlAlIaUUpRoFU3oA2gWR0DEpcoQHzH0dX2UKGgGaAloD0MIEw69xQO6ckCUhpRSlGgVS/FoFkdAxKXUhBZ6lnV9lChoBmgJaA9DCHI1sist6W9AlIaUUpRoFU2EAWgWR0DEpinkHUtqdX2UKGgGaAloD0MIDt3sD1Qjc0CUhpRSlGgVTecBaBZHQMSmMSCFsYV1fZQoaAZoCWgPQwhOYhBYOY1xQJSGlFKUaBVNRgNoFkdAxKZ84ku6E3V9lChoBmgJaA9DCPbv+sxZwWJAlIaUUpRoFU3oA2gWR0DEpn3FefI0dX2UKGgGaAloD0MIwqbOo+JlcUCUhpRSlGgVTVEBaBZHQMSmsD7Ikqt1fZQoaAZoCWgPQwj68ZcWtU5zQJSGlFKUaBVNlwNoFkdAxKbgLx7RfHV9lChoBmgJaA9DCNzwu+mWRXJAlIaUUpRoFU0mA2gWR0DEpvrdFfAsdX2UKGgGaAloD0MIZ/LNNjfZc0CUhpRSlGgVTVECaBZHQMSm/iT+vQp1fZQoaAZoCWgPQwjRArStZnVmQJSGlFKUaBVN6ANoFkdAxKc2q6OHWXV9lChoBmgJaA9DCKCobFiTKXJAlIaUUpRoFUvUaBZHQMSnN5pSJj51fZQoaAZoCWgPQwgbDeAtkMNmQJSGlFKUaBVN6ANoFkdAxKd/jLB9C3V9lChoBmgJaA9DCJq2f2Wl53FAlIaUUpRoFUvZaBZHQMSnvuUUwi91fZQoaAZoCWgPQwh5zas6K85pQJSGlFKUaBVN6ANoFkdAxKfwoWpIc3V9lChoBmgJaA9DCDj1geRdT3JAlIaUUpRoFU1TA2gWR0DEp/tt8/lidX2UKGgGaAloD0MIVmXfFQFHckCUhpRSlGgVTa0CaBZHQMSoKqYAsCl1fZQoaAZoCWgPQwhqFf2hGYJoQJSGlFKUaBVN6ANoFkdAxKg4WsRxtHV9lChoBmgJaA9DCBBbejRVD3NAlIaUUpRoFU0uA2gWR0DEqD96C17ZdX2UKGgGaAloD0MIUBvV6UCZckCUhpRSlGgVTb4BaBZHQMSoP3++/QB1fZQoaAZoCWgPQwgwYwrWuOVvQJSGlFKUaBVN4QJoFkdAxKiysny/bnV9lChoBmgJaA9DCO9yEd8J/nFAlIaUUpRoFU0hAWgWR0DEqLt9c8kldX2UKGgGaAloD0MIFVRU/QqpcUCUhpRSlGgVTYEDaBZHQMSxveB6KLt1fZQoaAZoCWgPQwinr+drFqVxQJSGlFKUaBVNUgFoFkdAxLHpedCmdnV9lChoBmgJaA9DCKLrwg/OPHNAlIaUUpRoFU05AWgWR0DEsgvdO6/ZdX2UKGgGaAloD0MItDo5Q7FOdECUhpRSlGgVTUUCaBZHQMSyDL4vexh1fZQoaAZoCWgPQwj6sx8pospvQJSGlFKUaBVNVQJoFkdAxLIbDSgGr3V9lChoBmgJaA9DCAJhp1g1oHFAlIaUUpRoFU2QAWgWR0DEsmujO9nLdX2UKGgGaAloD0MItYe9UEApZkCUhpRSlGgVTegDaBZHQMSydKaw2VF1fZQoaAZoCWgPQwiSIjKsImRwQJSGlFKUaBVNMgNoFkdAxLKDOu7pV3V9lChoBmgJaA9DCNRDNLqDXWRAlIaUUpRoFU3oA2gWR0DEsr32kBS2dX2UKGgGaAloD0MIVn+EYQCJc0CUhpRSlGgVTV4BaBZHQMSzHc5S3sp1fZQoaAZoCWgPQwim1vuNdl1tQJSGlFKUaBVNMwNoFkdAxLMo1uR9w3V9lChoBmgJaA9DCPm84qmHqXFAlIaUUpRoFUvbaBZHQMSzOT3yqdZ1fZQoaAZoCWgPQwjqQUEpWhBkQJSGlFKUaBVN6ANoFkdAxLNBe2uxKXV9lChoBmgJaA9DCCtPIOzULXFAlIaUUpRoFU3TAWgWR0DEs1ka86FNdX2UKGgGaAloD0MIOQ1Rhb+5cECUhpRSlGgVTSUDaBZHQMSzjIrvsqt1fZQoaAZoCWgPQwgUev1JvKNzQJSGlFKUaBVNbwJoFkdAxLOyq2Bre3V9lChoBmgJaA9DCAJlU64w0HNAlIaUUpRoFU2YAmgWR0DEs88IomXxdX2UKGgGaAloD0MI/wjDgKUAcECUhpRSlGgVTUUDaBZHQMSz7j3VTaV1fZQoaAZoCWgPQwh79fHQ93RyQJSGlFKUaBVNOwJoFkdAxLRuGdqcmXV9lChoBmgJaA9DCHtNDwpKMT5AlIaUUpRoFUuLaBZHQMS0crPldTp1fZQoaAZoCWgPQwjdW5GYIM5mQJSGlFKUaBVN6ANoFkdAxLSBI5o4/HV9lChoBmgJaA9DCPT6k/jcR3FAlIaUUpRoFU24AmgWR0DEtIvVTaTPdX2UKGgGaAloD0MIw2fr4ODNcUCUhpRSlGgVTQEBaBZHQMS1d9CE6DJ1fZQoaAZoCWgPQwi1FmahndNoQJSGlFKUaBVN6ANoFkdAxLW01BMSK3V9lChoBmgJaA9DCLcKYqDr02dAlIaUUpRoFU3oA2gWR0DEtbYPCl7/dX2UKGgGaAloD0MIVU/mH/0ScUCUhpRSlGgVTTwDaBZHQMS12NZmqYJ1fZQoaAZoCWgPQwhPPdLg9pN0QJSGlFKUaBVNbAFoFkdAxLX2tp22X3V9lChoBmgJaA9DCFDFjVvMqnFAlIaUUpRoFU3oA2gWR0DEtjfIfbKzdX2UKGgGaAloD0MIRwTj4BLYcUCUhpRSlGgVTf0BaBZHQMS2Z0AT7EZ1fZQoaAZoCWgPQwivtIzUO9dxQJSGlFKUaBVN3wJoFkdAxLacZn+Q2nV9lChoBmgJaA9DCIUmiSXlyXBAlIaUUpRoFU2lA2gWR0DEtrOGKyfMdX2UKGgGaAloD0MIol9bP/0aZkCUhpRSlGgVTegDaBZHQMS21Ofdykt1fZQoaAZoCWgPQwjbUgd5vS1lQJSGlFKUaBVN6ANoFkdAxLbfXz19OXV9lChoBmgJaA9DCL6ECg4v8WdAlIaUUpRoFU3oA2gWR0DEtvdOmBOIdX2UKGgGaAloD0MIoz8082SXakCUhpRSlGgVTegDaBZHQMS3DqQ7tAt1fZQoaAZoCWgPQwjekhywq4JpQJSGlFKUaBVN6ANoFkdAxLdDUNKAa3V9lChoBmgJaA9DCJxNRwA3rG9AlIaUUpRoFU03AWgWR0DEt0u4LCvYdX2UKGgGaAloD0MIJTyh1x/nZECUhpRSlGgVTegDaBZHQMS3ZcFyJbd1fZQoaAZoCWgPQwjhlo+kpFtVQJSGlFKUaBVLmmgWR0DEt80XSBsidX2UKGgGaAloD0MIzv5AuW0Lc0CUhpRSlGgVTTwBaBZHQMS34l6Avtd1fZQoaAZoCWgPQwhGCfoLfXBxQJSGlFKUaBVNCQFoFkdAxLfx5aePJnV9lChoBmgJaA9DCNLEO8BTknJAlIaUUpRoFU1IAWgWR0DEuBDMqz7edX2UKGgGaAloD0MIFHmSdM1CZ0CUhpRSlGgVTegDaBZHQMS4LsniNsF1fZQoaAZoCWgPQwhHyhZJe25yQJSGlFKUaBVNKAFoFkdAxLhlqv/za3V9lChoBmgJaA9DCMtHUtJDAHJAlIaUUpRoFU1jA2gWR0DEuIEzAN5MdX2UKGgGaAloD0MIUaG6ufiwcUCUhpRSlGgVTT0CaBZHQMS4iag/Tsp1fZQoaAZoCWgPQwiXcr7YOwVxQJSGlFKUaBVL5WgWR0DEuM5R8+ibdWUu"
|
| 74 |
},
|
| 75 |
"ep_success_buffer": {
|
| 76 |
":type:": "<class 'collections.deque'>",
|
| 77 |
":serialized:": "gAWVIAAAAAAAAACMC2NvbGxlY3Rpb25zlIwFZGVxdWWUk5QpS2SGlFKULg=="
|
| 78 |
},
|
| 79 |
+
"_n_updates": 1488,
|
| 80 |
"n_steps": 2048,
|
| 81 |
"gamma": 1,
|
| 82 |
"gae_lambda": 0.98,
|
ppo-LunarLander-g1/policy.optimizer.pth
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 87929
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:4ee2c3413dd9d76c6fb5831e1af0771248d019775a91b4eaaacdb78e979da902
|
| 3 |
size 87929
|
ppo-LunarLander-g1/policy.pth
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 43393
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:b293c2313888dfa61181d125715b027d68cf68ca80912111eaba13cefbbb96e4
|
| 3 |
size 43393
|
replay.mp4
CHANGED
|
Binary files a/replay.mp4 and b/replay.mp4 differ
|
|
|
results.json
CHANGED
|
@@ -1 +1 @@
|
|
| 1 |
-
{"mean_reward":
|
|
|
|
| 1 |
+
{"mean_reward": 284.6548097550211, "std_reward": 12.105835830261688, "is_deterministic": true, "n_eval_episodes": 10, "eval_datetime": "2023-03-29T13:34:42.102100"}
|