pableitorr commited on
Commit
90486bd
·
verified ·
1 Parent(s): 95554ae

Upload PPO LunarLander-v2 trained agent

Browse files
README.md CHANGED
@@ -16,7 +16,7 @@ model-index:
16
  type: LunarLander-v2
17
  metrics:
18
  - type: mean_reward
19
- value: 280.19 +/- 23.27
20
  name: mean_reward
21
  verified: false
22
  ---
 
16
  type: LunarLander-v2
17
  metrics:
18
  - type: mean_reward
19
+ value: 261.28 +/- 26.18
20
  name: mean_reward
21
  verified: false
22
  ---
config.json CHANGED
@@ -1 +1 @@
1
- {"policy_class": {":type:": "<class 'abc.ABCMeta'>", ":serialized:": "gAWVOwAAAAAAAACMIXN0YWJsZV9iYXNlbGluZXMzLmNvbW1vbi5wb2xpY2llc5SMEUFjdG9yQ3JpdGljUG9saWN5lJOULg==", "__module__": "stable_baselines3.common.policies", "__doc__": "\n Policy class for actor-critic algorithms (has both policy and value prediction).\n Used by A2C, PPO and the likes.\n\n :param observation_space: Observation space\n :param action_space: Action space\n :param lr_schedule: Learning rate schedule (could be constant)\n :param net_arch: The specification of the policy and value networks.\n :param activation_fn: Activation function\n :param ortho_init: Whether to use or not orthogonal initialization\n :param use_sde: Whether to use State Dependent Exploration or not\n :param log_std_init: Initial value for the log standard deviation\n :param full_std: Whether to use (n_features x n_actions) parameters\n for the std instead of only (n_features,) when using gSDE\n :param use_expln: Use ``expln()`` function instead of ``exp()`` to ensure\n a positive standard deviation (cf paper). It allows to keep variance\n above zero and prevent it from growing too fast. In practice, ``exp()`` is usually enough.\n :param squash_output: Whether to squash the output using a tanh function,\n this allows to ensure boundaries when using gSDE.\n :param features_extractor_class: Features extractor to use.\n :param features_extractor_kwargs: Keyword arguments\n to pass to the features extractor.\n :param share_features_extractor: If True, the features extractor is shared between the policy and value networks.\n :param normalize_images: Whether to normalize images or not,\n dividing by 255.0 (True by default)\n :param optimizer_class: The optimizer to use,\n ``th.optim.Adam`` by default\n :param optimizer_kwargs: Additional keyword arguments,\n excluding the learning rate, to pass to the optimizer\n ", "__init__": "<function ActorCriticPolicy.__init__ at 0x7bb2389d5a20>", "_get_constructor_parameters": "<function ActorCriticPolicy._get_constructor_parameters at 0x7bb2389d5ab0>", "reset_noise": "<function ActorCriticPolicy.reset_noise at 0x7bb2389d5b40>", "_build_mlp_extractor": "<function ActorCriticPolicy._build_mlp_extractor at 0x7bb2389d5bd0>", "_build": "<function ActorCriticPolicy._build at 0x7bb2389d5c60>", "forward": "<function ActorCriticPolicy.forward at 0x7bb2389d5cf0>", "extract_features": "<function ActorCriticPolicy.extract_features at 0x7bb2389d5d80>", "_get_action_dist_from_latent": "<function ActorCriticPolicy._get_action_dist_from_latent at 0x7bb2389d5e10>", "_predict": "<function ActorCriticPolicy._predict at 0x7bb2389d5ea0>", "evaluate_actions": "<function ActorCriticPolicy.evaluate_actions at 0x7bb2389d5f30>", "get_distribution": "<function ActorCriticPolicy.get_distribution at 0x7bb2389d5fc0>", "predict_values": "<function ActorCriticPolicy.predict_values at 0x7bb2389d6050>", "__abstractmethods__": "frozenset()", "_abc_impl": "<_abc._abc_data object at 0x7bb238b624c0>"}, "verbose": 1, "policy_kwargs": {}, "num_timesteps": 1507328, "_total_timesteps": 1500000, "_num_timesteps_at_start": 0, "seed": null, "action_noise": null, "start_time": 1726532143493315846, "learning_rate": {":type:": "<class 'function'>", ":serialized:": "gAWVNwIAAAAAAACMF2Nsb3VkcGlja2xlLmNsb3VkcGlja2xllIwOX21ha2VfZnVuY3Rpb26Uk5QoaACMDV9idWlsdGluX3R5cGWUk5SMCENvZGVUeXBllIWUUpQoSwFLAEsASwFLAktDQwhkAXwAFABTAJSMVgogIExlYXJuaW5nIHJhdGUgc2NoZWR1bGUuCgogIDpwYXJhbSBwcm9ncmVzc19yZW1haW5pbmc6IChmbG9hdCkKICA6cmV0dXJuOiAoZmxvYXQpCiAglEc/gm6XjU/fO4aUKYwScHJvZ3Jlc3NfcmVtYWluaW5nlIWUjB88aXB5dGhvbi1pbnB1dC00NS1mNzVkZWEzMTBiMmE+lIwLbHJfc2NoZWR1bGWUSwFDAggHlCkpdJRSlH2UKIwLX19wYWNrYWdlX1+UTowIX19uYW1lX1+UjAhfX21haW5fX5R1Tk5OdJRSlIwcY2xvdWRwaWNrbGUuY2xvdWRwaWNrbGVfZmFzdJSMEl9mdW5jdGlvbl9zZXRzdGF0ZZSTlGgXfZR9lChoFGgOjAxfX3F1YWxuYW1lX1+UaA6MD19fYW5ub3RhdGlvbnNfX5R9lIwOX19rd2RlZmF1bHRzX1+UTowMX19kZWZhdWx0c19flE6MCl9fbW9kdWxlX1+UaBWMB19fZG9jX1+UaAmMC19fY2xvc3VyZV9flE6MF19jbG91ZHBpY2tsZV9zdWJtb2R1bGVzlF2UjAtfX2dsb2JhbHNfX5R9lHWGlIZSMC4="}, "tensorboard_log": null, "_last_obs": {":type:": "<class 'numpy.ndarray'>", ":serialized:": "gAWVdQIAAAAAAACMEm51bXB5LmNvcmUubnVtZXJpY5SMC19mcm9tYnVmZmVylJOUKJYAAgAAAAAAAGb+CrzZ6aY/VLTFvX1kIr/jDkM7PX1qPAAAAAAAAAAAAADkvdfOnz+L5R2/pksUv+vapL3QdX++AAAAAAAAAAD68qo+n+wjPzP+db5p7Qu/x8+NPsUpOr4AAAAAAAAAADPWiTx/DA8+I9ZyvRkzg75AVbm9m2wGPQAAAAAAAAAAgJk4vkxanj6S3ho+RSSavsqRmr2Lk988AAAAAAAAAACatwk8K7qZP2ZBkzyHqxq/aZTRPOKsFD0AAAAAAAAAAJo5kb0pLEu6PySUNzP3qrCPj+W6tSistgAAgD8AAIA/s9+fvpZehT+3qgm/PHo2v2sXob4V01C9AAAAAAAAAACaKZQ8Ya/vO31ST75y9cO9DlwjvUrcfj8AAIA/AAAAAFqkjj64P6M/zXIkP3rQIL/nJI8+WT2kPgAAAAAAAAAATcklvWpeoD+6ZrG+FQkmv4Bsrry+KNG9AAAAAAAAAADA8Ra+hAazP3pn177rjeK+oaVmveNNBr4AAAAAAAAAAGaPwjxiOHw+2xdqvfvel74BmFa8RMOJvQAAAAAAAAAAGpDiPbUGlz+yScs+bJIXv2RwLT448lY+AAAAAAAAAACaOXI6wNWePsTLI76xRJW+udxgvSR1mLwAAAAAAAAAAJrYkrwUqKS61tJKs8+hL7CDlkY6lrvDMwAAgD8AAIA/lIwFbnVtcHmUjAVkdHlwZZSTlIwCZjSUiYiHlFKUKEsDjAE8lE5OTkr/////Sv////9LAHSUYksQSwiGlIwBQ5R0lFKULg=="}, "_last_episode_starts": {":type:": "<class 'numpy.ndarray'>", ":serialized:": "gAWVgwAAAAAAAACMEm51bXB5LmNvcmUubnVtZXJpY5SMC19mcm9tYnVmZmVylJOUKJYQAAAAAAAAAAAAAAAAAAAAAAAAAAAAAACUjAVudW1weZSMBWR0eXBllJOUjAJiMZSJiIeUUpQoSwOMAXyUTk5OSv////9K/////0sAdJRiSxCFlIwBQ5R0lFKULg=="}, "_last_original_obs": null, "_episode_num": 0, "use_sde": false, "sde_sample_freq": -1, "_current_progress_remaining": -0.004885333333333408, "_stats_window_size": 100, "ep_info_buffer": {":type:": "<class 'collections.deque'>", ":serialized:": "gAWV7AsAAAAAAACMC2NvbGxlY3Rpb25zlIwFZGVxdWWUk5QpS2SGlFKUKH2UKIwBcpRHQG+hLZ8KG+OMAWyUS8WMAXSUR0C58MuAI6bOdX2UKGgGR0BwNiBMBZIQaAdL7WgIR0C58N5/oaDPdX2UKGgGR0BxU/4k/r0KaAdLwGgIR0C58PDJyQxOdX2UKGgGR0BwKaFQEZBLaAdL5mgIR0C58P3ctXgcdX2UKGgGR0BxckUzsQd0aAdL2mgIR0C58QzG1hLHdX2UKGgGR0ByztwT/Q0GaAdLwmgIR0C58SRmkFfRdX2UKGgGR0Bw+jgWJrLyaAdL4mgIR0C58Sv2saKldX2UKGgGR0BwDaluWKMvaAdL32gIR0C58TPAj6eodX2UKGgGR0Bw9ZhmXgLraAdL1mgIR0C58USsCDEndX2UKGgGR0BxKU+Y+jdpaAdL7GgIR0C58Wd6gM+edX2UKGgGR0ByvzL4etCBaAdLzWgIR0C58WwuEmICdX2UKGgGR0BupZC0F8ohaAdL62gIR0C58a5bdJrddX2UKGgGR0BusGB8QZn+aAdLz2gIR0C58cDjWCmNdX2UKGgGR0Bu4kO/cnE3aAdL2mgIR0C58eT6i0v5dX2UKGgGR0BvCctkFwDOaAdL2GgIR0C58f6KtPpIdX2UKGgGR0BzyKg6EJ0GaAdNIwFoCEdAufIJRVIZqHV9lChoBkdAchItCiRGMGgHS91oCEdAufIax2SuAHV9lChoBkdAboUVh1DBuWgHS9toCEdAufIq6Zpi7XV9lChoBkdAc1t/yoXKsGgHS8ZoCEdAufJX8tPHk3V9lChoBkdAcmdwX668QWgHS/BoCEdAufJaPT5O8HV9lChoBkdAb5H9JjDsMWgHS99oCEdAufJ2SDAaenV9lChoBkdAcL+e7+T/yWgHS8xoCEdAufJ2R/3Fk3V9lChoBkdAc/oPUrkKeGgHS/1oCEdAufKADNhVl3V9lChoBkdAcVO5U96kZmgHS/RoCEdAufKMMb3oLXV9lChoBkdAcOA7L+xW1mgHS8doCEdAufKQxASnL3V9lChoBkdAcnlFs54nnmgHS81oCEdAufKc5Lh73XV9lChoBkdAUF6cBltj1GgHS5FoCEdAufLp6C17Y3V9lChoBkdAcC2zt1IRRWgHS+toCEdAufMdy5qdpnV9lChoBkdAbbEPdVNpNGgHS9toCEdAufMrQVsUI3V9lChoBkdAc0DcvM8oyGgHTQABaAhHQLnzLJ3gUDd1fZQoaAZHQG1rbSJCSidoB03jAWgIR0C596VchTwVdX2UKGgGR0Bxe0wmE5AAaAdLz2gIR0C598xyCFsYdX2UKGgGR0BxFE7NjbztaAdL/WgIR0C59+8QiA2AdX2UKGgGR0BykPJEH+qBaAdL2mgIR0C5+CL7GecydX2UKGgGR0BxQ1PEbYK6aAdLzWgIR0C5+FIN3GGVdX2UKGgGR0Bw4MQSSNfgaAdL7mgIR0C5+FIhY/3WdX2UKGgGR0BxS2pKjBVNaAdL3GgIR0C5+F6nrIHUdX2UKGgGR0Bym5nanJkoaAdL1GgIR0C5+GeYYzi0dX2UKGgGR0BvbcLORkmQaAdL62gIR0C5+G5++dsjdX2UKGgGR0BxrVnOB19waAdL2WgIR0C5+ILamGdqdX2UKGgGR0BwsR7IDHOsaAdLwmgIR0C5+Sbjo6jndX2UKGgGR0BwcIdFOO81aAdL3WgIR0C5+VhY7q6fdX2UKGgGR0BDFDpkf9xZaAdLuGgIR0C5+WDfm9xqdX2UKGgGR0BzjVqM3qA0aAdL2mgIR0C5+WPVurIYdX2UKGgGR0ByUwrGza9LaAdL5GgIR0C5+Z6kVN5/dX2UKGgGR0By55Q+EAYIaAdNLwFoCEdAufnAnLJSznV9lChoBkdAcpdv99+gDmgHS9hoCEdAufnD4QBgeHV9lChoBkdAcBx6Rhc7hmgHS9loCEdAufntuqFRHnV9lChoBkdAcJnVn27FsGgHS9hoCEdAufoPbVSXMXV9lChoBkdAcQxK+zt1IWgHS9ZoCEdAufoeLHdXT3V9lChoBkdAc92cKPXCj2gHS9doCEdAufomRgZ0jnV9lChoBkdAcv1ffoA4oGgHS+hoCEdAufoqc3EQ5HV9lChoBkdAcXRfYjB2wGgHTcgBaAhHQLn6L9hZyMl1fZQoaAZHQG560WdmQKdoB0vuaAhHQLn6O0E5hjR1fZQoaAZHQHHCkPhAGB5oB0voaAhHQLn6SyTINmV1fZQoaAZHQHDorfxc3VFoB0viaAhHQLn6syhSLqF1fZQoaAZHQHIYbmdRR/FoB0vdaAhHQLn6zsvIwM91fZQoaAZHQHGWajBVMmFoB0vJaAhHQLn61zoEB8x1fZQoaAZHQG6BL+5vtMRoB0vmaAhHQLn63xFAmiR1fZQoaAZHQHHzLcTJyQxoB0vEaAhHQLn67elKsdV1fZQoaAZHQHHODCLuQZJoB0vCaAhHQLn7NeQMhHN1fZQoaAZHQHIc/ZyuIRBoB0u6aAhHQLn7N7vG6wt1fZQoaAZHQHJ73wCr92poB00FAWgIR0C5+1kM5OrRdX2UKGgGR0BzitKtga3raAdL7mgIR0C5+16eTV2BdX2UKGgGR0By3mFQEZBLaAdL1mgIR0C5+3Jm7J4jdX2UKGgGR0BzJ8RjBl+WaAdL5mgIR0C5+4e3pfQbdX2UKGgGR0BtYTsv7FbWaAdL4WgIR0C5+4mVVxS6dX2UKGgGR0BxsZU6xPfsaAdL5GgIR0C5+5nTI/7jdX2UKGgGR0BvXhjSXt0FaAdL9GgIR0C5+8WmP5pKdX2UKGgGR0Bw290ihWYGaAdLwmgIR0C5+/2w3YL9dX2UKGgGR0BzNIr7O3UhaAdNpQFoCEdAufwBic5Ke3V9lChoBkdAcNrLYf4h2WgHS9toCEdAufwKEEkjYHV9lChoBkdAcGRhAWznimgHS+toCEdAufxejdpItnV9lChoBkdAcYHC3PRiPWgHS/hoCEdAufxi7nPmgnV9lChoBkdAcoaqqwQlKWgHS8NoCEdAufxpt8/lhnV9lChoBkdAcThll9SdfGgHTRMBaAhHQLn8hC1JDmd1fZQoaAZHQHBLY4ZMtbtoB0vJaAhHQLn8pziCJ411fZQoaAZHQHFCDBEa2ndoB0viaAhHQLn8uCQcPvt1fZQoaAZHQHKVRwhnrY5oB0v5aAhHQLn84LThHb11fZQoaAZHQHAX4od+5OJoB0vsaAhHQLn89TefqX51fZQoaAZHQG50NcW0qpdoB00fAWgIR0C5/PfZVXFMdX2UKGgGR0Bw9m16Vt4zaAdL52gIR0C5/QEa2nbZdX2UKGgGR0BwWb3pOerdaAdLymgIR0C5/QC/fwZwdX2UKGgGR0Bx6QOavzOHaAdL9mgIR0C5/QYvalDXdX2UKGgGR0BfExrzoUzsaAdN6ANoCEdAuf0Gup0fYHV9lChoBkdAbxMxptaY/mgHS9xoCEdAuf1DK+zt1XV9lChoBkdAc6CQUpNKy2gHS9VoCEdAuf1EgNgBtHV9lChoBkdAcdpOclPac2gHTQcBaAhHQLn9gsEJSix1fZQoaAZHQG+NDrJKaodoB0vKaAhHQLn9ioRIz311fZQoaAZHQHEhTK1XvH9oB0vMaAhHQLn9pyO7xut1fZQoaAZHQHQF4dIXj2loB0vnaAhHQLn9qssQNCt1fZQoaAZHQHMcWrGR3eNoB0v7aAhHQLn9zSNwR5F1fZQoaAZHQHLDIOH31z1oB0vsaAhHQLn9+ykKu0V1fZQoaAZHQHOQI1gpjMFoB0vVaAhHQLn+D2JBPbh1fZQoaAZHQHGROI68xsVoB0vIaAhHQLn+Gk3S8ap1fZQoaAZHQHIt8CDEm6ZoB00AAWgIR0C5/ilMIu5CdX2UKGgGR0ByvS7/XGwSaAdL1GgIR0C5/izdDYywdX2UKGgGR0BwcyCYkVvdaAdL4GgIR0C5/jLeqJdjdX2UKGgGR0Bv1bIeYD1XaAdL5GgIR0C5/jmpyZKGdX2UKGgGR0BxAwvUSZjQaAdL3WgIR0C5/j2Jm/WUdWUu"}, "ep_success_buffer": {":type:": "<class 'collections.deque'>", ":serialized:": "gAWVIAAAAAAAAACMC2NvbGxlY3Rpb25zlIwFZGVxdWWUk5QpS2SGlFKULg=="}, "_n_updates": 368, "observation_space": {":type:": "<class 'gymnasium.spaces.box.Box'>", ":serialized:": "gAWVdgIAAAAAAACMFGd5bW5hc2l1bS5zcGFjZXMuYm94lIwDQm94lJOUKYGUfZQojAVkdHlwZZSMBW51bXB5lIwFZHR5cGWUk5SMAmY0lImIh5RSlChLA4wBPJROTk5K/////0r/////SwB0lGKMDWJvdW5kZWRfYmVsb3eUjBJudW1weS5jb3JlLm51bWVyaWOUjAtfZnJvbWJ1ZmZlcpSTlCiWCAAAAAAAAAABAQEBAQEBAZRoCIwCYjGUiYiHlFKUKEsDjAF8lE5OTkr/////Sv////9LAHSUYksIhZSMAUOUdJRSlIwNYm91bmRlZF9hYm92ZZRoESiWCAAAAAAAAAABAQEBAQEBAZRoFUsIhZRoGXSUUpSMBl9zaGFwZZRLCIWUjANsb3eUaBEoliAAAAAAAAAAAAC0wgAAtMIAAKDAAACgwNsPScAAAKDAAAAAgAAAAICUaAtLCIWUaBl0lFKUjARoaWdolGgRKJYgAAAAAAAAAAAAtEIAALRCAACgQAAAoEDbD0lAAACgQAAAgD8AAIA/lGgLSwiFlGgZdJRSlIwIbG93X3JlcHKUjFtbLTkwLiAgICAgICAgLTkwLiAgICAgICAgIC01LiAgICAgICAgIC01LiAgICAgICAgIC0zLjE0MTU5MjcgIC01LgogIC0wLiAgICAgICAgIC0wLiAgICAgICBdlIwJaGlnaF9yZXBylIxTWzkwLiAgICAgICAgOTAuICAgICAgICAgNS4gICAgICAgICA1LiAgICAgICAgIDMuMTQxNTkyNyAgNS4KICAxLiAgICAgICAgIDEuICAgICAgIF2UjApfbnBfcmFuZG9tlE51Yi4=", "dtype": "float32", "bounded_below": "[ True True True True True True True True]", "bounded_above": "[ True True True True True True True True]", "_shape": [8], "low": "[-90. -90. -5. -5. -3.1415927 -5.\n -0. -0. ]", "high": "[90. 90. 5. 5. 3.1415927 5.\n 1. 1. ]", "low_repr": "[-90. -90. -5. -5. -3.1415927 -5.\n -0. -0. ]", "high_repr": "[90. 90. 5. 5. 3.1415927 5.\n 1. 1. ]", "_np_random": null}, "action_space": {":type:": "<class 'gymnasium.spaces.discrete.Discrete'>", ":serialized:": "gAWV2wAAAAAAAACMGWd5bW5hc2l1bS5zcGFjZXMuZGlzY3JldGWUjAhEaXNjcmV0ZZSTlCmBlH2UKIwBbpSMFW51bXB5LmNvcmUubXVsdGlhcnJheZSMBnNjYWxhcpSTlIwFbnVtcHmUjAVkdHlwZZSTlIwCaTiUiYiHlFKUKEsDjAE8lE5OTkr/////Sv////9LAHSUYkMIBAAAAAAAAACUhpRSlIwFc3RhcnSUaAhoDkMIAAAAAAAAAACUhpRSlIwGX3NoYXBllCmMBWR0eXBllGgOjApfbnBfcmFuZG9tlE51Yi4=", "n": "4", "start": "0", "_shape": [], "dtype": "int64", "_np_random": null}, "n_envs": 16, "n_steps": 1024, "gamma": 0.999, "gae_lambda": 0.98, "ent_coef": 0.01, "vf_coef": 0.5, "max_grad_norm": 0.5, "batch_size": 64, "n_epochs": 4, "clip_range": {":type:": "<class 'function'>", ":serialized:": "gAWVxQIAAAAAAACMF2Nsb3VkcGlja2xlLmNsb3VkcGlja2xllIwOX21ha2VfZnVuY3Rpb26Uk5QoaACMDV9idWlsdGluX3R5cGWUk5SMCENvZGVUeXBllIWUUpQoSwFLAEsASwFLAUsTQwSIAFMAlE6FlCmMAV+UhZSMSS91c3IvbG9jYWwvbGliL3B5dGhvbjMuMTAvZGlzdC1wYWNrYWdlcy9zdGFibGVfYmFzZWxpbmVzMy9jb21tb24vdXRpbHMucHmUjARmdW5jlEuEQwIEAZSMA3ZhbJSFlCl0lFKUfZQojAtfX3BhY2thZ2VfX5SMGHN0YWJsZV9iYXNlbGluZXMzLmNvbW1vbpSMCF9fbmFtZV9flIwec3RhYmxlX2Jhc2VsaW5lczMuY29tbW9uLnV0aWxzlIwIX19maWxlX1+UjEkvdXNyL2xvY2FsL2xpYi9weXRob24zLjEwL2Rpc3QtcGFja2FnZXMvc3RhYmxlX2Jhc2VsaW5lczMvY29tbW9uL3V0aWxzLnB5lHVOTmgAjBBfbWFrZV9lbXB0eV9jZWxslJOUKVKUhZR0lFKUjBxjbG91ZHBpY2tsZS5jbG91ZHBpY2tsZV9mYXN0lIwSX2Z1bmN0aW9uX3NldHN0YXRllJOUaB99lH2UKGgWaA2MDF9fcXVhbG5hbWVfX5SMGWNvbnN0YW50X2ZuLjxsb2NhbHM+LmZ1bmOUjA9fX2Fubm90YXRpb25zX1+UfZSMDl9fa3dkZWZhdWx0c19flE6MDF9fZGVmYXVsdHNfX5ROjApfX21vZHVsZV9flGgXjAdfX2RvY19flE6MC19fY2xvc3VyZV9flGgAjApfbWFrZV9jZWxslJOURz/JmZmZmZmahZRSlIWUjBdfY2xvdWRwaWNrbGVfc3VibW9kdWxlc5RdlIwLX19nbG9iYWxzX1+UfZR1hpSGUjAu"}, "clip_range_vf": null, "normalize_advantage": true, "target_kl": null, "lr_schedule": {":type:": "<class 'function'>", ":serialized:": "gAWVNwIAAAAAAACMF2Nsb3VkcGlja2xlLmNsb3VkcGlja2xllIwOX21ha2VfZnVuY3Rpb26Uk5QoaACMDV9idWlsdGluX3R5cGWUk5SMCENvZGVUeXBllIWUUpQoSwFLAEsASwFLAktDQwhkAXwAFABTAJSMVgogIExlYXJuaW5nIHJhdGUgc2NoZWR1bGUuCgogIDpwYXJhbSBwcm9ncmVzc19yZW1haW5pbmc6IChmbG9hdCkKICA6cmV0dXJuOiAoZmxvYXQpCiAglEc/gm6XjU/fO4aUKYwScHJvZ3Jlc3NfcmVtYWluaW5nlIWUjB88aXB5dGhvbi1pbnB1dC00NS1mNzVkZWEzMTBiMmE+lIwLbHJfc2NoZWR1bGWUSwFDAggHlCkpdJRSlH2UKIwLX19wYWNrYWdlX1+UTowIX19uYW1lX1+UjAhfX21haW5fX5R1Tk5OdJRSlIwcY2xvdWRwaWNrbGUuY2xvdWRwaWNrbGVfZmFzdJSMEl9mdW5jdGlvbl9zZXRzdGF0ZZSTlGgXfZR9lChoFGgOjAxfX3F1YWxuYW1lX1+UaA6MD19fYW5ub3RhdGlvbnNfX5R9lIwOX19rd2RlZmF1bHRzX1+UTowMX19kZWZhdWx0c19flE6MCl9fbW9kdWxlX1+UaBWMB19fZG9jX1+UaAmMC19fY2xvc3VyZV9flE6MF19jbG91ZHBpY2tsZV9zdWJtb2R1bGVzlF2UjAtfX2dsb2JhbHNfX5R9lHWGlIZSMC4="}, "system_info": {"OS": "Linux-6.1.85+-x86_64-with-glibc2.35 # 1 SMP PREEMPT_DYNAMIC Thu Jun 27 21:05:47 UTC 2024", "Python": "3.10.12", "Stable-Baselines3": "2.0.0a5", "PyTorch": "2.4.0+cu121", "GPU Enabled": "True", "Numpy": "1.26.4", "Cloudpickle": "2.2.1", "Gymnasium": "0.28.1", "OpenAI Gym": "0.25.2"}}
 
1
+ {"policy_class": {":type:": "<class 'abc.ABCMeta'>", ":serialized:": "gAWVOwAAAAAAAACMIXN0YWJsZV9iYXNlbGluZXMzLmNvbW1vbi5wb2xpY2llc5SMEUFjdG9yQ3JpdGljUG9saWN5lJOULg==", "__module__": "stable_baselines3.common.policies", "__doc__": "\n Policy class for actor-critic algorithms (has both policy and value prediction).\n Used by A2C, PPO and the likes.\n\n :param observation_space: Observation space\n :param action_space: Action space\n :param lr_schedule: Learning rate schedule (could be constant)\n :param net_arch: The specification of the policy and value networks.\n :param activation_fn: Activation function\n :param ortho_init: Whether to use or not orthogonal initialization\n :param use_sde: Whether to use State Dependent Exploration or not\n :param log_std_init: Initial value for the log standard deviation\n :param full_std: Whether to use (n_features x n_actions) parameters\n for the std instead of only (n_features,) when using gSDE\n :param use_expln: Use ``expln()`` function instead of ``exp()`` to ensure\n a positive standard deviation (cf paper). It allows to keep variance\n above zero and prevent it from growing too fast. In practice, ``exp()`` is usually enough.\n :param squash_output: Whether to squash the output using a tanh function,\n this allows to ensure boundaries when using gSDE.\n :param features_extractor_class: Features extractor to use.\n :param features_extractor_kwargs: Keyword arguments\n to pass to the features extractor.\n :param share_features_extractor: If True, the features extractor is shared between the policy and value networks.\n :param normalize_images: Whether to normalize images or not,\n dividing by 255.0 (True by default)\n :param optimizer_class: The optimizer to use,\n ``th.optim.Adam`` by default\n :param optimizer_kwargs: Additional keyword arguments,\n excluding the learning rate, to pass to the optimizer\n ", "__init__": "<function ActorCriticPolicy.__init__ at 0x7cde4a719900>", "_get_constructor_parameters": "<function ActorCriticPolicy._get_constructor_parameters at 0x7cde4a719990>", "reset_noise": "<function ActorCriticPolicy.reset_noise at 0x7cde4a719a20>", "_build_mlp_extractor": "<function ActorCriticPolicy._build_mlp_extractor at 0x7cde4a719ab0>", "_build": "<function ActorCriticPolicy._build at 0x7cde4a719b40>", "forward": "<function ActorCriticPolicy.forward at 0x7cde4a719bd0>", "extract_features": "<function ActorCriticPolicy.extract_features at 0x7cde4a719c60>", "_get_action_dist_from_latent": "<function ActorCriticPolicy._get_action_dist_from_latent at 0x7cde4a719cf0>", "_predict": "<function ActorCriticPolicy._predict at 0x7cde4a719d80>", "evaluate_actions": "<function ActorCriticPolicy.evaluate_actions at 0x7cde4a719e10>", "get_distribution": "<function ActorCriticPolicy.get_distribution at 0x7cde4a719ea0>", "predict_values": "<function ActorCriticPolicy.predict_values at 0x7cde4a719f30>", "__abstractmethods__": "frozenset()", "_abc_impl": "<_abc._abc_data object at 0x7cde4a8a99c0>"}, "verbose": 1, "policy_kwargs": {}, "num_timesteps": 2015232, "_total_timesteps": 2000000, "_num_timesteps_at_start": 0, "seed": null, "action_noise": null, "start_time": 1726560783775658137, "learning_rate": {":type:": "<class 'function'>", ":serialized:": "gAWVQwIAAAAAAACMF2Nsb3VkcGlja2xlLmNsb3VkcGlja2xllIwOX21ha2VfZnVuY3Rpb26Uk5QoaACMDV9idWlsdGluX3R5cGWUk5SMCENvZGVUeXBllIWUUpQoSwFLAEsASwFLAktDQwxkAXwAFABkAhcAUwCUjFYKICBMZWFybmluZyByYXRlIHNjaGVkdWxlLgoKICA6cGFyYW0gcHJvZ3Jlc3NfcmVtYWluaW5nOiAoZmxvYXQpCiAgOnJldHVybjogKGZsb2F0KQogIJRHP3ysCDEm6XlHP2iTdLxqfvqHlCmMEnByb2dyZXNzX3JlbWFpbmluZ5SFlIwePGlweXRob24taW5wdXQtOC01MjEwZTkzZTMzYmY+lIwLbHJfc2NoZWR1bGWUSwFDAgwHlCkpdJRSlH2UKIwLX19wYWNrYWdlX1+UTowIX19uYW1lX1+UjAhfX21haW5fX5R1Tk5OdJRSlIwcY2xvdWRwaWNrbGUuY2xvdWRwaWNrbGVfZmFzdJSMEl9mdW5jdGlvbl9zZXRzdGF0ZZSTlGgXfZR9lChoFGgOjAxfX3F1YWxuYW1lX1+UaA6MD19fYW5ub3RhdGlvbnNfX5R9lIwOX19rd2RlZmF1bHRzX1+UTowMX19kZWZhdWx0c19flE6MCl9fbW9kdWxlX1+UaBWMB19fZG9jX1+UaAmMC19fY2xvc3VyZV9flE6MF19jbG91ZHBpY2tsZV9zdWJtb2R1bGVzlF2UjAtfX2dsb2JhbHNfX5R9lHWGlIZSMC4="}, "tensorboard_log": null, "_last_obs": {":type:": "<class 'numpy.ndarray'>", ":serialized:": "gAWVdQIAAAAAAACMEm51bXB5LmNvcmUubnVtZXJpY5SMC19mcm9tYnVmZmVylJOUKJYAAgAAAAAAAPojXz6wqos+e5bDvrahgL677Cg9ttT5vQAAAAAAAAAAgJ1iPgk4Tj6etoK+QFpqvpmOij0vL8y6AAAAAAAAAAAAvHW8IJUtP6UPoT26Dfe+EyrIvLzxiTwAAAAAAAAAAGatq7zHZi0/dt8XPifYCb/2LUK9zTj9PQAAAAAAAAAAzW7wvDoUuT9C0Ti/duuyPmQ0sjz2aR09AAAAAAAAAACANFU9XNWtP5dVHT+Ze8W+m9a3u50RCT4AAAAAAAAAAHMZuD24JrC5Vs6TvL8jF7XI1YC6dax/NAAAgD8AAIA/GqgMPh/+3btYgQq6i0q3N7svK727sjI5AACAPwAAgD/NDFQ7aX0svP6yn76ki3e9ulaXPUsYTj4AAIA/AACAPwD59LyC9qI/om8EvmpT4r5jicm9bs1LvQAAAAAAAAAAQByQvXvtfT9B1Ae8tsAMv4gn672yHBk8AAAAAAAAAADzIGs+/CddPr3FZ75XIJi+ByspPh2VbL0AAAAAAAAAAAAZYr2PSlI/1iJKPYoRA7/bD9+9+zm7PQAAAAAAAAAAZsYRPTig/rs8eg+8aXI7PO3vTb2ntB89AACAPwAAgD+IlZG+OJgGP721Lj4nYMO+fdZJvvrj5j0AAAAAAAAAAIv0ir5IcZE++MOiPmql377BNsG9NIQTPgAAAAAAAAAAlIwFbnVtcHmUjAVkdHlwZZSTlIwCZjSUiYiHlFKUKEsDjAE8lE5OTkr/////Sv////9LAHSUYksQSwiGlIwBQ5R0lFKULg=="}, "_last_episode_starts": {":type:": "<class 'numpy.ndarray'>", ":serialized:": "gAWVgwAAAAAAAACMEm51bXB5LmNvcmUubnVtZXJpY5SMC19mcm9tYnVmZmVylJOUKJYQAAAAAAAAAAAAAAAAAAAAAAAAAAAAAACUjAVudW1weZSMBWR0eXBllJOUjAJiMZSJiIeUUpQoSwOMAXyUTk5OSv////9K/////0sAdJRiSxCFlIwBQ5R0lFKULg=="}, "_last_original_obs": null, "_episode_num": 0, "use_sde": false, "sde_sample_freq": -1, "_current_progress_remaining": -0.007616000000000067, "_stats_window_size": 100, "ep_info_buffer": {":type:": "<class 'collections.deque'>", ":serialized:": "gAWV/QsAAAAAAACMC2NvbGxlY3Rpb25zlIwFZGVxdWWUk5QpS2SGlFKUKH2UKIwBcpRHQHMgTByjpLWMAWyUTQoBjAF0lEdAoOVzb8FY+3V9lChoBkdAb5iJqIrOJWgHS9poCEdAoOV8yFfzBnV9lChoBkdAcl/CEpRXOmgHS+1oCEdAoOXWO801qHV9lChoBkdAcioFt8/lhmgHS9FoCEdAoOYU45tFa3V9lChoBkdAcTs+JgsshGgHS/doCEdAoOZYf6oES3V9lChoBkdAcaQtRNyo42gHS9poCEdAoOZcEovzv3V9lChoBkdAcimzXjENv2gHS+ZoCEdAoOaw4yXUpnV9lChoBkdAc+rfZ26kI2gHS/doCEdAoOcY8OkLyHV9lChoBkdAcoSVy3kPtmgHS+FoCEdAoOcjbL2YfHV9lChoBkdAbqYLgn+hoWgHTQYBaAhHQKDngoiLVFx1fZQoaAZHQHCutQj2SMdoB0veaAhHQKDnxztkWh11fZQoaAZHQHBIvpQk5ZNoB0vhaAhHQKDoAsvIwM91fZQoaAZHQHEDAyhzvJBoB0vZaAhHQKDoaifQKKJ1fZQoaAZHQHPG88s+V1RoB0vxaAhHQKDokASWZ7Z1fZQoaAZHQG9pRp1zQu5oB00iAWgIR0Cg6SfHPu5SdX2UKGgGR0Bxie89Oh0yaAdNFwFoCEdAoOkzDl5nlHV9lChoBkdAcN97vXsgMmgHTRUBaAhHQKDpZ8E3bVV1fZQoaAZHQHK6BHf/FR5oB0v+aAhHQKDp5i97F851fZQoaAZHQHHtcSf16E9oB0v3aAhHQKDqHshPj4p1fZQoaAZHQHHQcZxaPjpoB0vnaAhHQKDqPpwCKaZ1fZQoaAZHQHDYsu3+dbxoB0v0aAhHQKDqdMr3Cbd1fZQoaAZHQHAuZ/G2kSFoB0vlaAhHQKDqnkupS751fZQoaAZHQHGZABPsRg9oB000AWgIR0Cg6qXYL9dedX2UKGgGR0BxDQXMyJsPaAdLy2gIR0Cg6tDVYp2EdX2UKGgGR0BzE8H3UQTVaAdNAAFoCEdAoOtGw5eZ5XV9lChoBkdAck0YrJ8v3GgHS9toCEdAoOueDe0ojXV9lChoBkdAcdpF2mpEQWgHS79oCEdAoOvYE6kqMHV9lChoBkdAbaFES/TLGWgHS/toCEdAoOvqmALApXV9lChoBkdAb/0gBcRlH2gHS/VoCEdAoOyN2ki2UnV9lChoBkdAc682NedCmmgHS/9oCEdAoOzwYaYNRXV9lChoBkdAcyeppvgm7mgHS+ZoCEdAoO0WFg2If3V9lChoBkdAb/WJcgQpWmgHS9RoCEdAoO1n29L6DXV9lChoBkdAcJyrNGEwnGgHS+poCEdAoO2ArvsqrnV9lChoBkdAbndMMZxaPmgHS9NoCEdAoO2W2TgVGnV9lChoBkdAc9qwA2hqTWgHTQ4BaAhHQKDt4K+BYmt1fZQoaAZHQHJY4xQBPsRoB00+AmgIR0Cg7eWznieedX2UKGgGR0BzVN+so2GZaAdNBAFoCEdAoO46swL3K3V9lChoBkdAcD7XzlLeymgHS/ZoCEdAoO4+1a4c3nV9lChoBkdAcokra/RE4WgHS+RoCEdAoO538dgfEHV9lChoBkdASTdVT72tdWgHS6loCEdAoO7rJEH+qHV9lChoBkdAcsysRxtHhGgHS+BoCEdAoPeIexOclXV9lChoBkdAcrFyVfNRnGgHTQ4BaAhHQKD4UM9bHIZ1fZQoaAZHQHEuaVdHDrJoB0vjaAhHQKD4xmHxjKB1fZQoaAZHQG9AKaoddVxoB0vQaAhHQKD49fUF0Pp1fZQoaAZHQG+Xygf2bodoB0vMaAhHQKD5AifQKKJ1fZQoaAZHQHCQV18stkFoB00GAWgIR0Cg+XXdbgTAdX2UKGgGR0BxTGRGMGX5aAdL+GgIR0Cg+cppN9H+dX2UKGgGR0BxqjRF7UobaAdL7GgIR0Cg+fQLeANHdX2UKGgGR0BpWmQXAM2FaAdNIQNoCEdAoPoOrU9ZBHV9lChoBkdAcwZYU34sVmgHS/ZoCEdAoPoUiliz9nV9lChoBkdAcmSw9JSR82gHS+toCEdAoPpGnO0LMXV9lChoBkdAcnat6HCXQmgHS+BoCEdAoPpdzZHuqnV9lChoBkdAcKt3o9s7+2gHS+hoCEdAoPr1U+9rXXV9lChoBkdAcOavJiiItWgHTQEBaAhHQKD7Qfe1rqN1fZQoaAZHQG/L2KdhAnloB0vQaAhHQKD8B5YYBNp1fZQoaAZHQG5KUDEFW4poB0vvaAhHQKD8DRLK3d91fZQoaAZHQHGyc6BAfMhoB0vWaAhHQKD8cuoP07N1fZQoaAZHQF5gmJm/WUdoB03oA2gIR0Cg/L7muDBedX2UKGgGR0Byb0FW4mTlaAdNKAFoCEdAoP4QOz6acHV9lChoBkdAch8WIoE0SGgHTQ4BaAhHQKD+O0dBBzF1fZQoaAZHQHL2oVRDTjNoB0vwaAhHQKD+bBInSfF1fZQoaAZHQHN8VfqoqCpoB0v7aAhHQKD+e/t6X0J1fZQoaAZHQHHrb3Cbc45oB00LAWgIR0Cg/pYLkS26dX2UKGgGR0BynPyvs7dSaAdL72gIR0Cg/tW912aEdX2UKGgGR0Byb+wpvxYraAdNDQFoCEdAoP78JrtVrHV9lChoBkdAcIzSx7iQ1mgHS+poCEdAoP+/8CPp6nV9lChoBkdAc0wVlwtJ4GgHTSIBaAhHQKD/26PKdQR1fZQoaAZHQDpgFC9h7VtoB0u3aAhHQKD/9Jd0JWx1fZQoaAZHQHFsn4oJAt5oB0v7aAhHQKEAm18b70p1fZQoaAZHQHF3ESh8IAxoB0vbaAhHQKEBEIInjQ11fZQoaAZHQHRUVPrOZ9doB00dAWgIR0ChAdrLhaTwdX2UKGgGR0ByTJPJq7AdaAdNBAFoCEdAoQIAYNy5qnV9lChoBkdAcWntl7MPjGgHS9doCEdAoQJMcfeUIXV9lChoBkdAbgNrpqynk2gHS9hoCEdAoQJqZnctXnV9lChoBkdAcMvIoE0SAmgHS/FoCEdAoQLmlEZzgnV9lChoBkdAbmrFNL127mgHS/ZoCEdAoQMWbgCOm3V9lChoBkdAcSKkFwDNhWgHTQIBaAhHQKEDLSWJJoV1fZQoaAZHQHAQ544ZMtdoB0v0aAhHQKEDPEwWWQh1fZQoaAZHQG+XDAJswcpoB0vkaAhHQKEDnUQ04zd1fZQoaAZHQHMuKxHG0eFoB00NAWgIR0ChA6nKOktVdX2UKGgGR0BxjlkVeruIaAdL5WgIR0ChA6oIfKZEdX2UKGgGR0BxOrPrv9cbaAdL+mgIR0ChA9d0aIepdX2UKGgGR0BtkMnmaH9FaAdL3mgIR0ChBE/l6qsEdX2UKGgGR0Bjji+i8FpxaAdN6ANoCEdAoQRv9rGipXV9lChoBkdAcvPYJ3PiUGgHTSgBaAhHQKEE8Zof0Vd1fZQoaAZHQHK8p1zQu29oB0vxaAhHQKEFH6po9LZ1fZQoaAZHQHMdQHeJpFloB0v3aAhHQKEFVhaTwDx1fZQoaAZHQHECoj4YaYNoB0vvaAhHQKEFlqY7aIx1fZQoaAZHQHFEBDPWxyJoB0vfaAhHQKEF0+t8uz11fZQoaAZHQHMRKXv6TGJoB0vtaAhHQKEGNKr7wa11fZQoaAZHQG4GDPGACnxoB0vnaAhHQKEGNnzQNTd1fZQoaAZHQG9fvhQ3xWloB0vaaAhHQKEGg2itaIN1fZQoaAZHQHBx5HmRvFZoB0vjaAhHQKEGlVDrqt51fZQoaAZHQHMN/LxI8QtoB00BAWgIR0ChBppW3jMndX2UKGgGR0BiVRE6T4cnaAdN6ANoCEdAoQbVnmJWNnV9lChoBkdAcy3c9GI9DGgHS+loCEdAoQbdjNIK+nV9lChoBkdAclL8DB/I82gHS/xoCEdAoQbq7ulXR3V9lChoBkdAcLRhufmLcmgHS/BoCEdAoQdyiEg4fnV9lChoBkdAcS91mrbQC2gHTQcBaAhHQKEHnddE9dN1fZQoaAZHQHFmAxnFo+RoB0vaaAhHQKEHqz0pVjt1ZS4="}, "ep_success_buffer": {":type:": "<class 'collections.deque'>", ":serialized:": "gAWVIAAAAAAAAACMC2NvbGxlY3Rpb25zlIwFZGVxdWWUk5QpS2SGlFKULg=="}, "_n_updates": 492, "observation_space": {":type:": "<class 'gymnasium.spaces.box.Box'>", ":serialized:": "gAWVdgIAAAAAAACMFGd5bW5hc2l1bS5zcGFjZXMuYm94lIwDQm94lJOUKYGUfZQojAVkdHlwZZSMBW51bXB5lIwFZHR5cGWUk5SMAmY0lImIh5RSlChLA4wBPJROTk5K/////0r/////SwB0lGKMDWJvdW5kZWRfYmVsb3eUjBJudW1weS5jb3JlLm51bWVyaWOUjAtfZnJvbWJ1ZmZlcpSTlCiWCAAAAAAAAAABAQEBAQEBAZRoCIwCYjGUiYiHlFKUKEsDjAF8lE5OTkr/////Sv////9LAHSUYksIhZSMAUOUdJRSlIwNYm91bmRlZF9hYm92ZZRoESiWCAAAAAAAAAABAQEBAQEBAZRoFUsIhZRoGXSUUpSMBl9zaGFwZZRLCIWUjANsb3eUaBEoliAAAAAAAAAAAAC0wgAAtMIAAKDAAACgwNsPScAAAKDAAAAAgAAAAICUaAtLCIWUaBl0lFKUjARoaWdolGgRKJYgAAAAAAAAAAAAtEIAALRCAACgQAAAoEDbD0lAAACgQAAAgD8AAIA/lGgLSwiFlGgZdJRSlIwIbG93X3JlcHKUjFtbLTkwLiAgICAgICAgLTkwLiAgICAgICAgIC01LiAgICAgICAgIC01LiAgICAgICAgIC0zLjE0MTU5MjcgIC01LgogIC0wLiAgICAgICAgIC0wLiAgICAgICBdlIwJaGlnaF9yZXBylIxTWzkwLiAgICAgICAgOTAuICAgICAgICAgNS4gICAgICAgICA1LiAgICAgICAgIDMuMTQxNTkyNyAgNS4KICAxLiAgICAgICAgIDEuICAgICAgIF2UjApfbnBfcmFuZG9tlE51Yi4=", "dtype": "float32", "bounded_below": "[ True True True True True True True True]", "bounded_above": "[ True True True True True True True True]", "_shape": [8], "low": "[-90. -90. -5. -5. -3.1415927 -5.\n -0. -0. ]", "high": "[90. 90. 5. 5. 3.1415927 5.\n 1. 1. ]", "low_repr": "[-90. -90. -5. -5. -3.1415927 -5.\n -0. -0. ]", "high_repr": "[90. 90. 5. 5. 3.1415927 5.\n 1. 1. ]", "_np_random": null}, "action_space": {":type:": "<class 'gymnasium.spaces.discrete.Discrete'>", ":serialized:": "gAWV2wAAAAAAAACMGWd5bW5hc2l1bS5zcGFjZXMuZGlzY3JldGWUjAhEaXNjcmV0ZZSTlCmBlH2UKIwBbpSMFW51bXB5LmNvcmUubXVsdGlhcnJheZSMBnNjYWxhcpSTlIwFbnVtcHmUjAVkdHlwZZSTlIwCaTiUiYiHlFKUKEsDjAE8lE5OTkr/////Sv////9LAHSUYkMIBAAAAAAAAACUhpRSlIwFc3RhcnSUaAhoDkMIAAAAAAAAAACUhpRSlIwGX3NoYXBllCmMBWR0eXBllGgOjApfbnBfcmFuZG9tlE51Yi4=", "n": "4", "start": "0", "_shape": [], "dtype": "int64", "_np_random": null}, "n_envs": 16, "n_steps": 1024, "gamma": 0.999, "gae_lambda": 0.98, "ent_coef": 0.01, "vf_coef": 0.5, "max_grad_norm": 0.5, "batch_size": 64, "n_epochs": 4, "clip_range": {":type:": "<class 'function'>", ":serialized:": "gAWVxQIAAAAAAACMF2Nsb3VkcGlja2xlLmNsb3VkcGlja2xllIwOX21ha2VfZnVuY3Rpb26Uk5QoaACMDV9idWlsdGluX3R5cGWUk5SMCENvZGVUeXBllIWUUpQoSwFLAEsASwFLAUsTQwSIAFMAlE6FlCmMAV+UhZSMSS91c3IvbG9jYWwvbGliL3B5dGhvbjMuMTAvZGlzdC1wYWNrYWdlcy9zdGFibGVfYmFzZWxpbmVzMy9jb21tb24vdXRpbHMucHmUjARmdW5jlEuEQwIEAZSMA3ZhbJSFlCl0lFKUfZQojAtfX3BhY2thZ2VfX5SMGHN0YWJsZV9iYXNlbGluZXMzLmNvbW1vbpSMCF9fbmFtZV9flIwec3RhYmxlX2Jhc2VsaW5lczMuY29tbW9uLnV0aWxzlIwIX19maWxlX1+UjEkvdXNyL2xvY2FsL2xpYi9weXRob24zLjEwL2Rpc3QtcGFja2FnZXMvc3RhYmxlX2Jhc2VsaW5lczMvY29tbW9uL3V0aWxzLnB5lHVOTmgAjBBfbWFrZV9lbXB0eV9jZWxslJOUKVKUhZR0lFKUjBxjbG91ZHBpY2tsZS5jbG91ZHBpY2tsZV9mYXN0lIwSX2Z1bmN0aW9uX3NldHN0YXRllJOUaB99lH2UKGgWaA2MDF9fcXVhbG5hbWVfX5SMGWNvbnN0YW50X2ZuLjxsb2NhbHM+LmZ1bmOUjA9fX2Fubm90YXRpb25zX1+UfZSMDl9fa3dkZWZhdWx0c19flE6MDF9fZGVmYXVsdHNfX5ROjApfX21vZHVsZV9flGgXjAdfX2RvY19flE6MC19fY2xvc3VyZV9flGgAjApfbWFrZV9jZWxslJOURz/JmZmZmZmahZRSlIWUjBdfY2xvdWRwaWNrbGVfc3VibW9kdWxlc5RdlIwLX19nbG9iYWxzX1+UfZR1hpSGUjAu"}, "clip_range_vf": null, "normalize_advantage": true, "target_kl": null, "lr_schedule": {":type:": "<class 'function'>", ":serialized:": "gAWVQwIAAAAAAACMF2Nsb3VkcGlja2xlLmNsb3VkcGlja2xllIwOX21ha2VfZnVuY3Rpb26Uk5QoaACMDV9idWlsdGluX3R5cGWUk5SMCENvZGVUeXBllIWUUpQoSwFLAEsASwFLAktDQwxkAXwAFABkAhcAUwCUjFYKICBMZWFybmluZyByYXRlIHNjaGVkdWxlLgoKICA6cGFyYW0gcHJvZ3Jlc3NfcmVtYWluaW5nOiAoZmxvYXQpCiAgOnJldHVybjogKGZsb2F0KQogIJRHP3ysCDEm6XlHP2iTdLxqfvqHlCmMEnByb2dyZXNzX3JlbWFpbmluZ5SFlIwePGlweXRob24taW5wdXQtOC01MjEwZTkzZTMzYmY+lIwLbHJfc2NoZWR1bGWUSwFDAgwHlCkpdJRSlH2UKIwLX19wYWNrYWdlX1+UTowIX19uYW1lX1+UjAhfX21haW5fX5R1Tk5OdJRSlIwcY2xvdWRwaWNrbGUuY2xvdWRwaWNrbGVfZmFzdJSMEl9mdW5jdGlvbl9zZXRzdGF0ZZSTlGgXfZR9lChoFGgOjAxfX3F1YWxuYW1lX1+UaA6MD19fYW5ub3RhdGlvbnNfX5R9lIwOX19rd2RlZmF1bHRzX1+UTowMX19kZWZhdWx0c19flE6MCl9fbW9kdWxlX1+UaBWMB19fZG9jX1+UaAmMC19fY2xvc3VyZV9flE6MF19jbG91ZHBpY2tsZV9zdWJtb2R1bGVzlF2UjAtfX2dsb2JhbHNfX5R9lHWGlIZSMC4="}, "system_info": {"OS": "Linux-6.1.85+-x86_64-with-glibc2.35 # 1 SMP PREEMPT_DYNAMIC Thu Jun 27 21:05:47 UTC 2024", "Python": "3.10.12", "Stable-Baselines3": "2.0.0a5", "PyTorch": "2.4.0+cu121", "GPU Enabled": "True", "Numpy": "1.26.4", "Cloudpickle": "2.2.1", "Gymnasium": "0.28.1", "OpenAI Gym": "0.25.2"}}
ppo-LunarLander-v2.zip CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:939139178084454d7eadd5f7a2595c072be542d237f2c9ab91442082085892c4
3
- size 148620
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:235a20fe63e8d7b3be1531a78d98dd07f2b0f7d6c2799427177dd94092823aa2
3
+ size 148676
ppo-LunarLander-v2/data CHANGED
@@ -4,37 +4,37 @@
4
  ":serialized:": "gAWVOwAAAAAAAACMIXN0YWJsZV9iYXNlbGluZXMzLmNvbW1vbi5wb2xpY2llc5SMEUFjdG9yQ3JpdGljUG9saWN5lJOULg==",
5
  "__module__": "stable_baselines3.common.policies",
6
  "__doc__": "\n Policy class for actor-critic algorithms (has both policy and value prediction).\n Used by A2C, PPO and the likes.\n\n :param observation_space: Observation space\n :param action_space: Action space\n :param lr_schedule: Learning rate schedule (could be constant)\n :param net_arch: The specification of the policy and value networks.\n :param activation_fn: Activation function\n :param ortho_init: Whether to use or not orthogonal initialization\n :param use_sde: Whether to use State Dependent Exploration or not\n :param log_std_init: Initial value for the log standard deviation\n :param full_std: Whether to use (n_features x n_actions) parameters\n for the std instead of only (n_features,) when using gSDE\n :param use_expln: Use ``expln()`` function instead of ``exp()`` to ensure\n a positive standard deviation (cf paper). It allows to keep variance\n above zero and prevent it from growing too fast. In practice, ``exp()`` is usually enough.\n :param squash_output: Whether to squash the output using a tanh function,\n this allows to ensure boundaries when using gSDE.\n :param features_extractor_class: Features extractor to use.\n :param features_extractor_kwargs: Keyword arguments\n to pass to the features extractor.\n :param share_features_extractor: If True, the features extractor is shared between the policy and value networks.\n :param normalize_images: Whether to normalize images or not,\n dividing by 255.0 (True by default)\n :param optimizer_class: The optimizer to use,\n ``th.optim.Adam`` by default\n :param optimizer_kwargs: Additional keyword arguments,\n excluding the learning rate, to pass to the optimizer\n ",
7
- "__init__": "<function ActorCriticPolicy.__init__ at 0x7bb2389d5a20>",
8
- "_get_constructor_parameters": "<function ActorCriticPolicy._get_constructor_parameters at 0x7bb2389d5ab0>",
9
- "reset_noise": "<function ActorCriticPolicy.reset_noise at 0x7bb2389d5b40>",
10
- "_build_mlp_extractor": "<function ActorCriticPolicy._build_mlp_extractor at 0x7bb2389d5bd0>",
11
- "_build": "<function ActorCriticPolicy._build at 0x7bb2389d5c60>",
12
- "forward": "<function ActorCriticPolicy.forward at 0x7bb2389d5cf0>",
13
- "extract_features": "<function ActorCriticPolicy.extract_features at 0x7bb2389d5d80>",
14
- "_get_action_dist_from_latent": "<function ActorCriticPolicy._get_action_dist_from_latent at 0x7bb2389d5e10>",
15
- "_predict": "<function ActorCriticPolicy._predict at 0x7bb2389d5ea0>",
16
- "evaluate_actions": "<function ActorCriticPolicy.evaluate_actions at 0x7bb2389d5f30>",
17
- "get_distribution": "<function ActorCriticPolicy.get_distribution at 0x7bb2389d5fc0>",
18
- "predict_values": "<function ActorCriticPolicy.predict_values at 0x7bb2389d6050>",
19
  "__abstractmethods__": "frozenset()",
20
- "_abc_impl": "<_abc._abc_data object at 0x7bb238b624c0>"
21
  },
22
  "verbose": 1,
23
  "policy_kwargs": {},
24
- "num_timesteps": 1507328,
25
- "_total_timesteps": 1500000,
26
  "_num_timesteps_at_start": 0,
27
  "seed": null,
28
  "action_noise": null,
29
- "start_time": 1726532143493315846,
30
  "learning_rate": {
31
  ":type:": "<class 'function'>",
32
- ":serialized:": "gAWVNwIAAAAAAACMF2Nsb3VkcGlja2xlLmNsb3VkcGlja2xllIwOX21ha2VfZnVuY3Rpb26Uk5QoaACMDV9idWlsdGluX3R5cGWUk5SMCENvZGVUeXBllIWUUpQoSwFLAEsASwFLAktDQwhkAXwAFABTAJSMVgogIExlYXJuaW5nIHJhdGUgc2NoZWR1bGUuCgogIDpwYXJhbSBwcm9ncmVzc19yZW1haW5pbmc6IChmbG9hdCkKICA6cmV0dXJuOiAoZmxvYXQpCiAglEc/gm6XjU/fO4aUKYwScHJvZ3Jlc3NfcmVtYWluaW5nlIWUjB88aXB5dGhvbi1pbnB1dC00NS1mNzVkZWEzMTBiMmE+lIwLbHJfc2NoZWR1bGWUSwFDAggHlCkpdJRSlH2UKIwLX19wYWNrYWdlX1+UTowIX19uYW1lX1+UjAhfX21haW5fX5R1Tk5OdJRSlIwcY2xvdWRwaWNrbGUuY2xvdWRwaWNrbGVfZmFzdJSMEl9mdW5jdGlvbl9zZXRzdGF0ZZSTlGgXfZR9lChoFGgOjAxfX3F1YWxuYW1lX1+UaA6MD19fYW5ub3RhdGlvbnNfX5R9lIwOX19rd2RlZmF1bHRzX1+UTowMX19kZWZhdWx0c19flE6MCl9fbW9kdWxlX1+UaBWMB19fZG9jX1+UaAmMC19fY2xvc3VyZV9flE6MF19jbG91ZHBpY2tsZV9zdWJtb2R1bGVzlF2UjAtfX2dsb2JhbHNfX5R9lHWGlIZSMC4="
33
  },
34
  "tensorboard_log": null,
35
  "_last_obs": {
36
  ":type:": "<class 'numpy.ndarray'>",
37
- ":serialized:": "gAWVdQIAAAAAAACMEm51bXB5LmNvcmUubnVtZXJpY5SMC19mcm9tYnVmZmVylJOUKJYAAgAAAAAAAGb+CrzZ6aY/VLTFvX1kIr/jDkM7PX1qPAAAAAAAAAAAAADkvdfOnz+L5R2/pksUv+vapL3QdX++AAAAAAAAAAD68qo+n+wjPzP+db5p7Qu/x8+NPsUpOr4AAAAAAAAAADPWiTx/DA8+I9ZyvRkzg75AVbm9m2wGPQAAAAAAAAAAgJk4vkxanj6S3ho+RSSavsqRmr2Lk988AAAAAAAAAACatwk8K7qZP2ZBkzyHqxq/aZTRPOKsFD0AAAAAAAAAAJo5kb0pLEu6PySUNzP3qrCPj+W6tSistgAAgD8AAIA/s9+fvpZehT+3qgm/PHo2v2sXob4V01C9AAAAAAAAAACaKZQ8Ya/vO31ST75y9cO9DlwjvUrcfj8AAIA/AAAAAFqkjj64P6M/zXIkP3rQIL/nJI8+WT2kPgAAAAAAAAAATcklvWpeoD+6ZrG+FQkmv4Bsrry+KNG9AAAAAAAAAADA8Ra+hAazP3pn177rjeK+oaVmveNNBr4AAAAAAAAAAGaPwjxiOHw+2xdqvfvel74BmFa8RMOJvQAAAAAAAAAAGpDiPbUGlz+yScs+bJIXv2RwLT448lY+AAAAAAAAAACaOXI6wNWePsTLI76xRJW+udxgvSR1mLwAAAAAAAAAAJrYkrwUqKS61tJKs8+hL7CDlkY6lrvDMwAAgD8AAIA/lIwFbnVtcHmUjAVkdHlwZZSTlIwCZjSUiYiHlFKUKEsDjAE8lE5OTkr/////Sv////9LAHSUYksQSwiGlIwBQ5R0lFKULg=="
38
  },
39
  "_last_episode_starts": {
40
  ":type:": "<class 'numpy.ndarray'>",
@@ -44,17 +44,17 @@
44
  "_episode_num": 0,
45
  "use_sde": false,
46
  "sde_sample_freq": -1,
47
- "_current_progress_remaining": -0.004885333333333408,
48
  "_stats_window_size": 100,
49
  "ep_info_buffer": {
50
  ":type:": "<class 'collections.deque'>",
51
- ":serialized:": "gAWV7AsAAAAAAACMC2NvbGxlY3Rpb25zlIwFZGVxdWWUk5QpS2SGlFKUKH2UKIwBcpRHQG+hLZ8KG+OMAWyUS8WMAXSUR0C58MuAI6bOdX2UKGgGR0BwNiBMBZIQaAdL7WgIR0C58N5/oaDPdX2UKGgGR0BxU/4k/r0KaAdLwGgIR0C58PDJyQxOdX2UKGgGR0BwKaFQEZBLaAdL5mgIR0C58P3ctXgcdX2UKGgGR0BxckUzsQd0aAdL2mgIR0C58QzG1hLHdX2UKGgGR0ByztwT/Q0GaAdLwmgIR0C58SRmkFfRdX2UKGgGR0Bw+jgWJrLyaAdL4mgIR0C58Sv2saKldX2UKGgGR0BwDaluWKMvaAdL32gIR0C58TPAj6eodX2UKGgGR0Bw9ZhmXgLraAdL1mgIR0C58USsCDEndX2UKGgGR0BxKU+Y+jdpaAdL7GgIR0C58Wd6gM+edX2UKGgGR0ByvzL4etCBaAdLzWgIR0C58WwuEmICdX2UKGgGR0BupZC0F8ohaAdL62gIR0C58a5bdJrddX2UKGgGR0BusGB8QZn+aAdLz2gIR0C58cDjWCmNdX2UKGgGR0Bu4kO/cnE3aAdL2mgIR0C58eT6i0v5dX2UKGgGR0BvCctkFwDOaAdL2GgIR0C58f6KtPpIdX2UKGgGR0BzyKg6EJ0GaAdNIwFoCEdAufIJRVIZqHV9lChoBkdAchItCiRGMGgHS91oCEdAufIax2SuAHV9lChoBkdAboUVh1DBuWgHS9toCEdAufIq6Zpi7XV9lChoBkdAc1t/yoXKsGgHS8ZoCEdAufJX8tPHk3V9lChoBkdAcmdwX668QWgHS/BoCEdAufJaPT5O8HV9lChoBkdAb5H9JjDsMWgHS99oCEdAufJ2SDAaenV9lChoBkdAcL+e7+T/yWgHS8xoCEdAufJ2R/3Fk3V9lChoBkdAc/oPUrkKeGgHS/1oCEdAufKADNhVl3V9lChoBkdAcVO5U96kZmgHS/RoCEdAufKMMb3oLXV9lChoBkdAcOA7L+xW1mgHS8doCEdAufKQxASnL3V9lChoBkdAcnlFs54nnmgHS81oCEdAufKc5Lh73XV9lChoBkdAUF6cBltj1GgHS5FoCEdAufLp6C17Y3V9lChoBkdAcC2zt1IRRWgHS+toCEdAufMdy5qdpnV9lChoBkdAbbEPdVNpNGgHS9toCEdAufMrQVsUI3V9lChoBkdAc0DcvM8oyGgHTQABaAhHQLnzLJ3gUDd1fZQoaAZHQG1rbSJCSidoB03jAWgIR0C596VchTwVdX2UKGgGR0Bxe0wmE5AAaAdLz2gIR0C598xyCFsYdX2UKGgGR0BxFE7NjbztaAdL/WgIR0C59+8QiA2AdX2UKGgGR0BykPJEH+qBaAdL2mgIR0C5+CL7GecydX2UKGgGR0BxQ1PEbYK6aAdLzWgIR0C5+FIN3GGVdX2UKGgGR0Bw4MQSSNfgaAdL7mgIR0C5+FIhY/3WdX2UKGgGR0BxS2pKjBVNaAdL3GgIR0C5+F6nrIHUdX2UKGgGR0Bym5nanJkoaAdL1GgIR0C5+GeYYzi0dX2UKGgGR0BvbcLORkmQaAdL62gIR0C5+G5++dsjdX2UKGgGR0BxrVnOB19waAdL2WgIR0C5+ILamGdqdX2UKGgGR0BwsR7IDHOsaAdLwmgIR0C5+Sbjo6jndX2UKGgGR0BwcIdFOO81aAdL3WgIR0C5+VhY7q6fdX2UKGgGR0BDFDpkf9xZaAdLuGgIR0C5+WDfm9xqdX2UKGgGR0BzjVqM3qA0aAdL2mgIR0C5+WPVurIYdX2UKGgGR0ByUwrGza9LaAdL5GgIR0C5+Z6kVN5/dX2UKGgGR0By55Q+EAYIaAdNLwFoCEdAufnAnLJSznV9lChoBkdAcpdv99+gDmgHS9hoCEdAufnD4QBgeHV9lChoBkdAcBx6Rhc7hmgHS9loCEdAufntuqFRHnV9lChoBkdAcJnVn27FsGgHS9hoCEdAufoPbVSXMXV9lChoBkdAcQxK+zt1IWgHS9ZoCEdAufoeLHdXT3V9lChoBkdAc92cKPXCj2gHS9doCEdAufomRgZ0jnV9lChoBkdAcv1ffoA4oGgHS+hoCEdAufoqc3EQ5HV9lChoBkdAcXRfYjB2wGgHTcgBaAhHQLn6L9hZyMl1fZQoaAZHQG560WdmQKdoB0vuaAhHQLn6O0E5hjR1fZQoaAZHQHHCkPhAGB5oB0voaAhHQLn6SyTINmV1fZQoaAZHQHDorfxc3VFoB0viaAhHQLn6syhSLqF1fZQoaAZHQHIYbmdRR/FoB0vdaAhHQLn6zsvIwM91fZQoaAZHQHGWajBVMmFoB0vJaAhHQLn61zoEB8x1fZQoaAZHQG6BL+5vtMRoB0vmaAhHQLn63xFAmiR1fZQoaAZHQHHzLcTJyQxoB0vEaAhHQLn67elKsdV1fZQoaAZHQHHODCLuQZJoB0vCaAhHQLn7NeQMhHN1fZQoaAZHQHIc/ZyuIRBoB0u6aAhHQLn7N7vG6wt1fZQoaAZHQHJ73wCr92poB00FAWgIR0C5+1kM5OrRdX2UKGgGR0BzitKtga3raAdL7mgIR0C5+16eTV2BdX2UKGgGR0By3mFQEZBLaAdL1mgIR0C5+3Jm7J4jdX2UKGgGR0BzJ8RjBl+WaAdL5mgIR0C5+4e3pfQbdX2UKGgGR0BtYTsv7FbWaAdL4WgIR0C5+4mVVxS6dX2UKGgGR0BxsZU6xPfsaAdL5GgIR0C5+5nTI/7jdX2UKGgGR0BvXhjSXt0FaAdL9GgIR0C5+8WmP5pKdX2UKGgGR0Bw290ihWYGaAdLwmgIR0C5+/2w3YL9dX2UKGgGR0BzNIr7O3UhaAdNpQFoCEdAufwBic5Ke3V9lChoBkdAcNrLYf4h2WgHS9toCEdAufwKEEkjYHV9lChoBkdAcGRhAWznimgHS+toCEdAufxejdpItnV9lChoBkdAcYHC3PRiPWgHS/hoCEdAufxi7nPmgnV9lChoBkdAcoaqqwQlKWgHS8NoCEdAufxpt8/lhnV9lChoBkdAcThll9SdfGgHTRMBaAhHQLn8hC1JDmd1fZQoaAZHQHBLY4ZMtbtoB0vJaAhHQLn8pziCJ411fZQoaAZHQHFCDBEa2ndoB0viaAhHQLn8uCQcPvt1fZQoaAZHQHKVRwhnrY5oB0v5aAhHQLn84LThHb11fZQoaAZHQHAX4od+5OJoB0vsaAhHQLn89TefqX51fZQoaAZHQG50NcW0qpdoB00fAWgIR0C5/PfZVXFMdX2UKGgGR0Bw9m16Vt4zaAdL52gIR0C5/QEa2nbZdX2UKGgGR0BwWb3pOerdaAdLymgIR0C5/QC/fwZwdX2UKGgGR0Bx6QOavzOHaAdL9mgIR0C5/QYvalDXdX2UKGgGR0BfExrzoUzsaAdN6ANoCEdAuf0Gup0fYHV9lChoBkdAbxMxptaY/mgHS9xoCEdAuf1DK+zt1XV9lChoBkdAc6CQUpNKy2gHS9VoCEdAuf1EgNgBtHV9lChoBkdAcdpOclPac2gHTQcBaAhHQLn9gsEJSix1fZQoaAZHQG+NDrJKaodoB0vKaAhHQLn9ioRIz311fZQoaAZHQHEhTK1XvH9oB0vMaAhHQLn9pyO7xut1fZQoaAZHQHQF4dIXj2loB0vnaAhHQLn9qssQNCt1fZQoaAZHQHMcWrGR3eNoB0v7aAhHQLn9zSNwR5F1fZQoaAZHQHLDIOH31z1oB0vsaAhHQLn9+ykKu0V1fZQoaAZHQHOQI1gpjMFoB0vVaAhHQLn+D2JBPbh1fZQoaAZHQHGROI68xsVoB0vIaAhHQLn+Gk3S8ap1fZQoaAZHQHIt8CDEm6ZoB00AAWgIR0C5/ilMIu5CdX2UKGgGR0ByvS7/XGwSaAdL1GgIR0C5/izdDYywdX2UKGgGR0BwcyCYkVvdaAdL4GgIR0C5/jLeqJdjdX2UKGgGR0Bv1bIeYD1XaAdL5GgIR0C5/jmpyZKGdX2UKGgGR0BxAwvUSZjQaAdL3WgIR0C5/j2Jm/WUdWUu"
52
  },
53
  "ep_success_buffer": {
54
  ":type:": "<class 'collections.deque'>",
55
  ":serialized:": "gAWVIAAAAAAAAACMC2NvbGxlY3Rpb25zlIwFZGVxdWWUk5QpS2SGlFKULg=="
56
  },
57
- "_n_updates": 368,
58
  "observation_space": {
59
  ":type:": "<class 'gymnasium.spaces.box.Box'>",
60
  ":serialized:": "gAWVdgIAAAAAAACMFGd5bW5hc2l1bS5zcGFjZXMuYm94lIwDQm94lJOUKYGUfZQojAVkdHlwZZSMBW51bXB5lIwFZHR5cGWUk5SMAmY0lImIh5RSlChLA4wBPJROTk5K/////0r/////SwB0lGKMDWJvdW5kZWRfYmVsb3eUjBJudW1weS5jb3JlLm51bWVyaWOUjAtfZnJvbWJ1ZmZlcpSTlCiWCAAAAAAAAAABAQEBAQEBAZRoCIwCYjGUiYiHlFKUKEsDjAF8lE5OTkr/////Sv////9LAHSUYksIhZSMAUOUdJRSlIwNYm91bmRlZF9hYm92ZZRoESiWCAAAAAAAAAABAQEBAQEBAZRoFUsIhZRoGXSUUpSMBl9zaGFwZZRLCIWUjANsb3eUaBEoliAAAAAAAAAAAAC0wgAAtMIAAKDAAACgwNsPScAAAKDAAAAAgAAAAICUaAtLCIWUaBl0lFKUjARoaWdolGgRKJYgAAAAAAAAAAAAtEIAALRCAACgQAAAoEDbD0lAAACgQAAAgD8AAIA/lGgLSwiFlGgZdJRSlIwIbG93X3JlcHKUjFtbLTkwLiAgICAgICAgLTkwLiAgICAgICAgIC01LiAgICAgICAgIC01LiAgICAgICAgIC0zLjE0MTU5MjcgIC01LgogIC0wLiAgICAgICAgIC0wLiAgICAgICBdlIwJaGlnaF9yZXBylIxTWzkwLiAgICAgICAgOTAuICAgICAgICAgNS4gICAgICAgICA1LiAgICAgICAgIDMuMTQxNTkyNyAgNS4KICAxLiAgICAgICAgIDEuICAgICAgIF2UjApfbnBfcmFuZG9tlE51Yi4=",
@@ -97,6 +97,6 @@
97
  "target_kl": null,
98
  "lr_schedule": {
99
  ":type:": "<class 'function'>",
100
- ":serialized:": "gAWVNwIAAAAAAACMF2Nsb3VkcGlja2xlLmNsb3VkcGlja2xllIwOX21ha2VfZnVuY3Rpb26Uk5QoaACMDV9idWlsdGluX3R5cGWUk5SMCENvZGVUeXBllIWUUpQoSwFLAEsASwFLAktDQwhkAXwAFABTAJSMVgogIExlYXJuaW5nIHJhdGUgc2NoZWR1bGUuCgogIDpwYXJhbSBwcm9ncmVzc19yZW1haW5pbmc6IChmbG9hdCkKICA6cmV0dXJuOiAoZmxvYXQpCiAglEc/gm6XjU/fO4aUKYwScHJvZ3Jlc3NfcmVtYWluaW5nlIWUjB88aXB5dGhvbi1pbnB1dC00NS1mNzVkZWEzMTBiMmE+lIwLbHJfc2NoZWR1bGWUSwFDAggHlCkpdJRSlH2UKIwLX19wYWNrYWdlX1+UTowIX19uYW1lX1+UjAhfX21haW5fX5R1Tk5OdJRSlIwcY2xvdWRwaWNrbGUuY2xvdWRwaWNrbGVfZmFzdJSMEl9mdW5jdGlvbl9zZXRzdGF0ZZSTlGgXfZR9lChoFGgOjAxfX3F1YWxuYW1lX1+UaA6MD19fYW5ub3RhdGlvbnNfX5R9lIwOX19rd2RlZmF1bHRzX1+UTowMX19kZWZhdWx0c19flE6MCl9fbW9kdWxlX1+UaBWMB19fZG9jX1+UaAmMC19fY2xvc3VyZV9flE6MF19jbG91ZHBpY2tsZV9zdWJtb2R1bGVzlF2UjAtfX2dsb2JhbHNfX5R9lHWGlIZSMC4="
101
  }
102
  }
 
4
  ":serialized:": "gAWVOwAAAAAAAACMIXN0YWJsZV9iYXNlbGluZXMzLmNvbW1vbi5wb2xpY2llc5SMEUFjdG9yQ3JpdGljUG9saWN5lJOULg==",
5
  "__module__": "stable_baselines3.common.policies",
6
  "__doc__": "\n Policy class for actor-critic algorithms (has both policy and value prediction).\n Used by A2C, PPO and the likes.\n\n :param observation_space: Observation space\n :param action_space: Action space\n :param lr_schedule: Learning rate schedule (could be constant)\n :param net_arch: The specification of the policy and value networks.\n :param activation_fn: Activation function\n :param ortho_init: Whether to use or not orthogonal initialization\n :param use_sde: Whether to use State Dependent Exploration or not\n :param log_std_init: Initial value for the log standard deviation\n :param full_std: Whether to use (n_features x n_actions) parameters\n for the std instead of only (n_features,) when using gSDE\n :param use_expln: Use ``expln()`` function instead of ``exp()`` to ensure\n a positive standard deviation (cf paper). It allows to keep variance\n above zero and prevent it from growing too fast. In practice, ``exp()`` is usually enough.\n :param squash_output: Whether to squash the output using a tanh function,\n this allows to ensure boundaries when using gSDE.\n :param features_extractor_class: Features extractor to use.\n :param features_extractor_kwargs: Keyword arguments\n to pass to the features extractor.\n :param share_features_extractor: If True, the features extractor is shared between the policy and value networks.\n :param normalize_images: Whether to normalize images or not,\n dividing by 255.0 (True by default)\n :param optimizer_class: The optimizer to use,\n ``th.optim.Adam`` by default\n :param optimizer_kwargs: Additional keyword arguments,\n excluding the learning rate, to pass to the optimizer\n ",
7
+ "__init__": "<function ActorCriticPolicy.__init__ at 0x7cde4a719900>",
8
+ "_get_constructor_parameters": "<function ActorCriticPolicy._get_constructor_parameters at 0x7cde4a719990>",
9
+ "reset_noise": "<function ActorCriticPolicy.reset_noise at 0x7cde4a719a20>",
10
+ "_build_mlp_extractor": "<function ActorCriticPolicy._build_mlp_extractor at 0x7cde4a719ab0>",
11
+ "_build": "<function ActorCriticPolicy._build at 0x7cde4a719b40>",
12
+ "forward": "<function ActorCriticPolicy.forward at 0x7cde4a719bd0>",
13
+ "extract_features": "<function ActorCriticPolicy.extract_features at 0x7cde4a719c60>",
14
+ "_get_action_dist_from_latent": "<function ActorCriticPolicy._get_action_dist_from_latent at 0x7cde4a719cf0>",
15
+ "_predict": "<function ActorCriticPolicy._predict at 0x7cde4a719d80>",
16
+ "evaluate_actions": "<function ActorCriticPolicy.evaluate_actions at 0x7cde4a719e10>",
17
+ "get_distribution": "<function ActorCriticPolicy.get_distribution at 0x7cde4a719ea0>",
18
+ "predict_values": "<function ActorCriticPolicy.predict_values at 0x7cde4a719f30>",
19
  "__abstractmethods__": "frozenset()",
20
+ "_abc_impl": "<_abc._abc_data object at 0x7cde4a8a99c0>"
21
  },
22
  "verbose": 1,
23
  "policy_kwargs": {},
24
+ "num_timesteps": 2015232,
25
+ "_total_timesteps": 2000000,
26
  "_num_timesteps_at_start": 0,
27
  "seed": null,
28
  "action_noise": null,
29
+ "start_time": 1726560783775658137,
30
  "learning_rate": {
31
  ":type:": "<class 'function'>",
32
+ ":serialized:": "gAWVQwIAAAAAAACMF2Nsb3VkcGlja2xlLmNsb3VkcGlja2xllIwOX21ha2VfZnVuY3Rpb26Uk5QoaACMDV9idWlsdGluX3R5cGWUk5SMCENvZGVUeXBllIWUUpQoSwFLAEsASwFLAktDQwxkAXwAFABkAhcAUwCUjFYKICBMZWFybmluZyByYXRlIHNjaGVkdWxlLgoKICA6cGFyYW0gcHJvZ3Jlc3NfcmVtYWluaW5nOiAoZmxvYXQpCiAgOnJldHVybjogKGZsb2F0KQogIJRHP3ysCDEm6XlHP2iTdLxqfvqHlCmMEnByb2dyZXNzX3JlbWFpbmluZ5SFlIwePGlweXRob24taW5wdXQtOC01MjEwZTkzZTMzYmY+lIwLbHJfc2NoZWR1bGWUSwFDAgwHlCkpdJRSlH2UKIwLX19wYWNrYWdlX1+UTowIX19uYW1lX1+UjAhfX21haW5fX5R1Tk5OdJRSlIwcY2xvdWRwaWNrbGUuY2xvdWRwaWNrbGVfZmFzdJSMEl9mdW5jdGlvbl9zZXRzdGF0ZZSTlGgXfZR9lChoFGgOjAxfX3F1YWxuYW1lX1+UaA6MD19fYW5ub3RhdGlvbnNfX5R9lIwOX19rd2RlZmF1bHRzX1+UTowMX19kZWZhdWx0c19flE6MCl9fbW9kdWxlX1+UaBWMB19fZG9jX1+UaAmMC19fY2xvc3VyZV9flE6MF19jbG91ZHBpY2tsZV9zdWJtb2R1bGVzlF2UjAtfX2dsb2JhbHNfX5R9lHWGlIZSMC4="
33
  },
34
  "tensorboard_log": null,
35
  "_last_obs": {
36
  ":type:": "<class 'numpy.ndarray'>",
37
+ ":serialized:": "gAWVdQIAAAAAAACMEm51bXB5LmNvcmUubnVtZXJpY5SMC19mcm9tYnVmZmVylJOUKJYAAgAAAAAAAPojXz6wqos+e5bDvrahgL677Cg9ttT5vQAAAAAAAAAAgJ1iPgk4Tj6etoK+QFpqvpmOij0vL8y6AAAAAAAAAAAAvHW8IJUtP6UPoT26Dfe+EyrIvLzxiTwAAAAAAAAAAGatq7zHZi0/dt8XPifYCb/2LUK9zTj9PQAAAAAAAAAAzW7wvDoUuT9C0Ti/duuyPmQ0sjz2aR09AAAAAAAAAACANFU9XNWtP5dVHT+Ze8W+m9a3u50RCT4AAAAAAAAAAHMZuD24JrC5Vs6TvL8jF7XI1YC6dax/NAAAgD8AAIA/GqgMPh/+3btYgQq6i0q3N7svK727sjI5AACAPwAAgD/NDFQ7aX0svP6yn76ki3e9ulaXPUsYTj4AAIA/AACAPwD59LyC9qI/om8EvmpT4r5jicm9bs1LvQAAAAAAAAAAQByQvXvtfT9B1Ae8tsAMv4gn672yHBk8AAAAAAAAAADzIGs+/CddPr3FZ75XIJi+ByspPh2VbL0AAAAAAAAAAAAZYr2PSlI/1iJKPYoRA7/bD9+9+zm7PQAAAAAAAAAAZsYRPTig/rs8eg+8aXI7PO3vTb2ntB89AACAPwAAgD+IlZG+OJgGP721Lj4nYMO+fdZJvvrj5j0AAAAAAAAAAIv0ir5IcZE++MOiPmql377BNsG9NIQTPgAAAAAAAAAAlIwFbnVtcHmUjAVkdHlwZZSTlIwCZjSUiYiHlFKUKEsDjAE8lE5OTkr/////Sv////9LAHSUYksQSwiGlIwBQ5R0lFKULg=="
38
  },
39
  "_last_episode_starts": {
40
  ":type:": "<class 'numpy.ndarray'>",
 
44
  "_episode_num": 0,
45
  "use_sde": false,
46
  "sde_sample_freq": -1,
47
+ "_current_progress_remaining": -0.007616000000000067,
48
  "_stats_window_size": 100,
49
  "ep_info_buffer": {
50
  ":type:": "<class 'collections.deque'>",
51
+ ":serialized:": "gAWV/QsAAAAAAACMC2NvbGxlY3Rpb25zlIwFZGVxdWWUk5QpS2SGlFKUKH2UKIwBcpRHQHMgTByjpLWMAWyUTQoBjAF0lEdAoOVzb8FY+3V9lChoBkdAb5iJqIrOJWgHS9poCEdAoOV8yFfzBnV9lChoBkdAcl/CEpRXOmgHS+1oCEdAoOXWO801qHV9lChoBkdAcioFt8/lhmgHS9FoCEdAoOYU45tFa3V9lChoBkdAcTs+JgsshGgHS/doCEdAoOZYf6oES3V9lChoBkdAcaQtRNyo42gHS9poCEdAoOZcEovzv3V9lChoBkdAcimzXjENv2gHS+ZoCEdAoOaw4yXUpnV9lChoBkdAc+rfZ26kI2gHS/doCEdAoOcY8OkLyHV9lChoBkdAcoSVy3kPtmgHS+FoCEdAoOcjbL2YfHV9lChoBkdAbqYLgn+hoWgHTQYBaAhHQKDngoiLVFx1fZQoaAZHQHCutQj2SMdoB0veaAhHQKDnxztkWh11fZQoaAZHQHBIvpQk5ZNoB0vhaAhHQKDoAsvIwM91fZQoaAZHQHEDAyhzvJBoB0vZaAhHQKDoaifQKKJ1fZQoaAZHQHPG88s+V1RoB0vxaAhHQKDokASWZ7Z1fZQoaAZHQG9pRp1zQu5oB00iAWgIR0Cg6SfHPu5SdX2UKGgGR0Bxie89Oh0yaAdNFwFoCEdAoOkzDl5nlHV9lChoBkdAcN97vXsgMmgHTRUBaAhHQKDpZ8E3bVV1fZQoaAZHQHK6BHf/FR5oB0v+aAhHQKDp5i97F851fZQoaAZHQHHtcSf16E9oB0v3aAhHQKDqHshPj4p1fZQoaAZHQHHQcZxaPjpoB0vnaAhHQKDqPpwCKaZ1fZQoaAZHQHDYsu3+dbxoB0v0aAhHQKDqdMr3Cbd1fZQoaAZHQHAuZ/G2kSFoB0vlaAhHQKDqnkupS751fZQoaAZHQHGZABPsRg9oB000AWgIR0Cg6qXYL9dedX2UKGgGR0BxDQXMyJsPaAdLy2gIR0Cg6tDVYp2EdX2UKGgGR0BzE8H3UQTVaAdNAAFoCEdAoOtGw5eZ5XV9lChoBkdAck0YrJ8v3GgHS9toCEdAoOueDe0ojXV9lChoBkdAcdpF2mpEQWgHS79oCEdAoOvYE6kqMHV9lChoBkdAbaFES/TLGWgHS/toCEdAoOvqmALApXV9lChoBkdAb/0gBcRlH2gHS/VoCEdAoOyN2ki2UnV9lChoBkdAc682NedCmmgHS/9oCEdAoOzwYaYNRXV9lChoBkdAcyeppvgm7mgHS+ZoCEdAoO0WFg2If3V9lChoBkdAb/WJcgQpWmgHS9RoCEdAoO1n29L6DXV9lChoBkdAcJyrNGEwnGgHS+poCEdAoO2ArvsqrnV9lChoBkdAbndMMZxaPmgHS9NoCEdAoO2W2TgVGnV9lChoBkdAc9qwA2hqTWgHTQ4BaAhHQKDt4K+BYmt1fZQoaAZHQHJY4xQBPsRoB00+AmgIR0Cg7eWznieedX2UKGgGR0BzVN+so2GZaAdNBAFoCEdAoO46swL3K3V9lChoBkdAcD7XzlLeymgHS/ZoCEdAoO4+1a4c3nV9lChoBkdAcokra/RE4WgHS+RoCEdAoO538dgfEHV9lChoBkdASTdVT72tdWgHS6loCEdAoO7rJEH+qHV9lChoBkdAcsysRxtHhGgHS+BoCEdAoPeIexOclXV9lChoBkdAcrFyVfNRnGgHTQ4BaAhHQKD4UM9bHIZ1fZQoaAZHQHEuaVdHDrJoB0vjaAhHQKD4xmHxjKB1fZQoaAZHQG9AKaoddVxoB0vQaAhHQKD49fUF0Pp1fZQoaAZHQG+Xygf2bodoB0vMaAhHQKD5AifQKKJ1fZQoaAZHQHCQV18stkFoB00GAWgIR0Cg+XXdbgTAdX2UKGgGR0BxTGRGMGX5aAdL+GgIR0Cg+cppN9H+dX2UKGgGR0BxqjRF7UobaAdL7GgIR0Cg+fQLeANHdX2UKGgGR0BpWmQXAM2FaAdNIQNoCEdAoPoOrU9ZBHV9lChoBkdAcwZYU34sVmgHS/ZoCEdAoPoUiliz9nV9lChoBkdAcmSw9JSR82gHS+toCEdAoPpGnO0LMXV9lChoBkdAcnat6HCXQmgHS+BoCEdAoPpdzZHuqnV9lChoBkdAcKt3o9s7+2gHS+hoCEdAoPr1U+9rXXV9lChoBkdAcOavJiiItWgHTQEBaAhHQKD7Qfe1rqN1fZQoaAZHQG/L2KdhAnloB0vQaAhHQKD8B5YYBNp1fZQoaAZHQG5KUDEFW4poB0vvaAhHQKD8DRLK3d91fZQoaAZHQHGyc6BAfMhoB0vWaAhHQKD8cuoP07N1fZQoaAZHQF5gmJm/WUdoB03oA2gIR0Cg/L7muDBedX2UKGgGR0Byb0FW4mTlaAdNKAFoCEdAoP4QOz6acHV9lChoBkdAch8WIoE0SGgHTQ4BaAhHQKD+O0dBBzF1fZQoaAZHQHL2oVRDTjNoB0vwaAhHQKD+bBInSfF1fZQoaAZHQHN8VfqoqCpoB0v7aAhHQKD+e/t6X0J1fZQoaAZHQHHrb3Cbc45oB00LAWgIR0Cg/pYLkS26dX2UKGgGR0BynPyvs7dSaAdL72gIR0Cg/tW912aEdX2UKGgGR0Byb+wpvxYraAdNDQFoCEdAoP78JrtVrHV9lChoBkdAcIzSx7iQ1mgHS+poCEdAoP+/8CPp6nV9lChoBkdAc0wVlwtJ4GgHTSIBaAhHQKD/26PKdQR1fZQoaAZHQDpgFC9h7VtoB0u3aAhHQKD/9Jd0JWx1fZQoaAZHQHFsn4oJAt5oB0v7aAhHQKEAm18b70p1fZQoaAZHQHF3ESh8IAxoB0vbaAhHQKEBEIInjQ11fZQoaAZHQHRUVPrOZ9doB00dAWgIR0ChAdrLhaTwdX2UKGgGR0ByTJPJq7AdaAdNBAFoCEdAoQIAYNy5qnV9lChoBkdAcWntl7MPjGgHS9doCEdAoQJMcfeUIXV9lChoBkdAbgNrpqynk2gHS9hoCEdAoQJqZnctXnV9lChoBkdAcMvIoE0SAmgHS/FoCEdAoQLmlEZzgnV9lChoBkdAbmrFNL127mgHS/ZoCEdAoQMWbgCOm3V9lChoBkdAcSKkFwDNhWgHTQIBaAhHQKEDLSWJJoV1fZQoaAZHQHAQ544ZMtdoB0v0aAhHQKEDPEwWWQh1fZQoaAZHQG+XDAJswcpoB0vkaAhHQKEDnUQ04zd1fZQoaAZHQHMuKxHG0eFoB00NAWgIR0ChA6nKOktVdX2UKGgGR0BxjlkVeruIaAdL5WgIR0ChA6oIfKZEdX2UKGgGR0BxOrPrv9cbaAdL+mgIR0ChA9d0aIepdX2UKGgGR0BtkMnmaH9FaAdL3mgIR0ChBE/l6qsEdX2UKGgGR0Bjji+i8FpxaAdN6ANoCEdAoQRv9rGipXV9lChoBkdAcvPYJ3PiUGgHTSgBaAhHQKEE8Zof0Vd1fZQoaAZHQHK8p1zQu29oB0vxaAhHQKEFH6po9LZ1fZQoaAZHQHMdQHeJpFloB0v3aAhHQKEFVhaTwDx1fZQoaAZHQHECoj4YaYNoB0vvaAhHQKEFlqY7aIx1fZQoaAZHQHFEBDPWxyJoB0vfaAhHQKEF0+t8uz11fZQoaAZHQHMRKXv6TGJoB0vtaAhHQKEGNKr7wa11fZQoaAZHQG4GDPGACnxoB0vnaAhHQKEGNnzQNTd1fZQoaAZHQG9fvhQ3xWloB0vaaAhHQKEGg2itaIN1fZQoaAZHQHBx5HmRvFZoB0vjaAhHQKEGlVDrqt51fZQoaAZHQHMN/LxI8QtoB00BAWgIR0ChBppW3jMndX2UKGgGR0BiVRE6T4cnaAdN6ANoCEdAoQbVnmJWNnV9lChoBkdAcy3c9GI9DGgHS+loCEdAoQbdjNIK+nV9lChoBkdAclL8DB/I82gHS/xoCEdAoQbq7ulXR3V9lChoBkdAcLRhufmLcmgHS/BoCEdAoQdyiEg4fnV9lChoBkdAcS91mrbQC2gHTQcBaAhHQKEHnddE9dN1fZQoaAZHQHFmAxnFo+RoB0vaaAhHQKEHqz0pVjt1ZS4="
52
  },
53
  "ep_success_buffer": {
54
  ":type:": "<class 'collections.deque'>",
55
  ":serialized:": "gAWVIAAAAAAAAACMC2NvbGxlY3Rpb25zlIwFZGVxdWWUk5QpS2SGlFKULg=="
56
  },
57
+ "_n_updates": 492,
58
  "observation_space": {
59
  ":type:": "<class 'gymnasium.spaces.box.Box'>",
60
  ":serialized:": "gAWVdgIAAAAAAACMFGd5bW5hc2l1bS5zcGFjZXMuYm94lIwDQm94lJOUKYGUfZQojAVkdHlwZZSMBW51bXB5lIwFZHR5cGWUk5SMAmY0lImIh5RSlChLA4wBPJROTk5K/////0r/////SwB0lGKMDWJvdW5kZWRfYmVsb3eUjBJudW1weS5jb3JlLm51bWVyaWOUjAtfZnJvbWJ1ZmZlcpSTlCiWCAAAAAAAAAABAQEBAQEBAZRoCIwCYjGUiYiHlFKUKEsDjAF8lE5OTkr/////Sv////9LAHSUYksIhZSMAUOUdJRSlIwNYm91bmRlZF9hYm92ZZRoESiWCAAAAAAAAAABAQEBAQEBAZRoFUsIhZRoGXSUUpSMBl9zaGFwZZRLCIWUjANsb3eUaBEoliAAAAAAAAAAAAC0wgAAtMIAAKDAAACgwNsPScAAAKDAAAAAgAAAAICUaAtLCIWUaBl0lFKUjARoaWdolGgRKJYgAAAAAAAAAAAAtEIAALRCAACgQAAAoEDbD0lAAACgQAAAgD8AAIA/lGgLSwiFlGgZdJRSlIwIbG93X3JlcHKUjFtbLTkwLiAgICAgICAgLTkwLiAgICAgICAgIC01LiAgICAgICAgIC01LiAgICAgICAgIC0zLjE0MTU5MjcgIC01LgogIC0wLiAgICAgICAgIC0wLiAgICAgICBdlIwJaGlnaF9yZXBylIxTWzkwLiAgICAgICAgOTAuICAgICAgICAgNS4gICAgICAgICA1LiAgICAgICAgIDMuMTQxNTkyNyAgNS4KICAxLiAgICAgICAgIDEuICAgICAgIF2UjApfbnBfcmFuZG9tlE51Yi4=",
 
97
  "target_kl": null,
98
  "lr_schedule": {
99
  ":type:": "<class 'function'>",
100
+ ":serialized:": "gAWVQwIAAAAAAACMF2Nsb3VkcGlja2xlLmNsb3VkcGlja2xllIwOX21ha2VfZnVuY3Rpb26Uk5QoaACMDV9idWlsdGluX3R5cGWUk5SMCENvZGVUeXBllIWUUpQoSwFLAEsASwFLAktDQwxkAXwAFABkAhcAUwCUjFYKICBMZWFybmluZyByYXRlIHNjaGVkdWxlLgoKICA6cGFyYW0gcHJvZ3Jlc3NfcmVtYWluaW5nOiAoZmxvYXQpCiAgOnJldHVybjogKGZsb2F0KQogIJRHP3ysCDEm6XlHP2iTdLxqfvqHlCmMEnByb2dyZXNzX3JlbWFpbmluZ5SFlIwePGlweXRob24taW5wdXQtOC01MjEwZTkzZTMzYmY+lIwLbHJfc2NoZWR1bGWUSwFDAgwHlCkpdJRSlH2UKIwLX19wYWNrYWdlX1+UTowIX19uYW1lX1+UjAhfX21haW5fX5R1Tk5OdJRSlIwcY2xvdWRwaWNrbGUuY2xvdWRwaWNrbGVfZmFzdJSMEl9mdW5jdGlvbl9zZXRzdGF0ZZSTlGgXfZR9lChoFGgOjAxfX3F1YWxuYW1lX1+UaA6MD19fYW5ub3RhdGlvbnNfX5R9lIwOX19rd2RlZmF1bHRzX1+UTowMX19kZWZhdWx0c19flE6MCl9fbW9kdWxlX1+UaBWMB19fZG9jX1+UaAmMC19fY2xvc3VyZV9flE6MF19jbG91ZHBpY2tsZV9zdWJtb2R1bGVzlF2UjAtfX2dsb2JhbHNfX5R9lHWGlIZSMC4="
101
  }
102
  }
ppo-LunarLander-v2/policy.optimizer.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:b2505bff0436a1ab9584fc7b58b55b84b881f373c83b87306874e91deb0967a3
3
  size 88362
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:9a4eb99954d0cc393f03d9340b364032ba1e839f8a0c58f20d7543baf135bbc5
3
  size 88362
ppo-LunarLander-v2/policy.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:3909f367c7264073deb208d8ad1aed3c5192174d1a7cc8944a8879f14f829bf5
3
  size 43762
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:4708d86f233b53c4d0f841012b4c2847dbee08a2e5ea859c75b94ea7061d3ef7
3
  size 43762
replay.mp4 CHANGED
Binary files a/replay.mp4 and b/replay.mp4 differ
 
results.json CHANGED
@@ -1 +1 @@
1
- {"mean_reward": 280.1876054563404, "std_reward": 23.273564500331258, "is_deterministic": true, "n_eval_episodes": 10, "eval_datetime": "2024-09-17T00:51:12.671419"}
 
1
+ {"mean_reward": 261.27906820689833, "std_reward": 26.176545261548164, "is_deterministic": true, "n_eval_episodes": 10, "eval_datetime": "2024-09-17T08:48:02.704522"}