sametayhan commited on
Commit
a49a83c
·
verified ·
1 Parent(s): c01ff3c

A commit with ppo-lunarLander-v2 model

Browse files
README.md CHANGED
@@ -16,7 +16,7 @@ model-index:
16
  type: LunarLander-v2
17
  metrics:
18
  - type: mean_reward
19
- value: 251.91 +/- 23.55
20
  name: mean_reward
21
  verified: false
22
  ---
 
16
  type: LunarLander-v2
17
  metrics:
18
  - type: mean_reward
19
+ value: 262.74 +/- 14.48
20
  name: mean_reward
21
  verified: false
22
  ---
config.json CHANGED
@@ -1 +1 @@
1
- {"policy_class": {":type:": "<class 'abc.ABCMeta'>", ":serialized:": "gAWVOwAAAAAAAACMIXN0YWJsZV9iYXNlbGluZXMzLmNvbW1vbi5wb2xpY2llc5SMEUFjdG9yQ3JpdGljUG9saWN5lJOULg==", "__module__": "stable_baselines3.common.policies", "__doc__": "\n Policy class for actor-critic algorithms (has both policy and value prediction).\n Used by A2C, PPO and the likes.\n\n :param observation_space: Observation space\n :param action_space: Action space\n :param lr_schedule: Learning rate schedule (could be constant)\n :param net_arch: The specification of the policy and value networks.\n :param activation_fn: Activation function\n :param ortho_init: Whether to use or not orthogonal initialization\n :param use_sde: Whether to use State Dependent Exploration or not\n :param log_std_init: Initial value for the log standard deviation\n :param full_std: Whether to use (n_features x n_actions) parameters\n for the std instead of only (n_features,) when using gSDE\n :param use_expln: Use ``expln()`` function instead of ``exp()`` to ensure\n a positive standard deviation (cf paper). It allows to keep variance\n above zero and prevent it from growing too fast. In practice, ``exp()`` is usually enough.\n :param squash_output: Whether to squash the output using a tanh function,\n this allows to ensure boundaries when using gSDE.\n :param features_extractor_class: Features extractor to use.\n :param features_extractor_kwargs: Keyword arguments\n to pass to the features extractor.\n :param share_features_extractor: If True, the features extractor is shared between the policy and value networks.\n :param normalize_images: Whether to normalize images or not,\n dividing by 255.0 (True by default)\n :param optimizer_class: The optimizer to use,\n ``th.optim.Adam`` by default\n :param optimizer_kwargs: Additional keyword arguments,\n excluding the learning rate, to pass to the optimizer\n ", "__init__": "<function ActorCriticPolicy.__init__ at 0x7af4fcebba30>", "_get_constructor_parameters": "<function ActorCriticPolicy._get_constructor_parameters at 0x7af4fcebbac0>", "reset_noise": "<function ActorCriticPolicy.reset_noise at 0x7af4fcebbb50>", "_build_mlp_extractor": "<function ActorCriticPolicy._build_mlp_extractor at 0x7af4fcebbbe0>", "_build": "<function ActorCriticPolicy._build at 0x7af4fcebbc70>", "forward": "<function ActorCriticPolicy.forward at 0x7af4fcebbd00>", "extract_features": "<function ActorCriticPolicy.extract_features at 0x7af4fcebbd90>", "_get_action_dist_from_latent": "<function ActorCriticPolicy._get_action_dist_from_latent at 0x7af4fcebbe20>", "_predict": "<function ActorCriticPolicy._predict at 0x7af4fcebbeb0>", "evaluate_actions": "<function ActorCriticPolicy.evaluate_actions at 0x7af4fcebbf40>", "get_distribution": "<function ActorCriticPolicy.get_distribution at 0x7af4fcec4040>", "predict_values": "<function ActorCriticPolicy.predict_values at 0x7af4fcec40d0>", "__abstractmethods__": "frozenset()", "_abc_impl": "<_abc._abc_data object at 0x7af4fceb3280>"}, "verbose": 1, "policy_kwargs": {}, "num_timesteps": 1015808, "_total_timesteps": 1000000, "_num_timesteps_at_start": 0, "seed": null, "action_noise": null, "start_time": 1770578468713797764, "learning_rate": 0.0003, "tensorboard_log": null, "_last_obs": {":type:": "<class 'numpy.ndarray'>", ":serialized:": "gAWVdQIAAAAAAACMEm51bXB5LmNvcmUubnVtZXJpY5SMC19mcm9tYnVmZmVylJOUKJYAAgAAAAAAAAAwFT39hQE82QEHvpaAWr6IrzK9pF/HPQAAAAAAAAAA5c0UP8+MSb5FOII5Mp2Yt8VURL5mzRq3AACAPwAAgD/NIpC8j95Vugw7NDmrHOI1b3VWOth1ULgAAIA/AACAP4bCaL5EoSo/C5pqvf5f6b4b6CS+Ps60PQAAAAAAAAAA7RWlProVID8wW969mkTHviB/JT5SS0a+AAAAAAAAAABTlKU+TkkZP7tX371k07y+fu7rPbIqs70AAAAAAAAAAGY+DjtlcLg/E+AVPWWJHz7wTiG7gD0GvAAAAAAAAAAAzdeXvOGogboCHEk31XxMMpKTK7pDhGq2AACAPwAAgD8aYq+94hR9P0YcM7wME/m+sFG0vdVoVDwAAAAAAAAAAJrIBj25t4o/tiXGPSP1CL9+ZqI9SFvDPQAAAAAAAAAAbXCKvrz0Wz9+44u+6+rvvsoLyb7uSSg9AAAAAAAAAABzpLM9bMrmPtiZ17z1Va++KzZDuxi+ib0AAAAAAAAAAEAbmz3hQyY/GgUCPVWEzr7ubA49yo+qOwAAAAAAAAAAGkKRPhEULL2jUg47halPulxbl74dntu5AACAPwAAgD/T9Xs+/M2tPttJl76LpYG+6G9bvY1v970AAAAAAAAAADV9l76TPXs/rKm0voGK7r6aEta+kNGDvQAAAAAAAAAAlIwFbnVtcHmUjAVkdHlwZZSTlIwCZjSUiYiHlFKUKEsDjAE8lE5OTkr/////Sv////9LAHSUYksQSwiGlIwBQ5R0lFKULg=="}, "_last_episode_starts": {":type:": "<class 'numpy.ndarray'>", ":serialized:": "gAWVgwAAAAAAAACMEm51bXB5LmNvcmUubnVtZXJpY5SMC19mcm9tYnVmZmVylJOUKJYQAAAAAAAAAAAAAAAAAAAAAAAAAAAAAACUjAVudW1weZSMBWR0eXBllJOUjAJiMZSJiIeUUpQoSwOMAXyUTk5OSv////9K/////0sAdJRiSxCFlIwBQ5R0lFKULg=="}, "_last_original_obs": null, "_episode_num": 0, "use_sde": false, "sde_sample_freq": -1, "_current_progress_remaining": -0.015808000000000044, "_stats_window_size": 100, "ep_info_buffer": {":type:": "<class 'collections.deque'>", ":serialized:": "gAWVGgwAAAAAAACMC2NvbGxlY3Rpb25zlIwFZGVxdWWUk5QpS2SGlFKUKH2UKIwBcpRHQHLQnpr1uiyMAWyUTREBjAF0lEdAjXdOUdJaq3V9lChoBkdAciR/4ZdfLWgHTRMBaAhHQI15E052hZh1fZQoaAZHQHChX7+DOC5oB00LAWgIR0CNeQ0SAYpEdX2UKGgGR0BxN6nCO3lTaAdNBgFoCEdAjXuZKODJ2nV9lChoBkdAcsc6dDpkgGgHTTABaAhHQI17uWD6Fdt1fZQoaAZHQHIXA/keZG9oB0vuaAhHQI18VR+BpYd1fZQoaAZHQHGz76P8yetoB00bAWgIR0CNfgOhkAggdX2UKGgGR0BwVE6aLGaQaAdNKQFoCEdAjX4mig00nHV9lChoBkdAcbToJRfnfWgHS+RoCEdAjX8GRmseXHV9lChoBkdAcJJjJdSl32gHS+FoCEdAjX8j9n9NvnV9lChoBkdAcOx0dRzij2gHS89oCEdAjX+gPEsJ6nV9lChoBkdAcRqudPLxJGgHTQMBaAhHQI2AlNi6QNl1fZQoaAZHQHArrFsHjZNoB0v6aAhHQI2Bi2tuDSR1fZQoaAZHQHDaCBf8dghoB0v3aAhHQI2CEl7dBSl1fZQoaAZHQHIQ2bCrLhdoB0v9aAhHQI2EJrP+n651fZQoaAZHQHInq68QI2RoB00TAWgIR0CNhIRU3n6mdX2UKGgGR0BxYIA80UGnaAdNEAFoCEdAjYV69sabWnV9lChoBkdAQjyZnctXgmgHS7NoCEdAjYZ2qkuYhXV9lChoBkdAcBGdLg4wRGgHTQkBaAhHQI2G2SlnAZd1fZQoaAZHQHDYphfBvaVoB00OAWgIR0CNhx2OhkAhdX2UKGgGR0BxrOIWP91maAdNAgFoCEdAjYi4cFQl8nV9lChoBkdAccxpj+aScWgHTRIBaAhHQI2Jsi0OVgR1fZQoaAZHQG4iDLbHp8poB00hAWgIR0CNiveQdS2qdX2UKGgGR0BzbUV/MGHIaAdL3WgIR0CNi3PHktEodX2UKGgGR0Bxd7jQzDXOaAdNGQFoCEdAjYvaE8JUpHV9lChoBkdAcWHgjyFwk2gHTQ0BaAhHQI2L+mpEQXh1fZQoaAZHQHJzCuIRAbBoB00KAWgIR0CNjHqiXY16dX2UKGgGR0BwZqV4X40uaAdNKwFoCEdAjY2TND+irXV9lChoBkdAcIVaTOgQH2gHTQkBaAhHQI2PtnK4hEB1fZQoaAZHQHLHOzyBkI5oB0v2aAhHQI2RFNN8E3d1fZQoaAZHQHK9urZJ04loB0vxaAhHQI2SFiay8jB1fZQoaAZHQHJxjfaYeDFoB0vgaAhHQI2SQnH/9511fZQoaAZHQHIK1UlzEJloB00aAWgIR0CNk5OymhugdX2UKGgGR0Bwzj8gpz91aAdL8WgIR0CNlJw9aEBbdX2UKGgGR0Bxe2Y5T6zmaAdNDAFoCEdAjZZ90Rvm5nV9lChoBkdAcN9sdDIBBGgHS/9oCEdAjZj7TtsvZnV9lChoBkdAbr+b6P8ye2gHS+9oCEdAjZ3EdvKlpHV9lChoBkdAcUPq33Hq/2gHS/9oCEdAjZ3rdFfAsXV9lChoBkdAco+0T101ZWgHTRIBaAhHQI2eD4vexfR1fZQoaAZHQHGZcp5NXYFoB00MAWgIR0CNnsz6ab4KdX2UKGgGR0BzHsAMlTm5aAdNGQFoCEdAjZ7wxWT5f3V9lChoBkdAcIo/NJOFg2gHTQMBaAhHQI2f/dl/Yrd1fZQoaAZHQG9ym0eEIxBoB0vwaAhHQI2jRF1B+nZ1fZQoaAZHQHEU7Ackt29oB00rAWgIR0CNuth60IC2dX2UKGgGR0By4BWT5ftyaAdNFAFoCEdAjbx606YE4nV9lChoBkdAccHabWmP52gHS/1oCEdAjbziT2WY4XV9lChoBkdAcVYnjhky12gHTTwBaAhHQI2+mQ2dd3V1fZQoaAZHQG4RELx7RfFoB00LAWgIR0CNvuvLX+VDdX2UKGgGR0Bx/X446wMZaAdNBgFoCEdAjb/5GKAJ9nV9lChoBkdAcC8Jm/WUbGgHS+poCEdAjcHDIJZ4fXV9lChoBkdAck0VX3g1nGgHS9hoCEdAjcHl7laKUHV9lChoBkdAcXv8YAKfF2gHS+JoCEdAjcJNdqtYCHV9lChoBkdAcXh9eQdS22gHTQIBaAhHQI3DR3NcGC91fZQoaAZHQG82EAHVwxZoB00GAWgIR0CNw18BuGbkdX2UKGgGR0BwF4ZsKsuGaAdNmQFoCEdAjcTxC6YmcHV9lChoBkdAcuQr2QGOdWgHS+VoCEdAjcX2Ebo8p3V9lChoBkdAcXDaoMrmQ2gHTSkBaAhHQI3H09fTkQx1fZQoaAZHQHIL8YuTRploB00XAWgIR0CNy52h7E5ydX2UKGgGR0By5xVU+9rXaAdNBgFoCEdAjcy9pZfUnXV9lChoBkdAcgJrhR64UmgHTRcBaAhHQI3NagoPTXt1fZQoaAZHQHFqbUXpGF1oB0voaAhHQI3OYBtDUmV1fZQoaAZHQHBEHMEA5rBoB00RAWgIR0CNz96cAimmdX2UKGgGR0BvnTBMzuWsaAdL8WgIR0CN0Pb6guh9dX2UKGgGR0BxuamALApKaAdL6mgIR0CN0R9Aood/dX2UKGgGR0BW9Wyon8baaAdN6ANoCEdAjdUjV6NVBHV9lChoBkdAcX6IRh+fAmgHTRsBaAhHQI3VhQk5ZKZ1fZQoaAZHQHEswmReTmpoB0vsaAhHQI3VqKaXrt51fZQoaAZHQG/B3++/QBxoB0vcaAhHQI3WWyVv/BF1fZQoaAZHQHHNxQN0/4ZoB00NAWgIR0CN1q19fCyhdX2UKGgGR0BymNP3ztkXaAdNTwFoCEdAjdcgqur6tXV9lChoBkdAcohdEb5uZWgHTYcBaAhHQI3XHtBv73x1fZQoaAZHQHA0UaZQYUFoB0vhaAhHQI3aZZr56+p1fZQoaAZHQG+bvcrRSgpoB0vpaAhHQI3c2GmDUVl1fZQoaAZHQFDVehPCVKRoB03oA2gIR0CN4DhBJI1+dX2UKGgGR0BwIAuctoSMaAdNKgFoCEdAjeCEehf0E3V9lChoBkdAcPYNEw35vmgHS/RoCEdAjeE/eDWbw3V9lChoBkdAc6cP+4smOWgHTSIBaAhHQI3jU8Tzund1fZQoaAZHQG4EbGFSKm9oB00rAWgIR0CN5PRO1v2odX2UKGgGR0ByciO6unuRaAdL2WgIR0CN5VbDdgv2dX2UKGgGR0Bv7NWyTpxFaAdL82gIR0CN5YM98qnWdX2UKGgGR0Bw1s3974SIaAdL2mgIR0CN5dvhIe5ndX2UKGgGR0BwyUo3Jgb7aAdNCQFoCEdAjecYkeIVM3V9lChoBkdAcULQlruYyGgHTRABaAhHQI3nbbg0j1R1fZQoaAZHQHAz5avA44poB00cAWgIR0CN6aGUwBYFdX2UKGgGR0Bxl0JD3M6jaAdL3GgIR0CN62Gxlg+hdX2UKGgGR0BymIwqRU3oaAdNBgFoCEdAjevRYA80UHV9lChoBkdAcdRKKYRdyGgHTUwBaAhHQI3sfsAvL5h1fZQoaAZHQD+QCJXQtz1oB0uvaAhHQI3tNsUIsy11fZQoaAZHQHAsKNAC4jNoB0vxaAhHQI3xVNnGsFN1fZQoaAZHQHEBNw71ZkloB00LAWgIR0CN9ozkZJkHdX2UKGgGR0BzIhDlYEGJaAdL9mgIR0CN9uLdepn6dX2UKGgGR0By0n+YMOPOaAdNPAFoCEdAjfcX18LKFXV9lChoBkdAbqhkiliz9mgHS/FoCEdAjfelqi48U3V9lChoBkdAciQwazeGf2gHTQcBaAhHQI34j7qIJqt1fZQoaAZHQDe28274BWBoB0u5aAhHQI35oxtYSxt1fZQoaAZHQHElwj+rELpoB0v6aAhHQI35wNNJvpB1fZQoaAZHQHD/iNKh+ORoB00oAWgIR0CN+s5OrQw9dX2UKGgGR0Bw5a5oXbdraAdNCQFoCEdAjfsBCdBjWnV9lChoBkdAc73TKkl/pmgHS9poCEdAjfyMMiKR+3V9lChoBkdAcZnv5xiobWgHS/ZoCEdAjf3JjUd7wHVlLg=="}, "ep_success_buffer": {":type:": "<class 'collections.deque'>", ":serialized:": "gAWVIAAAAAAAAACMC2NvbGxlY3Rpb25zlIwFZGVxdWWUk5QpS2SGlFKULg=="}, "_n_updates": 248, "observation_space": {":type:": "<class 'gymnasium.spaces.box.Box'>", ":serialized:": "gAWVdgIAAAAAAACMFGd5bW5hc2l1bS5zcGFjZXMuYm94lIwDQm94lJOUKYGUfZQojAVkdHlwZZSMBW51bXB5lIwFZHR5cGWUk5SMAmY0lImIh5RSlChLA4wBPJROTk5K/////0r/////SwB0lGKMDWJvdW5kZWRfYmVsb3eUjBJudW1weS5jb3JlLm51bWVyaWOUjAtfZnJvbWJ1ZmZlcpSTlCiWCAAAAAAAAAABAQEBAQEBAZRoCIwCYjGUiYiHlFKUKEsDjAF8lE5OTkr/////Sv////9LAHSUYksIhZSMAUOUdJRSlIwNYm91bmRlZF9hYm92ZZRoESiWCAAAAAAAAAABAQEBAQEBAZRoFUsIhZRoGXSUUpSMBl9zaGFwZZRLCIWUjANsb3eUaBEoliAAAAAAAAAAAAC0wgAAtMIAAKDAAACgwNsPScAAAKDAAAAAgAAAAICUaAtLCIWUaBl0lFKUjARoaWdolGgRKJYgAAAAAAAAAAAAtEIAALRCAACgQAAAoEDbD0lAAACgQAAAgD8AAIA/lGgLSwiFlGgZdJRSlIwIbG93X3JlcHKUjFtbLTkwLiAgICAgICAgLTkwLiAgICAgICAgIC01LiAgICAgICAgIC01LiAgICAgICAgIC0zLjE0MTU5MjcgIC01LgogIC0wLiAgICAgICAgIC0wLiAgICAgICBdlIwJaGlnaF9yZXBylIxTWzkwLiAgICAgICAgOTAuICAgICAgICAgNS4gICAgICAgICA1LiAgICAgICAgIDMuMTQxNTkyNyAgNS4KICAxLiAgICAgICAgIDEuICAgICAgIF2UjApfbnBfcmFuZG9tlE51Yi4=", "dtype": "float32", "bounded_below": "[ True True True True True True True True]", "bounded_above": "[ True True True True True True True True]", "_shape": [8], "low": "[-90. -90. -5. -5. -3.1415927 -5.\n -0. -0. ]", "high": "[90. 90. 5. 5. 3.1415927 5.\n 1. 1. ]", "low_repr": "[-90. -90. -5. -5. -3.1415927 -5.\n -0. -0. ]", "high_repr": "[90. 90. 5. 5. 3.1415927 5.\n 1. 1. ]", "_np_random": null}, "action_space": {":type:": "<class 'gymnasium.spaces.discrete.Discrete'>", ":serialized:": "gAWV2wAAAAAAAACMGWd5bW5hc2l1bS5zcGFjZXMuZGlzY3JldGWUjAhEaXNjcmV0ZZSTlCmBlH2UKIwBbpSMFW51bXB5LmNvcmUubXVsdGlhcnJheZSMBnNjYWxhcpSTlIwFbnVtcHmUjAVkdHlwZZSTlIwCaTiUiYiHlFKUKEsDjAE8lE5OTkr/////Sv////9LAHSUYkMIBAAAAAAAAACUhpRSlIwFc3RhcnSUaAhoDkMIAAAAAAAAAACUhpRSlIwGX3NoYXBllCmMBWR0eXBllGgOjApfbnBfcmFuZG9tlE51Yi4=", "n": "4", "start": "0", "_shape": [], "dtype": "int64", "_np_random": null}, "n_envs": 16, "n_steps": 1024, "gamma": 0.999, "gae_lambda": 0.98, "ent_coef": 0.01, "vf_coef": 0.5, "max_grad_norm": 0.5, "batch_size": 64, "n_epochs": 4, "clip_range": {":type:": "<class 'function'>", ":serialized:": "gAWVIwMAAAAAAACMF2Nsb3VkcGlja2xlLmNsb3VkcGlja2xllIwOX21ha2VfZnVuY3Rpb26Uk5QoaACMDV9idWlsdGluX3R5cGWUk5SMCENvZGVUeXBllIWUUpQoSwFLAEsASwFLAUsTQwSIAFMAlE6FlCmMAV+UhZSMeC9ob21lL3JsL1B5Y2hhcm1Qcm9qZWN0cy9PcHRpbWl6ZWRMdW5hckxhbmRlci12Mi1QUE8vdmVudi9saWIvcHl0aG9uMy4xMC9zaXRlLXBhY2thZ2VzL3N0YWJsZV9iYXNlbGluZXMzL2NvbW1vbi91dGlscy5weZSMBGZ1bmOUS4RDAgQBlIwDdmFslIWUKXSUUpR9lCiMC19fcGFja2FnZV9flIwYc3RhYmxlX2Jhc2VsaW5lczMuY29tbW9ulIwIX19uYW1lX1+UjB5zdGFibGVfYmFzZWxpbmVzMy5jb21tb24udXRpbHOUjAhfX2ZpbGVfX5SMeC9ob21lL3JsL1B5Y2hhcm1Qcm9qZWN0cy9PcHRpbWl6ZWRMdW5hckxhbmRlci12Mi1QUE8vdmVudi9saWIvcHl0aG9uMy4xMC9zaXRlLXBhY2thZ2VzL3N0YWJsZV9iYXNlbGluZXMzL2NvbW1vbi91dGlscy5weZR1Tk5oAIwQX21ha2VfZW1wdHlfY2VsbJSTlClSlIWUdJRSlIwcY2xvdWRwaWNrbGUuY2xvdWRwaWNrbGVfZmFzdJSMEl9mdW5jdGlvbl9zZXRzdGF0ZZSTlGgffZR9lChoFmgNjAxfX3F1YWxuYW1lX1+UjBljb25zdGFudF9mbi48bG9jYWxzPi5mdW5jlIwPX19hbm5vdGF0aW9uc19flH2UjA5fX2t3ZGVmYXVsdHNfX5ROjAxfX2RlZmF1bHRzX1+UTowKX19tb2R1bGVfX5RoF4wHX19kb2NfX5ROjAtfX2Nsb3N1cmVfX5RoAIwKX21ha2VfY2VsbJSTlEc/yZmZmZmZmoWUUpSFlIwXX2Nsb3VkcGlja2xlX3N1Ym1vZHVsZXOUXZSMC19fZ2xvYmFsc19flH2UdYaUhlIwLg=="}, "clip_range_vf": null, "normalize_advantage": true, "target_kl": null, "lr_schedule": {":type:": "<class 'function'>", ":serialized:": "gAWVIwMAAAAAAACMF2Nsb3VkcGlja2xlLmNsb3VkcGlja2xllIwOX21ha2VfZnVuY3Rpb26Uk5QoaACMDV9idWlsdGluX3R5cGWUk5SMCENvZGVUeXBllIWUUpQoSwFLAEsASwFLAUsTQwSIAFMAlE6FlCmMAV+UhZSMeC9ob21lL3JsL1B5Y2hhcm1Qcm9qZWN0cy9PcHRpbWl6ZWRMdW5hckxhbmRlci12Mi1QUE8vdmVudi9saWIvcHl0aG9uMy4xMC9zaXRlLXBhY2thZ2VzL3N0YWJsZV9iYXNlbGluZXMzL2NvbW1vbi91dGlscy5weZSMBGZ1bmOUS4RDAgQBlIwDdmFslIWUKXSUUpR9lCiMC19fcGFja2FnZV9flIwYc3RhYmxlX2Jhc2VsaW5lczMuY29tbW9ulIwIX19uYW1lX1+UjB5zdGFibGVfYmFzZWxpbmVzMy5jb21tb24udXRpbHOUjAhfX2ZpbGVfX5SMeC9ob21lL3JsL1B5Y2hhcm1Qcm9qZWN0cy9PcHRpbWl6ZWRMdW5hckxhbmRlci12Mi1QUE8vdmVudi9saWIvcHl0aG9uMy4xMC9zaXRlLXBhY2thZ2VzL3N0YWJsZV9iYXNlbGluZXMzL2NvbW1vbi91dGlscy5weZR1Tk5oAIwQX21ha2VfZW1wdHlfY2VsbJSTlClSlIWUdJRSlIwcY2xvdWRwaWNrbGUuY2xvdWRwaWNrbGVfZmFzdJSMEl9mdW5jdGlvbl9zZXRzdGF0ZZSTlGgffZR9lChoFmgNjAxfX3F1YWxuYW1lX1+UjBljb25zdGFudF9mbi48bG9jYWxzPi5mdW5jlIwPX19hbm5vdGF0aW9uc19flH2UjA5fX2t3ZGVmYXVsdHNfX5ROjAxfX2RlZmF1bHRzX1+UTowKX19tb2R1bGVfX5RoF4wHX19kb2NfX5ROjAtfX2Nsb3N1cmVfX5RoAIwKX21ha2VfY2VsbJSTlEc/M6kqMFUyYYWUUpSFlIwXX2Nsb3VkcGlja2xlX3N1Ym1vZHVsZXOUXZSMC19fZ2xvYmFsc19flH2UdYaUhlIwLg=="}, "system_info": {"OS": "Linux-6.8.0-87-generic-x86_64-with-glibc2.35 # 88~22.04.1-Ubuntu SMP PREEMPT_DYNAMIC Tue Oct 14 14:03:14 UTC 2", "Python": "3.10.12", "Stable-Baselines3": "2.0.0a5", "PyTorch": "2.0.1+cu117", "GPU Enabled": "False", "Numpy": "1.26.0", "Cloudpickle": "2.2.1", "Gymnasium": "0.28.1"}}
 
1
+ {"policy_class": {":type:": "<class 'abc.ABCMeta'>", ":serialized:": "gAWVOwAAAAAAAACMIXN0YWJsZV9iYXNlbGluZXMzLmNvbW1vbi5wb2xpY2llc5SMEUFjdG9yQ3JpdGljUG9saWN5lJOULg==", "__module__": "stable_baselines3.common.policies", "__doc__": "\n Policy class for actor-critic algorithms (has both policy and value prediction).\n Used by A2C, PPO and the likes.\n\n :param observation_space: Observation space\n :param action_space: Action space\n :param lr_schedule: Learning rate schedule (could be constant)\n :param net_arch: The specification of the policy and value networks.\n :param activation_fn: Activation function\n :param ortho_init: Whether to use or not orthogonal initialization\n :param use_sde: Whether to use State Dependent Exploration or not\n :param log_std_init: Initial value for the log standard deviation\n :param full_std: Whether to use (n_features x n_actions) parameters\n for the std instead of only (n_features,) when using gSDE\n :param use_expln: Use ``expln()`` function instead of ``exp()`` to ensure\n a positive standard deviation (cf paper). It allows to keep variance\n above zero and prevent it from growing too fast. In practice, ``exp()`` is usually enough.\n :param squash_output: Whether to squash the output using a tanh function,\n this allows to ensure boundaries when using gSDE.\n :param features_extractor_class: Features extractor to use.\n :param features_extractor_kwargs: Keyword arguments\n to pass to the features extractor.\n :param share_features_extractor: If True, the features extractor is shared between the policy and value networks.\n :param normalize_images: Whether to normalize images or not,\n dividing by 255.0 (True by default)\n :param optimizer_class: The optimizer to use,\n ``th.optim.Adam`` by default\n :param optimizer_kwargs: Additional keyword arguments,\n excluding the learning rate, to pass to the optimizer\n ", "__init__": "<function ActorCriticPolicy.__init__ at 0x705d08ac3a30>", "_get_constructor_parameters": "<function ActorCriticPolicy._get_constructor_parameters at 0x705d08ac3ac0>", "reset_noise": "<function ActorCriticPolicy.reset_noise at 0x705d08ac3b50>", "_build_mlp_extractor": "<function ActorCriticPolicy._build_mlp_extractor at 0x705d08ac3be0>", "_build": "<function ActorCriticPolicy._build at 0x705d08ac3c70>", "forward": "<function ActorCriticPolicy.forward at 0x705d08ac3d00>", "extract_features": "<function ActorCriticPolicy.extract_features at 0x705d08ac3d90>", "_get_action_dist_from_latent": "<function ActorCriticPolicy._get_action_dist_from_latent at 0x705d08ac3e20>", "_predict": "<function ActorCriticPolicy._predict at 0x705d08ac3eb0>", "evaluate_actions": "<function ActorCriticPolicy.evaluate_actions at 0x705d08ac3f40>", "get_distribution": "<function ActorCriticPolicy.get_distribution at 0x705d08ad0040>", "predict_values": "<function ActorCriticPolicy.predict_values at 0x705d08ad00d0>", "__abstractmethods__": "frozenset()", "_abc_impl": "<_abc._abc_data object at 0x705d08acd500>"}, "verbose": 1, "policy_kwargs": {}, "num_timesteps": 1015808, "_total_timesteps": 1000000, "_num_timesteps_at_start": 0, "seed": null, "action_noise": null, "start_time": 1770686618978238999, "learning_rate": 0.0003, "tensorboard_log": null, "_last_obs": {":type:": "<class 'numpy.ndarray'>", ":serialized:": "gAWVdQIAAAAAAACMEm51bXB5LmNvcmUubnVtZXJpY5SMC19mcm9tYnVmZmVylJOUKJYAAgAAAAAAAFPhfD43SDq9iD0IPTO4ybwDjqK+EKx1PQAAAAAAAAAAM5kvvdBosz9y4zG/QWgKvjqsnzyS6uG8AAAAAAAAAADmu7G9hVO4ubSiDjoS/h82uuI7uxZ6JbkAAAAAAACAP5oFmjuuQZO6JphNtoIiPDEuno463qZvNQAAgD8AAIA/GnQOvV6R5T2WjCg+meR6vhTGNzyaujQ7AAAAAAAAAACg10o+u8CovPIhgDqjtRm4etEUvtf1obkAAIA/AACAP5qwiz0Fcr+7EiWku+alpDzWfhc9DoCKvQAAgD8AAIA/gBEOPT0xC7szVVo8OT+UPP0U+LvD4389AACAPwAAgD9mY0Q99gAJusa0rbt7WrE2qaPCu6m0IbYAAAAAAAAAANpxab5KTDU/OWuePfBUz75WQtS9UrEDPgAAAAAAAAAAQOGzvRkFsD4qnyk+/xt/vvpbGz13jqk9AAAAAAAAAADasyk+dahUP/ZDirxxna2+aoK8PX2tlr0AAAAAAAAAAM3Qejysp/4+4+9oPXoTqb5l94e8yeslPAAAAAAAAAAAGjb6PUmAJz25mIc9swCCvmNn8TwjmFo9AAAAAAAAAADNBOi7rkeRN1rLB7iJqU2zgZiiu8vCITcAAIA/AACAP03Zp72PjFo+V3sLPuNXVr782Mk8hfb1vAAAAAAAAAAAlIwFbnVtcHmUjAVkdHlwZZSTlIwCZjSUiYiHlFKUKEsDjAE8lE5OTkr/////Sv////9LAHSUYksQSwiGlIwBQ5R0lFKULg=="}, "_last_episode_starts": {":type:": "<class 'numpy.ndarray'>", ":serialized:": "gAWVgwAAAAAAAACMEm51bXB5LmNvcmUubnVtZXJpY5SMC19mcm9tYnVmZmVylJOUKJYQAAAAAAAAAAAAAAAAAAAAAAAAAAAAAACUjAVudW1weZSMBWR0eXBllJOUjAJiMZSJiIeUUpQoSwOMAXyUTk5OSv////9K/////0sAdJRiSxCFlIwBQ5R0lFKULg=="}, "_last_original_obs": null, "_episode_num": 0, "use_sde": false, "sde_sample_freq": -1, "_current_progress_remaining": -0.015808000000000044, "_stats_window_size": 100, "ep_info_buffer": {":type:": "<class 'collections.deque'>", ":serialized:": "gAWVPAwAAAAAAACMC2NvbGxlY3Rpb25zlIwFZGVxdWWUk5QpS2SGlFKUKH2UKIwBcpRHQG+jy5qdpZiMAWyUTZIBjAF0lEdAjrisniNsFnV9lChoBkdAceg5WRzRyGgHTSkBaAhHQI642M+/xlR1fZQoaAZHQHEyrypaRp1oB00SAWgIR0COvc2Hck+pdX2UKGgGR0Bvds/2TPjXaAdNCAFoCEdAjr4QGGEf1nV9lChoBkdAcjLr7fpD/mgHTRMBaAhHQI6+VPci4ax1fZQoaAZHQHDJjhUBGQVoB01aAWgIR0COvwYYzi0fdX2UKGgGR0ByZbobGWD6aAdNPQFoCEdAjr+XQMQVbnV9lChoBkdAcDSsabWmQGgHTQsBaAhHQI6/sUsWfsh1fZQoaAZHQHC8CS/0ulJoB00NAWgIR0COwUXJo0yhdX2UKGgGR0ByBxxVAAyVaAdNDQFoCEdAjsWHh86V+3V9lChoBkdAcVOeIEbHZWgHTRgBaAhHQI7He4smOVB1fZQoaAZHQG/Zet8uzyBoB00sAWgIR0COySQ+2VmjdX2UKGgGR0BvtzKkl/pdaAdL+2gIR0COyYIzFdcCdX2UKGgGR0BuS+0kWykcaAdNGAFoCEdAjst4NRWLgnV9lChoBkdAcLNP557gKmgHTSwBaAhHQI7MsPYnOSp1fZQoaAZHQHApaEWZZ0VoB01lAWgIR0COzZX7Lt/ndX2UKGgGR0ByCjDfm9xqaAdNSgFoCEdAjs4ex4Y773V9lChoBkdAcAwnbZezEGgHS/hoCEdAjs4n/tICl3V9lChoBkdAcQ+/8l5WzWgHTQkBaAhHQI7RTj3mFJx1fZQoaAZHQHIo+RkmQbNoB00vAWgIR0CO0lAWSEDhdX2UKGgGR0Bw84065oXbaAdNJgFoCEdAjtKVkDp1R3V9lChoBkdAb0RZ/Tb35GgHTT0BaAhHQI7S88JUo8Z1fZQoaAZHQG9rzY/Vy3loB001AWgIR0CO1Vb5dnkDdX2UKGgGR0Bybe9alk6LaAdNbQFoCEdAjtdNHH3lCHV9lChoBkdAcC0qzJIUamgHTRwBaAhHQI7YB64UeuF1fZQoaAZHQHMEb9ycTaloB00cAWgIR0CO2xtLteD4dX2UKGgGR0ByC8h5gPVeaAdNGQFoCEdAjttcU21lXnV9lChoBkdAcFDWmP5pJ2gHTSIBaAhHQI7ePalDWsl1fZQoaAZHQHBtqoqCpWFoB00aAWgIR0CO39ch1TzedX2UKGgGR0BviDbN8ma6aAdNHgFoCEdAjuDnxJ/XoXV9lChoBkdAbW7N9ph4MWgHTT4BaAhHQI7hcKu0TlF1fZQoaAZHQHFr31OCXhRoB02oAWgIR0CO5H+Vkc0cdX2UKGgGR0BW+tALRa5gaAdN6ANoCEdAjuVIAwPAf3V9lChoBkdAb/BoDgZTAGgHTRQBaAhHQI7l9IsiB5J1fZQoaAZHQHEWKXnhbW5oB00sAWgIR0CO5fTgEU0vdX2UKGgGR0BtkoqwyIpIaAdNLgFoCEdAjubb2USqVHV9lChoBkdAca8nsLORkmgHTXcBaAhHQI7nmLP2PDJ1fZQoaAZHQGt7NDlYEGJoB01BAWgIR0CO6KaBI4EPdX2UKGgGR0BxuoysS00FaAdNFQFoCEdAjuvuk+HJtHV9lChoBkdAcQoy+6Ae72gHTToBaAhHQI7sA9eQdS51fZQoaAZHQHAQpgogFHJoB00oAWgIR0CO7zn+yZ8bdX2UKGgGR0Bx8/O4XoC/aAdNDQFoCEdAjvM0q6OHWXV9lChoBkdAceazsyBTXWgHTQgBaAhHQI70gd2gWad1fZQoaAZHQHIVmpIczZZoB01GAWgIR0CO9JeyiVSodX2UKGgGR0BxLF32VVxTaAdNVAFoCEdAjvXWkBS1mnV9lChoBkdAcF5WgezUqmgHTRYBaAhHQI72VTkyULV1fZQoaAZHQHL55qIrOJNoB000AWgIR0CO+HwAlv61dX2UKGgGR0BJxoatLcsUaAdL62gIR0CO+Uzk6tDEdX2UKGgGR0ByvFEjPfKqaAdNBwFoCEdAjvl5Grjo6nV9lChoBkdAcIVuiN83M2gHTRkBaAhHQI75q1kUbkx1fZQoaAZHQG2ksqrilzloB00NAWgIR0CPFL8n/kvLdX2UKGgGR0Bv3GX/o7muaAdNNgFoCEdAjxW1LJ0W/XV9lChoBkdAcJ5K508vEmgHTQ4BaAhHQI8WEcyWRih1fZQoaAZHQFBS1XvH93toB0vCaAhHQI8YucH4XXR1fZQoaAZHQHL9IexOclRoB00LAWgIR0CPGYpYs/Y8dX2UKGgGR0Bx1Moa1kUcaAdNjQFoCEdAjxqn1FpfyHV9lChoBkdAbxqSxJNCaGgHTWMBaAhHQI8cwwdsBQx1fZQoaAZHQFPyEal1r7BoB0u6aAhHQI8dAHAymAN1fZQoaAZHQHG8OyVv/BFoB00RAWgIR0CPHmnrpqyodX2UKGgGR0BvQ8SqU/wBaAdNOwFoCEdAjyGXvH93r3V9lChoBkdAcWrvBrN4aGgHTSgBaAhHQI8iYrWiDdx1fZQoaAZHQG/JSFfzBhxoB00QAWgIR0CPJDqesgdPdX2UKGgGR0Bu00lolD4QaAdNIQFoCEdAjyWk30f5lHV9lChoBkdAcDayXD3ueGgHTSgBaAhHQI8mcWXTmXB1fZQoaAZHQHEzTewcHW1oB01nAWgIR0CPJoI55qubdX2UKGgGR0Bw99VvMr3CaAdNCwFoCEdAjybWTxG2C3V9lChoBkdAcCIaMJhOQGgHTSEBaAhHQI8nGVopQUJ1fZQoaAZHQHDAwFotcwBoB039AWgIR0CPJ9oePq9odX2UKGgGR0BtqenIhhYvaAdNLAFoCEdAjyjgSFoL5XV9lChoBkdAbhmZPVNHpmgHTRABaAhHQI8qMAq/dqN1fZQoaAZHQHDJdEXtShtoB00hAWgIR0CPK81He7+UdX2UKGgGR0BwJ0/bCaZyaAdNFwFoCEdAjyxGxUvPC3V9lChoBkdAcxP/Aj6eoWgHTQ4BaAhHQI8t9Q0oBq91fZQoaAZHQHJskoWpIc1oB00UAWgIR0CPL7zV+Zw5dX2UKGgGR0BwJmofjjrBaAdNMgFoCEdAjzAZBC2MKnV9lChoBkdAbf8NhmXgL2gHTSYBaAhHQI8zm4oZydZ1fZQoaAZHQHCT/aDf3vhoB00gAWgIR0CPM70163RYdX2UKGgGR0BxGeFHrhR7aAdL8WgIR0CPNHQa72+PdX2UKGgGR0Bu6g2sJY1YaAdNIAFoCEdAjzT/NJOFg3V9lChoBkdAbba/C66J7GgHTQQBaAhHQI81wl2NedF1fZQoaAZHQHDfJmI0qH5oB00YAWgIR0CPNjWxyGSIdX2UKGgGR0Bx+/fFaSs9aAdNJQFoCEdAjzZjdpItlXV9lChoBkdATWVTDO1OTWgHS9JoCEdAjzZht+CsfnV9lChoBkdAckmYNAkcCGgHTSwBaAhHQI83NzMibDx1fZQoaAZHQG5HtRvWH1xoB004AWgIR0CPOSGNaQmvdX2UKGgGR0Bv1ic7QswtaAdNHAFoCEdAjzwSbhFVk3V9lChoBkdAcXQ3Lmp2lmgHTQkBaAhHQI8/bEDQqqh1fZQoaAZHQHEjVmnO0LNoB005AWgIR0CPQHGH58BudX2UKGgGR0BympoWYWtVaAdL92gIR0CPQzEsrd30dX2UKGgGR0Bw9OdPLxI8aAdNCwFoCEdAj0XfXf642HV9lChoBkdAblpSYw7DEWgHTQIBaAhHQI9F/WxyGSJ1fZQoaAZHQHLy7eqJdjZoB01QAWgIR0CPRhW912aEdX2UKGgGR0BvzbEP1+RYaAdNIQFoCEdAj0kpxWDHwXV9lChoBkdAcAD1QZXMhWgHTUwBaAhHQI9JbblA/s51fZQoaAZHQHDpq/RE4NtoB00eAWgIR0CPSaFh5PdmdX2UKGgGR0ByiUCU5dWyaAdNGQFoCEdAj0y5J04io3V9lChoBkdAc3hgeRxLkGgHTVMBaAhHQI9M187ZFod1fZQoaAZHQG/q40VJtixoB010AWgIR0CPTsQhfShKdX2UKGgGR0BxIv6Hj6vaaAdNZgFoCEdAj08n8baRIXV9lChoBkdAcTpI/JNj9WgHTWEBaAhHQI9U6N6w+t91ZS4="}, "ep_success_buffer": {":type:": "<class 'collections.deque'>", ":serialized:": "gAWVIAAAAAAAAACMC2NvbGxlY3Rpb25zlIwFZGVxdWWUk5QpS2SGlFKULg=="}, "_n_updates": 248, "observation_space": {":type:": "<class 'gymnasium.spaces.box.Box'>", ":serialized:": "gAWVdgIAAAAAAACMFGd5bW5hc2l1bS5zcGFjZXMuYm94lIwDQm94lJOUKYGUfZQojAVkdHlwZZSMBW51bXB5lIwFZHR5cGWUk5SMAmY0lImIh5RSlChLA4wBPJROTk5K/////0r/////SwB0lGKMDWJvdW5kZWRfYmVsb3eUjBJudW1weS5jb3JlLm51bWVyaWOUjAtfZnJvbWJ1ZmZlcpSTlCiWCAAAAAAAAAABAQEBAQEBAZRoCIwCYjGUiYiHlFKUKEsDjAF8lE5OTkr/////Sv////9LAHSUYksIhZSMAUOUdJRSlIwNYm91bmRlZF9hYm92ZZRoESiWCAAAAAAAAAABAQEBAQEBAZRoFUsIhZRoGXSUUpSMBl9zaGFwZZRLCIWUjANsb3eUaBEoliAAAAAAAAAAAAC0wgAAtMIAAKDAAACgwNsPScAAAKDAAAAAgAAAAICUaAtLCIWUaBl0lFKUjARoaWdolGgRKJYgAAAAAAAAAAAAtEIAALRCAACgQAAAoEDbD0lAAACgQAAAgD8AAIA/lGgLSwiFlGgZdJRSlIwIbG93X3JlcHKUjFtbLTkwLiAgICAgICAgLTkwLiAgICAgICAgIC01LiAgICAgICAgIC01LiAgICAgICAgIC0zLjE0MTU5MjcgIC01LgogIC0wLiAgICAgICAgIC0wLiAgICAgICBdlIwJaGlnaF9yZXBylIxTWzkwLiAgICAgICAgOTAuICAgICAgICAgNS4gICAgICAgICA1LiAgICAgICAgIDMuMTQxNTkyNyAgNS4KICAxLiAgICAgICAgIDEuICAgICAgIF2UjApfbnBfcmFuZG9tlE51Yi4=", "dtype": "float32", "bounded_below": "[ True True True True True True True True]", "bounded_above": "[ True True True True True True True True]", "_shape": [8], "low": "[-90. -90. -5. -5. -3.1415927 -5.\n -0. -0. ]", "high": "[90. 90. 5. 5. 3.1415927 5.\n 1. 1. ]", "low_repr": "[-90. -90. -5. -5. -3.1415927 -5.\n -0. -0. ]", "high_repr": "[90. 90. 5. 5. 3.1415927 5.\n 1. 1. ]", "_np_random": null}, "action_space": {":type:": "<class 'gymnasium.spaces.discrete.Discrete'>", ":serialized:": "gAWV2wAAAAAAAACMGWd5bW5hc2l1bS5zcGFjZXMuZGlzY3JldGWUjAhEaXNjcmV0ZZSTlCmBlH2UKIwBbpSMFW51bXB5LmNvcmUubXVsdGlhcnJheZSMBnNjYWxhcpSTlIwFbnVtcHmUjAVkdHlwZZSTlIwCaTiUiYiHlFKUKEsDjAE8lE5OTkr/////Sv////9LAHSUYkMIBAAAAAAAAACUhpRSlIwFc3RhcnSUaAhoDkMIAAAAAAAAAACUhpRSlIwGX3NoYXBllCmMBWR0eXBllGgOjApfbnBfcmFuZG9tlE51Yi4=", "n": "4", "start": "0", "_shape": [], "dtype": "int64", "_np_random": null}, "n_envs": 16, "n_steps": 1024, "gamma": 0.999, "gae_lambda": 0.98, "ent_coef": 0.01, "vf_coef": 0.5, "max_grad_norm": 0.5, "batch_size": 64, "n_epochs": 4, "clip_range": {":type:": "<class 'function'>", ":serialized:": "gAWVIwMAAAAAAACMF2Nsb3VkcGlja2xlLmNsb3VkcGlja2xllIwOX21ha2VfZnVuY3Rpb26Uk5QoaACMDV9idWlsdGluX3R5cGWUk5SMCENvZGVUeXBllIWUUpQoSwFLAEsASwFLAUsTQwSIAFMAlE6FlCmMAV+UhZSMeC9ob21lL3JsL1B5Y2hhcm1Qcm9qZWN0cy9PcHRpbWl6ZWRMdW5hckxhbmRlci12Mi1QUE8vdmVudi9saWIvcHl0aG9uMy4xMC9zaXRlLXBhY2thZ2VzL3N0YWJsZV9iYXNlbGluZXMzL2NvbW1vbi91dGlscy5weZSMBGZ1bmOUS4RDAgQBlIwDdmFslIWUKXSUUpR9lCiMC19fcGFja2FnZV9flIwYc3RhYmxlX2Jhc2VsaW5lczMuY29tbW9ulIwIX19uYW1lX1+UjB5zdGFibGVfYmFzZWxpbmVzMy5jb21tb24udXRpbHOUjAhfX2ZpbGVfX5SMeC9ob21lL3JsL1B5Y2hhcm1Qcm9qZWN0cy9PcHRpbWl6ZWRMdW5hckxhbmRlci12Mi1QUE8vdmVudi9saWIvcHl0aG9uMy4xMC9zaXRlLXBhY2thZ2VzL3N0YWJsZV9iYXNlbGluZXMzL2NvbW1vbi91dGlscy5weZR1Tk5oAIwQX21ha2VfZW1wdHlfY2VsbJSTlClSlIWUdJRSlIwcY2xvdWRwaWNrbGUuY2xvdWRwaWNrbGVfZmFzdJSMEl9mdW5jdGlvbl9zZXRzdGF0ZZSTlGgffZR9lChoFmgNjAxfX3F1YWxuYW1lX1+UjBljb25zdGFudF9mbi48bG9jYWxzPi5mdW5jlIwPX19hbm5vdGF0aW9uc19flH2UjA5fX2t3ZGVmYXVsdHNfX5ROjAxfX2RlZmF1bHRzX1+UTowKX19tb2R1bGVfX5RoF4wHX19kb2NfX5ROjAtfX2Nsb3N1cmVfX5RoAIwKX21ha2VfY2VsbJSTlEc/yZmZmZmZmoWUUpSFlIwXX2Nsb3VkcGlja2xlX3N1Ym1vZHVsZXOUXZSMC19fZ2xvYmFsc19flH2UdYaUhlIwLg=="}, "clip_range_vf": null, "normalize_advantage": true, "target_kl": null, "lr_schedule": {":type:": "<class 'function'>", ":serialized:": "gAWVIwMAAAAAAACMF2Nsb3VkcGlja2xlLmNsb3VkcGlja2xllIwOX21ha2VfZnVuY3Rpb26Uk5QoaACMDV9idWlsdGluX3R5cGWUk5SMCENvZGVUeXBllIWUUpQoSwFLAEsASwFLAUsTQwSIAFMAlE6FlCmMAV+UhZSMeC9ob21lL3JsL1B5Y2hhcm1Qcm9qZWN0cy9PcHRpbWl6ZWRMdW5hckxhbmRlci12Mi1QUE8vdmVudi9saWIvcHl0aG9uMy4xMC9zaXRlLXBhY2thZ2VzL3N0YWJsZV9iYXNlbGluZXMzL2NvbW1vbi91dGlscy5weZSMBGZ1bmOUS4RDAgQBlIwDdmFslIWUKXSUUpR9lCiMC19fcGFja2FnZV9flIwYc3RhYmxlX2Jhc2VsaW5lczMuY29tbW9ulIwIX19uYW1lX1+UjB5zdGFibGVfYmFzZWxpbmVzMy5jb21tb24udXRpbHOUjAhfX2ZpbGVfX5SMeC9ob21lL3JsL1B5Y2hhcm1Qcm9qZWN0cy9PcHRpbWl6ZWRMdW5hckxhbmRlci12Mi1QUE8vdmVudi9saWIvcHl0aG9uMy4xMC9zaXRlLXBhY2thZ2VzL3N0YWJsZV9iYXNlbGluZXMzL2NvbW1vbi91dGlscy5weZR1Tk5oAIwQX21ha2VfZW1wdHlfY2VsbJSTlClSlIWUdJRSlIwcY2xvdWRwaWNrbGUuY2xvdWRwaWNrbGVfZmFzdJSMEl9mdW5jdGlvbl9zZXRzdGF0ZZSTlGgffZR9lChoFmgNjAxfX3F1YWxuYW1lX1+UjBljb25zdGFudF9mbi48bG9jYWxzPi5mdW5jlIwPX19hbm5vdGF0aW9uc19flH2UjA5fX2t3ZGVmYXVsdHNfX5ROjAxfX2RlZmF1bHRzX1+UTowKX19tb2R1bGVfX5RoF4wHX19kb2NfX5ROjAtfX2Nsb3N1cmVfX5RoAIwKX21ha2VfY2VsbJSTlEc/M6kqMFUyYYWUUpSFlIwXX2Nsb3VkcGlja2xlX3N1Ym1vZHVsZXOUXZSMC19fZ2xvYmFsc19flH2UdYaUhlIwLg=="}, "system_info": {"OS": "Linux-6.8.0-87-generic-x86_64-with-glibc2.35 # 88~22.04.1-Ubuntu SMP PREEMPT_DYNAMIC Tue Oct 14 14:03:14 UTC 2", "Python": "3.10.12", "Stable-Baselines3": "2.0.0a5", "PyTorch": "2.0.1+cu117", "GPU Enabled": "False", "Numpy": "1.26.0", "Cloudpickle": "2.2.1", "Gymnasium": "0.28.1"}}
ppo-lunarLander-v2.zip CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:f248f1f67abe04265ed40be1ab05ea959a1d216707f88a033fcc020f116d73ce
3
- size 146479
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c5d62f5f1945cd510b5fb137fdc030fd7fb3ba5650233212c82114acdc586ffe
3
+ size 146523
ppo-lunarLander-v2/data CHANGED
@@ -4,20 +4,20 @@
4
  ":serialized:": "gAWVOwAAAAAAAACMIXN0YWJsZV9iYXNlbGluZXMzLmNvbW1vbi5wb2xpY2llc5SMEUFjdG9yQ3JpdGljUG9saWN5lJOULg==",
5
  "__module__": "stable_baselines3.common.policies",
6
  "__doc__": "\n Policy class for actor-critic algorithms (has both policy and value prediction).\n Used by A2C, PPO and the likes.\n\n :param observation_space: Observation space\n :param action_space: Action space\n :param lr_schedule: Learning rate schedule (could be constant)\n :param net_arch: The specification of the policy and value networks.\n :param activation_fn: Activation function\n :param ortho_init: Whether to use or not orthogonal initialization\n :param use_sde: Whether to use State Dependent Exploration or not\n :param log_std_init: Initial value for the log standard deviation\n :param full_std: Whether to use (n_features x n_actions) parameters\n for the std instead of only (n_features,) when using gSDE\n :param use_expln: Use ``expln()`` function instead of ``exp()`` to ensure\n a positive standard deviation (cf paper). It allows to keep variance\n above zero and prevent it from growing too fast. In practice, ``exp()`` is usually enough.\n :param squash_output: Whether to squash the output using a tanh function,\n this allows to ensure boundaries when using gSDE.\n :param features_extractor_class: Features extractor to use.\n :param features_extractor_kwargs: Keyword arguments\n to pass to the features extractor.\n :param share_features_extractor: If True, the features extractor is shared between the policy and value networks.\n :param normalize_images: Whether to normalize images or not,\n dividing by 255.0 (True by default)\n :param optimizer_class: The optimizer to use,\n ``th.optim.Adam`` by default\n :param optimizer_kwargs: Additional keyword arguments,\n excluding the learning rate, to pass to the optimizer\n ",
7
- "__init__": "<function ActorCriticPolicy.__init__ at 0x7af4fcebba30>",
8
- "_get_constructor_parameters": "<function ActorCriticPolicy._get_constructor_parameters at 0x7af4fcebbac0>",
9
- "reset_noise": "<function ActorCriticPolicy.reset_noise at 0x7af4fcebbb50>",
10
- "_build_mlp_extractor": "<function ActorCriticPolicy._build_mlp_extractor at 0x7af4fcebbbe0>",
11
- "_build": "<function ActorCriticPolicy._build at 0x7af4fcebbc70>",
12
- "forward": "<function ActorCriticPolicy.forward at 0x7af4fcebbd00>",
13
- "extract_features": "<function ActorCriticPolicy.extract_features at 0x7af4fcebbd90>",
14
- "_get_action_dist_from_latent": "<function ActorCriticPolicy._get_action_dist_from_latent at 0x7af4fcebbe20>",
15
- "_predict": "<function ActorCriticPolicy._predict at 0x7af4fcebbeb0>",
16
- "evaluate_actions": "<function ActorCriticPolicy.evaluate_actions at 0x7af4fcebbf40>",
17
- "get_distribution": "<function ActorCriticPolicy.get_distribution at 0x7af4fcec4040>",
18
- "predict_values": "<function ActorCriticPolicy.predict_values at 0x7af4fcec40d0>",
19
  "__abstractmethods__": "frozenset()",
20
- "_abc_impl": "<_abc._abc_data object at 0x7af4fceb3280>"
21
  },
22
  "verbose": 1,
23
  "policy_kwargs": {},
@@ -26,12 +26,12 @@
26
  "_num_timesteps_at_start": 0,
27
  "seed": null,
28
  "action_noise": null,
29
- "start_time": 1770578468713797764,
30
  "learning_rate": 0.0003,
31
  "tensorboard_log": null,
32
  "_last_obs": {
33
  ":type:": "<class 'numpy.ndarray'>",
34
- ":serialized:": "gAWVdQIAAAAAAACMEm51bXB5LmNvcmUubnVtZXJpY5SMC19mcm9tYnVmZmVylJOUKJYAAgAAAAAAAAAwFT39hQE82QEHvpaAWr6IrzK9pF/HPQAAAAAAAAAA5c0UP8+MSb5FOII5Mp2Yt8VURL5mzRq3AACAPwAAgD/NIpC8j95Vugw7NDmrHOI1b3VWOth1ULgAAIA/AACAP4bCaL5EoSo/C5pqvf5f6b4b6CS+Ps60PQAAAAAAAAAA7RWlProVID8wW969mkTHviB/JT5SS0a+AAAAAAAAAABTlKU+TkkZP7tX371k07y+fu7rPbIqs70AAAAAAAAAAGY+DjtlcLg/E+AVPWWJHz7wTiG7gD0GvAAAAAAAAAAAzdeXvOGogboCHEk31XxMMpKTK7pDhGq2AACAPwAAgD8aYq+94hR9P0YcM7wME/m+sFG0vdVoVDwAAAAAAAAAAJrIBj25t4o/tiXGPSP1CL9+ZqI9SFvDPQAAAAAAAAAAbXCKvrz0Wz9+44u+6+rvvsoLyb7uSSg9AAAAAAAAAABzpLM9bMrmPtiZ17z1Va++KzZDuxi+ib0AAAAAAAAAAEAbmz3hQyY/GgUCPVWEzr7ubA49yo+qOwAAAAAAAAAAGkKRPhEULL2jUg47halPulxbl74dntu5AACAPwAAgD/T9Xs+/M2tPttJl76LpYG+6G9bvY1v970AAAAAAAAAADV9l76TPXs/rKm0voGK7r6aEta+kNGDvQAAAAAAAAAAlIwFbnVtcHmUjAVkdHlwZZSTlIwCZjSUiYiHlFKUKEsDjAE8lE5OTkr/////Sv////9LAHSUYksQSwiGlIwBQ5R0lFKULg=="
35
  },
36
  "_last_episode_starts": {
37
  ":type:": "<class 'numpy.ndarray'>",
@@ -45,7 +45,7 @@
45
  "_stats_window_size": 100,
46
  "ep_info_buffer": {
47
  ":type:": "<class 'collections.deque'>",
48
- ":serialized:": "gAWVGgwAAAAAAACMC2NvbGxlY3Rpb25zlIwFZGVxdWWUk5QpS2SGlFKUKH2UKIwBcpRHQHLQnpr1uiyMAWyUTREBjAF0lEdAjXdOUdJaq3V9lChoBkdAciR/4ZdfLWgHTRMBaAhHQI15E052hZh1fZQoaAZHQHChX7+DOC5oB00LAWgIR0CNeQ0SAYpEdX2UKGgGR0BxN6nCO3lTaAdNBgFoCEdAjXuZKODJ2nV9lChoBkdAcsc6dDpkgGgHTTABaAhHQI17uWD6Fdt1fZQoaAZHQHIXA/keZG9oB0vuaAhHQI18VR+BpYd1fZQoaAZHQHGz76P8yetoB00bAWgIR0CNfgOhkAggdX2UKGgGR0BwVE6aLGaQaAdNKQFoCEdAjX4mig00nHV9lChoBkdAcbToJRfnfWgHS+RoCEdAjX8GRmseXHV9lChoBkdAcJJjJdSl32gHS+FoCEdAjX8j9n9NvnV9lChoBkdAcOx0dRzij2gHS89oCEdAjX+gPEsJ6nV9lChoBkdAcRqudPLxJGgHTQMBaAhHQI2AlNi6QNl1fZQoaAZHQHArrFsHjZNoB0v6aAhHQI2Bi2tuDSR1fZQoaAZHQHDaCBf8dghoB0v3aAhHQI2CEl7dBSl1fZQoaAZHQHIQ2bCrLhdoB0v9aAhHQI2EJrP+n651fZQoaAZHQHInq68QI2RoB00TAWgIR0CNhIRU3n6mdX2UKGgGR0BxYIA80UGnaAdNEAFoCEdAjYV69sabWnV9lChoBkdAQjyZnctXgmgHS7NoCEdAjYZ2qkuYhXV9lChoBkdAcBGdLg4wRGgHTQkBaAhHQI2G2SlnAZd1fZQoaAZHQHDYphfBvaVoB00OAWgIR0CNhx2OhkAhdX2UKGgGR0BxrOIWP91maAdNAgFoCEdAjYi4cFQl8nV9lChoBkdAccxpj+aScWgHTRIBaAhHQI2Jsi0OVgR1fZQoaAZHQG4iDLbHp8poB00hAWgIR0CNiveQdS2qdX2UKGgGR0BzbUV/MGHIaAdL3WgIR0CNi3PHktEodX2UKGgGR0Bxd7jQzDXOaAdNGQFoCEdAjYvaE8JUpHV9lChoBkdAcWHgjyFwk2gHTQ0BaAhHQI2L+mpEQXh1fZQoaAZHQHJzCuIRAbBoB00KAWgIR0CNjHqiXY16dX2UKGgGR0BwZqV4X40uaAdNKwFoCEdAjY2TND+irXV9lChoBkdAcIVaTOgQH2gHTQkBaAhHQI2PtnK4hEB1fZQoaAZHQHLHOzyBkI5oB0v2aAhHQI2RFNN8E3d1fZQoaAZHQHK9urZJ04loB0vxaAhHQI2SFiay8jB1fZQoaAZHQHJxjfaYeDFoB0vgaAhHQI2SQnH/9511fZQoaAZHQHIK1UlzEJloB00aAWgIR0CNk5OymhugdX2UKGgGR0Bwzj8gpz91aAdL8WgIR0CNlJw9aEBbdX2UKGgGR0Bxe2Y5T6zmaAdNDAFoCEdAjZZ90Rvm5nV9lChoBkdAcN9sdDIBBGgHS/9oCEdAjZj7TtsvZnV9lChoBkdAbr+b6P8ye2gHS+9oCEdAjZ3EdvKlpHV9lChoBkdAcUPq33Hq/2gHS/9oCEdAjZ3rdFfAsXV9lChoBkdAco+0T101ZWgHTRIBaAhHQI2eD4vexfR1fZQoaAZHQHGZcp5NXYFoB00MAWgIR0CNnsz6ab4KdX2UKGgGR0BzHsAMlTm5aAdNGQFoCEdAjZ7wxWT5f3V9lChoBkdAcIo/NJOFg2gHTQMBaAhHQI2f/dl/Yrd1fZQoaAZHQG9ym0eEIxBoB0vwaAhHQI2jRF1B+nZ1fZQoaAZHQHEU7Ackt29oB00rAWgIR0CNuth60IC2dX2UKGgGR0By4BWT5ftyaAdNFAFoCEdAjbx606YE4nV9lChoBkdAccHabWmP52gHS/1oCEdAjbziT2WY4XV9lChoBkdAcVYnjhky12gHTTwBaAhHQI2+mQ2dd3V1fZQoaAZHQG4RELx7RfFoB00LAWgIR0CNvuvLX+VDdX2UKGgGR0Bx/X446wMZaAdNBgFoCEdAjb/5GKAJ9nV9lChoBkdAcC8Jm/WUbGgHS+poCEdAjcHDIJZ4fXV9lChoBkdAck0VX3g1nGgHS9hoCEdAjcHl7laKUHV9lChoBkdAcXv8YAKfF2gHS+JoCEdAjcJNdqtYCHV9lChoBkdAcXh9eQdS22gHTQIBaAhHQI3DR3NcGC91fZQoaAZHQG82EAHVwxZoB00GAWgIR0CNw18BuGbkdX2UKGgGR0BwF4ZsKsuGaAdNmQFoCEdAjcTxC6YmcHV9lChoBkdAcuQr2QGOdWgHS+VoCEdAjcX2Ebo8p3V9lChoBkdAcXDaoMrmQ2gHTSkBaAhHQI3H09fTkQx1fZQoaAZHQHIL8YuTRploB00XAWgIR0CNy52h7E5ydX2UKGgGR0By5xVU+9rXaAdNBgFoCEdAjcy9pZfUnXV9lChoBkdAcgJrhR64UmgHTRcBaAhHQI3NagoPTXt1fZQoaAZHQHFqbUXpGF1oB0voaAhHQI3OYBtDUmV1fZQoaAZHQHBEHMEA5rBoB00RAWgIR0CNz96cAimmdX2UKGgGR0BvnTBMzuWsaAdL8WgIR0CN0Pb6guh9dX2UKGgGR0BxuamALApKaAdL6mgIR0CN0R9Aood/dX2UKGgGR0BW9Wyon8baaAdN6ANoCEdAjdUjV6NVBHV9lChoBkdAcX6IRh+fAmgHTRsBaAhHQI3VhQk5ZKZ1fZQoaAZHQHEswmReTmpoB0vsaAhHQI3VqKaXrt51fZQoaAZHQG/B3++/QBxoB0vcaAhHQI3WWyVv/BF1fZQoaAZHQHHNxQN0/4ZoB00NAWgIR0CN1q19fCyhdX2UKGgGR0BymNP3ztkXaAdNTwFoCEdAjdcgqur6tXV9lChoBkdAcohdEb5uZWgHTYcBaAhHQI3XHtBv73x1fZQoaAZHQHA0UaZQYUFoB0vhaAhHQI3aZZr56+p1fZQoaAZHQG+bvcrRSgpoB0vpaAhHQI3c2GmDUVl1fZQoaAZHQFDVehPCVKRoB03oA2gIR0CN4DhBJI1+dX2UKGgGR0BwIAuctoSMaAdNKgFoCEdAjeCEehf0E3V9lChoBkdAcPYNEw35vmgHS/RoCEdAjeE/eDWbw3V9lChoBkdAc6cP+4smOWgHTSIBaAhHQI3jU8Tzund1fZQoaAZHQG4EbGFSKm9oB00rAWgIR0CN5PRO1v2odX2UKGgGR0ByciO6unuRaAdL2WgIR0CN5VbDdgv2dX2UKGgGR0Bv7NWyTpxFaAdL82gIR0CN5YM98qnWdX2UKGgGR0Bw1s3974SIaAdL2mgIR0CN5dvhIe5ndX2UKGgGR0BwyUo3Jgb7aAdNCQFoCEdAjecYkeIVM3V9lChoBkdAcULQlruYyGgHTRABaAhHQI3nbbg0j1R1fZQoaAZHQHAz5avA44poB00cAWgIR0CN6aGUwBYFdX2UKGgGR0Bxl0JD3M6jaAdL3GgIR0CN62Gxlg+hdX2UKGgGR0BymIwqRU3oaAdNBgFoCEdAjevRYA80UHV9lChoBkdAcdRKKYRdyGgHTUwBaAhHQI3sfsAvL5h1fZQoaAZHQD+QCJXQtz1oB0uvaAhHQI3tNsUIsy11fZQoaAZHQHAsKNAC4jNoB0vxaAhHQI3xVNnGsFN1fZQoaAZHQHEBNw71ZkloB00LAWgIR0CN9ozkZJkHdX2UKGgGR0BzIhDlYEGJaAdL9mgIR0CN9uLdepn6dX2UKGgGR0By0n+YMOPOaAdNPAFoCEdAjfcX18LKFXV9lChoBkdAbqhkiliz9mgHS/FoCEdAjfelqi48U3V9lChoBkdAciQwazeGf2gHTQcBaAhHQI34j7qIJqt1fZQoaAZHQDe28274BWBoB0u5aAhHQI35oxtYSxt1fZQoaAZHQHElwj+rELpoB0v6aAhHQI35wNNJvpB1fZQoaAZHQHD/iNKh+ORoB00oAWgIR0CN+s5OrQw9dX2UKGgGR0Bw5a5oXbdraAdNCQFoCEdAjfsBCdBjWnV9lChoBkdAc73TKkl/pmgHS9poCEdAjfyMMiKR+3V9lChoBkdAcZnv5xiobWgHS/ZoCEdAjf3JjUd7wHVlLg=="
49
  },
50
  "ep_success_buffer": {
51
  ":type:": "<class 'collections.deque'>",
 
4
  ":serialized:": "gAWVOwAAAAAAAACMIXN0YWJsZV9iYXNlbGluZXMzLmNvbW1vbi5wb2xpY2llc5SMEUFjdG9yQ3JpdGljUG9saWN5lJOULg==",
5
  "__module__": "stable_baselines3.common.policies",
6
  "__doc__": "\n Policy class for actor-critic algorithms (has both policy and value prediction).\n Used by A2C, PPO and the likes.\n\n :param observation_space: Observation space\n :param action_space: Action space\n :param lr_schedule: Learning rate schedule (could be constant)\n :param net_arch: The specification of the policy and value networks.\n :param activation_fn: Activation function\n :param ortho_init: Whether to use or not orthogonal initialization\n :param use_sde: Whether to use State Dependent Exploration or not\n :param log_std_init: Initial value for the log standard deviation\n :param full_std: Whether to use (n_features x n_actions) parameters\n for the std instead of only (n_features,) when using gSDE\n :param use_expln: Use ``expln()`` function instead of ``exp()`` to ensure\n a positive standard deviation (cf paper). It allows to keep variance\n above zero and prevent it from growing too fast. In practice, ``exp()`` is usually enough.\n :param squash_output: Whether to squash the output using a tanh function,\n this allows to ensure boundaries when using gSDE.\n :param features_extractor_class: Features extractor to use.\n :param features_extractor_kwargs: Keyword arguments\n to pass to the features extractor.\n :param share_features_extractor: If True, the features extractor is shared between the policy and value networks.\n :param normalize_images: Whether to normalize images or not,\n dividing by 255.0 (True by default)\n :param optimizer_class: The optimizer to use,\n ``th.optim.Adam`` by default\n :param optimizer_kwargs: Additional keyword arguments,\n excluding the learning rate, to pass to the optimizer\n ",
7
+ "__init__": "<function ActorCriticPolicy.__init__ at 0x705d08ac3a30>",
8
+ "_get_constructor_parameters": "<function ActorCriticPolicy._get_constructor_parameters at 0x705d08ac3ac0>",
9
+ "reset_noise": "<function ActorCriticPolicy.reset_noise at 0x705d08ac3b50>",
10
+ "_build_mlp_extractor": "<function ActorCriticPolicy._build_mlp_extractor at 0x705d08ac3be0>",
11
+ "_build": "<function ActorCriticPolicy._build at 0x705d08ac3c70>",
12
+ "forward": "<function ActorCriticPolicy.forward at 0x705d08ac3d00>",
13
+ "extract_features": "<function ActorCriticPolicy.extract_features at 0x705d08ac3d90>",
14
+ "_get_action_dist_from_latent": "<function ActorCriticPolicy._get_action_dist_from_latent at 0x705d08ac3e20>",
15
+ "_predict": "<function ActorCriticPolicy._predict at 0x705d08ac3eb0>",
16
+ "evaluate_actions": "<function ActorCriticPolicy.evaluate_actions at 0x705d08ac3f40>",
17
+ "get_distribution": "<function ActorCriticPolicy.get_distribution at 0x705d08ad0040>",
18
+ "predict_values": "<function ActorCriticPolicy.predict_values at 0x705d08ad00d0>",
19
  "__abstractmethods__": "frozenset()",
20
+ "_abc_impl": "<_abc._abc_data object at 0x705d08acd500>"
21
  },
22
  "verbose": 1,
23
  "policy_kwargs": {},
 
26
  "_num_timesteps_at_start": 0,
27
  "seed": null,
28
  "action_noise": null,
29
+ "start_time": 1770686618978238999,
30
  "learning_rate": 0.0003,
31
  "tensorboard_log": null,
32
  "_last_obs": {
33
  ":type:": "<class 'numpy.ndarray'>",
34
+ ":serialized:": "gAWVdQIAAAAAAACMEm51bXB5LmNvcmUubnVtZXJpY5SMC19mcm9tYnVmZmVylJOUKJYAAgAAAAAAAFPhfD43SDq9iD0IPTO4ybwDjqK+EKx1PQAAAAAAAAAAM5kvvdBosz9y4zG/QWgKvjqsnzyS6uG8AAAAAAAAAADmu7G9hVO4ubSiDjoS/h82uuI7uxZ6JbkAAAAAAACAP5oFmjuuQZO6JphNtoIiPDEuno463qZvNQAAgD8AAIA/GnQOvV6R5T2WjCg+meR6vhTGNzyaujQ7AAAAAAAAAACg10o+u8CovPIhgDqjtRm4etEUvtf1obkAAIA/AACAP5qwiz0Fcr+7EiWku+alpDzWfhc9DoCKvQAAgD8AAIA/gBEOPT0xC7szVVo8OT+UPP0U+LvD4389AACAPwAAgD9mY0Q99gAJusa0rbt7WrE2qaPCu6m0IbYAAAAAAAAAANpxab5KTDU/OWuePfBUz75WQtS9UrEDPgAAAAAAAAAAQOGzvRkFsD4qnyk+/xt/vvpbGz13jqk9AAAAAAAAAADasyk+dahUP/ZDirxxna2+aoK8PX2tlr0AAAAAAAAAAM3Qejysp/4+4+9oPXoTqb5l94e8yeslPAAAAAAAAAAAGjb6PUmAJz25mIc9swCCvmNn8TwjmFo9AAAAAAAAAADNBOi7rkeRN1rLB7iJqU2zgZiiu8vCITcAAIA/AACAP03Zp72PjFo+V3sLPuNXVr782Mk8hfb1vAAAAAAAAAAAlIwFbnVtcHmUjAVkdHlwZZSTlIwCZjSUiYiHlFKUKEsDjAE8lE5OTkr/////Sv////9LAHSUYksQSwiGlIwBQ5R0lFKULg=="
35
  },
36
  "_last_episode_starts": {
37
  ":type:": "<class 'numpy.ndarray'>",
 
45
  "_stats_window_size": 100,
46
  "ep_info_buffer": {
47
  ":type:": "<class 'collections.deque'>",
48
+ ":serialized:": "gAWVPAwAAAAAAACMC2NvbGxlY3Rpb25zlIwFZGVxdWWUk5QpS2SGlFKUKH2UKIwBcpRHQG+jy5qdpZiMAWyUTZIBjAF0lEdAjrisniNsFnV9lChoBkdAceg5WRzRyGgHTSkBaAhHQI642M+/xlR1fZQoaAZHQHEyrypaRp1oB00SAWgIR0COvc2Hck+pdX2UKGgGR0Bvds/2TPjXaAdNCAFoCEdAjr4QGGEf1nV9lChoBkdAcjLr7fpD/mgHTRMBaAhHQI6+VPci4ax1fZQoaAZHQHDJjhUBGQVoB01aAWgIR0COvwYYzi0fdX2UKGgGR0ByZbobGWD6aAdNPQFoCEdAjr+XQMQVbnV9lChoBkdAcDSsabWmQGgHTQsBaAhHQI6/sUsWfsh1fZQoaAZHQHC8CS/0ulJoB00NAWgIR0COwUXJo0yhdX2UKGgGR0ByBxxVAAyVaAdNDQFoCEdAjsWHh86V+3V9lChoBkdAcVOeIEbHZWgHTRgBaAhHQI7He4smOVB1fZQoaAZHQG/Zet8uzyBoB00sAWgIR0COySQ+2VmjdX2UKGgGR0BvtzKkl/pdaAdL+2gIR0COyYIzFdcCdX2UKGgGR0BuS+0kWykcaAdNGAFoCEdAjst4NRWLgnV9lChoBkdAcLNP557gKmgHTSwBaAhHQI7MsPYnOSp1fZQoaAZHQHApaEWZZ0VoB01lAWgIR0COzZX7Lt/ndX2UKGgGR0ByCjDfm9xqaAdNSgFoCEdAjs4ex4Y773V9lChoBkdAcAwnbZezEGgHS/hoCEdAjs4n/tICl3V9lChoBkdAcQ+/8l5WzWgHTQkBaAhHQI7RTj3mFJx1fZQoaAZHQHIo+RkmQbNoB00vAWgIR0CO0lAWSEDhdX2UKGgGR0Bw84065oXbaAdNJgFoCEdAjtKVkDp1R3V9lChoBkdAb0RZ/Tb35GgHTT0BaAhHQI7S88JUo8Z1fZQoaAZHQG9rzY/Vy3loB001AWgIR0CO1Vb5dnkDdX2UKGgGR0Bybe9alk6LaAdNbQFoCEdAjtdNHH3lCHV9lChoBkdAcC0qzJIUamgHTRwBaAhHQI7YB64UeuF1fZQoaAZHQHMEb9ycTaloB00cAWgIR0CO2xtLteD4dX2UKGgGR0ByC8h5gPVeaAdNGQFoCEdAjttcU21lXnV9lChoBkdAcFDWmP5pJ2gHTSIBaAhHQI7ePalDWsl1fZQoaAZHQHBtqoqCpWFoB00aAWgIR0CO39ch1TzedX2UKGgGR0BviDbN8ma6aAdNHgFoCEdAjuDnxJ/XoXV9lChoBkdAbW7N9ph4MWgHTT4BaAhHQI7hcKu0TlF1fZQoaAZHQHFr31OCXhRoB02oAWgIR0CO5H+Vkc0cdX2UKGgGR0BW+tALRa5gaAdN6ANoCEdAjuVIAwPAf3V9lChoBkdAb/BoDgZTAGgHTRQBaAhHQI7l9IsiB5J1fZQoaAZHQHEWKXnhbW5oB00sAWgIR0CO5fTgEU0vdX2UKGgGR0BtkoqwyIpIaAdNLgFoCEdAjubb2USqVHV9lChoBkdAca8nsLORkmgHTXcBaAhHQI7nmLP2PDJ1fZQoaAZHQGt7NDlYEGJoB01BAWgIR0CO6KaBI4EPdX2UKGgGR0BxuoysS00FaAdNFQFoCEdAjuvuk+HJtHV9lChoBkdAcQoy+6Ae72gHTToBaAhHQI7sA9eQdS51fZQoaAZHQHAQpgogFHJoB00oAWgIR0CO7zn+yZ8bdX2UKGgGR0Bx8/O4XoC/aAdNDQFoCEdAjvM0q6OHWXV9lChoBkdAceazsyBTXWgHTQgBaAhHQI70gd2gWad1fZQoaAZHQHIVmpIczZZoB01GAWgIR0CO9JeyiVSodX2UKGgGR0BxLF32VVxTaAdNVAFoCEdAjvXWkBS1mnV9lChoBkdAcF5WgezUqmgHTRYBaAhHQI72VTkyULV1fZQoaAZHQHL55qIrOJNoB000AWgIR0CO+HwAlv61dX2UKGgGR0BJxoatLcsUaAdL62gIR0CO+Uzk6tDEdX2UKGgGR0ByvFEjPfKqaAdNBwFoCEdAjvl5Grjo6nV9lChoBkdAcIVuiN83M2gHTRkBaAhHQI75q1kUbkx1fZQoaAZHQG2ksqrilzloB00NAWgIR0CPFL8n/kvLdX2UKGgGR0Bv3GX/o7muaAdNNgFoCEdAjxW1LJ0W/XV9lChoBkdAcJ5K508vEmgHTQ4BaAhHQI8WEcyWRih1fZQoaAZHQFBS1XvH93toB0vCaAhHQI8YucH4XXR1fZQoaAZHQHL9IexOclRoB00LAWgIR0CPGYpYs/Y8dX2UKGgGR0Bx1Moa1kUcaAdNjQFoCEdAjxqn1FpfyHV9lChoBkdAbxqSxJNCaGgHTWMBaAhHQI8cwwdsBQx1fZQoaAZHQFPyEal1r7BoB0u6aAhHQI8dAHAymAN1fZQoaAZHQHG8OyVv/BFoB00RAWgIR0CPHmnrpqyodX2UKGgGR0BvQ8SqU/wBaAdNOwFoCEdAjyGXvH93r3V9lChoBkdAcWrvBrN4aGgHTSgBaAhHQI8iYrWiDdx1fZQoaAZHQG/JSFfzBhxoB00QAWgIR0CPJDqesgdPdX2UKGgGR0Bu00lolD4QaAdNIQFoCEdAjyWk30f5lHV9lChoBkdAcDayXD3ueGgHTSgBaAhHQI8mcWXTmXB1fZQoaAZHQHEzTewcHW1oB01nAWgIR0CPJoI55qubdX2UKGgGR0Bw99VvMr3CaAdNCwFoCEdAjybWTxG2C3V9lChoBkdAcCIaMJhOQGgHTSEBaAhHQI8nGVopQUJ1fZQoaAZHQHDAwFotcwBoB039AWgIR0CPJ9oePq9odX2UKGgGR0BtqenIhhYvaAdNLAFoCEdAjyjgSFoL5XV9lChoBkdAbhmZPVNHpmgHTRABaAhHQI8qMAq/dqN1fZQoaAZHQHDJdEXtShtoB00hAWgIR0CPK81He7+UdX2UKGgGR0BwJ0/bCaZyaAdNFwFoCEdAjyxGxUvPC3V9lChoBkdAcxP/Aj6eoWgHTQ4BaAhHQI8t9Q0oBq91fZQoaAZHQHJskoWpIc1oB00UAWgIR0CPL7zV+Zw5dX2UKGgGR0BwJmofjjrBaAdNMgFoCEdAjzAZBC2MKnV9lChoBkdAbf8NhmXgL2gHTSYBaAhHQI8zm4oZydZ1fZQoaAZHQHCT/aDf3vhoB00gAWgIR0CPM70163RYdX2UKGgGR0BxGeFHrhR7aAdL8WgIR0CPNHQa72+PdX2UKGgGR0Bu6g2sJY1YaAdNIAFoCEdAjzT/NJOFg3V9lChoBkdAbba/C66J7GgHTQQBaAhHQI81wl2NedF1fZQoaAZHQHDfJmI0qH5oB00YAWgIR0CPNjWxyGSIdX2UKGgGR0Bx+/fFaSs9aAdNJQFoCEdAjzZjdpItlXV9lChoBkdATWVTDO1OTWgHS9JoCEdAjzZht+CsfnV9lChoBkdAckmYNAkcCGgHTSwBaAhHQI83NzMibDx1fZQoaAZHQG5HtRvWH1xoB004AWgIR0CPOSGNaQmvdX2UKGgGR0Bv1ic7QswtaAdNHAFoCEdAjzwSbhFVk3V9lChoBkdAcXQ3Lmp2lmgHTQkBaAhHQI8/bEDQqqh1fZQoaAZHQHEjVmnO0LNoB005AWgIR0CPQHGH58BudX2UKGgGR0BympoWYWtVaAdL92gIR0CPQzEsrd30dX2UKGgGR0Bw9OdPLxI8aAdNCwFoCEdAj0XfXf642HV9lChoBkdAblpSYw7DEWgHTQIBaAhHQI9F/WxyGSJ1fZQoaAZHQHLy7eqJdjZoB01QAWgIR0CPRhW912aEdX2UKGgGR0BvzbEP1+RYaAdNIQFoCEdAj0kpxWDHwXV9lChoBkdAcAD1QZXMhWgHTUwBaAhHQI9JbblA/s51fZQoaAZHQHDpq/RE4NtoB00eAWgIR0CPSaFh5PdmdX2UKGgGR0ByiUCU5dWyaAdNGQFoCEdAj0y5J04io3V9lChoBkdAc3hgeRxLkGgHTVMBaAhHQI9M187ZFod1fZQoaAZHQG/q40VJtixoB010AWgIR0CPTsQhfShKdX2UKGgGR0BxIv6Hj6vaaAdNZgFoCEdAj08n8baRIXV9lChoBkdAcTpI/JNj9WgHTWEBaAhHQI9U6N6w+t91ZS4="
49
  },
50
  "ep_success_buffer": {
51
  ":type:": "<class 'collections.deque'>",
ppo-lunarLander-v2/policy.optimizer.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:556f673bb98f42aa354eb16a1cf5197f2d911459dd534a16a4497ca9982daee1
3
  size 87545
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:09e62e1f7f221d8eb731619d9daaa291f9cb31e23c25a6dbb00d2ab5b413faa6
3
  size 87545
ppo-lunarLander-v2/policy.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:54c47007368fb6ad34e712ca7ea75e34e8564ebf648ff980b94478434971ff4e
3
  size 43201
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:baae9f8fb2725c3b842c7e3e24fd9674f0c6dbec83467cf33cb927abbba2adee
3
  size 43201
replay.mp4 CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:f170bfa75161da5eb9e8982a446909e4992a320e015ede13fe54aa78e288057a
3
- size 166470
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d70b13c967a2381c1dd3672619549553d6284fa4172213012b37ed21f45be458
3
+ size 191673
results.json CHANGED
@@ -1 +1 @@
1
- {"mean_reward": 251.9112059, "std_reward": 23.55290627089305, "is_deterministic": true, "n_eval_episodes": 10, "eval_datetime": "2026-02-08T14:37:16.798721"}
 
1
+ {"mean_reward": 262.73879420000003, "std_reward": 14.478935544867799, "is_deterministic": true, "n_eval_episodes": 10, "eval_datetime": "2026-02-09T20:40:29.744195"}