Kallinteris-Andreas commited on
Commit
11bdc3f
·
verified ·
1 Parent(s): 022ffc7
config.json CHANGED
@@ -1 +1 @@
1
- {"policy_class": {":type:": "<class 'abc.ABCMeta'>", ":serialized:": "gAWVMAAAAAAAAACMHnN0YWJsZV9iYXNlbGluZXMzLnNhYy5wb2xpY2llc5SMCVNBQ1BvbGljeZSTlC4=", "__module__": "stable_baselines3.sac.policies", "__annotations__": "{'actor': <class 'stable_baselines3.sac.policies.Actor'>, 'critic': <class 'stable_baselines3.common.policies.ContinuousCritic'>, 'critic_target': <class 'stable_baselines3.common.policies.ContinuousCritic'>}", "__doc__": "\n Policy class (with both actor and critic) for SAC.\n\n :param observation_space: Observation space\n :param action_space: Action space\n :param lr_schedule: Learning rate schedule (could be constant)\n :param net_arch: The specification of the policy and value networks.\n :param activation_fn: Activation function\n :param use_sde: Whether to use State Dependent Exploration or not\n :param log_std_init: Initial value for the log standard deviation\n :param use_expln: Use ``expln()`` function instead of ``exp()`` when using gSDE to ensure\n a positive standard deviation (cf paper). It allows to keep variance\n above zero and prevent it from growing too fast. In practice, ``exp()`` is usually enough.\n :param clip_mean: Clip the mean output when using gSDE to avoid numerical instability.\n :param features_extractor_class: Features extractor to use.\n :param features_extractor_kwargs: Keyword arguments\n to pass to the features extractor.\n :param normalize_images: Whether to normalize images or not,\n dividing by 255.0 (True by default)\n :param optimizer_class: The optimizer to use,\n ``th.optim.Adam`` by default\n :param optimizer_kwargs: Additional keyword arguments,\n excluding the learning rate, to pass to the optimizer\n :param n_critics: Number of critic networks to create.\n :param share_features_extractor: Whether to share or not the features extractor\n between the actor and the critic (this saves computation time)\n ", "__init__": "<function SACPolicy.__init__ at 0x7f72d161c4a0>", "_build": "<function SACPolicy._build at 0x7f72d161cae0>", "_get_constructor_parameters": "<function SACPolicy._get_constructor_parameters at 0x7f72d161cb80>", "reset_noise": "<function SACPolicy.reset_noise at 0x7f72d161cc20>", "make_actor": "<function SACPolicy.make_actor at 0x7f72d161ccc0>", "make_critic": "<function SACPolicy.make_critic at 0x7f72d161cd60>", "forward": "<function SACPolicy.forward at 0x7f72d161ce00>", "_predict": "<function SACPolicy._predict at 0x7f72d161cea0>", "set_training_mode": "<function SACPolicy.set_training_mode at 0x7f72d161cf40>", "__abstractmethods__": "frozenset()", "_abc_impl": "<_abc._abc_data object at 0x7f72d1620fc0>"}, "verbose": 0, "policy_kwargs": {"use_sde": false}, "num_timesteps": 1000000, "_total_timesteps": 1000000, "_num_timesteps_at_start": 0, "seed": 0, "action_noise": null, "start_time": 1730956112387218563, "learning_rate": 0.0003, "tensorboard_log": "runs/efmz9y24", "_last_obs": {":type:": "<class 'numpy.ndarray'>", ":serialized:": "gAWVLQIAAAAAAACMEm51bXB5LmNvcmUubnVtZXJpY5SMC19mcm9tYnVmZmVylJOUKJa4AQAAAAAAAN5lw3la7fE/O5DnbXrzrT9J5JGS2hLRv3p9bdkvxdO/tlN1D6lB6T/PURp0XrD3P/b/NDSQGPa/pVJAqTeH67/eVMWlJ1gHwKzy5OefP+E/SzKWBcqQpr8uOiftOiXxP1FSzXpbBq2/66kMefpBxr+XKI6OeSbiv3es0U5pWuI/ZX7FlmRNBUCmzlN+KofEv8w5z3NMkQNA/+WdH2cZ2T9mCb5ovrS3v03w8jzHgAfATeP3hPsg+D+p05tbClitP/I14ulij6i/oYDeL+Eo4b81Iet1sEXZvwr0tf4kxvw/Nj77p7Xj2r8QSEcxE5uxv3O2/IDNA/s/nxiVDX1qBcBPlnzqnDQYQAKYtTkKOPY/HdrqSP7goD+YY/wM4jivvwnEKW96gua/m+VLDeFX1L8xJxs+Xt7+P4J6xbR4y+2/SvMgBVTF07+tLkqipTTyPy0gOLC+rfy/IIcC3hfWHUD9/6KHBTP4P+vTpPo2grU/hdabhm/Wgz9aGsSedEPkvyDnOC2QsuW/keZ58Q6IAUAc/JS9EZ3iP+puFNvIddq/jHE9q++U2T8adOaaYTDyv7rnsUIXaQlAlIwFbnVtcHmUjAVkdHlwZZSTlIwCZjiUiYiHlFKUKEsDjAE8lE5OTkr/////Sv////9LAHSUYksFSwuGlIwBQ5R0lFKULg=="}, "_last_episode_starts": {":type:": "<class 'numpy.ndarray'>", ":serialized:": "gAWVeAAAAAAAAACMEm51bXB5LmNvcmUubnVtZXJpY5SMC19mcm9tYnVmZmVylJOUKJYFAAAAAAAAAAEBAQEBlIwFbnVtcHmUjAVkdHlwZZSTlIwCYjGUiYiHlFKUKEsDjAF8lE5OTkr/////Sv////9LAHSUYksFhZSMAUOUdJRSlC4="}, "_last_original_obs": {":type:": "<class 'numpy.ndarray'>", ":serialized:": "gAWVLQIAAAAAAACMEm51bXB5LmNvcmUubnVtZXJpY5SMC19mcm9tYnVmZmVylJOUKJa4AQAAAAAAAA8cDRYnGfI/gSnTk7LPsD+a0iuQtVLPv2QjHDNF2dO/tCH0/zRF6T9Q15bE4OP2P1p7LatQrvS/xLyEzkDX7b89Dt3Hm8cEwAREKrbo382/IQuTFObJsL9JyhL/djLxP7H9Cb833LK/qFNY6l9Mxr963ROqGyDiv99y9Sz6LuM/r66xQhFOBUBmG7Ec/Ublv9vhjMcYsvw/A4iJRwn/07/CuXoFmF27v2ynXIiY4gzAqPdgIcgt+D+UB9mrrM+vP3TnXC0GRq6/MFcmzChW4L9lnnKtYBzcvxLoG9eIEvo/UZ4qm/oA178TD+LtZzbyv0y92dIHnfE/soHEbSsKDsBdWp9U/yQUQIrukzfyVPY/C+3EawV6oj+XSXz4DdSxvxobOquhCua/9OwYygz1179IaQlqG37+P35wjow5quq/vcBrtscz3r+6hs6RhHDwP3U8mv8j1f2/CLdOcoOgGkDVhh1NHB/4Pw/AgLkBCLY/ye//KIHlbz/bR8JSVebjv6BQ2s3Gk+a/wCWGx2JxAUByDkX8ak7kP0wmfDeY66G/IdLjTZoC8j/r2Vo0yWj7vy/bGZ0Mkg1AlIwFbnVtcHmUjAVkdHlwZZSTlIwCZjiUiYiHlFKUKEsDjAE8lE5OTkr/////Sv////9LAHSUYksFSwuGlIwBQ5R0lFKULg=="}, "_episode_num": 4163, "use_sde": false, "sde_sample_freq": -1, "_current_progress_remaining": 0.0, "_stats_window_size": 100, "ep_info_buffer": {":type:": "<class 'collections.deque'>", ":serialized:": "gAWVHwwAAAAAAACMC2NvbGxlY3Rpb25zlIwFZGVxdWWUk5QpS2SGlFKUKH2UKIwBcpRHQIw6VyT6i0yMAWyUTQ0BjAF0lEdAp1g30Gu9vnV9lChoBkdAipA8nE2pAGgHS/5oCEdAp1ooq7ROUXV9lChoBkdAhCq+JP69CmgHS85oCEdAp1rFPP9k0HV9lChoBkdAgpTSauwHJWgHS61oCEdAp1yZ5qubJHV9lChoBkdAhKCmmce8w2gHS9BoCEdAp15eMuOCG3V9lChoBkdAg8VHww0wamgHS8FoCEdAp1/6U7jkuHV9lChoBkdAhNsq+i8Fp2gHS9NoCEdAp2EYekpI+XV9lChoBkdAhwP/qgRK6GgHS9xoCEdAp2UE4//vOXV9lChoBkdAhEDPxhDw6WgHS8xoCEdAp2cWez2OAHV9lChoBkdAlJlF/pdKNGgHTYcBaAhHQKdrq5PM0P91fZQoaAZHQIkwO7YkE9toB0vwaAhHQKdsKMBp5/t1fZQoaAZHQIR3ANI9TxZoB0vOaAhHQKdtVmkFfRh1fZQoaAZHQKhvZnbqQiloB03oA2gIR0CncRjyvs7ddX2UKGgGR0CE7ZHBk7OnaAdL02gIR0CnchL/82rGdX2UKGgGR0CFngN0eU6gaAdL0WgIR0Cnc7xq46OpdX2UKGgGR0CRcyE+PikwaAdNSwFoCEdAp3YkjeKsMnV9lChoBkdAhI/ir1dxAGgHS85oCEdAp3g3Ov+wT3V9lChoBkdAi8FBHbypaWgHTQIBaAhHQKd4xYISlFd1fZQoaAZHQIPn2jmCAc1oB0vJaAhHQKd5z12aDwp1fZQoaAZHQKhZLZVXFLpoB03oA2gIR0CnesAAZKnOdX2UKGgGR0CIRimReTmoaAdL5GgIR0CnfQ4c/+sHdX2UKGgGR0CEUJ4xk/bCaAdLymgIR0CnftvEsJ6ZdX2UKGgGR0CH2RsP8Q7LaAdL4mgIR0Cnfw4QSSNgdX2UKGgGR0CEPTMxGlQ/aAdLwWgIR0Cnf5QHAymAdX2UKGgGR0CLL30r9VFQaAdL+WgIR0CnglFwT/Q0dX2UKGgGR0CFW96kZaV2aAdLzmgIR0CnhPW5H3DfdX2UKGgGR0CDwx5/smfHaAdLv2gIR0CnhTtbcGkfdX2UKGgGR0CGaqiL2pQ2aAdL2GgIR0CnhXgu7HyVdX2UKGgGR0CIC+M8YAKfaAdL4mgIR0CniRAmAskIdX2UKGgGR0CEHzJOnEVGaAdLv2gIR0Cni0DPWxyGdX2UKGgGR0CHt9a/yoXLaAdL4mgIR0CnjH+eOGTLdX2UKGgGR0CNZokka/ATaAdNGQFoCEdAp42YOz6acHV9lChoBkdAiOl3xnWat2gHS+xoCEdAp5SajSG8EnV9lChoBkdAjZ5dqDbrT2gHTRoBaAhHQKeU6L1EmY11fZQoaAZHQJaf6fZmI0toB02tAWgIR0CnmA4Vh1DCdX2UKGgGR0CDkGMz/IbPaAdLt2gIR0CnmiUtRNypdX2UKGgGR0CoUpe8PFvRaAdN6ANoCEdAp5s5vYODrnV9lChoBkdAih2SCe2/jGgHS/JoCEdAp59QTEit73V9lChoBkdAiL8C2DxsmGgHS+doCEdAp6D1zwMH8nV9lChoBkdAkgjGqT8pC2gHTVQBaAhHQKelWXTmW+p1fZQoaAZHQIhlPetSydFoB0vfaAhHQKel7nnuAqd1fZQoaAZHQKhma176YVtoB03oA2gIR0CnpxkzoEB9dX2UKGgGR0CRWlq7AckuaAdNQwFoCEdAp6ql5yEL6XV9lChoBkdAhKHmBOHnEGgHS9FoCEdAp6twpBomHHV9lChoBkdAhO1y4OMER2gHS8xoCEdAp60I4VARkHV9lChoBkdAg9Y5avA442gHS79oCEdAp7BC3/givHV9lChoBkdAhL9AG8mKImgHS8xoCEdAp7GPsu3+dnV9lChoBkdAqDsF78ejmGgHTegDaAhHQKeyxi6xxDN1fZQoaAZHQIgd6RyOrABoB0vkaAhHQKe5Ytvn8sN1fZQoaAZHQJDOBlz2exxoB004AWgIR0CnuX25H3DfdX2UKGgGR0CEEl/nW8RMaAdLxGgIR0CnvpCMYMvzdX2UKGgGR0CFv9WUbDMvaAdL1GgIR0CnvxHj6vaDdX2UKGgGR0Cha3Ma86FNaAdNsQJoCEdAp8CZ1Tzd13V9lChoBkdAqFTLWCmMwWgHTegDaAhHQKfCee0Xxe91fZQoaAZHQJFVTsQd0aJoB01GAWgIR0CnyAyOR1YAdX2UKGgGR0CoHFdweeWfaAdN6ANoCEdAp80r+irT6XV9lChoBkdAm0dvUSZjQWgHTSUCaAhHQKfNdEIgNgB1fZQoaAZHQJVzAUFjd59oB02oAWgIR0CnzgNYbKigdX2UKGgGR0COhyenyd4FaAdNKwFoCEdAp9W+hAWznnV9lChoBkdApN57G5tm+WgHTTgDaAhHQKfXIAfdRBN1fZQoaAZHQJANXIDHOr1oB00xAWgIR0Cn35ztsvZidX2UKGgGR0ComvyiM5wPaAdN6ANoCEdAp+PxQ+EAYHV9lChoBkdApb6FIZqEe2gHTVEDaAhHQKflGPH1e0J1fZQoaAZHQI6QUBU70WdoB00sAWgIR0Cn6Iw7DEWJdX2UKGgGR0CoreBcJMQFaAdN6ANoCEdAp+pswQDmsHV9lChoBkdAkh0lYMfA9GgHTVkBaAhHQKfu4fEGZ/l1fZQoaAZHQKizACDmKZVoB03oA2gIR0Cn8l24NI9UdX2UKGgGR0Co5rsz/IbPaAdN0gNoCEdAqABnV3EAHXV9lChoBkdAqEX09wFTvWgHTegDaAhHQKgGKC6pYLd1fZQoaAZHQKiDUkWykbhoB03oA2gIR0CoCCn/LkjpdX2UKGgGR0CRc3yT6i0waAdNSAFoCEdAqAp96PbO/3V9lChoBkdAqI5GFHrhSGgHTegDaAhHQKgM37qIJqt1fZQoaAZHQKghWr7O3UhoB03oA2gIR0CoEEOPFNtZdX2UKGgGR0CTgeiliz9kaAdNdwFoCEdAqBE7FhoduHV9lChoBkdAl25FVLi++WgHTckBaAhHQKgXy2a2F391fZQoaAZHQKHRml/H5rRoB02tAmgIR0CoG/WexwAEdX2UKGgGR0CoRnKEeyRkaAdN6ANoCEdAqCnQzWPLgXV9lChoBkdAp/icgyM1j2gHTegDaAhHQKgtV2r4nF51fZQoaAZHQKfvl0aIeo1oB03oA2gIR0CoLk0iILw4dX2UKGgGR0Cn6tdrXUYsaAdN6ANoCEdAqDUBYvFm4HV9lChoBkdAqC+E1EVnEmgHTegDaAhHQKg5OiUxEfF1fZQoaAZHQKWSo7T2FnJoB01oA2gIR0CoRoZb6guidX2UKGgGR0Coc0QvHtF8aAdN6ANoCEdAqEbgTCcf/3V9lChoBkdAqFyEKmbb12gHTegDaAhHQKhLHA+IM0B1fZQoaAZHQJEl759E1EVoB01DAWgIR0CoT+21c+qzdX2UKGgGR0CoQTXg9/z8aAdN6ANoCEdAqFbZTCLuQnV9lChoBkdAqDnocinpCGgHTegDaAhHQKhbELH+6y11fZQoaAZHQJHXO48U21loB01iAWgIR0CoX6ndXT3JdX2UKGgGR0CSVILZzxPPaAdNXwFoCEdAqGE7/dZaFHV9lChoBkdAqHsFOh0yQGgHTegDaAhHQKho49X9zfd1fZQoaAZHQJS6XvH93r5oB02SAWgIR0CobSad+XqrdX2UKGgGR0CoaqNjkMkQaAdN6ANoCEdAqG2t3np0OnV9lChoBkdAlEmU8NhE0GgHTZgBaAhHQKh06JcgQpZ1fZQoaAZHQKiRjta6jFhoB03oA2gIR0CoeIVnVXmvdX2UKGgGR0CZ5xNsFdLQaAdN7AFoCEdAqHwSemNzbXV9lChoBkdAqIv7UNKAa2gHTegDaAhHQKh9FKq4pc51fZQoaAZHQJDgOgHu7YloB00/AWgIR0CofkX6yjYadX2UKGgGR0CQfH9rXUYsaAdNSwFoCEdAqIdiZ+hGpnV9lChoBkdAknhWRNh3JWgHTWMBaAhHQKiJMXMQmNR1fZQoaAZHQKhijl/YraxoB03oA2gIR0CoivavA44qdWUu"}, "ep_success_buffer": {":type:": "<class 'collections.deque'>", ":serialized:": "gAWVIAAAAAAAAACMC2NvbGxlY3Rpb25zlIwFZGVxdWWUk5QpS2SGlFKULg=="}, "_n_updates": 198000, "buffer_size": 1000000, "batch_size": 256, "learning_starts": 10000, "tau": 0.005, "gamma": 0.99, "gradient_steps": 1, "optimize_memory_usage": false, "replay_buffer_class": {":type:": "<class 'abc.ABCMeta'>", ":serialized:": "gAWVNQAAAAAAAACMIHN0YWJsZV9iYXNlbGluZXMzLmNvbW1vbi5idWZmZXJzlIwMUmVwbGF5QnVmZmVylJOULg==", "__module__": "stable_baselines3.common.buffers", "__annotations__": "{'observations': <class 'numpy.ndarray'>, 'next_observations': <class 'numpy.ndarray'>, 'actions': <class 'numpy.ndarray'>, 'rewards': <class 'numpy.ndarray'>, 'dones': <class 'numpy.ndarray'>, 'timeouts': <class 'numpy.ndarray'>}", "__doc__": "\n Replay buffer used in off-policy algorithms like SAC/TD3.\n\n :param buffer_size: Max number of element in the buffer\n :param observation_space: Observation space\n :param action_space: Action space\n :param device: PyTorch device\n :param n_envs: Number of parallel environments\n :param optimize_memory_usage: Enable a memory efficient variant\n of the replay buffer which reduces by almost a factor two the memory used,\n at a cost of more complexity.\n See https://github.com/DLR-RM/stable-baselines3/issues/37#issuecomment-637501195\n and https://github.com/DLR-RM/stable-baselines3/pull/28#issuecomment-637559274\n Cannot be used in combination with handle_timeout_termination.\n :param handle_timeout_termination: Handle timeout termination (due to timelimit)\n separately and treat the task as infinite horizon task.\n https://github.com/DLR-RM/stable-baselines3/issues/284\n ", "__init__": "<function ReplayBuffer.__init__ at 0x7f72e0564cc0>", "add": "<function ReplayBuffer.add at 0x7f72e0564e00>", "sample": "<function ReplayBuffer.sample at 0x7f72e0564ea0>", "_get_samples": "<function ReplayBuffer._get_samples at 0x7f72e0564f40>", "_maybe_cast_dtype": "<staticmethod(<function ReplayBuffer._maybe_cast_dtype at 0x7f72e0564fe0>)>", "__abstractmethods__": "frozenset()", "_abc_impl": "<_abc._abc_data object at 0x7f72e055a600>"}, "replay_buffer_kwargs": {}, "train_freq": {":type:": "<class 'stable_baselines3.common.type_aliases.TrainFreq'>", ":serialized:": "gAWVYQAAAAAAAACMJXN0YWJsZV9iYXNlbGluZXMzLmNvbW1vbi50eXBlX2FsaWFzZXOUjAlUcmFpbkZyZXGUk5RLAWgAjBJUcmFpbkZyZXF1ZW5jeVVuaXSUk5SMBHN0ZXCUhZRSlIaUgZQu"}, "use_sde_at_warmup": false, "target_entropy": -3.0, "ent_coef": "auto", "target_update_interval": 1, "observation_space": {":type:": "<class 'gymnasium.spaces.box.Box'>", ":serialized:": "gAWVRQIAAAAAAACMFGd5bW5hc2l1bS5zcGFjZXMuYm94lIwDQm94lJOUKYGUfZQojAVkdHlwZZSMBW51bXB5lIwFZHR5cGWUk5SMAmY4lImIh5RSlChLA4wBPJROTk5K/////0r/////SwB0lGKMBl9zaGFwZZRLC4WUjANsb3eUjBJudW1weS5jb3JlLm51bWVyaWOUjAtfZnJvbWJ1ZmZlcpSTlCiWWAAAAAAAAAAAAAAAAADw/wAAAAAAAPD/AAAAAAAA8P8AAAAAAADw/wAAAAAAAPD/AAAAAAAA8P8AAAAAAADw/wAAAAAAAPD/AAAAAAAA8P8AAAAAAADw/wAAAAAAAPD/lGgLSwuFlIwBQ5R0lFKUjA1ib3VuZGVkX2JlbG93lGgTKJYLAAAAAAAAAAAAAAAAAAAAAAAAlGgIjAJiMZSJiIeUUpQoSwOMAXyUTk5OSv////9K/////0sAdJRiSwuFlGgWdJRSlIwEaGlnaJRoEyiWWAAAAAAAAAAAAAAAAADwfwAAAAAAAPB/AAAAAAAA8H8AAAAAAADwfwAAAAAAAPB/AAAAAAAA8H8AAAAAAADwfwAAAAAAAPB/AAAAAAAA8H8AAAAAAADwfwAAAAAAAPB/lGgLSwuFlGgWdJRSlIwNYm91bmRlZF9hYm92ZZRoEyiWCwAAAAAAAAAAAAAAAAAAAAAAAJRoHUsLhZRoFnSUUpSMCGxvd19yZXBylIwELWluZpSMCWhpZ2hfcmVwcpSMA2luZpSMCl9ucF9yYW5kb22UTnViLg==", "dtype": "float64", "_shape": [11], "low": "[-inf -inf -inf -inf -inf -inf -inf -inf -inf -inf -inf]", "bounded_below": "[False False False False False False False False False False False]", "high": "[inf inf inf inf inf inf inf inf inf inf inf]", "bounded_above": "[False False False False False False False False False False False]", "low_repr": "-inf", "high_repr": "inf", "_np_random": null}, "action_space": {":type:": "<class 'gymnasium.spaces.box.Box'>", ":serialized:": "gAWVYAIAAAAAAACMFGd5bW5hc2l1bS5zcGFjZXMuYm94lIwDQm94lJOUKYGUfZQojAVkdHlwZZSMBW51bXB5lIwFZHR5cGWUk5SMAmY0lImIh5RSlChLA4wBPJROTk5K/////0r/////SwB0lGKMBl9zaGFwZZRLA4WUjANsb3eUjBJudW1weS5jb3JlLm51bWVyaWOUjAtfZnJvbWJ1ZmZlcpSTlCiWDAAAAAAAAAAAAIC/AACAvwAAgL+UaAtLA4WUjAFDlHSUUpSMDWJvdW5kZWRfYmVsb3eUaBMolgMAAAAAAAAAAQEBlGgIjAJiMZSJiIeUUpQoSwOMAXyUTk5OSv////9K/////0sAdJRiSwOFlGgWdJRSlIwEaGlnaJRoEyiWDAAAAAAAAAAAAIA/AACAPwAAgD+UaAtLA4WUaBZ0lFKUjA1ib3VuZGVkX2Fib3ZllGgTKJYDAAAAAAAAAAEBAZRoHUsDhZRoFnSUUpSMCGxvd19yZXBylIwELTEuMJSMCWhpZ2hfcmVwcpSMAzEuMJSMCl9ucF9yYW5kb22UjBRudW1weS5yYW5kb20uX3BpY2tsZZSMEF9fZ2VuZXJhdG9yX2N0b3KUk5SMBVBDRzY0lGgyjBRfX2JpdF9nZW5lcmF0b3JfY3RvcpSTlIaUUpR9lCiMDWJpdF9nZW5lcmF0b3KUjAVQQ0c2NJSMBXN0YXRllH2UKGg9ihDjYZWmt15YCS1Fllk0taEajANpbmOUihCpc3hEvDOBWIIa9zrb2o1BdYwKaGFzX3VpbnQzMpRLAIwIdWludGVnZXKUSwB1YnViLg==", "dtype": "float32", "_shape": [3], "low": "[-1. -1. -1.]", "bounded_below": "[ True True True]", "high": "[1. 1. 1.]", "bounded_above": "[ True True True]", "low_repr": "-1.0", "high_repr": "1.0", "_np_random": "Generator(PCG64)"}, "n_envs": 5, "lr_schedule": {":type:": "<class 'function'>", ":serialized:": "gAWVHgQAAAAAAACMF2Nsb3VkcGlja2xlLmNsb3VkcGlja2xllIwOX21ha2VfZnVuY3Rpb26Uk5QoaACMDV9idWlsdGluX3R5cGWUk5SMCENvZGVUeXBllIWUUpQoSwFLAEsASwFLBUsTQyaVAZcAdAEAAAAAAAAAAAIAiQF8AKsBAAAAAAAAqwEAAAAAAABTAJROhZSMBWZsb2F0lIWUjBJwcm9ncmVzc19yZW1haW5pbmeUhZSMVC9ob21lL21hc3Rlci1hbmRyZWFzL2dlbl9kYXRhc2V0L3N0YWJsZS1iYXNlbGluZXMzL3N0YWJsZV9iYXNlbGluZXMzL2NvbW1vbi91dGlscy5weZSMCDxsYW1iZGE+lIwhZ2V0X3NjaGVkdWxlX2ZuLjxsb2NhbHM+LjxsYW1iZGE+lEthQxD4gACkZalO0DtN0yxO1CZPlEMAlIwOdmFsdWVfc2NoZWR1bGWUhZQpdJRSlH2UKIwLX19wYWNrYWdlX1+UjBhzdGFibGVfYmFzZWxpbmVzMy5jb21tb26UjAhfX25hbWVfX5SMHnN0YWJsZV9iYXNlbGluZXMzLmNvbW1vbi51dGlsc5SMCF9fZmlsZV9flIxUL2hvbWUvbWFzdGVyLWFuZHJlYXMvZ2VuX2RhdGFzZXQvc3RhYmxlLWJhc2VsaW5lczMvc3RhYmxlX2Jhc2VsaW5lczMvY29tbW9uL3V0aWxzLnB5lHVOTmgAjBBfbWFrZV9lbXB0eV9jZWxslJOUKVKUhZR0lFKUaACMEl9mdW5jdGlvbl9zZXRzdGF0ZZSTlGgjfZR9lChoGowIPGxhbWJkYT6UjAxfX3F1YWxuYW1lX1+UjCFnZXRfc2NoZWR1bGVfZm4uPGxvY2Fscz4uPGxhbWJkYT6UjA9fX2Fubm90YXRpb25zX1+UfZSMDl9fa3dkZWZhdWx0c19flE6MDF9fZGVmYXVsdHNfX5ROjApfX21vZHVsZV9flGgbjAdfX2RvY19flE6MC19fY2xvc3VyZV9flGgAjApfbWFrZV9jZWxslJOUaAIoaAcoSwFLAEsASwFLAUsTQwiVAZcAiQFTAJRoCSmMAV+UhZRoDowEZnVuY5SMGWNvbnN0YW50X2ZuLjxsb2NhbHM+LmZ1bmOUS4VDCPiAANgPEogKlGgSjAN2YWyUhZQpdJRSlGgXTk5oHylSlIWUdJRSlGglaEF9lH2UKGgajARmdW5jlGgpjBljb25zdGFudF9mbi48bG9jYWxzPi5mdW5jlGgrfZRoLU5oLk5oL2gbaDBOaDFoM0c/M6kqMFUyYYWUUpSFlIwXX2Nsb3VkcGlja2xlX3N1Ym1vZHVsZXOUXZSMC19fZ2xvYmFsc19flH2UdYaUhlIwhZRSlIWUaEpdlGhMfZR1hpSGUjAu"}, "batch_norm_stats": [], "batch_norm_stats_target": [], "system_info": {"OS": "Linux-6.6.59-1-MANJARO-x86_64-with-glibc2.40 # 1 SMP PREEMPT_DYNAMIC Fri Nov 1 05:33:52 UTC 2024", "Python": "3.12.7", "Stable-Baselines3": "2.4.0a10", "PyTorch": "2.4.1+cu121", "GPU Enabled": "True", "Numpy": "1.26.4", "Cloudpickle": "3.1.0", "Gymnasium": "1.0.0"}}
 
1
+ {"policy_class": {":type:": "<class 'abc.ABCMeta'>", ":serialized:": "gAWVMAAAAAAAAACMHnN0YWJsZV9iYXNlbGluZXMzLnNhYy5wb2xpY2llc5SMCVNBQ1BvbGljeZSTlC4=", "__module__": "stable_baselines3.sac.policies", "__annotations__": "{'actor': <class 'stable_baselines3.sac.policies.Actor'>, 'critic': <class 'stable_baselines3.common.policies.ContinuousCritic'>, 'critic_target': <class 'stable_baselines3.common.policies.ContinuousCritic'>}", "__doc__": "\n Policy class (with both actor and critic) for SAC.\n\n :param observation_space: Observation space\n :param action_space: Action space\n :param lr_schedule: Learning rate schedule (could be constant)\n :param net_arch: The specification of the policy and value networks.\n :param activation_fn: Activation function\n :param use_sde: Whether to use State Dependent Exploration or not\n :param log_std_init: Initial value for the log standard deviation\n :param use_expln: Use ``expln()`` function instead of ``exp()`` when using gSDE to ensure\n a positive standard deviation (cf paper). It allows to keep variance\n above zero and prevent it from growing too fast. In practice, ``exp()`` is usually enough.\n :param clip_mean: Clip the mean output when using gSDE to avoid numerical instability.\n :param features_extractor_class: Features extractor to use.\n :param features_extractor_kwargs: Keyword arguments\n to pass to the features extractor.\n :param normalize_images: Whether to normalize images or not,\n dividing by 255.0 (True by default)\n :param optimizer_class: The optimizer to use,\n ``th.optim.Adam`` by default\n :param optimizer_kwargs: Additional keyword arguments,\n excluding the learning rate, to pass to the optimizer\n :param n_critics: Number of critic networks to create.\n :param share_features_extractor: Whether to share or not the features extractor\n between the actor and the critic (this saves computation time)\n ", "__init__": "<function SACPolicy.__init__ at 0x7fc00380c4a0>", "_build": "<function SACPolicy._build at 0x7fc00380cae0>", "_get_constructor_parameters": "<function SACPolicy._get_constructor_parameters at 0x7fc00380cb80>", "reset_noise": "<function SACPolicy.reset_noise at 0x7fc00380cc20>", "make_actor": "<function SACPolicy.make_actor at 0x7fc00380ccc0>", "make_critic": "<function SACPolicy.make_critic at 0x7fc00380cd60>", "forward": "<function SACPolicy.forward at 0x7fc00380ce00>", "_predict": "<function SACPolicy._predict at 0x7fc00380cea0>", "set_training_mode": "<function SACPolicy.set_training_mode at 0x7fc00380cf40>", "__abstractmethods__": "frozenset()", "_abc_impl": "<_abc._abc_data object at 0x7fc0038112c0>"}, "verbose": 0, "policy_kwargs": {"use_sde": false}, "num_timesteps": 1000000, "_total_timesteps": 1000000, "_num_timesteps_at_start": 0, "seed": 0, "action_noise": null, "start_time": 1731417232377162777, "learning_rate": 0.0003, "tensorboard_log": "runs/ff8r1mba", "_last_obs": {":type:": "<class 'numpy.ndarray'>", ":serialized:": "gAWVLQIAAAAAAACMEm51bXB5LmNvcmUubnVtZXJpY5SMC19mcm9tYnVmZmVylJOUKJa4AQAAAAAAAN5lw3la7fE/O5DnbXrzrT9J5JGS2hLRv3p9bdkvxdO/tlN1D6lB6T/PURp0XrD3P/b/NDSQGPa/pVJAqTeH67/eVMWlJ1gHwKzy5OefP+E/SzKWBcqQpr8uOiftOiXxP1FSzXpbBq2/66kMefpBxr+XKI6OeSbiv3es0U5pWuI/ZX7FlmRNBUCmzlN+KofEv8w5z3NMkQNA/+WdH2cZ2T9mCb5ovrS3v03w8jzHgAfATeP3hPsg+D+p05tbClitP/I14ulij6i/oYDeL+Eo4b81Iet1sEXZvwr0tf4kxvw/Nj77p7Xj2r8QSEcxE5uxv3O2/IDNA/s/nxiVDX1qBcBPlnzqnDQYQAKYtTkKOPY/HdrqSP7goD+YY/wM4jivvwnEKW96gua/m+VLDeFX1L8xJxs+Xt7+P4J6xbR4y+2/SvMgBVTF07+tLkqipTTyPy0gOLC+rfy/IIcC3hfWHUD9/6KHBTP4P+vTpPo2grU/hdabhm/Wgz9aGsSedEPkvyDnOC2QsuW/keZ58Q6IAUAc/JS9EZ3iP+puFNvIddq/jHE9q++U2T8adOaaYTDyv7rnsUIXaQlAlIwFbnVtcHmUjAVkdHlwZZSTlIwCZjiUiYiHlFKUKEsDjAE8lE5OTkr/////Sv////9LAHSUYksFSwuGlIwBQ5R0lFKULg=="}, "_last_episode_starts": {":type:": "<class 'numpy.ndarray'>", ":serialized:": "gAWVeAAAAAAAAACMEm51bXB5LmNvcmUubnVtZXJpY5SMC19mcm9tYnVmZmVylJOUKJYFAAAAAAAAAAEBAQEBlIwFbnVtcHmUjAVkdHlwZZSTlIwCYjGUiYiHlFKUKEsDjAF8lE5OTkr/////Sv////9LAHSUYksFhZSMAUOUdJRSlC4="}, "_last_original_obs": {":type:": "<class 'numpy.ndarray'>", ":serialized:": "gAWVLQIAAAAAAACMEm51bXB5LmNvcmUubnVtZXJpY5SMC19mcm9tYnVmZmVylJOUKJa4AQAAAAAAAA8cDRYnGfI/gSnTk7LPsD+a0iuQtVLPv2QjHDNF2dO/tCH0/zRF6T9Q15bE4OP2P1p7LatQrvS/xLyEzkDX7b89Dt3Hm8cEwAREKrbo382/IQuTFObJsL9JyhL/djLxP7H9Cb833LK/qFNY6l9Mxr963ROqGyDiv99y9Sz6LuM/r66xQhFOBUBmG7Ec/Ublv9vhjMcYsvw/A4iJRwn/07/CuXoFmF27v2ynXIiY4gzAqPdgIcgt+D+UB9mrrM+vP3TnXC0GRq6/MFcmzChW4L9lnnKtYBzcvxLoG9eIEvo/UZ4qm/oA178TD+LtZzbyv0y92dIHnfE/soHEbSsKDsBdWp9U/yQUQIrukzfyVPY/C+3EawV6oj+XSXz4DdSxvxobOquhCua/9OwYygz1179IaQlqG37+P35wjow5quq/vcBrtscz3r+6hs6RhHDwP3U8mv8j1f2/CLdOcoOgGkDVhh1NHB/4Pw/AgLkBCLY/ye//KIHlbz/bR8JSVebjv6BQ2s3Gk+a/wCWGx2JxAUByDkX8ak7kP0wmfDeY66G/IdLjTZoC8j/r2Vo0yWj7vy/bGZ0Mkg1AlIwFbnVtcHmUjAVkdHlwZZSTlIwCZjiUiYiHlFKUKEsDjAE8lE5OTkr/////Sv////9LAHSUYksFSwuGlIwBQ5R0lFKULg=="}, "_episode_num": 4163, "use_sde": false, "sde_sample_freq": -1, "_current_progress_remaining": 0.0, "_stats_window_size": 100, "ep_info_buffer": {":type:": "<class 'collections.deque'>", ":serialized:": "gAWVHwwAAAAAAACMC2NvbGxlY3Rpb25zlIwFZGVxdWWUk5QpS2SGlFKUKH2UKIwBcpRHQIw6VyT6i0yMAWyUTQ0BjAF0lEdArFr9HYpUgnV9lChoBkdAipA8nE2pAGgHS/5oCEdArF08fT1CgXV9lChoBkdAhCq+JP69CmgHS85oCEdArF3sXWOIZnV9lChoBkdAgpTSauwHJWgHS61oCEdArGAOy3Td+HV9lChoBkdAhKCmmce8w2gHS9BoCEdArGIKJ0nw5XV9lChoBkdAg8VHww0wamgHS8FoCEdArGO5A6dUbXV9lChoBkdAhNsq+i8Fp2gHS9NoCEdArGTtXgccVHV9lChoBkdAhwP/qgRK6GgHS9xoCEdArGktZvDP4XV9lChoBkdAhEDPxhDw6WgHS8xoCEdArGvMdq+JxnV9lChoBkdAlJlF/pdKNGgHTYcBaAhHQKxwGSTQmeF1fZQoaAZHQIkwO7YkE9toB0vwaAhHQKxwjyNGViZ1fZQoaAZHQIR3ANI9TxZoB0vOaAhHQKxx6ieumrN1fZQoaAZHQKhvZnbqQiloB03oA2gIR0Csdch4D9wWdX2UKGgGR0CE7ZHBk7OnaAdL02gIR0CsdwZEUj9odX2UKGgGR0CFngN0eU6gaAdL0WgIR0CseLaWw/xEdX2UKGgGR0CRcyE+PikwaAdNSwFoCEdArHtV03fhuXV9lChoBkdAhI/ir1dxAGgHS85oCEdArH1gBYFJQXV9lChoBkdAi8FBHbypaWgHTQIBaAhHQKx94aScLBt1fZQoaAZHQIPn2jmCAc1oB0vJaAhHQKx+7VEuxr11fZQoaAZHQKhZLZVXFLpoB03oA2gIR0Csf/c2BJ7LdX2UKGgGR0CIRimReTmoaAdL5GgIR0CsgohwMpgDdX2UKGgGR0CEUJ4xk/bCaAdLymgIR0CshIKebutwdX2UKGgGR0CH2RsP8Q7LaAdL4mgIR0CshMntv4ucdX2UKGgGR0CEPTMxGlQ/aAdLwWgIR0CshWCu2Zy/dX2UKGgGR0CLL30r9VFQaAdL+WgIR0CsiFPxH5JsdX2UKGgGR0CFW96kZaV2aAdLzmgIR0Csi4reIl+mdX2UKGgGR0CDwx5/smfHaAdLv2gIR0Csi86H0se5dX2UKGgGR0CGaqiL2pQ2aAdL2GgIR0CsjAQVsUItdX2UKGgGR0CIC+M8YAKfaAdL4mgIR0Csj5n6MzdldX2UKGgGR0CEHzJOnEVGaAdLv2gIR0Cskaec6NlzdX2UKGgGR0CHt9a/yoXLaAdL4mgIR0CskwjGT9sKdX2UKGgGR0CNZokka/ATaAdNGQFoCEdArJRjQXyiEnV9lChoBkdAiOl3xnWat2gHS+xoCEdArJu3hXKbKHV9lChoBkdAjZ5dqDbrT2gHTRoBaAhHQKyb+OCoS+R1fZQoaAZHQJaf6fZmI0toB02tAWgIR0CsnwK814xDdX2UKGgGR0CDkGMz/IbPaAdLt2gIR0CsoVQLmZE2dX2UKGgGR0CoUpe8PFvRaAdN6ANoCEdArKJpof0VanV9lChoBkdAih2SCe2/jGgHS/JoCEdArKbeh4+r2nV9lChoBkdAiL8C2DxsmGgHS+doCEdArKi8lXzUZ3V9lChoBkdAkgjGqT8pC2gHTVQBaAhHQKytXkDp1Rt1fZQoaAZHQIhlPetSydFoB0vfaAhHQKyuDgeA/cF1fZQoaAZHQKhma176YVtoB03oA2gIR0Csr1fseGO/dX2UKGgGR0CRWlq7AckuaAdNQwFoCEdArLNF/H5rQHV9lChoBkdAhKHmBOHnEGgHS9FoCEdArLQ7SRbKR3V9lChoBkdAhO1y4OMER2gHS8xoCEdArLW7Zcs19HV9lChoBkdAg9Y5avA442gHS79oCEdArLjvqkdmx3V9lChoBkdAhL9AG8mKImgHS8xoCEdArLo3JFLFoHV9lChoBkdAqDsF78ejmGgHTegDaAhHQKy7aqMm4RV1fZQoaAZHQIgd6RyOrABoB0vkaAhHQKzCw9mHxjJ1fZQoaAZHQJDOBlz2exxoB004AWgIR0CswuGHgxagdX2UKGgGR0CEEl/nW8RMaAdLxGgIR0CsyMO3MINWdX2UKGgGR0CFv9WUbDMvaAdL1GgIR0CsyU7zCk44dX2UKGgGR0Cha3Ma86FNaAdNsQJoCEdArMsc1IiC8XV9lChoBkdAqFTLWCmMwWgHTegDaAhHQKzNRjwQUYd1fZQoaAZHQJFVTsQd0aJoB01GAWgIR0Cs1CYL9deIdX2UKGgGR0CoHFdweeWfaAdN6ANoCEdArNparYGt63V9lChoBkdAm0dvUSZjQWgHTSUCaAhHQKzatbRnezl1fZQoaAZHQJVzAUFjd59oB02oAWgIR0Cs21NTcZccdX2UKGgGR0COhyenyd4FaAdNKwFoCEdArOQA4Qz1snV9lChoBkdApN57G5tm+WgHTTgDaAhHQKzlzOj7AL11fZQoaAZHQJANXIDHOr1oB00xAWgIR0Cs708QqZtvdX2UKGgGR0ComvyiM5wPaAdN6ANoCEdArPOlWhh6SnV9lChoBkdApb6FIZqEe2gHTVEDaAhHQKz0+auwHJN1fZQoaAZHQI6QUBU70WdoB00sAWgIR0Cs+QyxzJZGdX2UKGgGR0CoreBcJMQFaAdN6ANoCEdArPsViWmgrnV9lChoBkdAkh0lYMfA9GgHTVkBaAhHQK0AUX9BKL91fZQoaAZHQKizACDmKZVoB03oA2gIR0CtBAyfDk2hdX2UKGgGR0Co5rsz/IbPaAdN0gNoCEdArRKb+JgssnV9lChoBkdAqEX09wFTvWgHTegDaAhHQK0YQ0sOG0x1fZQoaAZHQKiDUkWykbhoB03oA2gIR0CtGl2wV0tAdX2UKGgGR0CRc3yT6i0waAdNSAFoCEdArRzwxgy/K3V9lChoBkdAqI5GFHrhSGgHTegDaAhHQK0frlrdnCh1fZQoaAZHQKghWr7O3UhoB03oA2gIR0CtIz1QIldDdX2UKGgGR0CTgeiliz9kaAdNdwFoCEdArSRO0b961XV9lChoBkdAl25FVLi++WgHTckBaAhHQK0r5kMkQf91fZQoaAZHQKHRml/H5rRoB02tAmgIR0CtMGAC4jKQdX2UKGgGR0CoRnKEeyRkaAdN6ANoCEdArUMwnH/953V9lChoBkdAp/icgyM1j2gHTegDaAhHQK1HUebNKRN1fZQoaAZHQKfvl0aIeo1oB03oA2gIR0CtSIFDWsijdX2UKGgGR0Cn6tdrXUYsaAdN6ANoCEdArU92OsDGLnV9lChoBkdAqC+E1EVnEmgHTegDaAhHQK1T/W6K+BZ1fZQoaAZHQKWSo7T2FnJoB01oA2gIR0CtYzOvdM0xdX2UKGgGR0Coc0QvHtF8aAdN6ANoCEdArWOer0aqCHV9lChoBkdAqFyEKmbb12gHTegDaAhHQK1ofMCcPOJ1fZQoaAZHQJEl759E1EVoB01DAWgIR0Ctbjz5oGpudX2UKGgGR0CoQTXg9/z8aAdN6ANoCEdArW/vwd8zAXV9lChoBkdAqDnocinpCGgHTegDaAhHQK10kVII4VB1fZQoaAZHQJHXO48U21loB01iAWgIR0CteX6WPcSHdX2UKGgGR0CSVILZzxPPaAdNXwFoCEdArXsXE0iyIHV9lChoBkdAqHsFOh0yQGgHTegDaAhHQK2DqdqcmSh1fZQoaAZHQJS6XvH93r5oB02SAWgIR0CtiIwEIPbxdX2UKGgGR0CoaqNjkMkQaAdN6ANoCEdArYkcaCL/CXV9lChoBkdAlEmU8NhE0GgHTZgBaAhHQK2RpOdoWYZ1fZQoaAZHQKiRjta6jFhoB03oA2gIR0Ctlfhpg1FZdX2UKGgGR0CZ5xNsFdLQaAdN7AFoCEdArZnrWqcVg3V9lChoBkdAqIv7UNKAa2gHTegDaAhHQK2bDwHZ9NN1fZQoaAZHQJDgOgHu7YloB00/AWgIR0CtnHB8IAwPdX2UKGgGR0CQfH9rXUYsaAdNSwFoCEdAraXn4AS39nV9lChoBkdAknhWRNh3JWgHTWMBaAhHQK2n8zZ6D5F1fZQoaAZHQKhijl/YraxoB03oA2gIR0CtqgX7UG3XdWUu"}, "ep_success_buffer": {":type:": "<class 'collections.deque'>", ":serialized:": "gAWVIAAAAAAAAACMC2NvbGxlY3Rpb25zlIwFZGVxdWWUk5QpS2SGlFKULg=="}, "_n_updates": 198000, "buffer_size": 1000000, "batch_size": 256, "learning_starts": 10000, "tau": 0.005, "gamma": 0.99, "gradient_steps": 1, "optimize_memory_usage": false, "replay_buffer_class": {":type:": "<class 'abc.ABCMeta'>", ":serialized:": "gAWVNQAAAAAAAACMIHN0YWJsZV9iYXNlbGluZXMzLmNvbW1vbi5idWZmZXJzlIwMUmVwbGF5QnVmZmVylJOULg==", "__module__": "stable_baselines3.common.buffers", "__annotations__": "{'observations': <class 'numpy.ndarray'>, 'next_observations': <class 'numpy.ndarray'>, 'actions': <class 'numpy.ndarray'>, 'rewards': <class 'numpy.ndarray'>, 'dones': <class 'numpy.ndarray'>, 'timeouts': <class 'numpy.ndarray'>}", "__doc__": "\n Replay buffer used in off-policy algorithms like SAC/TD3.\n\n :param buffer_size: Max number of element in the buffer\n :param observation_space: Observation space\n :param action_space: Action space\n :param device: PyTorch device\n :param n_envs: Number of parallel environments\n :param optimize_memory_usage: Enable a memory efficient variant\n of the replay buffer which reduces by almost a factor two the memory used,\n at a cost of more complexity.\n See https://github.com/DLR-RM/stable-baselines3/issues/37#issuecomment-637501195\n and https://github.com/DLR-RM/stable-baselines3/pull/28#issuecomment-637559274\n Cannot be used in combination with handle_timeout_termination.\n :param handle_timeout_termination: Handle timeout termination (due to timelimit)\n separately and treat the task as infinite horizon task.\n https://github.com/DLR-RM/stable-baselines3/issues/284\n ", "__init__": "<function ReplayBuffer.__init__ at 0x7fc00e6f0cc0>", "add": "<function ReplayBuffer.add at 0x7fc00e6f0e00>", "sample": "<function ReplayBuffer.sample at 0x7fc00e6f0ea0>", "_get_samples": "<function ReplayBuffer._get_samples at 0x7fc00e6f0f40>", "_maybe_cast_dtype": "<staticmethod(<function ReplayBuffer._maybe_cast_dtype at 0x7fc00e6f0fe0>)>", "__abstractmethods__": "frozenset()", "_abc_impl": "<_abc._abc_data object at 0x7fc00e6ea340>"}, "replay_buffer_kwargs": {}, "train_freq": {":type:": "<class 'stable_baselines3.common.type_aliases.TrainFreq'>", ":serialized:": "gAWVYQAAAAAAAACMJXN0YWJsZV9iYXNlbGluZXMzLmNvbW1vbi50eXBlX2FsaWFzZXOUjAlUcmFpbkZyZXGUk5RLAWgAjBJUcmFpbkZyZXF1ZW5jeVVuaXSUk5SMBHN0ZXCUhZRSlIaUgZQu"}, "use_sde_at_warmup": false, "target_entropy": -3.0, "ent_coef": "auto", "target_update_interval": 1, "observation_space": {":type:": "<class 'gymnasium.spaces.box.Box'>", ":serialized:": "gAWVRQIAAAAAAACMFGd5bW5hc2l1bS5zcGFjZXMuYm94lIwDQm94lJOUKYGUfZQojAVkdHlwZZSMBW51bXB5lIwFZHR5cGWUk5SMAmY4lImIh5RSlChLA4wBPJROTk5K/////0r/////SwB0lGKMBl9zaGFwZZRLC4WUjANsb3eUjBJudW1weS5jb3JlLm51bWVyaWOUjAtfZnJvbWJ1ZmZlcpSTlCiWWAAAAAAAAAAAAAAAAADw/wAAAAAAAPD/AAAAAAAA8P8AAAAAAADw/wAAAAAAAPD/AAAAAAAA8P8AAAAAAADw/wAAAAAAAPD/AAAAAAAA8P8AAAAAAADw/wAAAAAAAPD/lGgLSwuFlIwBQ5R0lFKUjA1ib3VuZGVkX2JlbG93lGgTKJYLAAAAAAAAAAAAAAAAAAAAAAAAlGgIjAJiMZSJiIeUUpQoSwOMAXyUTk5OSv////9K/////0sAdJRiSwuFlGgWdJRSlIwEaGlnaJRoEyiWWAAAAAAAAAAAAAAAAADwfwAAAAAAAPB/AAAAAAAA8H8AAAAAAADwfwAAAAAAAPB/AAAAAAAA8H8AAAAAAADwfwAAAAAAAPB/AAAAAAAA8H8AAAAAAADwfwAAAAAAAPB/lGgLSwuFlGgWdJRSlIwNYm91bmRlZF9hYm92ZZRoEyiWCwAAAAAAAAAAAAAAAAAAAAAAAJRoHUsLhZRoFnSUUpSMCGxvd19yZXBylIwELWluZpSMCWhpZ2hfcmVwcpSMA2luZpSMCl9ucF9yYW5kb22UTnViLg==", "dtype": "float64", "_shape": [11], "low": "[-inf -inf -inf -inf -inf -inf -inf -inf -inf -inf -inf]", "bounded_below": "[False False False False False False False False False False False]", "high": "[inf inf inf inf inf inf inf inf inf inf inf]", "bounded_above": "[False False False False False False False False False False False]", "low_repr": "-inf", "high_repr": "inf", "_np_random": null}, "action_space": {":type:": "<class 'gymnasium.spaces.box.Box'>", ":serialized:": "gAWVYAIAAAAAAACMFGd5bW5hc2l1bS5zcGFjZXMuYm94lIwDQm94lJOUKYGUfZQojAVkdHlwZZSMBW51bXB5lIwFZHR5cGWUk5SMAmY0lImIh5RSlChLA4wBPJROTk5K/////0r/////SwB0lGKMBl9zaGFwZZRLA4WUjANsb3eUjBJudW1weS5jb3JlLm51bWVyaWOUjAtfZnJvbWJ1ZmZlcpSTlCiWDAAAAAAAAAAAAIC/AACAvwAAgL+UaAtLA4WUjAFDlHSUUpSMDWJvdW5kZWRfYmVsb3eUaBMolgMAAAAAAAAAAQEBlGgIjAJiMZSJiIeUUpQoSwOMAXyUTk5OSv////9K/////0sAdJRiSwOFlGgWdJRSlIwEaGlnaJRoEyiWDAAAAAAAAAAAAIA/AACAPwAAgD+UaAtLA4WUaBZ0lFKUjA1ib3VuZGVkX2Fib3ZllGgTKJYDAAAAAAAAAAEBAZRoHUsDhZRoFnSUUpSMCGxvd19yZXBylIwELTEuMJSMCWhpZ2hfcmVwcpSMAzEuMJSMCl9ucF9yYW5kb22UjBRudW1weS5yYW5kb20uX3BpY2tsZZSMEF9fZ2VuZXJhdG9yX2N0b3KUk5SMBVBDRzY0lGgyjBRfX2JpdF9nZW5lcmF0b3JfY3RvcpSTlIaUUpR9lCiMDWJpdF9nZW5lcmF0b3KUjAVQQ0c2NJSMBXN0YXRllH2UKGg9ihDjYZWmt15YCS1Fllk0taEajANpbmOUihCpc3hEvDOBWIIa9zrb2o1BdYwKaGFzX3VpbnQzMpRLAIwIdWludGVnZXKUSwB1YnViLg==", "dtype": "float32", "_shape": [3], "low": "[-1. -1. -1.]", "bounded_below": "[ True True True]", "high": "[1. 1. 1.]", "bounded_above": "[ True True True]", "low_repr": "-1.0", "high_repr": "1.0", "_np_random": "Generator(PCG64)"}, "n_envs": 5, "lr_schedule": {":type:": "<class 'function'>", ":serialized:": "gAWVHgQAAAAAAACMF2Nsb3VkcGlja2xlLmNsb3VkcGlja2xllIwOX21ha2VfZnVuY3Rpb26Uk5QoaACMDV9idWlsdGluX3R5cGWUk5SMCENvZGVUeXBllIWUUpQoSwFLAEsASwFLBUsTQyaVAZcAdAEAAAAAAAAAAAIAiQF8AKsBAAAAAAAAqwEAAAAAAABTAJROhZSMBWZsb2F0lIWUjBJwcm9ncmVzc19yZW1haW5pbmeUhZSMVC9ob21lL21hc3Rlci1hbmRyZWFzL2dlbl9kYXRhc2V0L3N0YWJsZS1iYXNlbGluZXMzL3N0YWJsZV9iYXNlbGluZXMzL2NvbW1vbi91dGlscy5weZSMCDxsYW1iZGE+lIwhZ2V0X3NjaGVkdWxlX2ZuLjxsb2NhbHM+LjxsYW1iZGE+lEthQxD4gACkZalO0DtN0yxO1CZPlEMAlIwOdmFsdWVfc2NoZWR1bGWUhZQpdJRSlH2UKIwLX19wYWNrYWdlX1+UjBhzdGFibGVfYmFzZWxpbmVzMy5jb21tb26UjAhfX25hbWVfX5SMHnN0YWJsZV9iYXNlbGluZXMzLmNvbW1vbi51dGlsc5SMCF9fZmlsZV9flIxUL2hvbWUvbWFzdGVyLWFuZHJlYXMvZ2VuX2RhdGFzZXQvc3RhYmxlLWJhc2VsaW5lczMvc3RhYmxlX2Jhc2VsaW5lczMvY29tbW9uL3V0aWxzLnB5lHVOTmgAjBBfbWFrZV9lbXB0eV9jZWxslJOUKVKUhZR0lFKUaACMEl9mdW5jdGlvbl9zZXRzdGF0ZZSTlGgjfZR9lChoGowIPGxhbWJkYT6UjAxfX3F1YWxuYW1lX1+UjCFnZXRfc2NoZWR1bGVfZm4uPGxvY2Fscz4uPGxhbWJkYT6UjA9fX2Fubm90YXRpb25zX1+UfZSMDl9fa3dkZWZhdWx0c19flE6MDF9fZGVmYXVsdHNfX5ROjApfX21vZHVsZV9flGgbjAdfX2RvY19flE6MC19fY2xvc3VyZV9flGgAjApfbWFrZV9jZWxslJOUaAIoaAcoSwFLAEsASwFLAUsTQwiVAZcAiQFTAJRoCSmMAV+UhZRoDowEZnVuY5SMGWNvbnN0YW50X2ZuLjxsb2NhbHM+LmZ1bmOUS4VDCPiAANgPEogKlGgSjAN2YWyUhZQpdJRSlGgXTk5oHylSlIWUdJRSlGglaEF9lH2UKGgajARmdW5jlGgpjBljb25zdGFudF9mbi48bG9jYWxzPi5mdW5jlGgrfZRoLU5oLk5oL2gbaDBOaDFoM0c/M6kqMFUyYYWUUpSFlIwXX2Nsb3VkcGlja2xlX3N1Ym1vZHVsZXOUXZSMC19fZ2xvYmFsc19flH2UdYaUhlIwhZRSlIWUaEpdlGhMfZR1hpSGUjAu"}, "batch_norm_stats": [], "batch_norm_stats_target": [], "system_info": {"OS": "Linux-6.6.59-1-MANJARO-x86_64-with-glibc2.40 # 1 SMP PREEMPT_DYNAMIC Fri Nov 1 05:33:52 UTC 2024", "Python": "3.12.7", "Stable-Baselines3": "2.4.0a10", "PyTorch": "2.4.1+cu121", "GPU Enabled": "True", "Numpy": "1.26.4", "Cloudpickle": "3.1.0", "Gymnasium": "1.0.0"}}
hopper-v5-sac-simple.zip CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:41a0b43b5071462763f88deed7b5a011ea7bc7f517cfccfb9523b7f78d30bc00
3
  size 3130867
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:1ef27c0f9a8645e0895bf78c5a249d6bb725924fbcc223abdebca9cd08596983
3
  size 3130867
hopper-v5-sac-simple/data CHANGED
@@ -5,17 +5,17 @@
5
  "__module__": "stable_baselines3.sac.policies",
6
  "__annotations__": "{'actor': <class 'stable_baselines3.sac.policies.Actor'>, 'critic': <class 'stable_baselines3.common.policies.ContinuousCritic'>, 'critic_target': <class 'stable_baselines3.common.policies.ContinuousCritic'>}",
7
  "__doc__": "\n Policy class (with both actor and critic) for SAC.\n\n :param observation_space: Observation space\n :param action_space: Action space\n :param lr_schedule: Learning rate schedule (could be constant)\n :param net_arch: The specification of the policy and value networks.\n :param activation_fn: Activation function\n :param use_sde: Whether to use State Dependent Exploration or not\n :param log_std_init: Initial value for the log standard deviation\n :param use_expln: Use ``expln()`` function instead of ``exp()`` when using gSDE to ensure\n a positive standard deviation (cf paper). It allows to keep variance\n above zero and prevent it from growing too fast. In practice, ``exp()`` is usually enough.\n :param clip_mean: Clip the mean output when using gSDE to avoid numerical instability.\n :param features_extractor_class: Features extractor to use.\n :param features_extractor_kwargs: Keyword arguments\n to pass to the features extractor.\n :param normalize_images: Whether to normalize images or not,\n dividing by 255.0 (True by default)\n :param optimizer_class: The optimizer to use,\n ``th.optim.Adam`` by default\n :param optimizer_kwargs: Additional keyword arguments,\n excluding the learning rate, to pass to the optimizer\n :param n_critics: Number of critic networks to create.\n :param share_features_extractor: Whether to share or not the features extractor\n between the actor and the critic (this saves computation time)\n ",
8
- "__init__": "<function SACPolicy.__init__ at 0x7f72d161c4a0>",
9
- "_build": "<function SACPolicy._build at 0x7f72d161cae0>",
10
- "_get_constructor_parameters": "<function SACPolicy._get_constructor_parameters at 0x7f72d161cb80>",
11
- "reset_noise": "<function SACPolicy.reset_noise at 0x7f72d161cc20>",
12
- "make_actor": "<function SACPolicy.make_actor at 0x7f72d161ccc0>",
13
- "make_critic": "<function SACPolicy.make_critic at 0x7f72d161cd60>",
14
- "forward": "<function SACPolicy.forward at 0x7f72d161ce00>",
15
- "_predict": "<function SACPolicy._predict at 0x7f72d161cea0>",
16
- "set_training_mode": "<function SACPolicy.set_training_mode at 0x7f72d161cf40>",
17
  "__abstractmethods__": "frozenset()",
18
- "_abc_impl": "<_abc._abc_data object at 0x7f72d1620fc0>"
19
  },
20
  "verbose": 0,
21
  "policy_kwargs": {
@@ -26,9 +26,9 @@
26
  "_num_timesteps_at_start": 0,
27
  "seed": 0,
28
  "action_noise": null,
29
- "start_time": 1730956112387218563,
30
  "learning_rate": 0.0003,
31
- "tensorboard_log": "runs/efmz9y24",
32
  "_last_obs": {
33
  ":type:": "<class 'numpy.ndarray'>",
34
  ":serialized:": "gAWVLQIAAAAAAACMEm51bXB5LmNvcmUubnVtZXJpY5SMC19mcm9tYnVmZmVylJOUKJa4AQAAAAAAAN5lw3la7fE/O5DnbXrzrT9J5JGS2hLRv3p9bdkvxdO/tlN1D6lB6T/PURp0XrD3P/b/NDSQGPa/pVJAqTeH67/eVMWlJ1gHwKzy5OefP+E/SzKWBcqQpr8uOiftOiXxP1FSzXpbBq2/66kMefpBxr+XKI6OeSbiv3es0U5pWuI/ZX7FlmRNBUCmzlN+KofEv8w5z3NMkQNA/+WdH2cZ2T9mCb5ovrS3v03w8jzHgAfATeP3hPsg+D+p05tbClitP/I14ulij6i/oYDeL+Eo4b81Iet1sEXZvwr0tf4kxvw/Nj77p7Xj2r8QSEcxE5uxv3O2/IDNA/s/nxiVDX1qBcBPlnzqnDQYQAKYtTkKOPY/HdrqSP7goD+YY/wM4jivvwnEKW96gua/m+VLDeFX1L8xJxs+Xt7+P4J6xbR4y+2/SvMgBVTF07+tLkqipTTyPy0gOLC+rfy/IIcC3hfWHUD9/6KHBTP4P+vTpPo2grU/hdabhm/Wgz9aGsSedEPkvyDnOC2QsuW/keZ58Q6IAUAc/JS9EZ3iP+puFNvIddq/jHE9q++U2T8adOaaYTDyv7rnsUIXaQlAlIwFbnVtcHmUjAVkdHlwZZSTlIwCZjiUiYiHlFKUKEsDjAE8lE5OTkr/////Sv////9LAHSUYksFSwuGlIwBQ5R0lFKULg=="
@@ -48,7 +48,7 @@
48
  "_stats_window_size": 100,
49
  "ep_info_buffer": {
50
  ":type:": "<class 'collections.deque'>",
51
- ":serialized:": "gAWVHwwAAAAAAACMC2NvbGxlY3Rpb25zlIwFZGVxdWWUk5QpS2SGlFKUKH2UKIwBcpRHQIw6VyT6i0yMAWyUTQ0BjAF0lEdAp1g30Gu9vnV9lChoBkdAipA8nE2pAGgHS/5oCEdAp1ooq7ROUXV9lChoBkdAhCq+JP69CmgHS85oCEdAp1rFPP9k0HV9lChoBkdAgpTSauwHJWgHS61oCEdAp1yZ5qubJHV9lChoBkdAhKCmmce8w2gHS9BoCEdAp15eMuOCG3V9lChoBkdAg8VHww0wamgHS8FoCEdAp1/6U7jkuHV9lChoBkdAhNsq+i8Fp2gHS9NoCEdAp2EYekpI+XV9lChoBkdAhwP/qgRK6GgHS9xoCEdAp2UE4//vOXV9lChoBkdAhEDPxhDw6WgHS8xoCEdAp2cWez2OAHV9lChoBkdAlJlF/pdKNGgHTYcBaAhHQKdrq5PM0P91fZQoaAZHQIkwO7YkE9toB0vwaAhHQKdsKMBp5/t1fZQoaAZHQIR3ANI9TxZoB0vOaAhHQKdtVmkFfRh1fZQoaAZHQKhvZnbqQiloB03oA2gIR0CncRjyvs7ddX2UKGgGR0CE7ZHBk7OnaAdL02gIR0CnchL/82rGdX2UKGgGR0CFngN0eU6gaAdL0WgIR0Cnc7xq46OpdX2UKGgGR0CRcyE+PikwaAdNSwFoCEdAp3YkjeKsMnV9lChoBkdAhI/ir1dxAGgHS85oCEdAp3g3Ov+wT3V9lChoBkdAi8FBHbypaWgHTQIBaAhHQKd4xYISlFd1fZQoaAZHQIPn2jmCAc1oB0vJaAhHQKd5z12aDwp1fZQoaAZHQKhZLZVXFLpoB03oA2gIR0CnesAAZKnOdX2UKGgGR0CIRimReTmoaAdL5GgIR0CnfQ4c/+sHdX2UKGgGR0CEUJ4xk/bCaAdLymgIR0CnftvEsJ6ZdX2UKGgGR0CH2RsP8Q7LaAdL4mgIR0Cnfw4QSSNgdX2UKGgGR0CEPTMxGlQ/aAdLwWgIR0Cnf5QHAymAdX2UKGgGR0CLL30r9VFQaAdL+WgIR0CnglFwT/Q0dX2UKGgGR0CFW96kZaV2aAdLzmgIR0CnhPW5H3DfdX2UKGgGR0CDwx5/smfHaAdLv2gIR0CnhTtbcGkfdX2UKGgGR0CGaqiL2pQ2aAdL2GgIR0CnhXgu7HyVdX2UKGgGR0CIC+M8YAKfaAdL4mgIR0CniRAmAskIdX2UKGgGR0CEHzJOnEVGaAdLv2gIR0Cni0DPWxyGdX2UKGgGR0CHt9a/yoXLaAdL4mgIR0CnjH+eOGTLdX2UKGgGR0CNZokka/ATaAdNGQFoCEdAp42YOz6acHV9lChoBkdAiOl3xnWat2gHS+xoCEdAp5SajSG8EnV9lChoBkdAjZ5dqDbrT2gHTRoBaAhHQKeU6L1EmY11fZQoaAZHQJaf6fZmI0toB02tAWgIR0CnmA4Vh1DCdX2UKGgGR0CDkGMz/IbPaAdLt2gIR0CnmiUtRNypdX2UKGgGR0CoUpe8PFvRaAdN6ANoCEdAp5s5vYODrnV9lChoBkdAih2SCe2/jGgHS/JoCEdAp59QTEit73V9lChoBkdAiL8C2DxsmGgHS+doCEdAp6D1zwMH8nV9lChoBkdAkgjGqT8pC2gHTVQBaAhHQKelWXTmW+p1fZQoaAZHQIhlPetSydFoB0vfaAhHQKel7nnuAqd1fZQoaAZHQKhma176YVtoB03oA2gIR0CnpxkzoEB9dX2UKGgGR0CRWlq7AckuaAdNQwFoCEdAp6ql5yEL6XV9lChoBkdAhKHmBOHnEGgHS9FoCEdAp6twpBomHHV9lChoBkdAhO1y4OMER2gHS8xoCEdAp60I4VARkHV9lChoBkdAg9Y5avA442gHS79oCEdAp7BC3/givHV9lChoBkdAhL9AG8mKImgHS8xoCEdAp7GPsu3+dnV9lChoBkdAqDsF78ejmGgHTegDaAhHQKeyxi6xxDN1fZQoaAZHQIgd6RyOrABoB0vkaAhHQKe5Ytvn8sN1fZQoaAZHQJDOBlz2exxoB004AWgIR0CnuX25H3DfdX2UKGgGR0CEEl/nW8RMaAdLxGgIR0CnvpCMYMvzdX2UKGgGR0CFv9WUbDMvaAdL1GgIR0CnvxHj6vaDdX2UKGgGR0Cha3Ma86FNaAdNsQJoCEdAp8CZ1Tzd13V9lChoBkdAqFTLWCmMwWgHTegDaAhHQKfCee0Xxe91fZQoaAZHQJFVTsQd0aJoB01GAWgIR0CnyAyOR1YAdX2UKGgGR0CoHFdweeWfaAdN6ANoCEdAp80r+irT6XV9lChoBkdAm0dvUSZjQWgHTSUCaAhHQKfNdEIgNgB1fZQoaAZHQJVzAUFjd59oB02oAWgIR0CnzgNYbKigdX2UKGgGR0COhyenyd4FaAdNKwFoCEdAp9W+hAWznnV9lChoBkdApN57G5tm+WgHTTgDaAhHQKfXIAfdRBN1fZQoaAZHQJANXIDHOr1oB00xAWgIR0Cn35ztsvZidX2UKGgGR0ComvyiM5wPaAdN6ANoCEdAp+PxQ+EAYHV9lChoBkdApb6FIZqEe2gHTVEDaAhHQKflGPH1e0J1fZQoaAZHQI6QUBU70WdoB00sAWgIR0Cn6Iw7DEWJdX2UKGgGR0CoreBcJMQFaAdN6ANoCEdAp+pswQDmsHV9lChoBkdAkh0lYMfA9GgHTVkBaAhHQKfu4fEGZ/l1fZQoaAZHQKizACDmKZVoB03oA2gIR0Cn8l24NI9UdX2UKGgGR0Co5rsz/IbPaAdN0gNoCEdAqABnV3EAHXV9lChoBkdAqEX09wFTvWgHTegDaAhHQKgGKC6pYLd1fZQoaAZHQKiDUkWykbhoB03oA2gIR0CoCCn/LkjpdX2UKGgGR0CRc3yT6i0waAdNSAFoCEdAqAp96PbO/3V9lChoBkdAqI5GFHrhSGgHTegDaAhHQKgM37qIJqt1fZQoaAZHQKghWr7O3UhoB03oA2gIR0CoEEOPFNtZdX2UKGgGR0CTgeiliz9kaAdNdwFoCEdAqBE7FhoduHV9lChoBkdAl25FVLi++WgHTckBaAhHQKgXy2a2F391fZQoaAZHQKHRml/H5rRoB02tAmgIR0CoG/WexwAEdX2UKGgGR0CoRnKEeyRkaAdN6ANoCEdAqCnQzWPLgXV9lChoBkdAp/icgyM1j2gHTegDaAhHQKgtV2r4nF51fZQoaAZHQKfvl0aIeo1oB03oA2gIR0CoLk0iILw4dX2UKGgGR0Cn6tdrXUYsaAdN6ANoCEdAqDUBYvFm4HV9lChoBkdAqC+E1EVnEmgHTegDaAhHQKg5OiUxEfF1fZQoaAZHQKWSo7T2FnJoB01oA2gIR0CoRoZb6guidX2UKGgGR0Coc0QvHtF8aAdN6ANoCEdAqEbgTCcf/3V9lChoBkdAqFyEKmbb12gHTegDaAhHQKhLHA+IM0B1fZQoaAZHQJEl759E1EVoB01DAWgIR0CoT+21c+qzdX2UKGgGR0CoQTXg9/z8aAdN6ANoCEdAqFbZTCLuQnV9lChoBkdAqDnocinpCGgHTegDaAhHQKhbELH+6y11fZQoaAZHQJHXO48U21loB01iAWgIR0CoX6ndXT3JdX2UKGgGR0CSVILZzxPPaAdNXwFoCEdAqGE7/dZaFHV9lChoBkdAqHsFOh0yQGgHTegDaAhHQKho49X9zfd1fZQoaAZHQJS6XvH93r5oB02SAWgIR0CobSad+XqrdX2UKGgGR0CoaqNjkMkQaAdN6ANoCEdAqG2t3np0OnV9lChoBkdAlEmU8NhE0GgHTZgBaAhHQKh06JcgQpZ1fZQoaAZHQKiRjta6jFhoB03oA2gIR0CoeIVnVXmvdX2UKGgGR0CZ5xNsFdLQaAdN7AFoCEdAqHwSemNzbXV9lChoBkdAqIv7UNKAa2gHTegDaAhHQKh9FKq4pc51fZQoaAZHQJDgOgHu7YloB00/AWgIR0CofkX6yjYadX2UKGgGR0CQfH9rXUYsaAdNSwFoCEdAqIdiZ+hGpnV9lChoBkdAknhWRNh3JWgHTWMBaAhHQKiJMXMQmNR1fZQoaAZHQKhijl/YraxoB03oA2gIR0CoivavA44qdWUu"
52
  },
53
  "ep_success_buffer": {
54
  ":type:": "<class 'collections.deque'>",
@@ -68,13 +68,13 @@
68
  "__module__": "stable_baselines3.common.buffers",
69
  "__annotations__": "{'observations': <class 'numpy.ndarray'>, 'next_observations': <class 'numpy.ndarray'>, 'actions': <class 'numpy.ndarray'>, 'rewards': <class 'numpy.ndarray'>, 'dones': <class 'numpy.ndarray'>, 'timeouts': <class 'numpy.ndarray'>}",
70
  "__doc__": "\n Replay buffer used in off-policy algorithms like SAC/TD3.\n\n :param buffer_size: Max number of element in the buffer\n :param observation_space: Observation space\n :param action_space: Action space\n :param device: PyTorch device\n :param n_envs: Number of parallel environments\n :param optimize_memory_usage: Enable a memory efficient variant\n of the replay buffer which reduces by almost a factor two the memory used,\n at a cost of more complexity.\n See https://github.com/DLR-RM/stable-baselines3/issues/37#issuecomment-637501195\n and https://github.com/DLR-RM/stable-baselines3/pull/28#issuecomment-637559274\n Cannot be used in combination with handle_timeout_termination.\n :param handle_timeout_termination: Handle timeout termination (due to timelimit)\n separately and treat the task as infinite horizon task.\n https://github.com/DLR-RM/stable-baselines3/issues/284\n ",
71
- "__init__": "<function ReplayBuffer.__init__ at 0x7f72e0564cc0>",
72
- "add": "<function ReplayBuffer.add at 0x7f72e0564e00>",
73
- "sample": "<function ReplayBuffer.sample at 0x7f72e0564ea0>",
74
- "_get_samples": "<function ReplayBuffer._get_samples at 0x7f72e0564f40>",
75
- "_maybe_cast_dtype": "<staticmethod(<function ReplayBuffer._maybe_cast_dtype at 0x7f72e0564fe0>)>",
76
  "__abstractmethods__": "frozenset()",
77
- "_abc_impl": "<_abc._abc_data object at 0x7f72e055a600>"
78
  },
79
  "replay_buffer_kwargs": {},
80
  "train_freq": {
 
5
  "__module__": "stable_baselines3.sac.policies",
6
  "__annotations__": "{'actor': <class 'stable_baselines3.sac.policies.Actor'>, 'critic': <class 'stable_baselines3.common.policies.ContinuousCritic'>, 'critic_target': <class 'stable_baselines3.common.policies.ContinuousCritic'>}",
7
  "__doc__": "\n Policy class (with both actor and critic) for SAC.\n\n :param observation_space: Observation space\n :param action_space: Action space\n :param lr_schedule: Learning rate schedule (could be constant)\n :param net_arch: The specification of the policy and value networks.\n :param activation_fn: Activation function\n :param use_sde: Whether to use State Dependent Exploration or not\n :param log_std_init: Initial value for the log standard deviation\n :param use_expln: Use ``expln()`` function instead of ``exp()`` when using gSDE to ensure\n a positive standard deviation (cf paper). It allows to keep variance\n above zero and prevent it from growing too fast. In practice, ``exp()`` is usually enough.\n :param clip_mean: Clip the mean output when using gSDE to avoid numerical instability.\n :param features_extractor_class: Features extractor to use.\n :param features_extractor_kwargs: Keyword arguments\n to pass to the features extractor.\n :param normalize_images: Whether to normalize images or not,\n dividing by 255.0 (True by default)\n :param optimizer_class: The optimizer to use,\n ``th.optim.Adam`` by default\n :param optimizer_kwargs: Additional keyword arguments,\n excluding the learning rate, to pass to the optimizer\n :param n_critics: Number of critic networks to create.\n :param share_features_extractor: Whether to share or not the features extractor\n between the actor and the critic (this saves computation time)\n ",
8
+ "__init__": "<function SACPolicy.__init__ at 0x7fc00380c4a0>",
9
+ "_build": "<function SACPolicy._build at 0x7fc00380cae0>",
10
+ "_get_constructor_parameters": "<function SACPolicy._get_constructor_parameters at 0x7fc00380cb80>",
11
+ "reset_noise": "<function SACPolicy.reset_noise at 0x7fc00380cc20>",
12
+ "make_actor": "<function SACPolicy.make_actor at 0x7fc00380ccc0>",
13
+ "make_critic": "<function SACPolicy.make_critic at 0x7fc00380cd60>",
14
+ "forward": "<function SACPolicy.forward at 0x7fc00380ce00>",
15
+ "_predict": "<function SACPolicy._predict at 0x7fc00380cea0>",
16
+ "set_training_mode": "<function SACPolicy.set_training_mode at 0x7fc00380cf40>",
17
  "__abstractmethods__": "frozenset()",
18
+ "_abc_impl": "<_abc._abc_data object at 0x7fc0038112c0>"
19
  },
20
  "verbose": 0,
21
  "policy_kwargs": {
 
26
  "_num_timesteps_at_start": 0,
27
  "seed": 0,
28
  "action_noise": null,
29
+ "start_time": 1731417232377162777,
30
  "learning_rate": 0.0003,
31
+ "tensorboard_log": "runs/ff8r1mba",
32
  "_last_obs": {
33
  ":type:": "<class 'numpy.ndarray'>",
34
  ":serialized:": "gAWVLQIAAAAAAACMEm51bXB5LmNvcmUubnVtZXJpY5SMC19mcm9tYnVmZmVylJOUKJa4AQAAAAAAAN5lw3la7fE/O5DnbXrzrT9J5JGS2hLRv3p9bdkvxdO/tlN1D6lB6T/PURp0XrD3P/b/NDSQGPa/pVJAqTeH67/eVMWlJ1gHwKzy5OefP+E/SzKWBcqQpr8uOiftOiXxP1FSzXpbBq2/66kMefpBxr+XKI6OeSbiv3es0U5pWuI/ZX7FlmRNBUCmzlN+KofEv8w5z3NMkQNA/+WdH2cZ2T9mCb5ovrS3v03w8jzHgAfATeP3hPsg+D+p05tbClitP/I14ulij6i/oYDeL+Eo4b81Iet1sEXZvwr0tf4kxvw/Nj77p7Xj2r8QSEcxE5uxv3O2/IDNA/s/nxiVDX1qBcBPlnzqnDQYQAKYtTkKOPY/HdrqSP7goD+YY/wM4jivvwnEKW96gua/m+VLDeFX1L8xJxs+Xt7+P4J6xbR4y+2/SvMgBVTF07+tLkqipTTyPy0gOLC+rfy/IIcC3hfWHUD9/6KHBTP4P+vTpPo2grU/hdabhm/Wgz9aGsSedEPkvyDnOC2QsuW/keZ58Q6IAUAc/JS9EZ3iP+puFNvIddq/jHE9q++U2T8adOaaYTDyv7rnsUIXaQlAlIwFbnVtcHmUjAVkdHlwZZSTlIwCZjiUiYiHlFKUKEsDjAE8lE5OTkr/////Sv////9LAHSUYksFSwuGlIwBQ5R0lFKULg=="
 
48
  "_stats_window_size": 100,
49
  "ep_info_buffer": {
50
  ":type:": "<class 'collections.deque'>",
51
+ ":serialized:": "gAWVHwwAAAAAAACMC2NvbGxlY3Rpb25zlIwFZGVxdWWUk5QpS2SGlFKUKH2UKIwBcpRHQIw6VyT6i0yMAWyUTQ0BjAF0lEdArFr9HYpUgnV9lChoBkdAipA8nE2pAGgHS/5oCEdArF08fT1CgXV9lChoBkdAhCq+JP69CmgHS85oCEdArF3sXWOIZnV9lChoBkdAgpTSauwHJWgHS61oCEdArGAOy3Td+HV9lChoBkdAhKCmmce8w2gHS9BoCEdArGIKJ0nw5XV9lChoBkdAg8VHww0wamgHS8FoCEdArGO5A6dUbXV9lChoBkdAhNsq+i8Fp2gHS9NoCEdArGTtXgccVHV9lChoBkdAhwP/qgRK6GgHS9xoCEdArGktZvDP4XV9lChoBkdAhEDPxhDw6WgHS8xoCEdArGvMdq+JxnV9lChoBkdAlJlF/pdKNGgHTYcBaAhHQKxwGSTQmeF1fZQoaAZHQIkwO7YkE9toB0vwaAhHQKxwjyNGViZ1fZQoaAZHQIR3ANI9TxZoB0vOaAhHQKxx6ieumrN1fZQoaAZHQKhvZnbqQiloB03oA2gIR0Csdch4D9wWdX2UKGgGR0CE7ZHBk7OnaAdL02gIR0CsdwZEUj9odX2UKGgGR0CFngN0eU6gaAdL0WgIR0CseLaWw/xEdX2UKGgGR0CRcyE+PikwaAdNSwFoCEdArHtV03fhuXV9lChoBkdAhI/ir1dxAGgHS85oCEdArH1gBYFJQXV9lChoBkdAi8FBHbypaWgHTQIBaAhHQKx94aScLBt1fZQoaAZHQIPn2jmCAc1oB0vJaAhHQKx+7VEuxr11fZQoaAZHQKhZLZVXFLpoB03oA2gIR0Csf/c2BJ7LdX2UKGgGR0CIRimReTmoaAdL5GgIR0CsgohwMpgDdX2UKGgGR0CEUJ4xk/bCaAdLymgIR0CshIKebutwdX2UKGgGR0CH2RsP8Q7LaAdL4mgIR0CshMntv4ucdX2UKGgGR0CEPTMxGlQ/aAdLwWgIR0CshWCu2Zy/dX2UKGgGR0CLL30r9VFQaAdL+WgIR0CsiFPxH5JsdX2UKGgGR0CFW96kZaV2aAdLzmgIR0Csi4reIl+mdX2UKGgGR0CDwx5/smfHaAdLv2gIR0Csi86H0se5dX2UKGgGR0CGaqiL2pQ2aAdL2GgIR0CsjAQVsUItdX2UKGgGR0CIC+M8YAKfaAdL4mgIR0Csj5n6MzdldX2UKGgGR0CEHzJOnEVGaAdLv2gIR0Cskaec6NlzdX2UKGgGR0CHt9a/yoXLaAdL4mgIR0CskwjGT9sKdX2UKGgGR0CNZokka/ATaAdNGQFoCEdArJRjQXyiEnV9lChoBkdAiOl3xnWat2gHS+xoCEdArJu3hXKbKHV9lChoBkdAjZ5dqDbrT2gHTRoBaAhHQKyb+OCoS+R1fZQoaAZHQJaf6fZmI0toB02tAWgIR0CsnwK814xDdX2UKGgGR0CDkGMz/IbPaAdLt2gIR0CsoVQLmZE2dX2UKGgGR0CoUpe8PFvRaAdN6ANoCEdArKJpof0VanV9lChoBkdAih2SCe2/jGgHS/JoCEdArKbeh4+r2nV9lChoBkdAiL8C2DxsmGgHS+doCEdArKi8lXzUZ3V9lChoBkdAkgjGqT8pC2gHTVQBaAhHQKytXkDp1Rt1fZQoaAZHQIhlPetSydFoB0vfaAhHQKyuDgeA/cF1fZQoaAZHQKhma176YVtoB03oA2gIR0Csr1fseGO/dX2UKGgGR0CRWlq7AckuaAdNQwFoCEdArLNF/H5rQHV9lChoBkdAhKHmBOHnEGgHS9FoCEdArLQ7SRbKR3V9lChoBkdAhO1y4OMER2gHS8xoCEdArLW7Zcs19HV9lChoBkdAg9Y5avA442gHS79oCEdArLjvqkdmx3V9lChoBkdAhL9AG8mKImgHS8xoCEdArLo3JFLFoHV9lChoBkdAqDsF78ejmGgHTegDaAhHQKy7aqMm4RV1fZQoaAZHQIgd6RyOrABoB0vkaAhHQKzCw9mHxjJ1fZQoaAZHQJDOBlz2exxoB004AWgIR0CswuGHgxagdX2UKGgGR0CEEl/nW8RMaAdLxGgIR0CsyMO3MINWdX2UKGgGR0CFv9WUbDMvaAdL1GgIR0CsyU7zCk44dX2UKGgGR0Cha3Ma86FNaAdNsQJoCEdArMsc1IiC8XV9lChoBkdAqFTLWCmMwWgHTegDaAhHQKzNRjwQUYd1fZQoaAZHQJFVTsQd0aJoB01GAWgIR0Cs1CYL9deIdX2UKGgGR0CoHFdweeWfaAdN6ANoCEdArNparYGt63V9lChoBkdAm0dvUSZjQWgHTSUCaAhHQKzatbRnezl1fZQoaAZHQJVzAUFjd59oB02oAWgIR0Cs21NTcZccdX2UKGgGR0COhyenyd4FaAdNKwFoCEdArOQA4Qz1snV9lChoBkdApN57G5tm+WgHTTgDaAhHQKzlzOj7AL11fZQoaAZHQJANXIDHOr1oB00xAWgIR0Cs708QqZtvdX2UKGgGR0ComvyiM5wPaAdN6ANoCEdArPOlWhh6SnV9lChoBkdApb6FIZqEe2gHTVEDaAhHQKz0+auwHJN1fZQoaAZHQI6QUBU70WdoB00sAWgIR0Cs+QyxzJZGdX2UKGgGR0CoreBcJMQFaAdN6ANoCEdArPsViWmgrnV9lChoBkdAkh0lYMfA9GgHTVkBaAhHQK0AUX9BKL91fZQoaAZHQKizACDmKZVoB03oA2gIR0CtBAyfDk2hdX2UKGgGR0Co5rsz/IbPaAdN0gNoCEdArRKb+JgssnV9lChoBkdAqEX09wFTvWgHTegDaAhHQK0YQ0sOG0x1fZQoaAZHQKiDUkWykbhoB03oA2gIR0CtGl2wV0tAdX2UKGgGR0CRc3yT6i0waAdNSAFoCEdArRzwxgy/K3V9lChoBkdAqI5GFHrhSGgHTegDaAhHQK0frlrdnCh1fZQoaAZHQKghWr7O3UhoB03oA2gIR0CtIz1QIldDdX2UKGgGR0CTgeiliz9kaAdNdwFoCEdArSRO0b961XV9lChoBkdAl25FVLi++WgHTckBaAhHQK0r5kMkQf91fZQoaAZHQKHRml/H5rRoB02tAmgIR0CtMGAC4jKQdX2UKGgGR0CoRnKEeyRkaAdN6ANoCEdArUMwnH/953V9lChoBkdAp/icgyM1j2gHTegDaAhHQK1HUebNKRN1fZQoaAZHQKfvl0aIeo1oB03oA2gIR0CtSIFDWsijdX2UKGgGR0Cn6tdrXUYsaAdN6ANoCEdArU92OsDGLnV9lChoBkdAqC+E1EVnEmgHTegDaAhHQK1T/W6K+BZ1fZQoaAZHQKWSo7T2FnJoB01oA2gIR0CtYzOvdM0xdX2UKGgGR0Coc0QvHtF8aAdN6ANoCEdArWOer0aqCHV9lChoBkdAqFyEKmbb12gHTegDaAhHQK1ofMCcPOJ1fZQoaAZHQJEl759E1EVoB01DAWgIR0Ctbjz5oGpudX2UKGgGR0CoQTXg9/z8aAdN6ANoCEdArW/vwd8zAXV9lChoBkdAqDnocinpCGgHTegDaAhHQK10kVII4VB1fZQoaAZHQJHXO48U21loB01iAWgIR0CteX6WPcSHdX2UKGgGR0CSVILZzxPPaAdNXwFoCEdArXsXE0iyIHV9lChoBkdAqHsFOh0yQGgHTegDaAhHQK2DqdqcmSh1fZQoaAZHQJS6XvH93r5oB02SAWgIR0CtiIwEIPbxdX2UKGgGR0CoaqNjkMkQaAdN6ANoCEdArYkcaCL/CXV9lChoBkdAlEmU8NhE0GgHTZgBaAhHQK2RpOdoWYZ1fZQoaAZHQKiRjta6jFhoB03oA2gIR0Ctlfhpg1FZdX2UKGgGR0CZ5xNsFdLQaAdN7AFoCEdArZnrWqcVg3V9lChoBkdAqIv7UNKAa2gHTegDaAhHQK2bDwHZ9NN1fZQoaAZHQJDgOgHu7YloB00/AWgIR0CtnHB8IAwPdX2UKGgGR0CQfH9rXUYsaAdNSwFoCEdAraXn4AS39nV9lChoBkdAknhWRNh3JWgHTWMBaAhHQK2n8zZ6D5F1fZQoaAZHQKhijl/YraxoB03oA2gIR0CtqgX7UG3XdWUu"
52
  },
53
  "ep_success_buffer": {
54
  ":type:": "<class 'collections.deque'>",
 
68
  "__module__": "stable_baselines3.common.buffers",
69
  "__annotations__": "{'observations': <class 'numpy.ndarray'>, 'next_observations': <class 'numpy.ndarray'>, 'actions': <class 'numpy.ndarray'>, 'rewards': <class 'numpy.ndarray'>, 'dones': <class 'numpy.ndarray'>, 'timeouts': <class 'numpy.ndarray'>}",
70
  "__doc__": "\n Replay buffer used in off-policy algorithms like SAC/TD3.\n\n :param buffer_size: Max number of element in the buffer\n :param observation_space: Observation space\n :param action_space: Action space\n :param device: PyTorch device\n :param n_envs: Number of parallel environments\n :param optimize_memory_usage: Enable a memory efficient variant\n of the replay buffer which reduces by almost a factor two the memory used,\n at a cost of more complexity.\n See https://github.com/DLR-RM/stable-baselines3/issues/37#issuecomment-637501195\n and https://github.com/DLR-RM/stable-baselines3/pull/28#issuecomment-637559274\n Cannot be used in combination with handle_timeout_termination.\n :param handle_timeout_termination: Handle timeout termination (due to timelimit)\n separately and treat the task as infinite horizon task.\n https://github.com/DLR-RM/stable-baselines3/issues/284\n ",
71
+ "__init__": "<function ReplayBuffer.__init__ at 0x7fc00e6f0cc0>",
72
+ "add": "<function ReplayBuffer.add at 0x7fc00e6f0e00>",
73
+ "sample": "<function ReplayBuffer.sample at 0x7fc00e6f0ea0>",
74
+ "_get_samples": "<function ReplayBuffer._get_samples at 0x7fc00e6f0f40>",
75
+ "_maybe_cast_dtype": "<staticmethod(<function ReplayBuffer._maybe_cast_dtype at 0x7fc00e6f0fe0>)>",
76
  "__abstractmethods__": "frozenset()",
77
+ "_abc_impl": "<_abc._abc_data object at 0x7fc00e6ea340>"
78
  },
79
  "replay_buffer_kwargs": {},
80
  "train_freq": {
replay.mp4 CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:2ec6f16538dcbac21264d764ccf5f17060c9fa0c45819fb9c0da617e8d920d44
3
  size 1459591
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:6ffc19e5b703f3bd332da711763d250afd5d554a3f38c07125eae4be907583b2
3
  size 1459591
results.json CHANGED
@@ -1 +1 @@
1
- {"mean_reward": 3112.2047958000003, "std_reward": 3.5531871170395797, "is_deterministic": true, "n_eval_episodes": 10, "eval_datetime": "2024-11-07T08:01:16.532667"}
 
1
+ {"mean_reward": 3112.2047958000003, "std_reward": 3.5531871170395797, "is_deterministic": true, "n_eval_episodes": 10, "eval_datetime": "2024-11-12T16:17:28.963587"}