mortenaas commited on
Commit
dc0f35f
·
verified ·
1 Parent(s): c813287

Upload PPO LunarLander-v2 trained agent

Browse files
README.md CHANGED
@@ -16,7 +16,7 @@ model-index:
16
  type: LunarLanderContinuous-v2
17
  metrics:
18
  - type: mean_reward
19
- value: 230.68 +/- 7.84
20
  name: mean_reward
21
  verified: false
22
  ---
 
16
  type: LunarLanderContinuous-v2
17
  metrics:
18
  - type: mean_reward
19
+ value: 6.61 +/- 15.77
20
  name: mean_reward
21
  verified: false
22
  ---
SACdyn.zip ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:7bb6390997b2ad671fa9d9e49fbac021ab369b70eb30f143ceeb4af8c57ad6fe
3
+ size 3082023
SACdyn/_stable_baselines3_version ADDED
@@ -0,0 +1 @@
 
 
1
+ 2.0.0a5
SACdyn/actor.optimizer.pth ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:307a338eb02a17a7a242d729e69201eeb3ae16535fa373fd26ef50c2cf4b1a09
3
+ size 559694
SACdyn/critic.optimizer.pth ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f00ace000a33db7a91a6bbcbd8e1316bfaf4277b82bf3edc678493b6bcd5b61f
3
+ size 1111466
SACdyn/data ADDED
@@ -0,0 +1,126 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "policy_class": {
3
+ ":type:": "<class 'abc.ABCMeta'>",
4
+ ":serialized:": "gAWVMAAAAAAAAACMHnN0YWJsZV9iYXNlbGluZXMzLnNhYy5wb2xpY2llc5SMCVNBQ1BvbGljeZSTlC4=",
5
+ "__module__": "stable_baselines3.sac.policies",
6
+ "__annotations__": "{'actor': <class 'stable_baselines3.sac.policies.Actor'>, 'critic': <class 'stable_baselines3.common.policies.ContinuousCritic'>, 'critic_target': <class 'stable_baselines3.common.policies.ContinuousCritic'>}",
7
+ "__doc__": "\n Policy class (with both actor and critic) for SAC.\n\n :param observation_space: Observation space\n :param action_space: Action space\n :param lr_schedule: Learning rate schedule (could be constant)\n :param net_arch: The specification of the policy and value networks.\n :param activation_fn: Activation function\n :param use_sde: Whether to use State Dependent Exploration or not\n :param log_std_init: Initial value for the log standard deviation\n :param use_expln: Use ``expln()`` function instead of ``exp()`` when using gSDE to ensure\n a positive standard deviation (cf paper). It allows to keep variance\n above zero and prevent it from growing too fast. In practice, ``exp()`` is usually enough.\n :param clip_mean: Clip the mean output when using gSDE to avoid numerical instability.\n :param features_extractor_class: Features extractor to use.\n :param features_extractor_kwargs: Keyword arguments\n to pass to the features extractor.\n :param normalize_images: Whether to normalize images or not,\n dividing by 255.0 (True by default)\n :param optimizer_class: The optimizer to use,\n ``th.optim.Adam`` by default\n :param optimizer_kwargs: Additional keyword arguments,\n excluding the learning rate, to pass to the optimizer\n :param n_critics: Number of critic networks to create.\n :param share_features_extractor: Whether to share or not the features extractor\n between the actor and the critic (this saves computation time)\n ",
8
+ "__init__": "<function SACPolicy.__init__ at 0x7d227e6ccd30>",
9
+ "_build": "<function SACPolicy._build at 0x7d227e6ccdc0>",
10
+ "_get_constructor_parameters": "<function SACPolicy._get_constructor_parameters at 0x7d227e6cce50>",
11
+ "reset_noise": "<function SACPolicy.reset_noise at 0x7d227e6ccee0>",
12
+ "make_actor": "<function SACPolicy.make_actor at 0x7d227e6ccf70>",
13
+ "make_critic": "<function SACPolicy.make_critic at 0x7d227e6cd000>",
14
+ "forward": "<function SACPolicy.forward at 0x7d227e6cd090>",
15
+ "_predict": "<function SACPolicy._predict at 0x7d227e6cd120>",
16
+ "set_training_mode": "<function SACPolicy.set_training_mode at 0x7d227e6cd1b0>",
17
+ "__abstractmethods__": "frozenset()",
18
+ "_abc_impl": "<_abc._abc_data object at 0x7d227e6bbec0>"
19
+ },
20
+ "verbose": 1,
21
+ "policy_kwargs": {
22
+ "use_sde": false
23
+ },
24
+ "num_timesteps": 500000,
25
+ "_total_timesteps": 500000,
26
+ "_num_timesteps_at_start": 0,
27
+ "seed": null,
28
+ "action_noise": null,
29
+ "start_time": 1716478454985334697,
30
+ "learning_rate": {
31
+ ":type:": "<class 'function'>",
32
+ ":serialized:": "gAWVeQIAAAAAAACMF2Nsb3VkcGlja2xlLmNsb3VkcGlja2xllIwOX21ha2VfZnVuY3Rpb26Uk5QoaACMDV9idWlsdGluX3R5cGWUk5SMCENvZGVUeXBllIWUUpQoSwFLAEsASwVLBEtDQzRkAX0BZAJ8ARQAfQJkA30DZAR9BHwAfAJrAHIYfAN8AHwCGwB8A3wEGAAUABgAUwB8BFMAlChOTZABS0tHP0frrxAjY7JHPzBiTdLxqfx0lCkojAF0lIwSYXZnX2VwaXNvZGVfbGVuZ3RolIwUdHJhbnNpdGlvbl90aW1lc3RlcHOUjBVpbml0aWFsX2xlYXJuaW5nX3JhdGWUjBNmaW5hbF9sZWFybmluZ19yYXRllHSUjB48aXB5dGhvbi1pbnB1dC02LTRlZTZjYWFkNDFlYz6UjBZsZWFybmluZ19yYXRlX3NjaGVkdWxllEsHQw4EAggBBAEEAQgCFAIEA5QpKXSUUpR9lCiMC19fcGFja2FnZV9flE6MCF9fbmFtZV9flIwIX19tYWluX1+UdU5OTnSUUpSMHGNsb3VkcGlja2xlLmNsb3VkcGlja2xlX2Zhc3SUjBJfZnVuY3Rpb25fc2V0c3RhdGWUk5RoGn2UfZQoaBdoEYwMX19xdWFsbmFtZV9flGgRjA9fX2Fubm90YXRpb25zX1+UfZSMDl9fa3dkZWZhdWx0c19flE6MDF9fZGVmYXVsdHNfX5ROjApfX21vZHVsZV9flGgYjAdfX2RvY19flE6MC19fY2xvc3VyZV9flE6MF19jbG91ZHBpY2tsZV9zdWJtb2R1bGVzlF2UjAtfX2dsb2JhbHNfX5R9lHWGlIZSMC4="
33
+ },
34
+ "tensorboard_log": null,
35
+ "_last_obs": {
36
+ ":type:": "<class 'numpy.ndarray'>",
37
+ ":serialized:": "gAWVdQIAAAAAAACMEm51bXB5LmNvcmUubnVtZXJpY5SMC19mcm9tYnVmZmVylJOUKJYAAgAAAAAAABqZYL1DCJk+SqMKvtWUxbzvME+9xdffPAAAAAAAAAAAMxtYvE9eUz7DPtk9l7jlvLNMijxCdhS8AAAAAAAAAACGRys+K4awPZgl1z0/vfc76HQTPQZjHD0AAAAAAAAAAABHjDxLNIc/a1aKPbcy8L6SpiI8FY5MPQAAAAAAAAAA+iI8vlaIkj+qCdm+u194vtHzWr57yBK+AAAAAAAAAAAzI3Q8xieiPyr79D3J3wy/tqiOOp7UGLsAAAAAAAAAAECG2D1k1849ShcqvSAIDj1k6hK8QAFqvQAAAAAAAAAATTyKPs47rT1mpe08H6psPPJ0pTyNnRu8AAAAAAAAAADzUkE+IdeJPeoHK70Uy+88GP8MvPPclb0AAAAAAAAAALq6kT4EHcI9hY5TPWksMzxfQiQ9zW7OPAAAAAAAAAAAzTIiPQHIzT0Nnpi8PfwePKrL2rzOWZK6AAAAAAAAAAAmRz4+LVmhP8H5iD4pN+e9VNk0PgB51bwAAAAAAAAAAHOruD5GiqM/hQ+VPS+YiL7qzEc+tSWvvQAAAAAAAAAATbqxPXt7oT0cLYC8truhPK6kPrvaAvm7AAAAAAAAAADmFSU+gUq2PaUxgD0R7Ms88jOtPJMhg7wAAAAAAAAAAMh4h75twJY/4gypvk5dlrzf26a+kye6vQAAAAAAAAAAlIwFbnVtcHmUjAVkdHlwZZSTlIwCZjSUiYiHlFKUKEsDjAE8lE5OTkr/////Sv////9LAHSUYksQSwiGlIwBQ5R0lFKULg=="
38
+ },
39
+ "_last_episode_starts": {
40
+ ":type:": "<class 'numpy.ndarray'>",
41
+ ":serialized:": "gAWVgwAAAAAAAACMEm51bXB5LmNvcmUubnVtZXJpY5SMC19mcm9tYnVmZmVylJOUKJYQAAAAAAAAAAEBAQEBAQEBAQEBAQEBAQGUjAVudW1weZSMBWR0eXBllJOUjAJiMZSJiIeUUpQoSwOMAXyUTk5OSv////9K/////0sAdJRiSxCFlIwBQ5R0lFKULg=="
42
+ },
43
+ "_last_original_obs": {
44
+ ":type:": "<class 'numpy.ndarray'>",
45
+ ":serialized:": "gAWVdQIAAAAAAACMEm51bXB5LmNvcmUubnVtZXJpY5SMC19mcm9tYnVmZmVylJOUKJYAAgAAAAAAAOYbW72IT5k+oDD2vc6mIb2IyVS9dU/eOgAAAAAAAAAAM2lpvLkDVD7qruQ9o13AvN4CjjzyhIm7AAAAAAAAAAATLyo+eCywPar7yT1soFa8J6MLPX2S8jwAAAAAAAAAADOJhjwsjog/6KNpPT3X876wevM7R0chPQAAAAAAAAAAJrk3vmw6kz+gMNq+pJJ4vv6cU76/vwy+AAAAAAAAAADNjmA8fr2jP1hd5T3M0hG/+PCdOrJV3DwAAAAAAAAAACZv2T0oPs09m8znvO3thbugOsi7egkzvQAAAAAAAAAA6haKPnuRrD1xHsE8r9q1O9xYqTyuzIG8AAAAAAAAAAAaykE+pH2IPdPf9LzzEeo7QBqiu9EIt70AAAAAAAAAAFp1kT6km8E9hqNNPUp+ZDw1GR89WvO3PAAAAAAAAAAAzfYiPYRVzT0qYpa8dU1HuplW2rzB7hg6AAAAAAAAAAA6jTs+iKyhP4a9iz6V39m94y42Pi6VDTwAAAAAAAAAAJ1RuD5kT6Q/PsmCPSk5d77bLUw+H8ZGvQAAAAAAAAAAWg6yPZGSoD32hwO8C2NrvNm9JbvTk5M2AAAAAAAAAADtcyQ+/iS1PUTcjj3UjoU8bMKzPLzdJrwAAAAAAAAAAErChb4+zZY/xwypvm00CDwtiKS+qie6vQAAAAAAAAAAlIwFbnVtcHmUjAVkdHlwZZSTlIwCZjSUiYiHlFKUKEsDjAE8lE5OTkr/////Sv////9LAHSUYksQSwiGlIwBQ5R0lFKULg=="
46
+ },
47
+ "_episode_num": 685,
48
+ "use_sde": false,
49
+ "sde_sample_freq": -1,
50
+ "_current_progress_remaining": 0.0,
51
+ "_stats_window_size": 100,
52
+ "ep_info_buffer": {
53
+ ":type:": "<class 'collections.deque'>",
54
+ ":serialized:": "gAWVRAwAAAAAAACMC2NvbGxlY3Rpb25zlIwFZGVxdWWUk5QpS2SGlFKUKH2UKIwBcpRHQGt67blA/s6MAWyUTTgDjAF0lEdApjJXc32mHnV9lChoBkfAHiXQ+lj3EmgHTegDaAhHQKY5eZKFqSJ1fZQoaAZHwDXZERaouPFoB03oA2gIR0CmPFhsQ/X5dX2UKGgGR8A73ZtvXK8taAdN6ANoCEdApj2wDYAbQ3V9lChoBkfANR9h/iHZb2gHTegDaAhHQKY+26bONYN1fZQoaAZHQGIRikfs/ptoB02WA2gIR0CmQHBy8zyjdX2UKGgGR0A49xyGSIP9aAdN6ANoCEdAplIjMC9ytHV9lChoBkfAIAqmKqGUOmgHTegDaAhHQKZYc6QvHtF1fZQoaAZHwD4S3z+WGAVoB03oA2gIR0CmXdGD15B1dX2UKGgGR0Bp5yA+Y+jeaAdNQwNoCEdApl5C7dznzXV9lChoBkdAYuOOOsDGLmgHTckDaAhHQKZmQy44Ia91fZQoaAZHQGbV+KCQLeBoB03YAmgIR0CmbbUqx1PndX2UKGgGRz//oNNJvo/zaAdN6ANoCEdAppeZdhRZU3V9lChoBkdAKu/CZWq95GgHTegDaAhHQKbWXJMg2ZR1fZQoaAZHwC9jbJwKjSJoB03oA2gIR0Cm7h7coH9ndX2UKGgGR0AhJK5kK/mDaAdN6ANoCEdApvlJO1v2oXV9lChoBkdAN/OtbLU1AWgHTegDaAhHQKb8uPH1e0J1fZQoaAZHwEC+7gbZOBVoB03oA2gIR0CnAqqPfbbldX2UKGgGR8BFngsbvPToaAdN6ANoCEdApwWc7yQPqnV9lChoBkdAPSnLmp2lmGgHTegDaAhHQKcHCGIsRQJ1fZQoaAZHQDBZ2C/XXiBoB03oA2gIR0CnCI/bCaZydX2UKGgGR8Arm2gFotcwaAdN6ANoCEdApwrZkd3jdnV9lChoBke/+b1ZkkKNQ2gHTegDaAhHQKcd48QqZtx1fZQoaAZHQDPf8+A3DN1oB03oA2gIR0CnInGw7kn1dX2UKGgGRz/SAJLM9r44aAdN6ANoCEdApyfevB7/oHV9lChoBkfAQjaNbTtsvmgHTegDaAhHQKcoYr3j+711fZQoaAZHQDXlJe3QUpNoB03oA2gIR0CnM+ve54GEdX2UKGgGR8A3co7V8Ti9aAdN6ANoCEdApzsteyAxz3V9lChoBkfAI1d2HLzPKWgHTegDaAhHQKdkXjyWiUR1fZQoaAZHQCjvTPSlWOpoB03oA2gIR0CnpQ6fJ3gUdX2UKGgGR8A85zE74i5eaAdN6ANoCEdAp76mKTB68nV9lChoBkfAGYW3BpHqeWgHTegDaAhHQKfJwo3Jgb91fZQoaAZHQGWnzdUKiPBoB02yA2gIR0CnzNZbhWHUdX2UKGgGR0BkQ/+l0o0AaAdNuwNoCEdAp81e2mYShHV9lChoBkfARZVkUbkwOGgHTegDaAhHQKfOryS3b211fZQoaAZHwEFqTSsr/bVoB03oA2gIR0Cn1DVeSjgydX2UKGgGR0As6eZof0VaaAdN6ANoCEdAp9kataIN3HV9lChoBkfANbMXvYvnKWgHTegDaAhHQKfazCk43m51fZQoaAZHwC2FkvsZ5zJoB03oA2gIR0Cn78mGVRk3dX2UKGgGRz/t7Y02tMfzaAdN6ANoCEdAp/R466reZXV9lChoBkfAMPr5Ec81XWgHTegDaAhHQKf6Ioc7yQR1fZQoaAZHwAYDjBEa2ndoB03oA2gIR0Cn+pIGQjlgdX2UKGgGR0Ax3RqXWvr4aAdN6ANoCEdAqAKVBhQWN3V9lChoBkfAFMVrAP/aQGgHTegDaAhHQKgMVEgntv51fZQoaAZHwDOrWZqmCRRoB03oA2gIR0CoNY0QkHD8dX2UKGgGR0AQ9Mh5gPVeaAdN6ANoCEdAqHZsuYhManV9lChoBkdAQeGPPszEaWgHTegDaAhHQKiPxLowEhd1fZQoaAZHQDdyB06o2n9oB03oA2gIR0CombyTINmUdX2UKGgGR8AyUD1XeWOZaAdN6ANoCEdAqJwak2xY73V9lChoBkfAQ0iWom5UcWgHTegDaAhHQKicmprk8zR1fZQoaAZHwArSQPqcEvFoB03oA2gIR0ConiU1yeZodX2UKGgGR0Aix81n/T9baAdN6ANoCEdAqKVbGkvboXV9lChoBkfAJRR+BpYcN2gHTegDaAhHQKirDxwQ1791fZQoaAZHQEDWuuA7PppoB03oA2gIR0CorMf6fra/dX2UKGgGR8A2D84PwuuiaAdN6ANoCEdAqL8Wz6ab4XV9lChoBkdAO1nV5KODJ2gHTegDaAhHQKjF8tXgccV1fZQoaAZHwB1s0UGmk31oB03oA2gIR0Coy85dWyTqdX2UKGgGR8A1D39aUzKtaAdN6ANoCEdAqMxL15B1LnV9lChoBkdAJKCm2sq8UWgHTegDaAhHQKjU2fA9FF51fZQoaAZHQGSMw8fV7QdoB022A2gIR0Co1ShvJiiJdX2UKGgGR8AHgVTJhfBvaAdN6ANoCEdAqQkIQ6IWQHV9lChoBkfAGEoa1kUbk2gHTegDaAhHQKlLgzu4PPN1fZQoaAZHwDrA/u9eyAxoB03oA2gIR0CpZc1aGHpKdX2UKGgGR8A3GUi6g/TtaAdN6ANoCEdAqXBJH/cWTHV9lChoBkfAN2/j4pMHr2gHTegDaAhHQKlyxpyIYWN1fZQoaAZHwCrYSlFc6eZoB03oA2gIR0Cpc07nX/YKdX2UKGgGR0AykfvWpZOjaAdN6ANoCEdAqXScVLzwt3V9lChoBkdAIbhxxT850mgHTegDaAhHQKl8cXFcY651fZQoaAZHwEHE6dUbT+hoB03oA2gIR0CpggafapPzdX2UKGgGR0BDnn2ys0YTaAdN6ANoCEdAqYPVszl90HV9lChoBkdAKVOQyRB/qmgHTegDaAhHQKmYQ1qFh5R1fZQoaAZHwBN/mT1TR6ZoB03oA2gIR0CpniNCAtnPdX2UKGgGR8BM3lKTSsr/aAdN6ANoCEdAqaSEr3CbdHV9lChoBkdAFygF5fMOgGgHTegDaAhHQKmlCstCiRJ1fZQoaAZHwCyoCfYjB2xoB03oA2gIR0CpraagmJFcdX2UKGgGR8A4UO8CgbqAaAdN6ANoCEdAqa3zwBo243V9lChoBkfAOCnLRrrPdGgHTegDaAhHQKniBlIVdop1fZQoaAZHQCG2PaL4vexoB03oA2gIR0CqJveQU5+6dX2UKGgGR0ACCcurZJ05aAdN6ANoCEdAqkHnwkPcz3V9lChoBkfACz8w5/9YOmgHTegDaAhHQKpPfWbPQfJ1fZQoaAZHwCUs0cfeUINoB03oA2gIR0CqUpCgbp/xdX2UKGgGR8Aav0Gu9vjwaAdN6ANoCEdAqlLusV+I/XV9lChoBkfAJN31J17pmmgHTegDaAhHQKpT5iVjZth1fZQoaAZHwBHxv73wkPdoB03oA2gIR0CqWVQeV9ncdX2UKGgGR0A7o2aDwpfAaAdN6ANoCEdAql7u+dsi0XV9lChoBkfAORdXHR1HOWgHTegDaAhHQKpgzMA3kxR1fZQoaAZHwAxAprk8zRBoB03oA2gIR0Cqdc1v/BFedX2UKGgGR8A0/h4dIXj3aAdN6ANoCEdAqnrMCeVcEHV9lChoBkfAQcoQL/jsEGgHTegDaAhHQKqA9i4rjHZ1fZQoaAZHwBMdtdiUgSxoB03oA2gIR0CqgW0XP7emdX2UKGgGR8A3Jl8gIQe4aAdN6ANoCEdAqoujx3FDOXV9lChoBkdAPoCNsFdLQGgHTegDaAhHQKqME6nzg/F1fZQoaAZHP/eona37UG5oB03oA2gIR0Cqv0LJbMX8dX2UKGgGR0AKocDKYAsDaAdN6ANoCEdAqwOhjawljXV9lChoBkdAMfsNDtw71mgHTegDaAhHQKsdBschkiF1fZQoaAZHQDDvG4qgAZNoB03oA2gIR0CrKk7zbvgFdX2UKGgGR8Aw0SBshxHYaAdN6ANoCEdAqyyw/qxC6nV9lChoBkfASVeFBY3eemgHTegDaAhHQKstEkrwvxp1fZQoaAZHwDCHtAs052hoB03oA2gIR0CrLgCNCJGfdX2UKGgGR8BCXiX6ZYxMaAdN6ANoCEdAqzNhpcophHVlLg=="
55
+ },
56
+ "ep_success_buffer": {
57
+ ":type:": "<class 'collections.deque'>",
58
+ ":serialized:": "gAWVIAAAAAAAAACMC2NvbGxlY3Rpb25zlIwFZGVxdWWUk5QpS2SGlFKULg=="
59
+ },
60
+ "_n_updates": 30625,
61
+ "observation_space": {
62
+ ":type:": "<class 'gymnasium.spaces.box.Box'>",
63
+ ":serialized:": "gAWVdgIAAAAAAACMFGd5bW5hc2l1bS5zcGFjZXMuYm94lIwDQm94lJOUKYGUfZQojAVkdHlwZZSMBW51bXB5lIwFZHR5cGWUk5SMAmY0lImIh5RSlChLA4wBPJROTk5K/////0r/////SwB0lGKMDWJvdW5kZWRfYmVsb3eUjBJudW1weS5jb3JlLm51bWVyaWOUjAtfZnJvbWJ1ZmZlcpSTlCiWCAAAAAAAAAABAQEBAQEBAZRoCIwCYjGUiYiHlFKUKEsDjAF8lE5OTkr/////Sv////9LAHSUYksIhZSMAUOUdJRSlIwNYm91bmRlZF9hYm92ZZRoESiWCAAAAAAAAAABAQEBAQEBAZRoFUsIhZRoGXSUUpSMBl9zaGFwZZRLCIWUjANsb3eUaBEoliAAAAAAAAAAAAC0wgAAtMIAAKDAAACgwNsPScAAAKDAAAAAgAAAAICUaAtLCIWUaBl0lFKUjARoaWdolGgRKJYgAAAAAAAAAAAAtEIAALRCAACgQAAAoEDbD0lAAACgQAAAgD8AAIA/lGgLSwiFlGgZdJRSlIwIbG93X3JlcHKUjFtbLTkwLiAgICAgICAgLTkwLiAgICAgICAgIC01LiAgICAgICAgIC01LiAgICAgICAgIC0zLjE0MTU5MjcgIC01LgogIC0wLiAgICAgICAgIC0wLiAgICAgICBdlIwJaGlnaF9yZXBylIxTWzkwLiAgICAgICAgOTAuICAgICAgICAgNS4gICAgICAgICA1LiAgICAgICAgIDMuMTQxNTkyNyAgNS4KICAxLiAgICAgICAgIDEuICAgICAgIF2UjApfbnBfcmFuZG9tlE51Yi4=",
64
+ "dtype": "float32",
65
+ "bounded_below": "[ True True True True True True True True]",
66
+ "bounded_above": "[ True True True True True True True True]",
67
+ "_shape": [
68
+ 8
69
+ ],
70
+ "low": "[-90. -90. -5. -5. -3.1415927 -5.\n -0. -0. ]",
71
+ "high": "[90. 90. 5. 5. 3.1415927 5.\n 1. 1. ]",
72
+ "low_repr": "[-90. -90. -5. -5. -3.1415927 -5.\n -0. -0. ]",
73
+ "high_repr": "[90. 90. 5. 5. 3.1415927 5.\n 1. 1. ]",
74
+ "_np_random": null
75
+ },
76
+ "action_space": {
77
+ ":type:": "<class 'gymnasium.spaces.box.Box'>",
78
+ ":serialized:": "gAWVVwIAAAAAAACMFGd5bW5hc2l1bS5zcGFjZXMuYm94lIwDQm94lJOUKYGUfZQojAVkdHlwZZSMBW51bXB5lIwFZHR5cGWUk5SMAmY0lImIh5RSlChLA4wBPJROTk5K/////0r/////SwB0lGKMDWJvdW5kZWRfYmVsb3eUjBJudW1weS5jb3JlLm51bWVyaWOUjAtfZnJvbWJ1ZmZlcpSTlCiWAgAAAAAAAAABAZRoCIwCYjGUiYiHlFKUKEsDjAF8lE5OTkr/////Sv////9LAHSUYksChZSMAUOUdJRSlIwNYm91bmRlZF9hYm92ZZRoESiWAgAAAAAAAAABAZRoFUsChZRoGXSUUpSMBl9zaGFwZZRLAoWUjANsb3eUaBEolggAAAAAAAAAAACAvwAAgL+UaAtLAoWUaBl0lFKUjARoaWdolGgRKJYIAAAAAAAAAAAAgD8AAIA/lGgLSwKFlGgZdJRSlIwIbG93X3JlcHKUjAQtMS4wlIwJaGlnaF9yZXBylIwDMS4wlIwKX25wX3JhbmRvbZSMFG51bXB5LnJhbmRvbS5fcGlja2xllIwQX19nZW5lcmF0b3JfY3RvcpSTlIwFUENHNjSUaDKMFF9fYml0X2dlbmVyYXRvcl9jdG9ylJOUhpRSlH2UKIwNYml0X2dlbmVyYXRvcpSMBVBDRzY0lIwFc3RhdGWUfZQoaD2KEH/TU1ElOl8LAFmK/9h4lGCMA2luY5SKEdtwj51LNCFdT4Kcw6fikLQAdYwKaGFzX3VpbnQzMpRLAIwIdWludGVnZXKUSwB1YnViLg==",
79
+ "dtype": "float32",
80
+ "bounded_below": "[ True True]",
81
+ "bounded_above": "[ True True]",
82
+ "_shape": [
83
+ 2
84
+ ],
85
+ "low": "[-1. -1.]",
86
+ "high": "[1. 1.]",
87
+ "low_repr": "-1.0",
88
+ "high_repr": "1.0",
89
+ "_np_random": "Generator(PCG64)"
90
+ },
91
+ "n_envs": 16,
92
+ "buffer_size": 1000000,
93
+ "batch_size": 256,
94
+ "learning_starts": 10000,
95
+ "tau": 0.01,
96
+ "gamma": 0.99,
97
+ "gradient_steps": 1,
98
+ "optimize_memory_usage": false,
99
+ "replay_buffer_class": {
100
+ ":type:": "<class 'abc.ABCMeta'>",
101
+ ":serialized:": "gAWVNQAAAAAAAACMIHN0YWJsZV9iYXNlbGluZXMzLmNvbW1vbi5idWZmZXJzlIwMUmVwbGF5QnVmZmVylJOULg==",
102
+ "__module__": "stable_baselines3.common.buffers",
103
+ "__doc__": "\n Replay buffer used in off-policy algorithms like SAC/TD3.\n\n :param buffer_size: Max number of element in the buffer\n :param observation_space: Observation space\n :param action_space: Action space\n :param device: PyTorch device\n :param n_envs: Number of parallel environments\n :param optimize_memory_usage: Enable a memory efficient variant\n of the replay buffer which reduces by almost a factor two the memory used,\n at a cost of more complexity.\n See https://github.com/DLR-RM/stable-baselines3/issues/37#issuecomment-637501195\n and https://github.com/DLR-RM/stable-baselines3/pull/28#issuecomment-637559274\n Cannot be used in combination with handle_timeout_termination.\n :param handle_timeout_termination: Handle timeout termination (due to timelimit)\n separately and treat the task as infinite horizon task.\n https://github.com/DLR-RM/stable-baselines3/issues/284\n ",
104
+ "__init__": "<function ReplayBuffer.__init__ at 0x7d227e693be0>",
105
+ "add": "<function ReplayBuffer.add at 0x7d227e693c70>",
106
+ "sample": "<function ReplayBuffer.sample at 0x7d227e693d00>",
107
+ "_get_samples": "<function ReplayBuffer._get_samples at 0x7d227e693d90>",
108
+ "__abstractmethods__": "frozenset()",
109
+ "_abc_impl": "<_abc._abc_data object at 0x7d227e69b000>"
110
+ },
111
+ "replay_buffer_kwargs": {},
112
+ "train_freq": {
113
+ ":type:": "<class 'stable_baselines3.common.type_aliases.TrainFreq'>",
114
+ ":serialized:": "gAWVYQAAAAAAAACMJXN0YWJsZV9iYXNlbGluZXMzLmNvbW1vbi50eXBlX2FsaWFzZXOUjAlUcmFpbkZyZXGUk5RLAWgAjBJUcmFpbkZyZXF1ZW5jeVVuaXSUk5SMBHN0ZXCUhZRSlIaUgZQu"
115
+ },
116
+ "use_sde_at_warmup": false,
117
+ "target_entropy": -2.0,
118
+ "ent_coef": "auto",
119
+ "target_update_interval": 1,
120
+ "lr_schedule": {
121
+ ":type:": "<class 'function'>",
122
+ ":serialized:": "gAWVeQIAAAAAAACMF2Nsb3VkcGlja2xlLmNsb3VkcGlja2xllIwOX21ha2VfZnVuY3Rpb26Uk5QoaACMDV9idWlsdGluX3R5cGWUk5SMCENvZGVUeXBllIWUUpQoSwFLAEsASwVLBEtDQzRkAX0BZAJ8ARQAfQJkA30DZAR9BHwAfAJrAHIYfAN8AHwCGwB8A3wEGAAUABgAUwB8BFMAlChOTZABS0tHP0frrxAjY7JHPzBiTdLxqfx0lCkojAF0lIwSYXZnX2VwaXNvZGVfbGVuZ3RolIwUdHJhbnNpdGlvbl90aW1lc3RlcHOUjBVpbml0aWFsX2xlYXJuaW5nX3JhdGWUjBNmaW5hbF9sZWFybmluZ19yYXRllHSUjB48aXB5dGhvbi1pbnB1dC02LTRlZTZjYWFkNDFlYz6UjBZsZWFybmluZ19yYXRlX3NjaGVkdWxllEsHQw4EAggBBAEEAQgCFAIEA5QpKXSUUpR9lCiMC19fcGFja2FnZV9flE6MCF9fbmFtZV9flIwIX19tYWluX1+UdU5OTnSUUpSMHGNsb3VkcGlja2xlLmNsb3VkcGlja2xlX2Zhc3SUjBJfZnVuY3Rpb25fc2V0c3RhdGWUk5RoGn2UfZQoaBdoEYwMX19xdWFsbmFtZV9flGgRjA9fX2Fubm90YXRpb25zX1+UfZSMDl9fa3dkZWZhdWx0c19flE6MDF9fZGVmYXVsdHNfX5ROjApfX21vZHVsZV9flGgYjAdfX2RvY19flE6MC19fY2xvc3VyZV9flE6MF19jbG91ZHBpY2tsZV9zdWJtb2R1bGVzlF2UjAtfX2dsb2JhbHNfX5R9lHWGlIZSMC4="
123
+ },
124
+ "batch_norm_stats": [],
125
+ "batch_norm_stats_target": []
126
+ }
SACdyn/ent_coef_optimizer.pth ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:88418a740778335ee13456699c5a69ddbf515bba2b75787e9e47e42fb5890e24
3
+ size 1940
SACdyn/policy.pth ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:fbbb9cf9adc21c628e4e835b5091cea047e3ba170cf7f59a4c2049cbebc09895
3
+ size 1389302
SACdyn/pytorch_variables.pth ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:629465712f7b4eb98c344e1a7d2af49baf65542c622db200f6d7d5aea2ed55f4
3
+ size 1180
SACdyn/system_info.txt ADDED
@@ -0,0 +1,9 @@
 
 
 
 
 
 
 
 
 
 
1
+ - OS: Linux-6.1.85+-x86_64-with-glibc2.35 # 1 SMP PREEMPT_DYNAMIC Sun Apr 28 14:29:16 UTC 2024
2
+ - Python: 3.10.12
3
+ - Stable-Baselines3: 2.0.0a5
4
+ - PyTorch: 2.3.0+cu121
5
+ - GPU Enabled: False
6
+ - Numpy: 1.25.2
7
+ - Cloudpickle: 2.2.1
8
+ - Gymnasium: 0.28.1
9
+ - OpenAI Gym: 0.25.2
config.json CHANGED
@@ -1 +1 @@
1
- {"policy_class": {":type:": "<class 'abc.ABCMeta'>", ":serialized:": "gAWVMAAAAAAAAACMHnN0YWJsZV9iYXNlbGluZXMzLnNhYy5wb2xpY2llc5SMCVNBQ1BvbGljeZSTlC4=", "__module__": "stable_baselines3.sac.policies", "__annotations__": "{'actor': <class 'stable_baselines3.sac.policies.Actor'>, 'critic': <class 'stable_baselines3.common.policies.ContinuousCritic'>, 'critic_target': <class 'stable_baselines3.common.policies.ContinuousCritic'>}", "__doc__": "\n Policy class (with both actor and critic) for SAC.\n\n :param observation_space: Observation space\n :param action_space: Action space\n :param lr_schedule: Learning rate schedule (could be constant)\n :param net_arch: The specification of the policy and value networks.\n :param activation_fn: Activation function\n :param use_sde: Whether to use State Dependent Exploration or not\n :param log_std_init: Initial value for the log standard deviation\n :param use_expln: Use ``expln()`` function instead of ``exp()`` when using gSDE to ensure\n a positive standard deviation (cf paper). It allows to keep variance\n above zero and prevent it from growing too fast. In practice, ``exp()`` is usually enough.\n :param clip_mean: Clip the mean output when using gSDE to avoid numerical instability.\n :param features_extractor_class: Features extractor to use.\n :param features_extractor_kwargs: Keyword arguments\n to pass to the features extractor.\n :param normalize_images: Whether to normalize images or not,\n dividing by 255.0 (True by default)\n :param optimizer_class: The optimizer to use,\n ``th.optim.Adam`` by default\n :param optimizer_kwargs: Additional keyword arguments,\n excluding the learning rate, to pass to the optimizer\n :param n_critics: Number of critic networks to create.\n :param share_features_extractor: Whether to share or not the features extractor\n between the actor and the critic (this saves computation time)\n ", "__init__": "<function SACPolicy.__init__ at 0x7dac02c1c5e0>", "_build": "<function SACPolicy._build at 0x7dac02c1c670>", "_get_constructor_parameters": "<function SACPolicy._get_constructor_parameters at 0x7dac02c1c700>", "reset_noise": "<function SACPolicy.reset_noise at 0x7dac02c1c790>", "make_actor": "<function SACPolicy.make_actor at 0x7dac02c1c820>", "make_critic": "<function SACPolicy.make_critic at 0x7dac02c1c8b0>", "forward": "<function SACPolicy.forward at 0x7dac02c1c940>", "_predict": "<function SACPolicy._predict at 0x7dac02c1c9d0>", "set_training_mode": "<function SACPolicy.set_training_mode at 0x7dac02c1ca60>", "__abstractmethods__": "frozenset()", "_abc_impl": "<_abc._abc_data object at 0x7dac02c14d00>"}, "verbose": 1, "policy_kwargs": {"use_sde": false}, "num_timesteps": 500000, "_total_timesteps": 500000, "_num_timesteps_at_start": 0, "seed": null, "action_noise": null, "start_time": 1716470270197926850, "learning_rate": {":type:": "<class 'function'>", ":serialized:": "gAWV/gEAAAAAAACMF2Nsb3VkcGlja2xlLmNsb3VkcGlja2xllIwOX21ha2VfZnVuY3Rpb26Uk5QoaACMDV9idWlsdGluX3R5cGWUk5SMCENvZGVUeXBllIWUUpQoSwFLAEsASwFLAktDQwh0AHwAFABTAJROhZSMFWluaXRpYWxfbGVhcm5pbmdfcmF0ZZSFlIwScHJvZ3Jlc3NfcmVtYWluaW5nlIWUjB88aXB5dGhvbi1pbnB1dC0zMi0wMWZiZTIxOTZlZGE+lIwPbGluZWFyX3NjaGVkdWxllEsIQwIIAZQpKXSUUpR9lCiMC19fcGFja2FnZV9flE6MCF9fbmFtZV9flIwIX19tYWluX1+UdU5OTnSUUpSMHGNsb3VkcGlja2xlLmNsb3VkcGlja2xlX2Zhc3SUjBJfZnVuY3Rpb25fc2V0c3RhdGWUk5RoGH2UfZQoaBVoD4wMX19xdWFsbmFtZV9flGgPjA9fX2Fubm90YXRpb25zX1+UfZSMDl9fa3dkZWZhdWx0c19flE6MDF9fZGVmYXVsdHNfX5ROjApfX21vZHVsZV9flGgWjAdfX2RvY19flE6MC19fY2xvc3VyZV9flE6MF19jbG91ZHBpY2tsZV9zdWJtb2R1bGVzlF2UjAtfX2dsb2JhbHNfX5R9lGgKRz9H668QI2Oyc3WGlIZSMC4="}, "tensorboard_log": null, "_last_obs": {":type:": "<class 'numpy.ndarray'>", ":serialized:": "gAWVdQIAAAAAAACMEm51bXB5LmNvcmUubnVtZXJpY5SMC19mcm9tYnVmZmVylJOUKJYAAgAAAAAAAM0m1byRX2g+pq9QPM6Abb1xsmC98p98PQAAAAAAAAAAWuhCPuw70DqutZO87c71O4fsrzxazOi8AACAPwAAgD8zqhI+KQkRvDWwHzuQ5Yq53EuIvWTxiroAAIA/AACAP/riJz70Eoe8Mv4vOu05nLh5ley9dYpzuQAAgD8AAIA/ZvcWPnY9E7ws3K26orydONI2fL0YCt85AACAPwAAgD9mRzU9tkufP/nCgj7TKSO/Et4NPSUu/bsAAAAAAAAAAIBLW77csSQ/Rp82Pj661r5sLzG8MoKWPQAAAAAAAAAAgOMEPY/uFboMKBO6+0WoNZhVr7q+gys5AACAPwAAgD9A8OQ9+IuTPFtAJ71c/iS9+c0CvXS+I7wAAAAAAAAAAFrfGj6lQ3E+6nb/vEaolb29wke9qWeaPQAAAAAAAAAAGu8iPlanfD1zbh28Z9ZCvQZ/qLv2pEE8AAAAAAAAAABaOa09yV05P+53JD55Ni+/LA1wvHqXwTwAAAAAAAAAAJM3Fj522yC8AH3huvco2Dhw0Iq9bzoTOgAAgD8AAIA/sJ64Poi0aT9PazS+Gxn5vrdBBT5Kjxq9AAAAAAAAAAAzJwq8H0qtuxaMAb1FbPm6LpEAPaUB1DsAAIA/AACAPwZjYD7qbWo/gRC5PpTFvr7zRSw+USKuPQAAAAAAAAAAlIwFbnVtcHmUjAVkdHlwZZSTlIwCZjSUiYiHlFKUKEsDjAE8lE5OTkr/////Sv////9LAHSUYksQSwiGlIwBQ5R0lFKULg=="}, "_last_episode_starts": {":type:": "<class 'numpy.ndarray'>", ":serialized:": "gAWVgwAAAAAAAACMEm51bXB5LmNvcmUubnVtZXJpY5SMC19mcm9tYnVmZmVylJOUKJYQAAAAAAAAAAEBAQEBAQEBAQEBAQEBAQGUjAVudW1weZSMBWR0eXBllJOUjAJiMZSJiIeUUpQoSwOMAXyUTk5OSv////9K/////0sAdJRiSxCFlIwBQ5R0lFKULg=="}, "_last_original_obs": {":type:": "<class 'numpy.ndarray'>", ":serialized:": "gAWVdQIAAAAAAACMEm51bXB5LmNvcmUubnVtZXJpY5SMC19mcm9tYnVmZmVylJOUKJYAAgAAAAAAAGZz1rxCtmk+EBhfPFvgWr0LVG29H+GDPQAAAAAAAAAAZhtDPoUrujriC5m8nyX7PFuQuzwas+G9AACAPwAAgD/toxI+Q/AQvO+nAbqLkdI3EzCIvWHKMTkAAIA/AACAP0DhJz6BD4e8fMC2uc/xTzhBj+y9VrYBOQAAgD8AAIA/0/oWPlxEE7wgWFM6NWH/t6ZNfL1SxoW5AACAPwAAgD+A1So9oiGhP8TCgj4SVhy/InMPPQP7/LsAAAAAAAAAAMMoXb5SHCc/x0Q8PoYRyb6MY228XpFSPQAAAAAAAAAATekEPY/uFbo4qtQ6qzrDNC1wsLr7H/i5AACAPwAAgD8AyeU9LPiaPEdAPL2erFq8/8EAvY6TLTwAAAAAAAAAABonGz5s83I+P/Unvb3OPb2DM1e9COjqPQAAAAAAAAAAugYjPtuEgD1+sS281mgVvVbcu7u47DM8AAAAAAAAAADz6Kk9CE89P/HcIj5+6ze/grSBvH2HwDwAAAAAAAAAAPM7Fj4P5SC8AifzudpVFjiB34q9Y/4gOQAAgD8AAIA/HYi5Pi6CbD8q0Su+9XT4vk4wBz4eaA29AAAAAAAAAAAzBwW80uSru1IYQL1Pt7u8Jnr+PN4LoD0AAIA/AACAP2CkXD6kkmw/UILGPnk/ur5+6yc+rZCKPQAAAAAAAAAAlIwFbnVtcHmUjAVkdHlwZZSTlIwCZjSUiYiHlFKUKEsDjAE8lE5OTkr/////Sv////9LAHSUYksQSwiGlIwBQ5R0lFKULg=="}, "_episode_num": 926, "use_sde": false, "sde_sample_freq": -1, "_current_progress_remaining": 0.0, "_stats_window_size": 100, "ep_info_buffer": {":type:": "<class 'collections.deque'>", ":serialized:": "gAWVRAwAAAAAAACMC2NvbGxlY3Rpb25zlIwFZGVxdWWUk5QpS2SGlFKUKH2UKIwBcpRHQHAgH8KohpyMAWyUTRIBjAF0lEdAk0/OpS75EnV9lChoBkdAbYrwVCXyAmgHTZcBaAhHQJNaNccENfB1fZQoaAZHQG7fazNUwSJoB03nAWgIR0CTW4T238XOdX2UKGgGR0BuzSRhc7hfaAdNNAFoCEdAk14emJm/WXV9lChoBkdAbYmqioKlYWgHTUQCaAhHQJNefU2DQJJ1fZQoaAZHQGqUoXCTEBNoB00IAmgIR0CTXrYrJ8v3dX2UKGgGR0BwTJe2NNrTaAdN3gFoCEdAk1/hsl9jPXV9lChoBkdAcM5Ge+VTrGgHTbQBaAhHQJNleCuloDh1fZQoaAZHQGv1Mfq5byJoB03KAWgIR0CTbAm/336AdX2UKGgGR0BqapuAI6bOaAdNqwFoCEdAk2yHDm8ujHV9lChoBkdAa8yg1WKdhGgHTXkBaAhHQJN5b5YYBNp1fZQoaAZHQGyksMZxaPloB01sAWgIR0CTfVj5bhWHdX2UKGgGR0BvRGhkAggYaAdNvQFoCEdAk37EL2HtW3V9lChoBkdAa49/Q0GeMGgHTZkBaAhHQJN+4eii7Cl1fZQoaAZHQG3nmfwqiGpoB01tAWgIR0CTgDzWf9P2dX2UKGgGR0BpkkNc4YJmaAdNnAFoCEdAk4GsHSnccnV9lChoBkdAatoTtb9qDmgHTU0BaAhHQJOHLJbMX8B1fZQoaAZHQG6MG2TgVGloB003AWgIR0CTiNMg2ZRbdX2UKGgGR0Bt5/xpcophaAdNDgJoCEdAk5CMa86FNHV9lChoBkdAb3bkhA4XGmgHTbQBaAhHQJORzl5nlGR1fZQoaAZHQG1en2h7E51oB01tAWgIR0CTmfZ3s5XEdX2UKGgGR0BuJUYdhiLEaAdNAAJoCEdAk6DLBTGYKXV9lChoBkdAZe9a9sabWmgHTdgBaAhHQJOkRH09QoF1fZQoaAZHQG6QmlqJuVJoB02/AWgIR0CTqEnBLwnZdX2UKGgGR0BtL88vEjxDaAdNrwFoCEdAk7rF0gbIcXV9lChoBkdAbQ+XNTtLMGgHTX0BaAhHQJO/BAu7HyV1fZQoaAZHQG8gj0UXYUZoB02zAWgIR0CTv4qLjxTbdX2UKGgGR0Br7Up7TlT4aAdNyAFoCEdAk8DKJdjXnXV9lChoBkdAa2TzDn/1hGgHTVoBaAhHQJPF9uHerMl1fZQoaAZHQHDVRKL876poB02oAWgIR0CTx3g5BC2MdX2UKGgGR0BsZZradtl7aAdNRgFoCEdAk9cxwqAjIXV9lChoBkdAcBr9/z8P4GgHTcQBaAhHQJPjjU8V58l1fZQoaAZHQGsChrWRRuVoB03QAmgIR0CT546O5rgwdX2UKGgGR0BsGw371qWUaAdNvANoCEdAk+kKzE74jHV9lChoBkdAbpfaWX1J2GgHTbgBaAhHQJPpN/6O5rh1fZQoaAZHQFyQWOp84PxoB03oA2gIR0CT73FPSDywdX2UKGgGR0BnmmgDifg8aAdNYgJoCEdAk/EmQwK0D3V9lChoBkdAbzgvVVghKWgHTeQBaAhHQJP0qJSBK+V1fZQoaAZHQG8SnO0LMLZoB02MAWgIR0CT964t6HCXdX2UKGgGR0BuFfvx6OYIaAdNpAFoCEdAk/51lbu+iHV9lChoBkdAb5/OymhufmgHTcABaAhHQJQB+cNH6M11fZQoaAZHQGmBzEJjUd9oB03AA2gIR0CUA/LeANG3dX2UKGgGR0BsXt8VpKzzaAdNlgFoCEdAlAQ9apxWDHV9lChoBkdAb5H4rSVnmWgHTcUBaAhHQJQEP+jua4N1fZQoaAZHQF8CrrgOz6doB03oA2gIR0CUDhPN3W4FdX2UKGgGR0BriUGNaQmvaAdNUAFoCEdAlBfinDR+jXV9lChoBkdAbo2cxTKkmGgHTVMBaAhHQJQYSDYh+v11fZQoaAZHQG4sizsyBTZoB027AWgIR0CUGhblA/s3dX2UKGgGR0BqvpZKWcBmaAdNrgFoCEdAlCSFtGd7OXV9lChoBkdAa3KSxJNCaGgHTZcBaAhHQJQrQ5YHPeJ1fZQoaAZHQG1CYrSVnmJoB03aAWgIR0CUM5piZv1ldX2UKGgGR0BtF5wQ176YaAdNtQFoCEdAlDPNAPd2xXV9lChoBkdAbm4+X7cfvGgHTeQCaAhHQJQ0FQuVX3h1fZQoaAZHQG4cRKQJXyRoB01hAWgIR0CUNewFC9h7dX2UKGgGR0Bs7+uaF23baAdNdgFoCEdAlDpmvbGm13V9lChoBkdAb9LOnEVFhGgHTagBaAhHQJQ7t6Vt4zJ1fZQoaAZHQGwgERSP2f1oB02ZAWgIR0CUPr7BfrrxdX2UKGgGR0BqLUhkiD/VaAdNDwJoCEdAlEGYtcv/R3V9lChoBkdAa7KHJtBOYmgHTZIBaAhHQJRG9Fx4ptt1fZQoaAZHQG3yDziCJ41oB033AWgIR0CUSrJ53TuwdX2UKGgGR0Bsd7NliBoVaAdNLAFoCEdAlE1T63y7PXV9lChoBkdAamzDMvAXVWgHTXUBaAhHQJRNyJJoTPB1fZQoaAZHQG6NyQgcLjRoB00QA2gIR0CUUmoL5RCQdX2UKGgGR0BwUh5zHS4OaAdNvAFoCEdAlFcTDTBqK3V9lChoBkdAaBc7lJYkmmgHTdYBaAhHQJRZljgAIY51fZQoaAZHQGqwXeN1hb5oB01QAWgIR0CUXy/Tb349dX2UKGgGR0BtOxvFWGRFaAdNhwFoCEdAlGhXw1BMSXV9lChoBkdAboN8baRISWgHTdsBaAhHQJRp5zOoo/l1fZQoaAZHQGoPAQHzH0doB02lAWgIR0CUag3ztkWidX2UKGgGR0BwriY1He7+aAdNzgFoCEdAlG+Js0pEyHV9lChoBkdAbpRgYxcmjWgHTaQBaAhHQJRwcunMt9R1fZQoaAZHQG1He1a4c3loB02BAWgIR0CUcKqmCROldX2UKGgGR0Bs7r7j1f3OaAdNuQFoCEdAlHQ/phWo33V9lChoBkdAavi6r/82rGgHTZMBaAhHQJR+bPhQ3xZ1fZQoaAZHQGzikUKzAvdoB03mAWgIR0CUgPCcwxnGdX2UKGgGR0BpPVgBtDUmaAdNvAFoCEdAlIHIzi0fHXV9lChoBkdAbbi6Oo5xR2gHTaABaAhHQJSDub3Gn4x1fZQoaAZHQGyxKMNtqHpoB02bAWgIR0CUjVsP8Q7LdX2UKGgGR0Burh4yGi5/aAdN9gFoCEdAlJGqy8jAz3V9lChoBkdAbavxusLfDWgHTboBaAhHQJScnbfxc3V1fZQoaAZHQGk7NMoMKCxoB02oAWgIR0CUpplIEr5JdX2UKGgGR0BuVg+lj3EiaAdNSQJoCEdAlKrQqur6tXV9lChoBkdAb5fprULDymgHTdEBaAhHQJStGLZSNwR1fZQoaAZHQG5u3Onl4khoB02lAWgIR0CUrhvlU6xPdX2UKGgGR0Buc7D2rXDnaAdNMAFoCEdAlLAnHJcPfHV9lChoBkdAba6GQCCBgGgHTasBaAhHQJSy7/ACW/t1fZQoaAZHQG6RoegctGxoB03RAWgIR0CUs+fUWl/IdX2UKGgGR0Btty0F8ohIaAdNywJoCEdAlLS3eBQN1HV9lChoBkdAbcg5dWyTp2gHTf0BaAhHQJS3zRtxdY51fZQoaAZHQG3y/uCwr2BoB03BAWgIR0CUwOEoOQQudX2UKGgGR0Bt24WLxZuAaAdNggFoCEdAlMTmkzoECHV9lChoBkdAb36VC5VfeGgHTc4BaAhHQJTFcBGQSzx1fZQoaAZHQGu9rtE5QxhoB01QAWgIR0CUzIAuqWC3dX2UKGgGR0BvnfbGm1pkaAdNbQJoCEdAlNyxrWRRuXV9lChoBkdAa9y54GD+SGgHTVkDaAhHQJTg44p+c6N1fZQoaAZHQG2j6eXiR4hoB02NAWgIR0CU4WDGcWj5dX2UKGgGR0BtTRVIZqEfaAdNrgFoCEdAlOI7xVhkRXV9lChoBkdAa7XVZs9B8mgHTb4BaAhHQJTuR6Ww/xF1fZQoaAZHQG42e5vtMPBoB03TAWgIR0CU7ynM+u/2dX2UKGgGR0BuHw1m8M/haAdNQgFoCEdAlPOeRkmQbXVlLg=="}, "ep_success_buffer": {":type:": "<class 'collections.deque'>", ":serialized:": "gAWVIAAAAAAAAACMC2NvbGxlY3Rpb25zlIwFZGVxdWWUk5QpS2SGlFKULg=="}, "_n_updates": 30625, "observation_space": {":type:": "<class 'gymnasium.spaces.box.Box'>", ":serialized:": "gAWVdgIAAAAAAACMFGd5bW5hc2l1bS5zcGFjZXMuYm94lIwDQm94lJOUKYGUfZQojAVkdHlwZZSMBW51bXB5lIwFZHR5cGWUk5SMAmY0lImIh5RSlChLA4wBPJROTk5K/////0r/////SwB0lGKMDWJvdW5kZWRfYmVsb3eUjBJudW1weS5jb3JlLm51bWVyaWOUjAtfZnJvbWJ1ZmZlcpSTlCiWCAAAAAAAAAABAQEBAQEBAZRoCIwCYjGUiYiHlFKUKEsDjAF8lE5OTkr/////Sv////9LAHSUYksIhZSMAUOUdJRSlIwNYm91bmRlZF9hYm92ZZRoESiWCAAAAAAAAAABAQEBAQEBAZRoFUsIhZRoGXSUUpSMBl9zaGFwZZRLCIWUjANsb3eUaBEoliAAAAAAAAAAAAC0wgAAtMIAAKDAAACgwNsPScAAAKDAAAAAgAAAAICUaAtLCIWUaBl0lFKUjARoaWdolGgRKJYgAAAAAAAAAAAAtEIAALRCAACgQAAAoEDbD0lAAACgQAAAgD8AAIA/lGgLSwiFlGgZdJRSlIwIbG93X3JlcHKUjFtbLTkwLiAgICAgICAgLTkwLiAgICAgICAgIC01LiAgICAgICAgIC01LiAgICAgICAgIC0zLjE0MTU5MjcgIC01LgogIC0wLiAgICAgICAgIC0wLiAgICAgICBdlIwJaGlnaF9yZXBylIxTWzkwLiAgICAgICAgOTAuICAgICAgICAgNS4gICAgICAgICA1LiAgICAgICAgIDMuMTQxNTkyNyAgNS4KICAxLiAgICAgICAgIDEuICAgICAgIF2UjApfbnBfcmFuZG9tlE51Yi4=", "dtype": "float32", "bounded_below": "[ True True True True True True True True]", "bounded_above": "[ True True True True True True True True]", "_shape": [8], "low": "[-90. -90. -5. -5. -3.1415927 -5.\n -0. -0. ]", "high": "[90. 90. 5. 5. 3.1415927 5.\n 1. 1. ]", "low_repr": "[-90. -90. -5. -5. -3.1415927 -5.\n -0. -0. ]", "high_repr": "[90. 90. 5. 5. 3.1415927 5.\n 1. 1. ]", "_np_random": null}, "action_space": {":type:": "<class 'gymnasium.spaces.box.Box'>", ":serialized:": "gAWVVwIAAAAAAACMFGd5bW5hc2l1bS5zcGFjZXMuYm94lIwDQm94lJOUKYGUfZQojAVkdHlwZZSMBW51bXB5lIwFZHR5cGWUk5SMAmY0lImIh5RSlChLA4wBPJROTk5K/////0r/////SwB0lGKMDWJvdW5kZWRfYmVsb3eUjBJudW1weS5jb3JlLm51bWVyaWOUjAtfZnJvbWJ1ZmZlcpSTlCiWAgAAAAAAAAABAZRoCIwCYjGUiYiHlFKUKEsDjAF8lE5OTkr/////Sv////9LAHSUYksChZSMAUOUdJRSlIwNYm91bmRlZF9hYm92ZZRoESiWAgAAAAAAAAABAZRoFUsChZRoGXSUUpSMBl9zaGFwZZRLAoWUjANsb3eUaBEolggAAAAAAAAAAACAvwAAgL+UaAtLAoWUaBl0lFKUjARoaWdolGgRKJYIAAAAAAAAAAAAgD8AAIA/lGgLSwKFlGgZdJRSlIwIbG93X3JlcHKUjAQtMS4wlIwJaGlnaF9yZXBylIwDMS4wlIwKX25wX3JhbmRvbZSMFG51bXB5LnJhbmRvbS5fcGlja2xllIwQX19nZW5lcmF0b3JfY3RvcpSTlIwFUENHNjSUaDKMFF9fYml0X2dlbmVyYXRvcl9jdG9ylJOUhpRSlH2UKIwNYml0X2dlbmVyYXRvcpSMBVBDRzY0lIwFc3RhdGWUfZQoaD2KEVr7DZw2+r84qMY0Hw9YBuMAjANpbmOUihAFPvXog3v6hHmU/x6XftImdYwKaGFzX3VpbnQzMpRLAIwIdWludGVnZXKUSwB1YnViLg==", "dtype": "float32", "bounded_below": "[ True True]", "bounded_above": "[ True True]", "_shape": [2], "low": "[-1. -1.]", "high": "[1. 1.]", "low_repr": "-1.0", "high_repr": "1.0", "_np_random": "Generator(PCG64)"}, "n_envs": 16, "buffer_size": 1000000, "batch_size": 256, "learning_starts": 10000, "tau": 0.01, "gamma": 0.99, "gradient_steps": 1, "optimize_memory_usage": false, "replay_buffer_class": {":type:": "<class 'abc.ABCMeta'>", ":serialized:": "gAWVNQAAAAAAAACMIHN0YWJsZV9iYXNlbGluZXMzLmNvbW1vbi5idWZmZXJzlIwMUmVwbGF5QnVmZmVylJOULg==", "__module__": "stable_baselines3.common.buffers", "__doc__": "\n Replay buffer used in off-policy algorithms like SAC/TD3.\n\n :param buffer_size: Max number of element in the buffer\n :param observation_space: Observation space\n :param action_space: Action space\n :param device: PyTorch device\n :param n_envs: Number of parallel environments\n :param optimize_memory_usage: Enable a memory efficient variant\n of the replay buffer which reduces by almost a factor two the memory used,\n at a cost of more complexity.\n See https://github.com/DLR-RM/stable-baselines3/issues/37#issuecomment-637501195\n and https://github.com/DLR-RM/stable-baselines3/pull/28#issuecomment-637559274\n Cannot be used in combination with handle_timeout_termination.\n :param handle_timeout_termination: Handle timeout termination (due to timelimit)\n separately and treat the task as infinite horizon task.\n https://github.com/DLR-RM/stable-baselines3/issues/284\n ", "__init__": "<function ReplayBuffer.__init__ at 0x7dac02bd7490>", "add": "<function ReplayBuffer.add at 0x7dac02bd7520>", "sample": "<function ReplayBuffer.sample at 0x7dac02bd75b0>", "_get_samples": "<function ReplayBuffer._get_samples at 0x7dac02bd7640>", "__abstractmethods__": "frozenset()", "_abc_impl": "<_abc._abc_data object at 0x7dac02be2400>"}, "replay_buffer_kwargs": {}, "train_freq": {":type:": "<class 'stable_baselines3.common.type_aliases.TrainFreq'>", ":serialized:": "gAWVYQAAAAAAAACMJXN0YWJsZV9iYXNlbGluZXMzLmNvbW1vbi50eXBlX2FsaWFzZXOUjAlUcmFpbkZyZXGUk5RLAWgAjBJUcmFpbkZyZXF1ZW5jeVVuaXSUk5SMBHN0ZXCUhZRSlIaUgZQu"}, "use_sde_at_warmup": false, "target_entropy": -2.0, "ent_coef": "auto", "target_update_interval": 1, "lr_schedule": {":type:": "<class 'function'>", ":serialized:": "gAWV/gEAAAAAAACMF2Nsb3VkcGlja2xlLmNsb3VkcGlja2xllIwOX21ha2VfZnVuY3Rpb26Uk5QoaACMDV9idWlsdGluX3R5cGWUk5SMCENvZGVUeXBllIWUUpQoSwFLAEsASwFLAktDQwh0AHwAFABTAJROhZSMFWluaXRpYWxfbGVhcm5pbmdfcmF0ZZSFlIwScHJvZ3Jlc3NfcmVtYWluaW5nlIWUjB88aXB5dGhvbi1pbnB1dC0zMi0wMWZiZTIxOTZlZGE+lIwPbGluZWFyX3NjaGVkdWxllEsIQwIIAZQpKXSUUpR9lCiMC19fcGFja2FnZV9flE6MCF9fbmFtZV9flIwIX19tYWluX1+UdU5OTnSUUpSMHGNsb3VkcGlja2xlLmNsb3VkcGlja2xlX2Zhc3SUjBJfZnVuY3Rpb25fc2V0c3RhdGWUk5RoGH2UfZQoaBVoD4wMX19xdWFsbmFtZV9flGgPjA9fX2Fubm90YXRpb25zX1+UfZSMDl9fa3dkZWZhdWx0c19flE6MDF9fZGVmYXVsdHNfX5ROjApfX21vZHVsZV9flGgWjAdfX2RvY19flE6MC19fY2xvc3VyZV9flE6MF19jbG91ZHBpY2tsZV9zdWJtb2R1bGVzlF2UjAtfX2dsb2JhbHNfX5R9lGgKRz9H668QI2Oyc3WGlIZSMC4="}, "batch_norm_stats": [], "batch_norm_stats_target": [], "system_info": {"OS": "Linux-6.1.85+-x86_64-with-glibc2.35 # 1 SMP PREEMPT_DYNAMIC Sun Apr 28 14:29:16 UTC 2024", "Python": "3.10.12", "Stable-Baselines3": "2.0.0a5", "PyTorch": "2.3.0+cu121", "GPU Enabled": "True", "Numpy": "1.25.2", "Cloudpickle": "2.2.1", "Gymnasium": "0.28.1", "OpenAI Gym": "0.25.2"}}
 
1
+ {"policy_class": {":type:": "<class 'abc.ABCMeta'>", ":serialized:": "gAWVMAAAAAAAAACMHnN0YWJsZV9iYXNlbGluZXMzLnNhYy5wb2xpY2llc5SMCVNBQ1BvbGljeZSTlC4=", "__module__": "stable_baselines3.sac.policies", "__annotations__": "{'actor': <class 'stable_baselines3.sac.policies.Actor'>, 'critic': <class 'stable_baselines3.common.policies.ContinuousCritic'>, 'critic_target': <class 'stable_baselines3.common.policies.ContinuousCritic'>}", "__doc__": "\n Policy class (with both actor and critic) for SAC.\n\n :param observation_space: Observation space\n :param action_space: Action space\n :param lr_schedule: Learning rate schedule (could be constant)\n :param net_arch: The specification of the policy and value networks.\n :param activation_fn: Activation function\n :param use_sde: Whether to use State Dependent Exploration or not\n :param log_std_init: Initial value for the log standard deviation\n :param use_expln: Use ``expln()`` function instead of ``exp()`` when using gSDE to ensure\n a positive standard deviation (cf paper). It allows to keep variance\n above zero and prevent it from growing too fast. In practice, ``exp()`` is usually enough.\n :param clip_mean: Clip the mean output when using gSDE to avoid numerical instability.\n :param features_extractor_class: Features extractor to use.\n :param features_extractor_kwargs: Keyword arguments\n to pass to the features extractor.\n :param normalize_images: Whether to normalize images or not,\n dividing by 255.0 (True by default)\n :param optimizer_class: The optimizer to use,\n ``th.optim.Adam`` by default\n :param optimizer_kwargs: Additional keyword arguments,\n excluding the learning rate, to pass to the optimizer\n :param n_critics: Number of critic networks to create.\n :param share_features_extractor: Whether to share or not the features extractor\n between the actor and the critic (this saves computation time)\n ", "__init__": "<function SACPolicy.__init__ at 0x7d227e6ccd30>", "_build": "<function SACPolicy._build at 0x7d227e6ccdc0>", "_get_constructor_parameters": "<function SACPolicy._get_constructor_parameters at 0x7d227e6cce50>", "reset_noise": "<function SACPolicy.reset_noise at 0x7d227e6ccee0>", "make_actor": "<function SACPolicy.make_actor at 0x7d227e6ccf70>", "make_critic": "<function SACPolicy.make_critic at 0x7d227e6cd000>", "forward": "<function SACPolicy.forward at 0x7d227e6cd090>", "_predict": "<function SACPolicy._predict at 0x7d227e6cd120>", "set_training_mode": "<function SACPolicy.set_training_mode at 0x7d227e6cd1b0>", "__abstractmethods__": "frozenset()", "_abc_impl": "<_abc._abc_data object at 0x7d227e6bbec0>"}, "verbose": 1, "policy_kwargs": {"use_sde": false}, "num_timesteps": 500000, "_total_timesteps": 500000, "_num_timesteps_at_start": 0, "seed": null, "action_noise": null, "start_time": 1716478454985334697, "learning_rate": {":type:": "<class 'function'>", ":serialized:": "gAWVeQIAAAAAAACMF2Nsb3VkcGlja2xlLmNsb3VkcGlja2xllIwOX21ha2VfZnVuY3Rpb26Uk5QoaACMDV9idWlsdGluX3R5cGWUk5SMCENvZGVUeXBllIWUUpQoSwFLAEsASwVLBEtDQzRkAX0BZAJ8ARQAfQJkA30DZAR9BHwAfAJrAHIYfAN8AHwCGwB8A3wEGAAUABgAUwB8BFMAlChOTZABS0tHP0frrxAjY7JHPzBiTdLxqfx0lCkojAF0lIwSYXZnX2VwaXNvZGVfbGVuZ3RolIwUdHJhbnNpdGlvbl90aW1lc3RlcHOUjBVpbml0aWFsX2xlYXJuaW5nX3JhdGWUjBNmaW5hbF9sZWFybmluZ19yYXRllHSUjB48aXB5dGhvbi1pbnB1dC02LTRlZTZjYWFkNDFlYz6UjBZsZWFybmluZ19yYXRlX3NjaGVkdWxllEsHQw4EAggBBAEEAQgCFAIEA5QpKXSUUpR9lCiMC19fcGFja2FnZV9flE6MCF9fbmFtZV9flIwIX19tYWluX1+UdU5OTnSUUpSMHGNsb3VkcGlja2xlLmNsb3VkcGlja2xlX2Zhc3SUjBJfZnVuY3Rpb25fc2V0c3RhdGWUk5RoGn2UfZQoaBdoEYwMX19xdWFsbmFtZV9flGgRjA9fX2Fubm90YXRpb25zX1+UfZSMDl9fa3dkZWZhdWx0c19flE6MDF9fZGVmYXVsdHNfX5ROjApfX21vZHVsZV9flGgYjAdfX2RvY19flE6MC19fY2xvc3VyZV9flE6MF19jbG91ZHBpY2tsZV9zdWJtb2R1bGVzlF2UjAtfX2dsb2JhbHNfX5R9lHWGlIZSMC4="}, "tensorboard_log": null, "_last_obs": {":type:": "<class 'numpy.ndarray'>", ":serialized:": "gAWVdQIAAAAAAACMEm51bXB5LmNvcmUubnVtZXJpY5SMC19mcm9tYnVmZmVylJOUKJYAAgAAAAAAABqZYL1DCJk+SqMKvtWUxbzvME+9xdffPAAAAAAAAAAAMxtYvE9eUz7DPtk9l7jlvLNMijxCdhS8AAAAAAAAAACGRys+K4awPZgl1z0/vfc76HQTPQZjHD0AAAAAAAAAAABHjDxLNIc/a1aKPbcy8L6SpiI8FY5MPQAAAAAAAAAA+iI8vlaIkj+qCdm+u194vtHzWr57yBK+AAAAAAAAAAAzI3Q8xieiPyr79D3J3wy/tqiOOp7UGLsAAAAAAAAAAECG2D1k1849ShcqvSAIDj1k6hK8QAFqvQAAAAAAAAAATTyKPs47rT1mpe08H6psPPJ0pTyNnRu8AAAAAAAAAADzUkE+IdeJPeoHK70Uy+88GP8MvPPclb0AAAAAAAAAALq6kT4EHcI9hY5TPWksMzxfQiQ9zW7OPAAAAAAAAAAAzTIiPQHIzT0Nnpi8PfwePKrL2rzOWZK6AAAAAAAAAAAmRz4+LVmhP8H5iD4pN+e9VNk0PgB51bwAAAAAAAAAAHOruD5GiqM/hQ+VPS+YiL7qzEc+tSWvvQAAAAAAAAAATbqxPXt7oT0cLYC8truhPK6kPrvaAvm7AAAAAAAAAADmFSU+gUq2PaUxgD0R7Ms88jOtPJMhg7wAAAAAAAAAAMh4h75twJY/4gypvk5dlrzf26a+kye6vQAAAAAAAAAAlIwFbnVtcHmUjAVkdHlwZZSTlIwCZjSUiYiHlFKUKEsDjAE8lE5OTkr/////Sv////9LAHSUYksQSwiGlIwBQ5R0lFKULg=="}, "_last_episode_starts": {":type:": "<class 'numpy.ndarray'>", ":serialized:": "gAWVgwAAAAAAAACMEm51bXB5LmNvcmUubnVtZXJpY5SMC19mcm9tYnVmZmVylJOUKJYQAAAAAAAAAAEBAQEBAQEBAQEBAQEBAQGUjAVudW1weZSMBWR0eXBllJOUjAJiMZSJiIeUUpQoSwOMAXyUTk5OSv////9K/////0sAdJRiSxCFlIwBQ5R0lFKULg=="}, "_last_original_obs": {":type:": "<class 'numpy.ndarray'>", ":serialized:": "gAWVdQIAAAAAAACMEm51bXB5LmNvcmUubnVtZXJpY5SMC19mcm9tYnVmZmVylJOUKJYAAgAAAAAAAOYbW72IT5k+oDD2vc6mIb2IyVS9dU/eOgAAAAAAAAAAM2lpvLkDVD7qruQ9o13AvN4CjjzyhIm7AAAAAAAAAAATLyo+eCywPar7yT1soFa8J6MLPX2S8jwAAAAAAAAAADOJhjwsjog/6KNpPT3X876wevM7R0chPQAAAAAAAAAAJrk3vmw6kz+gMNq+pJJ4vv6cU76/vwy+AAAAAAAAAADNjmA8fr2jP1hd5T3M0hG/+PCdOrJV3DwAAAAAAAAAACZv2T0oPs09m8znvO3thbugOsi7egkzvQAAAAAAAAAA6haKPnuRrD1xHsE8r9q1O9xYqTyuzIG8AAAAAAAAAAAaykE+pH2IPdPf9LzzEeo7QBqiu9EIt70AAAAAAAAAAFp1kT6km8E9hqNNPUp+ZDw1GR89WvO3PAAAAAAAAAAAzfYiPYRVzT0qYpa8dU1HuplW2rzB7hg6AAAAAAAAAAA6jTs+iKyhP4a9iz6V39m94y42Pi6VDTwAAAAAAAAAAJ1RuD5kT6Q/PsmCPSk5d77bLUw+H8ZGvQAAAAAAAAAAWg6yPZGSoD32hwO8C2NrvNm9JbvTk5M2AAAAAAAAAADtcyQ+/iS1PUTcjj3UjoU8bMKzPLzdJrwAAAAAAAAAAErChb4+zZY/xwypvm00CDwtiKS+qie6vQAAAAAAAAAAlIwFbnVtcHmUjAVkdHlwZZSTlIwCZjSUiYiHlFKUKEsDjAE8lE5OTkr/////Sv////9LAHSUYksQSwiGlIwBQ5R0lFKULg=="}, "_episode_num": 685, "use_sde": false, "sde_sample_freq": -1, "_current_progress_remaining": 0.0, "_stats_window_size": 100, "ep_info_buffer": {":type:": "<class 'collections.deque'>", ":serialized:": "gAWVRAwAAAAAAACMC2NvbGxlY3Rpb25zlIwFZGVxdWWUk5QpS2SGlFKUKH2UKIwBcpRHQGt67blA/s6MAWyUTTgDjAF0lEdApjJXc32mHnV9lChoBkfAHiXQ+lj3EmgHTegDaAhHQKY5eZKFqSJ1fZQoaAZHwDXZERaouPFoB03oA2gIR0CmPFhsQ/X5dX2UKGgGR8A73ZtvXK8taAdN6ANoCEdApj2wDYAbQ3V9lChoBkfANR9h/iHZb2gHTegDaAhHQKY+26bONYN1fZQoaAZHQGIRikfs/ptoB02WA2gIR0CmQHBy8zyjdX2UKGgGR0A49xyGSIP9aAdN6ANoCEdAplIjMC9ytHV9lChoBkfAIAqmKqGUOmgHTegDaAhHQKZYc6QvHtF1fZQoaAZHwD4S3z+WGAVoB03oA2gIR0CmXdGD15B1dX2UKGgGR0Bp5yA+Y+jeaAdNQwNoCEdApl5C7dznzXV9lChoBkdAYuOOOsDGLmgHTckDaAhHQKZmQy44Ia91fZQoaAZHQGbV+KCQLeBoB03YAmgIR0CmbbUqx1PndX2UKGgGRz//oNNJvo/zaAdN6ANoCEdAppeZdhRZU3V9lChoBkdAKu/CZWq95GgHTegDaAhHQKbWXJMg2ZR1fZQoaAZHwC9jbJwKjSJoB03oA2gIR0Cm7h7coH9ndX2UKGgGR0AhJK5kK/mDaAdN6ANoCEdApvlJO1v2oXV9lChoBkdAN/OtbLU1AWgHTegDaAhHQKb8uPH1e0J1fZQoaAZHwEC+7gbZOBVoB03oA2gIR0CnAqqPfbbldX2UKGgGR8BFngsbvPToaAdN6ANoCEdApwWc7yQPqnV9lChoBkdAPSnLmp2lmGgHTegDaAhHQKcHCGIsRQJ1fZQoaAZHQDBZ2C/XXiBoB03oA2gIR0CnCI/bCaZydX2UKGgGR8Arm2gFotcwaAdN6ANoCEdApwrZkd3jdnV9lChoBke/+b1ZkkKNQ2gHTegDaAhHQKcd48QqZtx1fZQoaAZHQDPf8+A3DN1oB03oA2gIR0CnInGw7kn1dX2UKGgGRz/SAJLM9r44aAdN6ANoCEdApyfevB7/oHV9lChoBkfAQjaNbTtsvmgHTegDaAhHQKcoYr3j+711fZQoaAZHQDXlJe3QUpNoB03oA2gIR0CnM+ve54GEdX2UKGgGR8A3co7V8Ti9aAdN6ANoCEdApzsteyAxz3V9lChoBkfAI1d2HLzPKWgHTegDaAhHQKdkXjyWiUR1fZQoaAZHQCjvTPSlWOpoB03oA2gIR0CnpQ6fJ3gUdX2UKGgGR8A85zE74i5eaAdN6ANoCEdAp76mKTB68nV9lChoBkfAGYW3BpHqeWgHTegDaAhHQKfJwo3Jgb91fZQoaAZHQGWnzdUKiPBoB02yA2gIR0CnzNZbhWHUdX2UKGgGR0BkQ/+l0o0AaAdNuwNoCEdAp81e2mYShHV9lChoBkfARZVkUbkwOGgHTegDaAhHQKfOryS3b211fZQoaAZHwEFqTSsr/bVoB03oA2gIR0Cn1DVeSjgydX2UKGgGR0As6eZof0VaaAdN6ANoCEdAp9kataIN3HV9lChoBkfANbMXvYvnKWgHTegDaAhHQKfazCk43m51fZQoaAZHwC2FkvsZ5zJoB03oA2gIR0Cn78mGVRk3dX2UKGgGRz/t7Y02tMfzaAdN6ANoCEdAp/R466reZXV9lChoBkfAMPr5Ec81XWgHTegDaAhHQKf6Ioc7yQR1fZQoaAZHwAYDjBEa2ndoB03oA2gIR0Cn+pIGQjlgdX2UKGgGR0Ax3RqXWvr4aAdN6ANoCEdAqAKVBhQWN3V9lChoBkfAFMVrAP/aQGgHTegDaAhHQKgMVEgntv51fZQoaAZHwDOrWZqmCRRoB03oA2gIR0CoNY0QkHD8dX2UKGgGR0AQ9Mh5gPVeaAdN6ANoCEdAqHZsuYhManV9lChoBkdAQeGPPszEaWgHTegDaAhHQKiPxLowEhd1fZQoaAZHQDdyB06o2n9oB03oA2gIR0CombyTINmUdX2UKGgGR8AyUD1XeWOZaAdN6ANoCEdAqJwak2xY73V9lChoBkfAQ0iWom5UcWgHTegDaAhHQKicmprk8zR1fZQoaAZHwArSQPqcEvFoB03oA2gIR0ConiU1yeZodX2UKGgGR0Aix81n/T9baAdN6ANoCEdAqKVbGkvboXV9lChoBkfAJRR+BpYcN2gHTegDaAhHQKirDxwQ1791fZQoaAZHQEDWuuA7PppoB03oA2gIR0CorMf6fra/dX2UKGgGR8A2D84PwuuiaAdN6ANoCEdAqL8Wz6ab4XV9lChoBkdAO1nV5KODJ2gHTegDaAhHQKjF8tXgccV1fZQoaAZHwB1s0UGmk31oB03oA2gIR0Coy85dWyTqdX2UKGgGR8A1D39aUzKtaAdN6ANoCEdAqMxL15B1LnV9lChoBkdAJKCm2sq8UWgHTegDaAhHQKjU2fA9FF51fZQoaAZHQGSMw8fV7QdoB022A2gIR0Co1ShvJiiJdX2UKGgGR8AHgVTJhfBvaAdN6ANoCEdAqQkIQ6IWQHV9lChoBkfAGEoa1kUbk2gHTegDaAhHQKlLgzu4PPN1fZQoaAZHwDrA/u9eyAxoB03oA2gIR0CpZc1aGHpKdX2UKGgGR8A3GUi6g/TtaAdN6ANoCEdAqXBJH/cWTHV9lChoBkfAN2/j4pMHr2gHTegDaAhHQKlyxpyIYWN1fZQoaAZHwCrYSlFc6eZoB03oA2gIR0Cpc07nX/YKdX2UKGgGR0AykfvWpZOjaAdN6ANoCEdAqXScVLzwt3V9lChoBkdAIbhxxT850mgHTegDaAhHQKl8cXFcY651fZQoaAZHwEHE6dUbT+hoB03oA2gIR0CpggafapPzdX2UKGgGR0BDnn2ys0YTaAdN6ANoCEdAqYPVszl90HV9lChoBkdAKVOQyRB/qmgHTegDaAhHQKmYQ1qFh5R1fZQoaAZHwBN/mT1TR6ZoB03oA2gIR0CpniNCAtnPdX2UKGgGR8BM3lKTSsr/aAdN6ANoCEdAqaSEr3CbdHV9lChoBkdAFygF5fMOgGgHTegDaAhHQKmlCstCiRJ1fZQoaAZHwCyoCfYjB2xoB03oA2gIR0CpraagmJFcdX2UKGgGR8A4UO8CgbqAaAdN6ANoCEdAqa3zwBo243V9lChoBkfAOCnLRrrPdGgHTegDaAhHQKniBlIVdop1fZQoaAZHQCG2PaL4vexoB03oA2gIR0CqJveQU5+6dX2UKGgGR0ACCcurZJ05aAdN6ANoCEdAqkHnwkPcz3V9lChoBkfACz8w5/9YOmgHTegDaAhHQKpPfWbPQfJ1fZQoaAZHwCUs0cfeUINoB03oA2gIR0CqUpCgbp/xdX2UKGgGR8Aav0Gu9vjwaAdN6ANoCEdAqlLusV+I/XV9lChoBkfAJN31J17pmmgHTegDaAhHQKpT5iVjZth1fZQoaAZHwBHxv73wkPdoB03oA2gIR0CqWVQeV9ncdX2UKGgGR0A7o2aDwpfAaAdN6ANoCEdAql7u+dsi0XV9lChoBkfAORdXHR1HOWgHTegDaAhHQKpgzMA3kxR1fZQoaAZHwAxAprk8zRBoB03oA2gIR0Cqdc1v/BFedX2UKGgGR8A0/h4dIXj3aAdN6ANoCEdAqnrMCeVcEHV9lChoBkfAQcoQL/jsEGgHTegDaAhHQKqA9i4rjHZ1fZQoaAZHwBMdtdiUgSxoB03oA2gIR0CqgW0XP7emdX2UKGgGR8A3Jl8gIQe4aAdN6ANoCEdAqoujx3FDOXV9lChoBkdAPoCNsFdLQGgHTegDaAhHQKqME6nzg/F1fZQoaAZHP/eona37UG5oB03oA2gIR0Cqv0LJbMX8dX2UKGgGR0AKocDKYAsDaAdN6ANoCEdAqwOhjawljXV9lChoBkdAMfsNDtw71mgHTegDaAhHQKsdBschkiF1fZQoaAZHQDDvG4qgAZNoB03oA2gIR0CrKk7zbvgFdX2UKGgGR8Aw0SBshxHYaAdN6ANoCEdAqyyw/qxC6nV9lChoBkfASVeFBY3eemgHTegDaAhHQKstEkrwvxp1fZQoaAZHwDCHtAs052hoB03oA2gIR0CrLgCNCJGfdX2UKGgGR8BCXiX6ZYxMaAdN6ANoCEdAqzNhpcophHVlLg=="}, "ep_success_buffer": {":type:": "<class 'collections.deque'>", ":serialized:": "gAWVIAAAAAAAAACMC2NvbGxlY3Rpb25zlIwFZGVxdWWUk5QpS2SGlFKULg=="}, "_n_updates": 30625, "observation_space": {":type:": "<class 'gymnasium.spaces.box.Box'>", ":serialized:": "gAWVdgIAAAAAAACMFGd5bW5hc2l1bS5zcGFjZXMuYm94lIwDQm94lJOUKYGUfZQojAVkdHlwZZSMBW51bXB5lIwFZHR5cGWUk5SMAmY0lImIh5RSlChLA4wBPJROTk5K/////0r/////SwB0lGKMDWJvdW5kZWRfYmVsb3eUjBJudW1weS5jb3JlLm51bWVyaWOUjAtfZnJvbWJ1ZmZlcpSTlCiWCAAAAAAAAAABAQEBAQEBAZRoCIwCYjGUiYiHlFKUKEsDjAF8lE5OTkr/////Sv////9LAHSUYksIhZSMAUOUdJRSlIwNYm91bmRlZF9hYm92ZZRoESiWCAAAAAAAAAABAQEBAQEBAZRoFUsIhZRoGXSUUpSMBl9zaGFwZZRLCIWUjANsb3eUaBEoliAAAAAAAAAAAAC0wgAAtMIAAKDAAACgwNsPScAAAKDAAAAAgAAAAICUaAtLCIWUaBl0lFKUjARoaWdolGgRKJYgAAAAAAAAAAAAtEIAALRCAACgQAAAoEDbD0lAAACgQAAAgD8AAIA/lGgLSwiFlGgZdJRSlIwIbG93X3JlcHKUjFtbLTkwLiAgICAgICAgLTkwLiAgICAgICAgIC01LiAgICAgICAgIC01LiAgICAgICAgIC0zLjE0MTU5MjcgIC01LgogIC0wLiAgICAgICAgIC0wLiAgICAgICBdlIwJaGlnaF9yZXBylIxTWzkwLiAgICAgICAgOTAuICAgICAgICAgNS4gICAgICAgICA1LiAgICAgICAgIDMuMTQxNTkyNyAgNS4KICAxLiAgICAgICAgIDEuICAgICAgIF2UjApfbnBfcmFuZG9tlE51Yi4=", "dtype": "float32", "bounded_below": "[ True True True True True True True True]", "bounded_above": "[ True True True True True True True True]", "_shape": [8], "low": "[-90. -90. -5. -5. -3.1415927 -5.\n -0. -0. ]", "high": "[90. 90. 5. 5. 3.1415927 5.\n 1. 1. ]", "low_repr": "[-90. -90. -5. -5. -3.1415927 -5.\n -0. -0. ]", "high_repr": "[90. 90. 5. 5. 3.1415927 5.\n 1. 1. ]", "_np_random": null}, "action_space": {":type:": "<class 'gymnasium.spaces.box.Box'>", ":serialized:": "gAWVVwIAAAAAAACMFGd5bW5hc2l1bS5zcGFjZXMuYm94lIwDQm94lJOUKYGUfZQojAVkdHlwZZSMBW51bXB5lIwFZHR5cGWUk5SMAmY0lImIh5RSlChLA4wBPJROTk5K/////0r/////SwB0lGKMDWJvdW5kZWRfYmVsb3eUjBJudW1weS5jb3JlLm51bWVyaWOUjAtfZnJvbWJ1ZmZlcpSTlCiWAgAAAAAAAAABAZRoCIwCYjGUiYiHlFKUKEsDjAF8lE5OTkr/////Sv////9LAHSUYksChZSMAUOUdJRSlIwNYm91bmRlZF9hYm92ZZRoESiWAgAAAAAAAAABAZRoFUsChZRoGXSUUpSMBl9zaGFwZZRLAoWUjANsb3eUaBEolggAAAAAAAAAAACAvwAAgL+UaAtLAoWUaBl0lFKUjARoaWdolGgRKJYIAAAAAAAAAAAAgD8AAIA/lGgLSwKFlGgZdJRSlIwIbG93X3JlcHKUjAQtMS4wlIwJaGlnaF9yZXBylIwDMS4wlIwKX25wX3JhbmRvbZSMFG51bXB5LnJhbmRvbS5fcGlja2xllIwQX19nZW5lcmF0b3JfY3RvcpSTlIwFUENHNjSUaDKMFF9fYml0X2dlbmVyYXRvcl9jdG9ylJOUhpRSlH2UKIwNYml0X2dlbmVyYXRvcpSMBVBDRzY0lIwFc3RhdGWUfZQoaD2KEH/TU1ElOl8LAFmK/9h4lGCMA2luY5SKEdtwj51LNCFdT4Kcw6fikLQAdYwKaGFzX3VpbnQzMpRLAIwIdWludGVnZXKUSwB1YnViLg==", "dtype": "float32", "bounded_below": "[ True True]", "bounded_above": "[ True True]", "_shape": [2], "low": "[-1. -1.]", "high": "[1. 1.]", "low_repr": "-1.0", "high_repr": "1.0", "_np_random": "Generator(PCG64)"}, "n_envs": 16, "buffer_size": 1000000, "batch_size": 256, "learning_starts": 10000, "tau": 0.01, "gamma": 0.99, "gradient_steps": 1, "optimize_memory_usage": false, "replay_buffer_class": {":type:": "<class 'abc.ABCMeta'>", ":serialized:": "gAWVNQAAAAAAAACMIHN0YWJsZV9iYXNlbGluZXMzLmNvbW1vbi5idWZmZXJzlIwMUmVwbGF5QnVmZmVylJOULg==", "__module__": "stable_baselines3.common.buffers", "__doc__": "\n Replay buffer used in off-policy algorithms like SAC/TD3.\n\n :param buffer_size: Max number of element in the buffer\n :param observation_space: Observation space\n :param action_space: Action space\n :param device: PyTorch device\n :param n_envs: Number of parallel environments\n :param optimize_memory_usage: Enable a memory efficient variant\n of the replay buffer which reduces by almost a factor two the memory used,\n at a cost of more complexity.\n See https://github.com/DLR-RM/stable-baselines3/issues/37#issuecomment-637501195\n and https://github.com/DLR-RM/stable-baselines3/pull/28#issuecomment-637559274\n Cannot be used in combination with handle_timeout_termination.\n :param handle_timeout_termination: Handle timeout termination (due to timelimit)\n separately and treat the task as infinite horizon task.\n https://github.com/DLR-RM/stable-baselines3/issues/284\n ", "__init__": "<function ReplayBuffer.__init__ at 0x7d227e693be0>", "add": "<function ReplayBuffer.add at 0x7d227e693c70>", "sample": "<function ReplayBuffer.sample at 0x7d227e693d00>", "_get_samples": "<function ReplayBuffer._get_samples at 0x7d227e693d90>", "__abstractmethods__": "frozenset()", "_abc_impl": "<_abc._abc_data object at 0x7d227e69b000>"}, "replay_buffer_kwargs": {}, "train_freq": {":type:": "<class 'stable_baselines3.common.type_aliases.TrainFreq'>", ":serialized:": "gAWVYQAAAAAAAACMJXN0YWJsZV9iYXNlbGluZXMzLmNvbW1vbi50eXBlX2FsaWFzZXOUjAlUcmFpbkZyZXGUk5RLAWgAjBJUcmFpbkZyZXF1ZW5jeVVuaXSUk5SMBHN0ZXCUhZRSlIaUgZQu"}, "use_sde_at_warmup": false, "target_entropy": -2.0, "ent_coef": "auto", "target_update_interval": 1, "lr_schedule": {":type:": "<class 'function'>", ":serialized:": "gAWVeQIAAAAAAACMF2Nsb3VkcGlja2xlLmNsb3VkcGlja2xllIwOX21ha2VfZnVuY3Rpb26Uk5QoaACMDV9idWlsdGluX3R5cGWUk5SMCENvZGVUeXBllIWUUpQoSwFLAEsASwVLBEtDQzRkAX0BZAJ8ARQAfQJkA30DZAR9BHwAfAJrAHIYfAN8AHwCGwB8A3wEGAAUABgAUwB8BFMAlChOTZABS0tHP0frrxAjY7JHPzBiTdLxqfx0lCkojAF0lIwSYXZnX2VwaXNvZGVfbGVuZ3RolIwUdHJhbnNpdGlvbl90aW1lc3RlcHOUjBVpbml0aWFsX2xlYXJuaW5nX3JhdGWUjBNmaW5hbF9sZWFybmluZ19yYXRllHSUjB48aXB5dGhvbi1pbnB1dC02LTRlZTZjYWFkNDFlYz6UjBZsZWFybmluZ19yYXRlX3NjaGVkdWxllEsHQw4EAggBBAEEAQgCFAIEA5QpKXSUUpR9lCiMC19fcGFja2FnZV9flE6MCF9fbmFtZV9flIwIX19tYWluX1+UdU5OTnSUUpSMHGNsb3VkcGlja2xlLmNsb3VkcGlja2xlX2Zhc3SUjBJfZnVuY3Rpb25fc2V0c3RhdGWUk5RoGn2UfZQoaBdoEYwMX19xdWFsbmFtZV9flGgRjA9fX2Fubm90YXRpb25zX1+UfZSMDl9fa3dkZWZhdWx0c19flE6MDF9fZGVmYXVsdHNfX5ROjApfX21vZHVsZV9flGgYjAdfX2RvY19flE6MC19fY2xvc3VyZV9flE6MF19jbG91ZHBpY2tsZV9zdWJtb2R1bGVzlF2UjAtfX2dsb2JhbHNfX5R9lHWGlIZSMC4="}, "batch_norm_stats": [], "batch_norm_stats_target": [], "system_info": {"OS": "Linux-6.1.85+-x86_64-with-glibc2.35 # 1 SMP PREEMPT_DYNAMIC Sun Apr 28 14:29:16 UTC 2024", "Python": "3.10.12", "Stable-Baselines3": "2.0.0a5", "PyTorch": "2.3.0+cu121", "GPU Enabled": "False", "Numpy": "1.25.2", "Cloudpickle": "2.2.1", "Gymnasium": "0.28.1", "OpenAI Gym": "0.25.2"}}
replay.mp4 CHANGED
Binary files a/replay.mp4 and b/replay.mp4 differ
 
results.json CHANGED
@@ -1 +1 @@
1
- {"mean_reward": 230.68447329957976, "std_reward": 7.839936749907468, "is_deterministic": true, "n_eval_episodes": 10, "eval_datetime": "2024-05-23T14:07:59.724642"}
 
1
+ {"mean_reward": 6.611782643266634, "std_reward": 15.771835625560266, "is_deterministic": true, "n_eval_episodes": 10, "eval_datetime": "2024-05-23T16:38:17.863074"}