Upload results for SAC on RBC3D-hard-v0.
Browse filesThis view is limited to 50 files because it contains too many changes. See raw diff
- .gitattributes +20 -0
- 0/ckpt_latest.zip +3 -0
- 0/config.yaml +60 -0
- 0/hydra.yaml +163 -0
- 0/multirun.yaml +223 -0
- 0/overrides.yaml +4 -0
- 0/test/3d_temperature_test_eval_episode_0.gif +3 -0
- 0/test/test_eval_episode_0.csv +0 -0
- 0/test/x-y-temperature_test_eval_episode_0.gif +3 -0
- 0/test/x-z-temperature_test_eval_episode_0.gif +3 -0
- 0/test/y-z-temperature_test_eval_episode_0.gif +3 -0
- 0/training_log.csv +111 -0
- 1/ckpt_latest.zip +3 -0
- 1/config.yaml +60 -0
- 1/hydra.yaml +163 -0
- 1/multirun.yaml +223 -0
- 1/overrides.yaml +4 -0
- 1/test/3d_temperature_test_eval_episode_0.gif +3 -0
- 1/test/test_eval_episode_0.csv +0 -0
- 1/test/x-y-temperature_test_eval_episode_0.gif +3 -0
- 1/test/x-z-temperature_test_eval_episode_0.gif +3 -0
- 1/test/y-z-temperature_test_eval_episode_0.gif +3 -0
- 1/training_log.csv +111 -0
- 2/ckpt_latest.zip +3 -0
- 2/config.yaml +60 -0
- 2/hydra.yaml +163 -0
- 2/multirun.yaml +223 -0
- 2/overrides.yaml +4 -0
- 2/test/3d_temperature_test_eval_episode_0.gif +3 -0
- 2/test/test_eval_episode_0.csv +0 -0
- 2/test/x-y-temperature_test_eval_episode_0.gif +3 -0
- 2/test/x-z-temperature_test_eval_episode_0.gif +3 -0
- 2/test/y-z-temperature_test_eval_episode_0.gif +3 -0
- 2/training_log.csv +111 -0
- 3/ckpt_latest.zip +3 -0
- 3/config.yaml +60 -0
- 3/hydra.yaml +163 -0
- 3/multirun.yaml +223 -0
- 3/overrides.yaml +4 -0
- 3/test/3d_temperature_test_eval_episode_0.gif +3 -0
- 3/test/test_eval_episode_0.csv +0 -0
- 3/test/x-y-temperature_test_eval_episode_0.gif +3 -0
- 3/test/x-z-temperature_test_eval_episode_0.gif +3 -0
- 3/test/y-z-temperature_test_eval_episode_0.gif +3 -0
- 3/training_log.csv +111 -0
- 4/ckpt_latest.zip +3 -0
- 4/config.yaml +60 -0
- 4/hydra.yaml +163 -0
- 4/multirun.yaml +223 -0
- 4/overrides.yaml +4 -0
.gitattributes
CHANGED
|
@@ -33,3 +33,23 @@ saved_model/**/* filter=lfs diff=lfs merge=lfs -text
|
|
| 33 |
*.zip filter=lfs diff=lfs merge=lfs -text
|
| 34 |
*.zst filter=lfs diff=lfs merge=lfs -text
|
| 35 |
*tfevents* filter=lfs diff=lfs merge=lfs -text
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 33 |
*.zip filter=lfs diff=lfs merge=lfs -text
|
| 34 |
*.zst filter=lfs diff=lfs merge=lfs -text
|
| 35 |
*tfevents* filter=lfs diff=lfs merge=lfs -text
|
| 36 |
+
0/test/3d_temperature_test_eval_episode_0.gif filter=lfs diff=lfs merge=lfs -text
|
| 37 |
+
0/test/x-y-temperature_test_eval_episode_0.gif filter=lfs diff=lfs merge=lfs -text
|
| 38 |
+
0/test/x-z-temperature_test_eval_episode_0.gif filter=lfs diff=lfs merge=lfs -text
|
| 39 |
+
0/test/y-z-temperature_test_eval_episode_0.gif filter=lfs diff=lfs merge=lfs -text
|
| 40 |
+
1/test/3d_temperature_test_eval_episode_0.gif filter=lfs diff=lfs merge=lfs -text
|
| 41 |
+
1/test/x-y-temperature_test_eval_episode_0.gif filter=lfs diff=lfs merge=lfs -text
|
| 42 |
+
1/test/x-z-temperature_test_eval_episode_0.gif filter=lfs diff=lfs merge=lfs -text
|
| 43 |
+
1/test/y-z-temperature_test_eval_episode_0.gif filter=lfs diff=lfs merge=lfs -text
|
| 44 |
+
2/test/3d_temperature_test_eval_episode_0.gif filter=lfs diff=lfs merge=lfs -text
|
| 45 |
+
2/test/x-y-temperature_test_eval_episode_0.gif filter=lfs diff=lfs merge=lfs -text
|
| 46 |
+
2/test/x-z-temperature_test_eval_episode_0.gif filter=lfs diff=lfs merge=lfs -text
|
| 47 |
+
2/test/y-z-temperature_test_eval_episode_0.gif filter=lfs diff=lfs merge=lfs -text
|
| 48 |
+
3/test/3d_temperature_test_eval_episode_0.gif filter=lfs diff=lfs merge=lfs -text
|
| 49 |
+
3/test/x-y-temperature_test_eval_episode_0.gif filter=lfs diff=lfs merge=lfs -text
|
| 50 |
+
3/test/x-z-temperature_test_eval_episode_0.gif filter=lfs diff=lfs merge=lfs -text
|
| 51 |
+
3/test/y-z-temperature_test_eval_episode_0.gif filter=lfs diff=lfs merge=lfs -text
|
| 52 |
+
4/test/3d_temperature_test_eval_episode_0.gif filter=lfs diff=lfs merge=lfs -text
|
| 53 |
+
4/test/x-y-temperature_test_eval_episode_0.gif filter=lfs diff=lfs merge=lfs -text
|
| 54 |
+
4/test/x-z-temperature_test_eval_episode_0.gif filter=lfs diff=lfs merge=lfs -text
|
| 55 |
+
4/test/y-z-temperature_test_eval_episode_0.gif filter=lfs diff=lfs merge=lfs -text
|
0/ckpt_latest.zip
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:a1dad1e654c8891698f0e61f5b6b51fdf03d0172823422042070043bc5925e65
|
| 3 |
+
size 58086507
|
0/config.yaml
ADDED
|
@@ -0,0 +1,60 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
env_id: RBC3D-hard-v0
|
| 2 |
+
env_kwargs: {}
|
| 3 |
+
eval_env_kwargs: {}
|
| 4 |
+
seed: 0
|
| 5 |
+
rl_mode: marl
|
| 6 |
+
total_timesteps: 50000.0
|
| 7 |
+
n_eval_steps: 10
|
| 8 |
+
eval_freq: ${eval:${total_timesteps} // ${n_eval_steps}}
|
| 9 |
+
n_eval_episodes: 1
|
| 10 |
+
continue_training: false
|
| 11 |
+
checkpoint_latest: true
|
| 12 |
+
rl_device: cpu
|
| 13 |
+
eval_callback:
|
| 14 |
+
_target_: fluidgym.integration.sb3.EvalCallback
|
| 15 |
+
eval_freq: ${eval_freq}
|
| 16 |
+
n_eval_episodes: ${n_eval_episodes}
|
| 17 |
+
use_wandb: ${wandb.enable}
|
| 18 |
+
checkpoint_latest: ${checkpoint_latest}
|
| 19 |
+
wandb:
|
| 20 |
+
enable: true
|
| 21 |
+
entity: safe-autonomous-systems
|
| 22 |
+
project: jbecktepe-fluidgym
|
| 23 |
+
algorithm:
|
| 24 |
+
name: SAC
|
| 25 |
+
obj:
|
| 26 |
+
_target_: stable_baselines3.sac.sac.SAC
|
| 27 |
+
policy: MlpPolicy
|
| 28 |
+
learning_rate: 0.0003
|
| 29 |
+
buffer_size: 1000000
|
| 30 |
+
learning_starts: 100
|
| 31 |
+
batch_size: 256
|
| 32 |
+
tau: 0.005
|
| 33 |
+
gamma: 0.99
|
| 34 |
+
train_freq: 1
|
| 35 |
+
gradient_steps: -1
|
| 36 |
+
action_noise: null
|
| 37 |
+
replay_buffer_class: null
|
| 38 |
+
replay_buffer_kwargs: null
|
| 39 |
+
optimize_memory_usage: false
|
| 40 |
+
ent_coef: auto
|
| 41 |
+
target_update_interval: 1
|
| 42 |
+
target_entropy: auto
|
| 43 |
+
use_sde: false
|
| 44 |
+
sde_sample_freq: -1
|
| 45 |
+
use_sde_at_warmup: false
|
| 46 |
+
stats_window_size: 100
|
| 47 |
+
tensorboard_log: null
|
| 48 |
+
policy_kwargs: {}
|
| 49 |
+
verbose: 0
|
| 50 |
+
seed: ${seed}
|
| 51 |
+
device: cuda
|
| 52 |
+
_init_setup_model: true
|
| 53 |
+
cluster: {}
|
| 54 |
+
test_env_id: ${env_id}
|
| 55 |
+
test_env_kwargs: ${env_kwargs}
|
| 56 |
+
test_rl_mode: ${rl_mode}
|
| 57 |
+
n_test_episodes: 10
|
| 58 |
+
deterministic: true
|
| 59 |
+
save_frames: true
|
| 60 |
+
render_3d: true
|
0/hydra.yaml
ADDED
|
@@ -0,0 +1,163 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
hydra:
|
| 2 |
+
run:
|
| 3 |
+
dir: output/training/${rl_mode}/${env_id}/${algorithm.name}/${seed}
|
| 4 |
+
sweep:
|
| 5 |
+
dir: output/training/${rl_mode}/${env_id}/${algorithm.name}/${seed}
|
| 6 |
+
subdir: ''
|
| 7 |
+
launcher:
|
| 8 |
+
_target_: hydra._internal.core_plugins.basic_launcher.BasicLauncher
|
| 9 |
+
sweeper:
|
| 10 |
+
_target_: hydra._internal.core_plugins.basic_sweeper.BasicSweeper
|
| 11 |
+
max_batch_size: null
|
| 12 |
+
params: null
|
| 13 |
+
help:
|
| 14 |
+
app_name: ${hydra.job.name}
|
| 15 |
+
header: '${hydra.help.app_name} is powered by Hydra.
|
| 16 |
+
|
| 17 |
+
'
|
| 18 |
+
footer: 'Powered by Hydra (https://hydra.cc)
|
| 19 |
+
|
| 20 |
+
Use --hydra-help to view Hydra specific help
|
| 21 |
+
|
| 22 |
+
'
|
| 23 |
+
template: '${hydra.help.header}
|
| 24 |
+
|
| 25 |
+
== Configuration groups ==
|
| 26 |
+
|
| 27 |
+
Compose your configuration from those groups (group=option)
|
| 28 |
+
|
| 29 |
+
|
| 30 |
+
$APP_CONFIG_GROUPS
|
| 31 |
+
|
| 32 |
+
|
| 33 |
+
== Config ==
|
| 34 |
+
|
| 35 |
+
Override anything in the config (foo.bar=value)
|
| 36 |
+
|
| 37 |
+
|
| 38 |
+
$CONFIG
|
| 39 |
+
|
| 40 |
+
|
| 41 |
+
${hydra.help.footer}
|
| 42 |
+
|
| 43 |
+
'
|
| 44 |
+
hydra_help:
|
| 45 |
+
template: 'Hydra (${hydra.runtime.version})
|
| 46 |
+
|
| 47 |
+
See https://hydra.cc for more info.
|
| 48 |
+
|
| 49 |
+
|
| 50 |
+
== Flags ==
|
| 51 |
+
|
| 52 |
+
$FLAGS_HELP
|
| 53 |
+
|
| 54 |
+
|
| 55 |
+
== Configuration groups ==
|
| 56 |
+
|
| 57 |
+
Compose your configuration from those groups (For example, append hydra/job_logging=disabled
|
| 58 |
+
to command line)
|
| 59 |
+
|
| 60 |
+
|
| 61 |
+
$HYDRA_CONFIG_GROUPS
|
| 62 |
+
|
| 63 |
+
|
| 64 |
+
Use ''--cfg hydra'' to Show the Hydra config.
|
| 65 |
+
|
| 66 |
+
'
|
| 67 |
+
hydra_help: ???
|
| 68 |
+
hydra_logging:
|
| 69 |
+
version: 1
|
| 70 |
+
formatters:
|
| 71 |
+
simple:
|
| 72 |
+
format: '[%(asctime)s][HYDRA] %(message)s'
|
| 73 |
+
handlers:
|
| 74 |
+
console:
|
| 75 |
+
class: logging.StreamHandler
|
| 76 |
+
formatter: simple
|
| 77 |
+
stream: ext://sys.stdout
|
| 78 |
+
root:
|
| 79 |
+
level: INFO
|
| 80 |
+
handlers:
|
| 81 |
+
- console
|
| 82 |
+
loggers:
|
| 83 |
+
logging_example:
|
| 84 |
+
level: DEBUG
|
| 85 |
+
disable_existing_loggers: false
|
| 86 |
+
job_logging:
|
| 87 |
+
version: 1
|
| 88 |
+
formatters:
|
| 89 |
+
simple:
|
| 90 |
+
format: '[%(asctime)s][%(name)s][%(levelname)s] - %(message)s'
|
| 91 |
+
handlers:
|
| 92 |
+
console:
|
| 93 |
+
class: logging.StreamHandler
|
| 94 |
+
formatter: simple
|
| 95 |
+
stream: ext://sys.stdout
|
| 96 |
+
file:
|
| 97 |
+
class: logging.FileHandler
|
| 98 |
+
formatter: simple
|
| 99 |
+
filename: ${hydra.runtime.output_dir}/${hydra.job.name}.log
|
| 100 |
+
root:
|
| 101 |
+
level: INFO
|
| 102 |
+
handlers:
|
| 103 |
+
- console
|
| 104 |
+
- file
|
| 105 |
+
disable_existing_loggers: false
|
| 106 |
+
env: {}
|
| 107 |
+
mode: MULTIRUN
|
| 108 |
+
searchpath: []
|
| 109 |
+
callbacks: {}
|
| 110 |
+
output_subdir: .
|
| 111 |
+
overrides:
|
| 112 |
+
hydra:
|
| 113 |
+
- hydra.mode=MULTIRUN
|
| 114 |
+
task:
|
| 115 |
+
- algorithm=sb3_sac
|
| 116 |
+
- env_id=RBC3D-hard-v0
|
| 117 |
+
- rl_mode=marl
|
| 118 |
+
- seed=0
|
| 119 |
+
job:
|
| 120 |
+
name: test_sb3
|
| 121 |
+
chdir: true
|
| 122 |
+
override_dirname: algorithm=sb3_sac,env_id=RBC3D-hard-v0,rl_mode=marl,seed=0
|
| 123 |
+
id: '0'
|
| 124 |
+
num: 0
|
| 125 |
+
config_name: test_sb3
|
| 126 |
+
env_set: {}
|
| 127 |
+
env_copy: []
|
| 128 |
+
config:
|
| 129 |
+
override_dirname:
|
| 130 |
+
kv_sep: '='
|
| 131 |
+
item_sep: ','
|
| 132 |
+
exclude_keys: []
|
| 133 |
+
runtime:
|
| 134 |
+
version: 1.3.2
|
| 135 |
+
version_base: '1.3'
|
| 136 |
+
cwd: /cephfs/users/becktepe/git_projects/FluidGym
|
| 137 |
+
config_sources:
|
| 138 |
+
- path: hydra.conf
|
| 139 |
+
schema: pkg
|
| 140 |
+
provider: hydra
|
| 141 |
+
- path: /cephfs/users/becktepe/git_projects/FluidGym/runscripts/configs
|
| 142 |
+
schema: file
|
| 143 |
+
provider: main
|
| 144 |
+
- path: hydra_plugins.hydra_colorlog.conf
|
| 145 |
+
schema: pkg
|
| 146 |
+
provider: hydra-colorlog
|
| 147 |
+
- path: ''
|
| 148 |
+
schema: structured
|
| 149 |
+
provider: schema
|
| 150 |
+
output_dir: /cephfs/users/becktepe/git_projects/FluidGym/output/training/marl/RBC3D-hard-v0/SAC/0
|
| 151 |
+
choices:
|
| 152 |
+
cluster: local
|
| 153 |
+
algorithm: sb3_sac
|
| 154 |
+
hydra/env: default
|
| 155 |
+
hydra/callbacks: null
|
| 156 |
+
hydra/job_logging: default
|
| 157 |
+
hydra/hydra_logging: default
|
| 158 |
+
hydra/hydra_help: default
|
| 159 |
+
hydra/help: default
|
| 160 |
+
hydra/sweeper: basic
|
| 161 |
+
hydra/launcher: basic
|
| 162 |
+
hydra/output: default
|
| 163 |
+
verbose: false
|
0/multirun.yaml
ADDED
|
@@ -0,0 +1,223 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
hydra:
|
| 2 |
+
run:
|
| 3 |
+
dir: output/training/${rl_mode}/${env_id}/${algorithm.name}/${seed}
|
| 4 |
+
sweep:
|
| 5 |
+
dir: output/training/${rl_mode}/${env_id}/${algorithm.name}/${seed}
|
| 6 |
+
subdir: ''
|
| 7 |
+
launcher:
|
| 8 |
+
_target_: hydra._internal.core_plugins.basic_launcher.BasicLauncher
|
| 9 |
+
sweeper:
|
| 10 |
+
_target_: hydra._internal.core_plugins.basic_sweeper.BasicSweeper
|
| 11 |
+
max_batch_size: null
|
| 12 |
+
params: null
|
| 13 |
+
help:
|
| 14 |
+
app_name: ${hydra.job.name}
|
| 15 |
+
header: '${hydra.help.app_name} is powered by Hydra.
|
| 16 |
+
|
| 17 |
+
'
|
| 18 |
+
footer: 'Powered by Hydra (https://hydra.cc)
|
| 19 |
+
|
| 20 |
+
Use --hydra-help to view Hydra specific help
|
| 21 |
+
|
| 22 |
+
'
|
| 23 |
+
template: '${hydra.help.header}
|
| 24 |
+
|
| 25 |
+
== Configuration groups ==
|
| 26 |
+
|
| 27 |
+
Compose your configuration from those groups (group=option)
|
| 28 |
+
|
| 29 |
+
|
| 30 |
+
$APP_CONFIG_GROUPS
|
| 31 |
+
|
| 32 |
+
|
| 33 |
+
== Config ==
|
| 34 |
+
|
| 35 |
+
Override anything in the config (foo.bar=value)
|
| 36 |
+
|
| 37 |
+
|
| 38 |
+
$CONFIG
|
| 39 |
+
|
| 40 |
+
|
| 41 |
+
${hydra.help.footer}
|
| 42 |
+
|
| 43 |
+
'
|
| 44 |
+
hydra_help:
|
| 45 |
+
template: 'Hydra (${hydra.runtime.version})
|
| 46 |
+
|
| 47 |
+
See https://hydra.cc for more info.
|
| 48 |
+
|
| 49 |
+
|
| 50 |
+
== Flags ==
|
| 51 |
+
|
| 52 |
+
$FLAGS_HELP
|
| 53 |
+
|
| 54 |
+
|
| 55 |
+
== Configuration groups ==
|
| 56 |
+
|
| 57 |
+
Compose your configuration from those groups (For example, append hydra/job_logging=disabled
|
| 58 |
+
to command line)
|
| 59 |
+
|
| 60 |
+
|
| 61 |
+
$HYDRA_CONFIG_GROUPS
|
| 62 |
+
|
| 63 |
+
|
| 64 |
+
Use ''--cfg hydra'' to Show the Hydra config.
|
| 65 |
+
|
| 66 |
+
'
|
| 67 |
+
hydra_help: ???
|
| 68 |
+
hydra_logging:
|
| 69 |
+
version: 1
|
| 70 |
+
formatters:
|
| 71 |
+
simple:
|
| 72 |
+
format: '[%(asctime)s][HYDRA] %(message)s'
|
| 73 |
+
handlers:
|
| 74 |
+
console:
|
| 75 |
+
class: logging.StreamHandler
|
| 76 |
+
formatter: simple
|
| 77 |
+
stream: ext://sys.stdout
|
| 78 |
+
root:
|
| 79 |
+
level: INFO
|
| 80 |
+
handlers:
|
| 81 |
+
- console
|
| 82 |
+
loggers:
|
| 83 |
+
logging_example:
|
| 84 |
+
level: DEBUG
|
| 85 |
+
disable_existing_loggers: false
|
| 86 |
+
job_logging:
|
| 87 |
+
version: 1
|
| 88 |
+
formatters:
|
| 89 |
+
simple:
|
| 90 |
+
format: '[%(asctime)s][%(name)s][%(levelname)s] - %(message)s'
|
| 91 |
+
handlers:
|
| 92 |
+
console:
|
| 93 |
+
class: logging.StreamHandler
|
| 94 |
+
formatter: simple
|
| 95 |
+
stream: ext://sys.stdout
|
| 96 |
+
file:
|
| 97 |
+
class: logging.FileHandler
|
| 98 |
+
formatter: simple
|
| 99 |
+
filename: ${hydra.runtime.output_dir}/${hydra.job.name}.log
|
| 100 |
+
root:
|
| 101 |
+
level: INFO
|
| 102 |
+
handlers:
|
| 103 |
+
- console
|
| 104 |
+
- file
|
| 105 |
+
disable_existing_loggers: false
|
| 106 |
+
env: {}
|
| 107 |
+
mode: MULTIRUN
|
| 108 |
+
searchpath: []
|
| 109 |
+
callbacks: {}
|
| 110 |
+
output_subdir: .
|
| 111 |
+
overrides:
|
| 112 |
+
hydra:
|
| 113 |
+
- hydra.mode=MULTIRUN
|
| 114 |
+
task:
|
| 115 |
+
- algorithm=sb3_sac
|
| 116 |
+
- env_id=RBC3D-hard-v0
|
| 117 |
+
- rl_mode=marl
|
| 118 |
+
- seed=0
|
| 119 |
+
job:
|
| 120 |
+
name: test_sb3
|
| 121 |
+
chdir: true
|
| 122 |
+
override_dirname: algorithm=sb3_sac,env_id=RBC3D-hard-v0,rl_mode=marl,seed=0
|
| 123 |
+
id: ???
|
| 124 |
+
num: ???
|
| 125 |
+
config_name: test_sb3
|
| 126 |
+
env_set: {}
|
| 127 |
+
env_copy: []
|
| 128 |
+
config:
|
| 129 |
+
override_dirname:
|
| 130 |
+
kv_sep: '='
|
| 131 |
+
item_sep: ','
|
| 132 |
+
exclude_keys: []
|
| 133 |
+
runtime:
|
| 134 |
+
version: 1.3.2
|
| 135 |
+
version_base: '1.3'
|
| 136 |
+
cwd: /cephfs/users/becktepe/git_projects/FluidGym
|
| 137 |
+
config_sources:
|
| 138 |
+
- path: hydra.conf
|
| 139 |
+
schema: pkg
|
| 140 |
+
provider: hydra
|
| 141 |
+
- path: /cephfs/users/becktepe/git_projects/FluidGym/runscripts/configs
|
| 142 |
+
schema: file
|
| 143 |
+
provider: main
|
| 144 |
+
- path: hydra_plugins.hydra_colorlog.conf
|
| 145 |
+
schema: pkg
|
| 146 |
+
provider: hydra-colorlog
|
| 147 |
+
- path: ''
|
| 148 |
+
schema: structured
|
| 149 |
+
provider: schema
|
| 150 |
+
output_dir: ???
|
| 151 |
+
choices:
|
| 152 |
+
cluster: local
|
| 153 |
+
algorithm: sb3_sac
|
| 154 |
+
hydra/env: default
|
| 155 |
+
hydra/callbacks: null
|
| 156 |
+
hydra/job_logging: default
|
| 157 |
+
hydra/hydra_logging: default
|
| 158 |
+
hydra/hydra_help: default
|
| 159 |
+
hydra/help: default
|
| 160 |
+
hydra/sweeper: basic
|
| 161 |
+
hydra/launcher: basic
|
| 162 |
+
hydra/output: default
|
| 163 |
+
verbose: false
|
| 164 |
+
env_id: RBC3D-hard-v0
|
| 165 |
+
env_kwargs: {}
|
| 166 |
+
eval_env_kwargs: {}
|
| 167 |
+
seed: 0
|
| 168 |
+
rl_mode: marl
|
| 169 |
+
total_timesteps: 50000.0
|
| 170 |
+
n_eval_steps: 10
|
| 171 |
+
eval_freq: ${eval:${total_timesteps} // ${n_eval_steps}}
|
| 172 |
+
n_eval_episodes: 1
|
| 173 |
+
continue_training: false
|
| 174 |
+
checkpoint_latest: true
|
| 175 |
+
rl_device: cpu
|
| 176 |
+
eval_callback:
|
| 177 |
+
_target_: fluidgym.integration.sb3.EvalCallback
|
| 178 |
+
eval_freq: ${eval_freq}
|
| 179 |
+
n_eval_episodes: ${n_eval_episodes}
|
| 180 |
+
use_wandb: ${wandb.enable}
|
| 181 |
+
checkpoint_latest: ${checkpoint_latest}
|
| 182 |
+
wandb:
|
| 183 |
+
enable: true
|
| 184 |
+
entity: safe-autonomous-systems
|
| 185 |
+
project: jbecktepe-fluidgym
|
| 186 |
+
algorithm:
|
| 187 |
+
name: SAC
|
| 188 |
+
obj:
|
| 189 |
+
_target_: stable_baselines3.sac.sac.SAC
|
| 190 |
+
policy: MlpPolicy
|
| 191 |
+
learning_rate: 0.0003
|
| 192 |
+
buffer_size: 1000000
|
| 193 |
+
learning_starts: 100
|
| 194 |
+
batch_size: 256
|
| 195 |
+
tau: 0.005
|
| 196 |
+
gamma: 0.99
|
| 197 |
+
train_freq: 1
|
| 198 |
+
gradient_steps: -1
|
| 199 |
+
action_noise: null
|
| 200 |
+
replay_buffer_class: null
|
| 201 |
+
replay_buffer_kwargs: null
|
| 202 |
+
optimize_memory_usage: false
|
| 203 |
+
ent_coef: auto
|
| 204 |
+
target_update_interval: 1
|
| 205 |
+
target_entropy: auto
|
| 206 |
+
use_sde: false
|
| 207 |
+
sde_sample_freq: -1
|
| 208 |
+
use_sde_at_warmup: false
|
| 209 |
+
stats_window_size: 100
|
| 210 |
+
tensorboard_log: null
|
| 211 |
+
policy_kwargs: {}
|
| 212 |
+
verbose: 0
|
| 213 |
+
seed: ${seed}
|
| 214 |
+
device: cuda
|
| 215 |
+
_init_setup_model: true
|
| 216 |
+
cluster: {}
|
| 217 |
+
test_env_id: ${env_id}
|
| 218 |
+
test_env_kwargs: ${env_kwargs}
|
| 219 |
+
test_rl_mode: ${rl_mode}
|
| 220 |
+
n_test_episodes: 10
|
| 221 |
+
deterministic: true
|
| 222 |
+
save_frames: true
|
| 223 |
+
render_3d: true
|
0/overrides.yaml
ADDED
|
@@ -0,0 +1,4 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
- algorithm=sb3_sac
|
| 2 |
+
- env_id=RBC3D-hard-v0
|
| 3 |
+
- rl_mode=marl
|
| 4 |
+
- seed=0
|
0/test/3d_temperature_test_eval_episode_0.gif
ADDED
|
Git LFS Details
|
0/test/test_eval_episode_0.csv
ADDED
|
The diff for this file is too large to render.
See raw diff
|
|
|
0/test/x-y-temperature_test_eval_episode_0.gif
ADDED
|
Git LFS Details
|
0/test/x-z-temperature_test_eval_episode_0.gif
ADDED
|
Git LFS Details
|
0/test/y-z-temperature_test_eval_episode_0.gif
ADDED
|
Git LFS Details
|
0/training_log.csv
ADDED
|
@@ -0,0 +1,111 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
step,training/mean_reward,training/mean_global_reward,training/mean_nusselt,evaluation/mean_nusselt,evaluation/mean_reward
|
| 2 |
+
500,0.024334125220775604,0.024334121227264405,2.659598898410797,,
|
| 3 |
+
1000,0.2624503970146179,0.26245042419433595,2.4214825954437256,,
|
| 4 |
+
1500,0.35953813791275024,0.3595381588935852,2.3243948607444764,,
|
| 5 |
+
2000,0.36718568205833435,0.36718566513061524,2.3167473545074464,,
|
| 6 |
+
2500,0.36084315180778503,0.360843141078949,2.3230898785591125,,
|
| 7 |
+
3000,0.3312532901763916,0.33125330877304077,2.352679710865021,,
|
| 8 |
+
3500,0.33391037583351135,0.3339103684425354,2.350022651195526,,
|
| 9 |
+
4000,0.34455594420433044,0.3445559396743774,2.339377079963684,,
|
| 10 |
+
4500,0.3756142556667328,0.37561428833007815,2.3083187313079834,,
|
| 11 |
+
5000,0.38598138093948364,0.3859814014434814,2.2979516181945803,,
|
| 12 |
+
5000,,,,2.3237505912780763,0.36018240451812744
|
| 13 |
+
5500,0.3767675757408142,0.3767676148414612,2.3071654047966,,
|
| 14 |
+
6000,0.38073307275772095,0.38073307371139525,2.303199945926666,,
|
| 15 |
+
6500,0.3662646412849426,0.36626463651657104,2.3176683831214904,,
|
| 16 |
+
7000,0.3904113173484802,0.390411283493042,2.2935217361450198,,
|
| 17 |
+
7500,0.3787308633327484,0.3787308506965637,2.3052021689414977,,
|
| 18 |
+
8000,0.3718392550945282,0.3718392949104309,2.3120937247276308,,
|
| 19 |
+
8500,0.37776491045951843,0.37776491737365725,2.3061681022644045,,
|
| 20 |
+
9000,0.3708631992340088,0.37086317157745363,2.313069848060608,,
|
| 21 |
+
9500,0.38530001044273376,0.3853000316619873,2.2986329879760743,,
|
| 22 |
+
10000,0.3701469898223877,0.3701469955444336,2.313786024093628,,
|
| 23 |
+
10000,,,,2.33200471162796,0.35192832350730896
|
| 24 |
+
10500,0.371250182390213,0.3712501668930054,2.312682852745056,,
|
| 25 |
+
11000,0.36005133390426636,0.3600513195991516,2.32388170003891,,
|
| 26 |
+
11500,0.36593225598335266,0.36593223524093627,2.318000784397125,,
|
| 27 |
+
12000,0.3506813943386078,0.3506813745498657,2.333251645088196,,
|
| 28 |
+
12500,0.34689468145370483,0.34689472723007203,2.3370382924079895,,
|
| 29 |
+
13000,0.3328351378440857,0.3328351325988769,2.3510978870391845,,
|
| 30 |
+
13500,0.32760584354400635,0.3276058340072632,2.356327185630798,,
|
| 31 |
+
14000,0.32396844029426575,0.32396845769882204,2.3599645619392393,,
|
| 32 |
+
14500,0.3112345039844513,0.3112345261573792,2.3726984934806823,,
|
| 33 |
+
15000,0.2970444858074188,0.2970444750785828,2.3868885445594787,,
|
| 34 |
+
15000,,,,2.4974724411964417,0.18646056950092316
|
| 35 |
+
15500,0.2933638393878937,0.2933638062477112,2.3905692133903504,,
|
| 36 |
+
16000,0.2843990921974182,0.28439907741546633,2.3995339422225954,,
|
| 37 |
+
16500,0.34524768590927124,0.34524767780303955,2.338685341835022,,
|
| 38 |
+
17000,0.3667249381542206,0.36672496843338015,2.3172080512046813,,
|
| 39 |
+
17500,0.35660773515701294,0.35660772275924685,2.3273252968788145,,
|
| 40 |
+
18000,0.344329833984375,0.34432986211776734,2.339603157520294,,
|
| 41 |
+
18500,0.3768962025642395,0.3768962044715881,2.3070368151664735,,
|
| 42 |
+
19000,0.40714362263679504,0.4071436634063721,2.2767893562316894,,
|
| 43 |
+
19500,0.3576985001564026,0.3576985297203064,2.326234489917755,,
|
| 44 |
+
20000,0.36372071504592896,0.3637206988334656,2.320212320804596,,
|
| 45 |
+
20000,,,,2.345616182088852,0.3383168578147888
|
| 46 |
+
20500,0.36746519804000854,0.36746525144577025,2.3164677681922914,,
|
| 47 |
+
21000,0.3630509376525879,0.3630509223937988,2.3208820972442625,,
|
| 48 |
+
21500,0.3734363317489624,0.37343637228012083,2.3104966473579407,,
|
| 49 |
+
22000,0.3743448555469513,0.3743448691368103,2.309588150501251,,
|
| 50 |
+
22500,0.37149685621261597,0.3714968810081482,2.3124361386299133,,
|
| 51 |
+
23000,0.3609534204006195,0.360953489780426,2.3229795298576357,,
|
| 52 |
+
23500,0.35798317193984985,0.3579831943511963,2.325949825286865,,
|
| 53 |
+
24000,0.36004963517189026,0.3600496459007263,2.3238833737373352,,
|
| 54 |
+
24500,0.35610634088516235,0.35610634326934815,2.3278266763687134,,
|
| 55 |
+
25000,0.3485834300518036,0.34858342027664185,2.3353495993614195,,
|
| 56 |
+
25000,,,,2.379871265888214,0.30406174063682556
|
| 57 |
+
25500,0.34725385904312134,0.3472538433074951,2.3366791763305663,,
|
| 58 |
+
26000,0.35197943449020386,0.3519794182777405,2.331953601360321,,
|
| 59 |
+
26500,0.3582424223423004,0.35824246644973756,2.325690553188324,,
|
| 60 |
+
27000,0.35206305980682373,0.352063081741333,2.3318699378967285,,
|
| 61 |
+
27500,0.34522876143455505,0.34522877645492556,2.338704243183136,,
|
| 62 |
+
28000,0.3227401077747345,0.32274007177352904,2.3611929478645326,,
|
| 63 |
+
28500,0.3392401337623596,0.33924011659622194,2.3446929030418397,,
|
| 64 |
+
29000,0.36245307326316833,0.36245307970046997,2.3214799399375914,,
|
| 65 |
+
29500,0.32731521129608154,0.3273151850700378,2.3566178345680235,,
|
| 66 |
+
30000,0.3360752463340759,0.3360752668380737,2.347857752799988,,
|
| 67 |
+
30000,,,,2.3262969970703127,0.357636034488678
|
| 68 |
+
30500,0.32054057717323303,0.3205405993461609,2.3633924202919006,,
|
| 69 |
+
31000,0.36444732546806335,0.36444735956192015,2.3194856600761415,,
|
| 70 |
+
31500,0.3549940884113312,0.3549940209388733,2.328938998699188,,
|
| 71 |
+
32000,0.3843594491481781,0.38435945653915404,2.2995735630989076,,
|
| 72 |
+
32500,0.3849279284477234,0.3849278755187988,2.2990051441192625,,
|
| 73 |
+
33000,0.39491337537765503,0.394913348197937,2.2890196714401245,,
|
| 74 |
+
33500,0.3920864760875702,0.3920865015983582,2.291846518039703,,
|
| 75 |
+
34000,0.39170318841934204,0.39170316791534426,2.292229851722717,,
|
| 76 |
+
34500,0.420412540435791,0.4204125347137451,2.2635204849243165,,
|
| 77 |
+
35000,0.34662899374961853,0.34662902069091794,2.3373039989471436,,
|
| 78 |
+
35000,,,,2.3692104506492613,0.31472259759902954
|
| 79 |
+
35500,0.35252904891967773,0.35252904319763184,2.3314039764404297,,
|
| 80 |
+
36000,0.32034236192703247,0.3203423891067505,2.363590630531311,,
|
| 81 |
+
36500,0.3476278781890869,0.34762785577774047,2.336305163860321,,
|
| 82 |
+
37000,0.3439163863658905,0.3439163794517517,2.3400166401863096,,
|
| 83 |
+
37500,0.34822696447372437,0.34822696352005006,2.3357060561180116,,
|
| 84 |
+
38000,0.33781173825263977,0.33781173610687254,2.346121283531189,,
|
| 85 |
+
38500,0.3199111819267273,0.31991121435165404,2.3640218052864075,,
|
| 86 |
+
39000,0.31628549098968506,0.3162854771614075,2.367647542476654,,
|
| 87 |
+
39500,0.3104632496833801,0.31046322917938235,2.373469790458679,,
|
| 88 |
+
40000,0.31474560499191284,0.314745614528656,2.3691874051094057,,
|
| 89 |
+
40000,,,,2.3955817461013793,0.28835129737854004
|
| 90 |
+
40500,0.29504793882369995,0.2950479545593262,2.3888850650787354,,
|
| 91 |
+
41000,0.28457191586494446,0.28457193803787234,2.399361081600189,,
|
| 92 |
+
41500,0.272605299949646,0.2726052570343018,2.4113277626037597,,
|
| 93 |
+
42000,0.27886706590652466,0.2788670420646667,2.4050659775733947,,
|
| 94 |
+
42500,0.2861153781414032,0.28611536741256716,2.3978176522254944,,
|
| 95 |
+
43000,0.32526740431785583,0.32526741933822634,2.3586656002998354,,
|
| 96 |
+
43500,0.2914542257785797,0.29145421838760377,2.3924788012504576,,
|
| 97 |
+
44000,0.30094438791275024,0.30094439268112183,2.38298862695694,,
|
| 98 |
+
44500,0.34661510586738586,0.34661513185501097,2.3373178877830507,,
|
| 99 |
+
45000,0.38904449343681335,0.3890444746017456,2.294888545036316,,
|
| 100 |
+
45000,,,,2.2740820169448854,0.4098510146141052
|
| 101 |
+
45500,0.40971922874450684,0.4097192544937134,2.2742137651443484,,
|
| 102 |
+
46000,0.4111744463443756,0.41117440700531005,2.2727586126327513,,
|
| 103 |
+
46500,0.4461890161037445,0.44618902063369753,2.237743999004364,,
|
| 104 |
+
47000,0.3991549015045166,0.39915493297576904,2.2847780866622927,,
|
| 105 |
+
47500,0.4061412215232849,0.4061412315368652,2.2777917881011964,,
|
| 106 |
+
48000,0.3889833390712738,0.3889833664894104,2.294949653148651,,
|
| 107 |
+
48500,0.387422114610672,0.387422110080719,2.2965109095573424,,
|
| 108 |
+
49000,0.38070225715637207,0.3807022848129272,2.303230734825134,,
|
| 109 |
+
49500,0.3346402645111084,0.3346402645111084,2.349292755126953,,
|
| 110 |
+
50000,0.3522387742996216,0.35223875284194944,2.331694266796112,,
|
| 111 |
+
50000,,,,2.4375158941745756,0.2464171200990677
|
1/ckpt_latest.zip
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:4d7f7bf8a910d040dda104db751872ce36cc1ce0054abfb8890e8a004d560dac
|
| 3 |
+
size 58086507
|
1/config.yaml
ADDED
|
@@ -0,0 +1,60 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
env_id: RBC3D-hard-v0
|
| 2 |
+
env_kwargs: {}
|
| 3 |
+
eval_env_kwargs: {}
|
| 4 |
+
seed: 1
|
| 5 |
+
rl_mode: marl
|
| 6 |
+
total_timesteps: 50000.0
|
| 7 |
+
n_eval_steps: 10
|
| 8 |
+
eval_freq: ${eval:${total_timesteps} // ${n_eval_steps}}
|
| 9 |
+
n_eval_episodes: 1
|
| 10 |
+
continue_training: false
|
| 11 |
+
checkpoint_latest: true
|
| 12 |
+
rl_device: cpu
|
| 13 |
+
eval_callback:
|
| 14 |
+
_target_: fluidgym.integration.sb3.EvalCallback
|
| 15 |
+
eval_freq: ${eval_freq}
|
| 16 |
+
n_eval_episodes: ${n_eval_episodes}
|
| 17 |
+
use_wandb: ${wandb.enable}
|
| 18 |
+
checkpoint_latest: ${checkpoint_latest}
|
| 19 |
+
wandb:
|
| 20 |
+
enable: true
|
| 21 |
+
entity: safe-autonomous-systems
|
| 22 |
+
project: jbecktepe-fluidgym
|
| 23 |
+
algorithm:
|
| 24 |
+
name: SAC
|
| 25 |
+
obj:
|
| 26 |
+
_target_: stable_baselines3.sac.sac.SAC
|
| 27 |
+
policy: MlpPolicy
|
| 28 |
+
learning_rate: 0.0003
|
| 29 |
+
buffer_size: 1000000
|
| 30 |
+
learning_starts: 100
|
| 31 |
+
batch_size: 256
|
| 32 |
+
tau: 0.005
|
| 33 |
+
gamma: 0.99
|
| 34 |
+
train_freq: 1
|
| 35 |
+
gradient_steps: -1
|
| 36 |
+
action_noise: null
|
| 37 |
+
replay_buffer_class: null
|
| 38 |
+
replay_buffer_kwargs: null
|
| 39 |
+
optimize_memory_usage: false
|
| 40 |
+
ent_coef: auto
|
| 41 |
+
target_update_interval: 1
|
| 42 |
+
target_entropy: auto
|
| 43 |
+
use_sde: false
|
| 44 |
+
sde_sample_freq: -1
|
| 45 |
+
use_sde_at_warmup: false
|
| 46 |
+
stats_window_size: 100
|
| 47 |
+
tensorboard_log: null
|
| 48 |
+
policy_kwargs: {}
|
| 49 |
+
verbose: 0
|
| 50 |
+
seed: ${seed}
|
| 51 |
+
device: cuda
|
| 52 |
+
_init_setup_model: true
|
| 53 |
+
cluster: {}
|
| 54 |
+
test_env_id: ${env_id}
|
| 55 |
+
test_env_kwargs: ${env_kwargs}
|
| 56 |
+
test_rl_mode: ${rl_mode}
|
| 57 |
+
n_test_episodes: 10
|
| 58 |
+
deterministic: true
|
| 59 |
+
save_frames: true
|
| 60 |
+
render_3d: true
|
1/hydra.yaml
ADDED
|
@@ -0,0 +1,163 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
hydra:
|
| 2 |
+
run:
|
| 3 |
+
dir: output/training/${rl_mode}/${env_id}/${algorithm.name}/${seed}
|
| 4 |
+
sweep:
|
| 5 |
+
dir: output/training/${rl_mode}/${env_id}/${algorithm.name}/${seed}
|
| 6 |
+
subdir: ''
|
| 7 |
+
launcher:
|
| 8 |
+
_target_: hydra._internal.core_plugins.basic_launcher.BasicLauncher
|
| 9 |
+
sweeper:
|
| 10 |
+
_target_: hydra._internal.core_plugins.basic_sweeper.BasicSweeper
|
| 11 |
+
max_batch_size: null
|
| 12 |
+
params: null
|
| 13 |
+
help:
|
| 14 |
+
app_name: ${hydra.job.name}
|
| 15 |
+
header: '${hydra.help.app_name} is powered by Hydra.
|
| 16 |
+
|
| 17 |
+
'
|
| 18 |
+
footer: 'Powered by Hydra (https://hydra.cc)
|
| 19 |
+
|
| 20 |
+
Use --hydra-help to view Hydra specific help
|
| 21 |
+
|
| 22 |
+
'
|
| 23 |
+
template: '${hydra.help.header}
|
| 24 |
+
|
| 25 |
+
== Configuration groups ==
|
| 26 |
+
|
| 27 |
+
Compose your configuration from those groups (group=option)
|
| 28 |
+
|
| 29 |
+
|
| 30 |
+
$APP_CONFIG_GROUPS
|
| 31 |
+
|
| 32 |
+
|
| 33 |
+
== Config ==
|
| 34 |
+
|
| 35 |
+
Override anything in the config (foo.bar=value)
|
| 36 |
+
|
| 37 |
+
|
| 38 |
+
$CONFIG
|
| 39 |
+
|
| 40 |
+
|
| 41 |
+
${hydra.help.footer}
|
| 42 |
+
|
| 43 |
+
'
|
| 44 |
+
hydra_help:
|
| 45 |
+
template: 'Hydra (${hydra.runtime.version})
|
| 46 |
+
|
| 47 |
+
See https://hydra.cc for more info.
|
| 48 |
+
|
| 49 |
+
|
| 50 |
+
== Flags ==
|
| 51 |
+
|
| 52 |
+
$FLAGS_HELP
|
| 53 |
+
|
| 54 |
+
|
| 55 |
+
== Configuration groups ==
|
| 56 |
+
|
| 57 |
+
Compose your configuration from those groups (For example, append hydra/job_logging=disabled
|
| 58 |
+
to command line)
|
| 59 |
+
|
| 60 |
+
|
| 61 |
+
$HYDRA_CONFIG_GROUPS
|
| 62 |
+
|
| 63 |
+
|
| 64 |
+
Use ''--cfg hydra'' to Show the Hydra config.
|
| 65 |
+
|
| 66 |
+
'
|
| 67 |
+
hydra_help: ???
|
| 68 |
+
hydra_logging:
|
| 69 |
+
version: 1
|
| 70 |
+
formatters:
|
| 71 |
+
simple:
|
| 72 |
+
format: '[%(asctime)s][HYDRA] %(message)s'
|
| 73 |
+
handlers:
|
| 74 |
+
console:
|
| 75 |
+
class: logging.StreamHandler
|
| 76 |
+
formatter: simple
|
| 77 |
+
stream: ext://sys.stdout
|
| 78 |
+
root:
|
| 79 |
+
level: INFO
|
| 80 |
+
handlers:
|
| 81 |
+
- console
|
| 82 |
+
loggers:
|
| 83 |
+
logging_example:
|
| 84 |
+
level: DEBUG
|
| 85 |
+
disable_existing_loggers: false
|
| 86 |
+
job_logging:
|
| 87 |
+
version: 1
|
| 88 |
+
formatters:
|
| 89 |
+
simple:
|
| 90 |
+
format: '[%(asctime)s][%(name)s][%(levelname)s] - %(message)s'
|
| 91 |
+
handlers:
|
| 92 |
+
console:
|
| 93 |
+
class: logging.StreamHandler
|
| 94 |
+
formatter: simple
|
| 95 |
+
stream: ext://sys.stdout
|
| 96 |
+
file:
|
| 97 |
+
class: logging.FileHandler
|
| 98 |
+
formatter: simple
|
| 99 |
+
filename: ${hydra.runtime.output_dir}/${hydra.job.name}.log
|
| 100 |
+
root:
|
| 101 |
+
level: INFO
|
| 102 |
+
handlers:
|
| 103 |
+
- console
|
| 104 |
+
- file
|
| 105 |
+
disable_existing_loggers: false
|
| 106 |
+
env: {}
|
| 107 |
+
mode: MULTIRUN
|
| 108 |
+
searchpath: []
|
| 109 |
+
callbacks: {}
|
| 110 |
+
output_subdir: .
|
| 111 |
+
overrides:
|
| 112 |
+
hydra:
|
| 113 |
+
- hydra.mode=MULTIRUN
|
| 114 |
+
task:
|
| 115 |
+
- algorithm=sb3_sac
|
| 116 |
+
- env_id=RBC3D-hard-v0
|
| 117 |
+
- rl_mode=marl
|
| 118 |
+
- seed=1
|
| 119 |
+
job:
|
| 120 |
+
name: test_sb3
|
| 121 |
+
chdir: true
|
| 122 |
+
override_dirname: algorithm=sb3_sac,env_id=RBC3D-hard-v0,rl_mode=marl,seed=1
|
| 123 |
+
id: '0'
|
| 124 |
+
num: 0
|
| 125 |
+
config_name: test_sb3
|
| 126 |
+
env_set: {}
|
| 127 |
+
env_copy: []
|
| 128 |
+
config:
|
| 129 |
+
override_dirname:
|
| 130 |
+
kv_sep: '='
|
| 131 |
+
item_sep: ','
|
| 132 |
+
exclude_keys: []
|
| 133 |
+
runtime:
|
| 134 |
+
version: 1.3.2
|
| 135 |
+
version_base: '1.3'
|
| 136 |
+
cwd: /cephfs/users/becktepe/git_projects/FluidGym
|
| 137 |
+
config_sources:
|
| 138 |
+
- path: hydra.conf
|
| 139 |
+
schema: pkg
|
| 140 |
+
provider: hydra
|
| 141 |
+
- path: /cephfs/users/becktepe/git_projects/FluidGym/runscripts/configs
|
| 142 |
+
schema: file
|
| 143 |
+
provider: main
|
| 144 |
+
- path: hydra_plugins.hydra_colorlog.conf
|
| 145 |
+
schema: pkg
|
| 146 |
+
provider: hydra-colorlog
|
| 147 |
+
- path: ''
|
| 148 |
+
schema: structured
|
| 149 |
+
provider: schema
|
| 150 |
+
output_dir: /cephfs/users/becktepe/git_projects/FluidGym/output/training/marl/RBC3D-hard-v0/SAC/1
|
| 151 |
+
choices:
|
| 152 |
+
cluster: local
|
| 153 |
+
algorithm: sb3_sac
|
| 154 |
+
hydra/env: default
|
| 155 |
+
hydra/callbacks: null
|
| 156 |
+
hydra/job_logging: default
|
| 157 |
+
hydra/hydra_logging: default
|
| 158 |
+
hydra/hydra_help: default
|
| 159 |
+
hydra/help: default
|
| 160 |
+
hydra/sweeper: basic
|
| 161 |
+
hydra/launcher: basic
|
| 162 |
+
hydra/output: default
|
| 163 |
+
verbose: false
|
1/multirun.yaml
ADDED
|
@@ -0,0 +1,223 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
hydra:
|
| 2 |
+
run:
|
| 3 |
+
dir: output/training/${rl_mode}/${env_id}/${algorithm.name}/${seed}
|
| 4 |
+
sweep:
|
| 5 |
+
dir: output/training/${rl_mode}/${env_id}/${algorithm.name}/${seed}
|
| 6 |
+
subdir: ''
|
| 7 |
+
launcher:
|
| 8 |
+
_target_: hydra._internal.core_plugins.basic_launcher.BasicLauncher
|
| 9 |
+
sweeper:
|
| 10 |
+
_target_: hydra._internal.core_plugins.basic_sweeper.BasicSweeper
|
| 11 |
+
max_batch_size: null
|
| 12 |
+
params: null
|
| 13 |
+
help:
|
| 14 |
+
app_name: ${hydra.job.name}
|
| 15 |
+
header: '${hydra.help.app_name} is powered by Hydra.
|
| 16 |
+
|
| 17 |
+
'
|
| 18 |
+
footer: 'Powered by Hydra (https://hydra.cc)
|
| 19 |
+
|
| 20 |
+
Use --hydra-help to view Hydra specific help
|
| 21 |
+
|
| 22 |
+
'
|
| 23 |
+
template: '${hydra.help.header}
|
| 24 |
+
|
| 25 |
+
== Configuration groups ==
|
| 26 |
+
|
| 27 |
+
Compose your configuration from those groups (group=option)
|
| 28 |
+
|
| 29 |
+
|
| 30 |
+
$APP_CONFIG_GROUPS
|
| 31 |
+
|
| 32 |
+
|
| 33 |
+
== Config ==
|
| 34 |
+
|
| 35 |
+
Override anything in the config (foo.bar=value)
|
| 36 |
+
|
| 37 |
+
|
| 38 |
+
$CONFIG
|
| 39 |
+
|
| 40 |
+
|
| 41 |
+
${hydra.help.footer}
|
| 42 |
+
|
| 43 |
+
'
|
| 44 |
+
hydra_help:
|
| 45 |
+
template: 'Hydra (${hydra.runtime.version})
|
| 46 |
+
|
| 47 |
+
See https://hydra.cc for more info.
|
| 48 |
+
|
| 49 |
+
|
| 50 |
+
== Flags ==
|
| 51 |
+
|
| 52 |
+
$FLAGS_HELP
|
| 53 |
+
|
| 54 |
+
|
| 55 |
+
== Configuration groups ==
|
| 56 |
+
|
| 57 |
+
Compose your configuration from those groups (For example, append hydra/job_logging=disabled
|
| 58 |
+
to command line)
|
| 59 |
+
|
| 60 |
+
|
| 61 |
+
$HYDRA_CONFIG_GROUPS
|
| 62 |
+
|
| 63 |
+
|
| 64 |
+
Use ''--cfg hydra'' to Show the Hydra config.
|
| 65 |
+
|
| 66 |
+
'
|
| 67 |
+
hydra_help: ???
|
| 68 |
+
hydra_logging:
|
| 69 |
+
version: 1
|
| 70 |
+
formatters:
|
| 71 |
+
simple:
|
| 72 |
+
format: '[%(asctime)s][HYDRA] %(message)s'
|
| 73 |
+
handlers:
|
| 74 |
+
console:
|
| 75 |
+
class: logging.StreamHandler
|
| 76 |
+
formatter: simple
|
| 77 |
+
stream: ext://sys.stdout
|
| 78 |
+
root:
|
| 79 |
+
level: INFO
|
| 80 |
+
handlers:
|
| 81 |
+
- console
|
| 82 |
+
loggers:
|
| 83 |
+
logging_example:
|
| 84 |
+
level: DEBUG
|
| 85 |
+
disable_existing_loggers: false
|
| 86 |
+
job_logging:
|
| 87 |
+
version: 1
|
| 88 |
+
formatters:
|
| 89 |
+
simple:
|
| 90 |
+
format: '[%(asctime)s][%(name)s][%(levelname)s] - %(message)s'
|
| 91 |
+
handlers:
|
| 92 |
+
console:
|
| 93 |
+
class: logging.StreamHandler
|
| 94 |
+
formatter: simple
|
| 95 |
+
stream: ext://sys.stdout
|
| 96 |
+
file:
|
| 97 |
+
class: logging.FileHandler
|
| 98 |
+
formatter: simple
|
| 99 |
+
filename: ${hydra.runtime.output_dir}/${hydra.job.name}.log
|
| 100 |
+
root:
|
| 101 |
+
level: INFO
|
| 102 |
+
handlers:
|
| 103 |
+
- console
|
| 104 |
+
- file
|
| 105 |
+
disable_existing_loggers: false
|
| 106 |
+
env: {}
|
| 107 |
+
mode: MULTIRUN
|
| 108 |
+
searchpath: []
|
| 109 |
+
callbacks: {}
|
| 110 |
+
output_subdir: .
|
| 111 |
+
overrides:
|
| 112 |
+
hydra:
|
| 113 |
+
- hydra.mode=MULTIRUN
|
| 114 |
+
task:
|
| 115 |
+
- algorithm=sb3_sac
|
| 116 |
+
- env_id=RBC3D-hard-v0
|
| 117 |
+
- rl_mode=marl
|
| 118 |
+
- seed=1
|
| 119 |
+
job:
|
| 120 |
+
name: test_sb3
|
| 121 |
+
chdir: true
|
| 122 |
+
override_dirname: algorithm=sb3_sac,env_id=RBC3D-hard-v0,rl_mode=marl,seed=1
|
| 123 |
+
id: ???
|
| 124 |
+
num: ???
|
| 125 |
+
config_name: test_sb3
|
| 126 |
+
env_set: {}
|
| 127 |
+
env_copy: []
|
| 128 |
+
config:
|
| 129 |
+
override_dirname:
|
| 130 |
+
kv_sep: '='
|
| 131 |
+
item_sep: ','
|
| 132 |
+
exclude_keys: []
|
| 133 |
+
runtime:
|
| 134 |
+
version: 1.3.2
|
| 135 |
+
version_base: '1.3'
|
| 136 |
+
cwd: /cephfs/users/becktepe/git_projects/FluidGym
|
| 137 |
+
config_sources:
|
| 138 |
+
- path: hydra.conf
|
| 139 |
+
schema: pkg
|
| 140 |
+
provider: hydra
|
| 141 |
+
- path: /cephfs/users/becktepe/git_projects/FluidGym/runscripts/configs
|
| 142 |
+
schema: file
|
| 143 |
+
provider: main
|
| 144 |
+
- path: hydra_plugins.hydra_colorlog.conf
|
| 145 |
+
schema: pkg
|
| 146 |
+
provider: hydra-colorlog
|
| 147 |
+
- path: ''
|
| 148 |
+
schema: structured
|
| 149 |
+
provider: schema
|
| 150 |
+
output_dir: ???
|
| 151 |
+
choices:
|
| 152 |
+
cluster: local
|
| 153 |
+
algorithm: sb3_sac
|
| 154 |
+
hydra/env: default
|
| 155 |
+
hydra/callbacks: null
|
| 156 |
+
hydra/job_logging: default
|
| 157 |
+
hydra/hydra_logging: default
|
| 158 |
+
hydra/hydra_help: default
|
| 159 |
+
hydra/help: default
|
| 160 |
+
hydra/sweeper: basic
|
| 161 |
+
hydra/launcher: basic
|
| 162 |
+
hydra/output: default
|
| 163 |
+
verbose: false
|
| 164 |
+
env_id: RBC3D-hard-v0
|
| 165 |
+
env_kwargs: {}
|
| 166 |
+
eval_env_kwargs: {}
|
| 167 |
+
seed: 1
|
| 168 |
+
rl_mode: marl
|
| 169 |
+
total_timesteps: 50000.0
|
| 170 |
+
n_eval_steps: 10
|
| 171 |
+
eval_freq: ${eval:${total_timesteps} // ${n_eval_steps}}
|
| 172 |
+
n_eval_episodes: 1
|
| 173 |
+
continue_training: false
|
| 174 |
+
checkpoint_latest: true
|
| 175 |
+
rl_device: cpu
|
| 176 |
+
eval_callback:
|
| 177 |
+
_target_: fluidgym.integration.sb3.EvalCallback
|
| 178 |
+
eval_freq: ${eval_freq}
|
| 179 |
+
n_eval_episodes: ${n_eval_episodes}
|
| 180 |
+
use_wandb: ${wandb.enable}
|
| 181 |
+
checkpoint_latest: ${checkpoint_latest}
|
| 182 |
+
wandb:
|
| 183 |
+
enable: true
|
| 184 |
+
entity: safe-autonomous-systems
|
| 185 |
+
project: jbecktepe-fluidgym
|
| 186 |
+
algorithm:
|
| 187 |
+
name: SAC
|
| 188 |
+
obj:
|
| 189 |
+
_target_: stable_baselines3.sac.sac.SAC
|
| 190 |
+
policy: MlpPolicy
|
| 191 |
+
learning_rate: 0.0003
|
| 192 |
+
buffer_size: 1000000
|
| 193 |
+
learning_starts: 100
|
| 194 |
+
batch_size: 256
|
| 195 |
+
tau: 0.005
|
| 196 |
+
gamma: 0.99
|
| 197 |
+
train_freq: 1
|
| 198 |
+
gradient_steps: -1
|
| 199 |
+
action_noise: null
|
| 200 |
+
replay_buffer_class: null
|
| 201 |
+
replay_buffer_kwargs: null
|
| 202 |
+
optimize_memory_usage: false
|
| 203 |
+
ent_coef: auto
|
| 204 |
+
target_update_interval: 1
|
| 205 |
+
target_entropy: auto
|
| 206 |
+
use_sde: false
|
| 207 |
+
sde_sample_freq: -1
|
| 208 |
+
use_sde_at_warmup: false
|
| 209 |
+
stats_window_size: 100
|
| 210 |
+
tensorboard_log: null
|
| 211 |
+
policy_kwargs: {}
|
| 212 |
+
verbose: 0
|
| 213 |
+
seed: ${seed}
|
| 214 |
+
device: cuda
|
| 215 |
+
_init_setup_model: true
|
| 216 |
+
cluster: {}
|
| 217 |
+
test_env_id: ${env_id}
|
| 218 |
+
test_env_kwargs: ${env_kwargs}
|
| 219 |
+
test_rl_mode: ${rl_mode}
|
| 220 |
+
n_test_episodes: 10
|
| 221 |
+
deterministic: true
|
| 222 |
+
save_frames: true
|
| 223 |
+
render_3d: true
|
1/overrides.yaml
ADDED
|
@@ -0,0 +1,4 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
- algorithm=sb3_sac
|
| 2 |
+
- env_id=RBC3D-hard-v0
|
| 3 |
+
- rl_mode=marl
|
| 4 |
+
- seed=1
|
1/test/3d_temperature_test_eval_episode_0.gif
ADDED
|
Git LFS Details
|
1/test/test_eval_episode_0.csv
ADDED
|
The diff for this file is too large to render.
See raw diff
|
|
|
1/test/x-y-temperature_test_eval_episode_0.gif
ADDED
|
Git LFS Details
|
1/test/x-z-temperature_test_eval_episode_0.gif
ADDED
|
Git LFS Details
|
1/test/y-z-temperature_test_eval_episode_0.gif
ADDED
|
Git LFS Details
|
1/training_log.csv
ADDED
|
@@ -0,0 +1,111 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
step,training/mean_reward,training/mean_global_reward,training/mean_nusselt,evaluation/mean_nusselt,evaluation/mean_reward
|
| 2 |
+
500,0.11955216526985168,0.11955216455459594,2.5643808550834657,,
|
| 3 |
+
1000,0.2615123391151428,0.2615123200416565,2.422420699596405,,
|
| 4 |
+
1500,0.3377384543418884,0.3377384281158447,2.3461945915222167,,
|
| 5 |
+
2000,0.37330174446105957,0.3733017725944519,2.3106312470436094,,
|
| 6 |
+
2500,0.36323750019073486,0.3632375411987305,2.320695478439331,,
|
| 7 |
+
3000,0.38001587986946106,0.38001586723327635,2.303917152404785,,
|
| 8 |
+
3500,0.3918974697589874,0.39189748859405515,2.2920355310440064,,
|
| 9 |
+
4000,0.37987634539604187,0.37987632036209107,2.3040566992759706,,
|
| 10 |
+
4500,0.3700489401817322,0.370048969745636,2.3138840498924256,,
|
| 11 |
+
5000,0.35506853461265564,0.3550685710906982,2.328864448547363,,
|
| 12 |
+
5000,,,,2.3816866993904116,0.3022463321685791
|
| 13 |
+
5500,0.33614617586135864,0.3361461639404297,2.347786855697632,,
|
| 14 |
+
6000,0.34670740365982056,0.3467073812484741,2.3372256383895875,,
|
| 15 |
+
6500,0.33137086033821106,0.331370867729187,2.3525621519088746,,
|
| 16 |
+
7000,0.3285955786705017,0.32859555578231814,2.3553374638557436,,
|
| 17 |
+
7500,0.3073640763759613,0.30736405992507937,2.376568959712982,,
|
| 18 |
+
8000,0.2992413640022278,0.2992413635253906,2.384691656112671,,
|
| 19 |
+
8500,0.2893831729888916,0.28938315725326536,2.394549862384796,,
|
| 20 |
+
9000,0.2997531294822693,0.29975313901901246,2.3841798806190493,,
|
| 21 |
+
9500,0.28909119963645935,0.28909121704101565,2.3948418025970457,,
|
| 22 |
+
10000,0.3136785328388214,0.31367854690551755,2.370254472732544,,
|
| 23 |
+
10000,,,,2.3711638617515565,0.3127691447734833
|
| 24 |
+
10500,0.33827129006385803,0.3382712798118591,2.3456617398262023,,
|
| 25 |
+
11000,0.3373597264289856,0.337359721660614,2.3465732979774474,,
|
| 26 |
+
11500,0.339799702167511,0.33979975271224977,2.344133266925812,,
|
| 27 |
+
12000,0.3361790180206299,0.33617903375625613,2.3477539858818055,,
|
| 28 |
+
12500,0.34213846921920776,0.3421384539604187,2.3417945656776427,,
|
| 29 |
+
13000,0.33698737621307373,0.33698736619949343,2.346945653438568,,
|
| 30 |
+
13500,0.3411519527435303,0.34115195083618166,2.3427810688018798,,
|
| 31 |
+
14000,0.34138378500938416,0.341383770942688,2.3425492486953736,,
|
| 32 |
+
14500,0.33500048518180847,0.3350005259513855,2.348932493686676,,
|
| 33 |
+
15000,0.34000787138938904,0.34000788497924805,2.3439251346588135,,
|
| 34 |
+
15000,,,,2.355029064416885,0.3289039731025696
|
| 35 |
+
15500,0.3355133533477783,0.33551333999633787,2.3484196796417236,,
|
| 36 |
+
16000,0.33121979236602783,0.33121978759765625,2.352713232040405,,
|
| 37 |
+
16500,0.3411610722541809,0.3411610746383667,2.342771944999695,,
|
| 38 |
+
17000,0.34912651777267456,0.34912655210494997,2.3348064675331117,,
|
| 39 |
+
17500,0.35345301032066345,0.353453010559082,2.3304800090789795,,
|
| 40 |
+
18000,0.33646419644355774,0.3364642186164856,2.347468801021576,,
|
| 41 |
+
18500,0.347053587436676,0.34705356454849245,2.3368794550895693,,
|
| 42 |
+
19000,0.36115509271621704,0.3611551032066345,2.322777916431427,,
|
| 43 |
+
19500,0.33294478058815,0.3329448113441467,2.3509882082939146,,
|
| 44 |
+
20000,0.32412096858024597,0.32412095689773557,2.359812062740326,,
|
| 45 |
+
20000,,,,2.399965113401413,0.28396788239479065
|
| 46 |
+
20500,0.34134143590927124,0.3413414454460144,2.3425915741920473,,
|
| 47 |
+
21000,0.3464898467063904,0.34648982429504394,2.3374431953430177,,
|
| 48 |
+
21500,0.3400173783302307,0.34001737213134764,2.343915647506714,,
|
| 49 |
+
22000,0.33312350511550903,0.3331235122680664,2.3508095073699953,,
|
| 50 |
+
22500,0.34015417098999023,0.34015420913696287,2.3437788105010986,,
|
| 51 |
+
23000,0.3434748351573944,0.3434748573303223,2.340458162307739,,
|
| 52 |
+
23500,0.33854857087135315,0.3385485758781433,2.3453844437599183,,
|
| 53 |
+
24000,0.3371656537055969,0.3371656594276428,2.3467673602104187,,
|
| 54 |
+
24500,0.28274548053741455,0.2827455143928528,2.4011875052452085,,
|
| 55 |
+
25000,0.24586331844329834,0.24586332702636718,2.4380696926116943,,
|
| 56 |
+
25000,,,,2.302274807691574,0.3816582262516022
|
| 57 |
+
25500,0.3714216351509094,0.3714216103553772,2.3125114092826844,,
|
| 58 |
+
26000,0.3670129179954529,0.36701288414001465,2.316920135498047,,
|
| 59 |
+
26500,0.3348219096660614,0.33482186365127564,2.349111155986786,,
|
| 60 |
+
27000,0.33147895336151123,0.33147893142700197,2.3524540882110596,,
|
| 61 |
+
27500,0.3068658411502838,0.3068658447265625,2.377067174911499,,
|
| 62 |
+
28000,0.3133977949619293,0.3133977737426758,2.3705352458953857,,
|
| 63 |
+
28500,0.31069982051849365,0.3106998443603516,2.37323317527771,,
|
| 64 |
+
29000,0.3036830425262451,0.3036830406188965,2.380249979019165,,
|
| 65 |
+
29500,0.31775617599487305,0.31775613689422605,2.3661768827438356,,
|
| 66 |
+
30000,0.294028103351593,0.29402814531326293,2.3899048743247984,,
|
| 67 |
+
30000,,,,2.3480421018600466,0.33589091897010803
|
| 68 |
+
30500,0.2896604537963867,0.28966043949127196,2.3942725801467897,,
|
| 69 |
+
31000,0.2767109274864197,0.2767109642028809,2.407222055435181,,
|
| 70 |
+
31500,0.3014404773712158,0.3014404816627502,2.3824925379753115,,
|
| 71 |
+
32000,0.32920220494270325,0.32920223712921143,2.35473078250885,,
|
| 72 |
+
32500,0.31586503982543945,0.31586507844924927,2.368067941188812,,
|
| 73 |
+
33000,0.3175763487815857,0.3175763926506042,2.366356626987457,,
|
| 74 |
+
33500,0.3188968598842621,0.31889684200286866,2.3650361776351927,,
|
| 75 |
+
34000,0.32870402932167053,0.3287040286064148,2.355228991031647,,
|
| 76 |
+
34500,0.3249926269054413,0.32499262857437133,2.3589403910636904,,
|
| 77 |
+
35000,0.32589104771614075,0.3258910756111145,2.358041944026947,,
|
| 78 |
+
35000,,,,2.465165927410126,0.21876709163188934
|
| 79 |
+
35500,0.3195328712463379,0.3195328459739685,2.364400173664093,,
|
| 80 |
+
36000,0.3255794644355774,0.32557948493957517,2.3583535346984865,,
|
| 81 |
+
36500,0.3027646839618683,0.30276466941833496,2.3811683502197267,,
|
| 82 |
+
37000,0.28240832686424255,0.28240830898284913,2.4015247106552122,,
|
| 83 |
+
37500,0.2972622811794281,0.29726228380203246,2.386670735836029,,
|
| 84 |
+
38000,0.3105317950248718,0.31053178215026855,2.373401237487793,,
|
| 85 |
+
38500,0.3141724765300751,0.31417247438430784,2.3697605452537536,,
|
| 86 |
+
39000,0.3135026693344116,0.31350266408920285,2.3704303555488586,,
|
| 87 |
+
39500,0.3019282817840576,0.3019282999038696,2.382004719734192,,
|
| 88 |
+
40000,0.29805266857147217,0.2980526561737061,2.3858803634643553,,
|
| 89 |
+
40000,,,,2.396221239566803,0.2877117693424225
|
| 90 |
+
40500,0.29082605242729187,0.2908260521888733,2.3931069674491883,,
|
| 91 |
+
41000,0.27740898728370667,0.2774090142250061,2.4065240054130554,,
|
| 92 |
+
41500,0.25735801458358765,0.2573580346107483,2.426574985027313,,
|
| 93 |
+
42000,0.287665992975235,0.28766596841812136,2.39626705121994,,
|
| 94 |
+
42500,0.29726848006248474,0.2972684669494629,2.3866645526885986,,
|
| 95 |
+
43000,0.25463393330574036,0.2546339259147644,2.429299093723297,,
|
| 96 |
+
43500,0.2344123125076294,0.23441230821609496,2.4495207114219664,,
|
| 97 |
+
44000,0.3314891755580902,0.3314891486167908,2.3524438710212707,,
|
| 98 |
+
44500,0.2331017702817917,0.23310177326202391,2.4508312463760378,,
|
| 99 |
+
45000,0.26750460267066956,0.2675046000480652,2.4164284195899963,,
|
| 100 |
+
45000,,,,2.4435568797588347,0.24037612974643707
|
| 101 |
+
45500,0.29665470123291016,0.29665470886230466,2.387278310775757,,
|
| 102 |
+
46000,0.328882098197937,0.3288821029663086,2.355050916671753,,
|
| 103 |
+
46500,0.3211514353752136,0.32115139389038083,2.362781625747681,,
|
| 104 |
+
47000,0.3332333266735077,0.33323332452774046,2.350699695110321,,
|
| 105 |
+
47500,0.3087298572063446,0.3087298717498779,2.3752031478881834,,
|
| 106 |
+
48000,0.31843793392181396,0.31843794441223144,2.36549507522583,,
|
| 107 |
+
48500,0.3035736680030823,0.3035736632347107,2.3803593564033507,,
|
| 108 |
+
49000,0.2835811674594879,0.2835812072753906,2.400351812362671,,
|
| 109 |
+
49500,0.2730940580368042,0.2730941023826599,2.4108389172554014,,
|
| 110 |
+
50000,0.28016120195388794,0.28016119718551635,2.403771822452545,,
|
| 111 |
+
50000,,,,2.4074159145355223,0.2765170931816101
|
2/ckpt_latest.zip
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:8beff5de990e2697554a3a1b55f72db96c77ec472f4b00be93b17026216bc569
|
| 3 |
+
size 58086507
|
2/config.yaml
ADDED
|
@@ -0,0 +1,60 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
env_id: RBC3D-hard-v0
|
| 2 |
+
env_kwargs: {}
|
| 3 |
+
eval_env_kwargs: {}
|
| 4 |
+
seed: 2
|
| 5 |
+
rl_mode: marl
|
| 6 |
+
total_timesteps: 50000.0
|
| 7 |
+
n_eval_steps: 10
|
| 8 |
+
eval_freq: ${eval:${total_timesteps} // ${n_eval_steps}}
|
| 9 |
+
n_eval_episodes: 1
|
| 10 |
+
continue_training: false
|
| 11 |
+
checkpoint_latest: true
|
| 12 |
+
rl_device: cpu
|
| 13 |
+
eval_callback:
|
| 14 |
+
_target_: fluidgym.integration.sb3.EvalCallback
|
| 15 |
+
eval_freq: ${eval_freq}
|
| 16 |
+
n_eval_episodes: ${n_eval_episodes}
|
| 17 |
+
use_wandb: ${wandb.enable}
|
| 18 |
+
checkpoint_latest: ${checkpoint_latest}
|
| 19 |
+
wandb:
|
| 20 |
+
enable: true
|
| 21 |
+
entity: safe-autonomous-systems
|
| 22 |
+
project: jbecktepe-fluidgym
|
| 23 |
+
algorithm:
|
| 24 |
+
name: SAC
|
| 25 |
+
obj:
|
| 26 |
+
_target_: stable_baselines3.sac.sac.SAC
|
| 27 |
+
policy: MlpPolicy
|
| 28 |
+
learning_rate: 0.0003
|
| 29 |
+
buffer_size: 1000000
|
| 30 |
+
learning_starts: 100
|
| 31 |
+
batch_size: 256
|
| 32 |
+
tau: 0.005
|
| 33 |
+
gamma: 0.99
|
| 34 |
+
train_freq: 1
|
| 35 |
+
gradient_steps: -1
|
| 36 |
+
action_noise: null
|
| 37 |
+
replay_buffer_class: null
|
| 38 |
+
replay_buffer_kwargs: null
|
| 39 |
+
optimize_memory_usage: false
|
| 40 |
+
ent_coef: auto
|
| 41 |
+
target_update_interval: 1
|
| 42 |
+
target_entropy: auto
|
| 43 |
+
use_sde: false
|
| 44 |
+
sde_sample_freq: -1
|
| 45 |
+
use_sde_at_warmup: false
|
| 46 |
+
stats_window_size: 100
|
| 47 |
+
tensorboard_log: null
|
| 48 |
+
policy_kwargs: {}
|
| 49 |
+
verbose: 0
|
| 50 |
+
seed: ${seed}
|
| 51 |
+
device: cuda
|
| 52 |
+
_init_setup_model: true
|
| 53 |
+
cluster: {}
|
| 54 |
+
test_env_id: ${env_id}
|
| 55 |
+
test_env_kwargs: ${env_kwargs}
|
| 56 |
+
test_rl_mode: ${rl_mode}
|
| 57 |
+
n_test_episodes: 10
|
| 58 |
+
deterministic: true
|
| 59 |
+
save_frames: true
|
| 60 |
+
render_3d: true
|
2/hydra.yaml
ADDED
|
@@ -0,0 +1,163 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
hydra:
|
| 2 |
+
run:
|
| 3 |
+
dir: output/training/${rl_mode}/${env_id}/${algorithm.name}/${seed}
|
| 4 |
+
sweep:
|
| 5 |
+
dir: output/training/${rl_mode}/${env_id}/${algorithm.name}/${seed}
|
| 6 |
+
subdir: ''
|
| 7 |
+
launcher:
|
| 8 |
+
_target_: hydra._internal.core_plugins.basic_launcher.BasicLauncher
|
| 9 |
+
sweeper:
|
| 10 |
+
_target_: hydra._internal.core_plugins.basic_sweeper.BasicSweeper
|
| 11 |
+
max_batch_size: null
|
| 12 |
+
params: null
|
| 13 |
+
help:
|
| 14 |
+
app_name: ${hydra.job.name}
|
| 15 |
+
header: '${hydra.help.app_name} is powered by Hydra.
|
| 16 |
+
|
| 17 |
+
'
|
| 18 |
+
footer: 'Powered by Hydra (https://hydra.cc)
|
| 19 |
+
|
| 20 |
+
Use --hydra-help to view Hydra specific help
|
| 21 |
+
|
| 22 |
+
'
|
| 23 |
+
template: '${hydra.help.header}
|
| 24 |
+
|
| 25 |
+
== Configuration groups ==
|
| 26 |
+
|
| 27 |
+
Compose your configuration from those groups (group=option)
|
| 28 |
+
|
| 29 |
+
|
| 30 |
+
$APP_CONFIG_GROUPS
|
| 31 |
+
|
| 32 |
+
|
| 33 |
+
== Config ==
|
| 34 |
+
|
| 35 |
+
Override anything in the config (foo.bar=value)
|
| 36 |
+
|
| 37 |
+
|
| 38 |
+
$CONFIG
|
| 39 |
+
|
| 40 |
+
|
| 41 |
+
${hydra.help.footer}
|
| 42 |
+
|
| 43 |
+
'
|
| 44 |
+
hydra_help:
|
| 45 |
+
template: 'Hydra (${hydra.runtime.version})
|
| 46 |
+
|
| 47 |
+
See https://hydra.cc for more info.
|
| 48 |
+
|
| 49 |
+
|
| 50 |
+
== Flags ==
|
| 51 |
+
|
| 52 |
+
$FLAGS_HELP
|
| 53 |
+
|
| 54 |
+
|
| 55 |
+
== Configuration groups ==
|
| 56 |
+
|
| 57 |
+
Compose your configuration from those groups (For example, append hydra/job_logging=disabled
|
| 58 |
+
to command line)
|
| 59 |
+
|
| 60 |
+
|
| 61 |
+
$HYDRA_CONFIG_GROUPS
|
| 62 |
+
|
| 63 |
+
|
| 64 |
+
Use ''--cfg hydra'' to Show the Hydra config.
|
| 65 |
+
|
| 66 |
+
'
|
| 67 |
+
hydra_help: ???
|
| 68 |
+
hydra_logging:
|
| 69 |
+
version: 1
|
| 70 |
+
formatters:
|
| 71 |
+
simple:
|
| 72 |
+
format: '[%(asctime)s][HYDRA] %(message)s'
|
| 73 |
+
handlers:
|
| 74 |
+
console:
|
| 75 |
+
class: logging.StreamHandler
|
| 76 |
+
formatter: simple
|
| 77 |
+
stream: ext://sys.stdout
|
| 78 |
+
root:
|
| 79 |
+
level: INFO
|
| 80 |
+
handlers:
|
| 81 |
+
- console
|
| 82 |
+
loggers:
|
| 83 |
+
logging_example:
|
| 84 |
+
level: DEBUG
|
| 85 |
+
disable_existing_loggers: false
|
| 86 |
+
job_logging:
|
| 87 |
+
version: 1
|
| 88 |
+
formatters:
|
| 89 |
+
simple:
|
| 90 |
+
format: '[%(asctime)s][%(name)s][%(levelname)s] - %(message)s'
|
| 91 |
+
handlers:
|
| 92 |
+
console:
|
| 93 |
+
class: logging.StreamHandler
|
| 94 |
+
formatter: simple
|
| 95 |
+
stream: ext://sys.stdout
|
| 96 |
+
file:
|
| 97 |
+
class: logging.FileHandler
|
| 98 |
+
formatter: simple
|
| 99 |
+
filename: ${hydra.runtime.output_dir}/${hydra.job.name}.log
|
| 100 |
+
root:
|
| 101 |
+
level: INFO
|
| 102 |
+
handlers:
|
| 103 |
+
- console
|
| 104 |
+
- file
|
| 105 |
+
disable_existing_loggers: false
|
| 106 |
+
env: {}
|
| 107 |
+
mode: MULTIRUN
|
| 108 |
+
searchpath: []
|
| 109 |
+
callbacks: {}
|
| 110 |
+
output_subdir: .
|
| 111 |
+
overrides:
|
| 112 |
+
hydra:
|
| 113 |
+
- hydra.mode=MULTIRUN
|
| 114 |
+
task:
|
| 115 |
+
- algorithm=sb3_sac
|
| 116 |
+
- env_id=RBC3D-hard-v0
|
| 117 |
+
- rl_mode=marl
|
| 118 |
+
- seed=2
|
| 119 |
+
job:
|
| 120 |
+
name: test_sb3
|
| 121 |
+
chdir: true
|
| 122 |
+
override_dirname: algorithm=sb3_sac,env_id=RBC3D-hard-v0,rl_mode=marl,seed=2
|
| 123 |
+
id: '0'
|
| 124 |
+
num: 0
|
| 125 |
+
config_name: test_sb3
|
| 126 |
+
env_set: {}
|
| 127 |
+
env_copy: []
|
| 128 |
+
config:
|
| 129 |
+
override_dirname:
|
| 130 |
+
kv_sep: '='
|
| 131 |
+
item_sep: ','
|
| 132 |
+
exclude_keys: []
|
| 133 |
+
runtime:
|
| 134 |
+
version: 1.3.2
|
| 135 |
+
version_base: '1.3'
|
| 136 |
+
cwd: /cephfs/users/becktepe/git_projects/FluidGym
|
| 137 |
+
config_sources:
|
| 138 |
+
- path: hydra.conf
|
| 139 |
+
schema: pkg
|
| 140 |
+
provider: hydra
|
| 141 |
+
- path: /cephfs/users/becktepe/git_projects/FluidGym/runscripts/configs
|
| 142 |
+
schema: file
|
| 143 |
+
provider: main
|
| 144 |
+
- path: hydra_plugins.hydra_colorlog.conf
|
| 145 |
+
schema: pkg
|
| 146 |
+
provider: hydra-colorlog
|
| 147 |
+
- path: ''
|
| 148 |
+
schema: structured
|
| 149 |
+
provider: schema
|
| 150 |
+
output_dir: /cephfs/users/becktepe/git_projects/FluidGym/output/training/marl/RBC3D-hard-v0/SAC/2
|
| 151 |
+
choices:
|
| 152 |
+
cluster: local
|
| 153 |
+
algorithm: sb3_sac
|
| 154 |
+
hydra/env: default
|
| 155 |
+
hydra/callbacks: null
|
| 156 |
+
hydra/job_logging: default
|
| 157 |
+
hydra/hydra_logging: default
|
| 158 |
+
hydra/hydra_help: default
|
| 159 |
+
hydra/help: default
|
| 160 |
+
hydra/sweeper: basic
|
| 161 |
+
hydra/launcher: basic
|
| 162 |
+
hydra/output: default
|
| 163 |
+
verbose: false
|
2/multirun.yaml
ADDED
|
@@ -0,0 +1,223 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
hydra:
|
| 2 |
+
run:
|
| 3 |
+
dir: output/training/${rl_mode}/${env_id}/${algorithm.name}/${seed}
|
| 4 |
+
sweep:
|
| 5 |
+
dir: output/training/${rl_mode}/${env_id}/${algorithm.name}/${seed}
|
| 6 |
+
subdir: ''
|
| 7 |
+
launcher:
|
| 8 |
+
_target_: hydra._internal.core_plugins.basic_launcher.BasicLauncher
|
| 9 |
+
sweeper:
|
| 10 |
+
_target_: hydra._internal.core_plugins.basic_sweeper.BasicSweeper
|
| 11 |
+
max_batch_size: null
|
| 12 |
+
params: null
|
| 13 |
+
help:
|
| 14 |
+
app_name: ${hydra.job.name}
|
| 15 |
+
header: '${hydra.help.app_name} is powered by Hydra.
|
| 16 |
+
|
| 17 |
+
'
|
| 18 |
+
footer: 'Powered by Hydra (https://hydra.cc)
|
| 19 |
+
|
| 20 |
+
Use --hydra-help to view Hydra specific help
|
| 21 |
+
|
| 22 |
+
'
|
| 23 |
+
template: '${hydra.help.header}
|
| 24 |
+
|
| 25 |
+
== Configuration groups ==
|
| 26 |
+
|
| 27 |
+
Compose your configuration from those groups (group=option)
|
| 28 |
+
|
| 29 |
+
|
| 30 |
+
$APP_CONFIG_GROUPS
|
| 31 |
+
|
| 32 |
+
|
| 33 |
+
== Config ==
|
| 34 |
+
|
| 35 |
+
Override anything in the config (foo.bar=value)
|
| 36 |
+
|
| 37 |
+
|
| 38 |
+
$CONFIG
|
| 39 |
+
|
| 40 |
+
|
| 41 |
+
${hydra.help.footer}
|
| 42 |
+
|
| 43 |
+
'
|
| 44 |
+
hydra_help:
|
| 45 |
+
template: 'Hydra (${hydra.runtime.version})
|
| 46 |
+
|
| 47 |
+
See https://hydra.cc for more info.
|
| 48 |
+
|
| 49 |
+
|
| 50 |
+
== Flags ==
|
| 51 |
+
|
| 52 |
+
$FLAGS_HELP
|
| 53 |
+
|
| 54 |
+
|
| 55 |
+
== Configuration groups ==
|
| 56 |
+
|
| 57 |
+
Compose your configuration from those groups (For example, append hydra/job_logging=disabled
|
| 58 |
+
to command line)
|
| 59 |
+
|
| 60 |
+
|
| 61 |
+
$HYDRA_CONFIG_GROUPS
|
| 62 |
+
|
| 63 |
+
|
| 64 |
+
Use ''--cfg hydra'' to Show the Hydra config.
|
| 65 |
+
|
| 66 |
+
'
|
| 67 |
+
hydra_help: ???
|
| 68 |
+
hydra_logging:
|
| 69 |
+
version: 1
|
| 70 |
+
formatters:
|
| 71 |
+
simple:
|
| 72 |
+
format: '[%(asctime)s][HYDRA] %(message)s'
|
| 73 |
+
handlers:
|
| 74 |
+
console:
|
| 75 |
+
class: logging.StreamHandler
|
| 76 |
+
formatter: simple
|
| 77 |
+
stream: ext://sys.stdout
|
| 78 |
+
root:
|
| 79 |
+
level: INFO
|
| 80 |
+
handlers:
|
| 81 |
+
- console
|
| 82 |
+
loggers:
|
| 83 |
+
logging_example:
|
| 84 |
+
level: DEBUG
|
| 85 |
+
disable_existing_loggers: false
|
| 86 |
+
job_logging:
|
| 87 |
+
version: 1
|
| 88 |
+
formatters:
|
| 89 |
+
simple:
|
| 90 |
+
format: '[%(asctime)s][%(name)s][%(levelname)s] - %(message)s'
|
| 91 |
+
handlers:
|
| 92 |
+
console:
|
| 93 |
+
class: logging.StreamHandler
|
| 94 |
+
formatter: simple
|
| 95 |
+
stream: ext://sys.stdout
|
| 96 |
+
file:
|
| 97 |
+
class: logging.FileHandler
|
| 98 |
+
formatter: simple
|
| 99 |
+
filename: ${hydra.runtime.output_dir}/${hydra.job.name}.log
|
| 100 |
+
root:
|
| 101 |
+
level: INFO
|
| 102 |
+
handlers:
|
| 103 |
+
- console
|
| 104 |
+
- file
|
| 105 |
+
disable_existing_loggers: false
|
| 106 |
+
env: {}
|
| 107 |
+
mode: MULTIRUN
|
| 108 |
+
searchpath: []
|
| 109 |
+
callbacks: {}
|
| 110 |
+
output_subdir: .
|
| 111 |
+
overrides:
|
| 112 |
+
hydra:
|
| 113 |
+
- hydra.mode=MULTIRUN
|
| 114 |
+
task:
|
| 115 |
+
- algorithm=sb3_sac
|
| 116 |
+
- env_id=RBC3D-hard-v0
|
| 117 |
+
- rl_mode=marl
|
| 118 |
+
- seed=2
|
| 119 |
+
job:
|
| 120 |
+
name: test_sb3
|
| 121 |
+
chdir: true
|
| 122 |
+
override_dirname: algorithm=sb3_sac,env_id=RBC3D-hard-v0,rl_mode=marl,seed=2
|
| 123 |
+
id: ???
|
| 124 |
+
num: ???
|
| 125 |
+
config_name: test_sb3
|
| 126 |
+
env_set: {}
|
| 127 |
+
env_copy: []
|
| 128 |
+
config:
|
| 129 |
+
override_dirname:
|
| 130 |
+
kv_sep: '='
|
| 131 |
+
item_sep: ','
|
| 132 |
+
exclude_keys: []
|
| 133 |
+
runtime:
|
| 134 |
+
version: 1.3.2
|
| 135 |
+
version_base: '1.3'
|
| 136 |
+
cwd: /cephfs/users/becktepe/git_projects/FluidGym
|
| 137 |
+
config_sources:
|
| 138 |
+
- path: hydra.conf
|
| 139 |
+
schema: pkg
|
| 140 |
+
provider: hydra
|
| 141 |
+
- path: /cephfs/users/becktepe/git_projects/FluidGym/runscripts/configs
|
| 142 |
+
schema: file
|
| 143 |
+
provider: main
|
| 144 |
+
- path: hydra_plugins.hydra_colorlog.conf
|
| 145 |
+
schema: pkg
|
| 146 |
+
provider: hydra-colorlog
|
| 147 |
+
- path: ''
|
| 148 |
+
schema: structured
|
| 149 |
+
provider: schema
|
| 150 |
+
output_dir: ???
|
| 151 |
+
choices:
|
| 152 |
+
cluster: local
|
| 153 |
+
algorithm: sb3_sac
|
| 154 |
+
hydra/env: default
|
| 155 |
+
hydra/callbacks: null
|
| 156 |
+
hydra/job_logging: default
|
| 157 |
+
hydra/hydra_logging: default
|
| 158 |
+
hydra/hydra_help: default
|
| 159 |
+
hydra/help: default
|
| 160 |
+
hydra/sweeper: basic
|
| 161 |
+
hydra/launcher: basic
|
| 162 |
+
hydra/output: default
|
| 163 |
+
verbose: false
|
| 164 |
+
env_id: RBC3D-hard-v0
|
| 165 |
+
env_kwargs: {}
|
| 166 |
+
eval_env_kwargs: {}
|
| 167 |
+
seed: 2
|
| 168 |
+
rl_mode: marl
|
| 169 |
+
total_timesteps: 50000.0
|
| 170 |
+
n_eval_steps: 10
|
| 171 |
+
eval_freq: ${eval:${total_timesteps} // ${n_eval_steps}}
|
| 172 |
+
n_eval_episodes: 1
|
| 173 |
+
continue_training: false
|
| 174 |
+
checkpoint_latest: true
|
| 175 |
+
rl_device: cpu
|
| 176 |
+
eval_callback:
|
| 177 |
+
_target_: fluidgym.integration.sb3.EvalCallback
|
| 178 |
+
eval_freq: ${eval_freq}
|
| 179 |
+
n_eval_episodes: ${n_eval_episodes}
|
| 180 |
+
use_wandb: ${wandb.enable}
|
| 181 |
+
checkpoint_latest: ${checkpoint_latest}
|
| 182 |
+
wandb:
|
| 183 |
+
enable: true
|
| 184 |
+
entity: safe-autonomous-systems
|
| 185 |
+
project: jbecktepe-fluidgym
|
| 186 |
+
algorithm:
|
| 187 |
+
name: SAC
|
| 188 |
+
obj:
|
| 189 |
+
_target_: stable_baselines3.sac.sac.SAC
|
| 190 |
+
policy: MlpPolicy
|
| 191 |
+
learning_rate: 0.0003
|
| 192 |
+
buffer_size: 1000000
|
| 193 |
+
learning_starts: 100
|
| 194 |
+
batch_size: 256
|
| 195 |
+
tau: 0.005
|
| 196 |
+
gamma: 0.99
|
| 197 |
+
train_freq: 1
|
| 198 |
+
gradient_steps: -1
|
| 199 |
+
action_noise: null
|
| 200 |
+
replay_buffer_class: null
|
| 201 |
+
replay_buffer_kwargs: null
|
| 202 |
+
optimize_memory_usage: false
|
| 203 |
+
ent_coef: auto
|
| 204 |
+
target_update_interval: 1
|
| 205 |
+
target_entropy: auto
|
| 206 |
+
use_sde: false
|
| 207 |
+
sde_sample_freq: -1
|
| 208 |
+
use_sde_at_warmup: false
|
| 209 |
+
stats_window_size: 100
|
| 210 |
+
tensorboard_log: null
|
| 211 |
+
policy_kwargs: {}
|
| 212 |
+
verbose: 0
|
| 213 |
+
seed: ${seed}
|
| 214 |
+
device: cuda
|
| 215 |
+
_init_setup_model: true
|
| 216 |
+
cluster: {}
|
| 217 |
+
test_env_id: ${env_id}
|
| 218 |
+
test_env_kwargs: ${env_kwargs}
|
| 219 |
+
test_rl_mode: ${rl_mode}
|
| 220 |
+
n_test_episodes: 10
|
| 221 |
+
deterministic: true
|
| 222 |
+
save_frames: true
|
| 223 |
+
render_3d: true
|
2/overrides.yaml
ADDED
|
@@ -0,0 +1,4 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
- algorithm=sb3_sac
|
| 2 |
+
- env_id=RBC3D-hard-v0
|
| 3 |
+
- rl_mode=marl
|
| 4 |
+
- seed=2
|
2/test/3d_temperature_test_eval_episode_0.gif
ADDED
|
Git LFS Details
|
2/test/test_eval_episode_0.csv
ADDED
|
The diff for this file is too large to render.
See raw diff
|
|
|
2/test/x-y-temperature_test_eval_episode_0.gif
ADDED
|
Git LFS Details
|
2/test/x-z-temperature_test_eval_episode_0.gif
ADDED
|
Git LFS Details
|
2/test/y-z-temperature_test_eval_episode_0.gif
ADDED
|
Git LFS Details
|
2/training_log.csv
ADDED
|
@@ -0,0 +1,111 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
step,training/mean_reward,training/mean_global_reward,training/mean_nusselt,evaluation/mean_nusselt,evaluation/mean_reward
|
| 2 |
+
500,0.09883884340524673,0.0988388442993164,2.585094175338745,,
|
| 3 |
+
1000,0.31514814496040344,0.3151481204032898,2.3687848992347718,,
|
| 4 |
+
1500,0.33801695704460144,0.3380170159339905,2.345916003704071,,
|
| 5 |
+
2000,0.38077467679977417,0.3807747039794922,2.3031583156585693,,
|
| 6 |
+
2500,0.3784728944301605,0.3784729166030884,2.305460103034973,,
|
| 7 |
+
3000,0.3847574293613434,0.38475741815567016,2.2991756014823914,,
|
| 8 |
+
3500,0.3974042236804962,0.39740422868728636,2.286528790950775,,
|
| 9 |
+
4000,0.4110168516635895,0.4110168652534485,2.272916154384613,,
|
| 10 |
+
4500,0.4114917516708374,0.4114917583465576,2.2724412612915037,,
|
| 11 |
+
5000,0.4106045365333557,0.41060451984405516,2.2733284997940064,,
|
| 12 |
+
5000,,,,2.2744255661964417,0.4095074534416199
|
| 13 |
+
5500,0.42030635476112366,0.4203063464164734,2.263626673221588,,
|
| 14 |
+
6000,0.415286660194397,0.415286648273468,2.2686463713645937,,
|
| 15 |
+
6500,0.41055455803871155,0.4105545616149902,2.273378458023071,,
|
| 16 |
+
7000,0.4037080407142639,0.4037080507278442,2.2802249689102174,,
|
| 17 |
+
7500,0.42395445704460144,0.42395447397232056,2.259978545665741,,
|
| 18 |
+
8000,0.43119844794273376,0.43119848823547363,2.252734531402588,,
|
| 19 |
+
8500,0.4119945168495178,0.4119944944381714,2.2719385251998903,,
|
| 20 |
+
9000,0.4096094071865082,0.40960938930511476,2.2743236303329466,,
|
| 21 |
+
9500,0.3941054046154022,0.39410541534423826,2.2898276042938233,,
|
| 22 |
+
10000,0.39230266213417053,0.39230269384384153,2.29163032579422,,
|
| 23 |
+
10000,,,,2.2967470610141754,0.3871859908103943
|
| 24 |
+
10500,0.3908345401287079,0.39083454418182373,2.2930984754562376,,
|
| 25 |
+
11000,0.3723529577255249,0.37235297536849976,2.311580044269562,,
|
| 26 |
+
11500,0.3703734874725342,0.37037346839904783,2.3135595512390137,,
|
| 27 |
+
12000,0.39386749267578125,0.3938675022125244,2.2900655174255373,,
|
| 28 |
+
12500,0.38508328795433044,0.38508330392837525,2.2988497157096863,,
|
| 29 |
+
13000,0.38810205459594727,0.3881020317077637,2.295830987930298,,
|
| 30 |
+
13500,0.3790167272090912,0.3790166926383972,2.304916326999664,,
|
| 31 |
+
14000,0.39240747690200806,0.39240752696990966,2.2915254926681516,,
|
| 32 |
+
14500,0.3993660807609558,0.39936610651016236,2.2845669131278994,,
|
| 33 |
+
15000,0.4016115367412567,0.40161154794692994,2.2823214716911315,,
|
| 34 |
+
15000,,,,2.3128393161296845,0.3710936903953552
|
| 35 |
+
15500,0.38930046558380127,0.38930046606063845,2.294632553577423,,
|
| 36 |
+
16000,0.3958090841770172,0.39580912685394287,2.2881238927841188,,
|
| 37 |
+
16500,0.3815975487232208,0.3815975503921509,2.302335469245911,,
|
| 38 |
+
17000,0.3898243010044098,0.38982433938980104,2.2941086802482604,,
|
| 39 |
+
17500,0.40535253286361694,0.4053525538444519,2.2785804657936097,,
|
| 40 |
+
18000,0.3477639853954315,0.34776399469375613,2.3361690249443052,,
|
| 41 |
+
18500,0.36096417903900146,0.3609641675949097,2.322968852043152,,
|
| 42 |
+
19000,0.36969780921936035,0.36969781970977783,2.3142351999282837,,
|
| 43 |
+
19500,0.3604229688644409,0.36042299032211306,2.3235100293159485,,
|
| 44 |
+
20000,0.3453044593334198,0.3453044781684875,2.338628541469574,,
|
| 45 |
+
20000,,,,2.325555741786957,0.35837727785110474
|
| 46 |
+
20500,0.39089685678482056,0.39089686822891234,2.293036151409149,,
|
| 47 |
+
21000,0.4304860234260559,0.43048596334457395,2.2534470562934876,,
|
| 48 |
+
21500,0.42426207661628723,0.42426207542419436,2.2596709442138674,,
|
| 49 |
+
22000,0.38556018471717834,0.3855601763725281,2.2983728432655335,,
|
| 50 |
+
22500,0.40029409527778625,0.4002940945625305,2.283638925075531,,
|
| 51 |
+
23000,0.4676303565502167,0.4676303882598877,2.216302631378174,,
|
| 52 |
+
23500,0.3802143633365631,0.38021436929702757,2.303718650341034,,
|
| 53 |
+
24000,0.38708698749542236,0.38708698987960816,2.2968460297584534,,
|
| 54 |
+
24500,0.38168323040008545,0.3816832542419434,2.3022497653961183,,
|
| 55 |
+
25000,0.352658212184906,0.35265819263458253,2.331274827003479,,
|
| 56 |
+
25000,,,,2.264131404161453,0.41980162262916565
|
| 57 |
+
25500,0.37030816078186035,0.3703081521987915,2.31362486743927,,
|
| 58 |
+
26000,0.37340614199638367,0.37340612411499025,2.310526895523071,,
|
| 59 |
+
26500,0.3665284514427185,0.3665284695625305,2.317404550075531,,
|
| 60 |
+
27000,0.3480551242828369,0.3480551266670227,2.335877892971039,,
|
| 61 |
+
27500,0.3381863236427307,0.3381863284111023,2.3457466912269593,,
|
| 62 |
+
28000,0.33318424224853516,0.3331842279434204,2.3507487916946412,,
|
| 63 |
+
28500,0.34999334812164307,0.34999338817596437,2.3339396314620973,,
|
| 64 |
+
29000,0.3612307012081146,0.36123069190979,2.3227023277282717,,
|
| 65 |
+
29500,0.3560679852962494,0.35606797409057617,2.3278650455474854,,
|
| 66 |
+
30000,0.3487584888935089,0.3487584753036499,2.3351745443344116,,
|
| 67 |
+
30000,,,,2.3420548593997954,0.341878205537796
|
| 68 |
+
30500,0.3242737352848053,0.32427372121810916,2.3596592984199525,,
|
| 69 |
+
31000,0.3269742429256439,0.3269742169380188,2.3569588027000425,,
|
| 70 |
+
31500,0.331946462392807,0.33194647884368894,2.3519865407943725,,
|
| 71 |
+
32000,0.3538981080055237,0.3538981385231018,2.3300348811149596,,
|
| 72 |
+
32500,0.3361845910549164,0.3361846041679382,2.3477484154701234,,
|
| 73 |
+
33000,0.3243791460990906,0.32437916040420534,2.359553859233856,,
|
| 74 |
+
33500,0.35682880878448486,0.356828773021698,2.3271042466163636,,
|
| 75 |
+
34000,0.34993278980255127,0.349932758808136,2.3340002608299257,,
|
| 76 |
+
34500,0.31978052854537964,0.3197805066108704,2.364152513027191,,
|
| 77 |
+
35000,0.3265296518802643,0.3265296669006348,2.357403352737427,,
|
| 78 |
+
35000,,,,2.305757747888565,0.3781752586364746
|
| 79 |
+
35500,0.33830732107162476,0.3383073091506958,2.345625710487366,,
|
| 80 |
+
36000,0.34578052163124084,0.34578050184249876,2.338152517795563,,
|
| 81 |
+
36500,0.33739808201789856,0.33739806747436524,2.3465349521636965,,
|
| 82 |
+
37000,0.31067517399787903,0.31067513799667357,2.373257881641388,,
|
| 83 |
+
37500,0.2901448607444763,0.29014485216140745,2.393788167476654,,
|
| 84 |
+
38000,0.3599267601966858,0.3599267597198486,2.324006259918213,,
|
| 85 |
+
38500,0.3697894811630249,0.3697894673347473,2.3141435523033143,,
|
| 86 |
+
39000,0.3895874619483948,0.389587450504303,2.2943455691337586,,
|
| 87 |
+
39500,0.4314839243888855,0.43148394107818605,2.2524490785598754,,
|
| 88 |
+
40000,0.3809228539466858,0.3809228916168213,2.3030101280212403,,
|
| 89 |
+
40000,,,,2.2743191039562225,0.4096139073371887
|
| 90 |
+
40500,0.4257664978504181,0.4257664966583252,2.2581665229797365,,
|
| 91 |
+
41000,0.4169514775276184,0.416951473236084,2.2669815464019774,,
|
| 92 |
+
41500,0.414630651473999,0.41463064098358154,2.26930237865448,,
|
| 93 |
+
42000,0.3985764980316162,0.3985765051841736,2.285356514453888,,
|
| 94 |
+
42500,0.4142265021800995,0.4142265286445618,2.2697064909935,,
|
| 95 |
+
43000,0.4133087992668152,0.4133087916374207,2.270624228000641,,
|
| 96 |
+
43500,0.4190700650215149,0.4190701112747192,2.2648629083633423,,
|
| 97 |
+
44000,0.40073639154434204,0.4007364230155945,2.283196596622467,,
|
| 98 |
+
44500,0.40611475706100464,0.40611470651626586,2.2778183131217955,,
|
| 99 |
+
45000,0.4028867483139038,0.4028867521286011,2.2810462675094603,,
|
| 100 |
+
45000,,,,2.309482082128525,0.3744509220123291
|
| 101 |
+
45500,0.40599700808525085,0.40599701738357546,2.277936002254486,,
|
| 102 |
+
46000,0.38081908226013184,0.3808190999031067,2.303113919734955,,
|
| 103 |
+
46500,0.4154774844646454,0.4154774484634399,2.2684555711746217,,
|
| 104 |
+
47000,0.3886411190032959,0.38864110565185545,2.295291913986206,,
|
| 105 |
+
47500,0.3956488072872162,0.39564878702163697,2.2882842326164248,,
|
| 106 |
+
48000,0.3834753632545471,0.38347538805007936,2.300457631587982,,
|
| 107 |
+
48500,0.34946689009666443,0.349466863155365,2.3344661564826965,,
|
| 108 |
+
49000,0.3620041310787201,0.36200413274765014,2.3219288868904115,,
|
| 109 |
+
49500,0.374152272939682,0.37415228128433226,2.309780738353729,,
|
| 110 |
+
50000,0.4014316499233246,0.40143164539337156,2.28250137424469,,
|
| 111 |
+
50000,,,,2.2749226665496827,0.4090103507041931
|
3/ckpt_latest.zip
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:b3980288935352966de7100a20f7cefbc7f9547ca7cc2196f1c299d4facd9aaf
|
| 3 |
+
size 58086509
|
3/config.yaml
ADDED
|
@@ -0,0 +1,60 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
env_id: RBC3D-hard-v0
|
| 2 |
+
env_kwargs: {}
|
| 3 |
+
eval_env_kwargs: {}
|
| 4 |
+
seed: 3
|
| 5 |
+
rl_mode: marl
|
| 6 |
+
total_timesteps: 50000.0
|
| 7 |
+
n_eval_steps: 10
|
| 8 |
+
eval_freq: ${eval:${total_timesteps} // ${n_eval_steps}}
|
| 9 |
+
n_eval_episodes: 1
|
| 10 |
+
continue_training: false
|
| 11 |
+
checkpoint_latest: true
|
| 12 |
+
rl_device: cpu
|
| 13 |
+
eval_callback:
|
| 14 |
+
_target_: fluidgym.integration.sb3.EvalCallback
|
| 15 |
+
eval_freq: ${eval_freq}
|
| 16 |
+
n_eval_episodes: ${n_eval_episodes}
|
| 17 |
+
use_wandb: ${wandb.enable}
|
| 18 |
+
checkpoint_latest: ${checkpoint_latest}
|
| 19 |
+
wandb:
|
| 20 |
+
enable: true
|
| 21 |
+
entity: safe-autonomous-systems
|
| 22 |
+
project: jbecktepe-fluidgym
|
| 23 |
+
algorithm:
|
| 24 |
+
name: SAC
|
| 25 |
+
obj:
|
| 26 |
+
_target_: stable_baselines3.sac.sac.SAC
|
| 27 |
+
policy: MlpPolicy
|
| 28 |
+
learning_rate: 0.0003
|
| 29 |
+
buffer_size: 1000000
|
| 30 |
+
learning_starts: 100
|
| 31 |
+
batch_size: 256
|
| 32 |
+
tau: 0.005
|
| 33 |
+
gamma: 0.99
|
| 34 |
+
train_freq: 1
|
| 35 |
+
gradient_steps: -1
|
| 36 |
+
action_noise: null
|
| 37 |
+
replay_buffer_class: null
|
| 38 |
+
replay_buffer_kwargs: null
|
| 39 |
+
optimize_memory_usage: false
|
| 40 |
+
ent_coef: auto
|
| 41 |
+
target_update_interval: 1
|
| 42 |
+
target_entropy: auto
|
| 43 |
+
use_sde: false
|
| 44 |
+
sde_sample_freq: -1
|
| 45 |
+
use_sde_at_warmup: false
|
| 46 |
+
stats_window_size: 100
|
| 47 |
+
tensorboard_log: null
|
| 48 |
+
policy_kwargs: {}
|
| 49 |
+
verbose: 0
|
| 50 |
+
seed: ${seed}
|
| 51 |
+
device: cuda
|
| 52 |
+
_init_setup_model: true
|
| 53 |
+
cluster: {}
|
| 54 |
+
test_env_id: ${env_id}
|
| 55 |
+
test_env_kwargs: ${env_kwargs}
|
| 56 |
+
test_rl_mode: ${rl_mode}
|
| 57 |
+
n_test_episodes: 10
|
| 58 |
+
deterministic: true
|
| 59 |
+
save_frames: true
|
| 60 |
+
render_3d: true
|
3/hydra.yaml
ADDED
|
@@ -0,0 +1,163 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
hydra:
|
| 2 |
+
run:
|
| 3 |
+
dir: output/training/${rl_mode}/${env_id}/${algorithm.name}/${seed}
|
| 4 |
+
sweep:
|
| 5 |
+
dir: output/training/${rl_mode}/${env_id}/${algorithm.name}/${seed}
|
| 6 |
+
subdir: ''
|
| 7 |
+
launcher:
|
| 8 |
+
_target_: hydra._internal.core_plugins.basic_launcher.BasicLauncher
|
| 9 |
+
sweeper:
|
| 10 |
+
_target_: hydra._internal.core_plugins.basic_sweeper.BasicSweeper
|
| 11 |
+
max_batch_size: null
|
| 12 |
+
params: null
|
| 13 |
+
help:
|
| 14 |
+
app_name: ${hydra.job.name}
|
| 15 |
+
header: '${hydra.help.app_name} is powered by Hydra.
|
| 16 |
+
|
| 17 |
+
'
|
| 18 |
+
footer: 'Powered by Hydra (https://hydra.cc)
|
| 19 |
+
|
| 20 |
+
Use --hydra-help to view Hydra specific help
|
| 21 |
+
|
| 22 |
+
'
|
| 23 |
+
template: '${hydra.help.header}
|
| 24 |
+
|
| 25 |
+
== Configuration groups ==
|
| 26 |
+
|
| 27 |
+
Compose your configuration from those groups (group=option)
|
| 28 |
+
|
| 29 |
+
|
| 30 |
+
$APP_CONFIG_GROUPS
|
| 31 |
+
|
| 32 |
+
|
| 33 |
+
== Config ==
|
| 34 |
+
|
| 35 |
+
Override anything in the config (foo.bar=value)
|
| 36 |
+
|
| 37 |
+
|
| 38 |
+
$CONFIG
|
| 39 |
+
|
| 40 |
+
|
| 41 |
+
${hydra.help.footer}
|
| 42 |
+
|
| 43 |
+
'
|
| 44 |
+
hydra_help:
|
| 45 |
+
template: 'Hydra (${hydra.runtime.version})
|
| 46 |
+
|
| 47 |
+
See https://hydra.cc for more info.
|
| 48 |
+
|
| 49 |
+
|
| 50 |
+
== Flags ==
|
| 51 |
+
|
| 52 |
+
$FLAGS_HELP
|
| 53 |
+
|
| 54 |
+
|
| 55 |
+
== Configuration groups ==
|
| 56 |
+
|
| 57 |
+
Compose your configuration from those groups (For example, append hydra/job_logging=disabled
|
| 58 |
+
to command line)
|
| 59 |
+
|
| 60 |
+
|
| 61 |
+
$HYDRA_CONFIG_GROUPS
|
| 62 |
+
|
| 63 |
+
|
| 64 |
+
Use ''--cfg hydra'' to Show the Hydra config.
|
| 65 |
+
|
| 66 |
+
'
|
| 67 |
+
hydra_help: ???
|
| 68 |
+
hydra_logging:
|
| 69 |
+
version: 1
|
| 70 |
+
formatters:
|
| 71 |
+
simple:
|
| 72 |
+
format: '[%(asctime)s][HYDRA] %(message)s'
|
| 73 |
+
handlers:
|
| 74 |
+
console:
|
| 75 |
+
class: logging.StreamHandler
|
| 76 |
+
formatter: simple
|
| 77 |
+
stream: ext://sys.stdout
|
| 78 |
+
root:
|
| 79 |
+
level: INFO
|
| 80 |
+
handlers:
|
| 81 |
+
- console
|
| 82 |
+
loggers:
|
| 83 |
+
logging_example:
|
| 84 |
+
level: DEBUG
|
| 85 |
+
disable_existing_loggers: false
|
| 86 |
+
job_logging:
|
| 87 |
+
version: 1
|
| 88 |
+
formatters:
|
| 89 |
+
simple:
|
| 90 |
+
format: '[%(asctime)s][%(name)s][%(levelname)s] - %(message)s'
|
| 91 |
+
handlers:
|
| 92 |
+
console:
|
| 93 |
+
class: logging.StreamHandler
|
| 94 |
+
formatter: simple
|
| 95 |
+
stream: ext://sys.stdout
|
| 96 |
+
file:
|
| 97 |
+
class: logging.FileHandler
|
| 98 |
+
formatter: simple
|
| 99 |
+
filename: ${hydra.runtime.output_dir}/${hydra.job.name}.log
|
| 100 |
+
root:
|
| 101 |
+
level: INFO
|
| 102 |
+
handlers:
|
| 103 |
+
- console
|
| 104 |
+
- file
|
| 105 |
+
disable_existing_loggers: false
|
| 106 |
+
env: {}
|
| 107 |
+
mode: MULTIRUN
|
| 108 |
+
searchpath: []
|
| 109 |
+
callbacks: {}
|
| 110 |
+
output_subdir: .
|
| 111 |
+
overrides:
|
| 112 |
+
hydra:
|
| 113 |
+
- hydra.mode=MULTIRUN
|
| 114 |
+
task:
|
| 115 |
+
- algorithm=sb3_sac
|
| 116 |
+
- env_id=RBC3D-hard-v0
|
| 117 |
+
- rl_mode=marl
|
| 118 |
+
- seed=3
|
| 119 |
+
job:
|
| 120 |
+
name: test_sb3
|
| 121 |
+
chdir: true
|
| 122 |
+
override_dirname: algorithm=sb3_sac,env_id=RBC3D-hard-v0,rl_mode=marl,seed=3
|
| 123 |
+
id: '0'
|
| 124 |
+
num: 0
|
| 125 |
+
config_name: test_sb3
|
| 126 |
+
env_set: {}
|
| 127 |
+
env_copy: []
|
| 128 |
+
config:
|
| 129 |
+
override_dirname:
|
| 130 |
+
kv_sep: '='
|
| 131 |
+
item_sep: ','
|
| 132 |
+
exclude_keys: []
|
| 133 |
+
runtime:
|
| 134 |
+
version: 1.3.2
|
| 135 |
+
version_base: '1.3'
|
| 136 |
+
cwd: /cephfs/users/becktepe/git_projects/FluidGym
|
| 137 |
+
config_sources:
|
| 138 |
+
- path: hydra.conf
|
| 139 |
+
schema: pkg
|
| 140 |
+
provider: hydra
|
| 141 |
+
- path: /cephfs/users/becktepe/git_projects/FluidGym/runscripts/configs
|
| 142 |
+
schema: file
|
| 143 |
+
provider: main
|
| 144 |
+
- path: hydra_plugins.hydra_colorlog.conf
|
| 145 |
+
schema: pkg
|
| 146 |
+
provider: hydra-colorlog
|
| 147 |
+
- path: ''
|
| 148 |
+
schema: structured
|
| 149 |
+
provider: schema
|
| 150 |
+
output_dir: /cephfs/users/becktepe/git_projects/FluidGym/output/training/marl/RBC3D-hard-v0/SAC/3
|
| 151 |
+
choices:
|
| 152 |
+
cluster: local
|
| 153 |
+
algorithm: sb3_sac
|
| 154 |
+
hydra/env: default
|
| 155 |
+
hydra/callbacks: null
|
| 156 |
+
hydra/job_logging: default
|
| 157 |
+
hydra/hydra_logging: default
|
| 158 |
+
hydra/hydra_help: default
|
| 159 |
+
hydra/help: default
|
| 160 |
+
hydra/sweeper: basic
|
| 161 |
+
hydra/launcher: basic
|
| 162 |
+
hydra/output: default
|
| 163 |
+
verbose: false
|
3/multirun.yaml
ADDED
|
@@ -0,0 +1,223 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
hydra:
|
| 2 |
+
run:
|
| 3 |
+
dir: output/training/${rl_mode}/${env_id}/${algorithm.name}/${seed}
|
| 4 |
+
sweep:
|
| 5 |
+
dir: output/training/${rl_mode}/${env_id}/${algorithm.name}/${seed}
|
| 6 |
+
subdir: ''
|
| 7 |
+
launcher:
|
| 8 |
+
_target_: hydra._internal.core_plugins.basic_launcher.BasicLauncher
|
| 9 |
+
sweeper:
|
| 10 |
+
_target_: hydra._internal.core_plugins.basic_sweeper.BasicSweeper
|
| 11 |
+
max_batch_size: null
|
| 12 |
+
params: null
|
| 13 |
+
help:
|
| 14 |
+
app_name: ${hydra.job.name}
|
| 15 |
+
header: '${hydra.help.app_name} is powered by Hydra.
|
| 16 |
+
|
| 17 |
+
'
|
| 18 |
+
footer: 'Powered by Hydra (https://hydra.cc)
|
| 19 |
+
|
| 20 |
+
Use --hydra-help to view Hydra specific help
|
| 21 |
+
|
| 22 |
+
'
|
| 23 |
+
template: '${hydra.help.header}
|
| 24 |
+
|
| 25 |
+
== Configuration groups ==
|
| 26 |
+
|
| 27 |
+
Compose your configuration from those groups (group=option)
|
| 28 |
+
|
| 29 |
+
|
| 30 |
+
$APP_CONFIG_GROUPS
|
| 31 |
+
|
| 32 |
+
|
| 33 |
+
== Config ==
|
| 34 |
+
|
| 35 |
+
Override anything in the config (foo.bar=value)
|
| 36 |
+
|
| 37 |
+
|
| 38 |
+
$CONFIG
|
| 39 |
+
|
| 40 |
+
|
| 41 |
+
${hydra.help.footer}
|
| 42 |
+
|
| 43 |
+
'
|
| 44 |
+
hydra_help:
|
| 45 |
+
template: 'Hydra (${hydra.runtime.version})
|
| 46 |
+
|
| 47 |
+
See https://hydra.cc for more info.
|
| 48 |
+
|
| 49 |
+
|
| 50 |
+
== Flags ==
|
| 51 |
+
|
| 52 |
+
$FLAGS_HELP
|
| 53 |
+
|
| 54 |
+
|
| 55 |
+
== Configuration groups ==
|
| 56 |
+
|
| 57 |
+
Compose your configuration from those groups (For example, append hydra/job_logging=disabled
|
| 58 |
+
to command line)
|
| 59 |
+
|
| 60 |
+
|
| 61 |
+
$HYDRA_CONFIG_GROUPS
|
| 62 |
+
|
| 63 |
+
|
| 64 |
+
Use ''--cfg hydra'' to Show the Hydra config.
|
| 65 |
+
|
| 66 |
+
'
|
| 67 |
+
hydra_help: ???
|
| 68 |
+
hydra_logging:
|
| 69 |
+
version: 1
|
| 70 |
+
formatters:
|
| 71 |
+
simple:
|
| 72 |
+
format: '[%(asctime)s][HYDRA] %(message)s'
|
| 73 |
+
handlers:
|
| 74 |
+
console:
|
| 75 |
+
class: logging.StreamHandler
|
| 76 |
+
formatter: simple
|
| 77 |
+
stream: ext://sys.stdout
|
| 78 |
+
root:
|
| 79 |
+
level: INFO
|
| 80 |
+
handlers:
|
| 81 |
+
- console
|
| 82 |
+
loggers:
|
| 83 |
+
logging_example:
|
| 84 |
+
level: DEBUG
|
| 85 |
+
disable_existing_loggers: false
|
| 86 |
+
job_logging:
|
| 87 |
+
version: 1
|
| 88 |
+
formatters:
|
| 89 |
+
simple:
|
| 90 |
+
format: '[%(asctime)s][%(name)s][%(levelname)s] - %(message)s'
|
| 91 |
+
handlers:
|
| 92 |
+
console:
|
| 93 |
+
class: logging.StreamHandler
|
| 94 |
+
formatter: simple
|
| 95 |
+
stream: ext://sys.stdout
|
| 96 |
+
file:
|
| 97 |
+
class: logging.FileHandler
|
| 98 |
+
formatter: simple
|
| 99 |
+
filename: ${hydra.runtime.output_dir}/${hydra.job.name}.log
|
| 100 |
+
root:
|
| 101 |
+
level: INFO
|
| 102 |
+
handlers:
|
| 103 |
+
- console
|
| 104 |
+
- file
|
| 105 |
+
disable_existing_loggers: false
|
| 106 |
+
env: {}
|
| 107 |
+
mode: MULTIRUN
|
| 108 |
+
searchpath: []
|
| 109 |
+
callbacks: {}
|
| 110 |
+
output_subdir: .
|
| 111 |
+
overrides:
|
| 112 |
+
hydra:
|
| 113 |
+
- hydra.mode=MULTIRUN
|
| 114 |
+
task:
|
| 115 |
+
- algorithm=sb3_sac
|
| 116 |
+
- env_id=RBC3D-hard-v0
|
| 117 |
+
- rl_mode=marl
|
| 118 |
+
- seed=3
|
| 119 |
+
job:
|
| 120 |
+
name: test_sb3
|
| 121 |
+
chdir: true
|
| 122 |
+
override_dirname: algorithm=sb3_sac,env_id=RBC3D-hard-v0,rl_mode=marl,seed=3
|
| 123 |
+
id: ???
|
| 124 |
+
num: ???
|
| 125 |
+
config_name: test_sb3
|
| 126 |
+
env_set: {}
|
| 127 |
+
env_copy: []
|
| 128 |
+
config:
|
| 129 |
+
override_dirname:
|
| 130 |
+
kv_sep: '='
|
| 131 |
+
item_sep: ','
|
| 132 |
+
exclude_keys: []
|
| 133 |
+
runtime:
|
| 134 |
+
version: 1.3.2
|
| 135 |
+
version_base: '1.3'
|
| 136 |
+
cwd: /cephfs/users/becktepe/git_projects/FluidGym
|
| 137 |
+
config_sources:
|
| 138 |
+
- path: hydra.conf
|
| 139 |
+
schema: pkg
|
| 140 |
+
provider: hydra
|
| 141 |
+
- path: /cephfs/users/becktepe/git_projects/FluidGym/runscripts/configs
|
| 142 |
+
schema: file
|
| 143 |
+
provider: main
|
| 144 |
+
- path: hydra_plugins.hydra_colorlog.conf
|
| 145 |
+
schema: pkg
|
| 146 |
+
provider: hydra-colorlog
|
| 147 |
+
- path: ''
|
| 148 |
+
schema: structured
|
| 149 |
+
provider: schema
|
| 150 |
+
output_dir: ???
|
| 151 |
+
choices:
|
| 152 |
+
cluster: local
|
| 153 |
+
algorithm: sb3_sac
|
| 154 |
+
hydra/env: default
|
| 155 |
+
hydra/callbacks: null
|
| 156 |
+
hydra/job_logging: default
|
| 157 |
+
hydra/hydra_logging: default
|
| 158 |
+
hydra/hydra_help: default
|
| 159 |
+
hydra/help: default
|
| 160 |
+
hydra/sweeper: basic
|
| 161 |
+
hydra/launcher: basic
|
| 162 |
+
hydra/output: default
|
| 163 |
+
verbose: false
|
| 164 |
+
env_id: RBC3D-hard-v0
|
| 165 |
+
env_kwargs: {}
|
| 166 |
+
eval_env_kwargs: {}
|
| 167 |
+
seed: 3
|
| 168 |
+
rl_mode: marl
|
| 169 |
+
total_timesteps: 50000.0
|
| 170 |
+
n_eval_steps: 10
|
| 171 |
+
eval_freq: ${eval:${total_timesteps} // ${n_eval_steps}}
|
| 172 |
+
n_eval_episodes: 1
|
| 173 |
+
continue_training: false
|
| 174 |
+
checkpoint_latest: true
|
| 175 |
+
rl_device: cpu
|
| 176 |
+
eval_callback:
|
| 177 |
+
_target_: fluidgym.integration.sb3.EvalCallback
|
| 178 |
+
eval_freq: ${eval_freq}
|
| 179 |
+
n_eval_episodes: ${n_eval_episodes}
|
| 180 |
+
use_wandb: ${wandb.enable}
|
| 181 |
+
checkpoint_latest: ${checkpoint_latest}
|
| 182 |
+
wandb:
|
| 183 |
+
enable: true
|
| 184 |
+
entity: safe-autonomous-systems
|
| 185 |
+
project: jbecktepe-fluidgym
|
| 186 |
+
algorithm:
|
| 187 |
+
name: SAC
|
| 188 |
+
obj:
|
| 189 |
+
_target_: stable_baselines3.sac.sac.SAC
|
| 190 |
+
policy: MlpPolicy
|
| 191 |
+
learning_rate: 0.0003
|
| 192 |
+
buffer_size: 1000000
|
| 193 |
+
learning_starts: 100
|
| 194 |
+
batch_size: 256
|
| 195 |
+
tau: 0.005
|
| 196 |
+
gamma: 0.99
|
| 197 |
+
train_freq: 1
|
| 198 |
+
gradient_steps: -1
|
| 199 |
+
action_noise: null
|
| 200 |
+
replay_buffer_class: null
|
| 201 |
+
replay_buffer_kwargs: null
|
| 202 |
+
optimize_memory_usage: false
|
| 203 |
+
ent_coef: auto
|
| 204 |
+
target_update_interval: 1
|
| 205 |
+
target_entropy: auto
|
| 206 |
+
use_sde: false
|
| 207 |
+
sde_sample_freq: -1
|
| 208 |
+
use_sde_at_warmup: false
|
| 209 |
+
stats_window_size: 100
|
| 210 |
+
tensorboard_log: null
|
| 211 |
+
policy_kwargs: {}
|
| 212 |
+
verbose: 0
|
| 213 |
+
seed: ${seed}
|
| 214 |
+
device: cuda
|
| 215 |
+
_init_setup_model: true
|
| 216 |
+
cluster: {}
|
| 217 |
+
test_env_id: ${env_id}
|
| 218 |
+
test_env_kwargs: ${env_kwargs}
|
| 219 |
+
test_rl_mode: ${rl_mode}
|
| 220 |
+
n_test_episodes: 10
|
| 221 |
+
deterministic: true
|
| 222 |
+
save_frames: true
|
| 223 |
+
render_3d: true
|
3/overrides.yaml
ADDED
|
@@ -0,0 +1,4 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
- algorithm=sb3_sac
|
| 2 |
+
- env_id=RBC3D-hard-v0
|
| 3 |
+
- rl_mode=marl
|
| 4 |
+
- seed=3
|
3/test/3d_temperature_test_eval_episode_0.gif
ADDED
|
Git LFS Details
|
3/test/test_eval_episode_0.csv
ADDED
|
The diff for this file is too large to render.
See raw diff
|
|
|
3/test/x-y-temperature_test_eval_episode_0.gif
ADDED
|
Git LFS Details
|
3/test/x-z-temperature_test_eval_episode_0.gif
ADDED
|
Git LFS Details
|
3/test/y-z-temperature_test_eval_episode_0.gif
ADDED
|
Git LFS Details
|
3/training_log.csv
ADDED
|
@@ -0,0 +1,111 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
step,training/mean_reward,training/mean_global_reward,training/mean_nusselt,evaluation/mean_nusselt,evaluation/mean_reward
|
| 2 |
+
500,0.041363656520843506,0.0413636531829834,2.6425693707466125,,
|
| 3 |
+
1000,0.2845894694328308,0.2845894742012024,2.399343560695648,,
|
| 4 |
+
1500,0.3236508071422577,0.3236508226394653,2.360282186508179,,
|
| 5 |
+
2000,0.3055736720561981,0.3055736613273621,2.3783593626022337,,
|
| 6 |
+
2500,0.32240942120552063,0.3224094071388245,2.3615236129760744,,
|
| 7 |
+
3000,0.23630768060684204,0.23630765962600708,2.4476253638267518,,
|
| 8 |
+
3500,0.2893707752227783,0.28937079763412477,2.3945622215270994,,
|
| 9 |
+
4000,0.30349743366241455,0.30349743556976316,2.3804355816841127,,
|
| 10 |
+
4500,0.2680175304412842,0.268017502784729,2.415915515422821,,
|
| 11 |
+
5000,0.3079318702220917,0.3079318833351135,2.3760011320114134,,
|
| 12 |
+
5000,,,,2.44891632437706,0.23501670360565186
|
| 13 |
+
5500,0.3037182688713074,0.30371822357177736,2.38021480512619,,
|
| 14 |
+
6000,0.2913186550140381,0.2913186831474304,2.3926143293380737,,
|
| 15 |
+
6500,0.30054613947868347,0.3005461664199829,2.3833868408203127,,
|
| 16 |
+
7000,0.29859215021133423,0.29859214878082274,2.38534086227417,,
|
| 17 |
+
7500,0.29734140634536743,0.2973413734436035,2.38659165763855,,
|
| 18 |
+
8000,0.313638836145401,0.3136388244628906,2.370294193267822,,
|
| 19 |
+
8500,0.32344916462898254,0.3234491624832153,2.3604838633537293,,
|
| 20 |
+
9000,0.31889909505844116,0.3188991184234619,2.365033890247345,,
|
| 21 |
+
9500,0.32065606117248535,0.32065606451034545,2.3632769508361817,,
|
| 22 |
+
10000,0.3250228762626648,0.32502288246154787,2.358910144329071,,
|
| 23 |
+
10000,,,,2.3849610686302185,0.298971951007843
|
| 24 |
+
10500,0.32610857486724854,0.3261085534095764,2.357824453830719,,
|
| 25 |
+
11000,0.31806114315986633,0.31806115531921386,2.3658718647956847,,
|
| 26 |
+
11500,0.3323117196559906,0.33231172609329224,2.351621289730072,,
|
| 27 |
+
12000,0.3269374370574951,0.3269374437332153,2.356995581626892,,
|
| 28 |
+
12500,0.32448944449424744,0.3244894232749939,2.359443606853485,,
|
| 29 |
+
13000,0.3331490755081177,0.333149112701416,2.350783903121948,,
|
| 30 |
+
13500,0.33554455637931824,0.33554456520080567,2.348388454914093,,
|
| 31 |
+
14000,0.3304682672023773,0.33046827936172485,2.3534647521972656,,
|
| 32 |
+
14500,0.3284685015678406,0.3284685406684876,2.3554644684791564,,
|
| 33 |
+
15000,0.3202449679374695,0.32024497652053835,2.363688047409058,,
|
| 34 |
+
15000,,,,2.363321132659912,0.3206118941307068
|
| 35 |
+
15500,0.3165782392024994,0.31657827425003054,2.3673547463417055,,
|
| 36 |
+
16000,0.3050459325313568,0.30504593563079835,2.3788870735168457,,
|
| 37 |
+
16500,0.2958841919898987,0.2958841919898987,2.38804882478714,,
|
| 38 |
+
17000,0.2823264002799988,0.2823264002799988,2.4016066174507142,,
|
| 39 |
+
17500,0.2732313275337219,0.2732313017845154,2.410701723575592,,
|
| 40 |
+
18000,0.2836480140686035,0.28364799213409425,2.400285025596619,,
|
| 41 |
+
18500,0.27188435196876526,0.27188434267044065,2.4120486850738527,,
|
| 42 |
+
19000,0.27215850353240967,0.27215851831436155,2.4117744946479798,,
|
| 43 |
+
19500,0.2455907016992569,0.24559067106246948,2.4383423504829405,,
|
| 44 |
+
20000,0.25711625814437866,0.2571162958145142,2.426816711425781,,
|
| 45 |
+
20000,,,,2.403497530221939,0.2804355025291443
|
| 46 |
+
20500,0.17816519737243652,0.1781652021408081,2.5057678227424622,,
|
| 47 |
+
21000,0.22277984023094177,0.22277985191345215,2.4611531715393067,,
|
| 48 |
+
21500,0.3372514843940735,0.3372514805793762,2.3466815314292906,,
|
| 49 |
+
22000,0.350021630525589,0.35002161836624146,2.3339114022254943,,
|
| 50 |
+
22500,0.3563081622123718,0.3563081684112549,2.3276248564720152,,
|
| 51 |
+
23000,0.35859349370002747,0.35859352397918703,2.3253394961357117,,
|
| 52 |
+
23500,0.3664802610874176,0.36648026609420775,2.317452746391296,,
|
| 53 |
+
24000,0.36185675859451294,0.3618567843437195,2.322076235771179,,
|
| 54 |
+
24500,0.35699066519737244,0.3569906439781189,2.3269423818588257,,
|
| 55 |
+
25000,0.33407652378082275,0.3340765514373779,2.349856469154358,,
|
| 56 |
+
25000,,,,2.3500538539886473,0.33387917280197144
|
| 57 |
+
25500,0.3495918810367584,0.3495919151306152,2.3343411169052124,,
|
| 58 |
+
26000,0.3547927737236023,0.3547927885055542,2.329140231132507,,
|
| 59 |
+
26500,0.3525802195072174,0.3525802459716797,2.3313527607917788,,
|
| 60 |
+
27000,0.36265188455581665,0.36265189599990844,2.3212811245918274,,
|
| 61 |
+
27500,0.3689521849155426,0.36895218563079835,2.3149808230400084,,
|
| 62 |
+
28000,0.3657776415348053,0.36577767515182497,2.3181553392410277,,
|
| 63 |
+
28500,0.3308854401111603,0.33088543367385864,2.3530475835800173,,
|
| 64 |
+
29000,0.3525615930557251,0.35256156635284425,2.33137145614624,,
|
| 65 |
+
29500,0.3513593077659607,0.3513593492507935,2.332573650836945,,
|
| 66 |
+
30000,0.33893701434135437,0.3389370274543762,2.3449959840774537,,
|
| 67 |
+
30000,,,,2.3707551312446595,0.3131778836250305
|
| 68 |
+
30500,0.3153613805770874,0.31536139631271365,2.3685716228485107,,
|
| 69 |
+
31000,0.29230982065200806,0.2923098478317261,2.3916231780052186,,
|
| 70 |
+
31500,0.30562102794647217,0.30562102794647217,2.3783119945526123,,
|
| 71 |
+
32000,0.3349657654762268,0.3349658074378967,2.3489672236442565,,
|
| 72 |
+
32500,0.3224736452102661,0.3224736132621765,2.3614594049453737,,
|
| 73 |
+
33000,0.3233737051486969,0.32337369775772096,2.360559331417084,,
|
| 74 |
+
33500,0.3176253139972687,0.3176253080368042,2.3663077125549314,,
|
| 75 |
+
34000,0.30631452798843384,0.30631449127197263,2.3776185302734376,,
|
| 76 |
+
34500,0.29748767614364624,0.2974876508712769,2.3864453706741333,,
|
| 77 |
+
35000,0.31834930181503296,0.3183493013381958,2.3655837206840515,,
|
| 78 |
+
35000,,,,2.3906465482711794,0.2932864725589752
|
| 79 |
+
35500,0.3128502666950226,0.31285030126571656,2.3710827116966247,,
|
| 80 |
+
36000,0.3198792636394501,0.3198792691230774,2.364053750038147,,
|
| 81 |
+
36500,0.3058224022388458,0.30582241201400756,2.3781106119155884,,
|
| 82 |
+
37000,0.3193216323852539,0.3193216395378113,2.364611379146576,,
|
| 83 |
+
37500,0.3199530243873596,0.3199530358314514,2.3639799909591677,,
|
| 84 |
+
38000,0.29010534286499023,0.2901053562164307,2.393827654838562,,
|
| 85 |
+
38500,0.3295949399471283,0.32959494304656983,2.3543380837440493,,
|
| 86 |
+
39000,0.3617915213108063,0.36179153871536257,2.32214147567749,,
|
| 87 |
+
39500,0.3303236663341522,0.3303236570358276,2.3536093711853026,,
|
| 88 |
+
40000,0.34733179211616516,0.3473317475318909,2.3366012659072877,,
|
| 89 |
+
40000,,,,2.376874792575836,0.3070582449436188
|
| 90 |
+
40500,0.3683886229991913,0.3683886227607727,2.3155443959236144,,
|
| 91 |
+
41000,0.3795541524887085,0.37955415773391726,2.3043788566589356,,
|
| 92 |
+
41500,0.4047442674636841,0.40474423551559446,2.279188784122467,,
|
| 93 |
+
42000,0.37771379947662354,0.3777138199806213,2.306219205379486,,
|
| 94 |
+
42500,0.35266923904418945,0.3526692686080933,2.3312637553215025,,
|
| 95 |
+
43000,0.31797051429748535,0.3179704937934876,2.365962529182434,,
|
| 96 |
+
43500,0.33190858364105225,0.33190854597091674,2.3520244750976564,,
|
| 97 |
+
44000,0.3241947591304779,0.32419475507736206,2.3597382521629333,,
|
| 98 |
+
44500,0.37281835079193115,0.37281834888458254,2.311114676475525,,
|
| 99 |
+
45000,0.372061163187027,0.37206115007400514,2.3118718695640563,,
|
| 100 |
+
45000,,,,2.3189984023571015,0.36493462324142456
|
| 101 |
+
45500,0.37205931544303894,0.37205933904647825,2.3118736763000487,,
|
| 102 |
+
46000,0.3847729563713074,0.3847729573249817,2.299160063266754,,
|
| 103 |
+
46500,0.37719348073005676,0.3771934952735901,2.30673952960968,,
|
| 104 |
+
47000,0.38410449028015137,0.38410454225540164,2.299828472137451,,
|
| 105 |
+
47500,0.39246466755867004,0.392464684009552,2.291468336582184,,
|
| 106 |
+
48000,0.38820815086364746,0.3882081694602966,2.2957248468399047,,
|
| 107 |
+
48500,0.39245012402534485,0.3924501404762268,2.2914828777313234,,
|
| 108 |
+
49000,0.3875936269760132,0.38759363079071046,2.296339379310608,,
|
| 109 |
+
49500,0.38034874200820923,0.38034876585006716,2.3035842604637145,,
|
| 110 |
+
50000,0.38210004568099976,0.3821000304222107,2.3018329973220824,,
|
| 111 |
+
50000,,,,2.368478583097458,0.3154544532299042
|
4/ckpt_latest.zip
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:22a502ce18f89d75472eb9e14b9a1968b54b983aa18701b8f495c109383dcdee
|
| 3 |
+
size 58086509
|
4/config.yaml
ADDED
|
@@ -0,0 +1,60 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
env_id: RBC3D-hard-v0
|
| 2 |
+
env_kwargs: {}
|
| 3 |
+
eval_env_kwargs: {}
|
| 4 |
+
seed: 4
|
| 5 |
+
rl_mode: marl
|
| 6 |
+
total_timesteps: 50000.0
|
| 7 |
+
n_eval_steps: 10
|
| 8 |
+
eval_freq: ${eval:${total_timesteps} // ${n_eval_steps}}
|
| 9 |
+
n_eval_episodes: 1
|
| 10 |
+
continue_training: false
|
| 11 |
+
checkpoint_latest: true
|
| 12 |
+
rl_device: cpu
|
| 13 |
+
eval_callback:
|
| 14 |
+
_target_: fluidgym.integration.sb3.EvalCallback
|
| 15 |
+
eval_freq: ${eval_freq}
|
| 16 |
+
n_eval_episodes: ${n_eval_episodes}
|
| 17 |
+
use_wandb: ${wandb.enable}
|
| 18 |
+
checkpoint_latest: ${checkpoint_latest}
|
| 19 |
+
wandb:
|
| 20 |
+
enable: true
|
| 21 |
+
entity: safe-autonomous-systems
|
| 22 |
+
project: jbecktepe-fluidgym
|
| 23 |
+
algorithm:
|
| 24 |
+
name: SAC
|
| 25 |
+
obj:
|
| 26 |
+
_target_: stable_baselines3.sac.sac.SAC
|
| 27 |
+
policy: MlpPolicy
|
| 28 |
+
learning_rate: 0.0003
|
| 29 |
+
buffer_size: 1000000
|
| 30 |
+
learning_starts: 100
|
| 31 |
+
batch_size: 256
|
| 32 |
+
tau: 0.005
|
| 33 |
+
gamma: 0.99
|
| 34 |
+
train_freq: 1
|
| 35 |
+
gradient_steps: -1
|
| 36 |
+
action_noise: null
|
| 37 |
+
replay_buffer_class: null
|
| 38 |
+
replay_buffer_kwargs: null
|
| 39 |
+
optimize_memory_usage: false
|
| 40 |
+
ent_coef: auto
|
| 41 |
+
target_update_interval: 1
|
| 42 |
+
target_entropy: auto
|
| 43 |
+
use_sde: false
|
| 44 |
+
sde_sample_freq: -1
|
| 45 |
+
use_sde_at_warmup: false
|
| 46 |
+
stats_window_size: 100
|
| 47 |
+
tensorboard_log: null
|
| 48 |
+
policy_kwargs: {}
|
| 49 |
+
verbose: 0
|
| 50 |
+
seed: ${seed}
|
| 51 |
+
device: cuda
|
| 52 |
+
_init_setup_model: true
|
| 53 |
+
cluster: {}
|
| 54 |
+
test_env_id: ${env_id}
|
| 55 |
+
test_env_kwargs: ${env_kwargs}
|
| 56 |
+
test_rl_mode: ${rl_mode}
|
| 57 |
+
n_test_episodes: 10
|
| 58 |
+
deterministic: true
|
| 59 |
+
save_frames: true
|
| 60 |
+
render_3d: true
|
4/hydra.yaml
ADDED
|
@@ -0,0 +1,163 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
hydra:
|
| 2 |
+
run:
|
| 3 |
+
dir: output/training/${rl_mode}/${env_id}/${algorithm.name}/${seed}
|
| 4 |
+
sweep:
|
| 5 |
+
dir: output/training/${rl_mode}/${env_id}/${algorithm.name}/${seed}
|
| 6 |
+
subdir: ''
|
| 7 |
+
launcher:
|
| 8 |
+
_target_: hydra._internal.core_plugins.basic_launcher.BasicLauncher
|
| 9 |
+
sweeper:
|
| 10 |
+
_target_: hydra._internal.core_plugins.basic_sweeper.BasicSweeper
|
| 11 |
+
max_batch_size: null
|
| 12 |
+
params: null
|
| 13 |
+
help:
|
| 14 |
+
app_name: ${hydra.job.name}
|
| 15 |
+
header: '${hydra.help.app_name} is powered by Hydra.
|
| 16 |
+
|
| 17 |
+
'
|
| 18 |
+
footer: 'Powered by Hydra (https://hydra.cc)
|
| 19 |
+
|
| 20 |
+
Use --hydra-help to view Hydra specific help
|
| 21 |
+
|
| 22 |
+
'
|
| 23 |
+
template: '${hydra.help.header}
|
| 24 |
+
|
| 25 |
+
== Configuration groups ==
|
| 26 |
+
|
| 27 |
+
Compose your configuration from those groups (group=option)
|
| 28 |
+
|
| 29 |
+
|
| 30 |
+
$APP_CONFIG_GROUPS
|
| 31 |
+
|
| 32 |
+
|
| 33 |
+
== Config ==
|
| 34 |
+
|
| 35 |
+
Override anything in the config (foo.bar=value)
|
| 36 |
+
|
| 37 |
+
|
| 38 |
+
$CONFIG
|
| 39 |
+
|
| 40 |
+
|
| 41 |
+
${hydra.help.footer}
|
| 42 |
+
|
| 43 |
+
'
|
| 44 |
+
hydra_help:
|
| 45 |
+
template: 'Hydra (${hydra.runtime.version})
|
| 46 |
+
|
| 47 |
+
See https://hydra.cc for more info.
|
| 48 |
+
|
| 49 |
+
|
| 50 |
+
== Flags ==
|
| 51 |
+
|
| 52 |
+
$FLAGS_HELP
|
| 53 |
+
|
| 54 |
+
|
| 55 |
+
== Configuration groups ==
|
| 56 |
+
|
| 57 |
+
Compose your configuration from those groups (For example, append hydra/job_logging=disabled
|
| 58 |
+
to command line)
|
| 59 |
+
|
| 60 |
+
|
| 61 |
+
$HYDRA_CONFIG_GROUPS
|
| 62 |
+
|
| 63 |
+
|
| 64 |
+
Use ''--cfg hydra'' to Show the Hydra config.
|
| 65 |
+
|
| 66 |
+
'
|
| 67 |
+
hydra_help: ???
|
| 68 |
+
hydra_logging:
|
| 69 |
+
version: 1
|
| 70 |
+
formatters:
|
| 71 |
+
simple:
|
| 72 |
+
format: '[%(asctime)s][HYDRA] %(message)s'
|
| 73 |
+
handlers:
|
| 74 |
+
console:
|
| 75 |
+
class: logging.StreamHandler
|
| 76 |
+
formatter: simple
|
| 77 |
+
stream: ext://sys.stdout
|
| 78 |
+
root:
|
| 79 |
+
level: INFO
|
| 80 |
+
handlers:
|
| 81 |
+
- console
|
| 82 |
+
loggers:
|
| 83 |
+
logging_example:
|
| 84 |
+
level: DEBUG
|
| 85 |
+
disable_existing_loggers: false
|
| 86 |
+
job_logging:
|
| 87 |
+
version: 1
|
| 88 |
+
formatters:
|
| 89 |
+
simple:
|
| 90 |
+
format: '[%(asctime)s][%(name)s][%(levelname)s] - %(message)s'
|
| 91 |
+
handlers:
|
| 92 |
+
console:
|
| 93 |
+
class: logging.StreamHandler
|
| 94 |
+
formatter: simple
|
| 95 |
+
stream: ext://sys.stdout
|
| 96 |
+
file:
|
| 97 |
+
class: logging.FileHandler
|
| 98 |
+
formatter: simple
|
| 99 |
+
filename: ${hydra.runtime.output_dir}/${hydra.job.name}.log
|
| 100 |
+
root:
|
| 101 |
+
level: INFO
|
| 102 |
+
handlers:
|
| 103 |
+
- console
|
| 104 |
+
- file
|
| 105 |
+
disable_existing_loggers: false
|
| 106 |
+
env: {}
|
| 107 |
+
mode: MULTIRUN
|
| 108 |
+
searchpath: []
|
| 109 |
+
callbacks: {}
|
| 110 |
+
output_subdir: .
|
| 111 |
+
overrides:
|
| 112 |
+
hydra:
|
| 113 |
+
- hydra.mode=MULTIRUN
|
| 114 |
+
task:
|
| 115 |
+
- algorithm=sb3_sac
|
| 116 |
+
- env_id=RBC3D-hard-v0
|
| 117 |
+
- rl_mode=marl
|
| 118 |
+
- seed=4
|
| 119 |
+
job:
|
| 120 |
+
name: test_sb3
|
| 121 |
+
chdir: true
|
| 122 |
+
override_dirname: algorithm=sb3_sac,env_id=RBC3D-hard-v0,rl_mode=marl,seed=4
|
| 123 |
+
id: '0'
|
| 124 |
+
num: 0
|
| 125 |
+
config_name: test_sb3
|
| 126 |
+
env_set: {}
|
| 127 |
+
env_copy: []
|
| 128 |
+
config:
|
| 129 |
+
override_dirname:
|
| 130 |
+
kv_sep: '='
|
| 131 |
+
item_sep: ','
|
| 132 |
+
exclude_keys: []
|
| 133 |
+
runtime:
|
| 134 |
+
version: 1.3.2
|
| 135 |
+
version_base: '1.3'
|
| 136 |
+
cwd: /cephfs/users/becktepe/git_projects/FluidGym
|
| 137 |
+
config_sources:
|
| 138 |
+
- path: hydra.conf
|
| 139 |
+
schema: pkg
|
| 140 |
+
provider: hydra
|
| 141 |
+
- path: /cephfs/users/becktepe/git_projects/FluidGym/runscripts/configs
|
| 142 |
+
schema: file
|
| 143 |
+
provider: main
|
| 144 |
+
- path: hydra_plugins.hydra_colorlog.conf
|
| 145 |
+
schema: pkg
|
| 146 |
+
provider: hydra-colorlog
|
| 147 |
+
- path: ''
|
| 148 |
+
schema: structured
|
| 149 |
+
provider: schema
|
| 150 |
+
output_dir: /cephfs/users/becktepe/git_projects/FluidGym/output/training/marl/RBC3D-hard-v0/SAC/4
|
| 151 |
+
choices:
|
| 152 |
+
cluster: local
|
| 153 |
+
algorithm: sb3_sac
|
| 154 |
+
hydra/env: default
|
| 155 |
+
hydra/callbacks: null
|
| 156 |
+
hydra/job_logging: default
|
| 157 |
+
hydra/hydra_logging: default
|
| 158 |
+
hydra/hydra_help: default
|
| 159 |
+
hydra/help: default
|
| 160 |
+
hydra/sweeper: basic
|
| 161 |
+
hydra/launcher: basic
|
| 162 |
+
hydra/output: default
|
| 163 |
+
verbose: false
|
4/multirun.yaml
ADDED
|
@@ -0,0 +1,223 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
hydra:
|
| 2 |
+
run:
|
| 3 |
+
dir: output/training/${rl_mode}/${env_id}/${algorithm.name}/${seed}
|
| 4 |
+
sweep:
|
| 5 |
+
dir: output/training/${rl_mode}/${env_id}/${algorithm.name}/${seed}
|
| 6 |
+
subdir: ''
|
| 7 |
+
launcher:
|
| 8 |
+
_target_: hydra._internal.core_plugins.basic_launcher.BasicLauncher
|
| 9 |
+
sweeper:
|
| 10 |
+
_target_: hydra._internal.core_plugins.basic_sweeper.BasicSweeper
|
| 11 |
+
max_batch_size: null
|
| 12 |
+
params: null
|
| 13 |
+
help:
|
| 14 |
+
app_name: ${hydra.job.name}
|
| 15 |
+
header: '${hydra.help.app_name} is powered by Hydra.
|
| 16 |
+
|
| 17 |
+
'
|
| 18 |
+
footer: 'Powered by Hydra (https://hydra.cc)
|
| 19 |
+
|
| 20 |
+
Use --hydra-help to view Hydra specific help
|
| 21 |
+
|
| 22 |
+
'
|
| 23 |
+
template: '${hydra.help.header}
|
| 24 |
+
|
| 25 |
+
== Configuration groups ==
|
| 26 |
+
|
| 27 |
+
Compose your configuration from those groups (group=option)
|
| 28 |
+
|
| 29 |
+
|
| 30 |
+
$APP_CONFIG_GROUPS
|
| 31 |
+
|
| 32 |
+
|
| 33 |
+
== Config ==
|
| 34 |
+
|
| 35 |
+
Override anything in the config (foo.bar=value)
|
| 36 |
+
|
| 37 |
+
|
| 38 |
+
$CONFIG
|
| 39 |
+
|
| 40 |
+
|
| 41 |
+
${hydra.help.footer}
|
| 42 |
+
|
| 43 |
+
'
|
| 44 |
+
hydra_help:
|
| 45 |
+
template: 'Hydra (${hydra.runtime.version})
|
| 46 |
+
|
| 47 |
+
See https://hydra.cc for more info.
|
| 48 |
+
|
| 49 |
+
|
| 50 |
+
== Flags ==
|
| 51 |
+
|
| 52 |
+
$FLAGS_HELP
|
| 53 |
+
|
| 54 |
+
|
| 55 |
+
== Configuration groups ==
|
| 56 |
+
|
| 57 |
+
Compose your configuration from those groups (For example, append hydra/job_logging=disabled
|
| 58 |
+
to command line)
|
| 59 |
+
|
| 60 |
+
|
| 61 |
+
$HYDRA_CONFIG_GROUPS
|
| 62 |
+
|
| 63 |
+
|
| 64 |
+
Use ''--cfg hydra'' to Show the Hydra config.
|
| 65 |
+
|
| 66 |
+
'
|
| 67 |
+
hydra_help: ???
|
| 68 |
+
hydra_logging:
|
| 69 |
+
version: 1
|
| 70 |
+
formatters:
|
| 71 |
+
simple:
|
| 72 |
+
format: '[%(asctime)s][HYDRA] %(message)s'
|
| 73 |
+
handlers:
|
| 74 |
+
console:
|
| 75 |
+
class: logging.StreamHandler
|
| 76 |
+
formatter: simple
|
| 77 |
+
stream: ext://sys.stdout
|
| 78 |
+
root:
|
| 79 |
+
level: INFO
|
| 80 |
+
handlers:
|
| 81 |
+
- console
|
| 82 |
+
loggers:
|
| 83 |
+
logging_example:
|
| 84 |
+
level: DEBUG
|
| 85 |
+
disable_existing_loggers: false
|
| 86 |
+
job_logging:
|
| 87 |
+
version: 1
|
| 88 |
+
formatters:
|
| 89 |
+
simple:
|
| 90 |
+
format: '[%(asctime)s][%(name)s][%(levelname)s] - %(message)s'
|
| 91 |
+
handlers:
|
| 92 |
+
console:
|
| 93 |
+
class: logging.StreamHandler
|
| 94 |
+
formatter: simple
|
| 95 |
+
stream: ext://sys.stdout
|
| 96 |
+
file:
|
| 97 |
+
class: logging.FileHandler
|
| 98 |
+
formatter: simple
|
| 99 |
+
filename: ${hydra.runtime.output_dir}/${hydra.job.name}.log
|
| 100 |
+
root:
|
| 101 |
+
level: INFO
|
| 102 |
+
handlers:
|
| 103 |
+
- console
|
| 104 |
+
- file
|
| 105 |
+
disable_existing_loggers: false
|
| 106 |
+
env: {}
|
| 107 |
+
mode: MULTIRUN
|
| 108 |
+
searchpath: []
|
| 109 |
+
callbacks: {}
|
| 110 |
+
output_subdir: .
|
| 111 |
+
overrides:
|
| 112 |
+
hydra:
|
| 113 |
+
- hydra.mode=MULTIRUN
|
| 114 |
+
task:
|
| 115 |
+
- algorithm=sb3_sac
|
| 116 |
+
- env_id=RBC3D-hard-v0
|
| 117 |
+
- rl_mode=marl
|
| 118 |
+
- seed=4
|
| 119 |
+
job:
|
| 120 |
+
name: test_sb3
|
| 121 |
+
chdir: true
|
| 122 |
+
override_dirname: algorithm=sb3_sac,env_id=RBC3D-hard-v0,rl_mode=marl,seed=4
|
| 123 |
+
id: ???
|
| 124 |
+
num: ???
|
| 125 |
+
config_name: test_sb3
|
| 126 |
+
env_set: {}
|
| 127 |
+
env_copy: []
|
| 128 |
+
config:
|
| 129 |
+
override_dirname:
|
| 130 |
+
kv_sep: '='
|
| 131 |
+
item_sep: ','
|
| 132 |
+
exclude_keys: []
|
| 133 |
+
runtime:
|
| 134 |
+
version: 1.3.2
|
| 135 |
+
version_base: '1.3'
|
| 136 |
+
cwd: /cephfs/users/becktepe/git_projects/FluidGym
|
| 137 |
+
config_sources:
|
| 138 |
+
- path: hydra.conf
|
| 139 |
+
schema: pkg
|
| 140 |
+
provider: hydra
|
| 141 |
+
- path: /cephfs/users/becktepe/git_projects/FluidGym/runscripts/configs
|
| 142 |
+
schema: file
|
| 143 |
+
provider: main
|
| 144 |
+
- path: hydra_plugins.hydra_colorlog.conf
|
| 145 |
+
schema: pkg
|
| 146 |
+
provider: hydra-colorlog
|
| 147 |
+
- path: ''
|
| 148 |
+
schema: structured
|
| 149 |
+
provider: schema
|
| 150 |
+
output_dir: ???
|
| 151 |
+
choices:
|
| 152 |
+
cluster: local
|
| 153 |
+
algorithm: sb3_sac
|
| 154 |
+
hydra/env: default
|
| 155 |
+
hydra/callbacks: null
|
| 156 |
+
hydra/job_logging: default
|
| 157 |
+
hydra/hydra_logging: default
|
| 158 |
+
hydra/hydra_help: default
|
| 159 |
+
hydra/help: default
|
| 160 |
+
hydra/sweeper: basic
|
| 161 |
+
hydra/launcher: basic
|
| 162 |
+
hydra/output: default
|
| 163 |
+
verbose: false
|
| 164 |
+
env_id: RBC3D-hard-v0
|
| 165 |
+
env_kwargs: {}
|
| 166 |
+
eval_env_kwargs: {}
|
| 167 |
+
seed: 4
|
| 168 |
+
rl_mode: marl
|
| 169 |
+
total_timesteps: 50000.0
|
| 170 |
+
n_eval_steps: 10
|
| 171 |
+
eval_freq: ${eval:${total_timesteps} // ${n_eval_steps}}
|
| 172 |
+
n_eval_episodes: 1
|
| 173 |
+
continue_training: false
|
| 174 |
+
checkpoint_latest: true
|
| 175 |
+
rl_device: cpu
|
| 176 |
+
eval_callback:
|
| 177 |
+
_target_: fluidgym.integration.sb3.EvalCallback
|
| 178 |
+
eval_freq: ${eval_freq}
|
| 179 |
+
n_eval_episodes: ${n_eval_episodes}
|
| 180 |
+
use_wandb: ${wandb.enable}
|
| 181 |
+
checkpoint_latest: ${checkpoint_latest}
|
| 182 |
+
wandb:
|
| 183 |
+
enable: true
|
| 184 |
+
entity: safe-autonomous-systems
|
| 185 |
+
project: jbecktepe-fluidgym
|
| 186 |
+
algorithm:
|
| 187 |
+
name: SAC
|
| 188 |
+
obj:
|
| 189 |
+
_target_: stable_baselines3.sac.sac.SAC
|
| 190 |
+
policy: MlpPolicy
|
| 191 |
+
learning_rate: 0.0003
|
| 192 |
+
buffer_size: 1000000
|
| 193 |
+
learning_starts: 100
|
| 194 |
+
batch_size: 256
|
| 195 |
+
tau: 0.005
|
| 196 |
+
gamma: 0.99
|
| 197 |
+
train_freq: 1
|
| 198 |
+
gradient_steps: -1
|
| 199 |
+
action_noise: null
|
| 200 |
+
replay_buffer_class: null
|
| 201 |
+
replay_buffer_kwargs: null
|
| 202 |
+
optimize_memory_usage: false
|
| 203 |
+
ent_coef: auto
|
| 204 |
+
target_update_interval: 1
|
| 205 |
+
target_entropy: auto
|
| 206 |
+
use_sde: false
|
| 207 |
+
sde_sample_freq: -1
|
| 208 |
+
use_sde_at_warmup: false
|
| 209 |
+
stats_window_size: 100
|
| 210 |
+
tensorboard_log: null
|
| 211 |
+
policy_kwargs: {}
|
| 212 |
+
verbose: 0
|
| 213 |
+
seed: ${seed}
|
| 214 |
+
device: cuda
|
| 215 |
+
_init_setup_model: true
|
| 216 |
+
cluster: {}
|
| 217 |
+
test_env_id: ${env_id}
|
| 218 |
+
test_env_kwargs: ${env_kwargs}
|
| 219 |
+
test_rl_mode: ${rl_mode}
|
| 220 |
+
n_test_episodes: 10
|
| 221 |
+
deterministic: true
|
| 222 |
+
save_frames: true
|
| 223 |
+
render_3d: true
|
4/overrides.yaml
ADDED
|
@@ -0,0 +1,4 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
- algorithm=sb3_sac
|
| 2 |
+
- env_id=RBC3D-hard-v0
|
| 3 |
+
- rl_mode=marl
|
| 4 |
+
- seed=4
|