Upload results for PPO on RBC3D-easy-v0.
Browse filesThis view is limited to 50 files because it contains too many changes.
See raw diff
- .gitattributes +20 -0
- 0/ckpt_latest.zip +3 -0
- 0/config.yaml +58 -0
- 0/hydra.yaml +163 -0
- 0/multirun.yaml +221 -0
- 0/overrides.yaml +4 -0
- 0/test/3d_temperature_test_eval_episode_0.gif +3 -0
- 0/test/test_eval_episode_0.csv +0 -0
- 0/test/x-y-temperature_test_eval_episode_0.gif +3 -0
- 0/test/x-z-temperature_test_eval_episode_0.gif +3 -0
- 0/test/y-z-temperature_test_eval_episode_0.gif +3 -0
- 0/training_log.csv +113 -0
- 1/ckpt_latest.zip +3 -0
- 1/config.yaml +58 -0
- 1/hydra.yaml +163 -0
- 1/multirun.yaml +221 -0
- 1/overrides.yaml +4 -0
- 1/test/3d_temperature_test_eval_episode_0.gif +3 -0
- 1/test/test_eval_episode_0.csv +0 -0
- 1/test/x-y-temperature_test_eval_episode_0.gif +3 -0
- 1/test/x-z-temperature_test_eval_episode_0.gif +3 -0
- 1/test/y-z-temperature_test_eval_episode_0.gif +3 -0
- 1/training_log.csv +113 -0
- 2/ckpt_latest.zip +3 -0
- 2/config.yaml +58 -0
- 2/hydra.yaml +163 -0
- 2/multirun.yaml +221 -0
- 2/overrides.yaml +4 -0
- 2/test/3d_temperature_test_eval_episode_0.gif +3 -0
- 2/test/test_eval_episode_0.csv +0 -0
- 2/test/x-y-temperature_test_eval_episode_0.gif +3 -0
- 2/test/x-z-temperature_test_eval_episode_0.gif +3 -0
- 2/test/y-z-temperature_test_eval_episode_0.gif +3 -0
- 2/training_log.csv +113 -0
- 3/ckpt_latest.zip +3 -0
- 3/config.yaml +58 -0
- 3/hydra.yaml +163 -0
- 3/multirun.yaml +221 -0
- 3/overrides.yaml +4 -0
- 3/test/3d_temperature_test_eval_episode_0.gif +3 -0
- 3/test/test_eval_episode_0.csv +0 -0
- 3/test/x-y-temperature_test_eval_episode_0.gif +3 -0
- 3/test/x-z-temperature_test_eval_episode_0.gif +3 -0
- 3/test/y-z-temperature_test_eval_episode_0.gif +3 -0
- 3/training_log.csv +113 -0
- 4/ckpt_latest.zip +3 -0
- 4/config.yaml +58 -0
- 4/hydra.yaml +163 -0
- 4/multirun.yaml +221 -0
- 4/overrides.yaml +4 -0
.gitattributes
CHANGED
|
@@ -33,3 +33,23 @@ saved_model/**/* filter=lfs diff=lfs merge=lfs -text
|
|
| 33 |
*.zip filter=lfs diff=lfs merge=lfs -text
|
| 34 |
*.zst filter=lfs diff=lfs merge=lfs -text
|
| 35 |
*tfevents* filter=lfs diff=lfs merge=lfs -text
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 33 |
*.zip filter=lfs diff=lfs merge=lfs -text
|
| 34 |
*.zst filter=lfs diff=lfs merge=lfs -text
|
| 35 |
*tfevents* filter=lfs diff=lfs merge=lfs -text
|
| 36 |
+
0/test/3d_temperature_test_eval_episode_0.gif filter=lfs diff=lfs merge=lfs -text
|
| 37 |
+
0/test/x-y-temperature_test_eval_episode_0.gif filter=lfs diff=lfs merge=lfs -text
|
| 38 |
+
0/test/x-z-temperature_test_eval_episode_0.gif filter=lfs diff=lfs merge=lfs -text
|
| 39 |
+
0/test/y-z-temperature_test_eval_episode_0.gif filter=lfs diff=lfs merge=lfs -text
|
| 40 |
+
1/test/3d_temperature_test_eval_episode_0.gif filter=lfs diff=lfs merge=lfs -text
|
| 41 |
+
1/test/x-y-temperature_test_eval_episode_0.gif filter=lfs diff=lfs merge=lfs -text
|
| 42 |
+
1/test/x-z-temperature_test_eval_episode_0.gif filter=lfs diff=lfs merge=lfs -text
|
| 43 |
+
1/test/y-z-temperature_test_eval_episode_0.gif filter=lfs diff=lfs merge=lfs -text
|
| 44 |
+
2/test/3d_temperature_test_eval_episode_0.gif filter=lfs diff=lfs merge=lfs -text
|
| 45 |
+
2/test/x-y-temperature_test_eval_episode_0.gif filter=lfs diff=lfs merge=lfs -text
|
| 46 |
+
2/test/x-z-temperature_test_eval_episode_0.gif filter=lfs diff=lfs merge=lfs -text
|
| 47 |
+
2/test/y-z-temperature_test_eval_episode_0.gif filter=lfs diff=lfs merge=lfs -text
|
| 48 |
+
3/test/3d_temperature_test_eval_episode_0.gif filter=lfs diff=lfs merge=lfs -text
|
| 49 |
+
3/test/x-y-temperature_test_eval_episode_0.gif filter=lfs diff=lfs merge=lfs -text
|
| 50 |
+
3/test/x-z-temperature_test_eval_episode_0.gif filter=lfs diff=lfs merge=lfs -text
|
| 51 |
+
3/test/y-z-temperature_test_eval_episode_0.gif filter=lfs diff=lfs merge=lfs -text
|
| 52 |
+
4/test/3d_temperature_test_eval_episode_0.gif filter=lfs diff=lfs merge=lfs -text
|
| 53 |
+
4/test/x-y-temperature_test_eval_episode_0.gif filter=lfs diff=lfs merge=lfs -text
|
| 54 |
+
4/test/x-z-temperature_test_eval_episode_0.gif filter=lfs diff=lfs merge=lfs -text
|
| 55 |
+
4/test/y-z-temperature_test_eval_episode_0.gif filter=lfs diff=lfs merge=lfs -text
|
0/ckpt_latest.zip
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:2094613575a76ccd8cb0f352cf607e98238c83b335b0a8b56c8254a2c8e6d0fe
|
| 3 |
+
size 8844014
|
0/config.yaml
ADDED
|
@@ -0,0 +1,58 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
env_id: RBC3D-easy-v0
|
| 2 |
+
env_kwargs: {}
|
| 3 |
+
eval_env_kwargs: {}
|
| 4 |
+
seed: 0
|
| 5 |
+
rl_mode: marl
|
| 6 |
+
total_timesteps: 50000.0
|
| 7 |
+
n_eval_steps: 10
|
| 8 |
+
eval_freq: ${eval:${total_timesteps} // ${n_eval_steps}}
|
| 9 |
+
n_eval_episodes: 1
|
| 10 |
+
continue_training: false
|
| 11 |
+
checkpoint_latest: true
|
| 12 |
+
rl_device: cpu
|
| 13 |
+
eval_callback:
|
| 14 |
+
_target_: fluidgym.integration.sb3.EvalCallback
|
| 15 |
+
eval_freq: ${eval_freq}
|
| 16 |
+
n_eval_episodes: ${n_eval_episodes}
|
| 17 |
+
use_wandb: ${wandb.enable}
|
| 18 |
+
checkpoint_latest: ${checkpoint_latest}
|
| 19 |
+
wandb:
|
| 20 |
+
enable: true
|
| 21 |
+
entity: safe-autonomous-systems
|
| 22 |
+
project: jbecktepe-fluidgym
|
| 23 |
+
algorithm:
|
| 24 |
+
name: PPO
|
| 25 |
+
obj:
|
| 26 |
+
_target_: stable_baselines3.ppo.ppo.PPO
|
| 27 |
+
policy: MlpPolicy
|
| 28 |
+
learning_rate: 0.0003
|
| 29 |
+
n_steps: 2048
|
| 30 |
+
batch_size: 64
|
| 31 |
+
n_epochs: 10
|
| 32 |
+
gamma: 0.99
|
| 33 |
+
gae_lambda: 0.95
|
| 34 |
+
clip_range: 0.2
|
| 35 |
+
clip_range_vf: null
|
| 36 |
+
normalize_advantage: true
|
| 37 |
+
ent_coef: 0.01
|
| 38 |
+
vf_coef: 0.5
|
| 39 |
+
max_grad_norm: 0.5
|
| 40 |
+
use_sde: false
|
| 41 |
+
sde_sample_freq: -1
|
| 42 |
+
rollout_buffer_class: null
|
| 43 |
+
rollout_buffer_kwargs: null
|
| 44 |
+
target_kl: null
|
| 45 |
+
stats_window_size: 100
|
| 46 |
+
tensorboard_log: null
|
| 47 |
+
verbose: 0
|
| 48 |
+
seed: ${seed}
|
| 49 |
+
device: ${rl_device}
|
| 50 |
+
_init_setup_model: true
|
| 51 |
+
cluster: {}
|
| 52 |
+
test_env_id: ${env_id}
|
| 53 |
+
test_env_kwargs: ${env_kwargs}
|
| 54 |
+
test_rl_mode: ${rl_mode}
|
| 55 |
+
n_test_episodes: 10
|
| 56 |
+
deterministic: true
|
| 57 |
+
save_frames: true
|
| 58 |
+
render_3d: true
|
0/hydra.yaml
ADDED
|
@@ -0,0 +1,163 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
hydra:
|
| 2 |
+
run:
|
| 3 |
+
dir: output/training/${rl_mode}/${env_id}/${algorithm.name}/${seed}
|
| 4 |
+
sweep:
|
| 5 |
+
dir: output/training/${rl_mode}/${env_id}/${algorithm.name}/${seed}
|
| 6 |
+
subdir: ''
|
| 7 |
+
launcher:
|
| 8 |
+
_target_: hydra._internal.core_plugins.basic_launcher.BasicLauncher
|
| 9 |
+
sweeper:
|
| 10 |
+
_target_: hydra._internal.core_plugins.basic_sweeper.BasicSweeper
|
| 11 |
+
max_batch_size: null
|
| 12 |
+
params: null
|
| 13 |
+
help:
|
| 14 |
+
app_name: ${hydra.job.name}
|
| 15 |
+
header: '${hydra.help.app_name} is powered by Hydra.
|
| 16 |
+
|
| 17 |
+
'
|
| 18 |
+
footer: 'Powered by Hydra (https://hydra.cc)
|
| 19 |
+
|
| 20 |
+
Use --hydra-help to view Hydra specific help
|
| 21 |
+
|
| 22 |
+
'
|
| 23 |
+
template: '${hydra.help.header}
|
| 24 |
+
|
| 25 |
+
== Configuration groups ==
|
| 26 |
+
|
| 27 |
+
Compose your configuration from those groups (group=option)
|
| 28 |
+
|
| 29 |
+
|
| 30 |
+
$APP_CONFIG_GROUPS
|
| 31 |
+
|
| 32 |
+
|
| 33 |
+
== Config ==
|
| 34 |
+
|
| 35 |
+
Override anything in the config (foo.bar=value)
|
| 36 |
+
|
| 37 |
+
|
| 38 |
+
$CONFIG
|
| 39 |
+
|
| 40 |
+
|
| 41 |
+
${hydra.help.footer}
|
| 42 |
+
|
| 43 |
+
'
|
| 44 |
+
hydra_help:
|
| 45 |
+
template: 'Hydra (${hydra.runtime.version})
|
| 46 |
+
|
| 47 |
+
See https://hydra.cc for more info.
|
| 48 |
+
|
| 49 |
+
|
| 50 |
+
== Flags ==
|
| 51 |
+
|
| 52 |
+
$FLAGS_HELP
|
| 53 |
+
|
| 54 |
+
|
| 55 |
+
== Configuration groups ==
|
| 56 |
+
|
| 57 |
+
Compose your configuration from those groups (For example, append hydra/job_logging=disabled
|
| 58 |
+
to command line)
|
| 59 |
+
|
| 60 |
+
|
| 61 |
+
$HYDRA_CONFIG_GROUPS
|
| 62 |
+
|
| 63 |
+
|
| 64 |
+
Use ''--cfg hydra'' to Show the Hydra config.
|
| 65 |
+
|
| 66 |
+
'
|
| 67 |
+
hydra_help: ???
|
| 68 |
+
hydra_logging:
|
| 69 |
+
version: 1
|
| 70 |
+
formatters:
|
| 71 |
+
simple:
|
| 72 |
+
format: '[%(asctime)s][HYDRA] %(message)s'
|
| 73 |
+
handlers:
|
| 74 |
+
console:
|
| 75 |
+
class: logging.StreamHandler
|
| 76 |
+
formatter: simple
|
| 77 |
+
stream: ext://sys.stdout
|
| 78 |
+
root:
|
| 79 |
+
level: INFO
|
| 80 |
+
handlers:
|
| 81 |
+
- console
|
| 82 |
+
loggers:
|
| 83 |
+
logging_example:
|
| 84 |
+
level: DEBUG
|
| 85 |
+
disable_existing_loggers: false
|
| 86 |
+
job_logging:
|
| 87 |
+
version: 1
|
| 88 |
+
formatters:
|
| 89 |
+
simple:
|
| 90 |
+
format: '[%(asctime)s][%(name)s][%(levelname)s] - %(message)s'
|
| 91 |
+
handlers:
|
| 92 |
+
console:
|
| 93 |
+
class: logging.StreamHandler
|
| 94 |
+
formatter: simple
|
| 95 |
+
stream: ext://sys.stdout
|
| 96 |
+
file:
|
| 97 |
+
class: logging.FileHandler
|
| 98 |
+
formatter: simple
|
| 99 |
+
filename: ${hydra.runtime.output_dir}/${hydra.job.name}.log
|
| 100 |
+
root:
|
| 101 |
+
level: INFO
|
| 102 |
+
handlers:
|
| 103 |
+
- console
|
| 104 |
+
- file
|
| 105 |
+
disable_existing_loggers: false
|
| 106 |
+
env: {}
|
| 107 |
+
mode: MULTIRUN
|
| 108 |
+
searchpath: []
|
| 109 |
+
callbacks: {}
|
| 110 |
+
output_subdir: .
|
| 111 |
+
overrides:
|
| 112 |
+
hydra:
|
| 113 |
+
- hydra.mode=MULTIRUN
|
| 114 |
+
task:
|
| 115 |
+
- algorithm=sb3_ppo
|
| 116 |
+
- env_id=RBC3D-easy-v0
|
| 117 |
+
- rl_mode=marl
|
| 118 |
+
- seed=0
|
| 119 |
+
job:
|
| 120 |
+
name: test_sb3
|
| 121 |
+
chdir: true
|
| 122 |
+
override_dirname: algorithm=sb3_ppo,env_id=RBC3D-easy-v0,rl_mode=marl,seed=0
|
| 123 |
+
id: '0'
|
| 124 |
+
num: 0
|
| 125 |
+
config_name: test_sb3
|
| 126 |
+
env_set: {}
|
| 127 |
+
env_copy: []
|
| 128 |
+
config:
|
| 129 |
+
override_dirname:
|
| 130 |
+
kv_sep: '='
|
| 131 |
+
item_sep: ','
|
| 132 |
+
exclude_keys: []
|
| 133 |
+
runtime:
|
| 134 |
+
version: 1.3.2
|
| 135 |
+
version_base: '1.3'
|
| 136 |
+
cwd: /cephfs/users/becktepe/git_projects/FluidGym
|
| 137 |
+
config_sources:
|
| 138 |
+
- path: hydra.conf
|
| 139 |
+
schema: pkg
|
| 140 |
+
provider: hydra
|
| 141 |
+
- path: /cephfs/users/becktepe/git_projects/FluidGym/runscripts/configs
|
| 142 |
+
schema: file
|
| 143 |
+
provider: main
|
| 144 |
+
- path: hydra_plugins.hydra_colorlog.conf
|
| 145 |
+
schema: pkg
|
| 146 |
+
provider: hydra-colorlog
|
| 147 |
+
- path: ''
|
| 148 |
+
schema: structured
|
| 149 |
+
provider: schema
|
| 150 |
+
output_dir: /cephfs/users/becktepe/git_projects/FluidGym/output/training/marl/RBC3D-easy-v0/PPO/0
|
| 151 |
+
choices:
|
| 152 |
+
cluster: local
|
| 153 |
+
algorithm: sb3_ppo
|
| 154 |
+
hydra/env: default
|
| 155 |
+
hydra/callbacks: null
|
| 156 |
+
hydra/job_logging: default
|
| 157 |
+
hydra/hydra_logging: default
|
| 158 |
+
hydra/hydra_help: default
|
| 159 |
+
hydra/help: default
|
| 160 |
+
hydra/sweeper: basic
|
| 161 |
+
hydra/launcher: basic
|
| 162 |
+
hydra/output: default
|
| 163 |
+
verbose: false
|
0/multirun.yaml
ADDED
|
@@ -0,0 +1,221 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
hydra:
|
| 2 |
+
run:
|
| 3 |
+
dir: output/training/${rl_mode}/${env_id}/${algorithm.name}/${seed}
|
| 4 |
+
sweep:
|
| 5 |
+
dir: output/training/${rl_mode}/${env_id}/${algorithm.name}/${seed}
|
| 6 |
+
subdir: ''
|
| 7 |
+
launcher:
|
| 8 |
+
_target_: hydra._internal.core_plugins.basic_launcher.BasicLauncher
|
| 9 |
+
sweeper:
|
| 10 |
+
_target_: hydra._internal.core_plugins.basic_sweeper.BasicSweeper
|
| 11 |
+
max_batch_size: null
|
| 12 |
+
params: null
|
| 13 |
+
help:
|
| 14 |
+
app_name: ${hydra.job.name}
|
| 15 |
+
header: '${hydra.help.app_name} is powered by Hydra.
|
| 16 |
+
|
| 17 |
+
'
|
| 18 |
+
footer: 'Powered by Hydra (https://hydra.cc)
|
| 19 |
+
|
| 20 |
+
Use --hydra-help to view Hydra specific help
|
| 21 |
+
|
| 22 |
+
'
|
| 23 |
+
template: '${hydra.help.header}
|
| 24 |
+
|
| 25 |
+
== Configuration groups ==
|
| 26 |
+
|
| 27 |
+
Compose your configuration from those groups (group=option)
|
| 28 |
+
|
| 29 |
+
|
| 30 |
+
$APP_CONFIG_GROUPS
|
| 31 |
+
|
| 32 |
+
|
| 33 |
+
== Config ==
|
| 34 |
+
|
| 35 |
+
Override anything in the config (foo.bar=value)
|
| 36 |
+
|
| 37 |
+
|
| 38 |
+
$CONFIG
|
| 39 |
+
|
| 40 |
+
|
| 41 |
+
${hydra.help.footer}
|
| 42 |
+
|
| 43 |
+
'
|
| 44 |
+
hydra_help:
|
| 45 |
+
template: 'Hydra (${hydra.runtime.version})
|
| 46 |
+
|
| 47 |
+
See https://hydra.cc for more info.
|
| 48 |
+
|
| 49 |
+
|
| 50 |
+
== Flags ==
|
| 51 |
+
|
| 52 |
+
$FLAGS_HELP
|
| 53 |
+
|
| 54 |
+
|
| 55 |
+
== Configuration groups ==
|
| 56 |
+
|
| 57 |
+
Compose your configuration from those groups (For example, append hydra/job_logging=disabled
|
| 58 |
+
to command line)
|
| 59 |
+
|
| 60 |
+
|
| 61 |
+
$HYDRA_CONFIG_GROUPS
|
| 62 |
+
|
| 63 |
+
|
| 64 |
+
Use ''--cfg hydra'' to Show the Hydra config.
|
| 65 |
+
|
| 66 |
+
'
|
| 67 |
+
hydra_help: ???
|
| 68 |
+
hydra_logging:
|
| 69 |
+
version: 1
|
| 70 |
+
formatters:
|
| 71 |
+
simple:
|
| 72 |
+
format: '[%(asctime)s][HYDRA] %(message)s'
|
| 73 |
+
handlers:
|
| 74 |
+
console:
|
| 75 |
+
class: logging.StreamHandler
|
| 76 |
+
formatter: simple
|
| 77 |
+
stream: ext://sys.stdout
|
| 78 |
+
root:
|
| 79 |
+
level: INFO
|
| 80 |
+
handlers:
|
| 81 |
+
- console
|
| 82 |
+
loggers:
|
| 83 |
+
logging_example:
|
| 84 |
+
level: DEBUG
|
| 85 |
+
disable_existing_loggers: false
|
| 86 |
+
job_logging:
|
| 87 |
+
version: 1
|
| 88 |
+
formatters:
|
| 89 |
+
simple:
|
| 90 |
+
format: '[%(asctime)s][%(name)s][%(levelname)s] - %(message)s'
|
| 91 |
+
handlers:
|
| 92 |
+
console:
|
| 93 |
+
class: logging.StreamHandler
|
| 94 |
+
formatter: simple
|
| 95 |
+
stream: ext://sys.stdout
|
| 96 |
+
file:
|
| 97 |
+
class: logging.FileHandler
|
| 98 |
+
formatter: simple
|
| 99 |
+
filename: ${hydra.runtime.output_dir}/${hydra.job.name}.log
|
| 100 |
+
root:
|
| 101 |
+
level: INFO
|
| 102 |
+
handlers:
|
| 103 |
+
- console
|
| 104 |
+
- file
|
| 105 |
+
disable_existing_loggers: false
|
| 106 |
+
env: {}
|
| 107 |
+
mode: MULTIRUN
|
| 108 |
+
searchpath: []
|
| 109 |
+
callbacks: {}
|
| 110 |
+
output_subdir: .
|
| 111 |
+
overrides:
|
| 112 |
+
hydra:
|
| 113 |
+
- hydra.mode=MULTIRUN
|
| 114 |
+
task:
|
| 115 |
+
- algorithm=sb3_ppo
|
| 116 |
+
- env_id=RBC3D-easy-v0
|
| 117 |
+
- rl_mode=marl
|
| 118 |
+
- seed=0
|
| 119 |
+
job:
|
| 120 |
+
name: test_sb3
|
| 121 |
+
chdir: true
|
| 122 |
+
override_dirname: algorithm=sb3_ppo,env_id=RBC3D-easy-v0,rl_mode=marl,seed=0
|
| 123 |
+
id: ???
|
| 124 |
+
num: ???
|
| 125 |
+
config_name: test_sb3
|
| 126 |
+
env_set: {}
|
| 127 |
+
env_copy: []
|
| 128 |
+
config:
|
| 129 |
+
override_dirname:
|
| 130 |
+
kv_sep: '='
|
| 131 |
+
item_sep: ','
|
| 132 |
+
exclude_keys: []
|
| 133 |
+
runtime:
|
| 134 |
+
version: 1.3.2
|
| 135 |
+
version_base: '1.3'
|
| 136 |
+
cwd: /cephfs/users/becktepe/git_projects/FluidGym
|
| 137 |
+
config_sources:
|
| 138 |
+
- path: hydra.conf
|
| 139 |
+
schema: pkg
|
| 140 |
+
provider: hydra
|
| 141 |
+
- path: /cephfs/users/becktepe/git_projects/FluidGym/runscripts/configs
|
| 142 |
+
schema: file
|
| 143 |
+
provider: main
|
| 144 |
+
- path: hydra_plugins.hydra_colorlog.conf
|
| 145 |
+
schema: pkg
|
| 146 |
+
provider: hydra-colorlog
|
| 147 |
+
- path: ''
|
| 148 |
+
schema: structured
|
| 149 |
+
provider: schema
|
| 150 |
+
output_dir: ???
|
| 151 |
+
choices:
|
| 152 |
+
cluster: local
|
| 153 |
+
algorithm: sb3_ppo
|
| 154 |
+
hydra/env: default
|
| 155 |
+
hydra/callbacks: null
|
| 156 |
+
hydra/job_logging: default
|
| 157 |
+
hydra/hydra_logging: default
|
| 158 |
+
hydra/hydra_help: default
|
| 159 |
+
hydra/help: default
|
| 160 |
+
hydra/sweeper: basic
|
| 161 |
+
hydra/launcher: basic
|
| 162 |
+
hydra/output: default
|
| 163 |
+
verbose: false
|
| 164 |
+
env_id: RBC3D-easy-v0
|
| 165 |
+
env_kwargs: {}
|
| 166 |
+
eval_env_kwargs: {}
|
| 167 |
+
seed: 0
|
| 168 |
+
rl_mode: marl
|
| 169 |
+
total_timesteps: 50000.0
|
| 170 |
+
n_eval_steps: 10
|
| 171 |
+
eval_freq: ${eval:${total_timesteps} // ${n_eval_steps}}
|
| 172 |
+
n_eval_episodes: 1
|
| 173 |
+
continue_training: false
|
| 174 |
+
checkpoint_latest: true
|
| 175 |
+
rl_device: cpu
|
| 176 |
+
eval_callback:
|
| 177 |
+
_target_: fluidgym.integration.sb3.EvalCallback
|
| 178 |
+
eval_freq: ${eval_freq}
|
| 179 |
+
n_eval_episodes: ${n_eval_episodes}
|
| 180 |
+
use_wandb: ${wandb.enable}
|
| 181 |
+
checkpoint_latest: ${checkpoint_latest}
|
| 182 |
+
wandb:
|
| 183 |
+
enable: true
|
| 184 |
+
entity: safe-autonomous-systems
|
| 185 |
+
project: jbecktepe-fluidgym
|
| 186 |
+
algorithm:
|
| 187 |
+
name: PPO
|
| 188 |
+
obj:
|
| 189 |
+
_target_: stable_baselines3.ppo.ppo.PPO
|
| 190 |
+
policy: MlpPolicy
|
| 191 |
+
learning_rate: 0.0003
|
| 192 |
+
n_steps: 2048
|
| 193 |
+
batch_size: 64
|
| 194 |
+
n_epochs: 10
|
| 195 |
+
gamma: 0.99
|
| 196 |
+
gae_lambda: 0.95
|
| 197 |
+
clip_range: 0.2
|
| 198 |
+
clip_range_vf: null
|
| 199 |
+
normalize_advantage: true
|
| 200 |
+
ent_coef: 0.01
|
| 201 |
+
vf_coef: 0.5
|
| 202 |
+
max_grad_norm: 0.5
|
| 203 |
+
use_sde: false
|
| 204 |
+
sde_sample_freq: -1
|
| 205 |
+
rollout_buffer_class: null
|
| 206 |
+
rollout_buffer_kwargs: null
|
| 207 |
+
target_kl: null
|
| 208 |
+
stats_window_size: 100
|
| 209 |
+
tensorboard_log: null
|
| 210 |
+
verbose: 0
|
| 211 |
+
seed: ${seed}
|
| 212 |
+
device: ${rl_device}
|
| 213 |
+
_init_setup_model: true
|
| 214 |
+
cluster: {}
|
| 215 |
+
test_env_id: ${env_id}
|
| 216 |
+
test_env_kwargs: ${env_kwargs}
|
| 217 |
+
test_rl_mode: ${rl_mode}
|
| 218 |
+
n_test_episodes: 10
|
| 219 |
+
deterministic: true
|
| 220 |
+
save_frames: true
|
| 221 |
+
render_3d: true
|
0/overrides.yaml
ADDED
|
@@ -0,0 +1,4 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
- algorithm=sb3_ppo
|
| 2 |
+
- env_id=RBC3D-easy-v0
|
| 3 |
+
- rl_mode=marl
|
| 4 |
+
- seed=0
|
0/test/3d_temperature_test_eval_episode_0.gif
ADDED
|
Git LFS Details
|
0/test/test_eval_episode_0.csv
ADDED
|
The diff for this file is too large to render.
See raw diff
|
|
|
0/test/x-y-temperature_test_eval_episode_0.gif
ADDED
|
Git LFS Details
|
0/test/x-z-temperature_test_eval_episode_0.gif
ADDED
|
Git LFS Details
|
0/test/y-z-temperature_test_eval_episode_0.gif
ADDED
|
Git LFS Details
|
0/training_log.csv
ADDED
|
@@ -0,0 +1,113 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
step,training/mean_reward,training/mean_global_reward,training/mean_nusselt,evaluation/mean_nusselt,evaluation/mean_reward
|
| 2 |
+
500,-0.03450341895222664,-0.034503421783447265,2.21608633852005,,
|
| 3 |
+
1000,-0.04744487628340721,-0.04744487380981445,2.2290278015136717,,
|
| 4 |
+
1500,-0.07780329138040543,-0.07780329942703247,2.259386221885681,,
|
| 5 |
+
2000,-0.06185987964272499,-0.06185988235473633,2.2434428148269654,,
|
| 6 |
+
2500,-0.014688276685774326,-0.014688277721405029,2.1962711925506593,,
|
| 7 |
+
3000,-0.0866512879729271,-0.08665128946304321,2.268234219074249,,
|
| 8 |
+
3500,-0.045226745307445526,-0.045226747989654544,2.2268096861839295,,
|
| 9 |
+
4000,-0.05605094134807587,-0.05605093860626221,2.2376338682174683,,
|
| 10 |
+
4500,-0.01419476605951786,-0.014194766044616699,2.1957777061462402,,
|
| 11 |
+
5000,0.01904117874801159,0.01904117965698242,2.1625417394638062,,
|
| 12 |
+
5000,,,,2.1481730163097383,0.033409908413887024
|
| 13 |
+
5500,0.005845546722412109,0.005845546722412109,2.1757373745441435,,
|
| 14 |
+
6000,-0.02578740380704403,-0.02578740406036377,2.2073703379631042,,
|
| 15 |
+
6500,-0.006663489155471325,-0.006663490295410157,2.1882464270591737,,
|
| 16 |
+
7000,-0.02166476845741272,-0.021664767742156983,2.2032477045059204,,
|
| 17 |
+
7500,0.008638587780296803,0.008638587474822998,2.172944338798523,,
|
| 18 |
+
8000,0.011830026283860207,0.011830027103424073,2.169752900838852,,
|
| 19 |
+
8500,0.024285053834319115,0.02428505277633667,2.157297875881195,,
|
| 20 |
+
9000,0.00818329956382513,0.008183300495147705,2.173399622678757,,
|
| 21 |
+
9500,0.0668615847826004,0.06686158275604248,2.114721347332001,,
|
| 22 |
+
10000,0.057360075414180756,0.05736007666587829,2.1242228457927705,,
|
| 23 |
+
10000,,,,2.097888413667679,0.08369451016187668
|
| 24 |
+
10500,0.06884069740772247,0.0688406994342804,2.1127422280311583,,
|
| 25 |
+
11000,0.02789771370589733,0.02789771556854248,2.1536852095127106,,
|
| 26 |
+
11500,0.09138531237840652,0.09138531303405761,2.0901976108551024,,
|
| 27 |
+
12000,0.10403602570295334,0.10403602051734924,2.0775469059944154,,
|
| 28 |
+
12500,0.08804373443126678,0.08804372334480286,2.093539213895798,,
|
| 29 |
+
13000,0.13331347703933716,0.1333134868144989,2.0482694232463836,,
|
| 30 |
+
13500,0.10579406470060349,0.1057940742969513,2.075788856506348,,
|
| 31 |
+
14000,0.1302189975976944,0.13021900272369386,2.051363911628723,,
|
| 32 |
+
14500,0.14101365208625793,0.1410136513710022,2.040569269657135,,
|
| 33 |
+
15000,0.08936165273189545,0.08936165833473206,2.0922212710380554,,
|
| 34 |
+
15000,,,,1.8774564373493194,0.304126501083374
|
| 35 |
+
15500,0.0895434096455574,0.08954341077804566,2.092039510965347,,
|
| 36 |
+
16000,0.021286876872181892,0.021286877155303956,2.160296056509018,,
|
| 37 |
+
16500,0.08324971050024033,0.08324971103668213,2.098333217382431,,
|
| 38 |
+
17000,0.11891013383865356,0.11891013669967651,2.062672791004181,,
|
| 39 |
+
17500,0.13359619677066803,0.1335961949825287,2.0479867279529573,,
|
| 40 |
+
18000,0.12700319290161133,0.12700318574905395,2.054579733133316,,
|
| 41 |
+
18500,0.16050726175308228,0.1605072796344757,2.0210756483078005,,
|
| 42 |
+
19000,0.11986298859119415,0.11986299753189086,2.0617199251651765,,
|
| 43 |
+
19500,0.18126916885375977,0.1812691767215729,2.000313750743866,,
|
| 44 |
+
20000,0.18594513833522797,0.1859451537132263,1.9956377680301667,,
|
| 45 |
+
20000,,,,1.8686068803071976,0.31297603249549866
|
| 46 |
+
20500,0.15597958862781525,0.15597958087921143,2.0256033458709717,,
|
| 47 |
+
21000,0.1916520595550537,0.19165206623077394,1.9899308605194093,,
|
| 48 |
+
21500,0.1818467378616333,0.18184674453735353,1.9997361936569213,,
|
| 49 |
+
22000,0.1905975043773651,0.1905975136756897,1.9909854114055634,,
|
| 50 |
+
22500,0.1405470371246338,0.14054704189300538,2.0410358879566193,,
|
| 51 |
+
23000,0.21267107129096985,0.21267105317115784,1.968911864042282,,
|
| 52 |
+
23500,0.1852109283208847,0.18521092104911804,1.996372008562088,,
|
| 53 |
+
24000,0.18475738167762756,0.18475737261772157,1.9968255643844603,,
|
| 54 |
+
24500,0.19879989326000214,0.1987998914718628,1.982783041715622,,
|
| 55 |
+
25000,0.22323256731033325,0.22323257732391358,1.9583503544330596,,
|
| 56 |
+
25000,,,,1.8338491117954254,0.3477337956428528
|
| 57 |
+
25500,0.22924970090389252,0.22924968600273132,1.9523332455158233,,
|
| 58 |
+
26000,0.22784361243247986,0.22784361505508424,1.9537393190860748,,
|
| 59 |
+
26500,0.21676860749721527,0.2167686059474945,1.9648143317699431,,
|
| 60 |
+
27000,0.1593806892633438,0.15938069558143617,2.022202234506607,,
|
| 61 |
+
27500,0.18888811767101288,0.1888881220817566,1.9926947934627532,,
|
| 62 |
+
28000,0.17867620289325714,0.17867620348930358,2.0029067261219025,,
|
| 63 |
+
28500,0.19584621489048004,0.19584622168540955,1.985736694574356,,
|
| 64 |
+
29000,0.18205171823501587,0.18205172967910765,1.9995312101840972,,
|
| 65 |
+
29500,0.20991070568561554,0.2099106981754303,1.9716722218990326,,
|
| 66 |
+
30000,0.166031613945961,0.16603161525726318,2.0155513136386873,,
|
| 67 |
+
30000,,,,1.8590470081567765,0.322535902261734
|
| 68 |
+
30500,0.19970406591892242,0.19970405888557435,1.98187886428833,,
|
| 69 |
+
31000,0.2315494418144226,0.23154943919181822,1.9500334920883178,,
|
| 70 |
+
31500,0.22102193534374237,0.22102192211151123,1.9605610048770905,,
|
| 71 |
+
32000,0.23556064069271088,0.2355606198310852,1.946022305727005,,
|
| 72 |
+
32500,0.22610223293304443,0.22610224103927612,1.9554806892871857,,
|
| 73 |
+
33000,0.2338980883359909,0.23389808917045593,1.9476848378181457,,
|
| 74 |
+
33500,0.2303069829940796,0.23030698490142823,1.9512759561538697,,
|
| 75 |
+
34000,0.20536114275455475,0.20536115288734436,1.9762217633724213,,
|
| 76 |
+
34500,0.238141268491745,0.238141277551651,1.943441642999649,,
|
| 77 |
+
35000,0.19898933172225952,0.19898933744430541,1.9825935895442963,,
|
| 78 |
+
35000,,,,1.8403058993816375,0.34127700328826904
|
| 79 |
+
35500,0.20283499360084534,0.2028350086212158,1.9787479271888733,,
|
| 80 |
+
36000,0.18234245479106903,0.1823424563407898,1.9992404680252076,,
|
| 81 |
+
36500,0.19815360009670258,0.19815361189842223,1.9834293143749238,,
|
| 82 |
+
37000,0.23277856409549713,0.2327785701751709,1.9488043575286864,,
|
| 83 |
+
37500,0.2118435949087143,0.21184361171722413,1.969739307165146,,
|
| 84 |
+
38000,0.19836951792240143,0.19836953949928285,1.9832133975028992,,
|
| 85 |
+
38500,0.2093891203403473,0.20938913536071777,1.9721937882900238,,
|
| 86 |
+
39000,0.19542239606380463,0.19542239141464232,1.9861605288982391,,
|
| 87 |
+
39500,0.1940208375453949,0.19402081966400148,1.9875621078014374,,
|
| 88 |
+
40000,0.1852363497018814,0.18523633670806885,1.996346591234207,,
|
| 89 |
+
40000,,,,1.800716791152954,0.380866140127182
|
| 90 |
+
40500,0.1866176277399063,0.18661761355400086,1.994965318441391,,
|
| 91 |
+
41000,0.185668483376503,0.18566848945617676,1.9959144315719604,,
|
| 92 |
+
41500,0.19251126050949097,0.19251125502586364,1.989071682214737,,
|
| 93 |
+
42000,0.18013466894626617,0.18013468408584596,2.0014482305049897,,
|
| 94 |
+
42500,0.18430715799331665,0.18430715322494506,1.9972757818698883,,
|
| 95 |
+
43000,0.1435137391090393,0.14351374077796936,2.038069188117981,,
|
| 96 |
+
43500,0.2033105194568634,0.20331051993370056,1.9782724118232726,,
|
| 97 |
+
44000,0.20817968249320984,0.20817968583106994,1.9734032518863678,,
|
| 98 |
+
44500,0.21687616407871246,0.2168761546611786,1.9647067737579347,,
|
| 99 |
+
45000,0.19658063352108002,0.1965806143283844,1.985002319097519,,
|
| 100 |
+
45000,,,,1.8179256582260133,0.36365726590156555
|
| 101 |
+
45500,0.20966705679893494,0.20966703510284423,1.971915880203247,,
|
| 102 |
+
46000,0.18730169534683228,0.18730170702934265,1.9942812123298645,,
|
| 103 |
+
46500,0.19382217526435852,0.19382215762138366,1.987760773897171,,
|
| 104 |
+
47000,0.22278591990470886,0.22278594374656677,1.9587969834804535,,
|
| 105 |
+
47500,0.22301596403121948,0.22301595544815064,1.9585669672489165,,
|
| 106 |
+
48000,0.23117610812187195,0.23117612409591676,1.9504068081378936,,
|
| 107 |
+
48500,0.23507076501846313,0.23507076692581177,1.9465121581554412,,
|
| 108 |
+
49000,0.21670731902122498,0.21670731854438782,1.9648756036758424,,
|
| 109 |
+
49500,0.2592141628265381,0.2592141625881195,1.922368763923645,,
|
| 110 |
+
50000,0.2537287175655365,0.25372872352600095,1.9278542079925538,,
|
| 111 |
+
50000,,,,1.8115031439065934,0.37007978558540344
|
| 112 |
+
50500,0.2584187686443329,0.25841876912117007,1.9231641564369202,,
|
| 113 |
+
51000,0.2644350826740265,0.26443511295318606,1.9171478066444396,,
|
1/ckpt_latest.zip
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:6943cf968ed6f8a5bdad56e7166a81f45b8c66888164483fb7c9ad27247d04bd
|
| 3 |
+
size 8844018
|
1/config.yaml
ADDED
|
@@ -0,0 +1,58 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
env_id: RBC3D-easy-v0
|
| 2 |
+
env_kwargs: {}
|
| 3 |
+
eval_env_kwargs: {}
|
| 4 |
+
seed: 1
|
| 5 |
+
rl_mode: marl
|
| 6 |
+
total_timesteps: 50000.0
|
| 7 |
+
n_eval_steps: 10
|
| 8 |
+
eval_freq: ${eval:${total_timesteps} // ${n_eval_steps}}
|
| 9 |
+
n_eval_episodes: 1
|
| 10 |
+
continue_training: false
|
| 11 |
+
checkpoint_latest: true
|
| 12 |
+
rl_device: cpu
|
| 13 |
+
eval_callback:
|
| 14 |
+
_target_: fluidgym.integration.sb3.EvalCallback
|
| 15 |
+
eval_freq: ${eval_freq}
|
| 16 |
+
n_eval_episodes: ${n_eval_episodes}
|
| 17 |
+
use_wandb: ${wandb.enable}
|
| 18 |
+
checkpoint_latest: ${checkpoint_latest}
|
| 19 |
+
wandb:
|
| 20 |
+
enable: true
|
| 21 |
+
entity: safe-autonomous-systems
|
| 22 |
+
project: jbecktepe-fluidgym
|
| 23 |
+
algorithm:
|
| 24 |
+
name: PPO
|
| 25 |
+
obj:
|
| 26 |
+
_target_: stable_baselines3.ppo.ppo.PPO
|
| 27 |
+
policy: MlpPolicy
|
| 28 |
+
learning_rate: 0.0003
|
| 29 |
+
n_steps: 2048
|
| 30 |
+
batch_size: 64
|
| 31 |
+
n_epochs: 10
|
| 32 |
+
gamma: 0.99
|
| 33 |
+
gae_lambda: 0.95
|
| 34 |
+
clip_range: 0.2
|
| 35 |
+
clip_range_vf: null
|
| 36 |
+
normalize_advantage: true
|
| 37 |
+
ent_coef: 0.01
|
| 38 |
+
vf_coef: 0.5
|
| 39 |
+
max_grad_norm: 0.5
|
| 40 |
+
use_sde: false
|
| 41 |
+
sde_sample_freq: -1
|
| 42 |
+
rollout_buffer_class: null
|
| 43 |
+
rollout_buffer_kwargs: null
|
| 44 |
+
target_kl: null
|
| 45 |
+
stats_window_size: 100
|
| 46 |
+
tensorboard_log: null
|
| 47 |
+
verbose: 0
|
| 48 |
+
seed: ${seed}
|
| 49 |
+
device: ${rl_device}
|
| 50 |
+
_init_setup_model: true
|
| 51 |
+
cluster: {}
|
| 52 |
+
test_env_id: ${env_id}
|
| 53 |
+
test_env_kwargs: ${env_kwargs}
|
| 54 |
+
test_rl_mode: ${rl_mode}
|
| 55 |
+
n_test_episodes: 10
|
| 56 |
+
deterministic: true
|
| 57 |
+
save_frames: true
|
| 58 |
+
render_3d: true
|
1/hydra.yaml
ADDED
|
@@ -0,0 +1,163 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
hydra:
|
| 2 |
+
run:
|
| 3 |
+
dir: output/training/${rl_mode}/${env_id}/${algorithm.name}/${seed}
|
| 4 |
+
sweep:
|
| 5 |
+
dir: output/training/${rl_mode}/${env_id}/${algorithm.name}/${seed}
|
| 6 |
+
subdir: ''
|
| 7 |
+
launcher:
|
| 8 |
+
_target_: hydra._internal.core_plugins.basic_launcher.BasicLauncher
|
| 9 |
+
sweeper:
|
| 10 |
+
_target_: hydra._internal.core_plugins.basic_sweeper.BasicSweeper
|
| 11 |
+
max_batch_size: null
|
| 12 |
+
params: null
|
| 13 |
+
help:
|
| 14 |
+
app_name: ${hydra.job.name}
|
| 15 |
+
header: '${hydra.help.app_name} is powered by Hydra.
|
| 16 |
+
|
| 17 |
+
'
|
| 18 |
+
footer: 'Powered by Hydra (https://hydra.cc)
|
| 19 |
+
|
| 20 |
+
Use --hydra-help to view Hydra specific help
|
| 21 |
+
|
| 22 |
+
'
|
| 23 |
+
template: '${hydra.help.header}
|
| 24 |
+
|
| 25 |
+
== Configuration groups ==
|
| 26 |
+
|
| 27 |
+
Compose your configuration from those groups (group=option)
|
| 28 |
+
|
| 29 |
+
|
| 30 |
+
$APP_CONFIG_GROUPS
|
| 31 |
+
|
| 32 |
+
|
| 33 |
+
== Config ==
|
| 34 |
+
|
| 35 |
+
Override anything in the config (foo.bar=value)
|
| 36 |
+
|
| 37 |
+
|
| 38 |
+
$CONFIG
|
| 39 |
+
|
| 40 |
+
|
| 41 |
+
${hydra.help.footer}
|
| 42 |
+
|
| 43 |
+
'
|
| 44 |
+
hydra_help:
|
| 45 |
+
template: 'Hydra (${hydra.runtime.version})
|
| 46 |
+
|
| 47 |
+
See https://hydra.cc for more info.
|
| 48 |
+
|
| 49 |
+
|
| 50 |
+
== Flags ==
|
| 51 |
+
|
| 52 |
+
$FLAGS_HELP
|
| 53 |
+
|
| 54 |
+
|
| 55 |
+
== Configuration groups ==
|
| 56 |
+
|
| 57 |
+
Compose your configuration from those groups (For example, append hydra/job_logging=disabled
|
| 58 |
+
to command line)
|
| 59 |
+
|
| 60 |
+
|
| 61 |
+
$HYDRA_CONFIG_GROUPS
|
| 62 |
+
|
| 63 |
+
|
| 64 |
+
Use ''--cfg hydra'' to Show the Hydra config.
|
| 65 |
+
|
| 66 |
+
'
|
| 67 |
+
hydra_help: ???
|
| 68 |
+
hydra_logging:
|
| 69 |
+
version: 1
|
| 70 |
+
formatters:
|
| 71 |
+
simple:
|
| 72 |
+
format: '[%(asctime)s][HYDRA] %(message)s'
|
| 73 |
+
handlers:
|
| 74 |
+
console:
|
| 75 |
+
class: logging.StreamHandler
|
| 76 |
+
formatter: simple
|
| 77 |
+
stream: ext://sys.stdout
|
| 78 |
+
root:
|
| 79 |
+
level: INFO
|
| 80 |
+
handlers:
|
| 81 |
+
- console
|
| 82 |
+
loggers:
|
| 83 |
+
logging_example:
|
| 84 |
+
level: DEBUG
|
| 85 |
+
disable_existing_loggers: false
|
| 86 |
+
job_logging:
|
| 87 |
+
version: 1
|
| 88 |
+
formatters:
|
| 89 |
+
simple:
|
| 90 |
+
format: '[%(asctime)s][%(name)s][%(levelname)s] - %(message)s'
|
| 91 |
+
handlers:
|
| 92 |
+
console:
|
| 93 |
+
class: logging.StreamHandler
|
| 94 |
+
formatter: simple
|
| 95 |
+
stream: ext://sys.stdout
|
| 96 |
+
file:
|
| 97 |
+
class: logging.FileHandler
|
| 98 |
+
formatter: simple
|
| 99 |
+
filename: ${hydra.runtime.output_dir}/${hydra.job.name}.log
|
| 100 |
+
root:
|
| 101 |
+
level: INFO
|
| 102 |
+
handlers:
|
| 103 |
+
- console
|
| 104 |
+
- file
|
| 105 |
+
disable_existing_loggers: false
|
| 106 |
+
env: {}
|
| 107 |
+
mode: MULTIRUN
|
| 108 |
+
searchpath: []
|
| 109 |
+
callbacks: {}
|
| 110 |
+
output_subdir: .
|
| 111 |
+
overrides:
|
| 112 |
+
hydra:
|
| 113 |
+
- hydra.mode=MULTIRUN
|
| 114 |
+
task:
|
| 115 |
+
- algorithm=sb3_ppo
|
| 116 |
+
- env_id=RBC3D-easy-v0
|
| 117 |
+
- rl_mode=marl
|
| 118 |
+
- seed=1
|
| 119 |
+
job:
|
| 120 |
+
name: test_sb3
|
| 121 |
+
chdir: true
|
| 122 |
+
override_dirname: algorithm=sb3_ppo,env_id=RBC3D-easy-v0,rl_mode=marl,seed=1
|
| 123 |
+
id: '0'
|
| 124 |
+
num: 0
|
| 125 |
+
config_name: test_sb3
|
| 126 |
+
env_set: {}
|
| 127 |
+
env_copy: []
|
| 128 |
+
config:
|
| 129 |
+
override_dirname:
|
| 130 |
+
kv_sep: '='
|
| 131 |
+
item_sep: ','
|
| 132 |
+
exclude_keys: []
|
| 133 |
+
runtime:
|
| 134 |
+
version: 1.3.2
|
| 135 |
+
version_base: '1.3'
|
| 136 |
+
cwd: /cephfs/users/becktepe/git_projects/FluidGym
|
| 137 |
+
config_sources:
|
| 138 |
+
- path: hydra.conf
|
| 139 |
+
schema: pkg
|
| 140 |
+
provider: hydra
|
| 141 |
+
- path: /cephfs/users/becktepe/git_projects/FluidGym/runscripts/configs
|
| 142 |
+
schema: file
|
| 143 |
+
provider: main
|
| 144 |
+
- path: hydra_plugins.hydra_colorlog.conf
|
| 145 |
+
schema: pkg
|
| 146 |
+
provider: hydra-colorlog
|
| 147 |
+
- path: ''
|
| 148 |
+
schema: structured
|
| 149 |
+
provider: schema
|
| 150 |
+
output_dir: /cephfs/users/becktepe/git_projects/FluidGym/output/training/marl/RBC3D-easy-v0/PPO/1
|
| 151 |
+
choices:
|
| 152 |
+
cluster: local
|
| 153 |
+
algorithm: sb3_ppo
|
| 154 |
+
hydra/env: default
|
| 155 |
+
hydra/callbacks: null
|
| 156 |
+
hydra/job_logging: default
|
| 157 |
+
hydra/hydra_logging: default
|
| 158 |
+
hydra/hydra_help: default
|
| 159 |
+
hydra/help: default
|
| 160 |
+
hydra/sweeper: basic
|
| 161 |
+
hydra/launcher: basic
|
| 162 |
+
hydra/output: default
|
| 163 |
+
verbose: false
|
1/multirun.yaml
ADDED
|
@@ -0,0 +1,221 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
hydra:
|
| 2 |
+
run:
|
| 3 |
+
dir: output/training/${rl_mode}/${env_id}/${algorithm.name}/${seed}
|
| 4 |
+
sweep:
|
| 5 |
+
dir: output/training/${rl_mode}/${env_id}/${algorithm.name}/${seed}
|
| 6 |
+
subdir: ''
|
| 7 |
+
launcher:
|
| 8 |
+
_target_: hydra._internal.core_plugins.basic_launcher.BasicLauncher
|
| 9 |
+
sweeper:
|
| 10 |
+
_target_: hydra._internal.core_plugins.basic_sweeper.BasicSweeper
|
| 11 |
+
max_batch_size: null
|
| 12 |
+
params: null
|
| 13 |
+
help:
|
| 14 |
+
app_name: ${hydra.job.name}
|
| 15 |
+
header: '${hydra.help.app_name} is powered by Hydra.
|
| 16 |
+
|
| 17 |
+
'
|
| 18 |
+
footer: 'Powered by Hydra (https://hydra.cc)
|
| 19 |
+
|
| 20 |
+
Use --hydra-help to view Hydra specific help
|
| 21 |
+
|
| 22 |
+
'
|
| 23 |
+
template: '${hydra.help.header}
|
| 24 |
+
|
| 25 |
+
== Configuration groups ==
|
| 26 |
+
|
| 27 |
+
Compose your configuration from those groups (group=option)
|
| 28 |
+
|
| 29 |
+
|
| 30 |
+
$APP_CONFIG_GROUPS
|
| 31 |
+
|
| 32 |
+
|
| 33 |
+
== Config ==
|
| 34 |
+
|
| 35 |
+
Override anything in the config (foo.bar=value)
|
| 36 |
+
|
| 37 |
+
|
| 38 |
+
$CONFIG
|
| 39 |
+
|
| 40 |
+
|
| 41 |
+
${hydra.help.footer}
|
| 42 |
+
|
| 43 |
+
'
|
| 44 |
+
hydra_help:
|
| 45 |
+
template: 'Hydra (${hydra.runtime.version})
|
| 46 |
+
|
| 47 |
+
See https://hydra.cc for more info.
|
| 48 |
+
|
| 49 |
+
|
| 50 |
+
== Flags ==
|
| 51 |
+
|
| 52 |
+
$FLAGS_HELP
|
| 53 |
+
|
| 54 |
+
|
| 55 |
+
== Configuration groups ==
|
| 56 |
+
|
| 57 |
+
Compose your configuration from those groups (For example, append hydra/job_logging=disabled
|
| 58 |
+
to command line)
|
| 59 |
+
|
| 60 |
+
|
| 61 |
+
$HYDRA_CONFIG_GROUPS
|
| 62 |
+
|
| 63 |
+
|
| 64 |
+
Use ''--cfg hydra'' to Show the Hydra config.
|
| 65 |
+
|
| 66 |
+
'
|
| 67 |
+
hydra_help: ???
|
| 68 |
+
hydra_logging:
|
| 69 |
+
version: 1
|
| 70 |
+
formatters:
|
| 71 |
+
simple:
|
| 72 |
+
format: '[%(asctime)s][HYDRA] %(message)s'
|
| 73 |
+
handlers:
|
| 74 |
+
console:
|
| 75 |
+
class: logging.StreamHandler
|
| 76 |
+
formatter: simple
|
| 77 |
+
stream: ext://sys.stdout
|
| 78 |
+
root:
|
| 79 |
+
level: INFO
|
| 80 |
+
handlers:
|
| 81 |
+
- console
|
| 82 |
+
loggers:
|
| 83 |
+
logging_example:
|
| 84 |
+
level: DEBUG
|
| 85 |
+
disable_existing_loggers: false
|
| 86 |
+
job_logging:
|
| 87 |
+
version: 1
|
| 88 |
+
formatters:
|
| 89 |
+
simple:
|
| 90 |
+
format: '[%(asctime)s][%(name)s][%(levelname)s] - %(message)s'
|
| 91 |
+
handlers:
|
| 92 |
+
console:
|
| 93 |
+
class: logging.StreamHandler
|
| 94 |
+
formatter: simple
|
| 95 |
+
stream: ext://sys.stdout
|
| 96 |
+
file:
|
| 97 |
+
class: logging.FileHandler
|
| 98 |
+
formatter: simple
|
| 99 |
+
filename: ${hydra.runtime.output_dir}/${hydra.job.name}.log
|
| 100 |
+
root:
|
| 101 |
+
level: INFO
|
| 102 |
+
handlers:
|
| 103 |
+
- console
|
| 104 |
+
- file
|
| 105 |
+
disable_existing_loggers: false
|
| 106 |
+
env: {}
|
| 107 |
+
mode: MULTIRUN
|
| 108 |
+
searchpath: []
|
| 109 |
+
callbacks: {}
|
| 110 |
+
output_subdir: .
|
| 111 |
+
overrides:
|
| 112 |
+
hydra:
|
| 113 |
+
- hydra.mode=MULTIRUN
|
| 114 |
+
task:
|
| 115 |
+
- algorithm=sb3_ppo
|
| 116 |
+
- env_id=RBC3D-easy-v0
|
| 117 |
+
- rl_mode=marl
|
| 118 |
+
- seed=1
|
| 119 |
+
job:
|
| 120 |
+
name: test_sb3
|
| 121 |
+
chdir: true
|
| 122 |
+
override_dirname: algorithm=sb3_ppo,env_id=RBC3D-easy-v0,rl_mode=marl,seed=1
|
| 123 |
+
id: ???
|
| 124 |
+
num: ???
|
| 125 |
+
config_name: test_sb3
|
| 126 |
+
env_set: {}
|
| 127 |
+
env_copy: []
|
| 128 |
+
config:
|
| 129 |
+
override_dirname:
|
| 130 |
+
kv_sep: '='
|
| 131 |
+
item_sep: ','
|
| 132 |
+
exclude_keys: []
|
| 133 |
+
runtime:
|
| 134 |
+
version: 1.3.2
|
| 135 |
+
version_base: '1.3'
|
| 136 |
+
cwd: /cephfs/users/becktepe/git_projects/FluidGym
|
| 137 |
+
config_sources:
|
| 138 |
+
- path: hydra.conf
|
| 139 |
+
schema: pkg
|
| 140 |
+
provider: hydra
|
| 141 |
+
- path: /cephfs/users/becktepe/git_projects/FluidGym/runscripts/configs
|
| 142 |
+
schema: file
|
| 143 |
+
provider: main
|
| 144 |
+
- path: hydra_plugins.hydra_colorlog.conf
|
| 145 |
+
schema: pkg
|
| 146 |
+
provider: hydra-colorlog
|
| 147 |
+
- path: ''
|
| 148 |
+
schema: structured
|
| 149 |
+
provider: schema
|
| 150 |
+
output_dir: ???
|
| 151 |
+
choices:
|
| 152 |
+
cluster: local
|
| 153 |
+
algorithm: sb3_ppo
|
| 154 |
+
hydra/env: default
|
| 155 |
+
hydra/callbacks: null
|
| 156 |
+
hydra/job_logging: default
|
| 157 |
+
hydra/hydra_logging: default
|
| 158 |
+
hydra/hydra_help: default
|
| 159 |
+
hydra/help: default
|
| 160 |
+
hydra/sweeper: basic
|
| 161 |
+
hydra/launcher: basic
|
| 162 |
+
hydra/output: default
|
| 163 |
+
verbose: false
|
| 164 |
+
env_id: RBC3D-easy-v0
|
| 165 |
+
env_kwargs: {}
|
| 166 |
+
eval_env_kwargs: {}
|
| 167 |
+
seed: 1
|
| 168 |
+
rl_mode: marl
|
| 169 |
+
total_timesteps: 50000.0
|
| 170 |
+
n_eval_steps: 10
|
| 171 |
+
eval_freq: ${eval:${total_timesteps} // ${n_eval_steps}}
|
| 172 |
+
n_eval_episodes: 1
|
| 173 |
+
continue_training: false
|
| 174 |
+
checkpoint_latest: true
|
| 175 |
+
rl_device: cpu
|
| 176 |
+
eval_callback:
|
| 177 |
+
_target_: fluidgym.integration.sb3.EvalCallback
|
| 178 |
+
eval_freq: ${eval_freq}
|
| 179 |
+
n_eval_episodes: ${n_eval_episodes}
|
| 180 |
+
use_wandb: ${wandb.enable}
|
| 181 |
+
checkpoint_latest: ${checkpoint_latest}
|
| 182 |
+
wandb:
|
| 183 |
+
enable: true
|
| 184 |
+
entity: safe-autonomous-systems
|
| 185 |
+
project: jbecktepe-fluidgym
|
| 186 |
+
algorithm:
|
| 187 |
+
name: PPO
|
| 188 |
+
obj:
|
| 189 |
+
_target_: stable_baselines3.ppo.ppo.PPO
|
| 190 |
+
policy: MlpPolicy
|
| 191 |
+
learning_rate: 0.0003
|
| 192 |
+
n_steps: 2048
|
| 193 |
+
batch_size: 64
|
| 194 |
+
n_epochs: 10
|
| 195 |
+
gamma: 0.99
|
| 196 |
+
gae_lambda: 0.95
|
| 197 |
+
clip_range: 0.2
|
| 198 |
+
clip_range_vf: null
|
| 199 |
+
normalize_advantage: true
|
| 200 |
+
ent_coef: 0.01
|
| 201 |
+
vf_coef: 0.5
|
| 202 |
+
max_grad_norm: 0.5
|
| 203 |
+
use_sde: false
|
| 204 |
+
sde_sample_freq: -1
|
| 205 |
+
rollout_buffer_class: null
|
| 206 |
+
rollout_buffer_kwargs: null
|
| 207 |
+
target_kl: null
|
| 208 |
+
stats_window_size: 100
|
| 209 |
+
tensorboard_log: null
|
| 210 |
+
verbose: 0
|
| 211 |
+
seed: ${seed}
|
| 212 |
+
device: ${rl_device}
|
| 213 |
+
_init_setup_model: true
|
| 214 |
+
cluster: {}
|
| 215 |
+
test_env_id: ${env_id}
|
| 216 |
+
test_env_kwargs: ${env_kwargs}
|
| 217 |
+
test_rl_mode: ${rl_mode}
|
| 218 |
+
n_test_episodes: 10
|
| 219 |
+
deterministic: true
|
| 220 |
+
save_frames: true
|
| 221 |
+
render_3d: true
|
1/overrides.yaml
ADDED
|
@@ -0,0 +1,4 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
- algorithm=sb3_ppo
|
| 2 |
+
- env_id=RBC3D-easy-v0
|
| 3 |
+
- rl_mode=marl
|
| 4 |
+
- seed=1
|
1/test/3d_temperature_test_eval_episode_0.gif
ADDED
|
Git LFS Details
|
1/test/test_eval_episode_0.csv
ADDED
|
The diff for this file is too large to render.
See raw diff
|
|
|
1/test/x-y-temperature_test_eval_episode_0.gif
ADDED
|
Git LFS Details
|
1/test/x-z-temperature_test_eval_episode_0.gif
ADDED
|
Git LFS Details
|
1/test/y-z-temperature_test_eval_episode_0.gif
ADDED
|
Git LFS Details
|
1/training_log.csv
ADDED
|
@@ -0,0 +1,113 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
step,training/mean_reward,training/mean_global_reward,training/mean_nusselt,evaluation/mean_nusselt,evaluation/mean_reward
|
| 2 |
+
500,-0.05532454326748848,-0.05532454109191894,2.236907469749451,,
|
| 3 |
+
1000,-0.042064204812049866,-0.04206420612335205,2.223647139072418,,
|
| 4 |
+
1500,-0.06273674219846725,-0.062736741065979,2.244319662570953,,
|
| 5 |
+
2000,-0.07008584588766098,-0.07008584213256835,2.2516687688827512,,
|
| 6 |
+
2500,-0.01913711242377758,-0.01913711452484131,2.200720051288605,,
|
| 7 |
+
3000,-0.001090225880034268,-0.0010902261734008789,2.182673150539398,,
|
| 8 |
+
3500,-0.030156422406435013,-0.030156422138214112,2.21173934841156,,
|
| 9 |
+
4000,-0.016438735648989677,-0.016438735485076905,2.1980216569900515,,
|
| 10 |
+
4500,0.011829023249447346,0.011829023838043212,2.169753906726837,,
|
| 11 |
+
5000,0.00865052081644535,0.008650521993637085,2.1729324123859404,,
|
| 12 |
+
5000,,,,2.109789274930954,0.07179364562034607
|
| 13 |
+
5500,-0.05442178621888161,-0.05442178773880005,2.2360047087669375,,
|
| 14 |
+
6000,-0.03430760279297829,-0.034307602882385255,2.2158905329704286,,
|
| 15 |
+
6500,-0.015637125819921494,-0.015637125968933106,2.197220060348511,,
|
| 16 |
+
7000,0.03096276894211769,0.03096276926994324,2.150620158195496,,
|
| 17 |
+
7500,0.013421268202364445,0.013421268939971923,2.1681616582870484,,
|
| 18 |
+
8000,0.009028011001646519,0.009028010368347168,2.172554919242859,,
|
| 19 |
+
8500,-0.04945112019777298,-0.04945111799240112,2.2310340332984926,,
|
| 20 |
+
9000,-0.020318355411291122,-0.020318357467651368,2.2019012837409973,,
|
| 21 |
+
9500,-0.0155616644769907,-0.015561667442321778,2.197144591808319,,
|
| 22 |
+
10000,-0.014368440955877304,-0.014368441343307494,2.195951369524002,,
|
| 23 |
+
10000,,,,1.974735408425331,0.20684751868247986
|
| 24 |
+
10500,0.007561460603028536,0.007561460494995117,2.1740214745998383,,
|
| 25 |
+
11000,0.0792570635676384,0.07925706815719605,2.1023258695602416,,
|
| 26 |
+
11500,0.051937684416770935,0.051937682390213014,2.1296452515125273,,
|
| 27 |
+
12000,0.08119971305131912,0.08119971799850464,2.1003832159042357,,
|
| 28 |
+
12500,0.05947531759738922,0.059475318908691406,2.1221076090335846,,
|
| 29 |
+
13000,0.06549473851919174,0.06549473905563355,2.1160881946086882,,
|
| 30 |
+
13500,0.0781002789735794,0.07810027623176574,2.1034826579093933,,
|
| 31 |
+
14000,0.05296202376484871,0.05296202850341797,2.1286208984851838,,
|
| 32 |
+
14500,0.045136045664548874,0.045136043548583984,2.136446895122528,,
|
| 33 |
+
15000,0.07512853294610977,0.07512853956222534,2.10645437669754,,
|
| 34 |
+
15000,,,,1.898246524333954,0.2833364009857178
|
| 35 |
+
15500,0.08783398568630219,0.08783397912979125,2.0937489416599275,,
|
| 36 |
+
16000,0.03680252656340599,0.036802526235580446,2.144780403852463,,
|
| 37 |
+
16500,0.06552798300981522,0.06552799391746521,2.1160549376010893,,
|
| 38 |
+
17000,0.11722325533628464,0.11722326016426086,2.0643596632480623,,
|
| 39 |
+
17500,0.10443466901779175,0.1044346706867218,2.077148262023926,,
|
| 40 |
+
18000,0.09700943529605865,0.09700943994522095,2.0845734903812407,,
|
| 41 |
+
18500,0.068212129175663,0.0682121229171753,2.113370796918869,,
|
| 42 |
+
19000,0.1437195986509323,0.14371961188316346,2.0378633136749267,,
|
| 43 |
+
19500,0.1432533860206604,0.1432533824443817,2.0383295407295225,,
|
| 44 |
+
20000,0.15096530318260193,0.1509652965068817,2.0306176216602325,,
|
| 45 |
+
20000,,,,1.8412724453210831,0.3403104543685913
|
| 46 |
+
20500,0.13602545857429504,0.13602546429634094,2.0455574612617493,,
|
| 47 |
+
21000,0.17948126792907715,0.17948127388954163,2.002101660013199,,
|
| 48 |
+
21500,0.1824798285961151,0.18247982621192932,1.9991031079292296,,
|
| 49 |
+
22000,0.1657581925392151,0.16575819063186645,2.0158247327804566,,
|
| 50 |
+
22500,0.15209029614925385,0.15209030151367187,2.029492626905441,,
|
| 51 |
+
23000,0.17347684502601624,0.1734768421649933,2.0081060769557952,,
|
| 52 |
+
23500,0.18314525485038757,0.1831452603340149,1.9984376702308655,,
|
| 53 |
+
24000,0.175364688038826,0.17536468553543091,2.0062182474136354,,
|
| 54 |
+
24500,0.18781845271587372,0.18781845116615295,1.993764481306076,,
|
| 55 |
+
25000,0.17675071954727173,0.1767507128715515,2.0048322126865386,,
|
| 56 |
+
25000,,,,1.822121074795723,0.35946184396743774
|
| 57 |
+
25500,0.17473116517066956,0.17473116493225097,2.0068517661094667,,
|
| 58 |
+
26000,0.18992768228054047,0.1899276773929596,1.9916552500724793,,
|
| 59 |
+
26500,0.19144096970558167,0.19144096755981446,1.9901419644355773,,
|
| 60 |
+
27000,0.1957865208387375,0.19578652715682984,1.9857964112758637,,
|
| 61 |
+
27500,0.17141875624656677,0.17141878700256347,2.010164145231247,,
|
| 62 |
+
28000,0.16530491411685944,0.16530492639541625,2.0162780055999754,,
|
| 63 |
+
28500,0.15861529111862183,0.15861530327796936,2.022967614889145,,
|
| 64 |
+
29000,0.190576434135437,0.19057644152641295,1.9910064816474915,,
|
| 65 |
+
29500,0.14882892370224,0.14882891631126405,2.032754002571106,,
|
| 66 |
+
30000,0.19076226651668549,0.19076227021217346,1.9908206520080567,,
|
| 67 |
+
30000,,,,1.825539590716362,0.35604333877563477
|
| 68 |
+
30500,0.19467350840568542,0.1946735203266144,1.9869094109535217,,
|
| 69 |
+
31000,0.18358498811721802,0.1835849905014038,1.9979979417324065,,
|
| 70 |
+
31500,0.19085055589675903,0.19085055685043334,1.9907323625087738,,
|
| 71 |
+
32000,0.18471629917621613,0.1847162802219391,1.9968666501045227,,
|
| 72 |
+
32500,0.19630907475948334,0.1963090615272522,1.9852738602161408,,
|
| 73 |
+
33000,0.15975883603096008,0.15975883603096008,2.021824098110199,,
|
| 74 |
+
33500,0.18610268831253052,0.1861027090549469,1.9954802176952362,,
|
| 75 |
+
34000,0.1934846043586731,0.19348459935188295,1.9880983350276946,,
|
| 76 |
+
34500,0.19800257682800293,0.19800259137153625,1.9835803401470185,,
|
| 77 |
+
35000,0.19088879227638245,0.19088879346847534,1.9906941406726837,,
|
| 78 |
+
35000,,,,1.801977931857109,0.3796049952507019
|
| 79 |
+
35500,0.18782806396484375,0.1878280704021454,1.9937548604011535,,
|
| 80 |
+
36000,0.18548572063446045,0.18548569560050965,1.9960972273349762,,
|
| 81 |
+
36500,0.19000686705112457,0.19000686478614806,1.99157603931427,,
|
| 82 |
+
37000,0.1815672069787979,0.18156721639633178,2.0000157206058504,,
|
| 83 |
+
37500,0.18995963037014008,0.1899596300125122,1.991623300075531,,
|
| 84 |
+
38000,0.18333159387111664,0.18333158016204834,1.9982513453960418,,
|
| 85 |
+
38500,0.1904798448085785,0.19047985172271728,1.9911030755043029,,
|
| 86 |
+
39000,0.17658422887325287,0.17658423256874084,2.0049986896514893,,
|
| 87 |
+
39500,0.17397551238536835,0.17397549295425416,2.0076074500083925,,
|
| 88 |
+
40000,0.17871572077274323,0.1787157244682312,2.0028672032356263,,
|
| 89 |
+
40000,,,,1.8112351942062377,0.3703477382659912
|
| 90 |
+
40500,0.16244958341121674,0.16244959354400634,2.0191333339214323,,
|
| 91 |
+
41000,0.19321593642234802,0.19321595406532288,1.9883669760227203,,
|
| 92 |
+
41500,0.211032435297966,0.21103244495391846,1.9705504789352417,,
|
| 93 |
+
42000,0.21050134301185608,0.21050135350227356,1.9710815768241883,,
|
| 94 |
+
42500,0.19840531051158905,0.1984053030014038,1.9831776325702668,,
|
| 95 |
+
43000,0.20515142381191254,0.20515143489837648,1.9764314877986908,,
|
| 96 |
+
43500,0.19370397925376892,0.1937039632797241,1.9878789701461792,,
|
| 97 |
+
44000,0.18394632637500763,0.18394634079933167,1.9976365916728973,,
|
| 98 |
+
44500,0.18232017755508423,0.1823201720714569,1.9992627584934235,,
|
| 99 |
+
45000,0.15781936049461365,0.15781937885284425,2.023763556241989,,
|
| 100 |
+
45000,,,,1.7854327964782715,0.396150141954422
|
| 101 |
+
45500,0.19733385741710663,0.19733386588096619,1.98424906873703,,
|
| 102 |
+
46000,0.20169685781002045,0.20169685006141663,1.9798860795497895,,
|
| 103 |
+
46500,0.20770150423049927,0.20770148515701295,1.97388143324852,,
|
| 104 |
+
47000,0.20021924376487732,0.20021922397613526,1.9813636980056764,,
|
| 105 |
+
47500,0.1858740895986557,0.18587410378456115,1.9957088272571564,,
|
| 106 |
+
48000,0.1943330019712448,0.19433301973342895,1.9872499043941498,,
|
| 107 |
+
48500,0.2020830363035202,0.2020830204486847,1.9794999012947083,,
|
| 108 |
+
49000,0.17362676560878754,0.1736267693042755,2.0079561648368833,,
|
| 109 |
+
49500,0.19353489577770233,0.19353489422798156,1.9880480349063874,,
|
| 110 |
+
50000,0.20380152761936188,0.20380153775215148,1.977781393289566,,
|
| 111 |
+
50000,,,,1.7713619846105575,0.4102209210395813
|
| 112 |
+
50500,0.1916441023349762,0.19164412236213685,1.9899387986660004,,
|
| 113 |
+
51000,0.2086837738752365,0.20868376445770265,1.9728991587162017,,
|
2/ckpt_latest.zip
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:c1a44b744700bdbff02d62186998b429e03332faa1fb785f1a8e21b21b8dcb88
|
| 3 |
+
size 8844014
|
2/config.yaml
ADDED
|
@@ -0,0 +1,58 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
env_id: RBC3D-easy-v0
|
| 2 |
+
env_kwargs: {}
|
| 3 |
+
eval_env_kwargs: {}
|
| 4 |
+
seed: 2
|
| 5 |
+
rl_mode: marl
|
| 6 |
+
total_timesteps: 50000.0
|
| 7 |
+
n_eval_steps: 10
|
| 8 |
+
eval_freq: ${eval:${total_timesteps} // ${n_eval_steps}}
|
| 9 |
+
n_eval_episodes: 1
|
| 10 |
+
continue_training: false
|
| 11 |
+
checkpoint_latest: true
|
| 12 |
+
rl_device: cpu
|
| 13 |
+
eval_callback:
|
| 14 |
+
_target_: fluidgym.integration.sb3.EvalCallback
|
| 15 |
+
eval_freq: ${eval_freq}
|
| 16 |
+
n_eval_episodes: ${n_eval_episodes}
|
| 17 |
+
use_wandb: ${wandb.enable}
|
| 18 |
+
checkpoint_latest: ${checkpoint_latest}
|
| 19 |
+
wandb:
|
| 20 |
+
enable: true
|
| 21 |
+
entity: safe-autonomous-systems
|
| 22 |
+
project: jbecktepe-fluidgym
|
| 23 |
+
algorithm:
|
| 24 |
+
name: PPO
|
| 25 |
+
obj:
|
| 26 |
+
_target_: stable_baselines3.ppo.ppo.PPO
|
| 27 |
+
policy: MlpPolicy
|
| 28 |
+
learning_rate: 0.0003
|
| 29 |
+
n_steps: 2048
|
| 30 |
+
batch_size: 64
|
| 31 |
+
n_epochs: 10
|
| 32 |
+
gamma: 0.99
|
| 33 |
+
gae_lambda: 0.95
|
| 34 |
+
clip_range: 0.2
|
| 35 |
+
clip_range_vf: null
|
| 36 |
+
normalize_advantage: true
|
| 37 |
+
ent_coef: 0.01
|
| 38 |
+
vf_coef: 0.5
|
| 39 |
+
max_grad_norm: 0.5
|
| 40 |
+
use_sde: false
|
| 41 |
+
sde_sample_freq: -1
|
| 42 |
+
rollout_buffer_class: null
|
| 43 |
+
rollout_buffer_kwargs: null
|
| 44 |
+
target_kl: null
|
| 45 |
+
stats_window_size: 100
|
| 46 |
+
tensorboard_log: null
|
| 47 |
+
verbose: 0
|
| 48 |
+
seed: ${seed}
|
| 49 |
+
device: ${rl_device}
|
| 50 |
+
_init_setup_model: true
|
| 51 |
+
cluster: {}
|
| 52 |
+
test_env_id: ${env_id}
|
| 53 |
+
test_env_kwargs: ${env_kwargs}
|
| 54 |
+
test_rl_mode: ${rl_mode}
|
| 55 |
+
n_test_episodes: 10
|
| 56 |
+
deterministic: true
|
| 57 |
+
save_frames: true
|
| 58 |
+
render_3d: true
|
2/hydra.yaml
ADDED
|
@@ -0,0 +1,163 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
hydra:
|
| 2 |
+
run:
|
| 3 |
+
dir: output/training/${rl_mode}/${env_id}/${algorithm.name}/${seed}
|
| 4 |
+
sweep:
|
| 5 |
+
dir: output/training/${rl_mode}/${env_id}/${algorithm.name}/${seed}
|
| 6 |
+
subdir: ''
|
| 7 |
+
launcher:
|
| 8 |
+
_target_: hydra._internal.core_plugins.basic_launcher.BasicLauncher
|
| 9 |
+
sweeper:
|
| 10 |
+
_target_: hydra._internal.core_plugins.basic_sweeper.BasicSweeper
|
| 11 |
+
max_batch_size: null
|
| 12 |
+
params: null
|
| 13 |
+
help:
|
| 14 |
+
app_name: ${hydra.job.name}
|
| 15 |
+
header: '${hydra.help.app_name} is powered by Hydra.
|
| 16 |
+
|
| 17 |
+
'
|
| 18 |
+
footer: 'Powered by Hydra (https://hydra.cc)
|
| 19 |
+
|
| 20 |
+
Use --hydra-help to view Hydra specific help
|
| 21 |
+
|
| 22 |
+
'
|
| 23 |
+
template: '${hydra.help.header}
|
| 24 |
+
|
| 25 |
+
== Configuration groups ==
|
| 26 |
+
|
| 27 |
+
Compose your configuration from those groups (group=option)
|
| 28 |
+
|
| 29 |
+
|
| 30 |
+
$APP_CONFIG_GROUPS
|
| 31 |
+
|
| 32 |
+
|
| 33 |
+
== Config ==
|
| 34 |
+
|
| 35 |
+
Override anything in the config (foo.bar=value)
|
| 36 |
+
|
| 37 |
+
|
| 38 |
+
$CONFIG
|
| 39 |
+
|
| 40 |
+
|
| 41 |
+
${hydra.help.footer}
|
| 42 |
+
|
| 43 |
+
'
|
| 44 |
+
hydra_help:
|
| 45 |
+
template: 'Hydra (${hydra.runtime.version})
|
| 46 |
+
|
| 47 |
+
See https://hydra.cc for more info.
|
| 48 |
+
|
| 49 |
+
|
| 50 |
+
== Flags ==
|
| 51 |
+
|
| 52 |
+
$FLAGS_HELP
|
| 53 |
+
|
| 54 |
+
|
| 55 |
+
== Configuration groups ==
|
| 56 |
+
|
| 57 |
+
Compose your configuration from those groups (For example, append hydra/job_logging=disabled
|
| 58 |
+
to command line)
|
| 59 |
+
|
| 60 |
+
|
| 61 |
+
$HYDRA_CONFIG_GROUPS
|
| 62 |
+
|
| 63 |
+
|
| 64 |
+
Use ''--cfg hydra'' to Show the Hydra config.
|
| 65 |
+
|
| 66 |
+
'
|
| 67 |
+
hydra_help: ???
|
| 68 |
+
hydra_logging:
|
| 69 |
+
version: 1
|
| 70 |
+
formatters:
|
| 71 |
+
simple:
|
| 72 |
+
format: '[%(asctime)s][HYDRA] %(message)s'
|
| 73 |
+
handlers:
|
| 74 |
+
console:
|
| 75 |
+
class: logging.StreamHandler
|
| 76 |
+
formatter: simple
|
| 77 |
+
stream: ext://sys.stdout
|
| 78 |
+
root:
|
| 79 |
+
level: INFO
|
| 80 |
+
handlers:
|
| 81 |
+
- console
|
| 82 |
+
loggers:
|
| 83 |
+
logging_example:
|
| 84 |
+
level: DEBUG
|
| 85 |
+
disable_existing_loggers: false
|
| 86 |
+
job_logging:
|
| 87 |
+
version: 1
|
| 88 |
+
formatters:
|
| 89 |
+
simple:
|
| 90 |
+
format: '[%(asctime)s][%(name)s][%(levelname)s] - %(message)s'
|
| 91 |
+
handlers:
|
| 92 |
+
console:
|
| 93 |
+
class: logging.StreamHandler
|
| 94 |
+
formatter: simple
|
| 95 |
+
stream: ext://sys.stdout
|
| 96 |
+
file:
|
| 97 |
+
class: logging.FileHandler
|
| 98 |
+
formatter: simple
|
| 99 |
+
filename: ${hydra.runtime.output_dir}/${hydra.job.name}.log
|
| 100 |
+
root:
|
| 101 |
+
level: INFO
|
| 102 |
+
handlers:
|
| 103 |
+
- console
|
| 104 |
+
- file
|
| 105 |
+
disable_existing_loggers: false
|
| 106 |
+
env: {}
|
| 107 |
+
mode: MULTIRUN
|
| 108 |
+
searchpath: []
|
| 109 |
+
callbacks: {}
|
| 110 |
+
output_subdir: .
|
| 111 |
+
overrides:
|
| 112 |
+
hydra:
|
| 113 |
+
- hydra.mode=MULTIRUN
|
| 114 |
+
task:
|
| 115 |
+
- algorithm=sb3_ppo
|
| 116 |
+
- env_id=RBC3D-easy-v0
|
| 117 |
+
- rl_mode=marl
|
| 118 |
+
- seed=2
|
| 119 |
+
job:
|
| 120 |
+
name: test_sb3
|
| 121 |
+
chdir: true
|
| 122 |
+
override_dirname: algorithm=sb3_ppo,env_id=RBC3D-easy-v0,rl_mode=marl,seed=2
|
| 123 |
+
id: '0'
|
| 124 |
+
num: 0
|
| 125 |
+
config_name: test_sb3
|
| 126 |
+
env_set: {}
|
| 127 |
+
env_copy: []
|
| 128 |
+
config:
|
| 129 |
+
override_dirname:
|
| 130 |
+
kv_sep: '='
|
| 131 |
+
item_sep: ','
|
| 132 |
+
exclude_keys: []
|
| 133 |
+
runtime:
|
| 134 |
+
version: 1.3.2
|
| 135 |
+
version_base: '1.3'
|
| 136 |
+
cwd: /cephfs/users/becktepe/git_projects/FluidGym
|
| 137 |
+
config_sources:
|
| 138 |
+
- path: hydra.conf
|
| 139 |
+
schema: pkg
|
| 140 |
+
provider: hydra
|
| 141 |
+
- path: /cephfs/users/becktepe/git_projects/FluidGym/runscripts/configs
|
| 142 |
+
schema: file
|
| 143 |
+
provider: main
|
| 144 |
+
- path: hydra_plugins.hydra_colorlog.conf
|
| 145 |
+
schema: pkg
|
| 146 |
+
provider: hydra-colorlog
|
| 147 |
+
- path: ''
|
| 148 |
+
schema: structured
|
| 149 |
+
provider: schema
|
| 150 |
+
output_dir: /cephfs/users/becktepe/git_projects/FluidGym/output/training/marl/RBC3D-easy-v0/PPO/2
|
| 151 |
+
choices:
|
| 152 |
+
cluster: local
|
| 153 |
+
algorithm: sb3_ppo
|
| 154 |
+
hydra/env: default
|
| 155 |
+
hydra/callbacks: null
|
| 156 |
+
hydra/job_logging: default
|
| 157 |
+
hydra/hydra_logging: default
|
| 158 |
+
hydra/hydra_help: default
|
| 159 |
+
hydra/help: default
|
| 160 |
+
hydra/sweeper: basic
|
| 161 |
+
hydra/launcher: basic
|
| 162 |
+
hydra/output: default
|
| 163 |
+
verbose: false
|
2/multirun.yaml
ADDED
|
@@ -0,0 +1,221 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
hydra:
|
| 2 |
+
run:
|
| 3 |
+
dir: output/training/${rl_mode}/${env_id}/${algorithm.name}/${seed}
|
| 4 |
+
sweep:
|
| 5 |
+
dir: output/training/${rl_mode}/${env_id}/${algorithm.name}/${seed}
|
| 6 |
+
subdir: ''
|
| 7 |
+
launcher:
|
| 8 |
+
_target_: hydra._internal.core_plugins.basic_launcher.BasicLauncher
|
| 9 |
+
sweeper:
|
| 10 |
+
_target_: hydra._internal.core_plugins.basic_sweeper.BasicSweeper
|
| 11 |
+
max_batch_size: null
|
| 12 |
+
params: null
|
| 13 |
+
help:
|
| 14 |
+
app_name: ${hydra.job.name}
|
| 15 |
+
header: '${hydra.help.app_name} is powered by Hydra.
|
| 16 |
+
|
| 17 |
+
'
|
| 18 |
+
footer: 'Powered by Hydra (https://hydra.cc)
|
| 19 |
+
|
| 20 |
+
Use --hydra-help to view Hydra specific help
|
| 21 |
+
|
| 22 |
+
'
|
| 23 |
+
template: '${hydra.help.header}
|
| 24 |
+
|
| 25 |
+
== Configuration groups ==
|
| 26 |
+
|
| 27 |
+
Compose your configuration from those groups (group=option)
|
| 28 |
+
|
| 29 |
+
|
| 30 |
+
$APP_CONFIG_GROUPS
|
| 31 |
+
|
| 32 |
+
|
| 33 |
+
== Config ==
|
| 34 |
+
|
| 35 |
+
Override anything in the config (foo.bar=value)
|
| 36 |
+
|
| 37 |
+
|
| 38 |
+
$CONFIG
|
| 39 |
+
|
| 40 |
+
|
| 41 |
+
${hydra.help.footer}
|
| 42 |
+
|
| 43 |
+
'
|
| 44 |
+
hydra_help:
|
| 45 |
+
template: 'Hydra (${hydra.runtime.version})
|
| 46 |
+
|
| 47 |
+
See https://hydra.cc for more info.
|
| 48 |
+
|
| 49 |
+
|
| 50 |
+
== Flags ==
|
| 51 |
+
|
| 52 |
+
$FLAGS_HELP
|
| 53 |
+
|
| 54 |
+
|
| 55 |
+
== Configuration groups ==
|
| 56 |
+
|
| 57 |
+
Compose your configuration from those groups (For example, append hydra/job_logging=disabled
|
| 58 |
+
to command line)
|
| 59 |
+
|
| 60 |
+
|
| 61 |
+
$HYDRA_CONFIG_GROUPS
|
| 62 |
+
|
| 63 |
+
|
| 64 |
+
Use ''--cfg hydra'' to Show the Hydra config.
|
| 65 |
+
|
| 66 |
+
'
|
| 67 |
+
hydra_help: ???
|
| 68 |
+
hydra_logging:
|
| 69 |
+
version: 1
|
| 70 |
+
formatters:
|
| 71 |
+
simple:
|
| 72 |
+
format: '[%(asctime)s][HYDRA] %(message)s'
|
| 73 |
+
handlers:
|
| 74 |
+
console:
|
| 75 |
+
class: logging.StreamHandler
|
| 76 |
+
formatter: simple
|
| 77 |
+
stream: ext://sys.stdout
|
| 78 |
+
root:
|
| 79 |
+
level: INFO
|
| 80 |
+
handlers:
|
| 81 |
+
- console
|
| 82 |
+
loggers:
|
| 83 |
+
logging_example:
|
| 84 |
+
level: DEBUG
|
| 85 |
+
disable_existing_loggers: false
|
| 86 |
+
job_logging:
|
| 87 |
+
version: 1
|
| 88 |
+
formatters:
|
| 89 |
+
simple:
|
| 90 |
+
format: '[%(asctime)s][%(name)s][%(levelname)s] - %(message)s'
|
| 91 |
+
handlers:
|
| 92 |
+
console:
|
| 93 |
+
class: logging.StreamHandler
|
| 94 |
+
formatter: simple
|
| 95 |
+
stream: ext://sys.stdout
|
| 96 |
+
file:
|
| 97 |
+
class: logging.FileHandler
|
| 98 |
+
formatter: simple
|
| 99 |
+
filename: ${hydra.runtime.output_dir}/${hydra.job.name}.log
|
| 100 |
+
root:
|
| 101 |
+
level: INFO
|
| 102 |
+
handlers:
|
| 103 |
+
- console
|
| 104 |
+
- file
|
| 105 |
+
disable_existing_loggers: false
|
| 106 |
+
env: {}
|
| 107 |
+
mode: MULTIRUN
|
| 108 |
+
searchpath: []
|
| 109 |
+
callbacks: {}
|
| 110 |
+
output_subdir: .
|
| 111 |
+
overrides:
|
| 112 |
+
hydra:
|
| 113 |
+
- hydra.mode=MULTIRUN
|
| 114 |
+
task:
|
| 115 |
+
- algorithm=sb3_ppo
|
| 116 |
+
- env_id=RBC3D-easy-v0
|
| 117 |
+
- rl_mode=marl
|
| 118 |
+
- seed=2
|
| 119 |
+
job:
|
| 120 |
+
name: test_sb3
|
| 121 |
+
chdir: true
|
| 122 |
+
override_dirname: algorithm=sb3_ppo,env_id=RBC3D-easy-v0,rl_mode=marl,seed=2
|
| 123 |
+
id: ???
|
| 124 |
+
num: ???
|
| 125 |
+
config_name: test_sb3
|
| 126 |
+
env_set: {}
|
| 127 |
+
env_copy: []
|
| 128 |
+
config:
|
| 129 |
+
override_dirname:
|
| 130 |
+
kv_sep: '='
|
| 131 |
+
item_sep: ','
|
| 132 |
+
exclude_keys: []
|
| 133 |
+
runtime:
|
| 134 |
+
version: 1.3.2
|
| 135 |
+
version_base: '1.3'
|
| 136 |
+
cwd: /cephfs/users/becktepe/git_projects/FluidGym
|
| 137 |
+
config_sources:
|
| 138 |
+
- path: hydra.conf
|
| 139 |
+
schema: pkg
|
| 140 |
+
provider: hydra
|
| 141 |
+
- path: /cephfs/users/becktepe/git_projects/FluidGym/runscripts/configs
|
| 142 |
+
schema: file
|
| 143 |
+
provider: main
|
| 144 |
+
- path: hydra_plugins.hydra_colorlog.conf
|
| 145 |
+
schema: pkg
|
| 146 |
+
provider: hydra-colorlog
|
| 147 |
+
- path: ''
|
| 148 |
+
schema: structured
|
| 149 |
+
provider: schema
|
| 150 |
+
output_dir: ???
|
| 151 |
+
choices:
|
| 152 |
+
cluster: local
|
| 153 |
+
algorithm: sb3_ppo
|
| 154 |
+
hydra/env: default
|
| 155 |
+
hydra/callbacks: null
|
| 156 |
+
hydra/job_logging: default
|
| 157 |
+
hydra/hydra_logging: default
|
| 158 |
+
hydra/hydra_help: default
|
| 159 |
+
hydra/help: default
|
| 160 |
+
hydra/sweeper: basic
|
| 161 |
+
hydra/launcher: basic
|
| 162 |
+
hydra/output: default
|
| 163 |
+
verbose: false
|
| 164 |
+
env_id: RBC3D-easy-v0
|
| 165 |
+
env_kwargs: {}
|
| 166 |
+
eval_env_kwargs: {}
|
| 167 |
+
seed: 2
|
| 168 |
+
rl_mode: marl
|
| 169 |
+
total_timesteps: 50000.0
|
| 170 |
+
n_eval_steps: 10
|
| 171 |
+
eval_freq: ${eval:${total_timesteps} // ${n_eval_steps}}
|
| 172 |
+
n_eval_episodes: 1
|
| 173 |
+
continue_training: false
|
| 174 |
+
checkpoint_latest: true
|
| 175 |
+
rl_device: cpu
|
| 176 |
+
eval_callback:
|
| 177 |
+
_target_: fluidgym.integration.sb3.EvalCallback
|
| 178 |
+
eval_freq: ${eval_freq}
|
| 179 |
+
n_eval_episodes: ${n_eval_episodes}
|
| 180 |
+
use_wandb: ${wandb.enable}
|
| 181 |
+
checkpoint_latest: ${checkpoint_latest}
|
| 182 |
+
wandb:
|
| 183 |
+
enable: true
|
| 184 |
+
entity: safe-autonomous-systems
|
| 185 |
+
project: jbecktepe-fluidgym
|
| 186 |
+
algorithm:
|
| 187 |
+
name: PPO
|
| 188 |
+
obj:
|
| 189 |
+
_target_: stable_baselines3.ppo.ppo.PPO
|
| 190 |
+
policy: MlpPolicy
|
| 191 |
+
learning_rate: 0.0003
|
| 192 |
+
n_steps: 2048
|
| 193 |
+
batch_size: 64
|
| 194 |
+
n_epochs: 10
|
| 195 |
+
gamma: 0.99
|
| 196 |
+
gae_lambda: 0.95
|
| 197 |
+
clip_range: 0.2
|
| 198 |
+
clip_range_vf: null
|
| 199 |
+
normalize_advantage: true
|
| 200 |
+
ent_coef: 0.01
|
| 201 |
+
vf_coef: 0.5
|
| 202 |
+
max_grad_norm: 0.5
|
| 203 |
+
use_sde: false
|
| 204 |
+
sde_sample_freq: -1
|
| 205 |
+
rollout_buffer_class: null
|
| 206 |
+
rollout_buffer_kwargs: null
|
| 207 |
+
target_kl: null
|
| 208 |
+
stats_window_size: 100
|
| 209 |
+
tensorboard_log: null
|
| 210 |
+
verbose: 0
|
| 211 |
+
seed: ${seed}
|
| 212 |
+
device: ${rl_device}
|
| 213 |
+
_init_setup_model: true
|
| 214 |
+
cluster: {}
|
| 215 |
+
test_env_id: ${env_id}
|
| 216 |
+
test_env_kwargs: ${env_kwargs}
|
| 217 |
+
test_rl_mode: ${rl_mode}
|
| 218 |
+
n_test_episodes: 10
|
| 219 |
+
deterministic: true
|
| 220 |
+
save_frames: true
|
| 221 |
+
render_3d: true
|
2/overrides.yaml
ADDED
|
@@ -0,0 +1,4 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
- algorithm=sb3_ppo
|
| 2 |
+
- env_id=RBC3D-easy-v0
|
| 3 |
+
- rl_mode=marl
|
| 4 |
+
- seed=2
|
2/test/3d_temperature_test_eval_episode_0.gif
ADDED
|
Git LFS Details
|
2/test/test_eval_episode_0.csv
ADDED
|
The diff for this file is too large to render.
See raw diff
|
|
|
2/test/x-y-temperature_test_eval_episode_0.gif
ADDED
|
Git LFS Details
|
2/test/x-z-temperature_test_eval_episode_0.gif
ADDED
|
Git LFS Details
|
2/test/y-z-temperature_test_eval_episode_0.gif
ADDED
|
Git LFS Details
|
2/training_log.csv
ADDED
|
@@ -0,0 +1,113 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
step,training/mean_reward,training/mean_global_reward,training/mean_nusselt,evaluation/mean_nusselt,evaluation/mean_reward
|
| 2 |
+
500,-0.04134989529848099,-0.04134989929199219,2.2229328308105467,,
|
| 3 |
+
1000,-0.055660370737314224,-0.055660367012023926,2.237243290424347,,
|
| 4 |
+
1500,-0.05102980509400368,-0.051029805660247805,2.232612743854523,,
|
| 5 |
+
2000,-0.04047350957989693,-0.040473512172698976,2.222056436538696,,
|
| 6 |
+
2500,-0.017532501369714737,-0.01753250074386597,2.199115427970886,,
|
| 7 |
+
3000,-0.06359454244375229,-0.0635945405960083,2.2451774687767028,,
|
| 8 |
+
3500,-0.05978996306657791,-0.05978996753692627,2.241372896671295,,
|
| 9 |
+
4000,-0.06186138838529587,-0.061861385345458986,2.2434443125724792,,
|
| 10 |
+
4500,-0.007661296520382166,-0.007661296367645264,2.189244219303131,,
|
| 11 |
+
5000,-0.040132034569978714,-0.04013203811645508,2.2217149596214294,,
|
| 12 |
+
5000,,,,2.130394132137299,0.05118880048394203
|
| 13 |
+
5500,-0.014540338888764381,-0.014540338516235351,2.1961232576370238,,
|
| 14 |
+
6000,0.0016551963053643703,0.0016551966667175293,2.179927733898163,,
|
| 15 |
+
6500,-0.003583599114790559,-0.003583599090576172,2.185166516304016,,
|
| 16 |
+
7000,-0.01119804847985506,-0.011198049068450927,2.1927809796333313,,
|
| 17 |
+
7500,0.001698688487522304,0.001698688507080078,2.1798842420578004,,
|
| 18 |
+
8000,0.019577881321310997,0.019577879428863524,2.162005048751831,,
|
| 19 |
+
8500,0.04433877393603325,0.0443387770652771,2.1372441477775572,,
|
| 20 |
+
9000,0.04519568756222725,0.04519568228721619,2.136387239933014,,
|
| 21 |
+
9500,0.008319809101521969,0.008319808483123779,2.1732631232738493,,
|
| 22 |
+
10000,0.05198968946933746,0.05198968505859375,2.1295932478904724,,
|
| 23 |
+
10000,,,,1.980608316063881,0.20097461342811584
|
| 24 |
+
10500,0.056999336928129196,0.0569993371963501,2.124583600521088,,
|
| 25 |
+
11000,0.07764870673418045,0.07764870357513427,2.10393421792984,,
|
| 26 |
+
11500,0.06310242414474487,0.06310242176055908,2.118480516910553,,
|
| 27 |
+
12000,0.052146065980196,0.052146065711975095,2.129436864376068,,
|
| 28 |
+
12500,0.05528493970632553,0.05528494596481323,2.1262979748249053,,
|
| 29 |
+
13000,0.0861661285161972,0.08616613054275513,2.095416803598404,,
|
| 30 |
+
13500,0.08271382004022598,0.08271381664276123,2.098869107961655,,
|
| 31 |
+
14000,0.094476617872715,0.0944766263961792,2.087106302022934,,
|
| 32 |
+
14500,0.06131628528237343,0.06131628346443176,2.1202666475772856,,
|
| 33 |
+
15000,0.054881300777196884,0.05488129353523254,2.1267016282081603,,
|
| 34 |
+
15000,,,,1.915284109711647,0.2662988305091858
|
| 35 |
+
15500,0.07859768718481064,0.07859769773483276,2.1029852209091184,,
|
| 36 |
+
16000,0.03855806589126587,0.03855806517601013,2.143024859428406,,
|
| 37 |
+
16500,0.08901320397853851,0.08901320147514344,2.09256972360611,,
|
| 38 |
+
17000,0.1016482263803482,0.10164821553230285,2.079934710741043,,
|
| 39 |
+
17500,0.09553169459104538,0.09553169798851013,2.0860512268543245,,
|
| 40 |
+
18000,0.10372352600097656,0.10372352480888367,2.0778593997955324,,
|
| 41 |
+
18500,0.09227016568183899,0.09227016353607177,2.0893127617836,,
|
| 42 |
+
19000,0.11707688868045807,0.11707689547538758,2.06450603055954,,
|
| 43 |
+
19500,0.07752527296543121,0.07752527976036072,2.104057633399963,,
|
| 44 |
+
20000,0.11520671099424362,0.11520672488212585,2.0663762073516847,,
|
| 45 |
+
20000,,,,1.8897565984725953,0.2918263077735901
|
| 46 |
+
20500,0.11105618625879288,0.11105618166923523,2.070526759624481,,
|
| 47 |
+
21000,0.11953085660934448,0.11953086709976196,2.0620520544052123,,
|
| 48 |
+
21500,0.1152503490447998,0.11525034570693969,2.066332589149475,,
|
| 49 |
+
22000,0.11999235302209854,0.11999235963821411,2.0615905652046203,,
|
| 50 |
+
22500,0.1303650438785553,0.13036505055427552,2.0512178771495817,,
|
| 51 |
+
23000,0.14331163465976715,0.14331162929534913,2.038271296262741,,
|
| 52 |
+
23500,0.14202982187271118,0.14202981424331665,2.039553119659424,,
|
| 53 |
+
24000,0.1329347938299179,0.132934809923172,2.0486481137275696,,
|
| 54 |
+
24500,0.14296920597553253,0.1429692099094391,2.0386137235164643,,
|
| 55 |
+
25000,0.14348357915878296,0.14348357558250427,2.0380993525981905,,
|
| 56 |
+
25000,,,,1.8442769485712052,0.3373059630393982
|
| 57 |
+
25500,0.14318101108074188,0.1431810085773468,2.0384019305706023,,
|
| 58 |
+
26000,0.14500656723976135,0.14500654792785644,2.0365763862133024,,
|
| 59 |
+
26500,0.1490248143672943,0.14902480506896973,2.032558128118515,,
|
| 60 |
+
27000,0.1537151336669922,0.1537151358127594,2.0278677980899813,,
|
| 61 |
+
27500,0.16485066711902618,0.1648506669998169,2.016732267856598,,
|
| 62 |
+
28000,0.17704522609710693,0.177045223236084,2.0045377001762392,,
|
| 63 |
+
28500,0.16156207025051117,0.16156206107139587,2.0200208599567415,,
|
| 64 |
+
29000,0.18025970458984375,0.18025971436500549,2.001323217153549,,
|
| 65 |
+
29500,0.1644441783428192,0.16444419884681702,2.0171387326717376,,
|
| 66 |
+
30000,0.16831377148628235,0.1683137676715851,2.013269152879715,,
|
| 67 |
+
30000,,,,1.8048384869098664,0.37674441933631897
|
| 68 |
+
30500,0.1928020715713501,0.19280207705497743,1.9887808554172517,,
|
| 69 |
+
31000,0.17093442380428314,0.1709344298839569,2.010648505449295,,
|
| 70 |
+
31500,0.1742946207523346,0.17429463267326356,2.0072882857322694,,
|
| 71 |
+
32000,0.180067241191864,0.18006725740432739,2.001515671491623,,
|
| 72 |
+
32500,0.18590447306632996,0.18590448355674744,1.9956784415245057,,
|
| 73 |
+
33000,0.1711912900209427,0.17119126653671266,2.0103916585445405,,
|
| 74 |
+
33500,0.15487484633922577,0.1548748528957367,2.0267080771923065,,
|
| 75 |
+
34000,0.1897355616092682,0.1897355785369873,1.991847359418869,,
|
| 76 |
+
34500,0.1805247813463211,0.18052478647232056,2.0010581305027006,,
|
| 77 |
+
35000,0.16770698130130768,0.1677069809436798,2.01387593626976,,
|
| 78 |
+
35000,,,,1.8149522477388382,0.3666306734085083
|
| 79 |
+
35500,0.1481206864118576,0.1481206784248352,2.033462256908417,,
|
| 80 |
+
36000,0.16231143474578857,0.16231142234802245,2.019271505832672,,
|
| 81 |
+
36500,0.17383816838264465,0.17383818364143372,2.007744749546051,,
|
| 82 |
+
37000,0.17515498399734497,0.17515498614311217,2.006427950382233,,
|
| 83 |
+
37500,0.13879266381263733,0.13879266476631164,2.0427902591228486,,
|
| 84 |
+
38000,0.14485672116279602,0.14485670948028564,2.0367262098789216,,
|
| 85 |
+
38500,0.16686411201953888,0.16686410665512086,2.0147188200950623,,
|
| 86 |
+
39000,0.15066872537136078,0.1506687228679657,2.0309142134189604,,
|
| 87 |
+
39500,0.18268169462680817,0.18268170690536498,1.9989012172222138,,
|
| 88 |
+
40000,0.15600693225860596,0.15600690293312072,2.0255760271549224,,
|
| 89 |
+
40000,,,,1.7944300961494446,0.3871528208255768
|
| 90 |
+
40500,0.17867568135261536,0.17867569041252135,2.002907225608826,,
|
| 91 |
+
41000,0.1683284044265747,0.16832840609550476,2.0132545228004455,,
|
| 92 |
+
41500,0.17173387110233307,0.17173386788368225,2.0098490529060364,,
|
| 93 |
+
42000,0.19686487317085266,0.1968648748397827,1.9847180500030517,,
|
| 94 |
+
42500,0.20282357931137085,0.20282357573509216,1.978759358882904,,
|
| 95 |
+
43000,0.17615151405334473,0.17615151453018188,2.005431404352188,,
|
| 96 |
+
43500,0.18170075118541718,0.18170075058937074,1.999882180929184,,
|
| 97 |
+
44000,0.17335250973701477,0.17335253238677978,2.0082303965091706,,
|
| 98 |
+
44500,0.18900486826896667,0.1890048577785492,1.9925780787467957,,
|
| 99 |
+
45000,0.17330293357372284,0.17330293107032776,2.00828000164032,,
|
| 100 |
+
45000,,,,1.8278998142480851,0.35368311405181885
|
| 101 |
+
45500,0.15311309695243835,0.15311309576034546,2.0284698269367216,,
|
| 102 |
+
46000,0.17649856209754944,0.17649854969978332,2.0050843760967254,,
|
| 103 |
+
46500,0.16959574818611145,0.16959576773643495,2.011987164258957,,
|
| 104 |
+
47000,0.1912308633327484,0.19123088598251342,1.990352041721344,,
|
| 105 |
+
47500,0.200710266828537,0.20071024584770203,1.980872678756714,,
|
| 106 |
+
48000,0.1822909712791443,0.1822909679412842,1.9992919502258302,,
|
| 107 |
+
48500,0.18565015494823456,0.18565017104148865,1.9959327545166015,,
|
| 108 |
+
49000,0.20148558914661407,0.2014856173992157,1.9800973193645477,,
|
| 109 |
+
49500,0.18955175578594208,0.18955174946784972,1.992031180381775,,
|
| 110 |
+
50000,0.16458189487457275,0.1645818874835968,2.017001046895981,,
|
| 111 |
+
50000,,,,1.7965672659873961,0.38501566648483276
|
| 112 |
+
50500,0.1736375242471695,0.17363752698898316,2.0079453995227814,,
|
| 113 |
+
51000,0.19020415842533112,0.1902041654586792,1.9913787581920623,,
|
3/ckpt_latest.zip
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:f1a654f3a5edc179b9a884b35548b0dbf774c18111cd2e23c5f148a4273e9824
|
| 3 |
+
size 8844016
|
3/config.yaml
ADDED
|
@@ -0,0 +1,58 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
env_id: RBC3D-easy-v0
|
| 2 |
+
env_kwargs: {}
|
| 3 |
+
eval_env_kwargs: {}
|
| 4 |
+
seed: 3
|
| 5 |
+
rl_mode: marl
|
| 6 |
+
total_timesteps: 50000.0
|
| 7 |
+
n_eval_steps: 10
|
| 8 |
+
eval_freq: ${eval:${total_timesteps} // ${n_eval_steps}}
|
| 9 |
+
n_eval_episodes: 1
|
| 10 |
+
continue_training: false
|
| 11 |
+
checkpoint_latest: true
|
| 12 |
+
rl_device: cpu
|
| 13 |
+
eval_callback:
|
| 14 |
+
_target_: fluidgym.integration.sb3.EvalCallback
|
| 15 |
+
eval_freq: ${eval_freq}
|
| 16 |
+
n_eval_episodes: ${n_eval_episodes}
|
| 17 |
+
use_wandb: ${wandb.enable}
|
| 18 |
+
checkpoint_latest: ${checkpoint_latest}
|
| 19 |
+
wandb:
|
| 20 |
+
enable: true
|
| 21 |
+
entity: safe-autonomous-systems
|
| 22 |
+
project: jbecktepe-fluidgym
|
| 23 |
+
algorithm:
|
| 24 |
+
name: PPO
|
| 25 |
+
obj:
|
| 26 |
+
_target_: stable_baselines3.ppo.ppo.PPO
|
| 27 |
+
policy: MlpPolicy
|
| 28 |
+
learning_rate: 0.0003
|
| 29 |
+
n_steps: 2048
|
| 30 |
+
batch_size: 64
|
| 31 |
+
n_epochs: 10
|
| 32 |
+
gamma: 0.99
|
| 33 |
+
gae_lambda: 0.95
|
| 34 |
+
clip_range: 0.2
|
| 35 |
+
clip_range_vf: null
|
| 36 |
+
normalize_advantage: true
|
| 37 |
+
ent_coef: 0.01
|
| 38 |
+
vf_coef: 0.5
|
| 39 |
+
max_grad_norm: 0.5
|
| 40 |
+
use_sde: false
|
| 41 |
+
sde_sample_freq: -1
|
| 42 |
+
rollout_buffer_class: null
|
| 43 |
+
rollout_buffer_kwargs: null
|
| 44 |
+
target_kl: null
|
| 45 |
+
stats_window_size: 100
|
| 46 |
+
tensorboard_log: null
|
| 47 |
+
verbose: 0
|
| 48 |
+
seed: ${seed}
|
| 49 |
+
device: ${rl_device}
|
| 50 |
+
_init_setup_model: true
|
| 51 |
+
cluster: {}
|
| 52 |
+
test_env_id: ${env_id}
|
| 53 |
+
test_env_kwargs: ${env_kwargs}
|
| 54 |
+
test_rl_mode: ${rl_mode}
|
| 55 |
+
n_test_episodes: 10
|
| 56 |
+
deterministic: true
|
| 57 |
+
save_frames: true
|
| 58 |
+
render_3d: true
|
3/hydra.yaml
ADDED
|
@@ -0,0 +1,163 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
hydra:
|
| 2 |
+
run:
|
| 3 |
+
dir: output/training/${rl_mode}/${env_id}/${algorithm.name}/${seed}
|
| 4 |
+
sweep:
|
| 5 |
+
dir: output/training/${rl_mode}/${env_id}/${algorithm.name}/${seed}
|
| 6 |
+
subdir: ''
|
| 7 |
+
launcher:
|
| 8 |
+
_target_: hydra._internal.core_plugins.basic_launcher.BasicLauncher
|
| 9 |
+
sweeper:
|
| 10 |
+
_target_: hydra._internal.core_plugins.basic_sweeper.BasicSweeper
|
| 11 |
+
max_batch_size: null
|
| 12 |
+
params: null
|
| 13 |
+
help:
|
| 14 |
+
app_name: ${hydra.job.name}
|
| 15 |
+
header: '${hydra.help.app_name} is powered by Hydra.
|
| 16 |
+
|
| 17 |
+
'
|
| 18 |
+
footer: 'Powered by Hydra (https://hydra.cc)
|
| 19 |
+
|
| 20 |
+
Use --hydra-help to view Hydra specific help
|
| 21 |
+
|
| 22 |
+
'
|
| 23 |
+
template: '${hydra.help.header}
|
| 24 |
+
|
| 25 |
+
== Configuration groups ==
|
| 26 |
+
|
| 27 |
+
Compose your configuration from those groups (group=option)
|
| 28 |
+
|
| 29 |
+
|
| 30 |
+
$APP_CONFIG_GROUPS
|
| 31 |
+
|
| 32 |
+
|
| 33 |
+
== Config ==
|
| 34 |
+
|
| 35 |
+
Override anything in the config (foo.bar=value)
|
| 36 |
+
|
| 37 |
+
|
| 38 |
+
$CONFIG
|
| 39 |
+
|
| 40 |
+
|
| 41 |
+
${hydra.help.footer}
|
| 42 |
+
|
| 43 |
+
'
|
| 44 |
+
hydra_help:
|
| 45 |
+
template: 'Hydra (${hydra.runtime.version})
|
| 46 |
+
|
| 47 |
+
See https://hydra.cc for more info.
|
| 48 |
+
|
| 49 |
+
|
| 50 |
+
== Flags ==
|
| 51 |
+
|
| 52 |
+
$FLAGS_HELP
|
| 53 |
+
|
| 54 |
+
|
| 55 |
+
== Configuration groups ==
|
| 56 |
+
|
| 57 |
+
Compose your configuration from those groups (For example, append hydra/job_logging=disabled
|
| 58 |
+
to command line)
|
| 59 |
+
|
| 60 |
+
|
| 61 |
+
$HYDRA_CONFIG_GROUPS
|
| 62 |
+
|
| 63 |
+
|
| 64 |
+
Use ''--cfg hydra'' to Show the Hydra config.
|
| 65 |
+
|
| 66 |
+
'
|
| 67 |
+
hydra_help: ???
|
| 68 |
+
hydra_logging:
|
| 69 |
+
version: 1
|
| 70 |
+
formatters:
|
| 71 |
+
simple:
|
| 72 |
+
format: '[%(asctime)s][HYDRA] %(message)s'
|
| 73 |
+
handlers:
|
| 74 |
+
console:
|
| 75 |
+
class: logging.StreamHandler
|
| 76 |
+
formatter: simple
|
| 77 |
+
stream: ext://sys.stdout
|
| 78 |
+
root:
|
| 79 |
+
level: INFO
|
| 80 |
+
handlers:
|
| 81 |
+
- console
|
| 82 |
+
loggers:
|
| 83 |
+
logging_example:
|
| 84 |
+
level: DEBUG
|
| 85 |
+
disable_existing_loggers: false
|
| 86 |
+
job_logging:
|
| 87 |
+
version: 1
|
| 88 |
+
formatters:
|
| 89 |
+
simple:
|
| 90 |
+
format: '[%(asctime)s][%(name)s][%(levelname)s] - %(message)s'
|
| 91 |
+
handlers:
|
| 92 |
+
console:
|
| 93 |
+
class: logging.StreamHandler
|
| 94 |
+
formatter: simple
|
| 95 |
+
stream: ext://sys.stdout
|
| 96 |
+
file:
|
| 97 |
+
class: logging.FileHandler
|
| 98 |
+
formatter: simple
|
| 99 |
+
filename: ${hydra.runtime.output_dir}/${hydra.job.name}.log
|
| 100 |
+
root:
|
| 101 |
+
level: INFO
|
| 102 |
+
handlers:
|
| 103 |
+
- console
|
| 104 |
+
- file
|
| 105 |
+
disable_existing_loggers: false
|
| 106 |
+
env: {}
|
| 107 |
+
mode: MULTIRUN
|
| 108 |
+
searchpath: []
|
| 109 |
+
callbacks: {}
|
| 110 |
+
output_subdir: .
|
| 111 |
+
overrides:
|
| 112 |
+
hydra:
|
| 113 |
+
- hydra.mode=MULTIRUN
|
| 114 |
+
task:
|
| 115 |
+
- algorithm=sb3_ppo
|
| 116 |
+
- env_id=RBC3D-easy-v0
|
| 117 |
+
- rl_mode=marl
|
| 118 |
+
- seed=3
|
| 119 |
+
job:
|
| 120 |
+
name: test_sb3
|
| 121 |
+
chdir: true
|
| 122 |
+
override_dirname: algorithm=sb3_ppo,env_id=RBC3D-easy-v0,rl_mode=marl,seed=3
|
| 123 |
+
id: '0'
|
| 124 |
+
num: 0
|
| 125 |
+
config_name: test_sb3
|
| 126 |
+
env_set: {}
|
| 127 |
+
env_copy: []
|
| 128 |
+
config:
|
| 129 |
+
override_dirname:
|
| 130 |
+
kv_sep: '='
|
| 131 |
+
item_sep: ','
|
| 132 |
+
exclude_keys: []
|
| 133 |
+
runtime:
|
| 134 |
+
version: 1.3.2
|
| 135 |
+
version_base: '1.3'
|
| 136 |
+
cwd: /cephfs/users/becktepe/git_projects/FluidGym
|
| 137 |
+
config_sources:
|
| 138 |
+
- path: hydra.conf
|
| 139 |
+
schema: pkg
|
| 140 |
+
provider: hydra
|
| 141 |
+
- path: /cephfs/users/becktepe/git_projects/FluidGym/runscripts/configs
|
| 142 |
+
schema: file
|
| 143 |
+
provider: main
|
| 144 |
+
- path: hydra_plugins.hydra_colorlog.conf
|
| 145 |
+
schema: pkg
|
| 146 |
+
provider: hydra-colorlog
|
| 147 |
+
- path: ''
|
| 148 |
+
schema: structured
|
| 149 |
+
provider: schema
|
| 150 |
+
output_dir: /cephfs/users/becktepe/git_projects/FluidGym/output/training/marl/RBC3D-easy-v0/PPO/3
|
| 151 |
+
choices:
|
| 152 |
+
cluster: local
|
| 153 |
+
algorithm: sb3_ppo
|
| 154 |
+
hydra/env: default
|
| 155 |
+
hydra/callbacks: null
|
| 156 |
+
hydra/job_logging: default
|
| 157 |
+
hydra/hydra_logging: default
|
| 158 |
+
hydra/hydra_help: default
|
| 159 |
+
hydra/help: default
|
| 160 |
+
hydra/sweeper: basic
|
| 161 |
+
hydra/launcher: basic
|
| 162 |
+
hydra/output: default
|
| 163 |
+
verbose: false
|
3/multirun.yaml
ADDED
|
@@ -0,0 +1,221 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
hydra:
|
| 2 |
+
run:
|
| 3 |
+
dir: output/training/${rl_mode}/${env_id}/${algorithm.name}/${seed}
|
| 4 |
+
sweep:
|
| 5 |
+
dir: output/training/${rl_mode}/${env_id}/${algorithm.name}/${seed}
|
| 6 |
+
subdir: ''
|
| 7 |
+
launcher:
|
| 8 |
+
_target_: hydra._internal.core_plugins.basic_launcher.BasicLauncher
|
| 9 |
+
sweeper:
|
| 10 |
+
_target_: hydra._internal.core_plugins.basic_sweeper.BasicSweeper
|
| 11 |
+
max_batch_size: null
|
| 12 |
+
params: null
|
| 13 |
+
help:
|
| 14 |
+
app_name: ${hydra.job.name}
|
| 15 |
+
header: '${hydra.help.app_name} is powered by Hydra.
|
| 16 |
+
|
| 17 |
+
'
|
| 18 |
+
footer: 'Powered by Hydra (https://hydra.cc)
|
| 19 |
+
|
| 20 |
+
Use --hydra-help to view Hydra specific help
|
| 21 |
+
|
| 22 |
+
'
|
| 23 |
+
template: '${hydra.help.header}
|
| 24 |
+
|
| 25 |
+
== Configuration groups ==
|
| 26 |
+
|
| 27 |
+
Compose your configuration from those groups (group=option)
|
| 28 |
+
|
| 29 |
+
|
| 30 |
+
$APP_CONFIG_GROUPS
|
| 31 |
+
|
| 32 |
+
|
| 33 |
+
== Config ==
|
| 34 |
+
|
| 35 |
+
Override anything in the config (foo.bar=value)
|
| 36 |
+
|
| 37 |
+
|
| 38 |
+
$CONFIG
|
| 39 |
+
|
| 40 |
+
|
| 41 |
+
${hydra.help.footer}
|
| 42 |
+
|
| 43 |
+
'
|
| 44 |
+
hydra_help:
|
| 45 |
+
template: 'Hydra (${hydra.runtime.version})
|
| 46 |
+
|
| 47 |
+
See https://hydra.cc for more info.
|
| 48 |
+
|
| 49 |
+
|
| 50 |
+
== Flags ==
|
| 51 |
+
|
| 52 |
+
$FLAGS_HELP
|
| 53 |
+
|
| 54 |
+
|
| 55 |
+
== Configuration groups ==
|
| 56 |
+
|
| 57 |
+
Compose your configuration from those groups (For example, append hydra/job_logging=disabled
|
| 58 |
+
to command line)
|
| 59 |
+
|
| 60 |
+
|
| 61 |
+
$HYDRA_CONFIG_GROUPS
|
| 62 |
+
|
| 63 |
+
|
| 64 |
+
Use ''--cfg hydra'' to Show the Hydra config.
|
| 65 |
+
|
| 66 |
+
'
|
| 67 |
+
hydra_help: ???
|
| 68 |
+
hydra_logging:
|
| 69 |
+
version: 1
|
| 70 |
+
formatters:
|
| 71 |
+
simple:
|
| 72 |
+
format: '[%(asctime)s][HYDRA] %(message)s'
|
| 73 |
+
handlers:
|
| 74 |
+
console:
|
| 75 |
+
class: logging.StreamHandler
|
| 76 |
+
formatter: simple
|
| 77 |
+
stream: ext://sys.stdout
|
| 78 |
+
root:
|
| 79 |
+
level: INFO
|
| 80 |
+
handlers:
|
| 81 |
+
- console
|
| 82 |
+
loggers:
|
| 83 |
+
logging_example:
|
| 84 |
+
level: DEBUG
|
| 85 |
+
disable_existing_loggers: false
|
| 86 |
+
job_logging:
|
| 87 |
+
version: 1
|
| 88 |
+
formatters:
|
| 89 |
+
simple:
|
| 90 |
+
format: '[%(asctime)s][%(name)s][%(levelname)s] - %(message)s'
|
| 91 |
+
handlers:
|
| 92 |
+
console:
|
| 93 |
+
class: logging.StreamHandler
|
| 94 |
+
formatter: simple
|
| 95 |
+
stream: ext://sys.stdout
|
| 96 |
+
file:
|
| 97 |
+
class: logging.FileHandler
|
| 98 |
+
formatter: simple
|
| 99 |
+
filename: ${hydra.runtime.output_dir}/${hydra.job.name}.log
|
| 100 |
+
root:
|
| 101 |
+
level: INFO
|
| 102 |
+
handlers:
|
| 103 |
+
- console
|
| 104 |
+
- file
|
| 105 |
+
disable_existing_loggers: false
|
| 106 |
+
env: {}
|
| 107 |
+
mode: MULTIRUN
|
| 108 |
+
searchpath: []
|
| 109 |
+
callbacks: {}
|
| 110 |
+
output_subdir: .
|
| 111 |
+
overrides:
|
| 112 |
+
hydra:
|
| 113 |
+
- hydra.mode=MULTIRUN
|
| 114 |
+
task:
|
| 115 |
+
- algorithm=sb3_ppo
|
| 116 |
+
- env_id=RBC3D-easy-v0
|
| 117 |
+
- rl_mode=marl
|
| 118 |
+
- seed=3
|
| 119 |
+
job:
|
| 120 |
+
name: test_sb3
|
| 121 |
+
chdir: true
|
| 122 |
+
override_dirname: algorithm=sb3_ppo,env_id=RBC3D-easy-v0,rl_mode=marl,seed=3
|
| 123 |
+
id: ???
|
| 124 |
+
num: ???
|
| 125 |
+
config_name: test_sb3
|
| 126 |
+
env_set: {}
|
| 127 |
+
env_copy: []
|
| 128 |
+
config:
|
| 129 |
+
override_dirname:
|
| 130 |
+
kv_sep: '='
|
| 131 |
+
item_sep: ','
|
| 132 |
+
exclude_keys: []
|
| 133 |
+
runtime:
|
| 134 |
+
version: 1.3.2
|
| 135 |
+
version_base: '1.3'
|
| 136 |
+
cwd: /cephfs/users/becktepe/git_projects/FluidGym
|
| 137 |
+
config_sources:
|
| 138 |
+
- path: hydra.conf
|
| 139 |
+
schema: pkg
|
| 140 |
+
provider: hydra
|
| 141 |
+
- path: /cephfs/users/becktepe/git_projects/FluidGym/runscripts/configs
|
| 142 |
+
schema: file
|
| 143 |
+
provider: main
|
| 144 |
+
- path: hydra_plugins.hydra_colorlog.conf
|
| 145 |
+
schema: pkg
|
| 146 |
+
provider: hydra-colorlog
|
| 147 |
+
- path: ''
|
| 148 |
+
schema: structured
|
| 149 |
+
provider: schema
|
| 150 |
+
output_dir: ???
|
| 151 |
+
choices:
|
| 152 |
+
cluster: local
|
| 153 |
+
algorithm: sb3_ppo
|
| 154 |
+
hydra/env: default
|
| 155 |
+
hydra/callbacks: null
|
| 156 |
+
hydra/job_logging: default
|
| 157 |
+
hydra/hydra_logging: default
|
| 158 |
+
hydra/hydra_help: default
|
| 159 |
+
hydra/help: default
|
| 160 |
+
hydra/sweeper: basic
|
| 161 |
+
hydra/launcher: basic
|
| 162 |
+
hydra/output: default
|
| 163 |
+
verbose: false
|
| 164 |
+
env_id: RBC3D-easy-v0
|
| 165 |
+
env_kwargs: {}
|
| 166 |
+
eval_env_kwargs: {}
|
| 167 |
+
seed: 3
|
| 168 |
+
rl_mode: marl
|
| 169 |
+
total_timesteps: 50000.0
|
| 170 |
+
n_eval_steps: 10
|
| 171 |
+
eval_freq: ${eval:${total_timesteps} // ${n_eval_steps}}
|
| 172 |
+
n_eval_episodes: 1
|
| 173 |
+
continue_training: false
|
| 174 |
+
checkpoint_latest: true
|
| 175 |
+
rl_device: cpu
|
| 176 |
+
eval_callback:
|
| 177 |
+
_target_: fluidgym.integration.sb3.EvalCallback
|
| 178 |
+
eval_freq: ${eval_freq}
|
| 179 |
+
n_eval_episodes: ${n_eval_episodes}
|
| 180 |
+
use_wandb: ${wandb.enable}
|
| 181 |
+
checkpoint_latest: ${checkpoint_latest}
|
| 182 |
+
wandb:
|
| 183 |
+
enable: true
|
| 184 |
+
entity: safe-autonomous-systems
|
| 185 |
+
project: jbecktepe-fluidgym
|
| 186 |
+
algorithm:
|
| 187 |
+
name: PPO
|
| 188 |
+
obj:
|
| 189 |
+
_target_: stable_baselines3.ppo.ppo.PPO
|
| 190 |
+
policy: MlpPolicy
|
| 191 |
+
learning_rate: 0.0003
|
| 192 |
+
n_steps: 2048
|
| 193 |
+
batch_size: 64
|
| 194 |
+
n_epochs: 10
|
| 195 |
+
gamma: 0.99
|
| 196 |
+
gae_lambda: 0.95
|
| 197 |
+
clip_range: 0.2
|
| 198 |
+
clip_range_vf: null
|
| 199 |
+
normalize_advantage: true
|
| 200 |
+
ent_coef: 0.01
|
| 201 |
+
vf_coef: 0.5
|
| 202 |
+
max_grad_norm: 0.5
|
| 203 |
+
use_sde: false
|
| 204 |
+
sde_sample_freq: -1
|
| 205 |
+
rollout_buffer_class: null
|
| 206 |
+
rollout_buffer_kwargs: null
|
| 207 |
+
target_kl: null
|
| 208 |
+
stats_window_size: 100
|
| 209 |
+
tensorboard_log: null
|
| 210 |
+
verbose: 0
|
| 211 |
+
seed: ${seed}
|
| 212 |
+
device: ${rl_device}
|
| 213 |
+
_init_setup_model: true
|
| 214 |
+
cluster: {}
|
| 215 |
+
test_env_id: ${env_id}
|
| 216 |
+
test_env_kwargs: ${env_kwargs}
|
| 217 |
+
test_rl_mode: ${rl_mode}
|
| 218 |
+
n_test_episodes: 10
|
| 219 |
+
deterministic: true
|
| 220 |
+
save_frames: true
|
| 221 |
+
render_3d: true
|
3/overrides.yaml
ADDED
|
@@ -0,0 +1,4 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
- algorithm=sb3_ppo
|
| 2 |
+
- env_id=RBC3D-easy-v0
|
| 3 |
+
- rl_mode=marl
|
| 4 |
+
- seed=3
|
3/test/3d_temperature_test_eval_episode_0.gif
ADDED
|
Git LFS Details
|
3/test/test_eval_episode_0.csv
ADDED
|
The diff for this file is too large to render.
See raw diff
|
|
|
3/test/x-y-temperature_test_eval_episode_0.gif
ADDED
|
Git LFS Details
|
3/test/x-z-temperature_test_eval_episode_0.gif
ADDED
|
Git LFS Details
|
3/test/y-z-temperature_test_eval_episode_0.gif
ADDED
|
Git LFS Details
|
3/training_log.csv
ADDED
|
@@ -0,0 +1,113 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
step,training/mean_reward,training/mean_global_reward,training/mean_nusselt,evaluation/mean_nusselt,evaluation/mean_reward
|
| 2 |
+
500,-0.050438277423381805,-0.05043827676773071,2.232021207332611,,
|
| 3 |
+
1000,-0.06766729056835175,-0.0676672911643982,2.249250214099884,,
|
| 4 |
+
1500,-0.06475519388914108,-0.06475520038604736,2.2463381309509276,,
|
| 5 |
+
2000,-0.07544218748807907,-0.07544218826293946,2.2570251235961916,,
|
| 6 |
+
2500,-0.04640858247876167,-0.046408580780029296,2.2279915108680726,,
|
| 7 |
+
3000,-0.019970253109931946,-0.019970251083374024,2.2015531821250915,,
|
| 8 |
+
3500,-0.03314433991909027,-0.03314434194564819,2.2147272696495057,,
|
| 9 |
+
4000,-0.0446096770465374,-0.04460967683792114,2.226192602157593,,
|
| 10 |
+
4500,-0.0667218491435051,-0.06672185564041137,2.248304777145386,,
|
| 11 |
+
5000,0.0031401743181049824,0.0031401748657226562,2.178442750453949,,
|
| 12 |
+
5000,,,,2.1348024225234985,0.046780504286289215
|
| 13 |
+
5500,0.022269688546657562,0.022269688606262206,2.159313237667084,,
|
| 14 |
+
6000,0.021571213379502296,0.02157121467590332,2.160011706829071,,
|
| 15 |
+
6500,-0.03134319931268692,-0.031343202590942386,2.212926122188568,,
|
| 16 |
+
7000,0.01380790863186121,0.013807908773422242,2.1677750108242035,,
|
| 17 |
+
7500,0.03137562423944473,0.031375624656677245,2.150207305908203,,
|
| 18 |
+
8000,0.020615708082914352,0.02061570692062378,2.1609672374725344,,
|
| 19 |
+
8500,0.010343119502067566,0.010343119621276856,2.1712397990226746,,
|
| 20 |
+
9000,0.005791854113340378,0.005791854381561279,2.175791069030762,,
|
| 21 |
+
9500,0.013246963731944561,0.013246963024139405,2.168335965156555,,
|
| 22 |
+
10000,-0.0013291880022734404,-0.0013291873931884765,2.1829121141433716,,
|
| 23 |
+
10000,,,,2.11635510802269,0.06522782146930695
|
| 24 |
+
10500,0.004903855267912149,0.004903855800628662,2.1766790614128113,,
|
| 25 |
+
11000,-0.06585860997438431,-0.06585861587524414,2.247441548347473,,
|
| 26 |
+
11500,0.03156871348619461,0.03156871128082275,2.1500142188072204,,
|
| 27 |
+
12000,0.03209967166185379,0.03209967279434204,2.1494832587242128,,
|
| 28 |
+
12500,0.02772170677781105,0.0277217071056366,2.1538612248897553,,
|
| 29 |
+
13000,0.03325227275490761,0.03325227403640747,2.1483306469917296,,
|
| 30 |
+
13500,0.05017443746328354,0.05017443490028382,2.1314084968566895,,
|
| 31 |
+
14000,0.02192855067551136,0.021928547859191894,2.1596543831825255,,
|
| 32 |
+
14500,0.02297738566994667,0.022977387905120848,2.1586055517196656,,
|
| 33 |
+
15000,0.04552844911813736,0.04552845025062561,2.136054482936859,,
|
| 34 |
+
15000,,,,2.0816797852516173,0.09990313649177551
|
| 35 |
+
15500,0.02195972204208374,0.021959722995758057,2.159623192548752,,
|
| 36 |
+
16000,0.05156781151890755,0.0515678071975708,2.1300151209831237,,
|
| 37 |
+
16500,0.032499413937330246,0.03249941205978393,2.149083516359329,,
|
| 38 |
+
17000,0.07406782358884811,0.07406781721115112,2.1075151076316834,,
|
| 39 |
+
17500,0.06772258132696152,0.06772258234024048,2.1138603429794314,,
|
| 40 |
+
18000,0.047708477824926376,0.0477084755897522,2.1338744478225706,,
|
| 41 |
+
18500,0.05880160629749298,0.058801607608795166,2.122781320333481,,
|
| 42 |
+
19000,0.05765968933701515,0.05765968990325928,2.123923238277435,,
|
| 43 |
+
19500,0.03194111958146095,0.03194111776351929,2.1496418001651763,,
|
| 44 |
+
20000,0.06176219508051872,0.0617621967792511,2.119820727109909,,
|
| 45 |
+
20000,,,,2.0652108162641527,0.11637210845947266
|
| 46 |
+
20500,0.07553316652774811,0.07553317403793335,2.10604975438118,,
|
| 47 |
+
21000,0.07630740106105804,0.07630739951133728,2.10527551817894,,
|
| 48 |
+
21500,0.06292356550693512,0.06292356991767883,2.11865935254097,,
|
| 49 |
+
22000,0.05584558844566345,0.05584558796882629,2.125737341403961,,
|
| 50 |
+
22500,0.03619024530053139,0.03619024300575256,2.1453926844596864,,
|
| 51 |
+
23000,0.08000177145004272,0.08000177478790284,2.101581146001816,,
|
| 52 |
+
23500,0.08511899411678314,0.08511899185180664,2.096463934659958,,
|
| 53 |
+
24000,0.04231981560587883,0.042319814920425414,2.1392631089687346,,
|
| 54 |
+
24500,0.048970602452754974,0.04897059941291809,2.1326123216152193,,
|
| 55 |
+
25000,0.10177874565124512,0.10177874445915222,2.0798041846752167,,
|
| 56 |
+
25000,,,,1.9942094898223877,0.18737342953681946
|
| 57 |
+
25500,0.11347105354070663,0.11347105479240417,2.0681118774414062,,
|
| 58 |
+
26000,0.101518914103508,0.10151890659332276,2.0800640194416045,,
|
| 59 |
+
26500,0.11459202319383621,0.11459202551841736,2.066990908384323,,
|
| 60 |
+
27000,0.11430617421865463,0.11430617189407348,2.067276755571365,,
|
| 61 |
+
27500,0.10968131572008133,0.10968131875991821,2.0719016060829163,,
|
| 62 |
+
28000,0.1287713348865509,0.12877134370803833,2.0528115787506103,,
|
| 63 |
+
28500,0.11253622174263,0.112536235332489,2.0690466995239256,,
|
| 64 |
+
29000,0.1281118541955948,0.12811184310913085,2.0534710865020753,,
|
| 65 |
+
29500,0.10534487664699554,0.10534487962722779,2.0762380349636076,,
|
| 66 |
+
30000,0.11968756467103958,0.11968756461143494,2.0618953680992127,,
|
| 67 |
+
30000,,,,1.87678431391716,0.30479860305786133
|
| 68 |
+
30500,0.1030559092760086,0.10305590581893921,2.0785270199775696,,
|
| 69 |
+
31000,0.10445408523082733,0.10445408391952514,2.077128833770752,,
|
| 70 |
+
31500,0.10940387845039368,0.10940388464927674,2.0721790425777433,,
|
| 71 |
+
32000,0.09373175352811813,0.09373175859451294,2.08785116648674,,
|
| 72 |
+
32500,0.1295819729566574,0.1295819625854492,2.052000971317291,,
|
| 73 |
+
33000,0.10238485038280487,0.10238485050201417,2.0791980743408205,,
|
| 74 |
+
33500,0.12654829025268555,0.12654830193519592,2.0550346229076384,,
|
| 75 |
+
34000,0.1189715713262558,0.11897156620025635,2.0626113643646242,,
|
| 76 |
+
34500,0.12389718741178513,0.12389718294143677,2.0576857616901396,,
|
| 77 |
+
35000,0.14573870599269867,0.1457387068271637,2.0358442249298094,,
|
| 78 |
+
35000,,,,1.8783732569217682,0.30320966243743896
|
| 79 |
+
35500,0.1098504364490509,0.10985043406486511,2.0717324867248537,,
|
| 80 |
+
36000,0.11075016111135483,0.11075015997886657,2.070832767009735,,
|
| 81 |
+
36500,0.10975827276706696,0.10975826597213745,2.071824664592743,,
|
| 82 |
+
37000,0.12856659293174744,0.12856660389900207,2.0530163156986236,,
|
| 83 |
+
37500,0.1360883116722107,0.1360883104801178,2.045494614362717,,
|
| 84 |
+
38000,0.09176091849803925,0.0917609167098999,2.089822017431259,,
|
| 85 |
+
38500,0.11355500668287277,0.11355500030517578,2.0680279445648195,,
|
| 86 |
+
39000,0.1526203602552414,0.15262035179138184,2.028962571144104,,
|
| 87 |
+
39500,0.16022932529449463,0.16022932457923889,2.0213536105155945,,
|
| 88 |
+
40000,0.13480022549629211,0.13480024361610413,2.0467826886177063,,
|
| 89 |
+
40000,,,,1.817890984416008,0.36369192600250244
|
| 90 |
+
40500,0.1544303596019745,0.15443037509918212,2.027152554512024,,
|
| 91 |
+
41000,0.15893837809562683,0.15893839478492736,2.0226445353031157,,
|
| 92 |
+
41500,0.16579964756965637,0.1657996542453766,2.0157832798957824,,
|
| 93 |
+
42000,0.15551361441612244,0.15551361966133118,2.0260692956447603,,
|
| 94 |
+
42500,0.10133448988199234,0.10133448123931885,2.0802484333515165,,
|
| 95 |
+
43000,0.14176060259342194,0.14176061749458313,2.039822311878204,,
|
| 96 |
+
43500,0.13890503346920013,0.13890503454208375,2.0426778883934023,,
|
| 97 |
+
44000,0.13777685165405273,0.1377768485546112,2.043806074380875,,
|
| 98 |
+
44500,0.16418947279453278,0.16418947315216065,2.0173934667110442,,
|
| 99 |
+
45000,0.10311790555715561,0.10311790585517883,2.078465024232864,,
|
| 100 |
+
45000,,,,1.875197362303734,0.3063855767250061
|
| 101 |
+
45500,0.15438112616539001,0.15438111734390259,2.0272018098831177,,
|
| 102 |
+
46000,0.1552824079990387,0.15528242325782776,2.026300496816635,,
|
| 103 |
+
46500,0.14290881156921387,0.14290882539749145,2.038674108028412,,
|
| 104 |
+
47000,0.10676785558462143,0.10676785707473754,2.0748150796890257,,
|
| 105 |
+
47500,0.16349585354328156,0.16349583888053895,2.0180870866775513,,
|
| 106 |
+
48000,0.08548945933580399,0.08548946046829224,2.0960934791564942,,
|
| 107 |
+
48500,0.15652664005756378,0.15652664041519165,2.0250562791824342,,
|
| 108 |
+
49000,0.13339276611804962,0.1333927412033081,2.0481901876926423,,
|
| 109 |
+
49500,0.15712739527225494,0.15712741637229918,2.0244555003643034,,
|
| 110 |
+
50000,0.17887240648269653,0.17887241911888122,2.0027105035781863,,
|
| 111 |
+
50000,,,,1.7994264960289001,0.3821564316749573
|
| 112 |
+
50500,0.16286206245422363,0.16286205434799195,2.0187208688259126,,
|
| 113 |
+
51000,0.14349853992462158,0.14349854922294616,2.038084382534027,,
|
4/ckpt_latest.zip
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:5966cfdf929b7d110e0e7da6306be4c64f9dd66c29745e377a9fce441e73ab74
|
| 3 |
+
size 8844012
|
4/config.yaml
ADDED
|
@@ -0,0 +1,58 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
env_id: RBC3D-easy-v0
|
| 2 |
+
env_kwargs: {}
|
| 3 |
+
eval_env_kwargs: {}
|
| 4 |
+
seed: 4
|
| 5 |
+
rl_mode: marl
|
| 6 |
+
total_timesteps: 50000.0
|
| 7 |
+
n_eval_steps: 10
|
| 8 |
+
eval_freq: ${eval:${total_timesteps} // ${n_eval_steps}}
|
| 9 |
+
n_eval_episodes: 1
|
| 10 |
+
continue_training: false
|
| 11 |
+
checkpoint_latest: true
|
| 12 |
+
rl_device: cpu
|
| 13 |
+
eval_callback:
|
| 14 |
+
_target_: fluidgym.integration.sb3.EvalCallback
|
| 15 |
+
eval_freq: ${eval_freq}
|
| 16 |
+
n_eval_episodes: ${n_eval_episodes}
|
| 17 |
+
use_wandb: ${wandb.enable}
|
| 18 |
+
checkpoint_latest: ${checkpoint_latest}
|
| 19 |
+
wandb:
|
| 20 |
+
enable: true
|
| 21 |
+
entity: safe-autonomous-systems
|
| 22 |
+
project: jbecktepe-fluidgym
|
| 23 |
+
algorithm:
|
| 24 |
+
name: PPO
|
| 25 |
+
obj:
|
| 26 |
+
_target_: stable_baselines3.ppo.ppo.PPO
|
| 27 |
+
policy: MlpPolicy
|
| 28 |
+
learning_rate: 0.0003
|
| 29 |
+
n_steps: 2048
|
| 30 |
+
batch_size: 64
|
| 31 |
+
n_epochs: 10
|
| 32 |
+
gamma: 0.99
|
| 33 |
+
gae_lambda: 0.95
|
| 34 |
+
clip_range: 0.2
|
| 35 |
+
clip_range_vf: null
|
| 36 |
+
normalize_advantage: true
|
| 37 |
+
ent_coef: 0.01
|
| 38 |
+
vf_coef: 0.5
|
| 39 |
+
max_grad_norm: 0.5
|
| 40 |
+
use_sde: false
|
| 41 |
+
sde_sample_freq: -1
|
| 42 |
+
rollout_buffer_class: null
|
| 43 |
+
rollout_buffer_kwargs: null
|
| 44 |
+
target_kl: null
|
| 45 |
+
stats_window_size: 100
|
| 46 |
+
tensorboard_log: null
|
| 47 |
+
verbose: 0
|
| 48 |
+
seed: ${seed}
|
| 49 |
+
device: ${rl_device}
|
| 50 |
+
_init_setup_model: true
|
| 51 |
+
cluster: {}
|
| 52 |
+
test_env_id: ${env_id}
|
| 53 |
+
test_env_kwargs: ${env_kwargs}
|
| 54 |
+
test_rl_mode: ${rl_mode}
|
| 55 |
+
n_test_episodes: 10
|
| 56 |
+
deterministic: true
|
| 57 |
+
save_frames: true
|
| 58 |
+
render_3d: true
|
4/hydra.yaml
ADDED
|
@@ -0,0 +1,163 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
hydra:
|
| 2 |
+
run:
|
| 3 |
+
dir: output/training/${rl_mode}/${env_id}/${algorithm.name}/${seed}
|
| 4 |
+
sweep:
|
| 5 |
+
dir: output/training/${rl_mode}/${env_id}/${algorithm.name}/${seed}
|
| 6 |
+
subdir: ''
|
| 7 |
+
launcher:
|
| 8 |
+
_target_: hydra._internal.core_plugins.basic_launcher.BasicLauncher
|
| 9 |
+
sweeper:
|
| 10 |
+
_target_: hydra._internal.core_plugins.basic_sweeper.BasicSweeper
|
| 11 |
+
max_batch_size: null
|
| 12 |
+
params: null
|
| 13 |
+
help:
|
| 14 |
+
app_name: ${hydra.job.name}
|
| 15 |
+
header: '${hydra.help.app_name} is powered by Hydra.
|
| 16 |
+
|
| 17 |
+
'
|
| 18 |
+
footer: 'Powered by Hydra (https://hydra.cc)
|
| 19 |
+
|
| 20 |
+
Use --hydra-help to view Hydra specific help
|
| 21 |
+
|
| 22 |
+
'
|
| 23 |
+
template: '${hydra.help.header}
|
| 24 |
+
|
| 25 |
+
== Configuration groups ==
|
| 26 |
+
|
| 27 |
+
Compose your configuration from those groups (group=option)
|
| 28 |
+
|
| 29 |
+
|
| 30 |
+
$APP_CONFIG_GROUPS
|
| 31 |
+
|
| 32 |
+
|
| 33 |
+
== Config ==
|
| 34 |
+
|
| 35 |
+
Override anything in the config (foo.bar=value)
|
| 36 |
+
|
| 37 |
+
|
| 38 |
+
$CONFIG
|
| 39 |
+
|
| 40 |
+
|
| 41 |
+
${hydra.help.footer}
|
| 42 |
+
|
| 43 |
+
'
|
| 44 |
+
hydra_help:
|
| 45 |
+
template: 'Hydra (${hydra.runtime.version})
|
| 46 |
+
|
| 47 |
+
See https://hydra.cc for more info.
|
| 48 |
+
|
| 49 |
+
|
| 50 |
+
== Flags ==
|
| 51 |
+
|
| 52 |
+
$FLAGS_HELP
|
| 53 |
+
|
| 54 |
+
|
| 55 |
+
== Configuration groups ==
|
| 56 |
+
|
| 57 |
+
Compose your configuration from those groups (For example, append hydra/job_logging=disabled
|
| 58 |
+
to command line)
|
| 59 |
+
|
| 60 |
+
|
| 61 |
+
$HYDRA_CONFIG_GROUPS
|
| 62 |
+
|
| 63 |
+
|
| 64 |
+
Use ''--cfg hydra'' to Show the Hydra config.
|
| 65 |
+
|
| 66 |
+
'
|
| 67 |
+
hydra_help: ???
|
| 68 |
+
hydra_logging:
|
| 69 |
+
version: 1
|
| 70 |
+
formatters:
|
| 71 |
+
simple:
|
| 72 |
+
format: '[%(asctime)s][HYDRA] %(message)s'
|
| 73 |
+
handlers:
|
| 74 |
+
console:
|
| 75 |
+
class: logging.StreamHandler
|
| 76 |
+
formatter: simple
|
| 77 |
+
stream: ext://sys.stdout
|
| 78 |
+
root:
|
| 79 |
+
level: INFO
|
| 80 |
+
handlers:
|
| 81 |
+
- console
|
| 82 |
+
loggers:
|
| 83 |
+
logging_example:
|
| 84 |
+
level: DEBUG
|
| 85 |
+
disable_existing_loggers: false
|
| 86 |
+
job_logging:
|
| 87 |
+
version: 1
|
| 88 |
+
formatters:
|
| 89 |
+
simple:
|
| 90 |
+
format: '[%(asctime)s][%(name)s][%(levelname)s] - %(message)s'
|
| 91 |
+
handlers:
|
| 92 |
+
console:
|
| 93 |
+
class: logging.StreamHandler
|
| 94 |
+
formatter: simple
|
| 95 |
+
stream: ext://sys.stdout
|
| 96 |
+
file:
|
| 97 |
+
class: logging.FileHandler
|
| 98 |
+
formatter: simple
|
| 99 |
+
filename: ${hydra.runtime.output_dir}/${hydra.job.name}.log
|
| 100 |
+
root:
|
| 101 |
+
level: INFO
|
| 102 |
+
handlers:
|
| 103 |
+
- console
|
| 104 |
+
- file
|
| 105 |
+
disable_existing_loggers: false
|
| 106 |
+
env: {}
|
| 107 |
+
mode: MULTIRUN
|
| 108 |
+
searchpath: []
|
| 109 |
+
callbacks: {}
|
| 110 |
+
output_subdir: .
|
| 111 |
+
overrides:
|
| 112 |
+
hydra:
|
| 113 |
+
- hydra.mode=MULTIRUN
|
| 114 |
+
task:
|
| 115 |
+
- algorithm=sb3_ppo
|
| 116 |
+
- env_id=RBC3D-easy-v0
|
| 117 |
+
- rl_mode=marl
|
| 118 |
+
- seed=4
|
| 119 |
+
job:
|
| 120 |
+
name: test_sb3
|
| 121 |
+
chdir: true
|
| 122 |
+
override_dirname: algorithm=sb3_ppo,env_id=RBC3D-easy-v0,rl_mode=marl,seed=4
|
| 123 |
+
id: '0'
|
| 124 |
+
num: 0
|
| 125 |
+
config_name: test_sb3
|
| 126 |
+
env_set: {}
|
| 127 |
+
env_copy: []
|
| 128 |
+
config:
|
| 129 |
+
override_dirname:
|
| 130 |
+
kv_sep: '='
|
| 131 |
+
item_sep: ','
|
| 132 |
+
exclude_keys: []
|
| 133 |
+
runtime:
|
| 134 |
+
version: 1.3.2
|
| 135 |
+
version_base: '1.3'
|
| 136 |
+
cwd: /cephfs/users/becktepe/git_projects/FluidGym
|
| 137 |
+
config_sources:
|
| 138 |
+
- path: hydra.conf
|
| 139 |
+
schema: pkg
|
| 140 |
+
provider: hydra
|
| 141 |
+
- path: /cephfs/users/becktepe/git_projects/FluidGym/runscripts/configs
|
| 142 |
+
schema: file
|
| 143 |
+
provider: main
|
| 144 |
+
- path: hydra_plugins.hydra_colorlog.conf
|
| 145 |
+
schema: pkg
|
| 146 |
+
provider: hydra-colorlog
|
| 147 |
+
- path: ''
|
| 148 |
+
schema: structured
|
| 149 |
+
provider: schema
|
| 150 |
+
output_dir: /cephfs/users/becktepe/git_projects/FluidGym/output/training/marl/RBC3D-easy-v0/PPO/4
|
| 151 |
+
choices:
|
| 152 |
+
cluster: local
|
| 153 |
+
algorithm: sb3_ppo
|
| 154 |
+
hydra/env: default
|
| 155 |
+
hydra/callbacks: null
|
| 156 |
+
hydra/job_logging: default
|
| 157 |
+
hydra/hydra_logging: default
|
| 158 |
+
hydra/hydra_help: default
|
| 159 |
+
hydra/help: default
|
| 160 |
+
hydra/sweeper: basic
|
| 161 |
+
hydra/launcher: basic
|
| 162 |
+
hydra/output: default
|
| 163 |
+
verbose: false
|
4/multirun.yaml
ADDED
|
@@ -0,0 +1,221 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
hydra:
|
| 2 |
+
run:
|
| 3 |
+
dir: output/training/${rl_mode}/${env_id}/${algorithm.name}/${seed}
|
| 4 |
+
sweep:
|
| 5 |
+
dir: output/training/${rl_mode}/${env_id}/${algorithm.name}/${seed}
|
| 6 |
+
subdir: ''
|
| 7 |
+
launcher:
|
| 8 |
+
_target_: hydra._internal.core_plugins.basic_launcher.BasicLauncher
|
| 9 |
+
sweeper:
|
| 10 |
+
_target_: hydra._internal.core_plugins.basic_sweeper.BasicSweeper
|
| 11 |
+
max_batch_size: null
|
| 12 |
+
params: null
|
| 13 |
+
help:
|
| 14 |
+
app_name: ${hydra.job.name}
|
| 15 |
+
header: '${hydra.help.app_name} is powered by Hydra.
|
| 16 |
+
|
| 17 |
+
'
|
| 18 |
+
footer: 'Powered by Hydra (https://hydra.cc)
|
| 19 |
+
|
| 20 |
+
Use --hydra-help to view Hydra specific help
|
| 21 |
+
|
| 22 |
+
'
|
| 23 |
+
template: '${hydra.help.header}
|
| 24 |
+
|
| 25 |
+
== Configuration groups ==
|
| 26 |
+
|
| 27 |
+
Compose your configuration from those groups (group=option)
|
| 28 |
+
|
| 29 |
+
|
| 30 |
+
$APP_CONFIG_GROUPS
|
| 31 |
+
|
| 32 |
+
|
| 33 |
+
== Config ==
|
| 34 |
+
|
| 35 |
+
Override anything in the config (foo.bar=value)
|
| 36 |
+
|
| 37 |
+
|
| 38 |
+
$CONFIG
|
| 39 |
+
|
| 40 |
+
|
| 41 |
+
${hydra.help.footer}
|
| 42 |
+
|
| 43 |
+
'
|
| 44 |
+
hydra_help:
|
| 45 |
+
template: 'Hydra (${hydra.runtime.version})
|
| 46 |
+
|
| 47 |
+
See https://hydra.cc for more info.
|
| 48 |
+
|
| 49 |
+
|
| 50 |
+
== Flags ==
|
| 51 |
+
|
| 52 |
+
$FLAGS_HELP
|
| 53 |
+
|
| 54 |
+
|
| 55 |
+
== Configuration groups ==
|
| 56 |
+
|
| 57 |
+
Compose your configuration from those groups (For example, append hydra/job_logging=disabled
|
| 58 |
+
to command line)
|
| 59 |
+
|
| 60 |
+
|
| 61 |
+
$HYDRA_CONFIG_GROUPS
|
| 62 |
+
|
| 63 |
+
|
| 64 |
+
Use ''--cfg hydra'' to Show the Hydra config.
|
| 65 |
+
|
| 66 |
+
'
|
| 67 |
+
hydra_help: ???
|
| 68 |
+
hydra_logging:
|
| 69 |
+
version: 1
|
| 70 |
+
formatters:
|
| 71 |
+
simple:
|
| 72 |
+
format: '[%(asctime)s][HYDRA] %(message)s'
|
| 73 |
+
handlers:
|
| 74 |
+
console:
|
| 75 |
+
class: logging.StreamHandler
|
| 76 |
+
formatter: simple
|
| 77 |
+
stream: ext://sys.stdout
|
| 78 |
+
root:
|
| 79 |
+
level: INFO
|
| 80 |
+
handlers:
|
| 81 |
+
- console
|
| 82 |
+
loggers:
|
| 83 |
+
logging_example:
|
| 84 |
+
level: DEBUG
|
| 85 |
+
disable_existing_loggers: false
|
| 86 |
+
job_logging:
|
| 87 |
+
version: 1
|
| 88 |
+
formatters:
|
| 89 |
+
simple:
|
| 90 |
+
format: '[%(asctime)s][%(name)s][%(levelname)s] - %(message)s'
|
| 91 |
+
handlers:
|
| 92 |
+
console:
|
| 93 |
+
class: logging.StreamHandler
|
| 94 |
+
formatter: simple
|
| 95 |
+
stream: ext://sys.stdout
|
| 96 |
+
file:
|
| 97 |
+
class: logging.FileHandler
|
| 98 |
+
formatter: simple
|
| 99 |
+
filename: ${hydra.runtime.output_dir}/${hydra.job.name}.log
|
| 100 |
+
root:
|
| 101 |
+
level: INFO
|
| 102 |
+
handlers:
|
| 103 |
+
- console
|
| 104 |
+
- file
|
| 105 |
+
disable_existing_loggers: false
|
| 106 |
+
env: {}
|
| 107 |
+
mode: MULTIRUN
|
| 108 |
+
searchpath: []
|
| 109 |
+
callbacks: {}
|
| 110 |
+
output_subdir: .
|
| 111 |
+
overrides:
|
| 112 |
+
hydra:
|
| 113 |
+
- hydra.mode=MULTIRUN
|
| 114 |
+
task:
|
| 115 |
+
- algorithm=sb3_ppo
|
| 116 |
+
- env_id=RBC3D-easy-v0
|
| 117 |
+
- rl_mode=marl
|
| 118 |
+
- seed=4
|
| 119 |
+
job:
|
| 120 |
+
name: test_sb3
|
| 121 |
+
chdir: true
|
| 122 |
+
override_dirname: algorithm=sb3_ppo,env_id=RBC3D-easy-v0,rl_mode=marl,seed=4
|
| 123 |
+
id: ???
|
| 124 |
+
num: ???
|
| 125 |
+
config_name: test_sb3
|
| 126 |
+
env_set: {}
|
| 127 |
+
env_copy: []
|
| 128 |
+
config:
|
| 129 |
+
override_dirname:
|
| 130 |
+
kv_sep: '='
|
| 131 |
+
item_sep: ','
|
| 132 |
+
exclude_keys: []
|
| 133 |
+
runtime:
|
| 134 |
+
version: 1.3.2
|
| 135 |
+
version_base: '1.3'
|
| 136 |
+
cwd: /cephfs/users/becktepe/git_projects/FluidGym
|
| 137 |
+
config_sources:
|
| 138 |
+
- path: hydra.conf
|
| 139 |
+
schema: pkg
|
| 140 |
+
provider: hydra
|
| 141 |
+
- path: /cephfs/users/becktepe/git_projects/FluidGym/runscripts/configs
|
| 142 |
+
schema: file
|
| 143 |
+
provider: main
|
| 144 |
+
- path: hydra_plugins.hydra_colorlog.conf
|
| 145 |
+
schema: pkg
|
| 146 |
+
provider: hydra-colorlog
|
| 147 |
+
- path: ''
|
| 148 |
+
schema: structured
|
| 149 |
+
provider: schema
|
| 150 |
+
output_dir: ???
|
| 151 |
+
choices:
|
| 152 |
+
cluster: local
|
| 153 |
+
algorithm: sb3_ppo
|
| 154 |
+
hydra/env: default
|
| 155 |
+
hydra/callbacks: null
|
| 156 |
+
hydra/job_logging: default
|
| 157 |
+
hydra/hydra_logging: default
|
| 158 |
+
hydra/hydra_help: default
|
| 159 |
+
hydra/help: default
|
| 160 |
+
hydra/sweeper: basic
|
| 161 |
+
hydra/launcher: basic
|
| 162 |
+
hydra/output: default
|
| 163 |
+
verbose: false
|
| 164 |
+
env_id: RBC3D-easy-v0
|
| 165 |
+
env_kwargs: {}
|
| 166 |
+
eval_env_kwargs: {}
|
| 167 |
+
seed: 4
|
| 168 |
+
rl_mode: marl
|
| 169 |
+
total_timesteps: 50000.0
|
| 170 |
+
n_eval_steps: 10
|
| 171 |
+
eval_freq: ${eval:${total_timesteps} // ${n_eval_steps}}
|
| 172 |
+
n_eval_episodes: 1
|
| 173 |
+
continue_training: false
|
| 174 |
+
checkpoint_latest: true
|
| 175 |
+
rl_device: cpu
|
| 176 |
+
eval_callback:
|
| 177 |
+
_target_: fluidgym.integration.sb3.EvalCallback
|
| 178 |
+
eval_freq: ${eval_freq}
|
| 179 |
+
n_eval_episodes: ${n_eval_episodes}
|
| 180 |
+
use_wandb: ${wandb.enable}
|
| 181 |
+
checkpoint_latest: ${checkpoint_latest}
|
| 182 |
+
wandb:
|
| 183 |
+
enable: true
|
| 184 |
+
entity: safe-autonomous-systems
|
| 185 |
+
project: jbecktepe-fluidgym
|
| 186 |
+
algorithm:
|
| 187 |
+
name: PPO
|
| 188 |
+
obj:
|
| 189 |
+
_target_: stable_baselines3.ppo.ppo.PPO
|
| 190 |
+
policy: MlpPolicy
|
| 191 |
+
learning_rate: 0.0003
|
| 192 |
+
n_steps: 2048
|
| 193 |
+
batch_size: 64
|
| 194 |
+
n_epochs: 10
|
| 195 |
+
gamma: 0.99
|
| 196 |
+
gae_lambda: 0.95
|
| 197 |
+
clip_range: 0.2
|
| 198 |
+
clip_range_vf: null
|
| 199 |
+
normalize_advantage: true
|
| 200 |
+
ent_coef: 0.01
|
| 201 |
+
vf_coef: 0.5
|
| 202 |
+
max_grad_norm: 0.5
|
| 203 |
+
use_sde: false
|
| 204 |
+
sde_sample_freq: -1
|
| 205 |
+
rollout_buffer_class: null
|
| 206 |
+
rollout_buffer_kwargs: null
|
| 207 |
+
target_kl: null
|
| 208 |
+
stats_window_size: 100
|
| 209 |
+
tensorboard_log: null
|
| 210 |
+
verbose: 0
|
| 211 |
+
seed: ${seed}
|
| 212 |
+
device: ${rl_device}
|
| 213 |
+
_init_setup_model: true
|
| 214 |
+
cluster: {}
|
| 215 |
+
test_env_id: ${env_id}
|
| 216 |
+
test_env_kwargs: ${env_kwargs}
|
| 217 |
+
test_rl_mode: ${rl_mode}
|
| 218 |
+
n_test_episodes: 10
|
| 219 |
+
deterministic: true
|
| 220 |
+
save_frames: true
|
| 221 |
+
render_3d: true
|
4/overrides.yaml
ADDED
|
@@ -0,0 +1,4 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
- algorithm=sb3_ppo
|
| 2 |
+
- env_id=RBC3D-easy-v0
|
| 3 |
+
- rl_mode=marl
|
| 4 |
+
- seed=4
|