Upload results for PPO on RBC3D-hard-v0.
Browse filesThis view is limited to 50 files because it contains too many changes.
See raw diff
- .gitattributes +20 -0
- 0/ckpt_latest.zip +3 -0
- 0/config.yaml +58 -0
- 0/hydra.yaml +163 -0
- 0/multirun.yaml +221 -0
- 0/overrides.yaml +4 -0
- 0/test/3d_temperature_test_eval_episode_0.gif +3 -0
- 0/test/test_eval_episode_0.csv +0 -0
- 0/test/x-y-temperature_test_eval_episode_0.gif +3 -0
- 0/test/x-z-temperature_test_eval_episode_0.gif +3 -0
- 0/test/y-z-temperature_test_eval_episode_0.gif +3 -0
- 0/training_log.csv +113 -0
- 1/ckpt_latest.zip +3 -0
- 1/config.yaml +58 -0
- 1/hydra.yaml +163 -0
- 1/multirun.yaml +221 -0
- 1/overrides.yaml +4 -0
- 1/test/3d_temperature_test_eval_episode_0.gif +3 -0
- 1/test/test_eval_episode_0.csv +0 -0
- 1/test/x-y-temperature_test_eval_episode_0.gif +3 -0
- 1/test/x-z-temperature_test_eval_episode_0.gif +3 -0
- 1/test/y-z-temperature_test_eval_episode_0.gif +3 -0
- 1/training_log.csv +113 -0
- 2/ckpt_latest.zip +3 -0
- 2/config.yaml +58 -0
- 2/hydra.yaml +163 -0
- 2/multirun.yaml +221 -0
- 2/overrides.yaml +4 -0
- 2/test/3d_temperature_test_eval_episode_0.gif +3 -0
- 2/test/test_eval_episode_0.csv +0 -0
- 2/test/x-y-temperature_test_eval_episode_0.gif +3 -0
- 2/test/x-z-temperature_test_eval_episode_0.gif +3 -0
- 2/test/y-z-temperature_test_eval_episode_0.gif +3 -0
- 2/training_log.csv +113 -0
- 3/ckpt_latest.zip +3 -0
- 3/config.yaml +58 -0
- 3/hydra.yaml +163 -0
- 3/multirun.yaml +221 -0
- 3/overrides.yaml +4 -0
- 3/test/3d_temperature_test_eval_episode_0.gif +3 -0
- 3/test/test_eval_episode_0.csv +0 -0
- 3/test/x-y-temperature_test_eval_episode_0.gif +3 -0
- 3/test/x-z-temperature_test_eval_episode_0.gif +3 -0
- 3/test/y-z-temperature_test_eval_episode_0.gif +3 -0
- 3/training_log.csv +113 -0
- 4/ckpt_latest.zip +3 -0
- 4/config.yaml +58 -0
- 4/hydra.yaml +163 -0
- 4/multirun.yaml +221 -0
- 4/overrides.yaml +4 -0
.gitattributes
CHANGED
|
@@ -33,3 +33,23 @@ saved_model/**/* filter=lfs diff=lfs merge=lfs -text
|
|
| 33 |
*.zip filter=lfs diff=lfs merge=lfs -text
|
| 34 |
*.zst filter=lfs diff=lfs merge=lfs -text
|
| 35 |
*tfevents* filter=lfs diff=lfs merge=lfs -text
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 33 |
*.zip filter=lfs diff=lfs merge=lfs -text
|
| 34 |
*.zst filter=lfs diff=lfs merge=lfs -text
|
| 35 |
*tfevents* filter=lfs diff=lfs merge=lfs -text
|
| 36 |
+
0/test/3d_temperature_test_eval_episode_0.gif filter=lfs diff=lfs merge=lfs -text
|
| 37 |
+
0/test/x-y-temperature_test_eval_episode_0.gif filter=lfs diff=lfs merge=lfs -text
|
| 38 |
+
0/test/x-z-temperature_test_eval_episode_0.gif filter=lfs diff=lfs merge=lfs -text
|
| 39 |
+
0/test/y-z-temperature_test_eval_episode_0.gif filter=lfs diff=lfs merge=lfs -text
|
| 40 |
+
1/test/3d_temperature_test_eval_episode_0.gif filter=lfs diff=lfs merge=lfs -text
|
| 41 |
+
1/test/x-y-temperature_test_eval_episode_0.gif filter=lfs diff=lfs merge=lfs -text
|
| 42 |
+
1/test/x-z-temperature_test_eval_episode_0.gif filter=lfs diff=lfs merge=lfs -text
|
| 43 |
+
1/test/y-z-temperature_test_eval_episode_0.gif filter=lfs diff=lfs merge=lfs -text
|
| 44 |
+
2/test/3d_temperature_test_eval_episode_0.gif filter=lfs diff=lfs merge=lfs -text
|
| 45 |
+
2/test/x-y-temperature_test_eval_episode_0.gif filter=lfs diff=lfs merge=lfs -text
|
| 46 |
+
2/test/x-z-temperature_test_eval_episode_0.gif filter=lfs diff=lfs merge=lfs -text
|
| 47 |
+
2/test/y-z-temperature_test_eval_episode_0.gif filter=lfs diff=lfs merge=lfs -text
|
| 48 |
+
3/test/3d_temperature_test_eval_episode_0.gif filter=lfs diff=lfs merge=lfs -text
|
| 49 |
+
3/test/x-y-temperature_test_eval_episode_0.gif filter=lfs diff=lfs merge=lfs -text
|
| 50 |
+
3/test/x-z-temperature_test_eval_episode_0.gif filter=lfs diff=lfs merge=lfs -text
|
| 51 |
+
3/test/y-z-temperature_test_eval_episode_0.gif filter=lfs diff=lfs merge=lfs -text
|
| 52 |
+
4/test/3d_temperature_test_eval_episode_0.gif filter=lfs diff=lfs merge=lfs -text
|
| 53 |
+
4/test/x-y-temperature_test_eval_episode_0.gif filter=lfs diff=lfs merge=lfs -text
|
| 54 |
+
4/test/x-z-temperature_test_eval_episode_0.gif filter=lfs diff=lfs merge=lfs -text
|
| 55 |
+
4/test/y-z-temperature_test_eval_episode_0.gif filter=lfs diff=lfs merge=lfs -text
|
0/ckpt_latest.zip
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:3b9eaae34fb7084d6f0e5ef101da26b10f3cc2524a20e09cf041cece9e779656
|
| 3 |
+
size 8844014
|
0/config.yaml
ADDED
|
@@ -0,0 +1,58 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
env_id: RBC3D-hard-v0
|
| 2 |
+
env_kwargs: {}
|
| 3 |
+
eval_env_kwargs: {}
|
| 4 |
+
seed: 0
|
| 5 |
+
rl_mode: marl
|
| 6 |
+
total_timesteps: 50000.0
|
| 7 |
+
n_eval_steps: 10
|
| 8 |
+
eval_freq: ${eval:${total_timesteps} // ${n_eval_steps}}
|
| 9 |
+
n_eval_episodes: 1
|
| 10 |
+
continue_training: false
|
| 11 |
+
checkpoint_latest: true
|
| 12 |
+
rl_device: cpu
|
| 13 |
+
eval_callback:
|
| 14 |
+
_target_: fluidgym.integration.sb3.EvalCallback
|
| 15 |
+
eval_freq: ${eval_freq}
|
| 16 |
+
n_eval_episodes: ${n_eval_episodes}
|
| 17 |
+
use_wandb: ${wandb.enable}
|
| 18 |
+
checkpoint_latest: ${checkpoint_latest}
|
| 19 |
+
wandb:
|
| 20 |
+
enable: true
|
| 21 |
+
entity: safe-autonomous-systems
|
| 22 |
+
project: jbecktepe-fluidgym
|
| 23 |
+
algorithm:
|
| 24 |
+
name: PPO
|
| 25 |
+
obj:
|
| 26 |
+
_target_: stable_baselines3.ppo.ppo.PPO
|
| 27 |
+
policy: MlpPolicy
|
| 28 |
+
learning_rate: 0.0003
|
| 29 |
+
n_steps: 2048
|
| 30 |
+
batch_size: 64
|
| 31 |
+
n_epochs: 10
|
| 32 |
+
gamma: 0.99
|
| 33 |
+
gae_lambda: 0.95
|
| 34 |
+
clip_range: 0.2
|
| 35 |
+
clip_range_vf: null
|
| 36 |
+
normalize_advantage: true
|
| 37 |
+
ent_coef: 0.01
|
| 38 |
+
vf_coef: 0.5
|
| 39 |
+
max_grad_norm: 0.5
|
| 40 |
+
use_sde: false
|
| 41 |
+
sde_sample_freq: -1
|
| 42 |
+
rollout_buffer_class: null
|
| 43 |
+
rollout_buffer_kwargs: null
|
| 44 |
+
target_kl: null
|
| 45 |
+
stats_window_size: 100
|
| 46 |
+
tensorboard_log: null
|
| 47 |
+
verbose: 0
|
| 48 |
+
seed: ${seed}
|
| 49 |
+
device: ${rl_device}
|
| 50 |
+
_init_setup_model: true
|
| 51 |
+
cluster: {}
|
| 52 |
+
test_env_id: ${env_id}
|
| 53 |
+
test_env_kwargs: ${env_kwargs}
|
| 54 |
+
test_rl_mode: ${rl_mode}
|
| 55 |
+
n_test_episodes: 10
|
| 56 |
+
deterministic: true
|
| 57 |
+
save_frames: true
|
| 58 |
+
render_3d: true
|
0/hydra.yaml
ADDED
|
@@ -0,0 +1,163 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
hydra:
|
| 2 |
+
run:
|
| 3 |
+
dir: output/training/${rl_mode}/${env_id}/${algorithm.name}/${seed}
|
| 4 |
+
sweep:
|
| 5 |
+
dir: output/training/${rl_mode}/${env_id}/${algorithm.name}/${seed}
|
| 6 |
+
subdir: ''
|
| 7 |
+
launcher:
|
| 8 |
+
_target_: hydra._internal.core_plugins.basic_launcher.BasicLauncher
|
| 9 |
+
sweeper:
|
| 10 |
+
_target_: hydra._internal.core_plugins.basic_sweeper.BasicSweeper
|
| 11 |
+
max_batch_size: null
|
| 12 |
+
params: null
|
| 13 |
+
help:
|
| 14 |
+
app_name: ${hydra.job.name}
|
| 15 |
+
header: '${hydra.help.app_name} is powered by Hydra.
|
| 16 |
+
|
| 17 |
+
'
|
| 18 |
+
footer: 'Powered by Hydra (https://hydra.cc)
|
| 19 |
+
|
| 20 |
+
Use --hydra-help to view Hydra specific help
|
| 21 |
+
|
| 22 |
+
'
|
| 23 |
+
template: '${hydra.help.header}
|
| 24 |
+
|
| 25 |
+
== Configuration groups ==
|
| 26 |
+
|
| 27 |
+
Compose your configuration from those groups (group=option)
|
| 28 |
+
|
| 29 |
+
|
| 30 |
+
$APP_CONFIG_GROUPS
|
| 31 |
+
|
| 32 |
+
|
| 33 |
+
== Config ==
|
| 34 |
+
|
| 35 |
+
Override anything in the config (foo.bar=value)
|
| 36 |
+
|
| 37 |
+
|
| 38 |
+
$CONFIG
|
| 39 |
+
|
| 40 |
+
|
| 41 |
+
${hydra.help.footer}
|
| 42 |
+
|
| 43 |
+
'
|
| 44 |
+
hydra_help:
|
| 45 |
+
template: 'Hydra (${hydra.runtime.version})
|
| 46 |
+
|
| 47 |
+
See https://hydra.cc for more info.
|
| 48 |
+
|
| 49 |
+
|
| 50 |
+
== Flags ==
|
| 51 |
+
|
| 52 |
+
$FLAGS_HELP
|
| 53 |
+
|
| 54 |
+
|
| 55 |
+
== Configuration groups ==
|
| 56 |
+
|
| 57 |
+
Compose your configuration from those groups (For example, append hydra/job_logging=disabled
|
| 58 |
+
to command line)
|
| 59 |
+
|
| 60 |
+
|
| 61 |
+
$HYDRA_CONFIG_GROUPS
|
| 62 |
+
|
| 63 |
+
|
| 64 |
+
Use ''--cfg hydra'' to Show the Hydra config.
|
| 65 |
+
|
| 66 |
+
'
|
| 67 |
+
hydra_help: ???
|
| 68 |
+
hydra_logging:
|
| 69 |
+
version: 1
|
| 70 |
+
formatters:
|
| 71 |
+
simple:
|
| 72 |
+
format: '[%(asctime)s][HYDRA] %(message)s'
|
| 73 |
+
handlers:
|
| 74 |
+
console:
|
| 75 |
+
class: logging.StreamHandler
|
| 76 |
+
formatter: simple
|
| 77 |
+
stream: ext://sys.stdout
|
| 78 |
+
root:
|
| 79 |
+
level: INFO
|
| 80 |
+
handlers:
|
| 81 |
+
- console
|
| 82 |
+
loggers:
|
| 83 |
+
logging_example:
|
| 84 |
+
level: DEBUG
|
| 85 |
+
disable_existing_loggers: false
|
| 86 |
+
job_logging:
|
| 87 |
+
version: 1
|
| 88 |
+
formatters:
|
| 89 |
+
simple:
|
| 90 |
+
format: '[%(asctime)s][%(name)s][%(levelname)s] - %(message)s'
|
| 91 |
+
handlers:
|
| 92 |
+
console:
|
| 93 |
+
class: logging.StreamHandler
|
| 94 |
+
formatter: simple
|
| 95 |
+
stream: ext://sys.stdout
|
| 96 |
+
file:
|
| 97 |
+
class: logging.FileHandler
|
| 98 |
+
formatter: simple
|
| 99 |
+
filename: ${hydra.runtime.output_dir}/${hydra.job.name}.log
|
| 100 |
+
root:
|
| 101 |
+
level: INFO
|
| 102 |
+
handlers:
|
| 103 |
+
- console
|
| 104 |
+
- file
|
| 105 |
+
disable_existing_loggers: false
|
| 106 |
+
env: {}
|
| 107 |
+
mode: MULTIRUN
|
| 108 |
+
searchpath: []
|
| 109 |
+
callbacks: {}
|
| 110 |
+
output_subdir: .
|
| 111 |
+
overrides:
|
| 112 |
+
hydra:
|
| 113 |
+
- hydra.mode=MULTIRUN
|
| 114 |
+
task:
|
| 115 |
+
- algorithm=sb3_ppo
|
| 116 |
+
- env_id=RBC3D-hard-v0
|
| 117 |
+
- rl_mode=marl
|
| 118 |
+
- seed=0
|
| 119 |
+
job:
|
| 120 |
+
name: test_sb3
|
| 121 |
+
chdir: true
|
| 122 |
+
override_dirname: algorithm=sb3_ppo,env_id=RBC3D-hard-v0,rl_mode=marl,seed=0
|
| 123 |
+
id: '0'
|
| 124 |
+
num: 0
|
| 125 |
+
config_name: test_sb3
|
| 126 |
+
env_set: {}
|
| 127 |
+
env_copy: []
|
| 128 |
+
config:
|
| 129 |
+
override_dirname:
|
| 130 |
+
kv_sep: '='
|
| 131 |
+
item_sep: ','
|
| 132 |
+
exclude_keys: []
|
| 133 |
+
runtime:
|
| 134 |
+
version: 1.3.2
|
| 135 |
+
version_base: '1.3'
|
| 136 |
+
cwd: /cephfs/users/becktepe/git_projects/FluidGym
|
| 137 |
+
config_sources:
|
| 138 |
+
- path: hydra.conf
|
| 139 |
+
schema: pkg
|
| 140 |
+
provider: hydra
|
| 141 |
+
- path: /cephfs/users/becktepe/git_projects/FluidGym/runscripts/configs
|
| 142 |
+
schema: file
|
| 143 |
+
provider: main
|
| 144 |
+
- path: hydra_plugins.hydra_colorlog.conf
|
| 145 |
+
schema: pkg
|
| 146 |
+
provider: hydra-colorlog
|
| 147 |
+
- path: ''
|
| 148 |
+
schema: structured
|
| 149 |
+
provider: schema
|
| 150 |
+
output_dir: /cephfs/users/becktepe/git_projects/FluidGym/output/training/marl/RBC3D-hard-v0/PPO/0
|
| 151 |
+
choices:
|
| 152 |
+
cluster: local
|
| 153 |
+
algorithm: sb3_ppo
|
| 154 |
+
hydra/env: default
|
| 155 |
+
hydra/callbacks: null
|
| 156 |
+
hydra/job_logging: default
|
| 157 |
+
hydra/hydra_logging: default
|
| 158 |
+
hydra/hydra_help: default
|
| 159 |
+
hydra/help: default
|
| 160 |
+
hydra/sweeper: basic
|
| 161 |
+
hydra/launcher: basic
|
| 162 |
+
hydra/output: default
|
| 163 |
+
verbose: false
|
0/multirun.yaml
ADDED
|
@@ -0,0 +1,221 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
hydra:
|
| 2 |
+
run:
|
| 3 |
+
dir: output/training/${rl_mode}/${env_id}/${algorithm.name}/${seed}
|
| 4 |
+
sweep:
|
| 5 |
+
dir: output/training/${rl_mode}/${env_id}/${algorithm.name}/${seed}
|
| 6 |
+
subdir: ''
|
| 7 |
+
launcher:
|
| 8 |
+
_target_: hydra._internal.core_plugins.basic_launcher.BasicLauncher
|
| 9 |
+
sweeper:
|
| 10 |
+
_target_: hydra._internal.core_plugins.basic_sweeper.BasicSweeper
|
| 11 |
+
max_batch_size: null
|
| 12 |
+
params: null
|
| 13 |
+
help:
|
| 14 |
+
app_name: ${hydra.job.name}
|
| 15 |
+
header: '${hydra.help.app_name} is powered by Hydra.
|
| 16 |
+
|
| 17 |
+
'
|
| 18 |
+
footer: 'Powered by Hydra (https://hydra.cc)
|
| 19 |
+
|
| 20 |
+
Use --hydra-help to view Hydra specific help
|
| 21 |
+
|
| 22 |
+
'
|
| 23 |
+
template: '${hydra.help.header}
|
| 24 |
+
|
| 25 |
+
== Configuration groups ==
|
| 26 |
+
|
| 27 |
+
Compose your configuration from those groups (group=option)
|
| 28 |
+
|
| 29 |
+
|
| 30 |
+
$APP_CONFIG_GROUPS
|
| 31 |
+
|
| 32 |
+
|
| 33 |
+
== Config ==
|
| 34 |
+
|
| 35 |
+
Override anything in the config (foo.bar=value)
|
| 36 |
+
|
| 37 |
+
|
| 38 |
+
$CONFIG
|
| 39 |
+
|
| 40 |
+
|
| 41 |
+
${hydra.help.footer}
|
| 42 |
+
|
| 43 |
+
'
|
| 44 |
+
hydra_help:
|
| 45 |
+
template: 'Hydra (${hydra.runtime.version})
|
| 46 |
+
|
| 47 |
+
See https://hydra.cc for more info.
|
| 48 |
+
|
| 49 |
+
|
| 50 |
+
== Flags ==
|
| 51 |
+
|
| 52 |
+
$FLAGS_HELP
|
| 53 |
+
|
| 54 |
+
|
| 55 |
+
== Configuration groups ==
|
| 56 |
+
|
| 57 |
+
Compose your configuration from those groups (For example, append hydra/job_logging=disabled
|
| 58 |
+
to command line)
|
| 59 |
+
|
| 60 |
+
|
| 61 |
+
$HYDRA_CONFIG_GROUPS
|
| 62 |
+
|
| 63 |
+
|
| 64 |
+
Use ''--cfg hydra'' to Show the Hydra config.
|
| 65 |
+
|
| 66 |
+
'
|
| 67 |
+
hydra_help: ???
|
| 68 |
+
hydra_logging:
|
| 69 |
+
version: 1
|
| 70 |
+
formatters:
|
| 71 |
+
simple:
|
| 72 |
+
format: '[%(asctime)s][HYDRA] %(message)s'
|
| 73 |
+
handlers:
|
| 74 |
+
console:
|
| 75 |
+
class: logging.StreamHandler
|
| 76 |
+
formatter: simple
|
| 77 |
+
stream: ext://sys.stdout
|
| 78 |
+
root:
|
| 79 |
+
level: INFO
|
| 80 |
+
handlers:
|
| 81 |
+
- console
|
| 82 |
+
loggers:
|
| 83 |
+
logging_example:
|
| 84 |
+
level: DEBUG
|
| 85 |
+
disable_existing_loggers: false
|
| 86 |
+
job_logging:
|
| 87 |
+
version: 1
|
| 88 |
+
formatters:
|
| 89 |
+
simple:
|
| 90 |
+
format: '[%(asctime)s][%(name)s][%(levelname)s] - %(message)s'
|
| 91 |
+
handlers:
|
| 92 |
+
console:
|
| 93 |
+
class: logging.StreamHandler
|
| 94 |
+
formatter: simple
|
| 95 |
+
stream: ext://sys.stdout
|
| 96 |
+
file:
|
| 97 |
+
class: logging.FileHandler
|
| 98 |
+
formatter: simple
|
| 99 |
+
filename: ${hydra.runtime.output_dir}/${hydra.job.name}.log
|
| 100 |
+
root:
|
| 101 |
+
level: INFO
|
| 102 |
+
handlers:
|
| 103 |
+
- console
|
| 104 |
+
- file
|
| 105 |
+
disable_existing_loggers: false
|
| 106 |
+
env: {}
|
| 107 |
+
mode: MULTIRUN
|
| 108 |
+
searchpath: []
|
| 109 |
+
callbacks: {}
|
| 110 |
+
output_subdir: .
|
| 111 |
+
overrides:
|
| 112 |
+
hydra:
|
| 113 |
+
- hydra.mode=MULTIRUN
|
| 114 |
+
task:
|
| 115 |
+
- algorithm=sb3_ppo
|
| 116 |
+
- env_id=RBC3D-hard-v0
|
| 117 |
+
- rl_mode=marl
|
| 118 |
+
- seed=0
|
| 119 |
+
job:
|
| 120 |
+
name: test_sb3
|
| 121 |
+
chdir: true
|
| 122 |
+
override_dirname: algorithm=sb3_ppo,env_id=RBC3D-hard-v0,rl_mode=marl,seed=0
|
| 123 |
+
id: ???
|
| 124 |
+
num: ???
|
| 125 |
+
config_name: test_sb3
|
| 126 |
+
env_set: {}
|
| 127 |
+
env_copy: []
|
| 128 |
+
config:
|
| 129 |
+
override_dirname:
|
| 130 |
+
kv_sep: '='
|
| 131 |
+
item_sep: ','
|
| 132 |
+
exclude_keys: []
|
| 133 |
+
runtime:
|
| 134 |
+
version: 1.3.2
|
| 135 |
+
version_base: '1.3'
|
| 136 |
+
cwd: /cephfs/users/becktepe/git_projects/FluidGym
|
| 137 |
+
config_sources:
|
| 138 |
+
- path: hydra.conf
|
| 139 |
+
schema: pkg
|
| 140 |
+
provider: hydra
|
| 141 |
+
- path: /cephfs/users/becktepe/git_projects/FluidGym/runscripts/configs
|
| 142 |
+
schema: file
|
| 143 |
+
provider: main
|
| 144 |
+
- path: hydra_plugins.hydra_colorlog.conf
|
| 145 |
+
schema: pkg
|
| 146 |
+
provider: hydra-colorlog
|
| 147 |
+
- path: ''
|
| 148 |
+
schema: structured
|
| 149 |
+
provider: schema
|
| 150 |
+
output_dir: ???
|
| 151 |
+
choices:
|
| 152 |
+
cluster: local
|
| 153 |
+
algorithm: sb3_ppo
|
| 154 |
+
hydra/env: default
|
| 155 |
+
hydra/callbacks: null
|
| 156 |
+
hydra/job_logging: default
|
| 157 |
+
hydra/hydra_logging: default
|
| 158 |
+
hydra/hydra_help: default
|
| 159 |
+
hydra/help: default
|
| 160 |
+
hydra/sweeper: basic
|
| 161 |
+
hydra/launcher: basic
|
| 162 |
+
hydra/output: default
|
| 163 |
+
verbose: false
|
| 164 |
+
env_id: RBC3D-hard-v0
|
| 165 |
+
env_kwargs: {}
|
| 166 |
+
eval_env_kwargs: {}
|
| 167 |
+
seed: 0
|
| 168 |
+
rl_mode: marl
|
| 169 |
+
total_timesteps: 50000.0
|
| 170 |
+
n_eval_steps: 10
|
| 171 |
+
eval_freq: ${eval:${total_timesteps} // ${n_eval_steps}}
|
| 172 |
+
n_eval_episodes: 1
|
| 173 |
+
continue_training: false
|
| 174 |
+
checkpoint_latest: true
|
| 175 |
+
rl_device: cpu
|
| 176 |
+
eval_callback:
|
| 177 |
+
_target_: fluidgym.integration.sb3.EvalCallback
|
| 178 |
+
eval_freq: ${eval_freq}
|
| 179 |
+
n_eval_episodes: ${n_eval_episodes}
|
| 180 |
+
use_wandb: ${wandb.enable}
|
| 181 |
+
checkpoint_latest: ${checkpoint_latest}
|
| 182 |
+
wandb:
|
| 183 |
+
enable: true
|
| 184 |
+
entity: safe-autonomous-systems
|
| 185 |
+
project: jbecktepe-fluidgym
|
| 186 |
+
algorithm:
|
| 187 |
+
name: PPO
|
| 188 |
+
obj:
|
| 189 |
+
_target_: stable_baselines3.ppo.ppo.PPO
|
| 190 |
+
policy: MlpPolicy
|
| 191 |
+
learning_rate: 0.0003
|
| 192 |
+
n_steps: 2048
|
| 193 |
+
batch_size: 64
|
| 194 |
+
n_epochs: 10
|
| 195 |
+
gamma: 0.99
|
| 196 |
+
gae_lambda: 0.95
|
| 197 |
+
clip_range: 0.2
|
| 198 |
+
clip_range_vf: null
|
| 199 |
+
normalize_advantage: true
|
| 200 |
+
ent_coef: 0.01
|
| 201 |
+
vf_coef: 0.5
|
| 202 |
+
max_grad_norm: 0.5
|
| 203 |
+
use_sde: false
|
| 204 |
+
sde_sample_freq: -1
|
| 205 |
+
rollout_buffer_class: null
|
| 206 |
+
rollout_buffer_kwargs: null
|
| 207 |
+
target_kl: null
|
| 208 |
+
stats_window_size: 100
|
| 209 |
+
tensorboard_log: null
|
| 210 |
+
verbose: 0
|
| 211 |
+
seed: ${seed}
|
| 212 |
+
device: ${rl_device}
|
| 213 |
+
_init_setup_model: true
|
| 214 |
+
cluster: {}
|
| 215 |
+
test_env_id: ${env_id}
|
| 216 |
+
test_env_kwargs: ${env_kwargs}
|
| 217 |
+
test_rl_mode: ${rl_mode}
|
| 218 |
+
n_test_episodes: 10
|
| 219 |
+
deterministic: true
|
| 220 |
+
save_frames: true
|
| 221 |
+
render_3d: true
|
0/overrides.yaml
ADDED
|
@@ -0,0 +1,4 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
- algorithm=sb3_ppo
|
| 2 |
+
- env_id=RBC3D-hard-v0
|
| 3 |
+
- rl_mode=marl
|
| 4 |
+
- seed=0
|
0/test/3d_temperature_test_eval_episode_0.gif
ADDED
|
Git LFS Details
|
0/test/test_eval_episode_0.csv
ADDED
|
The diff for this file is too large to render.
See raw diff
|
|
|
0/test/x-y-temperature_test_eval_episode_0.gif
ADDED
|
Git LFS Details
|
0/test/x-z-temperature_test_eval_episode_0.gif
ADDED
|
Git LFS Details
|
0/test/y-z-temperature_test_eval_episode_0.gif
ADDED
|
Git LFS Details
|
0/training_log.csv
ADDED
|
@@ -0,0 +1,113 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
step,training/mean_reward,training/mean_global_reward,training/mean_nusselt,evaluation/mean_nusselt,evaluation/mean_reward
|
| 2 |
+
500,-0.10074600577354431,-0.10074600219726562,2.784679016113281,,
|
| 3 |
+
1000,-0.10750137269496918,-0.10750137758255005,2.7914344000816347,,
|
| 4 |
+
1500,-0.10830755531787872,-0.10830755472183227,2.792240581035614,,
|
| 5 |
+
2000,-0.11602842062711716,-0.11602842330932617,2.7999614520072935,,
|
| 6 |
+
2500,-0.06680159270763397,-0.06680158758163453,2.750734609127045,,
|
| 7 |
+
3000,-0.06723300367593765,-0.06723300170898437,2.7511660237312316,,
|
| 8 |
+
3500,-0.06557369232177734,-0.0655736894607544,2.7495067138671874,,
|
| 9 |
+
4000,-0.052346404641866684,-0.05234640645980835,2.736279424190521,,
|
| 10 |
+
4500,-0.022079044952988625,-0.022079044342041016,2.706012069225311,,
|
| 11 |
+
5000,-0.00836993008852005,-0.008369930267333984,2.692302949428558,,
|
| 12 |
+
5000,,,,2.565404303073883,0.11852870881557465
|
| 13 |
+
5500,-0.007670428138226271,-0.007670429229736328,2.691603446006775,,
|
| 14 |
+
6000,-0.012983032502233982,-0.0129830322265625,2.696916058063507,,
|
| 15 |
+
6500,0.03490367531776428,0.03490367126464844,2.6490293483734133,,
|
| 16 |
+
7000,0.03069969266653061,0.030699689388275147,2.6532333397865298,,
|
| 17 |
+
7500,0.04590260982513428,0.04590260601043701,2.6380304102897645,,
|
| 18 |
+
8000,0.025222130119800568,0.025222130298614504,2.6587108907699584,,
|
| 19 |
+
8500,0.08284736424684525,0.08284737539291381,2.6010856499671937,,
|
| 20 |
+
9000,0.053213827311992645,0.05321382856369018,2.630719202041626,,
|
| 21 |
+
9500,0.08383308351039886,0.08383309078216553,2.6000999336242674,,
|
| 22 |
+
10000,0.07237756997346878,0.07237756967544556,2.6115554399490355,,
|
| 23 |
+
10000,,,,2.4589192938804625,0.22501373291015625
|
| 24 |
+
10500,0.08914630115032196,0.08914629411697388,2.594786721229553,,
|
| 25 |
+
11000,0.08439309895038605,0.08439310836791993,2.5995399141311646,,
|
| 26 |
+
11500,0.10192469507455826,0.10192470073699951,2.58200830745697,,
|
| 27 |
+
12000,0.08661293238401413,0.08661292743682861,2.597320079803467,,
|
| 28 |
+
12500,0.12497540563344955,0.12497540521621704,2.558957621097565,,
|
| 29 |
+
13000,0.1426006555557251,0.1426006531715393,2.5413323683738707,,
|
| 30 |
+
13500,0.1356959491968155,0.13569596958160401,2.5482370529174805,,
|
| 31 |
+
14000,0.1298772394657135,0.1298772439956665,2.5540557861328126,,
|
| 32 |
+
14500,0.16607566177845,0.16607566213607788,2.5178573656082155,,
|
| 33 |
+
15000,0.17794467508792877,0.1779446711540222,2.5059883427619933,,
|
| 34 |
+
15000,,,,2.4145771539211274,0.2693558633327484
|
| 35 |
+
15500,0.15924221277236938,0.1592422308921814,2.524690779209137,,
|
| 36 |
+
16000,0.16067063808441162,0.16067063331604003,2.5232623801231386,,
|
| 37 |
+
16500,0.15645666420459747,0.15645665645599366,2.5274763593673706,,
|
| 38 |
+
17000,0.16588103771209717,0.16588104152679442,2.5180519647598265,,
|
| 39 |
+
17500,0.16006910800933838,0.16006911277770997,2.523863911628723,,
|
| 40 |
+
18000,0.16735291481018066,0.16735291481018066,2.5165800919532777,,
|
| 41 |
+
18500,0.1653919368982315,0.165391948223114,2.5185410709381104,,
|
| 42 |
+
19000,0.1637827455997467,0.16378274488449096,2.520150289058685,,
|
| 43 |
+
19500,0.1417253166437149,0.1417253041267395,2.542207706451416,,
|
| 44 |
+
20000,0.1691184937953949,0.16911850500106812,2.5148145151138306,,
|
| 45 |
+
20000,,,,2.4566838908195496,0.2272491157054901
|
| 46 |
+
20500,0.15669000148773193,0.15669000339508057,2.5272430062294005,,
|
| 47 |
+
21000,0.17573927342891693,0.17573927116394042,2.508193745136261,,
|
| 48 |
+
21500,0.19506603479385376,0.1950660424232483,2.488866970539093,,
|
| 49 |
+
22000,0.17852602899074554,0.17852605152130127,2.505406970024109,,
|
| 50 |
+
22500,0.16643597185611725,0.1664359803199768,2.5174970302581787,,
|
| 51 |
+
23000,0.1826682835817337,0.18266830825805663,2.5012647032737734,,
|
| 52 |
+
23500,0.16517524421215057,0.16517525148391723,2.5187577629089355,,
|
| 53 |
+
24000,0.16866226494312286,0.16866226291656494,2.5152707438468935,,
|
| 54 |
+
24500,0.1743609607219696,0.174360963344574,2.509572049617767,,
|
| 55 |
+
25000,0.176267609000206,0.17626760292053223,2.5076654200553894,,
|
| 56 |
+
25000,,,,2.399750442504883,0.2841825783252716
|
| 57 |
+
25500,0.18474359810352325,0.18474358224868775,2.4991894330978393,,
|
| 58 |
+
26000,0.1789006143808365,0.1789006209373474,2.505032401561737,,
|
| 59 |
+
26500,0.1618911772966385,0.16189117240905762,2.522041845321655,,
|
| 60 |
+
27000,0.1676018387079239,0.16760185194015503,2.51633118057251,,
|
| 61 |
+
27500,0.1773589551448822,0.17735894727706908,2.506574081897736,,
|
| 62 |
+
28000,0.1582452803850174,0.15824528646469116,2.5256877455711364,,
|
| 63 |
+
28500,0.16940654814243317,0.1694065375328064,2.5145264859199523,,
|
| 64 |
+
29000,0.15190376341342926,0.15190376949310302,2.5320292510986326,,
|
| 65 |
+
29500,0.17523349821567535,0.17523350048065187,2.508699508666992,,
|
| 66 |
+
30000,0.1856042444705963,0.18560425329208374,2.498328766822815,,
|
| 67 |
+
30000,,,,2.4056684279441836,0.278264582157135
|
| 68 |
+
30500,0.1941879391670227,0.19418793773651122,2.4897450890541077,,
|
| 69 |
+
31000,0.19270305335521698,0.19270305347442626,2.4912299642562865,,
|
| 70 |
+
31500,0.19111241400241852,0.19111242198944092,2.4928206024169923,,
|
| 71 |
+
32000,0.16077271103858948,0.1607727041244507,2.523160322189331,,
|
| 72 |
+
32500,0.16405007243156433,0.16405008029937745,2.519882930278778,,
|
| 73 |
+
33000,0.18354669213294983,0.1835467004776001,2.5003863077163695,,
|
| 74 |
+
33500,0.1801392138004303,0.18013920116424562,2.50379381275177,,
|
| 75 |
+
34000,0.19439882040023804,0.19439882564544678,2.4895341930389403,,
|
| 76 |
+
34500,0.19212979078292847,0.19212979078292847,2.491803234577179,,
|
| 77 |
+
35000,0.1954958736896515,0.19549587059020995,2.488437156200409,,
|
| 78 |
+
35000,,,,2.356049635410309,0.32788336277008057
|
| 79 |
+
35500,0.21499569714069366,0.21499570226669312,2.468937307357788,,
|
| 80 |
+
36000,0.21124346554279327,0.21124345016479493,2.4726895661354065,,
|
| 81 |
+
36500,0.20752598345279694,0.20752599573135375,2.476407031059265,,
|
| 82 |
+
37000,0.21055419743061066,0.21055419969558717,2.473378821372986,,
|
| 83 |
+
37500,0.2258177548646927,0.22581775331497192,2.458115259647369,,
|
| 84 |
+
38000,0.20166325569152832,0.20166324758529663,2.4822697677612306,,
|
| 85 |
+
38500,0.21620073914527893,0.2162007517814636,2.4677322692871093,,
|
| 86 |
+
39000,0.21526534855365753,0.21526534271240233,2.4686676750183105,,
|
| 87 |
+
39500,0.20817309617996216,0.20817307901382445,2.4757599391937255,,
|
| 88 |
+
40000,0.18888385593891144,0.18888387346267702,2.495049153804779,,
|
| 89 |
+
40000,,,,2.337438405752182,0.3464946150779724
|
| 90 |
+
40500,0.19457577168941498,0.19457576274871827,2.4893572511672972,,
|
| 91 |
+
41000,0.1973281353712082,0.19732813501358032,2.4866048889160157,,
|
| 92 |
+
41500,0.19428549706935883,0.19428550386428833,2.4896475172042845,,
|
| 93 |
+
42000,0.1908634901046753,0.19086349534988403,2.493069539070129,,
|
| 94 |
+
42500,0.21259050071239471,0.21259049797058105,2.47134250497818,,
|
| 95 |
+
43000,0.20513397455215454,0.20513396549224855,2.4787990527153014,,
|
| 96 |
+
43500,0.20687155425548553,0.20687157678604126,2.4770614485740663,,
|
| 97 |
+
44000,0.18525445461273193,0.18525446462631226,2.498678565502167,,
|
| 98 |
+
44500,0.1916533261537552,0.19165331506729125,2.492279703617096,,
|
| 99 |
+
45000,0.2218555212020874,0.2218555226325989,2.462077509403229,,
|
| 100 |
+
45000,,,,2.337412050962448,0.34652096033096313
|
| 101 |
+
45500,0.21687276661396027,0.21687277126312257,2.4670602412223817,,
|
| 102 |
+
46000,0.1903662085533142,0.1903662166595459,2.493566804885864,,
|
| 103 |
+
46500,0.1969374120235443,0.19693740940093993,2.4869956164360048,,
|
| 104 |
+
47000,0.19990095496177673,0.19990095901489258,2.484032061576843,,
|
| 105 |
+
47500,0.18451529741287231,0.18451531457901002,2.4994176983833314,,
|
| 106 |
+
48000,0.18876561522483826,0.18876562118530274,2.495167398929596,,
|
| 107 |
+
48500,0.20362871885299683,0.20362872743606567,2.4803042974472045,,
|
| 108 |
+
49000,0.19015999138355255,0.19015997314453126,2.4937730469703676,,
|
| 109 |
+
49500,0.21316726505756378,0.21316725444793702,2.4707657566070558,,
|
| 110 |
+
50000,0.19966915249824524,0.19966918420791627,2.484263837814331,,
|
| 111 |
+
50000,,,,2.340068511962891,0.3438645005226135
|
| 112 |
+
50500,0.21618828177452087,0.21618830347061158,2.467744723320007,,
|
| 113 |
+
51000,0.19877077639102936,0.19877078580856322,2.48516223192215,,
|
1/ckpt_latest.zip
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:966d9253a8b5475e5d100f965dff496da6ca2e9620824b960265c398ea8789d7
|
| 3 |
+
size 8844018
|
1/config.yaml
ADDED
|
@@ -0,0 +1,58 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
env_id: RBC3D-hard-v0
|
| 2 |
+
env_kwargs: {}
|
| 3 |
+
eval_env_kwargs: {}
|
| 4 |
+
seed: 1
|
| 5 |
+
rl_mode: marl
|
| 6 |
+
total_timesteps: 50000.0
|
| 7 |
+
n_eval_steps: 10
|
| 8 |
+
eval_freq: ${eval:${total_timesteps} // ${n_eval_steps}}
|
| 9 |
+
n_eval_episodes: 1
|
| 10 |
+
continue_training: false
|
| 11 |
+
checkpoint_latest: true
|
| 12 |
+
rl_device: cpu
|
| 13 |
+
eval_callback:
|
| 14 |
+
_target_: fluidgym.integration.sb3.EvalCallback
|
| 15 |
+
eval_freq: ${eval_freq}
|
| 16 |
+
n_eval_episodes: ${n_eval_episodes}
|
| 17 |
+
use_wandb: ${wandb.enable}
|
| 18 |
+
checkpoint_latest: ${checkpoint_latest}
|
| 19 |
+
wandb:
|
| 20 |
+
enable: true
|
| 21 |
+
entity: safe-autonomous-systems
|
| 22 |
+
project: jbecktepe-fluidgym
|
| 23 |
+
algorithm:
|
| 24 |
+
name: PPO
|
| 25 |
+
obj:
|
| 26 |
+
_target_: stable_baselines3.ppo.ppo.PPO
|
| 27 |
+
policy: MlpPolicy
|
| 28 |
+
learning_rate: 0.0003
|
| 29 |
+
n_steps: 2048
|
| 30 |
+
batch_size: 64
|
| 31 |
+
n_epochs: 10
|
| 32 |
+
gamma: 0.99
|
| 33 |
+
gae_lambda: 0.95
|
| 34 |
+
clip_range: 0.2
|
| 35 |
+
clip_range_vf: null
|
| 36 |
+
normalize_advantage: true
|
| 37 |
+
ent_coef: 0.01
|
| 38 |
+
vf_coef: 0.5
|
| 39 |
+
max_grad_norm: 0.5
|
| 40 |
+
use_sde: false
|
| 41 |
+
sde_sample_freq: -1
|
| 42 |
+
rollout_buffer_class: null
|
| 43 |
+
rollout_buffer_kwargs: null
|
| 44 |
+
target_kl: null
|
| 45 |
+
stats_window_size: 100
|
| 46 |
+
tensorboard_log: null
|
| 47 |
+
verbose: 0
|
| 48 |
+
seed: ${seed}
|
| 49 |
+
device: ${rl_device}
|
| 50 |
+
_init_setup_model: true
|
| 51 |
+
cluster: {}
|
| 52 |
+
test_env_id: ${env_id}
|
| 53 |
+
test_env_kwargs: ${env_kwargs}
|
| 54 |
+
test_rl_mode: ${rl_mode}
|
| 55 |
+
n_test_episodes: 10
|
| 56 |
+
deterministic: true
|
| 57 |
+
save_frames: true
|
| 58 |
+
render_3d: true
|
1/hydra.yaml
ADDED
|
@@ -0,0 +1,163 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
hydra:
|
| 2 |
+
run:
|
| 3 |
+
dir: output/training/${rl_mode}/${env_id}/${algorithm.name}/${seed}
|
| 4 |
+
sweep:
|
| 5 |
+
dir: output/training/${rl_mode}/${env_id}/${algorithm.name}/${seed}
|
| 6 |
+
subdir: ''
|
| 7 |
+
launcher:
|
| 8 |
+
_target_: hydra._internal.core_plugins.basic_launcher.BasicLauncher
|
| 9 |
+
sweeper:
|
| 10 |
+
_target_: hydra._internal.core_plugins.basic_sweeper.BasicSweeper
|
| 11 |
+
max_batch_size: null
|
| 12 |
+
params: null
|
| 13 |
+
help:
|
| 14 |
+
app_name: ${hydra.job.name}
|
| 15 |
+
header: '${hydra.help.app_name} is powered by Hydra.
|
| 16 |
+
|
| 17 |
+
'
|
| 18 |
+
footer: 'Powered by Hydra (https://hydra.cc)
|
| 19 |
+
|
| 20 |
+
Use --hydra-help to view Hydra specific help
|
| 21 |
+
|
| 22 |
+
'
|
| 23 |
+
template: '${hydra.help.header}
|
| 24 |
+
|
| 25 |
+
== Configuration groups ==
|
| 26 |
+
|
| 27 |
+
Compose your configuration from those groups (group=option)
|
| 28 |
+
|
| 29 |
+
|
| 30 |
+
$APP_CONFIG_GROUPS
|
| 31 |
+
|
| 32 |
+
|
| 33 |
+
== Config ==
|
| 34 |
+
|
| 35 |
+
Override anything in the config (foo.bar=value)
|
| 36 |
+
|
| 37 |
+
|
| 38 |
+
$CONFIG
|
| 39 |
+
|
| 40 |
+
|
| 41 |
+
${hydra.help.footer}
|
| 42 |
+
|
| 43 |
+
'
|
| 44 |
+
hydra_help:
|
| 45 |
+
template: 'Hydra (${hydra.runtime.version})
|
| 46 |
+
|
| 47 |
+
See https://hydra.cc for more info.
|
| 48 |
+
|
| 49 |
+
|
| 50 |
+
== Flags ==
|
| 51 |
+
|
| 52 |
+
$FLAGS_HELP
|
| 53 |
+
|
| 54 |
+
|
| 55 |
+
== Configuration groups ==
|
| 56 |
+
|
| 57 |
+
Compose your configuration from those groups (For example, append hydra/job_logging=disabled
|
| 58 |
+
to command line)
|
| 59 |
+
|
| 60 |
+
|
| 61 |
+
$HYDRA_CONFIG_GROUPS
|
| 62 |
+
|
| 63 |
+
|
| 64 |
+
Use ''--cfg hydra'' to Show the Hydra config.
|
| 65 |
+
|
| 66 |
+
'
|
| 67 |
+
hydra_help: ???
|
| 68 |
+
hydra_logging:
|
| 69 |
+
version: 1
|
| 70 |
+
formatters:
|
| 71 |
+
simple:
|
| 72 |
+
format: '[%(asctime)s][HYDRA] %(message)s'
|
| 73 |
+
handlers:
|
| 74 |
+
console:
|
| 75 |
+
class: logging.StreamHandler
|
| 76 |
+
formatter: simple
|
| 77 |
+
stream: ext://sys.stdout
|
| 78 |
+
root:
|
| 79 |
+
level: INFO
|
| 80 |
+
handlers:
|
| 81 |
+
- console
|
| 82 |
+
loggers:
|
| 83 |
+
logging_example:
|
| 84 |
+
level: DEBUG
|
| 85 |
+
disable_existing_loggers: false
|
| 86 |
+
job_logging:
|
| 87 |
+
version: 1
|
| 88 |
+
formatters:
|
| 89 |
+
simple:
|
| 90 |
+
format: '[%(asctime)s][%(name)s][%(levelname)s] - %(message)s'
|
| 91 |
+
handlers:
|
| 92 |
+
console:
|
| 93 |
+
class: logging.StreamHandler
|
| 94 |
+
formatter: simple
|
| 95 |
+
stream: ext://sys.stdout
|
| 96 |
+
file:
|
| 97 |
+
class: logging.FileHandler
|
| 98 |
+
formatter: simple
|
| 99 |
+
filename: ${hydra.runtime.output_dir}/${hydra.job.name}.log
|
| 100 |
+
root:
|
| 101 |
+
level: INFO
|
| 102 |
+
handlers:
|
| 103 |
+
- console
|
| 104 |
+
- file
|
| 105 |
+
disable_existing_loggers: false
|
| 106 |
+
env: {}
|
| 107 |
+
mode: MULTIRUN
|
| 108 |
+
searchpath: []
|
| 109 |
+
callbacks: {}
|
| 110 |
+
output_subdir: .
|
| 111 |
+
overrides:
|
| 112 |
+
hydra:
|
| 113 |
+
- hydra.mode=MULTIRUN
|
| 114 |
+
task:
|
| 115 |
+
- algorithm=sb3_ppo
|
| 116 |
+
- env_id=RBC3D-hard-v0
|
| 117 |
+
- rl_mode=marl
|
| 118 |
+
- seed=1
|
| 119 |
+
job:
|
| 120 |
+
name: test_sb3
|
| 121 |
+
chdir: true
|
| 122 |
+
override_dirname: algorithm=sb3_ppo,env_id=RBC3D-hard-v0,rl_mode=marl,seed=1
|
| 123 |
+
id: '0'
|
| 124 |
+
num: 0
|
| 125 |
+
config_name: test_sb3
|
| 126 |
+
env_set: {}
|
| 127 |
+
env_copy: []
|
| 128 |
+
config:
|
| 129 |
+
override_dirname:
|
| 130 |
+
kv_sep: '='
|
| 131 |
+
item_sep: ','
|
| 132 |
+
exclude_keys: []
|
| 133 |
+
runtime:
|
| 134 |
+
version: 1.3.2
|
| 135 |
+
version_base: '1.3'
|
| 136 |
+
cwd: /cephfs/users/becktepe/git_projects/FluidGym
|
| 137 |
+
config_sources:
|
| 138 |
+
- path: hydra.conf
|
| 139 |
+
schema: pkg
|
| 140 |
+
provider: hydra
|
| 141 |
+
- path: /cephfs/users/becktepe/git_projects/FluidGym/runscripts/configs
|
| 142 |
+
schema: file
|
| 143 |
+
provider: main
|
| 144 |
+
- path: hydra_plugins.hydra_colorlog.conf
|
| 145 |
+
schema: pkg
|
| 146 |
+
provider: hydra-colorlog
|
| 147 |
+
- path: ''
|
| 148 |
+
schema: structured
|
| 149 |
+
provider: schema
|
| 150 |
+
output_dir: /cephfs/users/becktepe/git_projects/FluidGym/output/training/marl/RBC3D-hard-v0/PPO/1
|
| 151 |
+
choices:
|
| 152 |
+
cluster: local
|
| 153 |
+
algorithm: sb3_ppo
|
| 154 |
+
hydra/env: default
|
| 155 |
+
hydra/callbacks: null
|
| 156 |
+
hydra/job_logging: default
|
| 157 |
+
hydra/hydra_logging: default
|
| 158 |
+
hydra/hydra_help: default
|
| 159 |
+
hydra/help: default
|
| 160 |
+
hydra/sweeper: basic
|
| 161 |
+
hydra/launcher: basic
|
| 162 |
+
hydra/output: default
|
| 163 |
+
verbose: false
|
1/multirun.yaml
ADDED
|
@@ -0,0 +1,221 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
hydra:
|
| 2 |
+
run:
|
| 3 |
+
dir: output/training/${rl_mode}/${env_id}/${algorithm.name}/${seed}
|
| 4 |
+
sweep:
|
| 5 |
+
dir: output/training/${rl_mode}/${env_id}/${algorithm.name}/${seed}
|
| 6 |
+
subdir: ''
|
| 7 |
+
launcher:
|
| 8 |
+
_target_: hydra._internal.core_plugins.basic_launcher.BasicLauncher
|
| 9 |
+
sweeper:
|
| 10 |
+
_target_: hydra._internal.core_plugins.basic_sweeper.BasicSweeper
|
| 11 |
+
max_batch_size: null
|
| 12 |
+
params: null
|
| 13 |
+
help:
|
| 14 |
+
app_name: ${hydra.job.name}
|
| 15 |
+
header: '${hydra.help.app_name} is powered by Hydra.
|
| 16 |
+
|
| 17 |
+
'
|
| 18 |
+
footer: 'Powered by Hydra (https://hydra.cc)
|
| 19 |
+
|
| 20 |
+
Use --hydra-help to view Hydra specific help
|
| 21 |
+
|
| 22 |
+
'
|
| 23 |
+
template: '${hydra.help.header}
|
| 24 |
+
|
| 25 |
+
== Configuration groups ==
|
| 26 |
+
|
| 27 |
+
Compose your configuration from those groups (group=option)
|
| 28 |
+
|
| 29 |
+
|
| 30 |
+
$APP_CONFIG_GROUPS
|
| 31 |
+
|
| 32 |
+
|
| 33 |
+
== Config ==
|
| 34 |
+
|
| 35 |
+
Override anything in the config (foo.bar=value)
|
| 36 |
+
|
| 37 |
+
|
| 38 |
+
$CONFIG
|
| 39 |
+
|
| 40 |
+
|
| 41 |
+
${hydra.help.footer}
|
| 42 |
+
|
| 43 |
+
'
|
| 44 |
+
hydra_help:
|
| 45 |
+
template: 'Hydra (${hydra.runtime.version})
|
| 46 |
+
|
| 47 |
+
See https://hydra.cc for more info.
|
| 48 |
+
|
| 49 |
+
|
| 50 |
+
== Flags ==
|
| 51 |
+
|
| 52 |
+
$FLAGS_HELP
|
| 53 |
+
|
| 54 |
+
|
| 55 |
+
== Configuration groups ==
|
| 56 |
+
|
| 57 |
+
Compose your configuration from those groups (For example, append hydra/job_logging=disabled
|
| 58 |
+
to command line)
|
| 59 |
+
|
| 60 |
+
|
| 61 |
+
$HYDRA_CONFIG_GROUPS
|
| 62 |
+
|
| 63 |
+
|
| 64 |
+
Use ''--cfg hydra'' to Show the Hydra config.
|
| 65 |
+
|
| 66 |
+
'
|
| 67 |
+
hydra_help: ???
|
| 68 |
+
hydra_logging:
|
| 69 |
+
version: 1
|
| 70 |
+
formatters:
|
| 71 |
+
simple:
|
| 72 |
+
format: '[%(asctime)s][HYDRA] %(message)s'
|
| 73 |
+
handlers:
|
| 74 |
+
console:
|
| 75 |
+
class: logging.StreamHandler
|
| 76 |
+
formatter: simple
|
| 77 |
+
stream: ext://sys.stdout
|
| 78 |
+
root:
|
| 79 |
+
level: INFO
|
| 80 |
+
handlers:
|
| 81 |
+
- console
|
| 82 |
+
loggers:
|
| 83 |
+
logging_example:
|
| 84 |
+
level: DEBUG
|
| 85 |
+
disable_existing_loggers: false
|
| 86 |
+
job_logging:
|
| 87 |
+
version: 1
|
| 88 |
+
formatters:
|
| 89 |
+
simple:
|
| 90 |
+
format: '[%(asctime)s][%(name)s][%(levelname)s] - %(message)s'
|
| 91 |
+
handlers:
|
| 92 |
+
console:
|
| 93 |
+
class: logging.StreamHandler
|
| 94 |
+
formatter: simple
|
| 95 |
+
stream: ext://sys.stdout
|
| 96 |
+
file:
|
| 97 |
+
class: logging.FileHandler
|
| 98 |
+
formatter: simple
|
| 99 |
+
filename: ${hydra.runtime.output_dir}/${hydra.job.name}.log
|
| 100 |
+
root:
|
| 101 |
+
level: INFO
|
| 102 |
+
handlers:
|
| 103 |
+
- console
|
| 104 |
+
- file
|
| 105 |
+
disable_existing_loggers: false
|
| 106 |
+
env: {}
|
| 107 |
+
mode: MULTIRUN
|
| 108 |
+
searchpath: []
|
| 109 |
+
callbacks: {}
|
| 110 |
+
output_subdir: .
|
| 111 |
+
overrides:
|
| 112 |
+
hydra:
|
| 113 |
+
- hydra.mode=MULTIRUN
|
| 114 |
+
task:
|
| 115 |
+
- algorithm=sb3_ppo
|
| 116 |
+
- env_id=RBC3D-hard-v0
|
| 117 |
+
- rl_mode=marl
|
| 118 |
+
- seed=1
|
| 119 |
+
job:
|
| 120 |
+
name: test_sb3
|
| 121 |
+
chdir: true
|
| 122 |
+
override_dirname: algorithm=sb3_ppo,env_id=RBC3D-hard-v0,rl_mode=marl,seed=1
|
| 123 |
+
id: ???
|
| 124 |
+
num: ???
|
| 125 |
+
config_name: test_sb3
|
| 126 |
+
env_set: {}
|
| 127 |
+
env_copy: []
|
| 128 |
+
config:
|
| 129 |
+
override_dirname:
|
| 130 |
+
kv_sep: '='
|
| 131 |
+
item_sep: ','
|
| 132 |
+
exclude_keys: []
|
| 133 |
+
runtime:
|
| 134 |
+
version: 1.3.2
|
| 135 |
+
version_base: '1.3'
|
| 136 |
+
cwd: /cephfs/users/becktepe/git_projects/FluidGym
|
| 137 |
+
config_sources:
|
| 138 |
+
- path: hydra.conf
|
| 139 |
+
schema: pkg
|
| 140 |
+
provider: hydra
|
| 141 |
+
- path: /cephfs/users/becktepe/git_projects/FluidGym/runscripts/configs
|
| 142 |
+
schema: file
|
| 143 |
+
provider: main
|
| 144 |
+
- path: hydra_plugins.hydra_colorlog.conf
|
| 145 |
+
schema: pkg
|
| 146 |
+
provider: hydra-colorlog
|
| 147 |
+
- path: ''
|
| 148 |
+
schema: structured
|
| 149 |
+
provider: schema
|
| 150 |
+
output_dir: ???
|
| 151 |
+
choices:
|
| 152 |
+
cluster: local
|
| 153 |
+
algorithm: sb3_ppo
|
| 154 |
+
hydra/env: default
|
| 155 |
+
hydra/callbacks: null
|
| 156 |
+
hydra/job_logging: default
|
| 157 |
+
hydra/hydra_logging: default
|
| 158 |
+
hydra/hydra_help: default
|
| 159 |
+
hydra/help: default
|
| 160 |
+
hydra/sweeper: basic
|
| 161 |
+
hydra/launcher: basic
|
| 162 |
+
hydra/output: default
|
| 163 |
+
verbose: false
|
| 164 |
+
env_id: RBC3D-hard-v0
|
| 165 |
+
env_kwargs: {}
|
| 166 |
+
eval_env_kwargs: {}
|
| 167 |
+
seed: 1
|
| 168 |
+
rl_mode: marl
|
| 169 |
+
total_timesteps: 50000.0
|
| 170 |
+
n_eval_steps: 10
|
| 171 |
+
eval_freq: ${eval:${total_timesteps} // ${n_eval_steps}}
|
| 172 |
+
n_eval_episodes: 1
|
| 173 |
+
continue_training: false
|
| 174 |
+
checkpoint_latest: true
|
| 175 |
+
rl_device: cpu
|
| 176 |
+
eval_callback:
|
| 177 |
+
_target_: fluidgym.integration.sb3.EvalCallback
|
| 178 |
+
eval_freq: ${eval_freq}
|
| 179 |
+
n_eval_episodes: ${n_eval_episodes}
|
| 180 |
+
use_wandb: ${wandb.enable}
|
| 181 |
+
checkpoint_latest: ${checkpoint_latest}
|
| 182 |
+
wandb:
|
| 183 |
+
enable: true
|
| 184 |
+
entity: safe-autonomous-systems
|
| 185 |
+
project: jbecktepe-fluidgym
|
| 186 |
+
algorithm:
|
| 187 |
+
name: PPO
|
| 188 |
+
obj:
|
| 189 |
+
_target_: stable_baselines3.ppo.ppo.PPO
|
| 190 |
+
policy: MlpPolicy
|
| 191 |
+
learning_rate: 0.0003
|
| 192 |
+
n_steps: 2048
|
| 193 |
+
batch_size: 64
|
| 194 |
+
n_epochs: 10
|
| 195 |
+
gamma: 0.99
|
| 196 |
+
gae_lambda: 0.95
|
| 197 |
+
clip_range: 0.2
|
| 198 |
+
clip_range_vf: null
|
| 199 |
+
normalize_advantage: true
|
| 200 |
+
ent_coef: 0.01
|
| 201 |
+
vf_coef: 0.5
|
| 202 |
+
max_grad_norm: 0.5
|
| 203 |
+
use_sde: false
|
| 204 |
+
sde_sample_freq: -1
|
| 205 |
+
rollout_buffer_class: null
|
| 206 |
+
rollout_buffer_kwargs: null
|
| 207 |
+
target_kl: null
|
| 208 |
+
stats_window_size: 100
|
| 209 |
+
tensorboard_log: null
|
| 210 |
+
verbose: 0
|
| 211 |
+
seed: ${seed}
|
| 212 |
+
device: ${rl_device}
|
| 213 |
+
_init_setup_model: true
|
| 214 |
+
cluster: {}
|
| 215 |
+
test_env_id: ${env_id}
|
| 216 |
+
test_env_kwargs: ${env_kwargs}
|
| 217 |
+
test_rl_mode: ${rl_mode}
|
| 218 |
+
n_test_episodes: 10
|
| 219 |
+
deterministic: true
|
| 220 |
+
save_frames: true
|
| 221 |
+
render_3d: true
|
1/overrides.yaml
ADDED
|
@@ -0,0 +1,4 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
- algorithm=sb3_ppo
|
| 2 |
+
- env_id=RBC3D-hard-v0
|
| 3 |
+
- rl_mode=marl
|
| 4 |
+
- seed=1
|
1/test/3d_temperature_test_eval_episode_0.gif
ADDED
|
Git LFS Details
|
1/test/test_eval_episode_0.csv
ADDED
|
The diff for this file is too large to render.
See raw diff
|
|
|
1/test/x-y-temperature_test_eval_episode_0.gif
ADDED
|
Git LFS Details
|
1/test/x-z-temperature_test_eval_episode_0.gif
ADDED
|
Git LFS Details
|
1/test/y-z-temperature_test_eval_episode_0.gif
ADDED
|
Git LFS Details
|
1/training_log.csv
ADDED
|
@@ -0,0 +1,113 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
step,training/mean_reward,training/mean_global_reward,training/mean_nusselt,evaluation/mean_nusselt,evaluation/mean_reward
|
| 2 |
+
500,-0.10473909229040146,-0.10473910093307495,2.7886721129417418,,
|
| 3 |
+
1000,-0.11437033116817474,-0.11437034177780152,2.7983033628463745,,
|
| 4 |
+
1500,-0.10812825709581375,-0.1081282525062561,2.7920612678527834,,
|
| 5 |
+
2000,-0.1092241182923317,-0.10922413301467895,2.7931571397781374,,
|
| 6 |
+
2500,-0.06332778930664062,-0.06332779312133789,2.7472607975006103,,
|
| 7 |
+
3000,-0.04805663600564003,-0.048056637287139894,2.731989667892456,,
|
| 8 |
+
3500,-0.0665203183889389,-0.06652032232284547,2.750453339099884,,
|
| 9 |
+
4000,-0.07367736101150513,-0.07367735958099365,2.757610381126404,,
|
| 10 |
+
4500,-0.03073206916451454,-0.03073206663131714,2.7146650924682616,,
|
| 11 |
+
5000,-0.032601144164800644,-0.032601141929626466,2.7165341596603394,,
|
| 12 |
+
5000,,,,2.6426688849925997,0.0412641316652298
|
| 13 |
+
5500,-0.028387920930981636,-0.028387924194335938,2.7123209376335145,,
|
| 14 |
+
6000,-0.0317373052239418,-0.03173730707168579,2.715670318603516,,
|
| 15 |
+
6500,0.010132984258234501,0.010132984638214111,2.67380003452301,,
|
| 16 |
+
7000,0.01896466501057148,0.018964664459228515,2.6649683561325075,,
|
| 17 |
+
7500,0.022173656150698662,0.022173654556274413,2.6617593674659727,,
|
| 18 |
+
8000,0.021737616509199142,0.021737616062164306,2.6621953978538513,,
|
| 19 |
+
8500,0.04402424767613411,0.04402424430847168,2.639908770561218,,
|
| 20 |
+
9000,0.05931568890810013,0.05931569242477417,2.624617331027985,,
|
| 21 |
+
9500,0.06714131683111191,0.06714131736755372,2.616791696548462,,
|
| 22 |
+
10000,0.06616228073835373,0.06616227865219117,2.617770739555359,,
|
| 23 |
+
10000,,,,2.517852562665939,0.16608044505119324
|
| 24 |
+
10500,0.09077046066522598,0.09077046489715576,2.593162568092346,,
|
| 25 |
+
11000,0.09030970931053162,0.09030971336364746,2.593623312473297,,
|
| 26 |
+
11500,0.09332715719938278,0.09332715225219726,2.590605867385864,,
|
| 27 |
+
12000,0.08051171898841858,0.08051172018051148,2.603421299934387,,
|
| 28 |
+
12500,0.08307775855064392,0.08307775926589966,2.600855254650116,,
|
| 29 |
+
13000,0.10575522482395172,0.10575522232055665,2.5781777935028076,,
|
| 30 |
+
13500,0.10483419895172119,0.10483420085906982,2.579098823070526,,
|
| 31 |
+
14000,0.09483081102371216,0.09483081674575805,2.5891022005081177,,
|
| 32 |
+
14500,0.09545854479074478,0.09545853233337402,2.588474492073059,,
|
| 33 |
+
15000,0.11473210901021957,0.11473210096359253,2.569200909137726,,
|
| 34 |
+
15000,,,,2.4405125832557677,0.24342042207717896
|
| 35 |
+
15500,0.1548132300376892,0.15481324338912963,2.529119783401489,,
|
| 36 |
+
16000,0.11040763556957245,0.110407630443573,2.573525391101837,,
|
| 37 |
+
16500,0.13510961830615997,0.13510964012145996,2.5488233790397645,,
|
| 38 |
+
17000,0.152826726436615,0.1528267183303833,2.5311062974929808,,
|
| 39 |
+
17500,0.15706315636634827,0.1570631628036499,2.5268698654174804,,
|
| 40 |
+
18000,0.15728147327899933,0.15728148221969604,2.526651542186737,,
|
| 41 |
+
18500,0.1420203149318695,0.14202031898498535,2.541912701129913,,
|
| 42 |
+
19000,0.16043342649936676,0.1604334216117859,2.523499596595764,,
|
| 43 |
+
19500,0.17701265215873718,0.1770126576423645,2.5069203658103945,,
|
| 44 |
+
20000,0.16953414678573608,0.16953416442871094,2.5143988547325136,,
|
| 45 |
+
20000,,,,2.3824210035800935,0.3015120029449463
|
| 46 |
+
20500,0.17038074135780334,0.17038074445724488,2.5135522665977477,,
|
| 47 |
+
21000,0.2094847410917282,0.20948473739624024,2.47444829082489,,
|
| 48 |
+
21500,0.1860993653535843,0.18609936904907226,2.4978336610794067,,
|
| 49 |
+
22000,0.17906510829925537,0.1790651125907898,2.504867914199829,,
|
| 50 |
+
22500,0.1926639974117279,0.19266398334503174,2.491269036769867,,
|
| 51 |
+
23000,0.19894438982009888,0.19894437980651855,2.4849886326789856,,
|
| 52 |
+
23500,0.20095068216323853,0.20095067596435548,2.4829823422431945,,
|
| 53 |
+
24000,0.20060814917087555,0.20060817003250123,2.483324849128723,,
|
| 54 |
+
24500,0.1969020664691925,0.1969020857810974,2.4870309391021728,,
|
| 55 |
+
25000,0.23283688724040985,0.23283690309524535,2.451096116542816,,
|
| 56 |
+
25000,,,,2.429212571382523,0.25472044944763184
|
| 57 |
+
25500,0.22810743749141693,0.2281074357032776,2.455825581073761,,
|
| 58 |
+
26000,0.17585402727127075,0.17585404062271118,2.508078989505768,,
|
| 59 |
+
26500,0.1974763721227646,0.19747639274597167,2.4864566321372985,,
|
| 60 |
+
27000,0.19330130517482758,0.19330129528045653,2.4906317262649535,,
|
| 61 |
+
27500,0.19500063359737396,0.19500066471099853,2.4889323539733885,,
|
| 62 |
+
28000,0.17882174253463745,0.17882175874710082,2.505111262798309,,
|
| 63 |
+
28500,0.19655285775661469,0.196552836894989,2.487380187034607,,
|
| 64 |
+
29000,0.19838356971740723,0.1983835849761963,2.485549425125122,,
|
| 65 |
+
29500,0.20945845544338226,0.2094584560394287,2.4744745626449585,,
|
| 66 |
+
30000,0.21305443346500397,0.21305444002151488,2.4708785848617554,,
|
| 67 |
+
30000,,,,2.38564071893692,0.2982923090457916
|
| 68 |
+
30500,0.19604277610778809,0.19604277896881103,2.4878902373313903,,
|
| 69 |
+
31000,0.19012241065502167,0.19012243795394898,2.4938105845451357,,
|
| 70 |
+
31500,0.16483792662620544,0.16483793210983277,2.519095088481903,,
|
| 71 |
+
32000,0.16758312284946442,0.1675831413269043,2.5163498864173888,,
|
| 72 |
+
32500,0.1661965250968933,0.16619652223587036,2.5177364993095397,,
|
| 73 |
+
33000,0.17162758111953735,0.17162758111953735,2.512305441379547,,
|
| 74 |
+
33500,0.18727459013462067,0.18727459049224854,2.496658432483673,,
|
| 75 |
+
34000,0.20026737451553345,0.20026736068725587,2.4836656460762025,,
|
| 76 |
+
34500,0.2072226107120514,0.20722259902954102,2.4767104244232176,,
|
| 77 |
+
35000,0.2095581293106079,0.20955812358856202,2.474374900817871,,
|
| 78 |
+
35000,,,,2.3982539796829223,0.28567904233932495
|
| 79 |
+
35500,0.20795513689517975,0.20795512676239014,2.4759778938293455,,
|
| 80 |
+
36000,0.18025662004947662,0.18025661516189576,2.503676395893097,,
|
| 81 |
+
36500,0.216342031955719,0.21634201431274414,2.467591009616852,,
|
| 82 |
+
37000,0.19791540503501892,0.19791542959213257,2.486017594337463,,
|
| 83 |
+
37500,0.20728115737438202,0.20728116655349732,2.4766518535614015,,
|
| 84 |
+
38000,0.21051238477230072,0.2105123815536499,2.4734206290245058,,
|
| 85 |
+
38500,0.194564551115036,0.1945645327568054,2.48936848115921,,
|
| 86 |
+
39000,0.21987104415893555,0.2198710379600525,2.4640619711875917,,
|
| 87 |
+
39500,0.21882669627666473,0.21882668495178223,2.4651063356399536,,
|
| 88 |
+
40000,0.20878826081752777,0.20878826665878297,2.4751447463035583,,
|
| 89 |
+
40000,,,,2.4059288442134856,0.27800416946411133
|
| 90 |
+
40500,0.20664410293102264,0.20664411783218384,2.4772888927459715,,
|
| 91 |
+
41000,0.2155437022447586,0.21554368066787719,2.468389335155487,,
|
| 92 |
+
41500,0.2191316932439804,0.21913169670104982,2.464801323413849,,
|
| 93 |
+
42000,0.23121215403079987,0.23121215963363648,2.452720853328705,,
|
| 94 |
+
42500,0.23894308507442474,0.23894308614730836,2.4449899406433104,,
|
| 95 |
+
43000,0.24045385420322418,0.24045384836196898,2.44347917509079,,
|
| 96 |
+
43500,0.23086871206760406,0.23086871957778932,2.4530642910003664,,
|
| 97 |
+
44000,0.2347283512353897,0.23472836446762085,2.4492046546936037,,
|
| 98 |
+
44500,0.19872625172138214,0.19872627067565918,2.485206757545471,,
|
| 99 |
+
45000,0.21545526385307312,0.21545526313781738,2.468477746963501,,
|
| 100 |
+
45000,,,,2.363110291957855,0.32082271575927734
|
| 101 |
+
45500,0.21902252733707428,0.21902254390716552,2.464910472393036,,
|
| 102 |
+
46000,0.2270890474319458,0.22708905458450318,2.456843957901001,,
|
| 103 |
+
46500,0.23847335577011108,0.2384733624458313,2.445459652900696,,
|
| 104 |
+
47000,0.24715656042099,0.24715657043457032,2.436776443004608,,
|
| 105 |
+
47500,0.22855865955352783,0.2285586667060852,2.455374363422394,,
|
| 106 |
+
48000,0.23548468947410583,0.23548469829559326,2.4484483251571656,,
|
| 107 |
+
48500,0.2541220486164093,0.2541220273971558,2.4298109912872317,,
|
| 108 |
+
49000,0.22654587030410767,0.22654584121704102,2.4573871784210204,,
|
| 109 |
+
49500,0.2262624204158783,0.2262624340057373,2.45767058801651,,
|
| 110 |
+
50000,0.24036908149719238,0.24036908674240112,2.443563925743103,,
|
| 111 |
+
50000,,,,2.362757978439331,0.3211750388145447
|
| 112 |
+
50500,0.24408045411109924,0.24408046054840088,2.4398525590896605,,
|
| 113 |
+
51000,0.2395782768726349,0.23957825946807862,2.4443547587394714,,
|
2/ckpt_latest.zip
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:f0ebbb2f4e0c915a29398c45b2f1caaa29efa7b3a4beb9954108b3c7c392d7b4
|
| 3 |
+
size 8844014
|
2/config.yaml
ADDED
|
@@ -0,0 +1,58 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
env_id: RBC3D-hard-v0
|
| 2 |
+
env_kwargs: {}
|
| 3 |
+
eval_env_kwargs: {}
|
| 4 |
+
seed: 2
|
| 5 |
+
rl_mode: marl
|
| 6 |
+
total_timesteps: 50000.0
|
| 7 |
+
n_eval_steps: 10
|
| 8 |
+
eval_freq: ${eval:${total_timesteps} // ${n_eval_steps}}
|
| 9 |
+
n_eval_episodes: 1
|
| 10 |
+
continue_training: false
|
| 11 |
+
checkpoint_latest: true
|
| 12 |
+
rl_device: cpu
|
| 13 |
+
eval_callback:
|
| 14 |
+
_target_: fluidgym.integration.sb3.EvalCallback
|
| 15 |
+
eval_freq: ${eval_freq}
|
| 16 |
+
n_eval_episodes: ${n_eval_episodes}
|
| 17 |
+
use_wandb: ${wandb.enable}
|
| 18 |
+
checkpoint_latest: ${checkpoint_latest}
|
| 19 |
+
wandb:
|
| 20 |
+
enable: true
|
| 21 |
+
entity: safe-autonomous-systems
|
| 22 |
+
project: jbecktepe-fluidgym
|
| 23 |
+
algorithm:
|
| 24 |
+
name: PPO
|
| 25 |
+
obj:
|
| 26 |
+
_target_: stable_baselines3.ppo.ppo.PPO
|
| 27 |
+
policy: MlpPolicy
|
| 28 |
+
learning_rate: 0.0003
|
| 29 |
+
n_steps: 2048
|
| 30 |
+
batch_size: 64
|
| 31 |
+
n_epochs: 10
|
| 32 |
+
gamma: 0.99
|
| 33 |
+
gae_lambda: 0.95
|
| 34 |
+
clip_range: 0.2
|
| 35 |
+
clip_range_vf: null
|
| 36 |
+
normalize_advantage: true
|
| 37 |
+
ent_coef: 0.01
|
| 38 |
+
vf_coef: 0.5
|
| 39 |
+
max_grad_norm: 0.5
|
| 40 |
+
use_sde: false
|
| 41 |
+
sde_sample_freq: -1
|
| 42 |
+
rollout_buffer_class: null
|
| 43 |
+
rollout_buffer_kwargs: null
|
| 44 |
+
target_kl: null
|
| 45 |
+
stats_window_size: 100
|
| 46 |
+
tensorboard_log: null
|
| 47 |
+
verbose: 0
|
| 48 |
+
seed: ${seed}
|
| 49 |
+
device: ${rl_device}
|
| 50 |
+
_init_setup_model: true
|
| 51 |
+
cluster: {}
|
| 52 |
+
test_env_id: ${env_id}
|
| 53 |
+
test_env_kwargs: ${env_kwargs}
|
| 54 |
+
test_rl_mode: ${rl_mode}
|
| 55 |
+
n_test_episodes: 10
|
| 56 |
+
deterministic: true
|
| 57 |
+
save_frames: true
|
| 58 |
+
render_3d: true
|
2/hydra.yaml
ADDED
|
@@ -0,0 +1,163 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
hydra:
|
| 2 |
+
run:
|
| 3 |
+
dir: output/training/${rl_mode}/${env_id}/${algorithm.name}/${seed}
|
| 4 |
+
sweep:
|
| 5 |
+
dir: output/training/${rl_mode}/${env_id}/${algorithm.name}/${seed}
|
| 6 |
+
subdir: ''
|
| 7 |
+
launcher:
|
| 8 |
+
_target_: hydra._internal.core_plugins.basic_launcher.BasicLauncher
|
| 9 |
+
sweeper:
|
| 10 |
+
_target_: hydra._internal.core_plugins.basic_sweeper.BasicSweeper
|
| 11 |
+
max_batch_size: null
|
| 12 |
+
params: null
|
| 13 |
+
help:
|
| 14 |
+
app_name: ${hydra.job.name}
|
| 15 |
+
header: '${hydra.help.app_name} is powered by Hydra.
|
| 16 |
+
|
| 17 |
+
'
|
| 18 |
+
footer: 'Powered by Hydra (https://hydra.cc)
|
| 19 |
+
|
| 20 |
+
Use --hydra-help to view Hydra specific help
|
| 21 |
+
|
| 22 |
+
'
|
| 23 |
+
template: '${hydra.help.header}
|
| 24 |
+
|
| 25 |
+
== Configuration groups ==
|
| 26 |
+
|
| 27 |
+
Compose your configuration from those groups (group=option)
|
| 28 |
+
|
| 29 |
+
|
| 30 |
+
$APP_CONFIG_GROUPS
|
| 31 |
+
|
| 32 |
+
|
| 33 |
+
== Config ==
|
| 34 |
+
|
| 35 |
+
Override anything in the config (foo.bar=value)
|
| 36 |
+
|
| 37 |
+
|
| 38 |
+
$CONFIG
|
| 39 |
+
|
| 40 |
+
|
| 41 |
+
${hydra.help.footer}
|
| 42 |
+
|
| 43 |
+
'
|
| 44 |
+
hydra_help:
|
| 45 |
+
template: 'Hydra (${hydra.runtime.version})
|
| 46 |
+
|
| 47 |
+
See https://hydra.cc for more info.
|
| 48 |
+
|
| 49 |
+
|
| 50 |
+
== Flags ==
|
| 51 |
+
|
| 52 |
+
$FLAGS_HELP
|
| 53 |
+
|
| 54 |
+
|
| 55 |
+
== Configuration groups ==
|
| 56 |
+
|
| 57 |
+
Compose your configuration from those groups (For example, append hydra/job_logging=disabled
|
| 58 |
+
to command line)
|
| 59 |
+
|
| 60 |
+
|
| 61 |
+
$HYDRA_CONFIG_GROUPS
|
| 62 |
+
|
| 63 |
+
|
| 64 |
+
Use ''--cfg hydra'' to Show the Hydra config.
|
| 65 |
+
|
| 66 |
+
'
|
| 67 |
+
hydra_help: ???
|
| 68 |
+
hydra_logging:
|
| 69 |
+
version: 1
|
| 70 |
+
formatters:
|
| 71 |
+
simple:
|
| 72 |
+
format: '[%(asctime)s][HYDRA] %(message)s'
|
| 73 |
+
handlers:
|
| 74 |
+
console:
|
| 75 |
+
class: logging.StreamHandler
|
| 76 |
+
formatter: simple
|
| 77 |
+
stream: ext://sys.stdout
|
| 78 |
+
root:
|
| 79 |
+
level: INFO
|
| 80 |
+
handlers:
|
| 81 |
+
- console
|
| 82 |
+
loggers:
|
| 83 |
+
logging_example:
|
| 84 |
+
level: DEBUG
|
| 85 |
+
disable_existing_loggers: false
|
| 86 |
+
job_logging:
|
| 87 |
+
version: 1
|
| 88 |
+
formatters:
|
| 89 |
+
simple:
|
| 90 |
+
format: '[%(asctime)s][%(name)s][%(levelname)s] - %(message)s'
|
| 91 |
+
handlers:
|
| 92 |
+
console:
|
| 93 |
+
class: logging.StreamHandler
|
| 94 |
+
formatter: simple
|
| 95 |
+
stream: ext://sys.stdout
|
| 96 |
+
file:
|
| 97 |
+
class: logging.FileHandler
|
| 98 |
+
formatter: simple
|
| 99 |
+
filename: ${hydra.runtime.output_dir}/${hydra.job.name}.log
|
| 100 |
+
root:
|
| 101 |
+
level: INFO
|
| 102 |
+
handlers:
|
| 103 |
+
- console
|
| 104 |
+
- file
|
| 105 |
+
disable_existing_loggers: false
|
| 106 |
+
env: {}
|
| 107 |
+
mode: MULTIRUN
|
| 108 |
+
searchpath: []
|
| 109 |
+
callbacks: {}
|
| 110 |
+
output_subdir: .
|
| 111 |
+
overrides:
|
| 112 |
+
hydra:
|
| 113 |
+
- hydra.mode=MULTIRUN
|
| 114 |
+
task:
|
| 115 |
+
- algorithm=sb3_ppo
|
| 116 |
+
- env_id=RBC3D-hard-v0
|
| 117 |
+
- rl_mode=marl
|
| 118 |
+
- seed=2
|
| 119 |
+
job:
|
| 120 |
+
name: test_sb3
|
| 121 |
+
chdir: true
|
| 122 |
+
override_dirname: algorithm=sb3_ppo,env_id=RBC3D-hard-v0,rl_mode=marl,seed=2
|
| 123 |
+
id: '0'
|
| 124 |
+
num: 0
|
| 125 |
+
config_name: test_sb3
|
| 126 |
+
env_set: {}
|
| 127 |
+
env_copy: []
|
| 128 |
+
config:
|
| 129 |
+
override_dirname:
|
| 130 |
+
kv_sep: '='
|
| 131 |
+
item_sep: ','
|
| 132 |
+
exclude_keys: []
|
| 133 |
+
runtime:
|
| 134 |
+
version: 1.3.2
|
| 135 |
+
version_base: '1.3'
|
| 136 |
+
cwd: /cephfs/users/becktepe/git_projects/FluidGym
|
| 137 |
+
config_sources:
|
| 138 |
+
- path: hydra.conf
|
| 139 |
+
schema: pkg
|
| 140 |
+
provider: hydra
|
| 141 |
+
- path: /cephfs/users/becktepe/git_projects/FluidGym/runscripts/configs
|
| 142 |
+
schema: file
|
| 143 |
+
provider: main
|
| 144 |
+
- path: hydra_plugins.hydra_colorlog.conf
|
| 145 |
+
schema: pkg
|
| 146 |
+
provider: hydra-colorlog
|
| 147 |
+
- path: ''
|
| 148 |
+
schema: structured
|
| 149 |
+
provider: schema
|
| 150 |
+
output_dir: /cephfs/users/becktepe/git_projects/FluidGym/output/training/marl/RBC3D-hard-v0/PPO/2
|
| 151 |
+
choices:
|
| 152 |
+
cluster: local
|
| 153 |
+
algorithm: sb3_ppo
|
| 154 |
+
hydra/env: default
|
| 155 |
+
hydra/callbacks: null
|
| 156 |
+
hydra/job_logging: default
|
| 157 |
+
hydra/hydra_logging: default
|
| 158 |
+
hydra/hydra_help: default
|
| 159 |
+
hydra/help: default
|
| 160 |
+
hydra/sweeper: basic
|
| 161 |
+
hydra/launcher: basic
|
| 162 |
+
hydra/output: default
|
| 163 |
+
verbose: false
|
2/multirun.yaml
ADDED
|
@@ -0,0 +1,221 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
hydra:
|
| 2 |
+
run:
|
| 3 |
+
dir: output/training/${rl_mode}/${env_id}/${algorithm.name}/${seed}
|
| 4 |
+
sweep:
|
| 5 |
+
dir: output/training/${rl_mode}/${env_id}/${algorithm.name}/${seed}
|
| 6 |
+
subdir: ''
|
| 7 |
+
launcher:
|
| 8 |
+
_target_: hydra._internal.core_plugins.basic_launcher.BasicLauncher
|
| 9 |
+
sweeper:
|
| 10 |
+
_target_: hydra._internal.core_plugins.basic_sweeper.BasicSweeper
|
| 11 |
+
max_batch_size: null
|
| 12 |
+
params: null
|
| 13 |
+
help:
|
| 14 |
+
app_name: ${hydra.job.name}
|
| 15 |
+
header: '${hydra.help.app_name} is powered by Hydra.
|
| 16 |
+
|
| 17 |
+
'
|
| 18 |
+
footer: 'Powered by Hydra (https://hydra.cc)
|
| 19 |
+
|
| 20 |
+
Use --hydra-help to view Hydra specific help
|
| 21 |
+
|
| 22 |
+
'
|
| 23 |
+
template: '${hydra.help.header}
|
| 24 |
+
|
| 25 |
+
== Configuration groups ==
|
| 26 |
+
|
| 27 |
+
Compose your configuration from those groups (group=option)
|
| 28 |
+
|
| 29 |
+
|
| 30 |
+
$APP_CONFIG_GROUPS
|
| 31 |
+
|
| 32 |
+
|
| 33 |
+
== Config ==
|
| 34 |
+
|
| 35 |
+
Override anything in the config (foo.bar=value)
|
| 36 |
+
|
| 37 |
+
|
| 38 |
+
$CONFIG
|
| 39 |
+
|
| 40 |
+
|
| 41 |
+
${hydra.help.footer}
|
| 42 |
+
|
| 43 |
+
'
|
| 44 |
+
hydra_help:
|
| 45 |
+
template: 'Hydra (${hydra.runtime.version})
|
| 46 |
+
|
| 47 |
+
See https://hydra.cc for more info.
|
| 48 |
+
|
| 49 |
+
|
| 50 |
+
== Flags ==
|
| 51 |
+
|
| 52 |
+
$FLAGS_HELP
|
| 53 |
+
|
| 54 |
+
|
| 55 |
+
== Configuration groups ==
|
| 56 |
+
|
| 57 |
+
Compose your configuration from those groups (For example, append hydra/job_logging=disabled
|
| 58 |
+
to command line)
|
| 59 |
+
|
| 60 |
+
|
| 61 |
+
$HYDRA_CONFIG_GROUPS
|
| 62 |
+
|
| 63 |
+
|
| 64 |
+
Use ''--cfg hydra'' to Show the Hydra config.
|
| 65 |
+
|
| 66 |
+
'
|
| 67 |
+
hydra_help: ???
|
| 68 |
+
hydra_logging:
|
| 69 |
+
version: 1
|
| 70 |
+
formatters:
|
| 71 |
+
simple:
|
| 72 |
+
format: '[%(asctime)s][HYDRA] %(message)s'
|
| 73 |
+
handlers:
|
| 74 |
+
console:
|
| 75 |
+
class: logging.StreamHandler
|
| 76 |
+
formatter: simple
|
| 77 |
+
stream: ext://sys.stdout
|
| 78 |
+
root:
|
| 79 |
+
level: INFO
|
| 80 |
+
handlers:
|
| 81 |
+
- console
|
| 82 |
+
loggers:
|
| 83 |
+
logging_example:
|
| 84 |
+
level: DEBUG
|
| 85 |
+
disable_existing_loggers: false
|
| 86 |
+
job_logging:
|
| 87 |
+
version: 1
|
| 88 |
+
formatters:
|
| 89 |
+
simple:
|
| 90 |
+
format: '[%(asctime)s][%(name)s][%(levelname)s] - %(message)s'
|
| 91 |
+
handlers:
|
| 92 |
+
console:
|
| 93 |
+
class: logging.StreamHandler
|
| 94 |
+
formatter: simple
|
| 95 |
+
stream: ext://sys.stdout
|
| 96 |
+
file:
|
| 97 |
+
class: logging.FileHandler
|
| 98 |
+
formatter: simple
|
| 99 |
+
filename: ${hydra.runtime.output_dir}/${hydra.job.name}.log
|
| 100 |
+
root:
|
| 101 |
+
level: INFO
|
| 102 |
+
handlers:
|
| 103 |
+
- console
|
| 104 |
+
- file
|
| 105 |
+
disable_existing_loggers: false
|
| 106 |
+
env: {}
|
| 107 |
+
mode: MULTIRUN
|
| 108 |
+
searchpath: []
|
| 109 |
+
callbacks: {}
|
| 110 |
+
output_subdir: .
|
| 111 |
+
overrides:
|
| 112 |
+
hydra:
|
| 113 |
+
- hydra.mode=MULTIRUN
|
| 114 |
+
task:
|
| 115 |
+
- algorithm=sb3_ppo
|
| 116 |
+
- env_id=RBC3D-hard-v0
|
| 117 |
+
- rl_mode=marl
|
| 118 |
+
- seed=2
|
| 119 |
+
job:
|
| 120 |
+
name: test_sb3
|
| 121 |
+
chdir: true
|
| 122 |
+
override_dirname: algorithm=sb3_ppo,env_id=RBC3D-hard-v0,rl_mode=marl,seed=2
|
| 123 |
+
id: ???
|
| 124 |
+
num: ???
|
| 125 |
+
config_name: test_sb3
|
| 126 |
+
env_set: {}
|
| 127 |
+
env_copy: []
|
| 128 |
+
config:
|
| 129 |
+
override_dirname:
|
| 130 |
+
kv_sep: '='
|
| 131 |
+
item_sep: ','
|
| 132 |
+
exclude_keys: []
|
| 133 |
+
runtime:
|
| 134 |
+
version: 1.3.2
|
| 135 |
+
version_base: '1.3'
|
| 136 |
+
cwd: /cephfs/users/becktepe/git_projects/FluidGym
|
| 137 |
+
config_sources:
|
| 138 |
+
- path: hydra.conf
|
| 139 |
+
schema: pkg
|
| 140 |
+
provider: hydra
|
| 141 |
+
- path: /cephfs/users/becktepe/git_projects/FluidGym/runscripts/configs
|
| 142 |
+
schema: file
|
| 143 |
+
provider: main
|
| 144 |
+
- path: hydra_plugins.hydra_colorlog.conf
|
| 145 |
+
schema: pkg
|
| 146 |
+
provider: hydra-colorlog
|
| 147 |
+
- path: ''
|
| 148 |
+
schema: structured
|
| 149 |
+
provider: schema
|
| 150 |
+
output_dir: ???
|
| 151 |
+
choices:
|
| 152 |
+
cluster: local
|
| 153 |
+
algorithm: sb3_ppo
|
| 154 |
+
hydra/env: default
|
| 155 |
+
hydra/callbacks: null
|
| 156 |
+
hydra/job_logging: default
|
| 157 |
+
hydra/hydra_logging: default
|
| 158 |
+
hydra/hydra_help: default
|
| 159 |
+
hydra/help: default
|
| 160 |
+
hydra/sweeper: basic
|
| 161 |
+
hydra/launcher: basic
|
| 162 |
+
hydra/output: default
|
| 163 |
+
verbose: false
|
| 164 |
+
env_id: RBC3D-hard-v0
|
| 165 |
+
env_kwargs: {}
|
| 166 |
+
eval_env_kwargs: {}
|
| 167 |
+
seed: 2
|
| 168 |
+
rl_mode: marl
|
| 169 |
+
total_timesteps: 50000.0
|
| 170 |
+
n_eval_steps: 10
|
| 171 |
+
eval_freq: ${eval:${total_timesteps} // ${n_eval_steps}}
|
| 172 |
+
n_eval_episodes: 1
|
| 173 |
+
continue_training: false
|
| 174 |
+
checkpoint_latest: true
|
| 175 |
+
rl_device: cpu
|
| 176 |
+
eval_callback:
|
| 177 |
+
_target_: fluidgym.integration.sb3.EvalCallback
|
| 178 |
+
eval_freq: ${eval_freq}
|
| 179 |
+
n_eval_episodes: ${n_eval_episodes}
|
| 180 |
+
use_wandb: ${wandb.enable}
|
| 181 |
+
checkpoint_latest: ${checkpoint_latest}
|
| 182 |
+
wandb:
|
| 183 |
+
enable: true
|
| 184 |
+
entity: safe-autonomous-systems
|
| 185 |
+
project: jbecktepe-fluidgym
|
| 186 |
+
algorithm:
|
| 187 |
+
name: PPO
|
| 188 |
+
obj:
|
| 189 |
+
_target_: stable_baselines3.ppo.ppo.PPO
|
| 190 |
+
policy: MlpPolicy
|
| 191 |
+
learning_rate: 0.0003
|
| 192 |
+
n_steps: 2048
|
| 193 |
+
batch_size: 64
|
| 194 |
+
n_epochs: 10
|
| 195 |
+
gamma: 0.99
|
| 196 |
+
gae_lambda: 0.95
|
| 197 |
+
clip_range: 0.2
|
| 198 |
+
clip_range_vf: null
|
| 199 |
+
normalize_advantage: true
|
| 200 |
+
ent_coef: 0.01
|
| 201 |
+
vf_coef: 0.5
|
| 202 |
+
max_grad_norm: 0.5
|
| 203 |
+
use_sde: false
|
| 204 |
+
sde_sample_freq: -1
|
| 205 |
+
rollout_buffer_class: null
|
| 206 |
+
rollout_buffer_kwargs: null
|
| 207 |
+
target_kl: null
|
| 208 |
+
stats_window_size: 100
|
| 209 |
+
tensorboard_log: null
|
| 210 |
+
verbose: 0
|
| 211 |
+
seed: ${seed}
|
| 212 |
+
device: ${rl_device}
|
| 213 |
+
_init_setup_model: true
|
| 214 |
+
cluster: {}
|
| 215 |
+
test_env_id: ${env_id}
|
| 216 |
+
test_env_kwargs: ${env_kwargs}
|
| 217 |
+
test_rl_mode: ${rl_mode}
|
| 218 |
+
n_test_episodes: 10
|
| 219 |
+
deterministic: true
|
| 220 |
+
save_frames: true
|
| 221 |
+
render_3d: true
|
2/overrides.yaml
ADDED
|
@@ -0,0 +1,4 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
- algorithm=sb3_ppo
|
| 2 |
+
- env_id=RBC3D-hard-v0
|
| 3 |
+
- rl_mode=marl
|
| 4 |
+
- seed=2
|
2/test/3d_temperature_test_eval_episode_0.gif
ADDED
|
Git LFS Details
|
2/test/test_eval_episode_0.csv
ADDED
|
The diff for this file is too large to render.
See raw diff
|
|
|
2/test/x-y-temperature_test_eval_episode_0.gif
ADDED
|
Git LFS Details
|
2/test/x-z-temperature_test_eval_episode_0.gif
ADDED
|
Git LFS Details
|
2/test/y-z-temperature_test_eval_episode_0.gif
ADDED
|
Git LFS Details
|
2/training_log.csv
ADDED
|
@@ -0,0 +1,113 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
step,training/mean_reward,training/mean_global_reward,training/mean_nusselt,evaluation/mean_nusselt,evaluation/mean_reward
|
| 2 |
+
500,-0.0994451716542244,-0.09944517850875854,2.783378199100494,,
|
| 3 |
+
1000,-0.10606984049081802,-0.10606984996795654,2.790002866744995,,
|
| 4 |
+
1500,-0.10751887410879135,-0.10751888036727905,2.7914519019126893,,
|
| 5 |
+
2000,-0.11211390793323517,-0.11211390495300293,2.7960469217300417,,
|
| 6 |
+
2500,-0.06497228145599365,-0.06497228765487671,2.748905309677124,,
|
| 7 |
+
3000,-0.07450605928897858,-0.07450606632232666,2.7584390859603882,,
|
| 8 |
+
3500,-0.07465509325265884,-0.07465509223937988,2.7585881171226503,,
|
| 9 |
+
4000,-0.05147909000515938,-0.051479094982147214,2.7354121136665346,,
|
| 10 |
+
4500,-0.04089735448360443,-0.040897353649139406,2.724830382823944,,
|
| 11 |
+
5000,-0.03495738282799721,-0.03495738363265991,2.718890408039093,,
|
| 12 |
+
5000,,,,2.6037181878089903,0.08021483570337296
|
| 13 |
+
5500,-0.039229728281497955,-0.03922972536087036,2.7231627402305603,,
|
| 14 |
+
6000,-0.03772832453250885,-0.037728325843811035,2.7216613421440123,,
|
| 15 |
+
6500,-0.0037587217520922422,-0.0037587223052978516,2.6876917366981505,,
|
| 16 |
+
7000,0.020572727546095848,0.020572731494903563,2.663360293388367,,
|
| 17 |
+
7500,0.0024799685925245285,0.002479968547821045,2.6814530634880067,,
|
| 18 |
+
8000,0.021671822294592857,0.021671819686889648,2.66226118850708,,
|
| 19 |
+
8500,0.029506858438253403,0.029506860256195068,2.6544261655807495,,
|
| 20 |
+
9000,0.03376694396138191,0.033766944885253905,2.6501660714149473,,
|
| 21 |
+
9500,0.022409599274396896,0.02240959930419922,2.6615234208106995,,
|
| 22 |
+
10000,0.030189668759703636,0.030189669609069825,2.653743350982666,,
|
| 23 |
+
10000,,,,2.5183556270599365,0.16557738184928894
|
| 24 |
+
10500,0.04676058888435364,0.04676058626174927,2.6371724247932433,,
|
| 25 |
+
11000,0.07060226798057556,0.07060226678848266,2.6133307514190673,,
|
| 26 |
+
11500,0.06412626802921295,0.0641262698173523,2.6198067574501036,,
|
| 27 |
+
12000,0.06050346419215202,0.06050346803665161,2.6234295644760133,,
|
| 28 |
+
12500,0.060363538563251495,0.06036353921890259,2.623569480419159,,
|
| 29 |
+
13000,0.08335579186677933,0.08335579109191894,2.6005772447586057,,
|
| 30 |
+
13500,0.08638317883014679,0.08638317489624023,2.5975498485565187,,
|
| 31 |
+
14000,0.06645781546831131,0.06645781898498535,2.617475203514099,,
|
| 32 |
+
14500,0.09151853621006012,0.09151853895187378,2.5924144792556763,,
|
| 33 |
+
15000,0.08465094119310379,0.08465094184875488,2.599282078266144,,
|
| 34 |
+
15000,,,,2.4451038384437562,0.23882916569709778
|
| 35 |
+
15500,0.11452946811914444,0.11452946090698242,2.5694035511016846,,
|
| 36 |
+
16000,0.09500941634178162,0.09500942277908325,2.588923593044281,,
|
| 37 |
+
16500,0.1292753368616104,0.12927532863616945,2.554657697200775,,
|
| 38 |
+
17000,0.13170774281024933,0.13170773887634277,2.5522252779006958,,
|
| 39 |
+
17500,0.14368891716003418,0.14368892765045166,2.540244092464447,,
|
| 40 |
+
18000,0.12941446900367737,0.12941448211669923,2.5545185537338257,,
|
| 41 |
+
18500,0.14257852733135223,0.14257851791381837,2.541354515552521,,
|
| 42 |
+
19000,0.13966801762580872,0.1396680188179016,2.5442650055885316,,
|
| 43 |
+
19500,0.11327601224184036,0.11327600574493409,2.570657021522522,,
|
| 44 |
+
20000,0.13754010200500488,0.137540096282959,2.5463929257392883,,
|
| 45 |
+
20000,,,,2.3374540960788726,0.3464789092540741
|
| 46 |
+
20500,0.1368420124053955,0.13684199571609498,2.547091028213501,,
|
| 47 |
+
21000,0.1405256986618042,0.1405256929397583,2.5434073238372803,,
|
| 48 |
+
21500,0.1498691737651825,0.14986918354034423,2.5340638318061828,,
|
| 49 |
+
22000,0.12159030139446259,0.12159030199050903,2.562342716693878,,
|
| 50 |
+
22500,0.1282031089067459,0.1282031044960022,2.5557299060821532,,
|
| 51 |
+
23000,0.13812652230262756,0.13812652015686036,2.545806498527527,,
|
| 52 |
+
23500,0.14436185359954834,0.14436183929443358,2.539571183204651,,
|
| 53 |
+
24000,0.14042876660823822,0.14042878341674805,2.543504234790802,,
|
| 54 |
+
24500,0.1500898152589798,0.15008983612060547,2.5338431830406187,,
|
| 55 |
+
25000,0.16284410655498505,0.1628440980911255,2.5210889225006103,,
|
| 56 |
+
25000,,,,2.390567365884781,0.2933656573295593
|
| 57 |
+
25500,0.16590774059295654,0.16590775299072266,2.518025266170502,,
|
| 58 |
+
26000,0.15530768036842346,0.15530769491195678,2.528625322341919,,
|
| 59 |
+
26500,0.17472608387470245,0.1747260971069336,2.509206932067871,,
|
| 60 |
+
27000,0.18254752457141876,0.1825475344657898,2.501385488986969,,
|
| 61 |
+
27500,0.1950436234474182,0.19504363346099854,2.488889398097992,,
|
| 62 |
+
28000,0.19465161859989166,0.19465161991119384,2.489281394481659,,
|
| 63 |
+
28500,0.16215169429779053,0.16215169429779053,2.521781334400177,,
|
| 64 |
+
29000,0.1890368014574051,0.1890368037223816,2.494896222114563,,
|
| 65 |
+
29500,0.16764257848262787,0.16764257097244262,2.5162904510498048,,
|
| 66 |
+
30000,0.18648077547550201,0.18648079109191895,2.497452229499817,,
|
| 67 |
+
30000,,,,2.4020849370956423,0.28184807300567627
|
| 68 |
+
30500,0.1981387883424759,0.19813880348205568,2.48579421377182,,
|
| 69 |
+
31000,0.1995157152414322,0.19951573085784913,2.484417300224304,,
|
| 70 |
+
31500,0.19233618676662445,0.19233620643615723,2.4915968136787416,,
|
| 71 |
+
32000,0.1899498850107193,0.18994987297058105,2.4939831395149232,,
|
| 72 |
+
32500,0.17684371769428253,0.17684373235702514,2.507089285373688,,
|
| 73 |
+
33000,0.1916748285293579,0.1916748285293579,2.4922581815719607,,
|
| 74 |
+
33500,0.19882339239120483,0.1988233962059021,2.4851096124649046,,
|
| 75 |
+
34000,0.18513064086437225,0.18513067245483397,2.4988023529052734,,
|
| 76 |
+
34500,0.18377690017223358,0.1837769031524658,2.50015611076355,,
|
| 77 |
+
35000,0.20141400396823883,0.20141400146484376,2.482519019126892,,
|
| 78 |
+
35000,,,,2.326228091716766,0.35770493745803833
|
| 79 |
+
35500,0.2049022763967514,0.20490229749679564,2.479030722618103,,
|
| 80 |
+
36000,0.1827041506767273,0.1827041506767273,2.501228865146637,,
|
| 81 |
+
36500,0.20387372374534607,0.2038737111091614,2.480059317111969,,
|
| 82 |
+
37000,0.196685329079628,0.19668533897399904,2.487247681617737,,
|
| 83 |
+
37500,0.20406845211982727,0.204068443775177,2.479864577770233,,
|
| 84 |
+
38000,0.19349411129951477,0.1934941005706787,2.490438925266266,,
|
| 85 |
+
38500,0.17627273499965668,0.17627272462844848,2.5076602902412413,,
|
| 86 |
+
39000,0.20846974849700928,0.20846974754333497,2.4754632654190063,,
|
| 87 |
+
39500,0.19735704362392426,0.19735703134536745,2.486575985431671,,
|
| 88 |
+
40000,0.2160172015428543,0.216017192363739,2.467915835380554,,
|
| 89 |
+
40000,,,,2.335146962404251,0.34878605604171753
|
| 90 |
+
40500,0.20623968541622162,0.20623968935012818,2.4776933131217955,,
|
| 91 |
+
41000,0.21017757058143616,0.2101775722503662,2.473755452632904,,
|
| 92 |
+
41500,0.20313598215579987,0.20313598442077638,2.480797035217285,,
|
| 93 |
+
42000,0.20961160957813263,0.20961161422729493,2.4743214087486267,,
|
| 94 |
+
42500,0.20024247467517853,0.20024249172210692,2.4836905217170715,,
|
| 95 |
+
43000,0.21787002682685852,0.21787005281448366,2.466062967300415,,
|
| 96 |
+
43500,0.19163763523101807,0.1916376461982727,2.4922953810691832,,
|
| 97 |
+
44000,0.20073702931404114,0.20073703861236572,2.4831959767341614,,
|
| 98 |
+
44500,0.2190060168504715,0.21900599670410156,2.4649270324707033,,
|
| 99 |
+
45000,0.18765786290168762,0.187657874584198,2.4962751512527466,,
|
| 100 |
+
45000,,,,2.315196923017502,0.3687360882759094
|
| 101 |
+
45500,0.22351709008216858,0.22351709222793578,2.4604159235954284,,
|
| 102 |
+
46000,0.20633113384246826,0.2063311243057251,2.4776019020080566,,
|
| 103 |
+
46500,0.2301706224679947,0.23017064189910888,2.4537623782157896,,
|
| 104 |
+
47000,0.21686559915542603,0.21686558055877686,2.4670674419403076,,
|
| 105 |
+
47500,0.22620093822479248,0.22620094537734986,2.45773206949234,,
|
| 106 |
+
48000,0.2198602557182312,0.21986025428771971,2.4640727558135986,,
|
| 107 |
+
48500,0.20460699498653412,0.20460699224472045,2.479326027393341,,
|
| 108 |
+
49000,0.2306915670633316,0.23069156932830812,2.453241452693939,,
|
| 109 |
+
49500,0.22506792843341827,0.22506792736053466,2.458865101337433,,
|
| 110 |
+
50000,0.22412747144699097,0.2241274642944336,2.459805559158325,,
|
| 111 |
+
50000,,,,2.364021906852722,0.3199111223220825
|
| 112 |
+
50500,0.2216455042362213,0.22164550828933716,2.4622875051498414,,
|
| 113 |
+
51000,0.21099665760993958,0.21099666213989257,2.472936363697052,,
|
3/ckpt_latest.zip
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:ba31f535f25e87be3e24acab7df712348775e7431eb66e3dac11cede12171ec2
|
| 3 |
+
size 8844016
|
3/config.yaml
ADDED
|
@@ -0,0 +1,58 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
env_id: RBC3D-hard-v0
|
| 2 |
+
env_kwargs: {}
|
| 3 |
+
eval_env_kwargs: {}
|
| 4 |
+
seed: 3
|
| 5 |
+
rl_mode: marl
|
| 6 |
+
total_timesteps: 50000.0
|
| 7 |
+
n_eval_steps: 10
|
| 8 |
+
eval_freq: ${eval:${total_timesteps} // ${n_eval_steps}}
|
| 9 |
+
n_eval_episodes: 1
|
| 10 |
+
continue_training: false
|
| 11 |
+
checkpoint_latest: true
|
| 12 |
+
rl_device: cpu
|
| 13 |
+
eval_callback:
|
| 14 |
+
_target_: fluidgym.integration.sb3.EvalCallback
|
| 15 |
+
eval_freq: ${eval_freq}
|
| 16 |
+
n_eval_episodes: ${n_eval_episodes}
|
| 17 |
+
use_wandb: ${wandb.enable}
|
| 18 |
+
checkpoint_latest: ${checkpoint_latest}
|
| 19 |
+
wandb:
|
| 20 |
+
enable: true
|
| 21 |
+
entity: safe-autonomous-systems
|
| 22 |
+
project: jbecktepe-fluidgym
|
| 23 |
+
algorithm:
|
| 24 |
+
name: PPO
|
| 25 |
+
obj:
|
| 26 |
+
_target_: stable_baselines3.ppo.ppo.PPO
|
| 27 |
+
policy: MlpPolicy
|
| 28 |
+
learning_rate: 0.0003
|
| 29 |
+
n_steps: 2048
|
| 30 |
+
batch_size: 64
|
| 31 |
+
n_epochs: 10
|
| 32 |
+
gamma: 0.99
|
| 33 |
+
gae_lambda: 0.95
|
| 34 |
+
clip_range: 0.2
|
| 35 |
+
clip_range_vf: null
|
| 36 |
+
normalize_advantage: true
|
| 37 |
+
ent_coef: 0.01
|
| 38 |
+
vf_coef: 0.5
|
| 39 |
+
max_grad_norm: 0.5
|
| 40 |
+
use_sde: false
|
| 41 |
+
sde_sample_freq: -1
|
| 42 |
+
rollout_buffer_class: null
|
| 43 |
+
rollout_buffer_kwargs: null
|
| 44 |
+
target_kl: null
|
| 45 |
+
stats_window_size: 100
|
| 46 |
+
tensorboard_log: null
|
| 47 |
+
verbose: 0
|
| 48 |
+
seed: ${seed}
|
| 49 |
+
device: ${rl_device}
|
| 50 |
+
_init_setup_model: true
|
| 51 |
+
cluster: {}
|
| 52 |
+
test_env_id: ${env_id}
|
| 53 |
+
test_env_kwargs: ${env_kwargs}
|
| 54 |
+
test_rl_mode: ${rl_mode}
|
| 55 |
+
n_test_episodes: 10
|
| 56 |
+
deterministic: true
|
| 57 |
+
save_frames: true
|
| 58 |
+
render_3d: true
|
3/hydra.yaml
ADDED
|
@@ -0,0 +1,163 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
hydra:
|
| 2 |
+
run:
|
| 3 |
+
dir: output/training/${rl_mode}/${env_id}/${algorithm.name}/${seed}
|
| 4 |
+
sweep:
|
| 5 |
+
dir: output/training/${rl_mode}/${env_id}/${algorithm.name}/${seed}
|
| 6 |
+
subdir: ''
|
| 7 |
+
launcher:
|
| 8 |
+
_target_: hydra._internal.core_plugins.basic_launcher.BasicLauncher
|
| 9 |
+
sweeper:
|
| 10 |
+
_target_: hydra._internal.core_plugins.basic_sweeper.BasicSweeper
|
| 11 |
+
max_batch_size: null
|
| 12 |
+
params: null
|
| 13 |
+
help:
|
| 14 |
+
app_name: ${hydra.job.name}
|
| 15 |
+
header: '${hydra.help.app_name} is powered by Hydra.
|
| 16 |
+
|
| 17 |
+
'
|
| 18 |
+
footer: 'Powered by Hydra (https://hydra.cc)
|
| 19 |
+
|
| 20 |
+
Use --hydra-help to view Hydra specific help
|
| 21 |
+
|
| 22 |
+
'
|
| 23 |
+
template: '${hydra.help.header}
|
| 24 |
+
|
| 25 |
+
== Configuration groups ==
|
| 26 |
+
|
| 27 |
+
Compose your configuration from those groups (group=option)
|
| 28 |
+
|
| 29 |
+
|
| 30 |
+
$APP_CONFIG_GROUPS
|
| 31 |
+
|
| 32 |
+
|
| 33 |
+
== Config ==
|
| 34 |
+
|
| 35 |
+
Override anything in the config (foo.bar=value)
|
| 36 |
+
|
| 37 |
+
|
| 38 |
+
$CONFIG
|
| 39 |
+
|
| 40 |
+
|
| 41 |
+
${hydra.help.footer}
|
| 42 |
+
|
| 43 |
+
'
|
| 44 |
+
hydra_help:
|
| 45 |
+
template: 'Hydra (${hydra.runtime.version})
|
| 46 |
+
|
| 47 |
+
See https://hydra.cc for more info.
|
| 48 |
+
|
| 49 |
+
|
| 50 |
+
== Flags ==
|
| 51 |
+
|
| 52 |
+
$FLAGS_HELP
|
| 53 |
+
|
| 54 |
+
|
| 55 |
+
== Configuration groups ==
|
| 56 |
+
|
| 57 |
+
Compose your configuration from those groups (For example, append hydra/job_logging=disabled
|
| 58 |
+
to command line)
|
| 59 |
+
|
| 60 |
+
|
| 61 |
+
$HYDRA_CONFIG_GROUPS
|
| 62 |
+
|
| 63 |
+
|
| 64 |
+
Use ''--cfg hydra'' to Show the Hydra config.
|
| 65 |
+
|
| 66 |
+
'
|
| 67 |
+
hydra_help: ???
|
| 68 |
+
hydra_logging:
|
| 69 |
+
version: 1
|
| 70 |
+
formatters:
|
| 71 |
+
simple:
|
| 72 |
+
format: '[%(asctime)s][HYDRA] %(message)s'
|
| 73 |
+
handlers:
|
| 74 |
+
console:
|
| 75 |
+
class: logging.StreamHandler
|
| 76 |
+
formatter: simple
|
| 77 |
+
stream: ext://sys.stdout
|
| 78 |
+
root:
|
| 79 |
+
level: INFO
|
| 80 |
+
handlers:
|
| 81 |
+
- console
|
| 82 |
+
loggers:
|
| 83 |
+
logging_example:
|
| 84 |
+
level: DEBUG
|
| 85 |
+
disable_existing_loggers: false
|
| 86 |
+
job_logging:
|
| 87 |
+
version: 1
|
| 88 |
+
formatters:
|
| 89 |
+
simple:
|
| 90 |
+
format: '[%(asctime)s][%(name)s][%(levelname)s] - %(message)s'
|
| 91 |
+
handlers:
|
| 92 |
+
console:
|
| 93 |
+
class: logging.StreamHandler
|
| 94 |
+
formatter: simple
|
| 95 |
+
stream: ext://sys.stdout
|
| 96 |
+
file:
|
| 97 |
+
class: logging.FileHandler
|
| 98 |
+
formatter: simple
|
| 99 |
+
filename: ${hydra.runtime.output_dir}/${hydra.job.name}.log
|
| 100 |
+
root:
|
| 101 |
+
level: INFO
|
| 102 |
+
handlers:
|
| 103 |
+
- console
|
| 104 |
+
- file
|
| 105 |
+
disable_existing_loggers: false
|
| 106 |
+
env: {}
|
| 107 |
+
mode: MULTIRUN
|
| 108 |
+
searchpath: []
|
| 109 |
+
callbacks: {}
|
| 110 |
+
output_subdir: .
|
| 111 |
+
overrides:
|
| 112 |
+
hydra:
|
| 113 |
+
- hydra.mode=MULTIRUN
|
| 114 |
+
task:
|
| 115 |
+
- algorithm=sb3_ppo
|
| 116 |
+
- env_id=RBC3D-hard-v0
|
| 117 |
+
- rl_mode=marl
|
| 118 |
+
- seed=3
|
| 119 |
+
job:
|
| 120 |
+
name: test_sb3
|
| 121 |
+
chdir: true
|
| 122 |
+
override_dirname: algorithm=sb3_ppo,env_id=RBC3D-hard-v0,rl_mode=marl,seed=3
|
| 123 |
+
id: '0'
|
| 124 |
+
num: 0
|
| 125 |
+
config_name: test_sb3
|
| 126 |
+
env_set: {}
|
| 127 |
+
env_copy: []
|
| 128 |
+
config:
|
| 129 |
+
override_dirname:
|
| 130 |
+
kv_sep: '='
|
| 131 |
+
item_sep: ','
|
| 132 |
+
exclude_keys: []
|
| 133 |
+
runtime:
|
| 134 |
+
version: 1.3.2
|
| 135 |
+
version_base: '1.3'
|
| 136 |
+
cwd: /cephfs/users/becktepe/git_projects/FluidGym
|
| 137 |
+
config_sources:
|
| 138 |
+
- path: hydra.conf
|
| 139 |
+
schema: pkg
|
| 140 |
+
provider: hydra
|
| 141 |
+
- path: /cephfs/users/becktepe/git_projects/FluidGym/runscripts/configs
|
| 142 |
+
schema: file
|
| 143 |
+
provider: main
|
| 144 |
+
- path: hydra_plugins.hydra_colorlog.conf
|
| 145 |
+
schema: pkg
|
| 146 |
+
provider: hydra-colorlog
|
| 147 |
+
- path: ''
|
| 148 |
+
schema: structured
|
| 149 |
+
provider: schema
|
| 150 |
+
output_dir: /cephfs/users/becktepe/git_projects/FluidGym/output/training/marl/RBC3D-hard-v0/PPO/3
|
| 151 |
+
choices:
|
| 152 |
+
cluster: local
|
| 153 |
+
algorithm: sb3_ppo
|
| 154 |
+
hydra/env: default
|
| 155 |
+
hydra/callbacks: null
|
| 156 |
+
hydra/job_logging: default
|
| 157 |
+
hydra/hydra_logging: default
|
| 158 |
+
hydra/hydra_help: default
|
| 159 |
+
hydra/help: default
|
| 160 |
+
hydra/sweeper: basic
|
| 161 |
+
hydra/launcher: basic
|
| 162 |
+
hydra/output: default
|
| 163 |
+
verbose: false
|
3/multirun.yaml
ADDED
|
@@ -0,0 +1,221 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
hydra:
|
| 2 |
+
run:
|
| 3 |
+
dir: output/training/${rl_mode}/${env_id}/${algorithm.name}/${seed}
|
| 4 |
+
sweep:
|
| 5 |
+
dir: output/training/${rl_mode}/${env_id}/${algorithm.name}/${seed}
|
| 6 |
+
subdir: ''
|
| 7 |
+
launcher:
|
| 8 |
+
_target_: hydra._internal.core_plugins.basic_launcher.BasicLauncher
|
| 9 |
+
sweeper:
|
| 10 |
+
_target_: hydra._internal.core_plugins.basic_sweeper.BasicSweeper
|
| 11 |
+
max_batch_size: null
|
| 12 |
+
params: null
|
| 13 |
+
help:
|
| 14 |
+
app_name: ${hydra.job.name}
|
| 15 |
+
header: '${hydra.help.app_name} is powered by Hydra.
|
| 16 |
+
|
| 17 |
+
'
|
| 18 |
+
footer: 'Powered by Hydra (https://hydra.cc)
|
| 19 |
+
|
| 20 |
+
Use --hydra-help to view Hydra specific help
|
| 21 |
+
|
| 22 |
+
'
|
| 23 |
+
template: '${hydra.help.header}
|
| 24 |
+
|
| 25 |
+
== Configuration groups ==
|
| 26 |
+
|
| 27 |
+
Compose your configuration from those groups (group=option)
|
| 28 |
+
|
| 29 |
+
|
| 30 |
+
$APP_CONFIG_GROUPS
|
| 31 |
+
|
| 32 |
+
|
| 33 |
+
== Config ==
|
| 34 |
+
|
| 35 |
+
Override anything in the config (foo.bar=value)
|
| 36 |
+
|
| 37 |
+
|
| 38 |
+
$CONFIG
|
| 39 |
+
|
| 40 |
+
|
| 41 |
+
${hydra.help.footer}
|
| 42 |
+
|
| 43 |
+
'
|
| 44 |
+
hydra_help:
|
| 45 |
+
template: 'Hydra (${hydra.runtime.version})
|
| 46 |
+
|
| 47 |
+
See https://hydra.cc for more info.
|
| 48 |
+
|
| 49 |
+
|
| 50 |
+
== Flags ==
|
| 51 |
+
|
| 52 |
+
$FLAGS_HELP
|
| 53 |
+
|
| 54 |
+
|
| 55 |
+
== Configuration groups ==
|
| 56 |
+
|
| 57 |
+
Compose your configuration from those groups (For example, append hydra/job_logging=disabled
|
| 58 |
+
to command line)
|
| 59 |
+
|
| 60 |
+
|
| 61 |
+
$HYDRA_CONFIG_GROUPS
|
| 62 |
+
|
| 63 |
+
|
| 64 |
+
Use ''--cfg hydra'' to Show the Hydra config.
|
| 65 |
+
|
| 66 |
+
'
|
| 67 |
+
hydra_help: ???
|
| 68 |
+
hydra_logging:
|
| 69 |
+
version: 1
|
| 70 |
+
formatters:
|
| 71 |
+
simple:
|
| 72 |
+
format: '[%(asctime)s][HYDRA] %(message)s'
|
| 73 |
+
handlers:
|
| 74 |
+
console:
|
| 75 |
+
class: logging.StreamHandler
|
| 76 |
+
formatter: simple
|
| 77 |
+
stream: ext://sys.stdout
|
| 78 |
+
root:
|
| 79 |
+
level: INFO
|
| 80 |
+
handlers:
|
| 81 |
+
- console
|
| 82 |
+
loggers:
|
| 83 |
+
logging_example:
|
| 84 |
+
level: DEBUG
|
| 85 |
+
disable_existing_loggers: false
|
| 86 |
+
job_logging:
|
| 87 |
+
version: 1
|
| 88 |
+
formatters:
|
| 89 |
+
simple:
|
| 90 |
+
format: '[%(asctime)s][%(name)s][%(levelname)s] - %(message)s'
|
| 91 |
+
handlers:
|
| 92 |
+
console:
|
| 93 |
+
class: logging.StreamHandler
|
| 94 |
+
formatter: simple
|
| 95 |
+
stream: ext://sys.stdout
|
| 96 |
+
file:
|
| 97 |
+
class: logging.FileHandler
|
| 98 |
+
formatter: simple
|
| 99 |
+
filename: ${hydra.runtime.output_dir}/${hydra.job.name}.log
|
| 100 |
+
root:
|
| 101 |
+
level: INFO
|
| 102 |
+
handlers:
|
| 103 |
+
- console
|
| 104 |
+
- file
|
| 105 |
+
disable_existing_loggers: false
|
| 106 |
+
env: {}
|
| 107 |
+
mode: MULTIRUN
|
| 108 |
+
searchpath: []
|
| 109 |
+
callbacks: {}
|
| 110 |
+
output_subdir: .
|
| 111 |
+
overrides:
|
| 112 |
+
hydra:
|
| 113 |
+
- hydra.mode=MULTIRUN
|
| 114 |
+
task:
|
| 115 |
+
- algorithm=sb3_ppo
|
| 116 |
+
- env_id=RBC3D-hard-v0
|
| 117 |
+
- rl_mode=marl
|
| 118 |
+
- seed=3
|
| 119 |
+
job:
|
| 120 |
+
name: test_sb3
|
| 121 |
+
chdir: true
|
| 122 |
+
override_dirname: algorithm=sb3_ppo,env_id=RBC3D-hard-v0,rl_mode=marl,seed=3
|
| 123 |
+
id: ???
|
| 124 |
+
num: ???
|
| 125 |
+
config_name: test_sb3
|
| 126 |
+
env_set: {}
|
| 127 |
+
env_copy: []
|
| 128 |
+
config:
|
| 129 |
+
override_dirname:
|
| 130 |
+
kv_sep: '='
|
| 131 |
+
item_sep: ','
|
| 132 |
+
exclude_keys: []
|
| 133 |
+
runtime:
|
| 134 |
+
version: 1.3.2
|
| 135 |
+
version_base: '1.3'
|
| 136 |
+
cwd: /cephfs/users/becktepe/git_projects/FluidGym
|
| 137 |
+
config_sources:
|
| 138 |
+
- path: hydra.conf
|
| 139 |
+
schema: pkg
|
| 140 |
+
provider: hydra
|
| 141 |
+
- path: /cephfs/users/becktepe/git_projects/FluidGym/runscripts/configs
|
| 142 |
+
schema: file
|
| 143 |
+
provider: main
|
| 144 |
+
- path: hydra_plugins.hydra_colorlog.conf
|
| 145 |
+
schema: pkg
|
| 146 |
+
provider: hydra-colorlog
|
| 147 |
+
- path: ''
|
| 148 |
+
schema: structured
|
| 149 |
+
provider: schema
|
| 150 |
+
output_dir: ???
|
| 151 |
+
choices:
|
| 152 |
+
cluster: local
|
| 153 |
+
algorithm: sb3_ppo
|
| 154 |
+
hydra/env: default
|
| 155 |
+
hydra/callbacks: null
|
| 156 |
+
hydra/job_logging: default
|
| 157 |
+
hydra/hydra_logging: default
|
| 158 |
+
hydra/hydra_help: default
|
| 159 |
+
hydra/help: default
|
| 160 |
+
hydra/sweeper: basic
|
| 161 |
+
hydra/launcher: basic
|
| 162 |
+
hydra/output: default
|
| 163 |
+
verbose: false
|
| 164 |
+
env_id: RBC3D-hard-v0
|
| 165 |
+
env_kwargs: {}
|
| 166 |
+
eval_env_kwargs: {}
|
| 167 |
+
seed: 3
|
| 168 |
+
rl_mode: marl
|
| 169 |
+
total_timesteps: 50000.0
|
| 170 |
+
n_eval_steps: 10
|
| 171 |
+
eval_freq: ${eval:${total_timesteps} // ${n_eval_steps}}
|
| 172 |
+
n_eval_episodes: 1
|
| 173 |
+
continue_training: false
|
| 174 |
+
checkpoint_latest: true
|
| 175 |
+
rl_device: cpu
|
| 176 |
+
eval_callback:
|
| 177 |
+
_target_: fluidgym.integration.sb3.EvalCallback
|
| 178 |
+
eval_freq: ${eval_freq}
|
| 179 |
+
n_eval_episodes: ${n_eval_episodes}
|
| 180 |
+
use_wandb: ${wandb.enable}
|
| 181 |
+
checkpoint_latest: ${checkpoint_latest}
|
| 182 |
+
wandb:
|
| 183 |
+
enable: true
|
| 184 |
+
entity: safe-autonomous-systems
|
| 185 |
+
project: jbecktepe-fluidgym
|
| 186 |
+
algorithm:
|
| 187 |
+
name: PPO
|
| 188 |
+
obj:
|
| 189 |
+
_target_: stable_baselines3.ppo.ppo.PPO
|
| 190 |
+
policy: MlpPolicy
|
| 191 |
+
learning_rate: 0.0003
|
| 192 |
+
n_steps: 2048
|
| 193 |
+
batch_size: 64
|
| 194 |
+
n_epochs: 10
|
| 195 |
+
gamma: 0.99
|
| 196 |
+
gae_lambda: 0.95
|
| 197 |
+
clip_range: 0.2
|
| 198 |
+
clip_range_vf: null
|
| 199 |
+
normalize_advantage: true
|
| 200 |
+
ent_coef: 0.01
|
| 201 |
+
vf_coef: 0.5
|
| 202 |
+
max_grad_norm: 0.5
|
| 203 |
+
use_sde: false
|
| 204 |
+
sde_sample_freq: -1
|
| 205 |
+
rollout_buffer_class: null
|
| 206 |
+
rollout_buffer_kwargs: null
|
| 207 |
+
target_kl: null
|
| 208 |
+
stats_window_size: 100
|
| 209 |
+
tensorboard_log: null
|
| 210 |
+
verbose: 0
|
| 211 |
+
seed: ${seed}
|
| 212 |
+
device: ${rl_device}
|
| 213 |
+
_init_setup_model: true
|
| 214 |
+
cluster: {}
|
| 215 |
+
test_env_id: ${env_id}
|
| 216 |
+
test_env_kwargs: ${env_kwargs}
|
| 217 |
+
test_rl_mode: ${rl_mode}
|
| 218 |
+
n_test_episodes: 10
|
| 219 |
+
deterministic: true
|
| 220 |
+
save_frames: true
|
| 221 |
+
render_3d: true
|
3/overrides.yaml
ADDED
|
@@ -0,0 +1,4 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
- algorithm=sb3_ppo
|
| 2 |
+
- env_id=RBC3D-hard-v0
|
| 3 |
+
- rl_mode=marl
|
| 4 |
+
- seed=3
|
3/test/3d_temperature_test_eval_episode_0.gif
ADDED
|
Git LFS Details
|
3/test/test_eval_episode_0.csv
ADDED
|
The diff for this file is too large to render.
See raw diff
|
|
|
3/test/x-y-temperature_test_eval_episode_0.gif
ADDED
|
Git LFS Details
|
3/test/x-z-temperature_test_eval_episode_0.gif
ADDED
|
Git LFS Details
|
3/test/y-z-temperature_test_eval_episode_0.gif
ADDED
|
Git LFS Details
|
3/training_log.csv
ADDED
|
@@ -0,0 +1,113 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
step,training/mean_reward,training/mean_global_reward,training/mean_nusselt,evaluation/mean_nusselt,evaluation/mean_reward
|
| 2 |
+
500,-0.09891711175441742,-0.09891710472106933,2.7828501138687134,,
|
| 3 |
+
1000,-0.11167707294225693,-0.11167706871032715,2.795610085964203,,
|
| 4 |
+
1500,-0.09946882724761963,-0.09946881818771362,2.7834018445014954,,
|
| 5 |
+
2000,-0.10062853991985321,-0.1006285343170166,2.7845615482330324,,
|
| 6 |
+
2500,-0.061527904123067856,-0.061527903079986575,2.745460922718048,,
|
| 7 |
+
3000,-0.06606268137693405,-0.06606268262863159,2.7499957075119017,,
|
| 8 |
+
3500,-0.05954999476671219,-0.05955000162124634,2.7434830274581907,,
|
| 9 |
+
4000,-0.05555497854948044,-0.0555549840927124,2.7394880042076113,,
|
| 10 |
+
4500,0.0023939155507832766,0.0023939151763916018,2.6815391001701356,,
|
| 11 |
+
5000,-7.365843339357525e-05,-7.365846633911133e-05,2.6840066733360293,,
|
| 12 |
+
5000,,,,2.5783715426921843,0.10556146502494812
|
| 13 |
+
5500,0.0008393868338316679,0.0008393864631652832,2.683093640804291,,
|
| 14 |
+
6000,-0.008465495891869068,-0.008465495586395264,2.6923985118865965,,
|
| 15 |
+
6500,0.03367268294095993,0.03367268657684326,2.6502603302001955,,
|
| 16 |
+
7000,0.03924187645316124,0.03924187755584717,2.644691149711609,,
|
| 17 |
+
7500,0.04294167086482048,0.04294166994094849,2.6409913530349733,,
|
| 18 |
+
8000,0.036273177713155746,0.03627317810058594,2.6476598501205446,,
|
| 19 |
+
8500,0.07401108741760254,0.07401108598709107,2.6099219312667845,,
|
| 20 |
+
9000,0.07633965462446213,0.07633965444564819,2.607593364715576,,
|
| 21 |
+
9500,0.09850367903709412,0.09850367832183837,2.585429337978363,,
|
| 22 |
+
10000,0.09704853594303131,0.09704854631423951,2.586884476184845,,
|
| 23 |
+
10000,,,,2.4838084244728087,0.200124591588974
|
| 24 |
+
10500,0.11583186686038971,0.11583186864852905,2.56810115480423,,
|
| 25 |
+
11000,0.10295286774635315,0.10295286750793457,2.5809801516532898,,
|
| 26 |
+
11500,0.11649453639984131,0.11649454069137573,2.567438478946686,,
|
| 27 |
+
12000,0.11690977960824966,0.1169097809791565,2.5670232491493223,,
|
| 28 |
+
12500,0.12889903783798218,0.12889904308319092,2.5550339760780334,,
|
| 29 |
+
13000,0.12540902197360992,0.12540903282165528,2.558523998737335,,
|
| 30 |
+
13500,0.12952035665512085,0.1295203619003296,2.5544126563072203,,
|
| 31 |
+
14000,0.13816821575164795,0.13816821908950805,2.545764805316925,,
|
| 32 |
+
14500,0.11913298815488815,0.11913299465179443,2.5648000168800356,,
|
| 33 |
+
15000,0.10662222653627396,0.1066222243309021,2.5773107938766477,,
|
| 34 |
+
15000,,,,2.4391083467006682,0.24482467770576477
|
| 35 |
+
15500,0.11620670557022095,0.11620670652389527,2.5677263140678406,,
|
| 36 |
+
16000,0.10898709297180176,0.10898709011077881,2.5749459319114685,,
|
| 37 |
+
16500,0.11433500796556473,0.11433500957489014,2.569598002433777,,
|
| 38 |
+
17000,0.12699638307094574,0.1269963755607605,2.5569366488456726,,
|
| 39 |
+
17500,0.1446753293275833,0.14467531251907348,2.539257697582245,,
|
| 40 |
+
18000,0.13824604451656342,0.13824604177474975,2.5456869912147524,,
|
| 41 |
+
18500,0.1420973539352417,0.14209736490249633,2.5418356566429137,,
|
| 42 |
+
19000,0.15067099034786224,0.15067098760604858,2.5332620320320127,,
|
| 43 |
+
19500,0.1436053067445755,0.1436053171157837,2.5403277053833007,,
|
| 44 |
+
20000,0.15211673080921173,0.15211671876907348,2.5318163022994997,,
|
| 45 |
+
20000,,,,2.450709583759308,0.23322342336177826
|
| 46 |
+
20500,0.16624878346920013,0.16624877786636352,2.5176842403411865,,
|
| 47 |
+
21000,0.18854767084121704,0.188547664642334,2.4953853616714476,,
|
| 48 |
+
21500,0.19203181564807892,0.1920318284034729,2.4919011945724487,,
|
| 49 |
+
22000,0.16513976454734802,0.1651397547721863,2.5187932596206664,,
|
| 50 |
+
22500,0.16812942922115326,0.1681294322013855,2.5158035764694215,,
|
| 51 |
+
23000,0.19641534984111786,0.1964153428077698,2.4875176720619203,,
|
| 52 |
+
23500,0.18649353086948395,0.1864935417175293,2.497439467906952,,
|
| 53 |
+
24000,0.19292527437210083,0.1929252882003784,2.4910077376365662,,
|
| 54 |
+
24500,0.1816236674785614,0.1816236433982849,2.5023093786239623,,
|
| 55 |
+
25000,0.16704362630844116,0.1670436224937439,2.5168893966674806,,
|
| 56 |
+
25000,,,,2.395929628610611,0.2880033850669861
|
| 57 |
+
25500,0.23327630758285522,0.23327631330490112,2.4506566948890685,,
|
| 58 |
+
26000,0.2154207080602646,0.21542072820663452,2.4685122900009153,,
|
| 59 |
+
26500,0.21192854642868042,0.21192854166030883,2.4720044722557066,,
|
| 60 |
+
27000,0.20999127626419067,0.20999128913879395,2.473941734790802,,
|
| 61 |
+
27500,0.20917782187461853,0.20917780876159667,2.4747552065849305,,
|
| 62 |
+
28000,0.18882322311401367,0.18882323455810546,2.495109778881073,,
|
| 63 |
+
28500,0.19372473657131195,0.19372472953796388,2.490208284854889,,
|
| 64 |
+
29000,0.2108186036348343,0.21081860113143921,2.473114411830902,,
|
| 65 |
+
29500,0.20430395007133484,0.20430395030975343,2.4796290740966795,,
|
| 66 |
+
30000,0.1950298547744751,0.19502984809875487,2.4889031624794007,,
|
| 67 |
+
30000,,,,2.38793460726738,0.29599839448928833
|
| 68 |
+
30500,0.22502166032791138,0.22502168512344362,2.458911340236664,,
|
| 69 |
+
31000,0.20458984375,0.20458983850479126,2.479343176841736,,
|
| 70 |
+
31500,0.2069457620382309,0.20694575357437134,2.4769872674942017,,
|
| 71 |
+
32000,0.20202268660068512,0.2020227084159851,2.4819103121757506,,
|
| 72 |
+
32500,0.22310367226600647,0.22310365438461305,2.460829359531403,,
|
| 73 |
+
33000,0.22981679439544678,0.2298167986869812,2.454116222858429,,
|
| 74 |
+
33500,0.20290018618106842,0.20290019702911377,2.4810328259468077,,
|
| 75 |
+
34000,0.2062346339225769,0.206234637260437,2.477698389053345,,
|
| 76 |
+
34500,0.23413966596126556,0.234139666557312,2.449793354511261,,
|
| 77 |
+
35000,0.22518916428089142,0.2251891598701477,2.4587438702583313,,
|
| 78 |
+
35000,,,,2.3405652976036073,0.34336769580841064
|
| 79 |
+
35500,0.22377637028694153,0.22377637100219727,2.4601566586494448,,
|
| 80 |
+
36000,0.23810531198978424,0.23810530424118043,2.4458277153968813,,
|
| 81 |
+
36500,0.22875234484672546,0.22875235891342163,2.455180656909943,,
|
| 82 |
+
37000,0.22764217853546143,0.22764219093322755,2.4562908101081846,,
|
| 83 |
+
37500,0.21719835698604584,0.21719837856292726,2.466734628677368,,
|
| 84 |
+
38000,0.19750618934631348,0.19750620651245118,2.4864268193244934,,
|
| 85 |
+
38500,0.22053012251853943,0.22053012132644653,2.4634029116630556,,
|
| 86 |
+
39000,0.22359926998615265,0.22359929656982422,2.460333724975586,,
|
| 87 |
+
39500,0.23657433688640594,0.23657435846328737,2.4473586540222168,,
|
| 88 |
+
40000,0.20637521147727966,0.20637521266937256,2.477557804107666,,
|
| 89 |
+
40000,,,,2.3699842357635497,0.31394875049591064
|
| 90 |
+
40500,0.22578999400138855,0.22579001426696776,2.4581430106163027,,
|
| 91 |
+
41000,0.20213009417057037,0.20213009786605834,2.4818029208183288,,
|
| 92 |
+
41500,0.222834974527359,0.22283495903015138,2.4610980582237243,,
|
| 93 |
+
42000,0.214809849858284,0.21480985116958617,2.46912316942215,,
|
| 94 |
+
42500,0.20192191004753113,0.20192190837860108,2.4820111145973205,,
|
| 95 |
+
43000,0.18683753907680511,0.1868375382423401,2.497095480918884,,
|
| 96 |
+
43500,0.23042967915534973,0.23042965745925903,2.453503354549408,,
|
| 97 |
+
44000,0.21709732711315155,0.21709729719161988,2.4668357152938842,,
|
| 98 |
+
44500,0.2244701385498047,0.22447013664245605,2.459462878704071,,
|
| 99 |
+
45000,0.21839791536331177,0.2183979172706604,2.465535108566284,,
|
| 100 |
+
45000,,,,2.36728297829628,0.31665003299713135
|
| 101 |
+
45500,0.21026742458343506,0.2102674479484558,2.473665577411652,,
|
| 102 |
+
46000,0.2203454226255417,0.22034544086456298,2.463587579727173,,
|
| 103 |
+
46500,0.2295851856470108,0.2295851788520813,2.4543478422164915,,
|
| 104 |
+
47000,0.23154929280281067,0.23154930305480956,2.4523837060928346,,
|
| 105 |
+
47500,0.21177606284618378,0.21177606201171875,2.4721569662094116,,
|
| 106 |
+
48000,0.20393964648246765,0.20393967151641845,2.4799933428764342,,
|
| 107 |
+
48500,0.23248827457427979,0.23248827171325684,2.451444736480713,,
|
| 108 |
+
49000,0.22605499625205994,0.22605501747131349,2.4578780026435854,,
|
| 109 |
+
49500,0.24113361537456512,0.24113362884521483,2.4427993798255923,,
|
| 110 |
+
50000,0.2199091911315918,0.2199091944694519,2.4640238270759585,,
|
| 111 |
+
50000,,,,2.3439831459522247,0.3399498462677002
|
| 112 |
+
50500,0.23813430964946747,0.23813428592681884,2.445798729419708,,
|
| 113 |
+
51000,0.22703494131565094,0.2270349555015564,2.456898073673248,,
|
4/ckpt_latest.zip
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:43add9802b19a3a387c872bd4f66605ca1189177175dfe7d7adffb15b7bc9a7f
|
| 3 |
+
size 8844012
|
4/config.yaml
ADDED
|
@@ -0,0 +1,58 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
env_id: RBC3D-hard-v0
|
| 2 |
+
env_kwargs: {}
|
| 3 |
+
eval_env_kwargs: {}
|
| 4 |
+
seed: 4
|
| 5 |
+
rl_mode: marl
|
| 6 |
+
total_timesteps: 50000.0
|
| 7 |
+
n_eval_steps: 10
|
| 8 |
+
eval_freq: ${eval:${total_timesteps} // ${n_eval_steps}}
|
| 9 |
+
n_eval_episodes: 1
|
| 10 |
+
continue_training: false
|
| 11 |
+
checkpoint_latest: true
|
| 12 |
+
rl_device: cpu
|
| 13 |
+
eval_callback:
|
| 14 |
+
_target_: fluidgym.integration.sb3.EvalCallback
|
| 15 |
+
eval_freq: ${eval_freq}
|
| 16 |
+
n_eval_episodes: ${n_eval_episodes}
|
| 17 |
+
use_wandb: ${wandb.enable}
|
| 18 |
+
checkpoint_latest: ${checkpoint_latest}
|
| 19 |
+
wandb:
|
| 20 |
+
enable: true
|
| 21 |
+
entity: safe-autonomous-systems
|
| 22 |
+
project: jbecktepe-fluidgym
|
| 23 |
+
algorithm:
|
| 24 |
+
name: PPO
|
| 25 |
+
obj:
|
| 26 |
+
_target_: stable_baselines3.ppo.ppo.PPO
|
| 27 |
+
policy: MlpPolicy
|
| 28 |
+
learning_rate: 0.0003
|
| 29 |
+
n_steps: 2048
|
| 30 |
+
batch_size: 64
|
| 31 |
+
n_epochs: 10
|
| 32 |
+
gamma: 0.99
|
| 33 |
+
gae_lambda: 0.95
|
| 34 |
+
clip_range: 0.2
|
| 35 |
+
clip_range_vf: null
|
| 36 |
+
normalize_advantage: true
|
| 37 |
+
ent_coef: 0.01
|
| 38 |
+
vf_coef: 0.5
|
| 39 |
+
max_grad_norm: 0.5
|
| 40 |
+
use_sde: false
|
| 41 |
+
sde_sample_freq: -1
|
| 42 |
+
rollout_buffer_class: null
|
| 43 |
+
rollout_buffer_kwargs: null
|
| 44 |
+
target_kl: null
|
| 45 |
+
stats_window_size: 100
|
| 46 |
+
tensorboard_log: null
|
| 47 |
+
verbose: 0
|
| 48 |
+
seed: ${seed}
|
| 49 |
+
device: ${rl_device}
|
| 50 |
+
_init_setup_model: true
|
| 51 |
+
cluster: {}
|
| 52 |
+
test_env_id: ${env_id}
|
| 53 |
+
test_env_kwargs: ${env_kwargs}
|
| 54 |
+
test_rl_mode: ${rl_mode}
|
| 55 |
+
n_test_episodes: 10
|
| 56 |
+
deterministic: true
|
| 57 |
+
save_frames: true
|
| 58 |
+
render_3d: true
|
4/hydra.yaml
ADDED
|
@@ -0,0 +1,163 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
hydra:
|
| 2 |
+
run:
|
| 3 |
+
dir: output/training/${rl_mode}/${env_id}/${algorithm.name}/${seed}
|
| 4 |
+
sweep:
|
| 5 |
+
dir: output/training/${rl_mode}/${env_id}/${algorithm.name}/${seed}
|
| 6 |
+
subdir: ''
|
| 7 |
+
launcher:
|
| 8 |
+
_target_: hydra._internal.core_plugins.basic_launcher.BasicLauncher
|
| 9 |
+
sweeper:
|
| 10 |
+
_target_: hydra._internal.core_plugins.basic_sweeper.BasicSweeper
|
| 11 |
+
max_batch_size: null
|
| 12 |
+
params: null
|
| 13 |
+
help:
|
| 14 |
+
app_name: ${hydra.job.name}
|
| 15 |
+
header: '${hydra.help.app_name} is powered by Hydra.
|
| 16 |
+
|
| 17 |
+
'
|
| 18 |
+
footer: 'Powered by Hydra (https://hydra.cc)
|
| 19 |
+
|
| 20 |
+
Use --hydra-help to view Hydra specific help
|
| 21 |
+
|
| 22 |
+
'
|
| 23 |
+
template: '${hydra.help.header}
|
| 24 |
+
|
| 25 |
+
== Configuration groups ==
|
| 26 |
+
|
| 27 |
+
Compose your configuration from those groups (group=option)
|
| 28 |
+
|
| 29 |
+
|
| 30 |
+
$APP_CONFIG_GROUPS
|
| 31 |
+
|
| 32 |
+
|
| 33 |
+
== Config ==
|
| 34 |
+
|
| 35 |
+
Override anything in the config (foo.bar=value)
|
| 36 |
+
|
| 37 |
+
|
| 38 |
+
$CONFIG
|
| 39 |
+
|
| 40 |
+
|
| 41 |
+
${hydra.help.footer}
|
| 42 |
+
|
| 43 |
+
'
|
| 44 |
+
hydra_help:
|
| 45 |
+
template: 'Hydra (${hydra.runtime.version})
|
| 46 |
+
|
| 47 |
+
See https://hydra.cc for more info.
|
| 48 |
+
|
| 49 |
+
|
| 50 |
+
== Flags ==
|
| 51 |
+
|
| 52 |
+
$FLAGS_HELP
|
| 53 |
+
|
| 54 |
+
|
| 55 |
+
== Configuration groups ==
|
| 56 |
+
|
| 57 |
+
Compose your configuration from those groups (For example, append hydra/job_logging=disabled
|
| 58 |
+
to command line)
|
| 59 |
+
|
| 60 |
+
|
| 61 |
+
$HYDRA_CONFIG_GROUPS
|
| 62 |
+
|
| 63 |
+
|
| 64 |
+
Use ''--cfg hydra'' to Show the Hydra config.
|
| 65 |
+
|
| 66 |
+
'
|
| 67 |
+
hydra_help: ???
|
| 68 |
+
hydra_logging:
|
| 69 |
+
version: 1
|
| 70 |
+
formatters:
|
| 71 |
+
simple:
|
| 72 |
+
format: '[%(asctime)s][HYDRA] %(message)s'
|
| 73 |
+
handlers:
|
| 74 |
+
console:
|
| 75 |
+
class: logging.StreamHandler
|
| 76 |
+
formatter: simple
|
| 77 |
+
stream: ext://sys.stdout
|
| 78 |
+
root:
|
| 79 |
+
level: INFO
|
| 80 |
+
handlers:
|
| 81 |
+
- console
|
| 82 |
+
loggers:
|
| 83 |
+
logging_example:
|
| 84 |
+
level: DEBUG
|
| 85 |
+
disable_existing_loggers: false
|
| 86 |
+
job_logging:
|
| 87 |
+
version: 1
|
| 88 |
+
formatters:
|
| 89 |
+
simple:
|
| 90 |
+
format: '[%(asctime)s][%(name)s][%(levelname)s] - %(message)s'
|
| 91 |
+
handlers:
|
| 92 |
+
console:
|
| 93 |
+
class: logging.StreamHandler
|
| 94 |
+
formatter: simple
|
| 95 |
+
stream: ext://sys.stdout
|
| 96 |
+
file:
|
| 97 |
+
class: logging.FileHandler
|
| 98 |
+
formatter: simple
|
| 99 |
+
filename: ${hydra.runtime.output_dir}/${hydra.job.name}.log
|
| 100 |
+
root:
|
| 101 |
+
level: INFO
|
| 102 |
+
handlers:
|
| 103 |
+
- console
|
| 104 |
+
- file
|
| 105 |
+
disable_existing_loggers: false
|
| 106 |
+
env: {}
|
| 107 |
+
mode: MULTIRUN
|
| 108 |
+
searchpath: []
|
| 109 |
+
callbacks: {}
|
| 110 |
+
output_subdir: .
|
| 111 |
+
overrides:
|
| 112 |
+
hydra:
|
| 113 |
+
- hydra.mode=MULTIRUN
|
| 114 |
+
task:
|
| 115 |
+
- algorithm=sb3_ppo
|
| 116 |
+
- env_id=RBC3D-hard-v0
|
| 117 |
+
- rl_mode=marl
|
| 118 |
+
- seed=4
|
| 119 |
+
job:
|
| 120 |
+
name: test_sb3
|
| 121 |
+
chdir: true
|
| 122 |
+
override_dirname: algorithm=sb3_ppo,env_id=RBC3D-hard-v0,rl_mode=marl,seed=4
|
| 123 |
+
id: '0'
|
| 124 |
+
num: 0
|
| 125 |
+
config_name: test_sb3
|
| 126 |
+
env_set: {}
|
| 127 |
+
env_copy: []
|
| 128 |
+
config:
|
| 129 |
+
override_dirname:
|
| 130 |
+
kv_sep: '='
|
| 131 |
+
item_sep: ','
|
| 132 |
+
exclude_keys: []
|
| 133 |
+
runtime:
|
| 134 |
+
version: 1.3.2
|
| 135 |
+
version_base: '1.3'
|
| 136 |
+
cwd: /cephfs/users/becktepe/git_projects/FluidGym
|
| 137 |
+
config_sources:
|
| 138 |
+
- path: hydra.conf
|
| 139 |
+
schema: pkg
|
| 140 |
+
provider: hydra
|
| 141 |
+
- path: /cephfs/users/becktepe/git_projects/FluidGym/runscripts/configs
|
| 142 |
+
schema: file
|
| 143 |
+
provider: main
|
| 144 |
+
- path: hydra_plugins.hydra_colorlog.conf
|
| 145 |
+
schema: pkg
|
| 146 |
+
provider: hydra-colorlog
|
| 147 |
+
- path: ''
|
| 148 |
+
schema: structured
|
| 149 |
+
provider: schema
|
| 150 |
+
output_dir: /cephfs/users/becktepe/git_projects/FluidGym/output/training/marl/RBC3D-hard-v0/PPO/4
|
| 151 |
+
choices:
|
| 152 |
+
cluster: local
|
| 153 |
+
algorithm: sb3_ppo
|
| 154 |
+
hydra/env: default
|
| 155 |
+
hydra/callbacks: null
|
| 156 |
+
hydra/job_logging: default
|
| 157 |
+
hydra/hydra_logging: default
|
| 158 |
+
hydra/hydra_help: default
|
| 159 |
+
hydra/help: default
|
| 160 |
+
hydra/sweeper: basic
|
| 161 |
+
hydra/launcher: basic
|
| 162 |
+
hydra/output: default
|
| 163 |
+
verbose: false
|
4/multirun.yaml
ADDED
|
@@ -0,0 +1,221 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
hydra:
|
| 2 |
+
run:
|
| 3 |
+
dir: output/training/${rl_mode}/${env_id}/${algorithm.name}/${seed}
|
| 4 |
+
sweep:
|
| 5 |
+
dir: output/training/${rl_mode}/${env_id}/${algorithm.name}/${seed}
|
| 6 |
+
subdir: ''
|
| 7 |
+
launcher:
|
| 8 |
+
_target_: hydra._internal.core_plugins.basic_launcher.BasicLauncher
|
| 9 |
+
sweeper:
|
| 10 |
+
_target_: hydra._internal.core_plugins.basic_sweeper.BasicSweeper
|
| 11 |
+
max_batch_size: null
|
| 12 |
+
params: null
|
| 13 |
+
help:
|
| 14 |
+
app_name: ${hydra.job.name}
|
| 15 |
+
header: '${hydra.help.app_name} is powered by Hydra.
|
| 16 |
+
|
| 17 |
+
'
|
| 18 |
+
footer: 'Powered by Hydra (https://hydra.cc)
|
| 19 |
+
|
| 20 |
+
Use --hydra-help to view Hydra specific help
|
| 21 |
+
|
| 22 |
+
'
|
| 23 |
+
template: '${hydra.help.header}
|
| 24 |
+
|
| 25 |
+
== Configuration groups ==
|
| 26 |
+
|
| 27 |
+
Compose your configuration from those groups (group=option)
|
| 28 |
+
|
| 29 |
+
|
| 30 |
+
$APP_CONFIG_GROUPS
|
| 31 |
+
|
| 32 |
+
|
| 33 |
+
== Config ==
|
| 34 |
+
|
| 35 |
+
Override anything in the config (foo.bar=value)
|
| 36 |
+
|
| 37 |
+
|
| 38 |
+
$CONFIG
|
| 39 |
+
|
| 40 |
+
|
| 41 |
+
${hydra.help.footer}
|
| 42 |
+
|
| 43 |
+
'
|
| 44 |
+
hydra_help:
|
| 45 |
+
template: 'Hydra (${hydra.runtime.version})
|
| 46 |
+
|
| 47 |
+
See https://hydra.cc for more info.
|
| 48 |
+
|
| 49 |
+
|
| 50 |
+
== Flags ==
|
| 51 |
+
|
| 52 |
+
$FLAGS_HELP
|
| 53 |
+
|
| 54 |
+
|
| 55 |
+
== Configuration groups ==
|
| 56 |
+
|
| 57 |
+
Compose your configuration from those groups (For example, append hydra/job_logging=disabled
|
| 58 |
+
to command line)
|
| 59 |
+
|
| 60 |
+
|
| 61 |
+
$HYDRA_CONFIG_GROUPS
|
| 62 |
+
|
| 63 |
+
|
| 64 |
+
Use ''--cfg hydra'' to Show the Hydra config.
|
| 65 |
+
|
| 66 |
+
'
|
| 67 |
+
hydra_help: ???
|
| 68 |
+
hydra_logging:
|
| 69 |
+
version: 1
|
| 70 |
+
formatters:
|
| 71 |
+
simple:
|
| 72 |
+
format: '[%(asctime)s][HYDRA] %(message)s'
|
| 73 |
+
handlers:
|
| 74 |
+
console:
|
| 75 |
+
class: logging.StreamHandler
|
| 76 |
+
formatter: simple
|
| 77 |
+
stream: ext://sys.stdout
|
| 78 |
+
root:
|
| 79 |
+
level: INFO
|
| 80 |
+
handlers:
|
| 81 |
+
- console
|
| 82 |
+
loggers:
|
| 83 |
+
logging_example:
|
| 84 |
+
level: DEBUG
|
| 85 |
+
disable_existing_loggers: false
|
| 86 |
+
job_logging:
|
| 87 |
+
version: 1
|
| 88 |
+
formatters:
|
| 89 |
+
simple:
|
| 90 |
+
format: '[%(asctime)s][%(name)s][%(levelname)s] - %(message)s'
|
| 91 |
+
handlers:
|
| 92 |
+
console:
|
| 93 |
+
class: logging.StreamHandler
|
| 94 |
+
formatter: simple
|
| 95 |
+
stream: ext://sys.stdout
|
| 96 |
+
file:
|
| 97 |
+
class: logging.FileHandler
|
| 98 |
+
formatter: simple
|
| 99 |
+
filename: ${hydra.runtime.output_dir}/${hydra.job.name}.log
|
| 100 |
+
root:
|
| 101 |
+
level: INFO
|
| 102 |
+
handlers:
|
| 103 |
+
- console
|
| 104 |
+
- file
|
| 105 |
+
disable_existing_loggers: false
|
| 106 |
+
env: {}
|
| 107 |
+
mode: MULTIRUN
|
| 108 |
+
searchpath: []
|
| 109 |
+
callbacks: {}
|
| 110 |
+
output_subdir: .
|
| 111 |
+
overrides:
|
| 112 |
+
hydra:
|
| 113 |
+
- hydra.mode=MULTIRUN
|
| 114 |
+
task:
|
| 115 |
+
- algorithm=sb3_ppo
|
| 116 |
+
- env_id=RBC3D-hard-v0
|
| 117 |
+
- rl_mode=marl
|
| 118 |
+
- seed=4
|
| 119 |
+
job:
|
| 120 |
+
name: test_sb3
|
| 121 |
+
chdir: true
|
| 122 |
+
override_dirname: algorithm=sb3_ppo,env_id=RBC3D-hard-v0,rl_mode=marl,seed=4
|
| 123 |
+
id: ???
|
| 124 |
+
num: ???
|
| 125 |
+
config_name: test_sb3
|
| 126 |
+
env_set: {}
|
| 127 |
+
env_copy: []
|
| 128 |
+
config:
|
| 129 |
+
override_dirname:
|
| 130 |
+
kv_sep: '='
|
| 131 |
+
item_sep: ','
|
| 132 |
+
exclude_keys: []
|
| 133 |
+
runtime:
|
| 134 |
+
version: 1.3.2
|
| 135 |
+
version_base: '1.3'
|
| 136 |
+
cwd: /cephfs/users/becktepe/git_projects/FluidGym
|
| 137 |
+
config_sources:
|
| 138 |
+
- path: hydra.conf
|
| 139 |
+
schema: pkg
|
| 140 |
+
provider: hydra
|
| 141 |
+
- path: /cephfs/users/becktepe/git_projects/FluidGym/runscripts/configs
|
| 142 |
+
schema: file
|
| 143 |
+
provider: main
|
| 144 |
+
- path: hydra_plugins.hydra_colorlog.conf
|
| 145 |
+
schema: pkg
|
| 146 |
+
provider: hydra-colorlog
|
| 147 |
+
- path: ''
|
| 148 |
+
schema: structured
|
| 149 |
+
provider: schema
|
| 150 |
+
output_dir: ???
|
| 151 |
+
choices:
|
| 152 |
+
cluster: local
|
| 153 |
+
algorithm: sb3_ppo
|
| 154 |
+
hydra/env: default
|
| 155 |
+
hydra/callbacks: null
|
| 156 |
+
hydra/job_logging: default
|
| 157 |
+
hydra/hydra_logging: default
|
| 158 |
+
hydra/hydra_help: default
|
| 159 |
+
hydra/help: default
|
| 160 |
+
hydra/sweeper: basic
|
| 161 |
+
hydra/launcher: basic
|
| 162 |
+
hydra/output: default
|
| 163 |
+
verbose: false
|
| 164 |
+
env_id: RBC3D-hard-v0
|
| 165 |
+
env_kwargs: {}
|
| 166 |
+
eval_env_kwargs: {}
|
| 167 |
+
seed: 4
|
| 168 |
+
rl_mode: marl
|
| 169 |
+
total_timesteps: 50000.0
|
| 170 |
+
n_eval_steps: 10
|
| 171 |
+
eval_freq: ${eval:${total_timesteps} // ${n_eval_steps}}
|
| 172 |
+
n_eval_episodes: 1
|
| 173 |
+
continue_training: false
|
| 174 |
+
checkpoint_latest: true
|
| 175 |
+
rl_device: cpu
|
| 176 |
+
eval_callback:
|
| 177 |
+
_target_: fluidgym.integration.sb3.EvalCallback
|
| 178 |
+
eval_freq: ${eval_freq}
|
| 179 |
+
n_eval_episodes: ${n_eval_episodes}
|
| 180 |
+
use_wandb: ${wandb.enable}
|
| 181 |
+
checkpoint_latest: ${checkpoint_latest}
|
| 182 |
+
wandb:
|
| 183 |
+
enable: true
|
| 184 |
+
entity: safe-autonomous-systems
|
| 185 |
+
project: jbecktepe-fluidgym
|
| 186 |
+
algorithm:
|
| 187 |
+
name: PPO
|
| 188 |
+
obj:
|
| 189 |
+
_target_: stable_baselines3.ppo.ppo.PPO
|
| 190 |
+
policy: MlpPolicy
|
| 191 |
+
learning_rate: 0.0003
|
| 192 |
+
n_steps: 2048
|
| 193 |
+
batch_size: 64
|
| 194 |
+
n_epochs: 10
|
| 195 |
+
gamma: 0.99
|
| 196 |
+
gae_lambda: 0.95
|
| 197 |
+
clip_range: 0.2
|
| 198 |
+
clip_range_vf: null
|
| 199 |
+
normalize_advantage: true
|
| 200 |
+
ent_coef: 0.01
|
| 201 |
+
vf_coef: 0.5
|
| 202 |
+
max_grad_norm: 0.5
|
| 203 |
+
use_sde: false
|
| 204 |
+
sde_sample_freq: -1
|
| 205 |
+
rollout_buffer_class: null
|
| 206 |
+
rollout_buffer_kwargs: null
|
| 207 |
+
target_kl: null
|
| 208 |
+
stats_window_size: 100
|
| 209 |
+
tensorboard_log: null
|
| 210 |
+
verbose: 0
|
| 211 |
+
seed: ${seed}
|
| 212 |
+
device: ${rl_device}
|
| 213 |
+
_init_setup_model: true
|
| 214 |
+
cluster: {}
|
| 215 |
+
test_env_id: ${env_id}
|
| 216 |
+
test_env_kwargs: ${env_kwargs}
|
| 217 |
+
test_rl_mode: ${rl_mode}
|
| 218 |
+
n_test_episodes: 10
|
| 219 |
+
deterministic: true
|
| 220 |
+
save_frames: true
|
| 221 |
+
render_3d: true
|
4/overrides.yaml
ADDED
|
@@ -0,0 +1,4 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
- algorithm=sb3_ppo
|
| 2 |
+
- env_id=RBC3D-hard-v0
|
| 3 |
+
- rl_mode=marl
|
| 4 |
+
- seed=4
|