Upload results for PPO on RBC3D-medium-v0.
Browse filesThis view is limited to 50 files because it contains too many changes.
See raw diff
- .gitattributes +20 -0
- 0/ckpt_latest.zip +3 -0
- 0/config.yaml +58 -0
- 0/hydra.yaml +163 -0
- 0/multirun.yaml +221 -0
- 0/overrides.yaml +4 -0
- 0/test/3d_temperature_test_eval_episode_0.gif +3 -0
- 0/test/test_eval_episode_0.csv +0 -0
- 0/test/x-y-temperature_test_eval_episode_0.gif +3 -0
- 0/test/x-z-temperature_test_eval_episode_0.gif +3 -0
- 0/test/y-z-temperature_test_eval_episode_0.gif +3 -0
- 0/training_log.csv +113 -0
- 1/ckpt_latest.zip +3 -0
- 1/config.yaml +58 -0
- 1/hydra.yaml +163 -0
- 1/multirun.yaml +221 -0
- 1/overrides.yaml +4 -0
- 1/test/3d_temperature_test_eval_episode_0.gif +3 -0
- 1/test/test_eval_episode_0.csv +0 -0
- 1/test/x-y-temperature_test_eval_episode_0.gif +3 -0
- 1/test/x-z-temperature_test_eval_episode_0.gif +3 -0
- 1/test/y-z-temperature_test_eval_episode_0.gif +3 -0
- 1/training_log.csv +113 -0
- 2/ckpt_latest.zip +3 -0
- 2/config.yaml +58 -0
- 2/hydra.yaml +163 -0
- 2/multirun.yaml +221 -0
- 2/overrides.yaml +4 -0
- 2/test/3d_temperature_test_eval_episode_0.gif +3 -0
- 2/test/test_eval_episode_0.csv +0 -0
- 2/test/x-y-temperature_test_eval_episode_0.gif +3 -0
- 2/test/x-z-temperature_test_eval_episode_0.gif +3 -0
- 2/test/y-z-temperature_test_eval_episode_0.gif +3 -0
- 2/training_log.csv +113 -0
- 3/ckpt_latest.zip +3 -0
- 3/config.yaml +58 -0
- 3/hydra.yaml +163 -0
- 3/multirun.yaml +221 -0
- 3/overrides.yaml +4 -0
- 3/test/3d_temperature_test_eval_episode_0.gif +3 -0
- 3/test/test_eval_episode_0.csv +0 -0
- 3/test/x-y-temperature_test_eval_episode_0.gif +3 -0
- 3/test/x-z-temperature_test_eval_episode_0.gif +3 -0
- 3/test/y-z-temperature_test_eval_episode_0.gif +3 -0
- 3/training_log.csv +113 -0
- 4/ckpt_latest.zip +3 -0
- 4/config.yaml +58 -0
- 4/hydra.yaml +163 -0
- 4/multirun.yaml +221 -0
- 4/overrides.yaml +4 -0
.gitattributes
CHANGED
|
@@ -33,3 +33,23 @@ saved_model/**/* filter=lfs diff=lfs merge=lfs -text
|
|
| 33 |
*.zip filter=lfs diff=lfs merge=lfs -text
|
| 34 |
*.zst filter=lfs diff=lfs merge=lfs -text
|
| 35 |
*tfevents* filter=lfs diff=lfs merge=lfs -text
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 33 |
*.zip filter=lfs diff=lfs merge=lfs -text
|
| 34 |
*.zst filter=lfs diff=lfs merge=lfs -text
|
| 35 |
*tfevents* filter=lfs diff=lfs merge=lfs -text
|
| 36 |
+
0/test/3d_temperature_test_eval_episode_0.gif filter=lfs diff=lfs merge=lfs -text
|
| 37 |
+
0/test/x-y-temperature_test_eval_episode_0.gif filter=lfs diff=lfs merge=lfs -text
|
| 38 |
+
0/test/x-z-temperature_test_eval_episode_0.gif filter=lfs diff=lfs merge=lfs -text
|
| 39 |
+
0/test/y-z-temperature_test_eval_episode_0.gif filter=lfs diff=lfs merge=lfs -text
|
| 40 |
+
1/test/3d_temperature_test_eval_episode_0.gif filter=lfs diff=lfs merge=lfs -text
|
| 41 |
+
1/test/x-y-temperature_test_eval_episode_0.gif filter=lfs diff=lfs merge=lfs -text
|
| 42 |
+
1/test/x-z-temperature_test_eval_episode_0.gif filter=lfs diff=lfs merge=lfs -text
|
| 43 |
+
1/test/y-z-temperature_test_eval_episode_0.gif filter=lfs diff=lfs merge=lfs -text
|
| 44 |
+
2/test/3d_temperature_test_eval_episode_0.gif filter=lfs diff=lfs merge=lfs -text
|
| 45 |
+
2/test/x-y-temperature_test_eval_episode_0.gif filter=lfs diff=lfs merge=lfs -text
|
| 46 |
+
2/test/x-z-temperature_test_eval_episode_0.gif filter=lfs diff=lfs merge=lfs -text
|
| 47 |
+
2/test/y-z-temperature_test_eval_episode_0.gif filter=lfs diff=lfs merge=lfs -text
|
| 48 |
+
3/test/3d_temperature_test_eval_episode_0.gif filter=lfs diff=lfs merge=lfs -text
|
| 49 |
+
3/test/x-y-temperature_test_eval_episode_0.gif filter=lfs diff=lfs merge=lfs -text
|
| 50 |
+
3/test/x-z-temperature_test_eval_episode_0.gif filter=lfs diff=lfs merge=lfs -text
|
| 51 |
+
3/test/y-z-temperature_test_eval_episode_0.gif filter=lfs diff=lfs merge=lfs -text
|
| 52 |
+
4/test/3d_temperature_test_eval_episode_0.gif filter=lfs diff=lfs merge=lfs -text
|
| 53 |
+
4/test/x-y-temperature_test_eval_episode_0.gif filter=lfs diff=lfs merge=lfs -text
|
| 54 |
+
4/test/x-z-temperature_test_eval_episode_0.gif filter=lfs diff=lfs merge=lfs -text
|
| 55 |
+
4/test/y-z-temperature_test_eval_episode_0.gif filter=lfs diff=lfs merge=lfs -text
|
0/ckpt_latest.zip
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:4c8add9ea9ef665357d927755e9752869f9d0c6f4ee38eed5d3361983b61eec1
|
| 3 |
+
size 8844014
|
0/config.yaml
ADDED
|
@@ -0,0 +1,58 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
env_id: RBC3D-medium-v0
|
| 2 |
+
env_kwargs: {}
|
| 3 |
+
eval_env_kwargs: {}
|
| 4 |
+
seed: 0
|
| 5 |
+
rl_mode: marl
|
| 6 |
+
total_timesteps: 50000.0
|
| 7 |
+
n_eval_steps: 10
|
| 8 |
+
eval_freq: ${eval:${total_timesteps} // ${n_eval_steps}}
|
| 9 |
+
n_eval_episodes: 1
|
| 10 |
+
continue_training: false
|
| 11 |
+
checkpoint_latest: true
|
| 12 |
+
rl_device: cpu
|
| 13 |
+
eval_callback:
|
| 14 |
+
_target_: fluidgym.integration.sb3.EvalCallback
|
| 15 |
+
eval_freq: ${eval_freq}
|
| 16 |
+
n_eval_episodes: ${n_eval_episodes}
|
| 17 |
+
use_wandb: ${wandb.enable}
|
| 18 |
+
checkpoint_latest: ${checkpoint_latest}
|
| 19 |
+
wandb:
|
| 20 |
+
enable: true
|
| 21 |
+
entity: safe-autonomous-systems
|
| 22 |
+
project: jbecktepe-fluidgym
|
| 23 |
+
algorithm:
|
| 24 |
+
name: PPO
|
| 25 |
+
obj:
|
| 26 |
+
_target_: stable_baselines3.ppo.ppo.PPO
|
| 27 |
+
policy: MlpPolicy
|
| 28 |
+
learning_rate: 0.0003
|
| 29 |
+
n_steps: 2048
|
| 30 |
+
batch_size: 64
|
| 31 |
+
n_epochs: 10
|
| 32 |
+
gamma: 0.99
|
| 33 |
+
gae_lambda: 0.95
|
| 34 |
+
clip_range: 0.2
|
| 35 |
+
clip_range_vf: null
|
| 36 |
+
normalize_advantage: true
|
| 37 |
+
ent_coef: 0.01
|
| 38 |
+
vf_coef: 0.5
|
| 39 |
+
max_grad_norm: 0.5
|
| 40 |
+
use_sde: false
|
| 41 |
+
sde_sample_freq: -1
|
| 42 |
+
rollout_buffer_class: null
|
| 43 |
+
rollout_buffer_kwargs: null
|
| 44 |
+
target_kl: null
|
| 45 |
+
stats_window_size: 100
|
| 46 |
+
tensorboard_log: null
|
| 47 |
+
verbose: 0
|
| 48 |
+
seed: ${seed}
|
| 49 |
+
device: ${rl_device}
|
| 50 |
+
_init_setup_model: true
|
| 51 |
+
cluster: {}
|
| 52 |
+
test_env_id: ${env_id}
|
| 53 |
+
test_env_kwargs: ${env_kwargs}
|
| 54 |
+
test_rl_mode: ${rl_mode}
|
| 55 |
+
n_test_episodes: 10
|
| 56 |
+
deterministic: true
|
| 57 |
+
save_frames: true
|
| 58 |
+
render_3d: true
|
0/hydra.yaml
ADDED
|
@@ -0,0 +1,163 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
hydra:
|
| 2 |
+
run:
|
| 3 |
+
dir: output/training/${rl_mode}/${env_id}/${algorithm.name}/${seed}
|
| 4 |
+
sweep:
|
| 5 |
+
dir: output/training/${rl_mode}/${env_id}/${algorithm.name}/${seed}
|
| 6 |
+
subdir: ''
|
| 7 |
+
launcher:
|
| 8 |
+
_target_: hydra._internal.core_plugins.basic_launcher.BasicLauncher
|
| 9 |
+
sweeper:
|
| 10 |
+
_target_: hydra._internal.core_plugins.basic_sweeper.BasicSweeper
|
| 11 |
+
max_batch_size: null
|
| 12 |
+
params: null
|
| 13 |
+
help:
|
| 14 |
+
app_name: ${hydra.job.name}
|
| 15 |
+
header: '${hydra.help.app_name} is powered by Hydra.
|
| 16 |
+
|
| 17 |
+
'
|
| 18 |
+
footer: 'Powered by Hydra (https://hydra.cc)
|
| 19 |
+
|
| 20 |
+
Use --hydra-help to view Hydra specific help
|
| 21 |
+
|
| 22 |
+
'
|
| 23 |
+
template: '${hydra.help.header}
|
| 24 |
+
|
| 25 |
+
== Configuration groups ==
|
| 26 |
+
|
| 27 |
+
Compose your configuration from those groups (group=option)
|
| 28 |
+
|
| 29 |
+
|
| 30 |
+
$APP_CONFIG_GROUPS
|
| 31 |
+
|
| 32 |
+
|
| 33 |
+
== Config ==
|
| 34 |
+
|
| 35 |
+
Override anything in the config (foo.bar=value)
|
| 36 |
+
|
| 37 |
+
|
| 38 |
+
$CONFIG
|
| 39 |
+
|
| 40 |
+
|
| 41 |
+
${hydra.help.footer}
|
| 42 |
+
|
| 43 |
+
'
|
| 44 |
+
hydra_help:
|
| 45 |
+
template: 'Hydra (${hydra.runtime.version})
|
| 46 |
+
|
| 47 |
+
See https://hydra.cc for more info.
|
| 48 |
+
|
| 49 |
+
|
| 50 |
+
== Flags ==
|
| 51 |
+
|
| 52 |
+
$FLAGS_HELP
|
| 53 |
+
|
| 54 |
+
|
| 55 |
+
== Configuration groups ==
|
| 56 |
+
|
| 57 |
+
Compose your configuration from those groups (For example, append hydra/job_logging=disabled
|
| 58 |
+
to command line)
|
| 59 |
+
|
| 60 |
+
|
| 61 |
+
$HYDRA_CONFIG_GROUPS
|
| 62 |
+
|
| 63 |
+
|
| 64 |
+
Use ''--cfg hydra'' to Show the Hydra config.
|
| 65 |
+
|
| 66 |
+
'
|
| 67 |
+
hydra_help: ???
|
| 68 |
+
hydra_logging:
|
| 69 |
+
version: 1
|
| 70 |
+
formatters:
|
| 71 |
+
simple:
|
| 72 |
+
format: '[%(asctime)s][HYDRA] %(message)s'
|
| 73 |
+
handlers:
|
| 74 |
+
console:
|
| 75 |
+
class: logging.StreamHandler
|
| 76 |
+
formatter: simple
|
| 77 |
+
stream: ext://sys.stdout
|
| 78 |
+
root:
|
| 79 |
+
level: INFO
|
| 80 |
+
handlers:
|
| 81 |
+
- console
|
| 82 |
+
loggers:
|
| 83 |
+
logging_example:
|
| 84 |
+
level: DEBUG
|
| 85 |
+
disable_existing_loggers: false
|
| 86 |
+
job_logging:
|
| 87 |
+
version: 1
|
| 88 |
+
formatters:
|
| 89 |
+
simple:
|
| 90 |
+
format: '[%(asctime)s][%(name)s][%(levelname)s] - %(message)s'
|
| 91 |
+
handlers:
|
| 92 |
+
console:
|
| 93 |
+
class: logging.StreamHandler
|
| 94 |
+
formatter: simple
|
| 95 |
+
stream: ext://sys.stdout
|
| 96 |
+
file:
|
| 97 |
+
class: logging.FileHandler
|
| 98 |
+
formatter: simple
|
| 99 |
+
filename: ${hydra.runtime.output_dir}/${hydra.job.name}.log
|
| 100 |
+
root:
|
| 101 |
+
level: INFO
|
| 102 |
+
handlers:
|
| 103 |
+
- console
|
| 104 |
+
- file
|
| 105 |
+
disable_existing_loggers: false
|
| 106 |
+
env: {}
|
| 107 |
+
mode: MULTIRUN
|
| 108 |
+
searchpath: []
|
| 109 |
+
callbacks: {}
|
| 110 |
+
output_subdir: .
|
| 111 |
+
overrides:
|
| 112 |
+
hydra:
|
| 113 |
+
- hydra.mode=MULTIRUN
|
| 114 |
+
task:
|
| 115 |
+
- algorithm=sb3_ppo
|
| 116 |
+
- env_id=RBC3D-medium-v0
|
| 117 |
+
- rl_mode=marl
|
| 118 |
+
- seed=0
|
| 119 |
+
job:
|
| 120 |
+
name: test_sb3
|
| 121 |
+
chdir: true
|
| 122 |
+
override_dirname: algorithm=sb3_ppo,env_id=RBC3D-medium-v0,rl_mode=marl,seed=0
|
| 123 |
+
id: '0'
|
| 124 |
+
num: 0
|
| 125 |
+
config_name: test_sb3
|
| 126 |
+
env_set: {}
|
| 127 |
+
env_copy: []
|
| 128 |
+
config:
|
| 129 |
+
override_dirname:
|
| 130 |
+
kv_sep: '='
|
| 131 |
+
item_sep: ','
|
| 132 |
+
exclude_keys: []
|
| 133 |
+
runtime:
|
| 134 |
+
version: 1.3.2
|
| 135 |
+
version_base: '1.3'
|
| 136 |
+
cwd: /cephfs/users/becktepe/git_projects/FluidGym
|
| 137 |
+
config_sources:
|
| 138 |
+
- path: hydra.conf
|
| 139 |
+
schema: pkg
|
| 140 |
+
provider: hydra
|
| 141 |
+
- path: /cephfs/users/becktepe/git_projects/FluidGym/runscripts/configs
|
| 142 |
+
schema: file
|
| 143 |
+
provider: main
|
| 144 |
+
- path: hydra_plugins.hydra_colorlog.conf
|
| 145 |
+
schema: pkg
|
| 146 |
+
provider: hydra-colorlog
|
| 147 |
+
- path: ''
|
| 148 |
+
schema: structured
|
| 149 |
+
provider: schema
|
| 150 |
+
output_dir: /cephfs/users/becktepe/git_projects/FluidGym/output/training/marl/RBC3D-medium-v0/PPO/0
|
| 151 |
+
choices:
|
| 152 |
+
cluster: local
|
| 153 |
+
algorithm: sb3_ppo
|
| 154 |
+
hydra/env: default
|
| 155 |
+
hydra/callbacks: null
|
| 156 |
+
hydra/job_logging: default
|
| 157 |
+
hydra/hydra_logging: default
|
| 158 |
+
hydra/hydra_help: default
|
| 159 |
+
hydra/help: default
|
| 160 |
+
hydra/sweeper: basic
|
| 161 |
+
hydra/launcher: basic
|
| 162 |
+
hydra/output: default
|
| 163 |
+
verbose: false
|
0/multirun.yaml
ADDED
|
@@ -0,0 +1,221 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
hydra:
|
| 2 |
+
run:
|
| 3 |
+
dir: output/training/${rl_mode}/${env_id}/${algorithm.name}/${seed}
|
| 4 |
+
sweep:
|
| 5 |
+
dir: output/training/${rl_mode}/${env_id}/${algorithm.name}/${seed}
|
| 6 |
+
subdir: ''
|
| 7 |
+
launcher:
|
| 8 |
+
_target_: hydra._internal.core_plugins.basic_launcher.BasicLauncher
|
| 9 |
+
sweeper:
|
| 10 |
+
_target_: hydra._internal.core_plugins.basic_sweeper.BasicSweeper
|
| 11 |
+
max_batch_size: null
|
| 12 |
+
params: null
|
| 13 |
+
help:
|
| 14 |
+
app_name: ${hydra.job.name}
|
| 15 |
+
header: '${hydra.help.app_name} is powered by Hydra.
|
| 16 |
+
|
| 17 |
+
'
|
| 18 |
+
footer: 'Powered by Hydra (https://hydra.cc)
|
| 19 |
+
|
| 20 |
+
Use --hydra-help to view Hydra specific help
|
| 21 |
+
|
| 22 |
+
'
|
| 23 |
+
template: '${hydra.help.header}
|
| 24 |
+
|
| 25 |
+
== Configuration groups ==
|
| 26 |
+
|
| 27 |
+
Compose your configuration from those groups (group=option)
|
| 28 |
+
|
| 29 |
+
|
| 30 |
+
$APP_CONFIG_GROUPS
|
| 31 |
+
|
| 32 |
+
|
| 33 |
+
== Config ==
|
| 34 |
+
|
| 35 |
+
Override anything in the config (foo.bar=value)
|
| 36 |
+
|
| 37 |
+
|
| 38 |
+
$CONFIG
|
| 39 |
+
|
| 40 |
+
|
| 41 |
+
${hydra.help.footer}
|
| 42 |
+
|
| 43 |
+
'
|
| 44 |
+
hydra_help:
|
| 45 |
+
template: 'Hydra (${hydra.runtime.version})
|
| 46 |
+
|
| 47 |
+
See https://hydra.cc for more info.
|
| 48 |
+
|
| 49 |
+
|
| 50 |
+
== Flags ==
|
| 51 |
+
|
| 52 |
+
$FLAGS_HELP
|
| 53 |
+
|
| 54 |
+
|
| 55 |
+
== Configuration groups ==
|
| 56 |
+
|
| 57 |
+
Compose your configuration from those groups (For example, append hydra/job_logging=disabled
|
| 58 |
+
to command line)
|
| 59 |
+
|
| 60 |
+
|
| 61 |
+
$HYDRA_CONFIG_GROUPS
|
| 62 |
+
|
| 63 |
+
|
| 64 |
+
Use ''--cfg hydra'' to Show the Hydra config.
|
| 65 |
+
|
| 66 |
+
'
|
| 67 |
+
hydra_help: ???
|
| 68 |
+
hydra_logging:
|
| 69 |
+
version: 1
|
| 70 |
+
formatters:
|
| 71 |
+
simple:
|
| 72 |
+
format: '[%(asctime)s][HYDRA] %(message)s'
|
| 73 |
+
handlers:
|
| 74 |
+
console:
|
| 75 |
+
class: logging.StreamHandler
|
| 76 |
+
formatter: simple
|
| 77 |
+
stream: ext://sys.stdout
|
| 78 |
+
root:
|
| 79 |
+
level: INFO
|
| 80 |
+
handlers:
|
| 81 |
+
- console
|
| 82 |
+
loggers:
|
| 83 |
+
logging_example:
|
| 84 |
+
level: DEBUG
|
| 85 |
+
disable_existing_loggers: false
|
| 86 |
+
job_logging:
|
| 87 |
+
version: 1
|
| 88 |
+
formatters:
|
| 89 |
+
simple:
|
| 90 |
+
format: '[%(asctime)s][%(name)s][%(levelname)s] - %(message)s'
|
| 91 |
+
handlers:
|
| 92 |
+
console:
|
| 93 |
+
class: logging.StreamHandler
|
| 94 |
+
formatter: simple
|
| 95 |
+
stream: ext://sys.stdout
|
| 96 |
+
file:
|
| 97 |
+
class: logging.FileHandler
|
| 98 |
+
formatter: simple
|
| 99 |
+
filename: ${hydra.runtime.output_dir}/${hydra.job.name}.log
|
| 100 |
+
root:
|
| 101 |
+
level: INFO
|
| 102 |
+
handlers:
|
| 103 |
+
- console
|
| 104 |
+
- file
|
| 105 |
+
disable_existing_loggers: false
|
| 106 |
+
env: {}
|
| 107 |
+
mode: MULTIRUN
|
| 108 |
+
searchpath: []
|
| 109 |
+
callbacks: {}
|
| 110 |
+
output_subdir: .
|
| 111 |
+
overrides:
|
| 112 |
+
hydra:
|
| 113 |
+
- hydra.mode=MULTIRUN
|
| 114 |
+
task:
|
| 115 |
+
- algorithm=sb3_ppo
|
| 116 |
+
- env_id=RBC3D-medium-v0
|
| 117 |
+
- rl_mode=marl
|
| 118 |
+
- seed=0
|
| 119 |
+
job:
|
| 120 |
+
name: test_sb3
|
| 121 |
+
chdir: true
|
| 122 |
+
override_dirname: algorithm=sb3_ppo,env_id=RBC3D-medium-v0,rl_mode=marl,seed=0
|
| 123 |
+
id: ???
|
| 124 |
+
num: ???
|
| 125 |
+
config_name: test_sb3
|
| 126 |
+
env_set: {}
|
| 127 |
+
env_copy: []
|
| 128 |
+
config:
|
| 129 |
+
override_dirname:
|
| 130 |
+
kv_sep: '='
|
| 131 |
+
item_sep: ','
|
| 132 |
+
exclude_keys: []
|
| 133 |
+
runtime:
|
| 134 |
+
version: 1.3.2
|
| 135 |
+
version_base: '1.3'
|
| 136 |
+
cwd: /cephfs/users/becktepe/git_projects/FluidGym
|
| 137 |
+
config_sources:
|
| 138 |
+
- path: hydra.conf
|
| 139 |
+
schema: pkg
|
| 140 |
+
provider: hydra
|
| 141 |
+
- path: /cephfs/users/becktepe/git_projects/FluidGym/runscripts/configs
|
| 142 |
+
schema: file
|
| 143 |
+
provider: main
|
| 144 |
+
- path: hydra_plugins.hydra_colorlog.conf
|
| 145 |
+
schema: pkg
|
| 146 |
+
provider: hydra-colorlog
|
| 147 |
+
- path: ''
|
| 148 |
+
schema: structured
|
| 149 |
+
provider: schema
|
| 150 |
+
output_dir: ???
|
| 151 |
+
choices:
|
| 152 |
+
cluster: local
|
| 153 |
+
algorithm: sb3_ppo
|
| 154 |
+
hydra/env: default
|
| 155 |
+
hydra/callbacks: null
|
| 156 |
+
hydra/job_logging: default
|
| 157 |
+
hydra/hydra_logging: default
|
| 158 |
+
hydra/hydra_help: default
|
| 159 |
+
hydra/help: default
|
| 160 |
+
hydra/sweeper: basic
|
| 161 |
+
hydra/launcher: basic
|
| 162 |
+
hydra/output: default
|
| 163 |
+
verbose: false
|
| 164 |
+
env_id: RBC3D-medium-v0
|
| 165 |
+
env_kwargs: {}
|
| 166 |
+
eval_env_kwargs: {}
|
| 167 |
+
seed: 0
|
| 168 |
+
rl_mode: marl
|
| 169 |
+
total_timesteps: 50000.0
|
| 170 |
+
n_eval_steps: 10
|
| 171 |
+
eval_freq: ${eval:${total_timesteps} // ${n_eval_steps}}
|
| 172 |
+
n_eval_episodes: 1
|
| 173 |
+
continue_training: false
|
| 174 |
+
checkpoint_latest: true
|
| 175 |
+
rl_device: cpu
|
| 176 |
+
eval_callback:
|
| 177 |
+
_target_: fluidgym.integration.sb3.EvalCallback
|
| 178 |
+
eval_freq: ${eval_freq}
|
| 179 |
+
n_eval_episodes: ${n_eval_episodes}
|
| 180 |
+
use_wandb: ${wandb.enable}
|
| 181 |
+
checkpoint_latest: ${checkpoint_latest}
|
| 182 |
+
wandb:
|
| 183 |
+
enable: true
|
| 184 |
+
entity: safe-autonomous-systems
|
| 185 |
+
project: jbecktepe-fluidgym
|
| 186 |
+
algorithm:
|
| 187 |
+
name: PPO
|
| 188 |
+
obj:
|
| 189 |
+
_target_: stable_baselines3.ppo.ppo.PPO
|
| 190 |
+
policy: MlpPolicy
|
| 191 |
+
learning_rate: 0.0003
|
| 192 |
+
n_steps: 2048
|
| 193 |
+
batch_size: 64
|
| 194 |
+
n_epochs: 10
|
| 195 |
+
gamma: 0.99
|
| 196 |
+
gae_lambda: 0.95
|
| 197 |
+
clip_range: 0.2
|
| 198 |
+
clip_range_vf: null
|
| 199 |
+
normalize_advantage: true
|
| 200 |
+
ent_coef: 0.01
|
| 201 |
+
vf_coef: 0.5
|
| 202 |
+
max_grad_norm: 0.5
|
| 203 |
+
use_sde: false
|
| 204 |
+
sde_sample_freq: -1
|
| 205 |
+
rollout_buffer_class: null
|
| 206 |
+
rollout_buffer_kwargs: null
|
| 207 |
+
target_kl: null
|
| 208 |
+
stats_window_size: 100
|
| 209 |
+
tensorboard_log: null
|
| 210 |
+
verbose: 0
|
| 211 |
+
seed: ${seed}
|
| 212 |
+
device: ${rl_device}
|
| 213 |
+
_init_setup_model: true
|
| 214 |
+
cluster: {}
|
| 215 |
+
test_env_id: ${env_id}
|
| 216 |
+
test_env_kwargs: ${env_kwargs}
|
| 217 |
+
test_rl_mode: ${rl_mode}
|
| 218 |
+
n_test_episodes: 10
|
| 219 |
+
deterministic: true
|
| 220 |
+
save_frames: true
|
| 221 |
+
render_3d: true
|
0/overrides.yaml
ADDED
|
@@ -0,0 +1,4 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
- algorithm=sb3_ppo
|
| 2 |
+
- env_id=RBC3D-medium-v0
|
| 3 |
+
- rl_mode=marl
|
| 4 |
+
- seed=0
|
0/test/3d_temperature_test_eval_episode_0.gif
ADDED
|
Git LFS Details
|
0/test/test_eval_episode_0.csv
ADDED
|
The diff for this file is too large to render.
See raw diff
|
|
|
0/test/x-y-temperature_test_eval_episode_0.gif
ADDED
|
Git LFS Details
|
0/test/x-z-temperature_test_eval_episode_0.gif
ADDED
|
Git LFS Details
|
0/test/y-z-temperature_test_eval_episode_0.gif
ADDED
|
Git LFS Details
|
0/training_log.csv
ADDED
|
@@ -0,0 +1,113 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
step,training/mean_reward,training/mean_global_reward,training/mean_nusselt,evaluation/mean_nusselt,evaluation/mean_reward
|
| 2 |
+
500,-0.07284899801015854,-0.07284899568557739,2.516992525100708,,
|
| 3 |
+
1000,-0.08247055858373642,-0.0824705605506897,2.526614098072052,,
|
| 4 |
+
1500,-0.081957146525383,-0.08195714282989502,2.5261006712913514,,
|
| 5 |
+
2000,-0.09400798380374908,-0.09400798463821411,2.538151517391205,,
|
| 6 |
+
2500,-0.03117496147751808,-0.031174960136413573,2.47531849193573,,
|
| 7 |
+
3000,-0.040552545338869095,-0.040552542686462405,2.4846960706710814,,
|
| 8 |
+
3500,-0.027283145114779472,-0.0272831449508667,2.471426689147949,,
|
| 9 |
+
4000,-0.02746737375855446,-0.027467374324798583,2.4716108980178833,,
|
| 10 |
+
4500,0.009480989538133144,0.009480987548828125,2.434662547111511,,
|
| 11 |
+
5000,0.01582098938524723,0.01582098913192749,2.4283225474357604,,
|
| 12 |
+
5000,,,,2.2840357506275177,0.1601077914237976
|
| 13 |
+
5500,0.009929155930876732,0.009929156303405762,2.434214381694794,,
|
| 14 |
+
6000,-0.00016683874127920717,-0.0001668386459350586,2.4443103799819945,,
|
| 15 |
+
6500,0.029412414878606796,0.029412415981292725,2.4147311053276064,,
|
| 16 |
+
7000,0.015340999700129032,0.015341001033782959,2.4288025283813477,,
|
| 17 |
+
7500,0.04828393831849098,0.04828394079208374,2.39585959148407,,
|
| 18 |
+
8000,0.027136696502566338,0.027136694431304932,2.417006841659546,,
|
| 19 |
+
8500,0.07230944186449051,0.0723094391822815,2.371834099292755,,
|
| 20 |
+
9000,0.048889052122831345,0.048889055728912355,2.39525447511673,,
|
| 21 |
+
9500,0.05876648798584938,0.05876648855209351,2.3853770394325258,,
|
| 22 |
+
10000,0.05273273587226868,0.05273273324966431,2.3914108033180237,,
|
| 23 |
+
10000,,,,2.2356233417987825,0.20852018892765045
|
| 24 |
+
10500,0.0887230858206749,0.08872308492660523,2.355420449256897,,
|
| 25 |
+
11000,0.08898043632507324,0.08898043489456177,2.3551631011962892,,
|
| 26 |
+
11500,0.08206947147846222,0.08206947517395019,2.3620740489959715,,
|
| 27 |
+
12000,0.0905391201376915,0.09053913021087646,2.3536044063568116,,
|
| 28 |
+
12500,0.10625230520963669,0.10625230598449707,2.337891225337982,,
|
| 29 |
+
13000,0.109677255153656,0.1096772484779358,2.334466288089752,,
|
| 30 |
+
13500,0.11173564195632935,0.11173565101623535,2.332407876491547,,
|
| 31 |
+
14000,0.09036831557750702,0.09036831712722779,2.3537752056121826,,
|
| 32 |
+
14500,0.1243913546204567,0.12439135694503785,2.319752179145813,,
|
| 33 |
+
15000,0.1234671100974083,0.12346712493896485,2.3206764101982116,,
|
| 34 |
+
15000,,,,2.1257523238658904,0.31839120388031006
|
| 35 |
+
15500,0.12805908918380737,0.12805908918380737,2.3160844388008117,,
|
| 36 |
+
16000,0.13696682453155518,0.1369668369293213,2.307176693916321,,
|
| 37 |
+
16500,0.13080060482025146,0.13080060958862305,2.313342926979065,,
|
| 38 |
+
17000,0.137887105345726,0.1378871202468872,2.306256417751312,,
|
| 39 |
+
17500,0.15704573690891266,0.15704573345184325,2.2870978031158447,,
|
| 40 |
+
18000,0.14428897202014923,0.14428897428512574,2.2998545632362366,,
|
| 41 |
+
18500,0.1392766237258911,0.1392766270637512,2.3048669080734254,,
|
| 42 |
+
19000,0.15581251680850983,0.15581250572204589,2.2883310408592226,,
|
| 43 |
+
19500,0.14729617536067963,0.14729618215560913,2.296847346305847,,
|
| 44 |
+
20000,0.14627820253372192,0.14627820062637328,2.2978653359413146,,
|
| 45 |
+
20000,,,,2.1434880673885344,0.3006554841995239
|
| 46 |
+
20500,0.15487876534461975,0.15487877368927003,2.289264750957489,,
|
| 47 |
+
21000,0.16191016137599945,0.16191016149520873,2.282233376979828,,
|
| 48 |
+
21500,0.16468729078769684,0.1646873049736023,2.2794562277793884,,
|
| 49 |
+
22000,0.16435864567756653,0.16435863161087036,2.2797848925590514,,
|
| 50 |
+
22500,0.1759740263223648,0.1759740309715271,2.268169508457184,,
|
| 51 |
+
23000,0.14877089858055115,0.14877091121673583,2.295372636318207,,
|
| 52 |
+
23500,0.1593804955482483,0.1593805079460144,2.2847630252838136,,
|
| 53 |
+
24000,0.14516723155975342,0.14516724014282226,2.298976301193237,,
|
| 54 |
+
24500,0.1500563621520996,0.15005637502670288,2.2940871591567995,,
|
| 55 |
+
25000,0.14823997020721436,0.14823997020721436,2.2959035658836364,,
|
| 56 |
+
25000,,,,2.130064435005188,0.3140791058540344
|
| 57 |
+
25500,0.15658481419086456,0.1565848045349121,2.2875587220191957,,
|
| 58 |
+
26000,0.1492302566766739,0.1492302703857422,2.2949132595062256,,
|
| 59 |
+
26500,0.17601348459720612,0.17601349353790283,2.268130049228668,,
|
| 60 |
+
27000,0.156053826212883,0.15605384588241578,2.2880896854400636,,
|
| 61 |
+
27500,0.17075638473033905,0.17075635385513305,2.2733871846199034,,
|
| 62 |
+
28000,0.12509135901927948,0.12509135055541992,2.31905219078064,,
|
| 63 |
+
28500,0.15504378080368042,0.15504377365112304,2.289099756717682,,
|
| 64 |
+
29000,0.155385822057724,0.15538580894470214,2.2887577252388,,
|
| 65 |
+
29500,0.17931413650512695,0.17931413507461547,2.264829409122467,,
|
| 66 |
+
30000,0.14405401051044464,0.14405400228500367,2.3000895295143127,,
|
| 67 |
+
30000,,,,2.108922697305679,0.3352208137512207
|
| 68 |
+
30500,0.1728549748659134,0.17285499954223632,2.271288526535034,,
|
| 69 |
+
31000,0.16838832199573517,0.1683883352279663,2.2757551975250245,,
|
| 70 |
+
31500,0.19653981924057007,0.19653982305526732,2.247603726387024,,
|
| 71 |
+
32000,0.16980622708797455,0.1698062391281128,2.2743372921943665,,
|
| 72 |
+
32500,0.1903025507926941,0.19030255270004273,2.253840987205505,,
|
| 73 |
+
33000,0.16106392443180084,0.16106392574310302,2.2830796155929565,,
|
| 74 |
+
33500,0.18171410262584686,0.18171411275863647,2.2624294199943544,,
|
| 75 |
+
34000,0.16792571544647217,0.16792572355270385,2.2762178149223327,,
|
| 76 |
+
34500,0.16000893712043762,0.16000893783569337,2.2841346116065977,,
|
| 77 |
+
35000,0.17219094932079315,0.1721909580230713,2.2719525790214536,,
|
| 78 |
+
35000,,,,2.105157878398895,0.3389856815338135
|
| 79 |
+
35500,0.17283929884433746,0.17283930397033692,2.2713042240142824,,
|
| 80 |
+
36000,0.18398155272006989,0.18398155641555786,2.260161968231201,,
|
| 81 |
+
36500,0.15513131022453308,0.15513133764266968,2.289012189865112,,
|
| 82 |
+
37000,0.16344286501407623,0.16344288635253906,2.280700644016266,,
|
| 83 |
+
37500,0.16775661706924438,0.16775661993026733,2.2763869104385375,,
|
| 84 |
+
38000,0.1437034010887146,0.1437033996582031,2.300440122127533,,
|
| 85 |
+
38500,0.19318921864032745,0.19318924617767333,2.2509542956352235,,
|
| 86 |
+
39000,0.18310870230197906,0.18310872077941895,2.261034816265106,,
|
| 87 |
+
39500,0.19639214873313904,0.19639215898513793,2.2477513699531557,,
|
| 88 |
+
40000,0.1735430210828781,0.17354302501678467,2.2706005129814146,,
|
| 89 |
+
40000,,,,2.1538765203952788,0.2902669906616211
|
| 90 |
+
40500,0.19081838428974152,0.19081839036941528,2.2533251333236692,,
|
| 91 |
+
41000,0.19824714958667755,0.19824715232849122,2.2458963828086853,,
|
| 92 |
+
41500,0.1705096811056137,0.17050966691970826,2.273633864879608,,
|
| 93 |
+
42000,0.19678214192390442,0.196782133102417,2.247361406326294,,
|
| 94 |
+
42500,0.17333373427391052,0.17333374214172365,2.2708097829818725,,
|
| 95 |
+
43000,0.1892850697040558,0.18928504657745363,2.254858489990234,,
|
| 96 |
+
43500,0.19315484166145325,0.19315485191345214,2.250988679885864,,
|
| 97 |
+
44000,0.17756743729114532,0.17756744718551637,2.266576090335846,,
|
| 98 |
+
44500,0.19930996000766754,0.19930998182296752,2.2448335528373717,,
|
| 99 |
+
45000,0.19340313971042633,0.19340316438674926,2.250740375995636,,
|
| 100 |
+
45000,,,,2.1233883452415467,0.3207551836967468
|
| 101 |
+
45500,0.20025090873241425,0.20025090503692627,2.2438926210403443,,
|
| 102 |
+
46000,0.19082942605018616,0.19082943630218505,2.2533141112327577,,
|
| 103 |
+
46500,0.19664253294467926,0.1966425232887268,2.2475010209083557,,
|
| 104 |
+
47000,0.18970148265361786,0.18970146465301513,2.2544420595169066,,
|
| 105 |
+
47500,0.17102493345737457,0.17102494335174562,2.273118592262268,,
|
| 106 |
+
48000,0.2168714851140976,0.21687149810791015,2.2272720403671267,,
|
| 107 |
+
48500,0.21920549869537354,0.21920550203323363,2.224938039779663,,
|
| 108 |
+
49000,0.21964401006698608,0.21964401769638062,2.2244995188713075,,
|
| 109 |
+
49500,0.2057390660047531,0.2057390580177307,2.2384044857025147,,
|
| 110 |
+
50000,0.2132531851530075,0.21325318336486818,2.2308903584480286,,
|
| 111 |
+
50000,,,,2.0895031124353407,0.3546404540538788
|
| 112 |
+
50500,0.19286243617534637,0.19286244964599608,2.251281086444855,,
|
| 113 |
+
51000,0.18694031238555908,0.18694031429290772,2.2572032160758972,,
|
1/ckpt_latest.zip
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:707b865b7e4e1146050ad3954865d9ede61a9856e22847704527e92fc87b6181
|
| 3 |
+
size 8844018
|
1/config.yaml
ADDED
|
@@ -0,0 +1,58 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
env_id: RBC3D-medium-v0
|
| 2 |
+
env_kwargs: {}
|
| 3 |
+
eval_env_kwargs: {}
|
| 4 |
+
seed: 1
|
| 5 |
+
rl_mode: marl
|
| 6 |
+
total_timesteps: 50000.0
|
| 7 |
+
n_eval_steps: 10
|
| 8 |
+
eval_freq: ${eval:${total_timesteps} // ${n_eval_steps}}
|
| 9 |
+
n_eval_episodes: 1
|
| 10 |
+
continue_training: false
|
| 11 |
+
checkpoint_latest: true
|
| 12 |
+
rl_device: cpu
|
| 13 |
+
eval_callback:
|
| 14 |
+
_target_: fluidgym.integration.sb3.EvalCallback
|
| 15 |
+
eval_freq: ${eval_freq}
|
| 16 |
+
n_eval_episodes: ${n_eval_episodes}
|
| 17 |
+
use_wandb: ${wandb.enable}
|
| 18 |
+
checkpoint_latest: ${checkpoint_latest}
|
| 19 |
+
wandb:
|
| 20 |
+
enable: true
|
| 21 |
+
entity: safe-autonomous-systems
|
| 22 |
+
project: jbecktepe-fluidgym
|
| 23 |
+
algorithm:
|
| 24 |
+
name: PPO
|
| 25 |
+
obj:
|
| 26 |
+
_target_: stable_baselines3.ppo.ppo.PPO
|
| 27 |
+
policy: MlpPolicy
|
| 28 |
+
learning_rate: 0.0003
|
| 29 |
+
n_steps: 2048
|
| 30 |
+
batch_size: 64
|
| 31 |
+
n_epochs: 10
|
| 32 |
+
gamma: 0.99
|
| 33 |
+
gae_lambda: 0.95
|
| 34 |
+
clip_range: 0.2
|
| 35 |
+
clip_range_vf: null
|
| 36 |
+
normalize_advantage: true
|
| 37 |
+
ent_coef: 0.01
|
| 38 |
+
vf_coef: 0.5
|
| 39 |
+
max_grad_norm: 0.5
|
| 40 |
+
use_sde: false
|
| 41 |
+
sde_sample_freq: -1
|
| 42 |
+
rollout_buffer_class: null
|
| 43 |
+
rollout_buffer_kwargs: null
|
| 44 |
+
target_kl: null
|
| 45 |
+
stats_window_size: 100
|
| 46 |
+
tensorboard_log: null
|
| 47 |
+
verbose: 0
|
| 48 |
+
seed: ${seed}
|
| 49 |
+
device: ${rl_device}
|
| 50 |
+
_init_setup_model: true
|
| 51 |
+
cluster: {}
|
| 52 |
+
test_env_id: ${env_id}
|
| 53 |
+
test_env_kwargs: ${env_kwargs}
|
| 54 |
+
test_rl_mode: ${rl_mode}
|
| 55 |
+
n_test_episodes: 10
|
| 56 |
+
deterministic: true
|
| 57 |
+
save_frames: true
|
| 58 |
+
render_3d: true
|
1/hydra.yaml
ADDED
|
@@ -0,0 +1,163 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
hydra:
|
| 2 |
+
run:
|
| 3 |
+
dir: output/training/${rl_mode}/${env_id}/${algorithm.name}/${seed}
|
| 4 |
+
sweep:
|
| 5 |
+
dir: output/training/${rl_mode}/${env_id}/${algorithm.name}/${seed}
|
| 6 |
+
subdir: ''
|
| 7 |
+
launcher:
|
| 8 |
+
_target_: hydra._internal.core_plugins.basic_launcher.BasicLauncher
|
| 9 |
+
sweeper:
|
| 10 |
+
_target_: hydra._internal.core_plugins.basic_sweeper.BasicSweeper
|
| 11 |
+
max_batch_size: null
|
| 12 |
+
params: null
|
| 13 |
+
help:
|
| 14 |
+
app_name: ${hydra.job.name}
|
| 15 |
+
header: '${hydra.help.app_name} is powered by Hydra.
|
| 16 |
+
|
| 17 |
+
'
|
| 18 |
+
footer: 'Powered by Hydra (https://hydra.cc)
|
| 19 |
+
|
| 20 |
+
Use --hydra-help to view Hydra specific help
|
| 21 |
+
|
| 22 |
+
'
|
| 23 |
+
template: '${hydra.help.header}
|
| 24 |
+
|
| 25 |
+
== Configuration groups ==
|
| 26 |
+
|
| 27 |
+
Compose your configuration from those groups (group=option)
|
| 28 |
+
|
| 29 |
+
|
| 30 |
+
$APP_CONFIG_GROUPS
|
| 31 |
+
|
| 32 |
+
|
| 33 |
+
== Config ==
|
| 34 |
+
|
| 35 |
+
Override anything in the config (foo.bar=value)
|
| 36 |
+
|
| 37 |
+
|
| 38 |
+
$CONFIG
|
| 39 |
+
|
| 40 |
+
|
| 41 |
+
${hydra.help.footer}
|
| 42 |
+
|
| 43 |
+
'
|
| 44 |
+
hydra_help:
|
| 45 |
+
template: 'Hydra (${hydra.runtime.version})
|
| 46 |
+
|
| 47 |
+
See https://hydra.cc for more info.
|
| 48 |
+
|
| 49 |
+
|
| 50 |
+
== Flags ==
|
| 51 |
+
|
| 52 |
+
$FLAGS_HELP
|
| 53 |
+
|
| 54 |
+
|
| 55 |
+
== Configuration groups ==
|
| 56 |
+
|
| 57 |
+
Compose your configuration from those groups (For example, append hydra/job_logging=disabled
|
| 58 |
+
to command line)
|
| 59 |
+
|
| 60 |
+
|
| 61 |
+
$HYDRA_CONFIG_GROUPS
|
| 62 |
+
|
| 63 |
+
|
| 64 |
+
Use ''--cfg hydra'' to Show the Hydra config.
|
| 65 |
+
|
| 66 |
+
'
|
| 67 |
+
hydra_help: ???
|
| 68 |
+
hydra_logging:
|
| 69 |
+
version: 1
|
| 70 |
+
formatters:
|
| 71 |
+
simple:
|
| 72 |
+
format: '[%(asctime)s][HYDRA] %(message)s'
|
| 73 |
+
handlers:
|
| 74 |
+
console:
|
| 75 |
+
class: logging.StreamHandler
|
| 76 |
+
formatter: simple
|
| 77 |
+
stream: ext://sys.stdout
|
| 78 |
+
root:
|
| 79 |
+
level: INFO
|
| 80 |
+
handlers:
|
| 81 |
+
- console
|
| 82 |
+
loggers:
|
| 83 |
+
logging_example:
|
| 84 |
+
level: DEBUG
|
| 85 |
+
disable_existing_loggers: false
|
| 86 |
+
job_logging:
|
| 87 |
+
version: 1
|
| 88 |
+
formatters:
|
| 89 |
+
simple:
|
| 90 |
+
format: '[%(asctime)s][%(name)s][%(levelname)s] - %(message)s'
|
| 91 |
+
handlers:
|
| 92 |
+
console:
|
| 93 |
+
class: logging.StreamHandler
|
| 94 |
+
formatter: simple
|
| 95 |
+
stream: ext://sys.stdout
|
| 96 |
+
file:
|
| 97 |
+
class: logging.FileHandler
|
| 98 |
+
formatter: simple
|
| 99 |
+
filename: ${hydra.runtime.output_dir}/${hydra.job.name}.log
|
| 100 |
+
root:
|
| 101 |
+
level: INFO
|
| 102 |
+
handlers:
|
| 103 |
+
- console
|
| 104 |
+
- file
|
| 105 |
+
disable_existing_loggers: false
|
| 106 |
+
env: {}
|
| 107 |
+
mode: MULTIRUN
|
| 108 |
+
searchpath: []
|
| 109 |
+
callbacks: {}
|
| 110 |
+
output_subdir: .
|
| 111 |
+
overrides:
|
| 112 |
+
hydra:
|
| 113 |
+
- hydra.mode=MULTIRUN
|
| 114 |
+
task:
|
| 115 |
+
- algorithm=sb3_ppo
|
| 116 |
+
- env_id=RBC3D-medium-v0
|
| 117 |
+
- rl_mode=marl
|
| 118 |
+
- seed=1
|
| 119 |
+
job:
|
| 120 |
+
name: test_sb3
|
| 121 |
+
chdir: true
|
| 122 |
+
override_dirname: algorithm=sb3_ppo,env_id=RBC3D-medium-v0,rl_mode=marl,seed=1
|
| 123 |
+
id: '0'
|
| 124 |
+
num: 0
|
| 125 |
+
config_name: test_sb3
|
| 126 |
+
env_set: {}
|
| 127 |
+
env_copy: []
|
| 128 |
+
config:
|
| 129 |
+
override_dirname:
|
| 130 |
+
kv_sep: '='
|
| 131 |
+
item_sep: ','
|
| 132 |
+
exclude_keys: []
|
| 133 |
+
runtime:
|
| 134 |
+
version: 1.3.2
|
| 135 |
+
version_base: '1.3'
|
| 136 |
+
cwd: /cephfs/users/becktepe/git_projects/FluidGym
|
| 137 |
+
config_sources:
|
| 138 |
+
- path: hydra.conf
|
| 139 |
+
schema: pkg
|
| 140 |
+
provider: hydra
|
| 141 |
+
- path: /cephfs/users/becktepe/git_projects/FluidGym/runscripts/configs
|
| 142 |
+
schema: file
|
| 143 |
+
provider: main
|
| 144 |
+
- path: hydra_plugins.hydra_colorlog.conf
|
| 145 |
+
schema: pkg
|
| 146 |
+
provider: hydra-colorlog
|
| 147 |
+
- path: ''
|
| 148 |
+
schema: structured
|
| 149 |
+
provider: schema
|
| 150 |
+
output_dir: /cephfs/users/becktepe/git_projects/FluidGym/output/training/marl/RBC3D-medium-v0/PPO/1
|
| 151 |
+
choices:
|
| 152 |
+
cluster: local
|
| 153 |
+
algorithm: sb3_ppo
|
| 154 |
+
hydra/env: default
|
| 155 |
+
hydra/callbacks: null
|
| 156 |
+
hydra/job_logging: default
|
| 157 |
+
hydra/hydra_logging: default
|
| 158 |
+
hydra/hydra_help: default
|
| 159 |
+
hydra/help: default
|
| 160 |
+
hydra/sweeper: basic
|
| 161 |
+
hydra/launcher: basic
|
| 162 |
+
hydra/output: default
|
| 163 |
+
verbose: false
|
1/multirun.yaml
ADDED
|
@@ -0,0 +1,221 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
hydra:
|
| 2 |
+
run:
|
| 3 |
+
dir: output/training/${rl_mode}/${env_id}/${algorithm.name}/${seed}
|
| 4 |
+
sweep:
|
| 5 |
+
dir: output/training/${rl_mode}/${env_id}/${algorithm.name}/${seed}
|
| 6 |
+
subdir: ''
|
| 7 |
+
launcher:
|
| 8 |
+
_target_: hydra._internal.core_plugins.basic_launcher.BasicLauncher
|
| 9 |
+
sweeper:
|
| 10 |
+
_target_: hydra._internal.core_plugins.basic_sweeper.BasicSweeper
|
| 11 |
+
max_batch_size: null
|
| 12 |
+
params: null
|
| 13 |
+
help:
|
| 14 |
+
app_name: ${hydra.job.name}
|
| 15 |
+
header: '${hydra.help.app_name} is powered by Hydra.
|
| 16 |
+
|
| 17 |
+
'
|
| 18 |
+
footer: 'Powered by Hydra (https://hydra.cc)
|
| 19 |
+
|
| 20 |
+
Use --hydra-help to view Hydra specific help
|
| 21 |
+
|
| 22 |
+
'
|
| 23 |
+
template: '${hydra.help.header}
|
| 24 |
+
|
| 25 |
+
== Configuration groups ==
|
| 26 |
+
|
| 27 |
+
Compose your configuration from those groups (group=option)
|
| 28 |
+
|
| 29 |
+
|
| 30 |
+
$APP_CONFIG_GROUPS
|
| 31 |
+
|
| 32 |
+
|
| 33 |
+
== Config ==
|
| 34 |
+
|
| 35 |
+
Override anything in the config (foo.bar=value)
|
| 36 |
+
|
| 37 |
+
|
| 38 |
+
$CONFIG
|
| 39 |
+
|
| 40 |
+
|
| 41 |
+
${hydra.help.footer}
|
| 42 |
+
|
| 43 |
+
'
|
| 44 |
+
hydra_help:
|
| 45 |
+
template: 'Hydra (${hydra.runtime.version})
|
| 46 |
+
|
| 47 |
+
See https://hydra.cc for more info.
|
| 48 |
+
|
| 49 |
+
|
| 50 |
+
== Flags ==
|
| 51 |
+
|
| 52 |
+
$FLAGS_HELP
|
| 53 |
+
|
| 54 |
+
|
| 55 |
+
== Configuration groups ==
|
| 56 |
+
|
| 57 |
+
Compose your configuration from those groups (For example, append hydra/job_logging=disabled
|
| 58 |
+
to command line)
|
| 59 |
+
|
| 60 |
+
|
| 61 |
+
$HYDRA_CONFIG_GROUPS
|
| 62 |
+
|
| 63 |
+
|
| 64 |
+
Use ''--cfg hydra'' to Show the Hydra config.
|
| 65 |
+
|
| 66 |
+
'
|
| 67 |
+
hydra_help: ???
|
| 68 |
+
hydra_logging:
|
| 69 |
+
version: 1
|
| 70 |
+
formatters:
|
| 71 |
+
simple:
|
| 72 |
+
format: '[%(asctime)s][HYDRA] %(message)s'
|
| 73 |
+
handlers:
|
| 74 |
+
console:
|
| 75 |
+
class: logging.StreamHandler
|
| 76 |
+
formatter: simple
|
| 77 |
+
stream: ext://sys.stdout
|
| 78 |
+
root:
|
| 79 |
+
level: INFO
|
| 80 |
+
handlers:
|
| 81 |
+
- console
|
| 82 |
+
loggers:
|
| 83 |
+
logging_example:
|
| 84 |
+
level: DEBUG
|
| 85 |
+
disable_existing_loggers: false
|
| 86 |
+
job_logging:
|
| 87 |
+
version: 1
|
| 88 |
+
formatters:
|
| 89 |
+
simple:
|
| 90 |
+
format: '[%(asctime)s][%(name)s][%(levelname)s] - %(message)s'
|
| 91 |
+
handlers:
|
| 92 |
+
console:
|
| 93 |
+
class: logging.StreamHandler
|
| 94 |
+
formatter: simple
|
| 95 |
+
stream: ext://sys.stdout
|
| 96 |
+
file:
|
| 97 |
+
class: logging.FileHandler
|
| 98 |
+
formatter: simple
|
| 99 |
+
filename: ${hydra.runtime.output_dir}/${hydra.job.name}.log
|
| 100 |
+
root:
|
| 101 |
+
level: INFO
|
| 102 |
+
handlers:
|
| 103 |
+
- console
|
| 104 |
+
- file
|
| 105 |
+
disable_existing_loggers: false
|
| 106 |
+
env: {}
|
| 107 |
+
mode: MULTIRUN
|
| 108 |
+
searchpath: []
|
| 109 |
+
callbacks: {}
|
| 110 |
+
output_subdir: .
|
| 111 |
+
overrides:
|
| 112 |
+
hydra:
|
| 113 |
+
- hydra.mode=MULTIRUN
|
| 114 |
+
task:
|
| 115 |
+
- algorithm=sb3_ppo
|
| 116 |
+
- env_id=RBC3D-medium-v0
|
| 117 |
+
- rl_mode=marl
|
| 118 |
+
- seed=1
|
| 119 |
+
job:
|
| 120 |
+
name: test_sb3
|
| 121 |
+
chdir: true
|
| 122 |
+
override_dirname: algorithm=sb3_ppo,env_id=RBC3D-medium-v0,rl_mode=marl,seed=1
|
| 123 |
+
id: ???
|
| 124 |
+
num: ???
|
| 125 |
+
config_name: test_sb3
|
| 126 |
+
env_set: {}
|
| 127 |
+
env_copy: []
|
| 128 |
+
config:
|
| 129 |
+
override_dirname:
|
| 130 |
+
kv_sep: '='
|
| 131 |
+
item_sep: ','
|
| 132 |
+
exclude_keys: []
|
| 133 |
+
runtime:
|
| 134 |
+
version: 1.3.2
|
| 135 |
+
version_base: '1.3'
|
| 136 |
+
cwd: /cephfs/users/becktepe/git_projects/FluidGym
|
| 137 |
+
config_sources:
|
| 138 |
+
- path: hydra.conf
|
| 139 |
+
schema: pkg
|
| 140 |
+
provider: hydra
|
| 141 |
+
- path: /cephfs/users/becktepe/git_projects/FluidGym/runscripts/configs
|
| 142 |
+
schema: file
|
| 143 |
+
provider: main
|
| 144 |
+
- path: hydra_plugins.hydra_colorlog.conf
|
| 145 |
+
schema: pkg
|
| 146 |
+
provider: hydra-colorlog
|
| 147 |
+
- path: ''
|
| 148 |
+
schema: structured
|
| 149 |
+
provider: schema
|
| 150 |
+
output_dir: ???
|
| 151 |
+
choices:
|
| 152 |
+
cluster: local
|
| 153 |
+
algorithm: sb3_ppo
|
| 154 |
+
hydra/env: default
|
| 155 |
+
hydra/callbacks: null
|
| 156 |
+
hydra/job_logging: default
|
| 157 |
+
hydra/hydra_logging: default
|
| 158 |
+
hydra/hydra_help: default
|
| 159 |
+
hydra/help: default
|
| 160 |
+
hydra/sweeper: basic
|
| 161 |
+
hydra/launcher: basic
|
| 162 |
+
hydra/output: default
|
| 163 |
+
verbose: false
|
| 164 |
+
env_id: RBC3D-medium-v0
|
| 165 |
+
env_kwargs: {}
|
| 166 |
+
eval_env_kwargs: {}
|
| 167 |
+
seed: 1
|
| 168 |
+
rl_mode: marl
|
| 169 |
+
total_timesteps: 50000.0
|
| 170 |
+
n_eval_steps: 10
|
| 171 |
+
eval_freq: ${eval:${total_timesteps} // ${n_eval_steps}}
|
| 172 |
+
n_eval_episodes: 1
|
| 173 |
+
continue_training: false
|
| 174 |
+
checkpoint_latest: true
|
| 175 |
+
rl_device: cpu
|
| 176 |
+
eval_callback:
|
| 177 |
+
_target_: fluidgym.integration.sb3.EvalCallback
|
| 178 |
+
eval_freq: ${eval_freq}
|
| 179 |
+
n_eval_episodes: ${n_eval_episodes}
|
| 180 |
+
use_wandb: ${wandb.enable}
|
| 181 |
+
checkpoint_latest: ${checkpoint_latest}
|
| 182 |
+
wandb:
|
| 183 |
+
enable: true
|
| 184 |
+
entity: safe-autonomous-systems
|
| 185 |
+
project: jbecktepe-fluidgym
|
| 186 |
+
algorithm:
|
| 187 |
+
name: PPO
|
| 188 |
+
obj:
|
| 189 |
+
_target_: stable_baselines3.ppo.ppo.PPO
|
| 190 |
+
policy: MlpPolicy
|
| 191 |
+
learning_rate: 0.0003
|
| 192 |
+
n_steps: 2048
|
| 193 |
+
batch_size: 64
|
| 194 |
+
n_epochs: 10
|
| 195 |
+
gamma: 0.99
|
| 196 |
+
gae_lambda: 0.95
|
| 197 |
+
clip_range: 0.2
|
| 198 |
+
clip_range_vf: null
|
| 199 |
+
normalize_advantage: true
|
| 200 |
+
ent_coef: 0.01
|
| 201 |
+
vf_coef: 0.5
|
| 202 |
+
max_grad_norm: 0.5
|
| 203 |
+
use_sde: false
|
| 204 |
+
sde_sample_freq: -1
|
| 205 |
+
rollout_buffer_class: null
|
| 206 |
+
rollout_buffer_kwargs: null
|
| 207 |
+
target_kl: null
|
| 208 |
+
stats_window_size: 100
|
| 209 |
+
tensorboard_log: null
|
| 210 |
+
verbose: 0
|
| 211 |
+
seed: ${seed}
|
| 212 |
+
device: ${rl_device}
|
| 213 |
+
_init_setup_model: true
|
| 214 |
+
cluster: {}
|
| 215 |
+
test_env_id: ${env_id}
|
| 216 |
+
test_env_kwargs: ${env_kwargs}
|
| 217 |
+
test_rl_mode: ${rl_mode}
|
| 218 |
+
n_test_episodes: 10
|
| 219 |
+
deterministic: true
|
| 220 |
+
save_frames: true
|
| 221 |
+
render_3d: true
|
1/overrides.yaml
ADDED
|
@@ -0,0 +1,4 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
- algorithm=sb3_ppo
|
| 2 |
+
- env_id=RBC3D-medium-v0
|
| 3 |
+
- rl_mode=marl
|
| 4 |
+
- seed=1
|
1/test/3d_temperature_test_eval_episode_0.gif
ADDED
|
Git LFS Details
|
1/test/test_eval_episode_0.csv
ADDED
|
The diff for this file is too large to render.
See raw diff
|
|
|
1/test/x-y-temperature_test_eval_episode_0.gif
ADDED
|
Git LFS Details
|
1/test/x-z-temperature_test_eval_episode_0.gif
ADDED
|
Git LFS Details
|
1/test/y-z-temperature_test_eval_episode_0.gif
ADDED
|
Git LFS Details
|
1/training_log.csv
ADDED
|
@@ -0,0 +1,113 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
step,training/mean_reward,training/mean_global_reward,training/mean_nusselt,evaluation/mean_nusselt,evaluation/mean_reward
|
| 2 |
+
500,-0.08366084098815918,-0.08366084432601929,2.5278043789863585,,
|
| 3 |
+
1000,-0.09297764301300049,-0.09297764301300049,2.53712117767334,,
|
| 4 |
+
1500,-0.08641175180673599,-0.08641175746917724,2.530555289745331,,
|
| 5 |
+
2000,-0.0874360054731369,-0.08743599462509155,2.5315795216560364,,
|
| 6 |
+
2500,-0.0405673086643219,-0.04056731128692627,2.484710841178894,,
|
| 7 |
+
3000,-0.021202605217695236,-0.0212026047706604,2.465346137046814,,
|
| 8 |
+
3500,-0.037111878395080566,-0.0371118803024292,2.481255407333374,,
|
| 9 |
+
4000,-0.046849992126226425,-0.046849987983703614,2.490993522167206,,
|
| 10 |
+
4500,-0.0019580242224037647,-0.001958024501800537,2.446101553440094,,
|
| 11 |
+
5000,0.00825823750346899,0.008258237361907958,2.4358853001594545,,
|
| 12 |
+
5000,,,,2.28835297703743,0.1557905673980713
|
| 13 |
+
5500,-0.00027999942540191114,-0.0002799992561340332,2.4444235401153565,,
|
| 14 |
+
6000,0.004405356477946043,0.004405355930328369,2.439738178730011,,
|
| 15 |
+
6500,0.030355848371982574,0.03035584783554077,2.4137876868247985,,
|
| 16 |
+
7000,0.021564261987805367,0.02156426239013672,2.4225792751312256,,
|
| 17 |
+
7500,0.028914358466863632,0.028914360523223877,2.4152291746139527,,
|
| 18 |
+
8000,0.02819138951599598,0.02819138765335083,2.4159521479606627,,
|
| 19 |
+
8500,0.023626087233424187,0.02362608861923218,2.4205174407958983,,
|
| 20 |
+
9000,0.06576478481292725,0.06576479053497314,2.378378733634949,,
|
| 21 |
+
9500,0.054117247462272644,0.05411725330352783,2.3900262799263,,
|
| 22 |
+
10000,0.05904707312583923,0.059047069549560544,2.3850964593887327,,
|
| 23 |
+
10000,,,,2.239135735034943,0.20500779151916504
|
| 24 |
+
10500,0.06512696295976639,0.06512696266174317,2.3790165672302246,,
|
| 25 |
+
11000,0.0724114254117012,0.07241142320632935,2.3717321128845215,,
|
| 26 |
+
11500,0.0745772272348404,0.07457722806930542,2.369566306114197,,
|
| 27 |
+
12000,0.06642086803913116,0.06642086744308472,2.3777226538658143,,
|
| 28 |
+
12500,0.06590814143419266,0.06590813875198365,2.37823540019989,,
|
| 29 |
+
13000,0.09832964837551117,0.09832965278625488,2.3458138847351075,,
|
| 30 |
+
13500,0.10290686041116714,0.10290686988830566,2.3412366628646852,,
|
| 31 |
+
14000,0.08539082854986191,0.08539082431793213,2.3587527213096617,,
|
| 32 |
+
14500,0.07266561686992645,0.07266561651229858,2.3714779143333433,,
|
| 33 |
+
15000,0.08612429350614548,0.08612428760528565,2.358019244670868,,
|
| 34 |
+
15000,,,,2.2292354357242585,0.21490809321403503
|
| 35 |
+
15500,0.10826536267995834,0.10826536083221436,2.335878182411194,,
|
| 36 |
+
16000,0.0939083844423294,0.09390838861465454,2.3502351422309875,,
|
| 37 |
+
16500,0.09960270673036575,0.09960269689559936,2.344540831565857,,
|
| 38 |
+
17000,0.1263253539800644,0.12632535457611083,2.3178181862831115,,
|
| 39 |
+
17500,0.11701292544603348,0.11701291990280151,2.327130614280701,,
|
| 40 |
+
18000,0.11246103048324585,0.11246103191375732,2.331682500362396,,
|
| 41 |
+
18500,0.1060979962348938,0.10609800148010254,2.338045522689819,,
|
| 42 |
+
19000,0.10817639529705048,0.1081763949394226,2.3359671382904055,,
|
| 43 |
+
19500,0.12890228629112244,0.1289022750854492,2.3152412567138674,,
|
| 44 |
+
20000,0.12308061867952347,0.12308062076568603,2.3210629186630247,,
|
| 45 |
+
20000,,,,2.170112668275833,0.274030864238739
|
| 46 |
+
20500,0.10645964741706848,0.1064596529006958,2.3376838750839233,,
|
| 47 |
+
21000,0.11845333874225616,0.1184533338546753,2.3256902017593384,,
|
| 48 |
+
21500,0.15487515926361084,0.15487514352798462,2.289268393993378,,
|
| 49 |
+
22000,0.13464190065860748,0.13464189291000367,2.3095016331672666,,
|
| 50 |
+
22500,0.14186520874500275,0.1418651933670044,2.3022783303260805,,
|
| 51 |
+
23000,0.12954141199588776,0.12954140520095825,2.3146021370887757,,
|
| 52 |
+
23500,0.12115524709224701,0.12115525341033935,2.3229882917404177,,
|
| 53 |
+
24000,0.15144363045692444,0.1514436273574829,2.292699903011322,,
|
| 54 |
+
24500,0.13261589407920837,0.13261588764190674,2.311527645111084,,
|
| 55 |
+
25000,0.1468086689710617,0.14680867624282837,2.2973348531723023,,
|
| 56 |
+
25000,,,,2.1549171948432924,0.28922632336616516
|
| 57 |
+
25500,0.15241017937660217,0.15241017961502076,2.2917333550453187,,
|
| 58 |
+
26000,0.13457338511943817,0.13457337522506713,2.3095701665878297,,
|
| 59 |
+
26500,0.1453704982995987,0.14537049198150634,2.298773047924042,,
|
| 60 |
+
27000,0.1668587625026703,0.16685876941680908,2.2772847628593444,,
|
| 61 |
+
27500,0.1698814481496811,0.16988144636154176,2.2742620787620544,,
|
| 62 |
+
28000,0.1558079570531845,0.15580794954299926,2.2883355894088746,,
|
| 63 |
+
28500,0.13617078959941864,0.13617079639434815,2.307972741603851,,
|
| 64 |
+
29000,0.16322462260723114,0.16322461748123168,2.280918914794922,,
|
| 65 |
+
29500,0.17669051885604858,0.17669053888320924,2.26745299243927,,
|
| 66 |
+
30000,0.17846758663654327,0.17846759366989134,2.265675946712494,,
|
| 67 |
+
30000,,,,2.1715856873989106,0.2725578546524048
|
| 68 |
+
30500,0.16667309403419495,0.1666730899810791,2.277470438480377,,
|
| 69 |
+
31000,0.15678571164608002,0.15678571462631224,2.28735782623291,,
|
| 70 |
+
31500,0.2010551393032074,0.20105513334274291,2.243088393688202,,
|
| 71 |
+
32000,0.17751403152942657,0.17751403713226319,2.266629493713379,,
|
| 72 |
+
32500,0.17216086387634277,0.1721608567237854,2.271982675552368,,
|
| 73 |
+
33000,0.19131796061992645,0.19131796360015868,2.252825571537018,,
|
| 74 |
+
33500,0.18275043368339539,0.18275044250488282,2.2613930921554566,,
|
| 75 |
+
34000,0.20784145593643188,0.20784145212173463,2.2363020701408387,,
|
| 76 |
+
34500,0.18046826124191284,0.18046828508377075,2.26367524766922,,
|
| 77 |
+
35000,0.18855692446231842,0.18855693387985228,2.25558660364151,,
|
| 78 |
+
35000,,,,2.1727890491485597,0.2713544964790344
|
| 79 |
+
35500,0.1925363689661026,0.19253636932373047,2.2516071653366088,,
|
| 80 |
+
36000,0.16561688482761383,0.1656168942451477,2.278526629924774,,
|
| 81 |
+
36500,0.16554294526576996,0.1655429458618164,2.2786005945205687,,
|
| 82 |
+
37000,0.19604265689849854,0.19604266548156737,2.2481008710861206,,
|
| 83 |
+
37500,0.17421479523181915,0.17421479463577272,2.2699287328720095,,
|
| 84 |
+
38000,0.1756732314825058,0.17567323160171508,2.26847030878067,,
|
| 85 |
+
38500,0.1954001933336258,0.19540018033981324,2.248743362903595,,
|
| 86 |
+
39000,0.17579451203346252,0.17579451847076416,2.2683490142822267,,
|
| 87 |
+
39500,0.1855808049440384,0.18558082294464112,2.258562706947327,,
|
| 88 |
+
40000,0.2053901106119156,0.20539010763168336,2.2387534322738647,,
|
| 89 |
+
40000,,,,2.161219387054443,0.2829241454601288
|
| 90 |
+
40500,0.20918519794940948,0.20918521451950073,2.2349583129882813,,
|
| 91 |
+
41000,0.19407238066196442,0.19407238340377808,2.2500711522102357,,
|
| 92 |
+
41500,0.2151118963956833,0.21511189603805542,2.229031632900238,,
|
| 93 |
+
42000,0.2062837779521942,0.20628378677368164,2.2378597469329833,,
|
| 94 |
+
42500,0.20741024613380432,0.2074102578163147,2.236733280658722,,
|
| 95 |
+
43000,0.18989317119121552,0.18989318466186522,2.2542503509521485,,
|
| 96 |
+
43500,0.19421561062335968,0.19421561193466186,2.2499279150962828,,
|
| 97 |
+
44000,0.1906915307044983,0.1906915249824524,2.253452006816864,,
|
| 98 |
+
44500,0.20838510990142822,0.2083851203918457,2.235758409500122,,
|
| 99 |
+
45000,0.2230866700410843,0.2230866904258728,2.2210568466186524,,
|
| 100 |
+
45000,,,,2.105118463039398,0.33902508020401
|
| 101 |
+
45500,0.2155987173318863,0.21559873962402343,2.228544791698456,,
|
| 102 |
+
46000,0.18086951971054077,0.18086951875686647,2.263274023532867,,
|
| 103 |
+
46500,0.20663580298423767,0.2066358060836792,2.2375077238082888,,
|
| 104 |
+
47000,0.2150769680738449,0.2150769772529602,2.22906655216217,,
|
| 105 |
+
47500,0.20921730995178223,0.2092173080444336,2.2349262390136717,,
|
| 106 |
+
48000,0.18769679963588715,0.18769677066802978,2.2564467492103577,,
|
| 107 |
+
48500,0.20955044031143188,0.209550452709198,2.23459308052063,,
|
| 108 |
+
49000,0.19852685928344727,0.19852686166763306,2.2456166667938233,,
|
| 109 |
+
49500,0.20671308040618896,0.20671307468414307,2.2374304571151735,,
|
| 110 |
+
50000,0.18875905871391296,0.1887590742111206,2.2553844656944273,,
|
| 111 |
+
50000,,,,2.1008523547649385,0.34329116344451904
|
| 112 |
+
50500,0.21066132187843323,0.2106613154411316,2.233482211589813,,
|
| 113 |
+
51000,0.2130340337753296,0.21303403091430664,2.231109505176544,,
|
2/ckpt_latest.zip
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:f768ce50725ef7b87709dcf36d8ef99ff85acadb0eab982302f48c7938d4c378
|
| 3 |
+
size 8844014
|
2/config.yaml
ADDED
|
@@ -0,0 +1,58 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
env_id: RBC3D-medium-v0
|
| 2 |
+
env_kwargs: {}
|
| 3 |
+
eval_env_kwargs: {}
|
| 4 |
+
seed: 2
|
| 5 |
+
rl_mode: marl
|
| 6 |
+
total_timesteps: 50000.0
|
| 7 |
+
n_eval_steps: 10
|
| 8 |
+
eval_freq: ${eval:${total_timesteps} // ${n_eval_steps}}
|
| 9 |
+
n_eval_episodes: 1
|
| 10 |
+
continue_training: false
|
| 11 |
+
checkpoint_latest: true
|
| 12 |
+
rl_device: cpu
|
| 13 |
+
eval_callback:
|
| 14 |
+
_target_: fluidgym.integration.sb3.EvalCallback
|
| 15 |
+
eval_freq: ${eval_freq}
|
| 16 |
+
n_eval_episodes: ${n_eval_episodes}
|
| 17 |
+
use_wandb: ${wandb.enable}
|
| 18 |
+
checkpoint_latest: ${checkpoint_latest}
|
| 19 |
+
wandb:
|
| 20 |
+
enable: true
|
| 21 |
+
entity: safe-autonomous-systems
|
| 22 |
+
project: jbecktepe-fluidgym
|
| 23 |
+
algorithm:
|
| 24 |
+
name: PPO
|
| 25 |
+
obj:
|
| 26 |
+
_target_: stable_baselines3.ppo.ppo.PPO
|
| 27 |
+
policy: MlpPolicy
|
| 28 |
+
learning_rate: 0.0003
|
| 29 |
+
n_steps: 2048
|
| 30 |
+
batch_size: 64
|
| 31 |
+
n_epochs: 10
|
| 32 |
+
gamma: 0.99
|
| 33 |
+
gae_lambda: 0.95
|
| 34 |
+
clip_range: 0.2
|
| 35 |
+
clip_range_vf: null
|
| 36 |
+
normalize_advantage: true
|
| 37 |
+
ent_coef: 0.01
|
| 38 |
+
vf_coef: 0.5
|
| 39 |
+
max_grad_norm: 0.5
|
| 40 |
+
use_sde: false
|
| 41 |
+
sde_sample_freq: -1
|
| 42 |
+
rollout_buffer_class: null
|
| 43 |
+
rollout_buffer_kwargs: null
|
| 44 |
+
target_kl: null
|
| 45 |
+
stats_window_size: 100
|
| 46 |
+
tensorboard_log: null
|
| 47 |
+
verbose: 0
|
| 48 |
+
seed: ${seed}
|
| 49 |
+
device: ${rl_device}
|
| 50 |
+
_init_setup_model: true
|
| 51 |
+
cluster: {}
|
| 52 |
+
test_env_id: ${env_id}
|
| 53 |
+
test_env_kwargs: ${env_kwargs}
|
| 54 |
+
test_rl_mode: ${rl_mode}
|
| 55 |
+
n_test_episodes: 10
|
| 56 |
+
deterministic: true
|
| 57 |
+
save_frames: true
|
| 58 |
+
render_3d: true
|
2/hydra.yaml
ADDED
|
@@ -0,0 +1,163 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
hydra:
|
| 2 |
+
run:
|
| 3 |
+
dir: output/training/${rl_mode}/${env_id}/${algorithm.name}/${seed}
|
| 4 |
+
sweep:
|
| 5 |
+
dir: output/training/${rl_mode}/${env_id}/${algorithm.name}/${seed}
|
| 6 |
+
subdir: ''
|
| 7 |
+
launcher:
|
| 8 |
+
_target_: hydra._internal.core_plugins.basic_launcher.BasicLauncher
|
| 9 |
+
sweeper:
|
| 10 |
+
_target_: hydra._internal.core_plugins.basic_sweeper.BasicSweeper
|
| 11 |
+
max_batch_size: null
|
| 12 |
+
params: null
|
| 13 |
+
help:
|
| 14 |
+
app_name: ${hydra.job.name}
|
| 15 |
+
header: '${hydra.help.app_name} is powered by Hydra.
|
| 16 |
+
|
| 17 |
+
'
|
| 18 |
+
footer: 'Powered by Hydra (https://hydra.cc)
|
| 19 |
+
|
| 20 |
+
Use --hydra-help to view Hydra specific help
|
| 21 |
+
|
| 22 |
+
'
|
| 23 |
+
template: '${hydra.help.header}
|
| 24 |
+
|
| 25 |
+
== Configuration groups ==
|
| 26 |
+
|
| 27 |
+
Compose your configuration from those groups (group=option)
|
| 28 |
+
|
| 29 |
+
|
| 30 |
+
$APP_CONFIG_GROUPS
|
| 31 |
+
|
| 32 |
+
|
| 33 |
+
== Config ==
|
| 34 |
+
|
| 35 |
+
Override anything in the config (foo.bar=value)
|
| 36 |
+
|
| 37 |
+
|
| 38 |
+
$CONFIG
|
| 39 |
+
|
| 40 |
+
|
| 41 |
+
${hydra.help.footer}
|
| 42 |
+
|
| 43 |
+
'
|
| 44 |
+
hydra_help:
|
| 45 |
+
template: 'Hydra (${hydra.runtime.version})
|
| 46 |
+
|
| 47 |
+
See https://hydra.cc for more info.
|
| 48 |
+
|
| 49 |
+
|
| 50 |
+
== Flags ==
|
| 51 |
+
|
| 52 |
+
$FLAGS_HELP
|
| 53 |
+
|
| 54 |
+
|
| 55 |
+
== Configuration groups ==
|
| 56 |
+
|
| 57 |
+
Compose your configuration from those groups (For example, append hydra/job_logging=disabled
|
| 58 |
+
to command line)
|
| 59 |
+
|
| 60 |
+
|
| 61 |
+
$HYDRA_CONFIG_GROUPS
|
| 62 |
+
|
| 63 |
+
|
| 64 |
+
Use ''--cfg hydra'' to Show the Hydra config.
|
| 65 |
+
|
| 66 |
+
'
|
| 67 |
+
hydra_help: ???
|
| 68 |
+
hydra_logging:
|
| 69 |
+
version: 1
|
| 70 |
+
formatters:
|
| 71 |
+
simple:
|
| 72 |
+
format: '[%(asctime)s][HYDRA] %(message)s'
|
| 73 |
+
handlers:
|
| 74 |
+
console:
|
| 75 |
+
class: logging.StreamHandler
|
| 76 |
+
formatter: simple
|
| 77 |
+
stream: ext://sys.stdout
|
| 78 |
+
root:
|
| 79 |
+
level: INFO
|
| 80 |
+
handlers:
|
| 81 |
+
- console
|
| 82 |
+
loggers:
|
| 83 |
+
logging_example:
|
| 84 |
+
level: DEBUG
|
| 85 |
+
disable_existing_loggers: false
|
| 86 |
+
job_logging:
|
| 87 |
+
version: 1
|
| 88 |
+
formatters:
|
| 89 |
+
simple:
|
| 90 |
+
format: '[%(asctime)s][%(name)s][%(levelname)s] - %(message)s'
|
| 91 |
+
handlers:
|
| 92 |
+
console:
|
| 93 |
+
class: logging.StreamHandler
|
| 94 |
+
formatter: simple
|
| 95 |
+
stream: ext://sys.stdout
|
| 96 |
+
file:
|
| 97 |
+
class: logging.FileHandler
|
| 98 |
+
formatter: simple
|
| 99 |
+
filename: ${hydra.runtime.output_dir}/${hydra.job.name}.log
|
| 100 |
+
root:
|
| 101 |
+
level: INFO
|
| 102 |
+
handlers:
|
| 103 |
+
- console
|
| 104 |
+
- file
|
| 105 |
+
disable_existing_loggers: false
|
| 106 |
+
env: {}
|
| 107 |
+
mode: MULTIRUN
|
| 108 |
+
searchpath: []
|
| 109 |
+
callbacks: {}
|
| 110 |
+
output_subdir: .
|
| 111 |
+
overrides:
|
| 112 |
+
hydra:
|
| 113 |
+
- hydra.mode=MULTIRUN
|
| 114 |
+
task:
|
| 115 |
+
- algorithm=sb3_ppo
|
| 116 |
+
- env_id=RBC3D-medium-v0
|
| 117 |
+
- rl_mode=marl
|
| 118 |
+
- seed=2
|
| 119 |
+
job:
|
| 120 |
+
name: test_sb3
|
| 121 |
+
chdir: true
|
| 122 |
+
override_dirname: algorithm=sb3_ppo,env_id=RBC3D-medium-v0,rl_mode=marl,seed=2
|
| 123 |
+
id: '0'
|
| 124 |
+
num: 0
|
| 125 |
+
config_name: test_sb3
|
| 126 |
+
env_set: {}
|
| 127 |
+
env_copy: []
|
| 128 |
+
config:
|
| 129 |
+
override_dirname:
|
| 130 |
+
kv_sep: '='
|
| 131 |
+
item_sep: ','
|
| 132 |
+
exclude_keys: []
|
| 133 |
+
runtime:
|
| 134 |
+
version: 1.3.2
|
| 135 |
+
version_base: '1.3'
|
| 136 |
+
cwd: /cephfs/users/becktepe/git_projects/FluidGym
|
| 137 |
+
config_sources:
|
| 138 |
+
- path: hydra.conf
|
| 139 |
+
schema: pkg
|
| 140 |
+
provider: hydra
|
| 141 |
+
- path: /cephfs/users/becktepe/git_projects/FluidGym/runscripts/configs
|
| 142 |
+
schema: file
|
| 143 |
+
provider: main
|
| 144 |
+
- path: hydra_plugins.hydra_colorlog.conf
|
| 145 |
+
schema: pkg
|
| 146 |
+
provider: hydra-colorlog
|
| 147 |
+
- path: ''
|
| 148 |
+
schema: structured
|
| 149 |
+
provider: schema
|
| 150 |
+
output_dir: /cephfs/users/becktepe/git_projects/FluidGym/output/training/marl/RBC3D-medium-v0/PPO/2
|
| 151 |
+
choices:
|
| 152 |
+
cluster: local
|
| 153 |
+
algorithm: sb3_ppo
|
| 154 |
+
hydra/env: default
|
| 155 |
+
hydra/callbacks: null
|
| 156 |
+
hydra/job_logging: default
|
| 157 |
+
hydra/hydra_logging: default
|
| 158 |
+
hydra/hydra_help: default
|
| 159 |
+
hydra/help: default
|
| 160 |
+
hydra/sweeper: basic
|
| 161 |
+
hydra/launcher: basic
|
| 162 |
+
hydra/output: default
|
| 163 |
+
verbose: false
|
2/multirun.yaml
ADDED
|
@@ -0,0 +1,221 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
hydra:
|
| 2 |
+
run:
|
| 3 |
+
dir: output/training/${rl_mode}/${env_id}/${algorithm.name}/${seed}
|
| 4 |
+
sweep:
|
| 5 |
+
dir: output/training/${rl_mode}/${env_id}/${algorithm.name}/${seed}
|
| 6 |
+
subdir: ''
|
| 7 |
+
launcher:
|
| 8 |
+
_target_: hydra._internal.core_plugins.basic_launcher.BasicLauncher
|
| 9 |
+
sweeper:
|
| 10 |
+
_target_: hydra._internal.core_plugins.basic_sweeper.BasicSweeper
|
| 11 |
+
max_batch_size: null
|
| 12 |
+
params: null
|
| 13 |
+
help:
|
| 14 |
+
app_name: ${hydra.job.name}
|
| 15 |
+
header: '${hydra.help.app_name} is powered by Hydra.
|
| 16 |
+
|
| 17 |
+
'
|
| 18 |
+
footer: 'Powered by Hydra (https://hydra.cc)
|
| 19 |
+
|
| 20 |
+
Use --hydra-help to view Hydra specific help
|
| 21 |
+
|
| 22 |
+
'
|
| 23 |
+
template: '${hydra.help.header}
|
| 24 |
+
|
| 25 |
+
== Configuration groups ==
|
| 26 |
+
|
| 27 |
+
Compose your configuration from those groups (group=option)
|
| 28 |
+
|
| 29 |
+
|
| 30 |
+
$APP_CONFIG_GROUPS
|
| 31 |
+
|
| 32 |
+
|
| 33 |
+
== Config ==
|
| 34 |
+
|
| 35 |
+
Override anything in the config (foo.bar=value)
|
| 36 |
+
|
| 37 |
+
|
| 38 |
+
$CONFIG
|
| 39 |
+
|
| 40 |
+
|
| 41 |
+
${hydra.help.footer}
|
| 42 |
+
|
| 43 |
+
'
|
| 44 |
+
hydra_help:
|
| 45 |
+
template: 'Hydra (${hydra.runtime.version})
|
| 46 |
+
|
| 47 |
+
See https://hydra.cc for more info.
|
| 48 |
+
|
| 49 |
+
|
| 50 |
+
== Flags ==
|
| 51 |
+
|
| 52 |
+
$FLAGS_HELP
|
| 53 |
+
|
| 54 |
+
|
| 55 |
+
== Configuration groups ==
|
| 56 |
+
|
| 57 |
+
Compose your configuration from those groups (For example, append hydra/job_logging=disabled
|
| 58 |
+
to command line)
|
| 59 |
+
|
| 60 |
+
|
| 61 |
+
$HYDRA_CONFIG_GROUPS
|
| 62 |
+
|
| 63 |
+
|
| 64 |
+
Use ''--cfg hydra'' to Show the Hydra config.
|
| 65 |
+
|
| 66 |
+
'
|
| 67 |
+
hydra_help: ???
|
| 68 |
+
hydra_logging:
|
| 69 |
+
version: 1
|
| 70 |
+
formatters:
|
| 71 |
+
simple:
|
| 72 |
+
format: '[%(asctime)s][HYDRA] %(message)s'
|
| 73 |
+
handlers:
|
| 74 |
+
console:
|
| 75 |
+
class: logging.StreamHandler
|
| 76 |
+
formatter: simple
|
| 77 |
+
stream: ext://sys.stdout
|
| 78 |
+
root:
|
| 79 |
+
level: INFO
|
| 80 |
+
handlers:
|
| 81 |
+
- console
|
| 82 |
+
loggers:
|
| 83 |
+
logging_example:
|
| 84 |
+
level: DEBUG
|
| 85 |
+
disable_existing_loggers: false
|
| 86 |
+
job_logging:
|
| 87 |
+
version: 1
|
| 88 |
+
formatters:
|
| 89 |
+
simple:
|
| 90 |
+
format: '[%(asctime)s][%(name)s][%(levelname)s] - %(message)s'
|
| 91 |
+
handlers:
|
| 92 |
+
console:
|
| 93 |
+
class: logging.StreamHandler
|
| 94 |
+
formatter: simple
|
| 95 |
+
stream: ext://sys.stdout
|
| 96 |
+
file:
|
| 97 |
+
class: logging.FileHandler
|
| 98 |
+
formatter: simple
|
| 99 |
+
filename: ${hydra.runtime.output_dir}/${hydra.job.name}.log
|
| 100 |
+
root:
|
| 101 |
+
level: INFO
|
| 102 |
+
handlers:
|
| 103 |
+
- console
|
| 104 |
+
- file
|
| 105 |
+
disable_existing_loggers: false
|
| 106 |
+
env: {}
|
| 107 |
+
mode: MULTIRUN
|
| 108 |
+
searchpath: []
|
| 109 |
+
callbacks: {}
|
| 110 |
+
output_subdir: .
|
| 111 |
+
overrides:
|
| 112 |
+
hydra:
|
| 113 |
+
- hydra.mode=MULTIRUN
|
| 114 |
+
task:
|
| 115 |
+
- algorithm=sb3_ppo
|
| 116 |
+
- env_id=RBC3D-medium-v0
|
| 117 |
+
- rl_mode=marl
|
| 118 |
+
- seed=2
|
| 119 |
+
job:
|
| 120 |
+
name: test_sb3
|
| 121 |
+
chdir: true
|
| 122 |
+
override_dirname: algorithm=sb3_ppo,env_id=RBC3D-medium-v0,rl_mode=marl,seed=2
|
| 123 |
+
id: ???
|
| 124 |
+
num: ???
|
| 125 |
+
config_name: test_sb3
|
| 126 |
+
env_set: {}
|
| 127 |
+
env_copy: []
|
| 128 |
+
config:
|
| 129 |
+
override_dirname:
|
| 130 |
+
kv_sep: '='
|
| 131 |
+
item_sep: ','
|
| 132 |
+
exclude_keys: []
|
| 133 |
+
runtime:
|
| 134 |
+
version: 1.3.2
|
| 135 |
+
version_base: '1.3'
|
| 136 |
+
cwd: /cephfs/users/becktepe/git_projects/FluidGym
|
| 137 |
+
config_sources:
|
| 138 |
+
- path: hydra.conf
|
| 139 |
+
schema: pkg
|
| 140 |
+
provider: hydra
|
| 141 |
+
- path: /cephfs/users/becktepe/git_projects/FluidGym/runscripts/configs
|
| 142 |
+
schema: file
|
| 143 |
+
provider: main
|
| 144 |
+
- path: hydra_plugins.hydra_colorlog.conf
|
| 145 |
+
schema: pkg
|
| 146 |
+
provider: hydra-colorlog
|
| 147 |
+
- path: ''
|
| 148 |
+
schema: structured
|
| 149 |
+
provider: schema
|
| 150 |
+
output_dir: ???
|
| 151 |
+
choices:
|
| 152 |
+
cluster: local
|
| 153 |
+
algorithm: sb3_ppo
|
| 154 |
+
hydra/env: default
|
| 155 |
+
hydra/callbacks: null
|
| 156 |
+
hydra/job_logging: default
|
| 157 |
+
hydra/hydra_logging: default
|
| 158 |
+
hydra/hydra_help: default
|
| 159 |
+
hydra/help: default
|
| 160 |
+
hydra/sweeper: basic
|
| 161 |
+
hydra/launcher: basic
|
| 162 |
+
hydra/output: default
|
| 163 |
+
verbose: false
|
| 164 |
+
env_id: RBC3D-medium-v0
|
| 165 |
+
env_kwargs: {}
|
| 166 |
+
eval_env_kwargs: {}
|
| 167 |
+
seed: 2
|
| 168 |
+
rl_mode: marl
|
| 169 |
+
total_timesteps: 50000.0
|
| 170 |
+
n_eval_steps: 10
|
| 171 |
+
eval_freq: ${eval:${total_timesteps} // ${n_eval_steps}}
|
| 172 |
+
n_eval_episodes: 1
|
| 173 |
+
continue_training: false
|
| 174 |
+
checkpoint_latest: true
|
| 175 |
+
rl_device: cpu
|
| 176 |
+
eval_callback:
|
| 177 |
+
_target_: fluidgym.integration.sb3.EvalCallback
|
| 178 |
+
eval_freq: ${eval_freq}
|
| 179 |
+
n_eval_episodes: ${n_eval_episodes}
|
| 180 |
+
use_wandb: ${wandb.enable}
|
| 181 |
+
checkpoint_latest: ${checkpoint_latest}
|
| 182 |
+
wandb:
|
| 183 |
+
enable: true
|
| 184 |
+
entity: safe-autonomous-systems
|
| 185 |
+
project: jbecktepe-fluidgym
|
| 186 |
+
algorithm:
|
| 187 |
+
name: PPO
|
| 188 |
+
obj:
|
| 189 |
+
_target_: stable_baselines3.ppo.ppo.PPO
|
| 190 |
+
policy: MlpPolicy
|
| 191 |
+
learning_rate: 0.0003
|
| 192 |
+
n_steps: 2048
|
| 193 |
+
batch_size: 64
|
| 194 |
+
n_epochs: 10
|
| 195 |
+
gamma: 0.99
|
| 196 |
+
gae_lambda: 0.95
|
| 197 |
+
clip_range: 0.2
|
| 198 |
+
clip_range_vf: null
|
| 199 |
+
normalize_advantage: true
|
| 200 |
+
ent_coef: 0.01
|
| 201 |
+
vf_coef: 0.5
|
| 202 |
+
max_grad_norm: 0.5
|
| 203 |
+
use_sde: false
|
| 204 |
+
sde_sample_freq: -1
|
| 205 |
+
rollout_buffer_class: null
|
| 206 |
+
rollout_buffer_kwargs: null
|
| 207 |
+
target_kl: null
|
| 208 |
+
stats_window_size: 100
|
| 209 |
+
tensorboard_log: null
|
| 210 |
+
verbose: 0
|
| 211 |
+
seed: ${seed}
|
| 212 |
+
device: ${rl_device}
|
| 213 |
+
_init_setup_model: true
|
| 214 |
+
cluster: {}
|
| 215 |
+
test_env_id: ${env_id}
|
| 216 |
+
test_env_kwargs: ${env_kwargs}
|
| 217 |
+
test_rl_mode: ${rl_mode}
|
| 218 |
+
n_test_episodes: 10
|
| 219 |
+
deterministic: true
|
| 220 |
+
save_frames: true
|
| 221 |
+
render_3d: true
|
2/overrides.yaml
ADDED
|
@@ -0,0 +1,4 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
- algorithm=sb3_ppo
|
| 2 |
+
- env_id=RBC3D-medium-v0
|
| 3 |
+
- rl_mode=marl
|
| 4 |
+
- seed=2
|
2/test/3d_temperature_test_eval_episode_0.gif
ADDED
|
Git LFS Details
|
2/test/test_eval_episode_0.csv
ADDED
|
The diff for this file is too large to render.
See raw diff
|
|
|
2/test/x-y-temperature_test_eval_episode_0.gif
ADDED
|
Git LFS Details
|
2/test/x-z-temperature_test_eval_episode_0.gif
ADDED
|
Git LFS Details
|
2/test/y-z-temperature_test_eval_episode_0.gif
ADDED
|
Git LFS Details
|
2/training_log.csv
ADDED
|
@@ -0,0 +1,113 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
step,training/mean_reward,training/mean_global_reward,training/mean_nusselt,evaluation/mean_nusselt,evaluation/mean_reward
|
| 2 |
+
500,-0.07617373764514923,-0.07617373752593994,2.5203172755241394,,
|
| 3 |
+
1000,-0.08122028410434723,-0.0812202868461609,2.5253638234138487,,
|
| 4 |
+
1500,-0.08418595045804977,-0.0841859540939331,2.528329489707947,,
|
| 5 |
+
2000,-0.0857914462685585,-0.08579144620895386,2.5299349813461305,,
|
| 6 |
+
2500,-0.036292914301157,-0.036292914867401126,2.4804364471435547,,
|
| 7 |
+
3000,-0.0573156364262104,-0.0573156361579895,2.5014591674804687,,
|
| 8 |
+
3500,-0.03452780842781067,-0.034527808666229245,2.4786713409423826,,
|
| 9 |
+
4000,-0.02934977412223816,-0.029349772930145263,2.4734933099746703,,
|
| 10 |
+
4500,-0.020923318341374397,-0.020923319339752198,2.465066843986511,,
|
| 11 |
+
5000,0.0008688150555826724,0.0008688149452209473,2.4432747282981873,,
|
| 12 |
+
5000,,,,2.302758717536926,0.1413848102092743
|
| 13 |
+
5500,-0.004743958357721567,-0.004743958473205566,2.448887502193451,,
|
| 14 |
+
6000,-0.004918466787785292,-0.00491846752166748,2.4490620012283326,,
|
| 15 |
+
6500,-0.01970241405069828,-0.019702414512634277,2.463845951080322,,
|
| 16 |
+
7000,0.028401371091604233,0.028401370048522948,2.4157421565055848,,
|
| 17 |
+
7500,0.025030527263879776,0.025030526161193847,2.4191130137443544,,
|
| 18 |
+
8000,0.03886733949184418,0.038867340564727786,2.405276186943054,,
|
| 19 |
+
8500,0.024771681055426598,0.024771682262420654,2.419371840953827,,
|
| 20 |
+
9000,0.04508260264992714,0.04508260011672974,2.39906093788147,,
|
| 21 |
+
9500,0.03319144621491432,0.03319144058227539,2.4109520945549012,,
|
| 22 |
+
10000,0.05705280601978302,0.05705280828475952,2.387090718269348,,
|
| 23 |
+
10000,,,,2.2286224615573884,0.21552106738090515
|
| 24 |
+
10500,0.05242375656962395,0.052423755168914794,2.391719780921936,,
|
| 25 |
+
11000,0.07662103325128555,0.07662102603912353,2.3675225043296813,,
|
| 26 |
+
11500,0.06457732617855072,0.06457732057571411,2.379566216945648,,
|
| 27 |
+
12000,0.06433624774217606,0.06433625173568726,2.3798072891235353,,
|
| 28 |
+
12500,0.07520896941423416,0.07520897483825684,2.3689345531463624,,
|
| 29 |
+
13000,0.10430970788002014,0.10430970907211304,2.339833821296692,,
|
| 30 |
+
13500,0.107138492166996,0.10713849496841431,2.337005042076111,,
|
| 31 |
+
14000,0.060681093484163284,0.060681090831756594,2.3834624366760253,,
|
| 32 |
+
14500,0.0923704132437706,0.09237041425704956,2.351773105621338,,
|
| 33 |
+
15000,0.10639812052249908,0.10639812278747558,2.3377454075813295,,
|
| 34 |
+
15000,,,,2.184898077249527,0.25924545526504517
|
| 35 |
+
15500,0.11017220467329025,0.11017220497131347,2.3339713287353514,,
|
| 36 |
+
16000,0.11010102182626724,0.11010102367401123,2.334042506694794,,
|
| 37 |
+
16500,0.11482339352369308,0.11482338523864746,2.329320155143738,,
|
| 38 |
+
17000,0.12434407323598862,0.12434407234191895,2.3197994556427,,
|
| 39 |
+
17500,0.11305133998394012,0.11305133199691772,2.3310921902656556,,
|
| 40 |
+
18000,0.12088536471128464,0.12088536596298217,2.3232581696510315,,
|
| 41 |
+
18500,0.09946314990520477,0.09946315479278564,2.3446803817749022,,
|
| 42 |
+
19000,0.14079995453357697,0.14079995679855348,2.3033435688018797,,
|
| 43 |
+
19500,0.13807989656925201,0.13807989978790283,2.306063636302948,,
|
| 44 |
+
20000,0.1453116089105606,0.14531161546707153,2.298831922054291,,
|
| 45 |
+
20000,,,,2.1613855922222136,0.2827579379081726
|
| 46 |
+
20500,0.1477949470281601,0.14779496240615844,2.2963485679626463,,
|
| 47 |
+
21000,0.1494130790233612,0.14941309309005738,2.294730438709259,,
|
| 48 |
+
21500,0.12903814017772675,0.1290381441116333,2.315105395793915,,
|
| 49 |
+
22000,0.12245482206344604,0.12245481967926025,2.3216887168884277,,
|
| 50 |
+
22500,0.14850793778896332,0.1485079288482666,2.2956356039047243,,
|
| 51 |
+
23000,0.1593887209892273,0.15938872623443603,2.2847548065185546,,
|
| 52 |
+
23500,0.1564064621925354,0.1564064474105835,2.287737093925476,,
|
| 53 |
+
24000,0.14594756066799164,0.14594755792617797,2.298195967674255,,
|
| 54 |
+
24500,0.16107545793056488,0.16107544851303102,2.2830680861473085,,
|
| 55 |
+
25000,0.1436605602502823,0.1436605486869812,2.300482988357544,,
|
| 56 |
+
25000,,,,2.125348083972931,0.31879544258117676
|
| 57 |
+
25500,0.15157821774482727,0.1515782117843628,2.2925653324127198,,
|
| 58 |
+
26000,0.15027154982089996,0.15027155828475952,2.2938719668388368,,
|
| 59 |
+
26500,0.14881035685539246,0.14881037378311157,2.2953331503868104,,
|
| 60 |
+
27000,0.15366321802139282,0.15366322469711305,2.290480305671692,,
|
| 61 |
+
27500,0.15129607915878296,0.15129607629776,2.292847459793091,,
|
| 62 |
+
28000,0.1703789383172989,0.1703789448738098,2.2737645916938782,,
|
| 63 |
+
28500,0.16875307261943817,0.16875307989120483,2.275390453338623,,
|
| 64 |
+
29000,0.17007438838481903,0.17007437372207643,2.274069155216217,,
|
| 65 |
+
29500,0.1755026876926422,0.175502685546875,2.268640851020813,,
|
| 66 |
+
30000,0.17779889702796936,0.17779889917373656,2.2663446488380434,,
|
| 67 |
+
30000,,,,2.1136897838115694,0.3304537534713745
|
| 68 |
+
30500,0.1763191968202591,0.1763191967010498,2.2678243365287782,,
|
| 69 |
+
31000,0.1936023086309433,0.19360231113433837,2.250541229248047,,
|
| 70 |
+
31500,0.20531147718429565,0.20531146097183228,2.238832067489624,,
|
| 71 |
+
32000,0.19302237033843994,0.19302235841751098,2.2511211709976195,,
|
| 72 |
+
32500,0.1957819163799286,0.1957819299697876,2.2483616013526917,,
|
| 73 |
+
33000,0.2009516954421997,0.20095169830322265,2.2431918382644653,,
|
| 74 |
+
33500,0.18352803587913513,0.18352803564071654,2.26061549949646,,
|
| 75 |
+
34000,0.1996477097272873,0.1996476926803589,2.24449583530426,,
|
| 76 |
+
34500,0.20643119513988495,0.206431209564209,2.2377123193740847,,
|
| 77 |
+
35000,0.19420981407165527,0.19420981359481812,2.2499337205886842,,
|
| 78 |
+
35000,,,,2.116284295320511,0.32785922288894653
|
| 79 |
+
35500,0.1769229769706726,0.17692296791076662,2.2672205543518067,,
|
| 80 |
+
36000,0.17825405299663544,0.17825404453277588,2.265889495372772,,
|
| 81 |
+
36500,0.20613519847393036,0.20613520622253417,2.238008319377899,,
|
| 82 |
+
37000,0.18780066072940826,0.18780066394805908,2.2563428716659546,,
|
| 83 |
+
37500,0.16821329295635223,0.1682132921218872,2.2759302372932435,,
|
| 84 |
+
38000,0.19664159417152405,0.19664160633087158,2.247501920223236,,
|
| 85 |
+
38500,0.2009422332048416,0.20094219589233397,2.2432013301849367,,
|
| 86 |
+
39000,0.2011440396308899,0.20114404773712158,2.242999482154846,,
|
| 87 |
+
39500,0.16940616071224213,0.16940615797042846,2.274737373828888,,
|
| 88 |
+
40000,0.17714549601078033,0.17714548587799073,2.2669980425834657,,
|
| 89 |
+
40000,,,,2.0692211282253266,0.37492239475250244
|
| 90 |
+
40500,0.20836426317691803,0.2083642635345459,2.235779273509979,,
|
| 91 |
+
41000,0.15532349050045013,0.15532347869873048,2.288820049762726,,
|
| 92 |
+
41500,0.20738382637500763,0.20738384246826172,2.2367596850395204,,
|
| 93 |
+
42000,0.1978406012058258,0.1978406000137329,2.2463029441833497,,
|
| 94 |
+
42500,0.2178330421447754,0.21783304357528688,2.2263104815483095,,
|
| 95 |
+
43000,0.17135366797447205,0.17135367965698242,2.2727898488044738,,
|
| 96 |
+
43500,0.19093331694602966,0.19093331241607667,2.253210223674774,,
|
| 97 |
+
44000,0.2045438289642334,0.20454383707046508,2.23959970664978,,
|
| 98 |
+
44500,0.20506392419338226,0.2050639204978943,2.2390796036720277,,
|
| 99 |
+
45000,0.21799743175506592,0.21799742937088012,2.226146113395691,,
|
| 100 |
+
45000,,,,2.0496765255928038,0.39446699619293213
|
| 101 |
+
45500,0.2031274288892746,0.2031274199485779,2.241016125679016,,
|
| 102 |
+
46000,0.20602136850357056,0.20602136135101318,2.2381221833229064,,
|
| 103 |
+
46500,0.20439587533473969,0.2043959002494812,2.2397476387023927,,
|
| 104 |
+
47000,0.21186970174312592,0.21186971473693847,2.2322738165855407,,
|
| 105 |
+
47500,0.19912885129451752,0.1991288652420044,2.245014661312103,,
|
| 106 |
+
48000,0.19694609940052032,0.19694612550735474,2.2471973972320556,,
|
| 107 |
+
48500,0.1987495869398117,0.19874959707260131,2.2453939437866213,,
|
| 108 |
+
49000,0.18140915036201477,0.18140912914276122,2.262734398841858,,
|
| 109 |
+
49500,0.18297235667705536,0.18297234630584716,2.2611711859703063,,
|
| 110 |
+
50000,0.16303163766860962,0.1630316252708435,2.2811119132041933,,
|
| 111 |
+
50000,,,,2.0873835837841033,0.3567599654197693
|
| 112 |
+
50500,0.17654703557491302,0.17654704618453979,2.2675964856147766,,
|
| 113 |
+
51000,0.16081663966178894,0.16081664752960206,2.2833268809318543,,
|
3/ckpt_latest.zip
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:37aee7b3551646c96e16e46b527f51f09b65bae658cd2faeea7b674b3666e5aa
|
| 3 |
+
size 8844016
|
3/config.yaml
ADDED
|
@@ -0,0 +1,58 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
env_id: RBC3D-medium-v0
|
| 2 |
+
env_kwargs: {}
|
| 3 |
+
eval_env_kwargs: {}
|
| 4 |
+
seed: 3
|
| 5 |
+
rl_mode: marl
|
| 6 |
+
total_timesteps: 50000.0
|
| 7 |
+
n_eval_steps: 10
|
| 8 |
+
eval_freq: ${eval:${total_timesteps} // ${n_eval_steps}}
|
| 9 |
+
n_eval_episodes: 1
|
| 10 |
+
continue_training: false
|
| 11 |
+
checkpoint_latest: true
|
| 12 |
+
rl_device: cpu
|
| 13 |
+
eval_callback:
|
| 14 |
+
_target_: fluidgym.integration.sb3.EvalCallback
|
| 15 |
+
eval_freq: ${eval_freq}
|
| 16 |
+
n_eval_episodes: ${n_eval_episodes}
|
| 17 |
+
use_wandb: ${wandb.enable}
|
| 18 |
+
checkpoint_latest: ${checkpoint_latest}
|
| 19 |
+
wandb:
|
| 20 |
+
enable: true
|
| 21 |
+
entity: safe-autonomous-systems
|
| 22 |
+
project: jbecktepe-fluidgym
|
| 23 |
+
algorithm:
|
| 24 |
+
name: PPO
|
| 25 |
+
obj:
|
| 26 |
+
_target_: stable_baselines3.ppo.ppo.PPO
|
| 27 |
+
policy: MlpPolicy
|
| 28 |
+
learning_rate: 0.0003
|
| 29 |
+
n_steps: 2048
|
| 30 |
+
batch_size: 64
|
| 31 |
+
n_epochs: 10
|
| 32 |
+
gamma: 0.99
|
| 33 |
+
gae_lambda: 0.95
|
| 34 |
+
clip_range: 0.2
|
| 35 |
+
clip_range_vf: null
|
| 36 |
+
normalize_advantage: true
|
| 37 |
+
ent_coef: 0.01
|
| 38 |
+
vf_coef: 0.5
|
| 39 |
+
max_grad_norm: 0.5
|
| 40 |
+
use_sde: false
|
| 41 |
+
sde_sample_freq: -1
|
| 42 |
+
rollout_buffer_class: null
|
| 43 |
+
rollout_buffer_kwargs: null
|
| 44 |
+
target_kl: null
|
| 45 |
+
stats_window_size: 100
|
| 46 |
+
tensorboard_log: null
|
| 47 |
+
verbose: 0
|
| 48 |
+
seed: ${seed}
|
| 49 |
+
device: ${rl_device}
|
| 50 |
+
_init_setup_model: true
|
| 51 |
+
cluster: {}
|
| 52 |
+
test_env_id: ${env_id}
|
| 53 |
+
test_env_kwargs: ${env_kwargs}
|
| 54 |
+
test_rl_mode: ${rl_mode}
|
| 55 |
+
n_test_episodes: 10
|
| 56 |
+
deterministic: true
|
| 57 |
+
save_frames: true
|
| 58 |
+
render_3d: true
|
3/hydra.yaml
ADDED
|
@@ -0,0 +1,163 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
hydra:
|
| 2 |
+
run:
|
| 3 |
+
dir: output/training/${rl_mode}/${env_id}/${algorithm.name}/${seed}
|
| 4 |
+
sweep:
|
| 5 |
+
dir: output/training/${rl_mode}/${env_id}/${algorithm.name}/${seed}
|
| 6 |
+
subdir: ''
|
| 7 |
+
launcher:
|
| 8 |
+
_target_: hydra._internal.core_plugins.basic_launcher.BasicLauncher
|
| 9 |
+
sweeper:
|
| 10 |
+
_target_: hydra._internal.core_plugins.basic_sweeper.BasicSweeper
|
| 11 |
+
max_batch_size: null
|
| 12 |
+
params: null
|
| 13 |
+
help:
|
| 14 |
+
app_name: ${hydra.job.name}
|
| 15 |
+
header: '${hydra.help.app_name} is powered by Hydra.
|
| 16 |
+
|
| 17 |
+
'
|
| 18 |
+
footer: 'Powered by Hydra (https://hydra.cc)
|
| 19 |
+
|
| 20 |
+
Use --hydra-help to view Hydra specific help
|
| 21 |
+
|
| 22 |
+
'
|
| 23 |
+
template: '${hydra.help.header}
|
| 24 |
+
|
| 25 |
+
== Configuration groups ==
|
| 26 |
+
|
| 27 |
+
Compose your configuration from those groups (group=option)
|
| 28 |
+
|
| 29 |
+
|
| 30 |
+
$APP_CONFIG_GROUPS
|
| 31 |
+
|
| 32 |
+
|
| 33 |
+
== Config ==
|
| 34 |
+
|
| 35 |
+
Override anything in the config (foo.bar=value)
|
| 36 |
+
|
| 37 |
+
|
| 38 |
+
$CONFIG
|
| 39 |
+
|
| 40 |
+
|
| 41 |
+
${hydra.help.footer}
|
| 42 |
+
|
| 43 |
+
'
|
| 44 |
+
hydra_help:
|
| 45 |
+
template: 'Hydra (${hydra.runtime.version})
|
| 46 |
+
|
| 47 |
+
See https://hydra.cc for more info.
|
| 48 |
+
|
| 49 |
+
|
| 50 |
+
== Flags ==
|
| 51 |
+
|
| 52 |
+
$FLAGS_HELP
|
| 53 |
+
|
| 54 |
+
|
| 55 |
+
== Configuration groups ==
|
| 56 |
+
|
| 57 |
+
Compose your configuration from those groups (For example, append hydra/job_logging=disabled
|
| 58 |
+
to command line)
|
| 59 |
+
|
| 60 |
+
|
| 61 |
+
$HYDRA_CONFIG_GROUPS
|
| 62 |
+
|
| 63 |
+
|
| 64 |
+
Use ''--cfg hydra'' to Show the Hydra config.
|
| 65 |
+
|
| 66 |
+
'
|
| 67 |
+
hydra_help: ???
|
| 68 |
+
hydra_logging:
|
| 69 |
+
version: 1
|
| 70 |
+
formatters:
|
| 71 |
+
simple:
|
| 72 |
+
format: '[%(asctime)s][HYDRA] %(message)s'
|
| 73 |
+
handlers:
|
| 74 |
+
console:
|
| 75 |
+
class: logging.StreamHandler
|
| 76 |
+
formatter: simple
|
| 77 |
+
stream: ext://sys.stdout
|
| 78 |
+
root:
|
| 79 |
+
level: INFO
|
| 80 |
+
handlers:
|
| 81 |
+
- console
|
| 82 |
+
loggers:
|
| 83 |
+
logging_example:
|
| 84 |
+
level: DEBUG
|
| 85 |
+
disable_existing_loggers: false
|
| 86 |
+
job_logging:
|
| 87 |
+
version: 1
|
| 88 |
+
formatters:
|
| 89 |
+
simple:
|
| 90 |
+
format: '[%(asctime)s][%(name)s][%(levelname)s] - %(message)s'
|
| 91 |
+
handlers:
|
| 92 |
+
console:
|
| 93 |
+
class: logging.StreamHandler
|
| 94 |
+
formatter: simple
|
| 95 |
+
stream: ext://sys.stdout
|
| 96 |
+
file:
|
| 97 |
+
class: logging.FileHandler
|
| 98 |
+
formatter: simple
|
| 99 |
+
filename: ${hydra.runtime.output_dir}/${hydra.job.name}.log
|
| 100 |
+
root:
|
| 101 |
+
level: INFO
|
| 102 |
+
handlers:
|
| 103 |
+
- console
|
| 104 |
+
- file
|
| 105 |
+
disable_existing_loggers: false
|
| 106 |
+
env: {}
|
| 107 |
+
mode: MULTIRUN
|
| 108 |
+
searchpath: []
|
| 109 |
+
callbacks: {}
|
| 110 |
+
output_subdir: .
|
| 111 |
+
overrides:
|
| 112 |
+
hydra:
|
| 113 |
+
- hydra.mode=MULTIRUN
|
| 114 |
+
task:
|
| 115 |
+
- algorithm=sb3_ppo
|
| 116 |
+
- env_id=RBC3D-medium-v0
|
| 117 |
+
- rl_mode=marl
|
| 118 |
+
- seed=3
|
| 119 |
+
job:
|
| 120 |
+
name: test_sb3
|
| 121 |
+
chdir: true
|
| 122 |
+
override_dirname: algorithm=sb3_ppo,env_id=RBC3D-medium-v0,rl_mode=marl,seed=3
|
| 123 |
+
id: '0'
|
| 124 |
+
num: 0
|
| 125 |
+
config_name: test_sb3
|
| 126 |
+
env_set: {}
|
| 127 |
+
env_copy: []
|
| 128 |
+
config:
|
| 129 |
+
override_dirname:
|
| 130 |
+
kv_sep: '='
|
| 131 |
+
item_sep: ','
|
| 132 |
+
exclude_keys: []
|
| 133 |
+
runtime:
|
| 134 |
+
version: 1.3.2
|
| 135 |
+
version_base: '1.3'
|
| 136 |
+
cwd: /cephfs/users/becktepe/git_projects/FluidGym
|
| 137 |
+
config_sources:
|
| 138 |
+
- path: hydra.conf
|
| 139 |
+
schema: pkg
|
| 140 |
+
provider: hydra
|
| 141 |
+
- path: /cephfs/users/becktepe/git_projects/FluidGym/runscripts/configs
|
| 142 |
+
schema: file
|
| 143 |
+
provider: main
|
| 144 |
+
- path: hydra_plugins.hydra_colorlog.conf
|
| 145 |
+
schema: pkg
|
| 146 |
+
provider: hydra-colorlog
|
| 147 |
+
- path: ''
|
| 148 |
+
schema: structured
|
| 149 |
+
provider: schema
|
| 150 |
+
output_dir: /cephfs/users/becktepe/git_projects/FluidGym/output/training/marl/RBC3D-medium-v0/PPO/3
|
| 151 |
+
choices:
|
| 152 |
+
cluster: local
|
| 153 |
+
algorithm: sb3_ppo
|
| 154 |
+
hydra/env: default
|
| 155 |
+
hydra/callbacks: null
|
| 156 |
+
hydra/job_logging: default
|
| 157 |
+
hydra/hydra_logging: default
|
| 158 |
+
hydra/hydra_help: default
|
| 159 |
+
hydra/help: default
|
| 160 |
+
hydra/sweeper: basic
|
| 161 |
+
hydra/launcher: basic
|
| 162 |
+
hydra/output: default
|
| 163 |
+
verbose: false
|
3/multirun.yaml
ADDED
|
@@ -0,0 +1,221 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
hydra:
|
| 2 |
+
run:
|
| 3 |
+
dir: output/training/${rl_mode}/${env_id}/${algorithm.name}/${seed}
|
| 4 |
+
sweep:
|
| 5 |
+
dir: output/training/${rl_mode}/${env_id}/${algorithm.name}/${seed}
|
| 6 |
+
subdir: ''
|
| 7 |
+
launcher:
|
| 8 |
+
_target_: hydra._internal.core_plugins.basic_launcher.BasicLauncher
|
| 9 |
+
sweeper:
|
| 10 |
+
_target_: hydra._internal.core_plugins.basic_sweeper.BasicSweeper
|
| 11 |
+
max_batch_size: null
|
| 12 |
+
params: null
|
| 13 |
+
help:
|
| 14 |
+
app_name: ${hydra.job.name}
|
| 15 |
+
header: '${hydra.help.app_name} is powered by Hydra.
|
| 16 |
+
|
| 17 |
+
'
|
| 18 |
+
footer: 'Powered by Hydra (https://hydra.cc)
|
| 19 |
+
|
| 20 |
+
Use --hydra-help to view Hydra specific help
|
| 21 |
+
|
| 22 |
+
'
|
| 23 |
+
template: '${hydra.help.header}
|
| 24 |
+
|
| 25 |
+
== Configuration groups ==
|
| 26 |
+
|
| 27 |
+
Compose your configuration from those groups (group=option)
|
| 28 |
+
|
| 29 |
+
|
| 30 |
+
$APP_CONFIG_GROUPS
|
| 31 |
+
|
| 32 |
+
|
| 33 |
+
== Config ==
|
| 34 |
+
|
| 35 |
+
Override anything in the config (foo.bar=value)
|
| 36 |
+
|
| 37 |
+
|
| 38 |
+
$CONFIG
|
| 39 |
+
|
| 40 |
+
|
| 41 |
+
${hydra.help.footer}
|
| 42 |
+
|
| 43 |
+
'
|
| 44 |
+
hydra_help:
|
| 45 |
+
template: 'Hydra (${hydra.runtime.version})
|
| 46 |
+
|
| 47 |
+
See https://hydra.cc for more info.
|
| 48 |
+
|
| 49 |
+
|
| 50 |
+
== Flags ==
|
| 51 |
+
|
| 52 |
+
$FLAGS_HELP
|
| 53 |
+
|
| 54 |
+
|
| 55 |
+
== Configuration groups ==
|
| 56 |
+
|
| 57 |
+
Compose your configuration from those groups (For example, append hydra/job_logging=disabled
|
| 58 |
+
to command line)
|
| 59 |
+
|
| 60 |
+
|
| 61 |
+
$HYDRA_CONFIG_GROUPS
|
| 62 |
+
|
| 63 |
+
|
| 64 |
+
Use ''--cfg hydra'' to Show the Hydra config.
|
| 65 |
+
|
| 66 |
+
'
|
| 67 |
+
hydra_help: ???
|
| 68 |
+
hydra_logging:
|
| 69 |
+
version: 1
|
| 70 |
+
formatters:
|
| 71 |
+
simple:
|
| 72 |
+
format: '[%(asctime)s][HYDRA] %(message)s'
|
| 73 |
+
handlers:
|
| 74 |
+
console:
|
| 75 |
+
class: logging.StreamHandler
|
| 76 |
+
formatter: simple
|
| 77 |
+
stream: ext://sys.stdout
|
| 78 |
+
root:
|
| 79 |
+
level: INFO
|
| 80 |
+
handlers:
|
| 81 |
+
- console
|
| 82 |
+
loggers:
|
| 83 |
+
logging_example:
|
| 84 |
+
level: DEBUG
|
| 85 |
+
disable_existing_loggers: false
|
| 86 |
+
job_logging:
|
| 87 |
+
version: 1
|
| 88 |
+
formatters:
|
| 89 |
+
simple:
|
| 90 |
+
format: '[%(asctime)s][%(name)s][%(levelname)s] - %(message)s'
|
| 91 |
+
handlers:
|
| 92 |
+
console:
|
| 93 |
+
class: logging.StreamHandler
|
| 94 |
+
formatter: simple
|
| 95 |
+
stream: ext://sys.stdout
|
| 96 |
+
file:
|
| 97 |
+
class: logging.FileHandler
|
| 98 |
+
formatter: simple
|
| 99 |
+
filename: ${hydra.runtime.output_dir}/${hydra.job.name}.log
|
| 100 |
+
root:
|
| 101 |
+
level: INFO
|
| 102 |
+
handlers:
|
| 103 |
+
- console
|
| 104 |
+
- file
|
| 105 |
+
disable_existing_loggers: false
|
| 106 |
+
env: {}
|
| 107 |
+
mode: MULTIRUN
|
| 108 |
+
searchpath: []
|
| 109 |
+
callbacks: {}
|
| 110 |
+
output_subdir: .
|
| 111 |
+
overrides:
|
| 112 |
+
hydra:
|
| 113 |
+
- hydra.mode=MULTIRUN
|
| 114 |
+
task:
|
| 115 |
+
- algorithm=sb3_ppo
|
| 116 |
+
- env_id=RBC3D-medium-v0
|
| 117 |
+
- rl_mode=marl
|
| 118 |
+
- seed=3
|
| 119 |
+
job:
|
| 120 |
+
name: test_sb3
|
| 121 |
+
chdir: true
|
| 122 |
+
override_dirname: algorithm=sb3_ppo,env_id=RBC3D-medium-v0,rl_mode=marl,seed=3
|
| 123 |
+
id: ???
|
| 124 |
+
num: ???
|
| 125 |
+
config_name: test_sb3
|
| 126 |
+
env_set: {}
|
| 127 |
+
env_copy: []
|
| 128 |
+
config:
|
| 129 |
+
override_dirname:
|
| 130 |
+
kv_sep: '='
|
| 131 |
+
item_sep: ','
|
| 132 |
+
exclude_keys: []
|
| 133 |
+
runtime:
|
| 134 |
+
version: 1.3.2
|
| 135 |
+
version_base: '1.3'
|
| 136 |
+
cwd: /cephfs/users/becktepe/git_projects/FluidGym
|
| 137 |
+
config_sources:
|
| 138 |
+
- path: hydra.conf
|
| 139 |
+
schema: pkg
|
| 140 |
+
provider: hydra
|
| 141 |
+
- path: /cephfs/users/becktepe/git_projects/FluidGym/runscripts/configs
|
| 142 |
+
schema: file
|
| 143 |
+
provider: main
|
| 144 |
+
- path: hydra_plugins.hydra_colorlog.conf
|
| 145 |
+
schema: pkg
|
| 146 |
+
provider: hydra-colorlog
|
| 147 |
+
- path: ''
|
| 148 |
+
schema: structured
|
| 149 |
+
provider: schema
|
| 150 |
+
output_dir: ???
|
| 151 |
+
choices:
|
| 152 |
+
cluster: local
|
| 153 |
+
algorithm: sb3_ppo
|
| 154 |
+
hydra/env: default
|
| 155 |
+
hydra/callbacks: null
|
| 156 |
+
hydra/job_logging: default
|
| 157 |
+
hydra/hydra_logging: default
|
| 158 |
+
hydra/hydra_help: default
|
| 159 |
+
hydra/help: default
|
| 160 |
+
hydra/sweeper: basic
|
| 161 |
+
hydra/launcher: basic
|
| 162 |
+
hydra/output: default
|
| 163 |
+
verbose: false
|
| 164 |
+
env_id: RBC3D-medium-v0
|
| 165 |
+
env_kwargs: {}
|
| 166 |
+
eval_env_kwargs: {}
|
| 167 |
+
seed: 3
|
| 168 |
+
rl_mode: marl
|
| 169 |
+
total_timesteps: 50000.0
|
| 170 |
+
n_eval_steps: 10
|
| 171 |
+
eval_freq: ${eval:${total_timesteps} // ${n_eval_steps}}
|
| 172 |
+
n_eval_episodes: 1
|
| 173 |
+
continue_training: false
|
| 174 |
+
checkpoint_latest: true
|
| 175 |
+
rl_device: cpu
|
| 176 |
+
eval_callback:
|
| 177 |
+
_target_: fluidgym.integration.sb3.EvalCallback
|
| 178 |
+
eval_freq: ${eval_freq}
|
| 179 |
+
n_eval_episodes: ${n_eval_episodes}
|
| 180 |
+
use_wandb: ${wandb.enable}
|
| 181 |
+
checkpoint_latest: ${checkpoint_latest}
|
| 182 |
+
wandb:
|
| 183 |
+
enable: true
|
| 184 |
+
entity: safe-autonomous-systems
|
| 185 |
+
project: jbecktepe-fluidgym
|
| 186 |
+
algorithm:
|
| 187 |
+
name: PPO
|
| 188 |
+
obj:
|
| 189 |
+
_target_: stable_baselines3.ppo.ppo.PPO
|
| 190 |
+
policy: MlpPolicy
|
| 191 |
+
learning_rate: 0.0003
|
| 192 |
+
n_steps: 2048
|
| 193 |
+
batch_size: 64
|
| 194 |
+
n_epochs: 10
|
| 195 |
+
gamma: 0.99
|
| 196 |
+
gae_lambda: 0.95
|
| 197 |
+
clip_range: 0.2
|
| 198 |
+
clip_range_vf: null
|
| 199 |
+
normalize_advantage: true
|
| 200 |
+
ent_coef: 0.01
|
| 201 |
+
vf_coef: 0.5
|
| 202 |
+
max_grad_norm: 0.5
|
| 203 |
+
use_sde: false
|
| 204 |
+
sde_sample_freq: -1
|
| 205 |
+
rollout_buffer_class: null
|
| 206 |
+
rollout_buffer_kwargs: null
|
| 207 |
+
target_kl: null
|
| 208 |
+
stats_window_size: 100
|
| 209 |
+
tensorboard_log: null
|
| 210 |
+
verbose: 0
|
| 211 |
+
seed: ${seed}
|
| 212 |
+
device: ${rl_device}
|
| 213 |
+
_init_setup_model: true
|
| 214 |
+
cluster: {}
|
| 215 |
+
test_env_id: ${env_id}
|
| 216 |
+
test_env_kwargs: ${env_kwargs}
|
| 217 |
+
test_rl_mode: ${rl_mode}
|
| 218 |
+
n_test_episodes: 10
|
| 219 |
+
deterministic: true
|
| 220 |
+
save_frames: true
|
| 221 |
+
render_3d: true
|
3/overrides.yaml
ADDED
|
@@ -0,0 +1,4 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
- algorithm=sb3_ppo
|
| 2 |
+
- env_id=RBC3D-medium-v0
|
| 3 |
+
- rl_mode=marl
|
| 4 |
+
- seed=3
|
3/test/3d_temperature_test_eval_episode_0.gif
ADDED
|
Git LFS Details
|
3/test/test_eval_episode_0.csv
ADDED
|
The diff for this file is too large to render.
See raw diff
|
|
|
3/test/x-y-temperature_test_eval_episode_0.gif
ADDED
|
Git LFS Details
|
3/test/x-z-temperature_test_eval_episode_0.gif
ADDED
|
Git LFS Details
|
3/test/y-z-temperature_test_eval_episode_0.gif
ADDED
|
Git LFS Details
|
3/training_log.csv
ADDED
|
@@ -0,0 +1,113 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
step,training/mean_reward,training/mean_global_reward,training/mean_nusselt,evaluation/mean_nusselt,evaluation/mean_reward
|
| 2 |
+
500,-0.07390627264976501,-0.07390628242492676,2.518049818515778,,
|
| 3 |
+
1000,-0.08724372833967209,-0.087243718624115,2.531387258052826,,
|
| 4 |
+
1500,-0.07559693604707718,-0.07559694385528565,2.519740481853485,,
|
| 5 |
+
2000,-0.07617391645908356,-0.07617391920089722,2.520317449092865,,
|
| 6 |
+
2500,-0.04141496121883392,-0.041414964199066165,2.485558495044708,,
|
| 7 |
+
3000,-0.051523543894290924,-0.05152354192733764,2.495667078971863,,
|
| 8 |
+
3500,-0.0371941514313221,-0.03719415283203125,2.4813376808166505,,
|
| 9 |
+
4000,-0.03483041375875473,-0.03483041477203369,2.478973955154419,,
|
| 10 |
+
4500,0.0009665085235610604,0.0009665088653564453,2.4431770210266115,,
|
| 11 |
+
5000,-0.005294564180076122,-0.005294564247131347,2.4494381065368653,,
|
| 12 |
+
5000,,,,2.31602064371109,0.12812289595603943
|
| 13 |
+
5500,0.004257561173290014,0.004257560729980469,2.4398859729766844,,
|
| 14 |
+
6000,0.0017888316651806235,0.0017888317108154298,2.442354696273804,,
|
| 15 |
+
6500,0.02558412216603756,0.025584121704101563,2.418559416294098,,
|
| 16 |
+
7000,0.050269726663827896,0.050269726276397704,2.3938738136291504,,
|
| 17 |
+
7500,0.03176252916455269,0.03176252555847168,2.412381003856659,,
|
| 18 |
+
8000,0.03976239636540413,0.03976239585876465,2.404381154060364,,
|
| 19 |
+
8500,0.07413981854915619,0.07413981866836548,2.3700037245750427,,
|
| 20 |
+
9000,0.08669136464595795,0.08669136905670166,2.3574521565437316,,
|
| 21 |
+
9500,0.10101397335529327,0.10101397848129272,2.343129569530487,,
|
| 22 |
+
10000,0.10231971740722656,0.10231971454620362,2.3418238105773925,,
|
| 23 |
+
10000,,,,2.205227777957916,0.23891577124595642
|
| 24 |
+
10500,0.11757748574018478,0.11757749319076538,2.326566038608551,,
|
| 25 |
+
11000,0.12777704000473022,0.12777705097198486,2.3163664717674255,,
|
| 26 |
+
11500,0.11625555157661438,0.11625556039810181,2.3278879837989805,,
|
| 27 |
+
12000,0.09639664739370346,0.09639664316177368,2.34774689245224,,
|
| 28 |
+
12500,0.11421811580657959,0.11421811819076538,2.3299254179000854,,
|
| 29 |
+
13000,0.11440875381231308,0.11440875434875489,2.329734779834747,,
|
| 30 |
+
13500,0.09974504262208939,0.09974504709243774,2.3443984932899475,,
|
| 31 |
+
14000,0.11173249036073685,0.11173248386383057,2.3324110498428343,,
|
| 32 |
+
14500,0.12371999025344849,0.12371998596191407,2.320423544406891,,
|
| 33 |
+
15000,0.10063192993402481,0.10063192558288574,2.343511613368988,,
|
| 34 |
+
15000,,,,2.183921078443527,0.2602224349975586
|
| 35 |
+
15500,0.13624313473701477,0.13624313402175903,2.3079004073143006,,
|
| 36 |
+
16000,0.1314019113779068,0.131401921749115,2.312741620540619,,
|
| 37 |
+
16500,0.12276434153318405,0.1227643494606018,2.321379185676575,,
|
| 38 |
+
17000,0.15706594288349152,0.1570659384727478,2.2870775899887086,,
|
| 39 |
+
17500,0.1507042795419693,0.1507042899131775,2.2934392328262327,,
|
| 40 |
+
18000,0.13904492557048798,0.13904491662979127,2.305098618984222,,
|
| 41 |
+
18500,0.10918829590082169,0.1091882939338684,2.334955247402191,,
|
| 42 |
+
19000,0.13520114123821259,0.13520115184783935,2.308942383289337,,
|
| 43 |
+
19500,0.13481640815734863,0.13481641006469727,2.309327122211456,,
|
| 44 |
+
20000,0.13992148637771606,0.13992150020599364,2.304222029209137,,
|
| 45 |
+
20000,,,,2.1812509286403654,0.26289260387420654
|
| 46 |
+
20500,0.13818001747131348,0.13818002653121947,2.305963505744934,,
|
| 47 |
+
21000,0.1507529616355896,0.1507529706954956,2.2933905725479127,,
|
| 48 |
+
21500,0.14281274378299713,0.1428127450942993,2.3013307847976683,,
|
| 49 |
+
22000,0.14474648237228394,0.1447464761734009,2.2993970580101015,,
|
| 50 |
+
22500,0.1291736513376236,0.12917363500595092,2.3149699010849,,
|
| 51 |
+
23000,0.14184033870697021,0.14184032726287843,2.3023032054901122,,
|
| 52 |
+
23500,0.16246497631072998,0.16246499729156494,2.2816785368919374,,
|
| 53 |
+
24000,0.16510120034217834,0.16510118865966797,2.279042347431183,,
|
| 54 |
+
24500,0.14208242297172546,0.14208242750167846,2.3020611071586607,,
|
| 55 |
+
25000,0.1492636352777481,0.14926364707946776,2.2948798971176148,,
|
| 56 |
+
25000,,,,2.129824488162994,0.31431901454925537
|
| 57 |
+
25500,0.14894090592861176,0.14894090557098388,2.2952026290893555,,
|
| 58 |
+
26000,0.1577991098165512,0.15779911184310913,2.2863444185256956,,
|
| 59 |
+
26500,0.15204346179962158,0.15204343128204345,2.2921001014709472,,
|
| 60 |
+
27000,0.1549072563648224,0.15490724515914917,2.2892362823486327,,
|
| 61 |
+
27500,0.14777664840221405,0.14777664136886598,2.296366892337799,,
|
| 62 |
+
28000,0.14107440412044525,0.14107440757751466,2.3030691332817077,,
|
| 63 |
+
28500,0.13092312216758728,0.1309231128692627,2.313220422267914,,
|
| 64 |
+
29000,0.145025372505188,0.1450253653526306,2.2991181592941285,,
|
| 65 |
+
29500,0.16985982656478882,0.16985982322692872,2.274283724784851,,
|
| 66 |
+
30000,0.143903911113739,0.14390391874313355,2.300239607810974,,
|
| 67 |
+
30000,,,,2.1115304112434385,0.33261311054229736
|
| 68 |
+
30500,0.1811332106590271,0.18113322067260743,2.2630103130340578,,
|
| 69 |
+
31000,0.17133885622024536,0.1713388419151306,2.272804693698883,,
|
| 70 |
+
31500,0.14383167028427124,0.1438316683769226,2.3003118591308596,,
|
| 71 |
+
32000,0.16668915748596191,0.1666891632080078,2.277454363822937,,
|
| 72 |
+
32500,0.1647949516773224,0.16479495763778687,2.279348576068878,,
|
| 73 |
+
33000,0.16870209574699402,0.16870210218429565,2.275441444396973,,
|
| 74 |
+
33500,0.14940625429153442,0.14940624475479125,2.2947372879981995,,
|
| 75 |
+
34000,0.14929772913455963,0.1492977352142334,2.29484579706192,,
|
| 76 |
+
34500,0.1559593826532364,0.15595938968658446,2.2881841444969178,,
|
| 77 |
+
35000,0.15000000596046448,0.15000001049041747,2.2941435165405273,,
|
| 78 |
+
35000,,,,2.0977576458454132,0.3463858962059021
|
| 79 |
+
35500,0.16067169606685638,0.16067171716690062,2.2834718165397643,,
|
| 80 |
+
36000,0.1609184294939041,0.1609184274673462,2.2832251019477843,,
|
| 81 |
+
36500,0.1631198674440384,0.163119882106781,2.2810236520767213,,
|
| 82 |
+
37000,0.15903852880001068,0.15903852701187135,2.285105010032654,,
|
| 83 |
+
37500,0.17231398820877075,0.17231400728225707,2.2718295278549197,,
|
| 84 |
+
38000,0.150469109416008,0.1504691390991211,2.293674398422241,,
|
| 85 |
+
38500,0.17065496742725372,0.17065497636795043,2.2734885630607606,,
|
| 86 |
+
39000,0.1847417652606964,0.18474176502227782,2.2594017791748047,,
|
| 87 |
+
39500,0.1964797079563141,0.1964797053337097,2.2476638159751894,,
|
| 88 |
+
40000,0.1874154955148697,0.1874155035018921,2.256728018283844,,
|
| 89 |
+
40000,,,,2.081857109069824,0.36228641867637634
|
| 90 |
+
40500,0.1882760375738144,0.1882760157585144,2.255867521762848,,
|
| 91 |
+
41000,0.19848762452602386,0.19848761177062987,2.2456559267044067,,
|
| 92 |
+
41500,0.17876015603542328,0.1787601580619812,2.265383380413055,,
|
| 93 |
+
42000,0.19051851332187653,0.19051851844787598,2.2536250109672546,,
|
| 94 |
+
42500,0.16763806343078613,0.16763806772232057,2.276505458831787,,
|
| 95 |
+
43000,0.17176513373851776,0.1717651596069336,2.272378378868103,,
|
| 96 |
+
43500,0.1721804141998291,0.172180419921875,2.271963116645813,,
|
| 97 |
+
44000,0.163779154419899,0.16377915620803832,2.2803643798828124,,
|
| 98 |
+
44500,0.18140438199043274,0.18140438985824586,2.2627391352653503,,
|
| 99 |
+
45000,0.1873386800289154,0.18733866834640503,2.2568048696517944,,
|
| 100 |
+
45000,,,,2.0943012177944182,0.3498423099517822
|
| 101 |
+
45500,0.18842843174934387,0.18842843866348266,2.2557150955200194,,
|
| 102 |
+
46000,0.14761318266391754,0.14761318159103393,2.2965303511619566,,
|
| 103 |
+
46500,0.16771431267261505,0.1677143259048462,2.276429214477539,,
|
| 104 |
+
47000,0.19022445380687714,0.19022444677352907,2.25391908121109,,
|
| 105 |
+
47500,0.18850445747375488,0.18850445652008058,2.255639070034027,,
|
| 106 |
+
48000,0.18985414505004883,0.18985413122177125,2.254289398193359,,
|
| 107 |
+
48500,0.18755413591861725,0.18755411958694457,2.2565894050598145,,
|
| 108 |
+
49000,0.19055670499801636,0.1905567021369934,2.2535868368148804,,
|
| 109 |
+
49500,0.18797944486141205,0.1879794373512268,2.2561640863418577,,
|
| 110 |
+
50000,0.19208407402038574,0.1920840802192688,2.2520594539642333,,
|
| 111 |
+
50000,,,,2.0825169241428374,0.36162662506103516
|
| 112 |
+
50500,0.19545389711856842,0.19545391178131102,2.248689628601074,,
|
| 113 |
+
51000,0.17610549926757812,0.17610550546646117,2.268038013458252,,
|
4/ckpt_latest.zip
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:5369f1bb44e3d4993bcde1872585df43f6869d142a1f31560f2ad57c4ea26f8e
|
| 3 |
+
size 8844012
|
4/config.yaml
ADDED
|
@@ -0,0 +1,58 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
env_id: RBC3D-medium-v0
|
| 2 |
+
env_kwargs: {}
|
| 3 |
+
eval_env_kwargs: {}
|
| 4 |
+
seed: 4
|
| 5 |
+
rl_mode: marl
|
| 6 |
+
total_timesteps: 50000.0
|
| 7 |
+
n_eval_steps: 10
|
| 8 |
+
eval_freq: ${eval:${total_timesteps} // ${n_eval_steps}}
|
| 9 |
+
n_eval_episodes: 1
|
| 10 |
+
continue_training: false
|
| 11 |
+
checkpoint_latest: true
|
| 12 |
+
rl_device: cpu
|
| 13 |
+
eval_callback:
|
| 14 |
+
_target_: fluidgym.integration.sb3.EvalCallback
|
| 15 |
+
eval_freq: ${eval_freq}
|
| 16 |
+
n_eval_episodes: ${n_eval_episodes}
|
| 17 |
+
use_wandb: ${wandb.enable}
|
| 18 |
+
checkpoint_latest: ${checkpoint_latest}
|
| 19 |
+
wandb:
|
| 20 |
+
enable: true
|
| 21 |
+
entity: safe-autonomous-systems
|
| 22 |
+
project: jbecktepe-fluidgym
|
| 23 |
+
algorithm:
|
| 24 |
+
name: PPO
|
| 25 |
+
obj:
|
| 26 |
+
_target_: stable_baselines3.ppo.ppo.PPO
|
| 27 |
+
policy: MlpPolicy
|
| 28 |
+
learning_rate: 0.0003
|
| 29 |
+
n_steps: 2048
|
| 30 |
+
batch_size: 64
|
| 31 |
+
n_epochs: 10
|
| 32 |
+
gamma: 0.99
|
| 33 |
+
gae_lambda: 0.95
|
| 34 |
+
clip_range: 0.2
|
| 35 |
+
clip_range_vf: null
|
| 36 |
+
normalize_advantage: true
|
| 37 |
+
ent_coef: 0.01
|
| 38 |
+
vf_coef: 0.5
|
| 39 |
+
max_grad_norm: 0.5
|
| 40 |
+
use_sde: false
|
| 41 |
+
sde_sample_freq: -1
|
| 42 |
+
rollout_buffer_class: null
|
| 43 |
+
rollout_buffer_kwargs: null
|
| 44 |
+
target_kl: null
|
| 45 |
+
stats_window_size: 100
|
| 46 |
+
tensorboard_log: null
|
| 47 |
+
verbose: 0
|
| 48 |
+
seed: ${seed}
|
| 49 |
+
device: ${rl_device}
|
| 50 |
+
_init_setup_model: true
|
| 51 |
+
cluster: {}
|
| 52 |
+
test_env_id: ${env_id}
|
| 53 |
+
test_env_kwargs: ${env_kwargs}
|
| 54 |
+
test_rl_mode: ${rl_mode}
|
| 55 |
+
n_test_episodes: 10
|
| 56 |
+
deterministic: true
|
| 57 |
+
save_frames: true
|
| 58 |
+
render_3d: true
|
4/hydra.yaml
ADDED
|
@@ -0,0 +1,163 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
hydra:
|
| 2 |
+
run:
|
| 3 |
+
dir: output/training/${rl_mode}/${env_id}/${algorithm.name}/${seed}
|
| 4 |
+
sweep:
|
| 5 |
+
dir: output/training/${rl_mode}/${env_id}/${algorithm.name}/${seed}
|
| 6 |
+
subdir: ''
|
| 7 |
+
launcher:
|
| 8 |
+
_target_: hydra._internal.core_plugins.basic_launcher.BasicLauncher
|
| 9 |
+
sweeper:
|
| 10 |
+
_target_: hydra._internal.core_plugins.basic_sweeper.BasicSweeper
|
| 11 |
+
max_batch_size: null
|
| 12 |
+
params: null
|
| 13 |
+
help:
|
| 14 |
+
app_name: ${hydra.job.name}
|
| 15 |
+
header: '${hydra.help.app_name} is powered by Hydra.
|
| 16 |
+
|
| 17 |
+
'
|
| 18 |
+
footer: 'Powered by Hydra (https://hydra.cc)
|
| 19 |
+
|
| 20 |
+
Use --hydra-help to view Hydra specific help
|
| 21 |
+
|
| 22 |
+
'
|
| 23 |
+
template: '${hydra.help.header}
|
| 24 |
+
|
| 25 |
+
== Configuration groups ==
|
| 26 |
+
|
| 27 |
+
Compose your configuration from those groups (group=option)
|
| 28 |
+
|
| 29 |
+
|
| 30 |
+
$APP_CONFIG_GROUPS
|
| 31 |
+
|
| 32 |
+
|
| 33 |
+
== Config ==
|
| 34 |
+
|
| 35 |
+
Override anything in the config (foo.bar=value)
|
| 36 |
+
|
| 37 |
+
|
| 38 |
+
$CONFIG
|
| 39 |
+
|
| 40 |
+
|
| 41 |
+
${hydra.help.footer}
|
| 42 |
+
|
| 43 |
+
'
|
| 44 |
+
hydra_help:
|
| 45 |
+
template: 'Hydra (${hydra.runtime.version})
|
| 46 |
+
|
| 47 |
+
See https://hydra.cc for more info.
|
| 48 |
+
|
| 49 |
+
|
| 50 |
+
== Flags ==
|
| 51 |
+
|
| 52 |
+
$FLAGS_HELP
|
| 53 |
+
|
| 54 |
+
|
| 55 |
+
== Configuration groups ==
|
| 56 |
+
|
| 57 |
+
Compose your configuration from those groups (For example, append hydra/job_logging=disabled
|
| 58 |
+
to command line)
|
| 59 |
+
|
| 60 |
+
|
| 61 |
+
$HYDRA_CONFIG_GROUPS
|
| 62 |
+
|
| 63 |
+
|
| 64 |
+
Use ''--cfg hydra'' to Show the Hydra config.
|
| 65 |
+
|
| 66 |
+
'
|
| 67 |
+
hydra_help: ???
|
| 68 |
+
hydra_logging:
|
| 69 |
+
version: 1
|
| 70 |
+
formatters:
|
| 71 |
+
simple:
|
| 72 |
+
format: '[%(asctime)s][HYDRA] %(message)s'
|
| 73 |
+
handlers:
|
| 74 |
+
console:
|
| 75 |
+
class: logging.StreamHandler
|
| 76 |
+
formatter: simple
|
| 77 |
+
stream: ext://sys.stdout
|
| 78 |
+
root:
|
| 79 |
+
level: INFO
|
| 80 |
+
handlers:
|
| 81 |
+
- console
|
| 82 |
+
loggers:
|
| 83 |
+
logging_example:
|
| 84 |
+
level: DEBUG
|
| 85 |
+
disable_existing_loggers: false
|
| 86 |
+
job_logging:
|
| 87 |
+
version: 1
|
| 88 |
+
formatters:
|
| 89 |
+
simple:
|
| 90 |
+
format: '[%(asctime)s][%(name)s][%(levelname)s] - %(message)s'
|
| 91 |
+
handlers:
|
| 92 |
+
console:
|
| 93 |
+
class: logging.StreamHandler
|
| 94 |
+
formatter: simple
|
| 95 |
+
stream: ext://sys.stdout
|
| 96 |
+
file:
|
| 97 |
+
class: logging.FileHandler
|
| 98 |
+
formatter: simple
|
| 99 |
+
filename: ${hydra.runtime.output_dir}/${hydra.job.name}.log
|
| 100 |
+
root:
|
| 101 |
+
level: INFO
|
| 102 |
+
handlers:
|
| 103 |
+
- console
|
| 104 |
+
- file
|
| 105 |
+
disable_existing_loggers: false
|
| 106 |
+
env: {}
|
| 107 |
+
mode: MULTIRUN
|
| 108 |
+
searchpath: []
|
| 109 |
+
callbacks: {}
|
| 110 |
+
output_subdir: .
|
| 111 |
+
overrides:
|
| 112 |
+
hydra:
|
| 113 |
+
- hydra.mode=MULTIRUN
|
| 114 |
+
task:
|
| 115 |
+
- algorithm=sb3_ppo
|
| 116 |
+
- env_id=RBC3D-medium-v0
|
| 117 |
+
- rl_mode=marl
|
| 118 |
+
- seed=4
|
| 119 |
+
job:
|
| 120 |
+
name: test_sb3
|
| 121 |
+
chdir: true
|
| 122 |
+
override_dirname: algorithm=sb3_ppo,env_id=RBC3D-medium-v0,rl_mode=marl,seed=4
|
| 123 |
+
id: '0'
|
| 124 |
+
num: 0
|
| 125 |
+
config_name: test_sb3
|
| 126 |
+
env_set: {}
|
| 127 |
+
env_copy: []
|
| 128 |
+
config:
|
| 129 |
+
override_dirname:
|
| 130 |
+
kv_sep: '='
|
| 131 |
+
item_sep: ','
|
| 132 |
+
exclude_keys: []
|
| 133 |
+
runtime:
|
| 134 |
+
version: 1.3.2
|
| 135 |
+
version_base: '1.3'
|
| 136 |
+
cwd: /cephfs/users/becktepe/git_projects/FluidGym
|
| 137 |
+
config_sources:
|
| 138 |
+
- path: hydra.conf
|
| 139 |
+
schema: pkg
|
| 140 |
+
provider: hydra
|
| 141 |
+
- path: /cephfs/users/becktepe/git_projects/FluidGym/runscripts/configs
|
| 142 |
+
schema: file
|
| 143 |
+
provider: main
|
| 144 |
+
- path: hydra_plugins.hydra_colorlog.conf
|
| 145 |
+
schema: pkg
|
| 146 |
+
provider: hydra-colorlog
|
| 147 |
+
- path: ''
|
| 148 |
+
schema: structured
|
| 149 |
+
provider: schema
|
| 150 |
+
output_dir: /cephfs/users/becktepe/git_projects/FluidGym/output/training/marl/RBC3D-medium-v0/PPO/4
|
| 151 |
+
choices:
|
| 152 |
+
cluster: local
|
| 153 |
+
algorithm: sb3_ppo
|
| 154 |
+
hydra/env: default
|
| 155 |
+
hydra/callbacks: null
|
| 156 |
+
hydra/job_logging: default
|
| 157 |
+
hydra/hydra_logging: default
|
| 158 |
+
hydra/hydra_help: default
|
| 159 |
+
hydra/help: default
|
| 160 |
+
hydra/sweeper: basic
|
| 161 |
+
hydra/launcher: basic
|
| 162 |
+
hydra/output: default
|
| 163 |
+
verbose: false
|
4/multirun.yaml
ADDED
|
@@ -0,0 +1,221 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
hydra:
|
| 2 |
+
run:
|
| 3 |
+
dir: output/training/${rl_mode}/${env_id}/${algorithm.name}/${seed}
|
| 4 |
+
sweep:
|
| 5 |
+
dir: output/training/${rl_mode}/${env_id}/${algorithm.name}/${seed}
|
| 6 |
+
subdir: ''
|
| 7 |
+
launcher:
|
| 8 |
+
_target_: hydra._internal.core_plugins.basic_launcher.BasicLauncher
|
| 9 |
+
sweeper:
|
| 10 |
+
_target_: hydra._internal.core_plugins.basic_sweeper.BasicSweeper
|
| 11 |
+
max_batch_size: null
|
| 12 |
+
params: null
|
| 13 |
+
help:
|
| 14 |
+
app_name: ${hydra.job.name}
|
| 15 |
+
header: '${hydra.help.app_name} is powered by Hydra.
|
| 16 |
+
|
| 17 |
+
'
|
| 18 |
+
footer: 'Powered by Hydra (https://hydra.cc)
|
| 19 |
+
|
| 20 |
+
Use --hydra-help to view Hydra specific help
|
| 21 |
+
|
| 22 |
+
'
|
| 23 |
+
template: '${hydra.help.header}
|
| 24 |
+
|
| 25 |
+
== Configuration groups ==
|
| 26 |
+
|
| 27 |
+
Compose your configuration from those groups (group=option)
|
| 28 |
+
|
| 29 |
+
|
| 30 |
+
$APP_CONFIG_GROUPS
|
| 31 |
+
|
| 32 |
+
|
| 33 |
+
== Config ==
|
| 34 |
+
|
| 35 |
+
Override anything in the config (foo.bar=value)
|
| 36 |
+
|
| 37 |
+
|
| 38 |
+
$CONFIG
|
| 39 |
+
|
| 40 |
+
|
| 41 |
+
${hydra.help.footer}
|
| 42 |
+
|
| 43 |
+
'
|
| 44 |
+
hydra_help:
|
| 45 |
+
template: 'Hydra (${hydra.runtime.version})
|
| 46 |
+
|
| 47 |
+
See https://hydra.cc for more info.
|
| 48 |
+
|
| 49 |
+
|
| 50 |
+
== Flags ==
|
| 51 |
+
|
| 52 |
+
$FLAGS_HELP
|
| 53 |
+
|
| 54 |
+
|
| 55 |
+
== Configuration groups ==
|
| 56 |
+
|
| 57 |
+
Compose your configuration from those groups (For example, append hydra/job_logging=disabled
|
| 58 |
+
to command line)
|
| 59 |
+
|
| 60 |
+
|
| 61 |
+
$HYDRA_CONFIG_GROUPS
|
| 62 |
+
|
| 63 |
+
|
| 64 |
+
Use ''--cfg hydra'' to Show the Hydra config.
|
| 65 |
+
|
| 66 |
+
'
|
| 67 |
+
hydra_help: ???
|
| 68 |
+
hydra_logging:
|
| 69 |
+
version: 1
|
| 70 |
+
formatters:
|
| 71 |
+
simple:
|
| 72 |
+
format: '[%(asctime)s][HYDRA] %(message)s'
|
| 73 |
+
handlers:
|
| 74 |
+
console:
|
| 75 |
+
class: logging.StreamHandler
|
| 76 |
+
formatter: simple
|
| 77 |
+
stream: ext://sys.stdout
|
| 78 |
+
root:
|
| 79 |
+
level: INFO
|
| 80 |
+
handlers:
|
| 81 |
+
- console
|
| 82 |
+
loggers:
|
| 83 |
+
logging_example:
|
| 84 |
+
level: DEBUG
|
| 85 |
+
disable_existing_loggers: false
|
| 86 |
+
job_logging:
|
| 87 |
+
version: 1
|
| 88 |
+
formatters:
|
| 89 |
+
simple:
|
| 90 |
+
format: '[%(asctime)s][%(name)s][%(levelname)s] - %(message)s'
|
| 91 |
+
handlers:
|
| 92 |
+
console:
|
| 93 |
+
class: logging.StreamHandler
|
| 94 |
+
formatter: simple
|
| 95 |
+
stream: ext://sys.stdout
|
| 96 |
+
file:
|
| 97 |
+
class: logging.FileHandler
|
| 98 |
+
formatter: simple
|
| 99 |
+
filename: ${hydra.runtime.output_dir}/${hydra.job.name}.log
|
| 100 |
+
root:
|
| 101 |
+
level: INFO
|
| 102 |
+
handlers:
|
| 103 |
+
- console
|
| 104 |
+
- file
|
| 105 |
+
disable_existing_loggers: false
|
| 106 |
+
env: {}
|
| 107 |
+
mode: MULTIRUN
|
| 108 |
+
searchpath: []
|
| 109 |
+
callbacks: {}
|
| 110 |
+
output_subdir: .
|
| 111 |
+
overrides:
|
| 112 |
+
hydra:
|
| 113 |
+
- hydra.mode=MULTIRUN
|
| 114 |
+
task:
|
| 115 |
+
- algorithm=sb3_ppo
|
| 116 |
+
- env_id=RBC3D-medium-v0
|
| 117 |
+
- rl_mode=marl
|
| 118 |
+
- seed=4
|
| 119 |
+
job:
|
| 120 |
+
name: test_sb3
|
| 121 |
+
chdir: true
|
| 122 |
+
override_dirname: algorithm=sb3_ppo,env_id=RBC3D-medium-v0,rl_mode=marl,seed=4
|
| 123 |
+
id: ???
|
| 124 |
+
num: ???
|
| 125 |
+
config_name: test_sb3
|
| 126 |
+
env_set: {}
|
| 127 |
+
env_copy: []
|
| 128 |
+
config:
|
| 129 |
+
override_dirname:
|
| 130 |
+
kv_sep: '='
|
| 131 |
+
item_sep: ','
|
| 132 |
+
exclude_keys: []
|
| 133 |
+
runtime:
|
| 134 |
+
version: 1.3.2
|
| 135 |
+
version_base: '1.3'
|
| 136 |
+
cwd: /cephfs/users/becktepe/git_projects/FluidGym
|
| 137 |
+
config_sources:
|
| 138 |
+
- path: hydra.conf
|
| 139 |
+
schema: pkg
|
| 140 |
+
provider: hydra
|
| 141 |
+
- path: /cephfs/users/becktepe/git_projects/FluidGym/runscripts/configs
|
| 142 |
+
schema: file
|
| 143 |
+
provider: main
|
| 144 |
+
- path: hydra_plugins.hydra_colorlog.conf
|
| 145 |
+
schema: pkg
|
| 146 |
+
provider: hydra-colorlog
|
| 147 |
+
- path: ''
|
| 148 |
+
schema: structured
|
| 149 |
+
provider: schema
|
| 150 |
+
output_dir: ???
|
| 151 |
+
choices:
|
| 152 |
+
cluster: local
|
| 153 |
+
algorithm: sb3_ppo
|
| 154 |
+
hydra/env: default
|
| 155 |
+
hydra/callbacks: null
|
| 156 |
+
hydra/job_logging: default
|
| 157 |
+
hydra/hydra_logging: default
|
| 158 |
+
hydra/hydra_help: default
|
| 159 |
+
hydra/help: default
|
| 160 |
+
hydra/sweeper: basic
|
| 161 |
+
hydra/launcher: basic
|
| 162 |
+
hydra/output: default
|
| 163 |
+
verbose: false
|
| 164 |
+
env_id: RBC3D-medium-v0
|
| 165 |
+
env_kwargs: {}
|
| 166 |
+
eval_env_kwargs: {}
|
| 167 |
+
seed: 4
|
| 168 |
+
rl_mode: marl
|
| 169 |
+
total_timesteps: 50000.0
|
| 170 |
+
n_eval_steps: 10
|
| 171 |
+
eval_freq: ${eval:${total_timesteps} // ${n_eval_steps}}
|
| 172 |
+
n_eval_episodes: 1
|
| 173 |
+
continue_training: false
|
| 174 |
+
checkpoint_latest: true
|
| 175 |
+
rl_device: cpu
|
| 176 |
+
eval_callback:
|
| 177 |
+
_target_: fluidgym.integration.sb3.EvalCallback
|
| 178 |
+
eval_freq: ${eval_freq}
|
| 179 |
+
n_eval_episodes: ${n_eval_episodes}
|
| 180 |
+
use_wandb: ${wandb.enable}
|
| 181 |
+
checkpoint_latest: ${checkpoint_latest}
|
| 182 |
+
wandb:
|
| 183 |
+
enable: true
|
| 184 |
+
entity: safe-autonomous-systems
|
| 185 |
+
project: jbecktepe-fluidgym
|
| 186 |
+
algorithm:
|
| 187 |
+
name: PPO
|
| 188 |
+
obj:
|
| 189 |
+
_target_: stable_baselines3.ppo.ppo.PPO
|
| 190 |
+
policy: MlpPolicy
|
| 191 |
+
learning_rate: 0.0003
|
| 192 |
+
n_steps: 2048
|
| 193 |
+
batch_size: 64
|
| 194 |
+
n_epochs: 10
|
| 195 |
+
gamma: 0.99
|
| 196 |
+
gae_lambda: 0.95
|
| 197 |
+
clip_range: 0.2
|
| 198 |
+
clip_range_vf: null
|
| 199 |
+
normalize_advantage: true
|
| 200 |
+
ent_coef: 0.01
|
| 201 |
+
vf_coef: 0.5
|
| 202 |
+
max_grad_norm: 0.5
|
| 203 |
+
use_sde: false
|
| 204 |
+
sde_sample_freq: -1
|
| 205 |
+
rollout_buffer_class: null
|
| 206 |
+
rollout_buffer_kwargs: null
|
| 207 |
+
target_kl: null
|
| 208 |
+
stats_window_size: 100
|
| 209 |
+
tensorboard_log: null
|
| 210 |
+
verbose: 0
|
| 211 |
+
seed: ${seed}
|
| 212 |
+
device: ${rl_device}
|
| 213 |
+
_init_setup_model: true
|
| 214 |
+
cluster: {}
|
| 215 |
+
test_env_id: ${env_id}
|
| 216 |
+
test_env_kwargs: ${env_kwargs}
|
| 217 |
+
test_rl_mode: ${rl_mode}
|
| 218 |
+
n_test_episodes: 10
|
| 219 |
+
deterministic: true
|
| 220 |
+
save_frames: true
|
| 221 |
+
render_3d: true
|
4/overrides.yaml
ADDED
|
@@ -0,0 +1,4 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
- algorithm=sb3_ppo
|
| 2 |
+
- env_id=RBC3D-medium-v0
|
| 3 |
+
- rl_mode=marl
|
| 4 |
+
- seed=4
|