| hydra: | |
| run: | |
| dir: output/training/${rl_mode}/${env_id}/${algorithm.name}/${seed} | |
| sweep: | |
| dir: output/training/${rl_mode}/${env_id}/${algorithm.name}/${seed} | |
| subdir: '' | |
| launcher: | |
| _target_: hydra._internal.core_plugins.basic_launcher.BasicLauncher | |
| sweeper: | |
| _target_: hydra._internal.core_plugins.basic_sweeper.BasicSweeper | |
| max_batch_size: null | |
| params: null | |
| help: | |
| app_name: ${hydra.job.name} | |
| header: '${hydra.help.app_name} is powered by Hydra. | |
| ' | |
| footer: 'Powered by Hydra (https://hydra.cc) | |
| Use --hydra-help to view Hydra specific help | |
| ' | |
| template: '${hydra.help.header} | |
| == Configuration groups == | |
| Compose your configuration from those groups (group=option) | |
| $APP_CONFIG_GROUPS | |
| == Config == | |
| Override anything in the config (foo.bar=value) | |
| $CONFIG | |
| ${hydra.help.footer} | |
| ' | |
| hydra_help: | |
| template: 'Hydra (${hydra.runtime.version}) | |
| See https://hydra.cc for more info. | |
| == Flags == | |
| $FLAGS_HELP | |
| == Configuration groups == | |
| Compose your configuration from those groups (For example, append hydra/job_logging=disabled | |
| to command line) | |
| $HYDRA_CONFIG_GROUPS | |
| Use ''--cfg hydra'' to Show the Hydra config. | |
| ' | |
| hydra_help: ??? | |
| hydra_logging: | |
| version: 1 | |
| formatters: | |
| simple: | |
| format: '[%(asctime)s][HYDRA] %(message)s' | |
| handlers: | |
| console: | |
| class: logging.StreamHandler | |
| formatter: simple | |
| stream: ext://sys.stdout | |
| root: | |
| level: INFO | |
| handlers: | |
| - console | |
| loggers: | |
| logging_example: | |
| level: DEBUG | |
| disable_existing_loggers: false | |
| job_logging: | |
| version: 1 | |
| formatters: | |
| simple: | |
| format: '[%(asctime)s][%(name)s][%(levelname)s] - %(message)s' | |
| handlers: | |
| console: | |
| class: logging.StreamHandler | |
| formatter: simple | |
| stream: ext://sys.stdout | |
| file: | |
| class: logging.FileHandler | |
| formatter: simple | |
| filename: ${hydra.runtime.output_dir}/${hydra.job.name}.log | |
| root: | |
| level: INFO | |
| handlers: | |
| - console | |
| - file | |
| disable_existing_loggers: false | |
| env: {} | |
| mode: MULTIRUN | |
| searchpath: [] | |
| callbacks: {} | |
| output_subdir: . | |
| overrides: | |
| hydra: | |
| - hydra.mode=MULTIRUN | |
| task: | |
| - algorithm=sb3_ppo | |
| - env_id=RBC2D-medium-v0 | |
| - rl_mode=sarl | |
| - seed=2 | |
| job: | |
| name: test_sb3 | |
| chdir: true | |
| override_dirname: algorithm=sb3_ppo,env_id=RBC2D-medium-v0,rl_mode=sarl,seed=2 | |
| id: ??? | |
| num: ??? | |
| config_name: test_sb3 | |
| env_set: {} | |
| env_copy: [] | |
| config: | |
| override_dirname: | |
| kv_sep: '=' | |
| item_sep: ',' | |
| exclude_keys: [] | |
| runtime: | |
| version: 1.3.2 | |
| version_base: '1.3' | |
| cwd: /cephfs/users/becktepe/git_projects/FluidGym | |
| config_sources: | |
| - path: hydra.conf | |
| schema: pkg | |
| provider: hydra | |
| - path: /cephfs/users/becktepe/git_projects/FluidGym/runscripts/configs | |
| schema: file | |
| provider: main | |
| - path: '' | |
| schema: structured | |
| provider: schema | |
| output_dir: ??? | |
| choices: | |
| cluster: local | |
| algorithm: sb3_ppo | |
| hydra/env: default | |
| hydra/callbacks: null | |
| hydra/job_logging: default | |
| hydra/hydra_logging: default | |
| hydra/hydra_help: default | |
| hydra/help: default | |
| hydra/sweeper: basic | |
| hydra/launcher: basic | |
| hydra/output: default | |
| verbose: false | |
| env_id: RBC2D-medium-v0 | |
| env_kwargs: {} | |
| eval_env_kwargs: {} | |
| seed: 2 | |
| rl_mode: sarl | |
| total_timesteps: 50000.0 | |
| n_eval_steps: 10 | |
| eval_freq: ${eval:${total_timesteps} // ${n_eval_steps}} | |
| n_eval_episodes: 1 | |
| continue_training: false | |
| checkpoint_latest: true | |
| rl_device: cpu | |
| eval_callback: | |
| _target_: fluidgym.integration.sb3.EvalCallback | |
| eval_freq: ${eval_freq} | |
| n_eval_episodes: ${n_eval_episodes} | |
| use_wandb: ${wandb.enable} | |
| checkpoint_latest: ${checkpoint_latest} | |
| wandb: | |
| enable: true | |
| entity: safe-autonomous-systems | |
| project: jbecktepe-fluidgym | |
| algorithm: | |
| name: PPO | |
| obj: | |
| _target_: stable_baselines3.ppo.ppo.PPO | |
| policy: MlpPolicy | |
| learning_rate: 0.0003 | |
| n_steps: 2048 | |
| batch_size: 64 | |
| n_epochs: 10 | |
| gamma: 0.99 | |
| gae_lambda: 0.95 | |
| clip_range: 0.2 | |
| clip_range_vf: null | |
| normalize_advantage: true | |
| ent_coef: 0.01 | |
| vf_coef: 0.5 | |
| max_grad_norm: 0.5 | |
| use_sde: false | |
| sde_sample_freq: -1 | |
| rollout_buffer_class: null | |
| rollout_buffer_kwargs: null | |
| target_kl: null | |
| stats_window_size: 100 | |
| tensorboard_log: null | |
| verbose: 0 | |
| seed: ${seed} | |
| device: ${rl_device} | |
| _init_setup_model: true | |
| cluster: {} | |
| test_env_id: ${env_id} | |
| test_env_kwargs: ${env_kwargs} | |
| test_rl_mode: ${rl_mode} | |
| n_test_episodes: 10 | |
| deterministic: true | |
| save_frames: true | |
| render_3d: true | |