# Snapshot metadata from the file viewer: revision a58beb2, 1,394 bytes, 61 lines.
# Run configuration for a single-agent SAC experiment on RBC2D-medium-v0.
# Values of the form ${...} are interpolations that reference other keys in
# this file; mappings carrying a `_target_` key name the class to construct.

# --- Environment -----------------------------------------------------------
env_id: RBC2D-medium-v0
env_kwargs: {}
eval_env_kwargs: {}
seed: 2
rl_mode: sarl

# --- Training / evaluation schedule ----------------------------------------
# NOTE(review): total_timesteps is written as a float, so the floor division
# below may yield a float (5000.0) rather than an int -- confirm the consumer
# accepts that.
total_timesteps: 50000.0
n_eval_steps: 10
# `eval` is a custom resolver (presumably registered by the launching code);
# with the values above the expression is 50000.0 // 10.
eval_freq: ${eval:${total_timesteps} // ${n_eval_steps}}
n_eval_episodes: 1
continue_training: false
checkpoint_latest: true
# NOTE(review): this is `cpu` while algorithm.obj.device is `cuda` -- confirm
# the two are meant to differ.
rl_device: cpu

# --- Evaluation callback ---------------------------------------------------
# Every field except `_target_` mirrors a top-level setting via interpolation.
eval_callback:
  _target_: fluidgym.integration.sb3.EvalCallback
  eval_freq: ${eval_freq}
  n_eval_episodes: ${n_eval_episodes}
  use_wandb: ${wandb.enable}
  checkpoint_latest: ${checkpoint_latest}

# --- Weights & Biases logging ----------------------------------------------
wandb:
  enable: true
  entity: safe-autonomous-systems
  project: jbecktepe-fluidgym

# --- Algorithm -------------------------------------------------------------
algorithm:
  name: SAC
  # Keyword arguments for the class named in `_target_`.
  obj:
    _target_: stable_baselines3.sac.sac.SAC
    policy: MlpPolicy
    learning_rate: 0.0003
    buffer_size: 1000000
    learning_starts: 100
    batch_size: 256
    tau: 0.005
    gamma: 0.99
    train_freq: 1
    gradient_steps: -1
    action_noise: null
    replay_buffer_class: null
    replay_buffer_kwargs: null
    optimize_memory_usage: false
    ent_coef: auto
    target_update_interval: 1
    target_entropy: auto
    use_sde: false
    sde_sample_freq: -1
    use_sde_at_warmup: false
    stats_window_size: 100
    tensorboard_log: null
    policy_kwargs: {}
    verbose: 0
    # Resolves to the top-level `seed`.
    seed: ${seed}
    device: cuda
    _init_setup_model: true

cluster: {}

# --- Test-time settings ----------------------------------------------------
# Default to the training environment, kwargs and RL mode via interpolation.
test_env_id: ${env_id}
test_env_kwargs: ${env_kwargs}
test_rl_mode: ${rl_mode}
n_test_episodes: 10
deterministic: true
save_frames: true
render_3d: true