---
# Unity ML-Agents run configuration for the "Pyramids" behavior (PPO trainer).
# Nesting restored with 2-space block indentation; file-viewer residue (size
# banner, commit hashes, line-number gutter, trailing table pipe) removed.
# All keys and values are unchanged.
default_settings: null

behaviors:
  Pyramids:
    trainer_type: ppo
    hyperparameters:
      batch_size: 2048
      buffer_size: 20480
      learning_rate: 0.0003
      beta: 0.01
      epsilon: 0.2
      lambd: 0.95
      num_epoch: 8
      shared_critic: false
      learning_rate_schedule: linear
      beta_schedule: linear
      epsilon_schedule: linear
    checkpoint_interval: 120000
    # Policy network; the `memory` sub-map is set here (it is null in the
    # reward-signal networks below).
    network_settings:
      normalize: false
      hidden_units: 512
      num_layers: 3
      vis_encode_type: simple
      memory:
        sequence_length: 64
        memory_size: 256
      goal_conditioning_type: hyper
      deterministic: false
    # Two reward signals, each with its own network_settings.
    reward_signals:
      extrinsic:
        gamma: 0.99
        strength: 1.0
        network_settings:
          normalize: false
          hidden_units: 128
          num_layers: 2
          vis_encode_type: simple
          memory: null
          goal_conditioning_type: hyper
          deterministic: false
      rnd:
        gamma: 0.99
        strength: 0.01
        network_settings:
          normalize: false
          hidden_units: 64
          num_layers: 3
          vis_encode_type: simple
          memory: null
          goal_conditioning_type: hyper
          deterministic: false
        learning_rate: 0.0001
        encoding_size: null
    init_path: null
    keep_checkpoints: 100
    even_checkpoints: false
    max_steps: 6000000
    time_horizon: 128
    summary_freq: 30000
    threaded: false
    self_play: null
    behavioral_cloning: null

env_settings:
  env_path: ./training-envs-executables/linux/Pyramids/Pyramids
  env_args: null
  base_port: 5005
  num_envs: 10
  num_areas: 1
  timeout_wait: 60
  seed: -1
  max_lifetime_restarts: 10
  restarts_rate_limit_n: 1
  restarts_rate_limit_period_s: 60

engine_settings:
  width: 84
  height: 84
  quality_level: 5
  time_scale: 20
  target_frame_rate: -1
  capture_frame_rate: 60
  no_graphics: true
  no_graphics_monitor: false

environment_parameters: null

checkpoint_settings:
  run_id: Pyramids Training5 Memory
  initialize_from: null
  load_model: false
  # NOTE(review): resume is true, so this presumably expects an existing run
  # named by run_id under results_dir -- confirm before reusing this file.
  resume: true
  force: false
  train_model: false
  inference: false
  results_dir: results

torch_settings:
  device: null

debug: false