File size: 2,216 Bytes
1e2ace7
 
d58868e
1e2ace7
 
99fc7ba
 
 
d58868e
1e2ace7
 
1db1ed4
1e2ace7
 
 
 
1db1ed4
1e2ace7
 
d58868e
99fc7ba
1e2ace7
433c774
 
 
1e2ace7
 
 
 
 
 
 
 
 
 
 
 
 
 
d58868e
 
 
 
 
 
 
 
 
 
 
 
 
1e2ace7
0fee85f
1e2ace7
1db1ed4
d58868e
 
1e2ace7
 
 
 
d58868e
1e2ace7
 
99fc7ba
1e2ace7
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
433c774
1e2ace7
 
1db1ed4
1e2ace7
 
 
 
 
 
 
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
# Explicit null: no value is set for default_settings in this file.
# NOTE(review): presumably this would hold settings shared by every entry
# under `behaviors` - confirm against the consumer's schema.
default_settings: null
# Per-behavior trainer settings, keyed by behavior name. `Pyramids` is the
# only behavior configured in this file.
behaviors:
  Pyramids:
    trainer_type: ppo
    # Hyperparameters for the `ppo` trainer type selected above.
    hyperparameters:
      batch_size: 2048
      # buffer_size is exactly 10 x batch_size.
      buffer_size: 20480
      learning_rate: 0.0003
      beta: 0.01
      epsilon: 0.2
      lambd: 0.95
      num_epoch: 8
      shared_critic: false
      # learning_rate, beta and epsilon each have a matching `*_schedule` key;
      # all three are set to `linear`.
      # NOTE(review): presumably a linear decay over max_steps - confirm.
      learning_rate_schedule: linear
      beta_schedule: linear
      epsilon_schedule: linear
    # max_steps (6000000) / checkpoint_interval (120000) = 50.
    checkpoint_interval: 120000
    # Network settings for the behavior itself. Each reward signal below
    # carries its own, separate network_settings mapping.
    network_settings:
      normalize: false
      hidden_units: 512
      num_layers: 3
      vis_encode_type: simple
      # memory is a mapping here but null in both reward-signal networks.
      # batch_size (2048) is an exact multiple of sequence_length (64).
      # NOTE(review): presumably this enables a recurrent memory for this
      # network only - confirm against the trainer documentation.
      memory:
        sequence_length: 64
        memory_size: 256
      goal_conditioning_type: hyper
      deterministic: false
    # Two reward signals are configured, both with gamma 0.99:
    # `extrinsic` (strength 1.0) and `rnd` (strength 0.01).
    reward_signals:
      extrinsic:
        gamma: 0.99
        strength: 1.0
        # 2 layers of 128 hidden units, no memory.
        network_settings:
          normalize: false
          hidden_units: 128
          num_layers: 2
          vis_encode_type: simple
          memory: null
          goal_conditioning_type: hyper
          deterministic: false
      # NOTE(review): `rnd` presumably stands for Random Network Distillation
      # (a curiosity-style intrinsic reward) - confirm.
      rnd:
        gamma: 0.99
        strength: 0.01
        # 3 layers of 64 hidden units, no memory.
        network_settings:
          normalize: false
          hidden_units: 64
          num_layers: 3
          vis_encode_type: simple
          memory: null
          goal_conditioning_type: hyper
          deterministic: false
        # learning_rate and encoding_size appear only on `rnd`, not on
        # `extrinsic`; this learning_rate is separate from the one under
        # hyperparameters (0.0003).
        learning_rate: 0.0001
        encoding_size: null
    init_path: null
    # keep_checkpoints (100) is larger than max_steps / checkpoint_interval
    # (50).
    # NOTE(review): so presumably no checkpoint is pruned during a full run
    # - confirm.
    keep_checkpoints: 100
    even_checkpoints: false
    max_steps: 6000000
    time_horizon: 128
    # checkpoint_interval (120000) is 4 x summary_freq.
    summary_freq: 30000
    threaded: false
    # Explicit nulls: neither self_play nor behavioral_cloning is configured.
    self_play: null
    behavioral_cloning: null
# Settings for the environment executable and how it is launched.
env_settings:
  # Relative path (starts with `./`), so it depends on the working directory
  # the consumer is started from. The path contains a `linux` component.
  env_path: ./training-envs-executables/linux/Pyramids/Pyramids
  env_args: null
  base_port: 5005
  # NOTE(review): presumably 10 environment instances run in parallel, using
  # ports counted up from base_port - confirm.
  num_envs: 10
  num_areas: 1
  timeout_wait: 60
  # NOTE(review): -1 is presumably a "choose a seed at run time" sentinel, in
  # which case runs are not reproducible - confirm.
  seed: -1
  max_lifetime_restarts: 10
  # NOTE(review): the two restarts_rate_limit_* keys presumably read together
  # as "at most n restarts per period_s seconds" - confirm.
  restarts_rate_limit_n: 1
  restarts_rate_limit_period_s: 60
# Settings for the engine that runs the environment.
engine_settings:
  # Square 84 x 84 size.
  # NOTE(review): presumably the window/render resolution in pixels - confirm.
  width: 84
  height: 84
  quality_level: 5
  # NOTE(review): presumably a simulation speed-up factor relative to real
  # time - confirm.
  time_scale: 20
  # NOTE(review): -1 presumably means "no frame-rate cap" - confirm.
  target_frame_rate: -1
  capture_frame_rate: 60
  # Graphics are disabled (no_graphics: true).
  # NOTE(review): vis_encode_type is set under behaviors; if any observation
  # is visual, confirm it still renders with graphics disabled.
  no_graphics: true
  no_graphics_monitor: false
# Explicit null: no environment parameters are set in this file.
environment_parameters: null
# Run identity and the flags controlling how the run starts.
checkpoint_settings:
  # Plain scalar containing spaces; YAML reads it as the single string
  # "Pyramids Training5 Memory".
  # NOTE(review): if run_id is used as a directory name under results_dir,
  # the resulting path contains spaces - confirm downstream tooling quotes it.
  run_id: Pyramids Training5 Memory
  initialize_from: null
  # NOTE(review): resume is true while load_model and train_model are both
  # false. Confirm which of these flags the consumer actually honours, and
  # that a previous run with this run_id exists to resume from.
  load_model: false
  resume: true
  force: false
  train_model: false
  inference: false
  # Relative directory name, resolved against the working directory.
  results_dir: results
# Explicit null device: no compute device is pinned in this file.
# NOTE(review): presumably the consumer then picks a device itself - confirm.
torch_settings:
  device: null
# Debug mode is off.
debug: false