{
  "env_cls": "qiskit_gym.envs.synthesis.LinearFunctionEnv",
  "env": {
    "num_qubits": 8,
    "difficulty": 1,
    "gateset": [
      [
        "CX",
        [
          0,
          1
        ]
      ],
      [
        "CX",
        [
          1,
          0
        ]
      ],
      [
        "CX",
        [
          1,
          2
        ]
      ],
      [
        "CX",
        [
          2,
          1
        ]
      ],
      [
        "CX",
        [
          2,
          4
        ]
      ],
      [
        "CX",
        [
          3,
          6
        ]
      ],
      [
        "CX",
        [
          4,
          2
        ]
      ],
      [
        "CX",
        [
          4,
          5
        ]
      ],
      [
        "CX",
        [
          4,
          7
        ]
      ],
      [
        "CX",
        [
          5,
          4
        ]
      ],
      [
        "CX",
        [
          5,
          6
        ]
      ],
      [
        "CX",
        [
          6,
          3
        ]
      ],
      [
        "CX",
        [
          6,
          5
        ]
      ],
      [
        "CX",
        [
          7,
          4
        ]
      ]
    ],
    "depth_slope": 2,
    "max_depth": 512,
    "metrics_weights": {
      "n_cnots": 0.01,
      "n_layers_cnots": 0.01,
      "n_layers": 0.01,
      "n_gates": 0.01
    }
  },
  "policy_cls": "twisterl.nn.BasicPolicy",
  "policy": {
    "embedding_size": 512,
    "common_layers": [
      256
    ],
    "policy_layers": [],
    "value_layers": []
  },
  "algorithm_cls": "twisterl.rl.PPO",
  "algorithm": {
    "collecting": {
      "num_cores": 32,
      "num_episodes": 1024,
      "lambda": 0.995,
      "gamma": 0.995
    },
    "training": {
      "num_epochs": 10,
      "vf_coef": 0.8,
      "ent_coef": 0.01,
      "clip_ratio": 0.1,
      "normalize_advantage": false
    },
    "learning": {
      "diff_threshold": 0.85,
      "diff_max": 1024,
      "diff_metric": "ppo_deterministic"
    },
    "optimizer": {
      "lr": 0.0003
    },
    "evals": {
      "ppo_deterministic": {
        "num_episodes": 100,
        "deterministic": true,
        "num_searches": 1,
        "num_mcts_searches": 0,
        "num_cores": 32,
        "C": 1.41
      },
      "ppo_10": {
        "num_episodes": 100,
        "deterministic": false,
        "num_searches": 10,
        "num_mcts_searches": 0,
        "num_cores": 32,
        "C": 1.41
      }
    },
    "logging": {
      "log_freq": 1,
      "checkpoint_freq": 10
    }
  }
}