File size: 1,935 Bytes
6b24f5d |
{
"env_cls": "qiskit_gym.envs.synthesis.LinearFunctionEnv",
"env": {
"num_qubits": 4,
"difficulty": 1,
"gateset": [
[
"CX",
[
0,
1
]
],
[
"CX",
[
0,
3
]
],
[
"CX",
[
1,
0
]
],
[
"CX",
[
2,
3
]
],
[
"CX",
[
3,
0
]
],
[
"CX",
[
3,
2
]
]
],
"depth_slope": 2,
"max_depth": 128,
"metrics_weights": {
"n_cnots": 0.01,
"n_layers_cnots": 0.01,
"n_layers": 0.01,
"n_gates": 0.01
}
},
"policy_cls": "twisterl.nn.BasicPolicy",
"policy": {
"embedding_size": 512,
"common_layers": [
256
],
"policy_layers": [],
"value_layers": []
},
"algorithm_cls": "twisterl.rl.PPO",
"algorithm": {
"collecting": {
"num_cores": 32,
"num_episodes": 1024,
"lambda": 0.995,
"gamma": 0.995
},
"training": {
"num_epochs": 10,
"vf_coef": 0.8,
"ent_coef": 0.01,
"clip_ratio": 0.1,
"normalize_advantage": false
},
"learning": {
"diff_threshold": 0.85,
"diff_max": 256,
"diff_metric": "ppo_deterministic"
},
"optimizer": {
"lr": 0.0003
},
"evals": {
"ppo_deterministic": {
"num_episodes": 100,
"deterministic": true,
"num_searches": 1,
"num_mcts_searches": 0,
"num_cores": 32,
"C": 1.41
},
"ppo_10": {
"num_episodes": 100,
"deterministic": false,
"num_searches": 10,
"num_mcts_searches": 0,
"num_cores": 32,
"C": 1.41
}
},
"logging": {
"log_freq": 1,
"checkpoint_freq": 10
}
}
}