File size: 2,544 Bytes

6b24f5d

{
  "env_cls": "qiskit_gym.envs.synthesis.LinearFunctionEnv",
  "env": {
    "num_qubits": 8,
    "difficulty": 1,
    "gateset": [
      [
        "CX",
        [
          0,
          1
        ]
      ],
      [
        "CX",
        [
          1,
          0
        ]
      ],
      [
        "CX",
        [
          1,
          2
        ]
      ],
      [
        "CX",
        [
          2,
          1
        ]
      ],
      [
        "CX",
        [
          2,
          4
        ]
      ],
      [
        "CX",
        [
          3,
          6
        ]
      ],
      [
        "CX",
        [
          4,
          2
        ]
      ],
      [
        "CX",
        [
          4,
          5
        ]
      ],
      [
        "CX",
        [
          4,
          7
        ]
      ],
      [
        "CX",
        [
          5,
          4
        ]
      ],
      [
        "CX",
        [
          5,
          6
        ]
      ],
      [
        "CX",
        [
          6,
          3
        ]
      ],
      [
        "CX",
        [
          6,
          5
        ]
      ],
      [
        "CX",
        [
          7,
          4
        ]
      ]
    ],
    "depth_slope": 2,
    "max_depth": 512,
    "metrics_weights": {
      "n_cnots": 0.01,
      "n_layers_cnots": 0.01,
      "n_layers": 0.01,
      "n_gates": 0.01
    }
  },
  "policy_cls": "twisterl.nn.BasicPolicy",
  "policy": {
    "embedding_size": 512,
    "common_layers": [
      256
    ],
    "policy_layers": [],
    "value_layers": []
  },
  "algorithm_cls": "twisterl.rl.PPO",
  "algorithm": {
    "collecting": {
      "num_cores": 32,
      "num_episodes": 1024,
      "lambda": 0.995,
      "gamma": 0.995
    },
    "training": {
      "num_epochs": 10,
      "vf_coef": 0.8,
      "ent_coef": 0.01,
      "clip_ratio": 0.1,
      "normalize_advantage": false
    },
    "learning": {
      "diff_threshold": 0.85,
      "diff_max": 1024,
      "diff_metric": "ppo_deterministic"
    },
    "optimizer": {
      "lr": 0.0003
    },
    "evals": {
      "ppo_deterministic": {
        "num_episodes": 100,
        "deterministic": true,
        "num_searches": 1,
        "num_mcts_searches": 0,
        "num_cores": 32,
        "C": 1.41
      },
      "ppo_10": {
        "num_episodes": 100,
        "deterministic": false,
        "num_searches": 10,
        "num_mcts_searches": 0,
        "num_cores": 32,
        "C": 1.41
      }
    },
    "logging": {
      "log_freq": 1,
      "checkpoint_freq": 10
    }
  }
}