"""Assign designed and fixed chains for each entry of a parsed-PDB JSON-lines file.

Every non-blank line of the input file is decoded as one JSON object.  Keys
starting with ``seq_chain`` identify the chains of that entry; each chain is
placed either in the "designed" list (chains named via ``--chain_list``, or
``["A"]`` when that option is empty) or in the "fixed" list (all remaining
chains).  The result is written as a single JSON dictionary keyed by the
entry's ``name`` field.
"""
import argparse
import json

# Chains that are designed when --chain_list is left empty.
_DEFAULT_DESIGNED_CHAINS = ["A"]


def _assign_chains(records, designed_chains):
    """Map each record name to a ``(designed_chains, fixed_chains)`` pair.

    Args:
        records: Iterable of decoded JSON objects; each must have a ``"name"``
            key, and its chain keys must start with ``"seq_chain"``.
        designed_chains: Chain identifiers to design.  When empty, the
            default ``["A"]`` is used for every record.

    Returns:
        A dict ``{name: (designed_chains, fixed_chains)}`` where
        ``fixed_chains`` lists the record's chains that are not designed,
        in the order their keys appear in the record.

    Raises:
        KeyError: If a record has no ``"name"`` key.
    """
    designed = list(designed_chains) if designed_chains else list(_DEFAULT_DESIGNED_CHAINS)
    designed_lookup = set(designed)  # O(1) membership checks inside the loop

    assignment = {}
    for record in records:
        # NOTE(review): only the last character of the key is used as the
        # chain id, so multi-character chain ids would be truncated --
        # confirm against the script that produces the input file.
        all_chains = [key[-1:] for key in record if key[:9] == "seq_chain"]
        # Chains that are not designed are fixed, i.e. not redesigned.
        fixed = [chain for chain in all_chains if chain not in designed_lookup]
        assignment[record["name"]] = (designed, fixed)
    return assignment


def main(args):
    """Read the parsed entries, split their chains, and write the result.

    Args:
        args: Namespace with ``input_path`` (JSON-lines file to read),
            ``output_path`` (file to write) and ``chain_list`` (whitespace
            separated chain identifiers to design; may be empty).
    """
    designed_chains = args.chain_list.split() if args.chain_list else []

    with open(args.input_path, "r", encoding="utf-8") as json_file:
        # Skip blank lines (e.g. a trailing newline) instead of failing on them.
        records = [json.loads(line) for line in json_file if line.strip()]

    assignment = _assign_chains(records, designed_chains)

    with open(args.output_path, "w") as f:
        f.write(json.dumps(assignment) + "\n")


if __name__ == "__main__":
    argparser = argparse.ArgumentParser(
        formatter_class=argparse.ArgumentDefaultsHelpFormatter
    )
    argparser.add_argument(
        "--input_path", type=str, required=True, help="Path to the parsed PDBs"
    )
    argparser.add_argument(
        "--output_path",
        type=str,
        required=True,
        help="Path to the output dictionary",
    )
    argparser.add_argument(
        "--chain_list",
        type=str,
        default="",
        help="List of the chains that need to be designed",
    )

    args = argparser.parse_args()
    main(args)

# Output looks like this:
# {"5TTA": [["A"], ["B"]], "3LIS": [["A"], ["B"]]}