FlowProt / model /ProteinMPNN /helper_scripts /assign_fixed_chains.py
alibtsd's picture
Deploy FlowProt Docker Space
f34af6f verified
Raw
History Blame Contribute Delete
1.64 kB
import argparse
def main(args):
    """Write a JSON dictionary assigning designed and fixed chains per entry.

    Reads ``args.input_path`` as JSON Lines (one JSON object per line). For
    each object, chain IDs are taken from the last character of every key
    that starts with ``"seq_chain"``. Chains listed in ``args.chain_list``
    (whitespace-separated) are marked as designed; if that list is empty,
    chain ``"A"`` is used. Every other chain found in the entry is marked as
    fixed. The mapping ``{name: [designed_chains, fixed_chains]}`` is written
    to ``args.output_path`` as a single JSON line.

    Args:
        args: Object with the attributes ``input_path`` (str),
            ``output_path`` (str) and ``chain_list`` (str).

    Raises:
        json.JSONDecodeError: If a non-blank input line is not valid JSON.
        KeyError: If an input object has no ``"name"`` key.
    """
    import json

    # "".split() is already [], so an empty or whitespace-only --chain_list
    # falls through to the default below.
    requested_chains = args.chain_list.split()
    # Default when no chains were requested: redesign chain "A" only.
    designed_chain_list = requested_chains if requested_chains else ["A"]

    my_dict = {}
    with open(args.input_path, "r") as json_file:
        for json_str in json_file:
            # Skip blank lines (e.g. a stray trailing newline) rather than
            # letting json.loads fail on them.
            if not json_str.strip():
                continue
            result = json.loads(json_str)
            # The chain ID is the last character of the key, e.g.
            # "seq_chain_A" -> "A"  =>  ['A', 'B', 'C', ...]
            all_chain_list = [
                key[-1:] for key in result if key.startswith("seq_chain")
            ]
            # Fix / do not redesign every chain that is not designed.
            fixed_chain_list = [
                letter
                for letter in all_chain_list
                if letter not in designed_chain_list
            ]
            my_dict[result["name"]] = (designed_chain_list, fixed_chain_list)

    with open(args.output_path, "w") as f:
        f.write(json.dumps(my_dict) + "\n")
if __name__ == "__main__":
    # Command-line entry point: parse the options and hand them to main().
    argparser = argparse.ArgumentParser(
        formatter_class=argparse.ArgumentDefaultsHelpFormatter
    )
    # Both paths are required: without them main() would call open(None)
    # and fail with an opaque TypeError instead of a usage message.
    argparser.add_argument(
        "--input_path",
        type=str,
        required=True,
        help="Path to the parsed PDBs",
    )
    argparser.add_argument(
        "--output_path",
        type=str,
        required=True,
        help="Path to the output dictionary",
    )
    # Whitespace-separated chain IDs, e.g. --chain_list "A C"; when left
    # empty, main() designs chain "A".
    argparser.add_argument(
        "--chain_list",
        type=str,
        default="",
        help="List of the chains that need to be designed",
    )

    args = argparser.parse_args()
    main(args)
# Example output: a single JSON object mapping each entry name to
# [designed_chains, fixed_chains]:
# {"5TTA": [["A"], ["B"]], "3LIS": [["A"], ["B"]]}