Spaces:
Sleeping
Sleeping
Commit
·
90f8374
1
Parent(s):
73f2f0c
Update code/add_alignment.py
Browse files - code/add_alignment.py +6 -3
code/add_alignment.py
CHANGED
|
@@ -7,10 +7,9 @@ from Bio.pairwise2 import format_alignment
|
|
| 7 |
|
| 8 |
|
| 9 |
def do_alignment(identifier, uniprotSequence, pdbSequence, alignment_path):
|
| 10 |
-
|
| 11 |
if len(pdbSequence) >= 1:
|
| 12 |
-
f = open(Path(alignment_path / f'{identifier}_alignment.txt'),
|
| 13 |
-
"w")
|
| 14 |
aligner.mode = 'local'
|
| 15 |
aligner.substitution_matrix = substitution_matrices.load("BLOSUM62")
|
| 16 |
aligner.open_gap_score = -11
|
|
@@ -25,6 +24,7 @@ def do_alignment(identifier, uniprotSequence, pdbSequence, alignment_path):
|
|
| 25 |
alignment = (str(alignment).strip().split('\n'))
|
| 26 |
alignment = [''.join(['.' if m == ' ' else m for m in x]) for x in alignment]
|
| 27 |
alignment_list.append(alignment)
|
|
|
|
| 28 |
return alignment_list
|
| 29 |
|
| 30 |
|
|
@@ -308,8 +308,11 @@ def final_stage(df, annotation_list, alignment_path):
|
|
| 308 |
for i in df.index:
|
| 309 |
print('i',i)
|
| 310 |
identifier = df.at[i, 'uniprotID'] + '_' + df.at[i, 'pdbID'] + '_' + df.at[i, 'chain'] + '_'
|
|
|
|
| 311 |
alignment_list = do_alignment(identifier, df.at[i, 'uniprotSequence'], df.at[i, 'pdbSequence'], alignment_path)
|
| 312 |
df.at[i, 'pdb_alignStatus'] = mutation_position_on_pdb(alignment_list, df.at[i, 'pos'])[0]
|
|
|
|
|
|
|
| 313 |
df.at[i, 'mutationPositionOnPDB'] = mutation_position_on_pdb(alignment_list, df.at[i, 'pos'])[1]
|
| 314 |
print('df',df)
|
| 315 |
startGap = mutation_position_on_pdb(alignment_list, df.at[i, 'pos'])[2]
|
|
|
|
| 7 |
|
| 8 |
|
| 9 |
def do_alignment(identifier, uniprotSequence, pdbSequence, alignment_path):
|
| 10 |
+
print(f'Aligning Datapoint: {identifier}')
|
| 11 |
if len(pdbSequence) >= 1:
|
| 12 |
+
f = open(Path(alignment_path / f'{identifier}_alignment.txt'),"w")
|
|
|
|
| 13 |
aligner.mode = 'local'
|
| 14 |
aligner.substitution_matrix = substitution_matrices.load("BLOSUM62")
|
| 15 |
aligner.open_gap_score = -11
|
|
|
|
| 24 |
alignment = (str(alignment).strip().split('\n'))
|
| 25 |
alignment = [''.join(['.' if m == ' ' else m for m in x]) for x in alignment]
|
| 26 |
alignment_list.append(alignment)
|
| 27 |
+
print(alignment_list)
|
| 28 |
return alignment_list
|
| 29 |
|
| 30 |
|
|
|
|
| 308 |
for i in df.index:
|
| 309 |
print('i',i)
|
| 310 |
identifier = df.at[i, 'uniprotID'] + '_' + df.at[i, 'pdbID'] + '_' + df.at[i, 'chain'] + '_'
|
| 311 |
+
print('i',i)
|
| 312 |
alignment_list = do_alignment(identifier, df.at[i, 'uniprotSequence'], df.at[i, 'pdbSequence'], alignment_path)
|
| 313 |
df.at[i, 'pdb_alignStatus'] = mutation_position_on_pdb(alignment_list, df.at[i, 'pos'])[0]
|
| 314 |
+
|
| 315 |
+
print('df',df)
|
| 316 |
df.at[i, 'mutationPositionOnPDB'] = mutation_position_on_pdb(alignment_list, df.at[i, 'pos'])[1]
|
| 317 |
print('df',df)
|
| 318 |
startGap = mutation_position_on_pdb(alignment_list, df.at[i, 'pos'])[2]
|