Spaces:
Sleeping
Sleeping
fatmacankara
committed on
Commit
·
90f8374
1
Parent(s):
73f2f0c
Update code/add_alignment.py
Browse files
- code/add_alignment.py +6 -3
code/add_alignment.py
CHANGED
@@ -7,10 +7,9 @@ from Bio.pairwise2 import format_alignment
|
|
7 |
|
8 |
|
9 |
def do_alignment(identifier, uniprotSequence, pdbSequence, alignment_path):
|
10 |
-
|
11 |
if len(pdbSequence) >= 1:
|
12 |
-
f = open(Path(alignment_path / f'{identifier}_alignment.txt'),
|
13 |
-
"w")
|
14 |
aligner.mode = 'local'
|
15 |
aligner.substitution_matrix = substitution_matrices.load("BLOSUM62")
|
16 |
aligner.open_gap_score = -11
|
@@ -25,6 +24,7 @@ def do_alignment(identifier, uniprotSequence, pdbSequence, alignment_path):
|
|
25 |
alignment = (str(alignment).strip().split('\n'))
|
26 |
alignment = [''.join(['.' if m == ' ' else m for m in x]) for x in alignment]
|
27 |
alignment_list.append(alignment)
|
|
|
28 |
return alignment_list
|
29 |
|
30 |
|
@@ -308,8 +308,11 @@ def final_stage(df, annotation_list, alignment_path):
|
|
308 |
for i in df.index:
|
309 |
print('i',i)
|
310 |
identifier = df.at[i, 'uniprotID'] + '_' + df.at[i, 'pdbID'] + '_' + df.at[i, 'chain'] + '_'
|
|
|
311 |
alignment_list = do_alignment(identifier, df.at[i, 'uniprotSequence'], df.at[i, 'pdbSequence'], alignment_path)
|
312 |
df.at[i, 'pdb_alignStatus'] = mutation_position_on_pdb(alignment_list, df.at[i, 'pos'])[0]
|
|
|
|
|
313 |
df.at[i, 'mutationPositionOnPDB'] = mutation_position_on_pdb(alignment_list, df.at[i, 'pos'])[1]
|
314 |
print('df',df)
|
315 |
startGap = mutation_position_on_pdb(alignment_list, df.at[i, 'pos'])[2]
|
|
|
7 |
|
8 |
|
9 |
def do_alignment(identifier, uniprotSequence, pdbSequence, alignment_path):
|
10 |
+
print(f'Aligning Datapoint: {identifier}')
|
11 |
if len(pdbSequence) >= 1:
|
12 |
+
f = open(Path(alignment_path / f'{identifier}_alignment.txt'),"w")
|
|
|
13 |
aligner.mode = 'local'
|
14 |
aligner.substitution_matrix = substitution_matrices.load("BLOSUM62")
|
15 |
aligner.open_gap_score = -11
|
|
|
24 |
alignment = (str(alignment).strip().split('\n'))
|
25 |
alignment = [''.join(['.' if m == ' ' else m for m in x]) for x in alignment]
|
26 |
alignment_list.append(alignment)
|
27 |
+
print(alignment_list)
|
28 |
return alignment_list
|
29 |
|
30 |
|
|
|
308 |
for i in df.index:
|
309 |
print('i',i)
|
310 |
identifier = df.at[i, 'uniprotID'] + '_' + df.at[i, 'pdbID'] + '_' + df.at[i, 'chain'] + '_'
|
311 |
+
print('i',i)
|
312 |
alignment_list = do_alignment(identifier, df.at[i, 'uniprotSequence'], df.at[i, 'pdbSequence'], alignment_path)
|
313 |
df.at[i, 'pdb_alignStatus'] = mutation_position_on_pdb(alignment_list, df.at[i, 'pos'])[0]
|
314 |
+
|
315 |
+
print('df',df)
|
316 |
df.at[i, 'mutationPositionOnPDB'] = mutation_position_on_pdb(alignment_list, df.at[i, 'pos'])[1]
|
317 |
print('df',df)
|
318 |
startGap = mutation_position_on_pdb(alignment_list, df.at[i, 'pos'])[2]
|