fatmacankara commited on
Commit
90f8374
·
1 Parent(s): 73f2f0c

Update code/add_alignment.py

Browse files
Files changed (1) hide show
  1. code/add_alignment.py +6 -3
code/add_alignment.py CHANGED
@@ -7,10 +7,9 @@ from Bio.pairwise2 import format_alignment
7
 
8
 
9
  def do_alignment(identifier, uniprotSequence, pdbSequence, alignment_path):
10
- #print(f'Aligning Datapoint: {identifier}')
11
  if len(pdbSequence) >= 1:
12
- f = open(Path(alignment_path / f'{identifier}_alignment.txt'),
13
- "w")
14
  aligner.mode = 'local'
15
  aligner.substitution_matrix = substitution_matrices.load("BLOSUM62")
16
  aligner.open_gap_score = -11
@@ -25,6 +24,7 @@ def do_alignment(identifier, uniprotSequence, pdbSequence, alignment_path):
25
  alignment = (str(alignment).strip().split('\n'))
26
  alignment = [''.join(['.' if m == ' ' else m for m in x]) for x in alignment]
27
  alignment_list.append(alignment)
 
28
  return alignment_list
29
 
30
 
@@ -308,8 +308,11 @@ def final_stage(df, annotation_list, alignment_path):
308
  for i in df.index:
309
  print('i',i)
310
  identifier = df.at[i, 'uniprotID'] + '_' + df.at[i, 'pdbID'] + '_' + df.at[i, 'chain'] + '_'
 
311
  alignment_list = do_alignment(identifier, df.at[i, 'uniprotSequence'], df.at[i, 'pdbSequence'], alignment_path)
312
  df.at[i, 'pdb_alignStatus'] = mutation_position_on_pdb(alignment_list, df.at[i, 'pos'])[0]
 
 
313
  df.at[i, 'mutationPositionOnPDB'] = mutation_position_on_pdb(alignment_list, df.at[i, 'pos'])[1]
314
  print('df',df)
315
  startGap = mutation_position_on_pdb(alignment_list, df.at[i, 'pos'])[2]
 
7
 
8
 
9
  def do_alignment(identifier, uniprotSequence, pdbSequence, alignment_path):
10
+ print(f'Aligning Datapoint: {identifier}')
11
  if len(pdbSequence) >= 1:
12
+ f = open(Path(alignment_path / f'{identifier}_alignment.txt'),"w")
 
13
  aligner.mode = 'local'
14
  aligner.substitution_matrix = substitution_matrices.load("BLOSUM62")
15
  aligner.open_gap_score = -11
 
24
  alignment = (str(alignment).strip().split('\n'))
25
  alignment = [''.join(['.' if m == ' ' else m for m in x]) for x in alignment]
26
  alignment_list.append(alignment)
27
+ print(alignment_list)
28
  return alignment_list
29
 
30
 
 
308
  for i in df.index:
309
  print('i',i)
310
  identifier = df.at[i, 'uniprotID'] + '_' + df.at[i, 'pdbID'] + '_' + df.at[i, 'chain'] + '_'
311
+ print('i',i)
312
  alignment_list = do_alignment(identifier, df.at[i, 'uniprotSequence'], df.at[i, 'pdbSequence'], alignment_path)
313
  df.at[i, 'pdb_alignStatus'] = mutation_position_on_pdb(alignment_list, df.at[i, 'pos'])[0]
314
+
315
+ print('df',df)
316
  df.at[i, 'mutationPositionOnPDB'] = mutation_position_on_pdb(alignment_list, df.at[i, 'pos'])[1]
317
  print('df',df)
318
  startGap = mutation_position_on_pdb(alignment_list, df.at[i, 'pos'])[2]