-
Notifications
You must be signed in to change notification settings - Fork 6
/
Copy pathreverse_aln_file.py
executable file
·58 lines (44 loc) · 1.31 KB
/
reverse_aln_file.py
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
#!/usr/bin/env python
import os
import sys
"""
Jens Luebeck
UC San Diego, Bioinformatics & Systems Biology
"""
rdd = {'+':'-', '-':'+'}
# output a reversed alignment from a segaligner _aln.txt file format.
alignment_file = sys.argv[1]
oname = os.path.splitext(os.path.basename(alignment_file))[0]
oname = oname.rstrip("\_aln")
oname += "_reversed_aln.txt"
with open(alignment_file) as infile, open(oname, 'w') as ofile:
ofile.write(next(infile))
seqline = next(infile)
# reverse the seq
fields = seqline.rsplit("\t")
seq = fields[0][1:].rsplit(",")
rseq = [x[:-1] + "-" if x[-1] == "+" else x[:-1] + "+" for x in seq[::-1]]
fields[0] = "#" + ",".join(rseq)
ofile.write("\t".join(fields))
# header
ofile.write(next(infile))
# alignment lines
lines = [l for l in infile]
max_ind = len(seq) - 1
if seq[0] == "0+":
leaveInitInd = False
max_ind -= 2
else:
leaveInitInd = True
rev_lines = []
for x in lines[::-1]:
fields = x.rsplit("\t")
fields[4] = rdd[fields[4]]
fields[5] = rdd[fields[5]]
san = int(fields[6])
if san != 0 or not leaveInitInd:
fields[6] = str(max_ind - san)
rev_lines.append("\t".join(fields))
for oline in rev_lines:
ofile.write(oline)