forked from andreas-wilm/compbio-utils
-
Notifications
You must be signed in to change notification settings - Fork 0
/
Copy pathdecode_ascii_phred.py
executable file
·89 lines (71 loc) · 2.58 KB
/
decode_ascii_phred.py
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
#!/usr/bin/env python
"""Decode ASCII-encoded phred scores.
Can replace certain (1-based, tab-delimited) columns with decoded values
and leave the rest untouched; without -c the whole line is decoded. Try e.g.

    samtools mpileup -s your.bam | decode_ascii_phred.py -c 6 7
"""
#--- standard library imports
#
import sys
import argparse
#--- third-party imports
#
# /
#--- project specific imports
#
# /
#--- module metadata
#
__author__ = "Andreas Wilm"
__version__ = "0.1"
__email__ = "andreas.wilm@gmail.com"
__license__ = "The MIT License (MIT)"
def decode_phred(ascii_enc_phred, offset=33):
    """Decode ASCII encoded phred qualities.

    Args:
        ascii_enc_phred: string of ASCII-encoded phred qualities, one
            character per quality value.
        offset: value subtracted from each character's code point to
            obtain the quality (33 by default).

    Yields:
        The decoded quality of each character as int, in input order.

    Raises:
        AssertionError: if a decoded value is outside 0..100. Since this
            is a generator, the error only surfaces once the offending
            character is reached during iteration.
    """
    for c in ascii_enc_phred:
        res = ord(c) - offset
        # Raised explicitly instead of via an `assert` statement: asserts
        # are stripped under `python -O`, which would let out-of-range
        # values pass silently. The exception type is kept unchanged so
        # existing callers are unaffected.
        if not 0 <= res <= 100:
            raise AssertionError("Phred quality for %c out of range" % c)
        yield res
def _format_quals(enc_quals, offset):
    """Return the qualities encoded in enc_quals as space-separated ints."""
    return ' '.join(["%s" % q for q in decode_phred(enc_quals, offset)])


def main():
    """Decode phred qualities read line by line from stdin and print them.

    Command line options:

    -e/--qualenc  ASCII offset of the quality encoding (33 or 64,
                  default 33).
    -c/--col      1-based, tab-delimited column(s) whose content is
                  replaced by the decoded qualities; all other columns
                  are passed through unchanged. Without this option the
                  whole line is decoded.

    Decoded qualities are written space-separated. Lines that are empty
    after stripping trailing whitespace are echoed as empty lines.
    """
    # http://docs.python.org/dev/howto/argparse.html
    parser = argparse.ArgumentParser()
    default = 33
    parser.add_argument("-e", "--qualenc",
                        choices=[33, 64], type=int, default=default,
                        help="Qualities are ASCII-encoded Phred +33"
                        " (e.g. Sanger, SRA, Illumina 1.8+) or +64"
                        " (e.g. Illumina 1.3-1.7). Default: %d" % default)
    parser.add_argument("-c", "--col",
                        type=int, nargs='*',
                        help="Decode qualities in this column"
                        " (tab delimited fields) and replace contents")
    args = parser.parse_args()

    # args.col is None (option absent) or a possibly empty list; both mean
    # "decode the whole line". A set makes the per-column lookup O(1).
    cols = set(args.col) if args.col else None

    # FIXME add file option
    fh = sys.stdin

    # sys.stdout.write() behaves the same on Python 2 and 3, whereas the
    # print statement is a syntax error on Python 3. It also avoids the
    # soft-space that `print x,` inserted before every tab, which broke
    # the tab-delimited output.
    write = sys.stdout.write

    for line in fh:
        line = line.rstrip()
        if not line:
            write("\n")
            continue

        if not cols:
            write(_format_quals(line, args.qualenc) + "\n")
            continue

        out_fields = []
        for (idx, col) in enumerate(line.split('\t')):
            # column numbers given on the command line are 1-based
            if idx + 1 in cols:
                out_fields.append(_format_quals(col, args.qualenc))
            else:
                out_fields.append(col)
        write("\t".join(out_fields) + "\n")
# Run the command line interface only when executed as a script,
# not when the module is imported.
if __name__ == "__main__":
    main()