forked from petercombs/dicty
-
Notifications
You must be signed in to change notification settings - Fork 0
/
BlastSummary.py
41 lines (33 loc) · 1.19 KB
/
BlastSummary.py
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
from argparse import ArgumentParser, FileType
from os.path import commonprefix
from collections import Counter
def parse_args(argv=None):
    """Parse command line arguments.

    Args:
        argv: Optional list of argument strings to parse. When None (the
            default) argparse falls back to ``sys.argv[1:]``, which is what
            the script entry point relies on.

    Returns:
        An ``argparse.Namespace`` with two attributes:

        * ``output`` -- a writable text file object opened by
          ``FileType("w")``, or None when ``--output``/``-o`` was not given.
          ``print(..., file=None)`` writes to standard output, so callers
          can pass the value straight to ``print``.
        * ``blast_files`` -- a non-empty list of input file paths.
    """
    parser = ArgumentParser(
        description="Tally Dictyostelium, bacterial and other eukaryotic "
        "hits in tab-separated BLAST result files."
    )
    parser.add_argument(
        "--output",
        "-o",
        type=FileType("w"),
        help="file to write the summary table to (default: standard output)",
    )
    parser.add_argument(
        "blast_files",
        nargs="+",
        help="one or more tab-separated BLAST result files to summarize",
    )
    return parser.parse_args(argv)
# Column labels of the summary table, in output order.  The same strings are
# used as the category keys returned by classify_hit().
CATEGORIES = ("Dicty", "Bacteria", "Other_Eukaryote")


def classify_hit(line):
    """Classify one line of a tab-separated BLAST result file.

    The second column is compared with "Bacteria" and "Eukaryota"; for a
    eukaryotic line the third column decides between Dictyostelium and any
    other eukaryote.  (Presumably these columns hold the taxonomic kingdom
    and the species name -- confirm against the pipeline that writes the
    files.)

    Args:
        line: One raw line of the input, with or without its line ending.

    Returns:
        "Bacteria", "Dicty" or "Other_Eukaryote", or None when the line
        belongs to none of these categories (including blank lines and lines
        with fewer than two columns).
    """
    # Drop the line ending first; otherwise it stays glued to the last
    # column and a two-column line would never match.
    fields = line.rstrip("\r\n").split("\t")
    if len(fields) < 2:
        return None
    kingdom = fields[1]
    if kingdom == "Bacteria":
        return "Bacteria"
    if kingdom == "Eukaryota":
        # A eukaryotic line without a third column cannot be identified as
        # Dictyostelium, so it is counted with the other eukaryotes.
        if len(fields) > 2 and fields[2].startswith("Dictyostelium"):
            return "Dicty"
        return "Other_Eukaryote"
    return None


def count_hits(lines):
    """Count the lines of each category in an iterable of lines.

    Args:
        lines: Any iterable of strings, e.g. an open text file.

    Returns:
        A ``Counter`` keyed by the labels in ``CATEGORIES``; categories that
        never occur read as 0.
    """
    counts = Counter()
    for line in lines:
        category = classify_hit(line)
        if category is not None:
            counts[category] += 1
    return counts


def short_name(fname, prefix):
    """Derive the row label for *fname* in the summary table.

    The shared *prefix* is removed from the start of the name only, and the
    text "/blastout.tsv" is removed.  If that leaves nothing (for example
    when a single file is given, so the common prefix is the whole name) the
    label falls back to the file name without "/blastout.tsv", or to the
    unmodified name as a last resort, so a row never has an empty label.
    """
    trimmed = fname[len(prefix):] if fname.startswith(prefix) else fname
    trimmed = trimmed.replace("/blastout.tsv", "")
    if trimmed:
        return trimmed
    return fname.replace("/blastout.tsv", "") or fname


def main():
    """Read every input file, then write one summary row per file.

    All files are tallied before anything is printed, so a failure while
    reading does not leave a partially written table behind.
    """
    args = parse_args()
    # Character-wise common prefix of all paths; used to shorten row labels.
    prefix = commonprefix(args.blast_files)

    tallies = []
    for fname in args.blast_files:
        # The context manager closes each input as soon as it is counted.
        with open(fname) as handle:
            tallies.append((fname, count_hits(handle)))

    # args.output is None when -o was not given; print() then uses stdout.
    print("File", *CATEGORIES, sep="\t", file=args.output)
    for fname, counts in tallies:
        print(
            short_name(fname, prefix),
            *(counts[category] for category in CATEGORIES),
            sep="\t",
            file=args.output
        )


if __name__ == "__main__":
    main()