# Convert a report containing '>>' record markers into a tab-separated table.
import re
def parsing(entree, sortie):
    """Write one tab-separated summary row per ``>>`` record of *entree*.

    The first line of *entree* is discarded and lines whose first character
    is ``#`` are ignored.  Every remaining line that contains ``>>`` starts
    a record:

    * runs of two or more whitespace characters on that line are collapsed
      to a single space, and its second space-separated token is taken as
      the scaffold name;
    * the next two lines are skipped;
    * the third following line is split on single spaces and its fields at
      indices 3, 6 and 13 are written after the scaffold name;
    * one more line is consumed before scanning resumes.

    *sortie* is overwritten and always starts with the header row
    ``Scaffold / Domaine / Score / E-value``.

    Args:
        entree: Path of the text report to read.
        sortie: Path of the tab-separated file to create.

    Raises:
        OSError: If either file cannot be opened.
        IndexError: If a record line has fewer fields than the indices
            used above (for example when the file ends mid-record).
    """
    # Raw string: ``\s`` must reach the regex engine untouched instead of
    # being treated as an (invalid) string escape.
    espaces_multiples = re.compile(r"\s{2,}")

    # The context manager closes (and therefore flushes) both files even
    # when a malformed record raises part-way through.
    with open(entree, "r") as inp, open(sortie, "w") as out:
        # ``next(inp, "")`` advances the same iterator the ``for`` loop uses
        # and yields "" at end of file, just like ``readline()`` does.
        next(inp, "")  # discard the first line of the report

        out.write("Scaffold\tDomaine\tScore\tE-value\n")

        for line in inp:
            if line[0] == "#":
                continue

            line = espaces_multiples.sub(" ", line)
            if ">>" not in line:
                continue

            scaffold = line.split(" ")

            # Skip the two lines that follow the ``>>`` line; the third one
            # carries the values to export.
            next(inp, "")
            next(inp, "")

            # NOTE(review): this line is split as-is, without collapsing
            # whitespace runs first (unlike the ``>>`` line), so the indices
            # count raw single-space separated fields - confirm intended.
            colonne = next(inp, "").split(" ")

            out.write(
                "\t".join([scaffold[1], colonne[3], colonne[6], colonne[13]])
                + "\n"
            )

            # NOTE(review): the original listing lost its indentation; this
            # extra skipped line is assumed to belong to the record branch -
            # confirm against the original file.
            next(inp, "")