annotate cpt_trnascanse_to_gff/tRNAscan_to_gff_SE_format.py @ 2:09168094a98f draft default tip

Uploaded
author cpt
date Fri, 20 May 2022 08:43:44 +0000
parents b4134ad44443
children
Ignore whitespace changes - Everywhere: Within whitespace: At end of lines:
rev   line source
0
b4134ad44443 Uploaded
cpt
parents:
diff changeset
#!/usr/bin/env python
"""Convert tRNAscan-SE tabular output to GFF3, written to stdout.

Input lines come from ``fileinput.input()``: the files named on the command
line, or stdin when none are given. The first ``HEADER_LINES`` lines of every
input file are treated as the report's column header and skipped.
"""
import fileinput

# Number of leading header lines skipped at the top of each input file.
HEADER_LINES = 3


def trna_to_gff(trna):
    """Build one GFF3 record from one tab-separated tRNAscan-SE row.

    Columns used, by zero-based index: 0 sequence name, 1 tRNA number
    (becomes the ``ID``), 2 and 3 the two bounds, 4 tRNA type, 5 anticodon
    (lower-cased in the output), 8 score.

    Args:
        trna: A single input line, with or without its trailing newline.

    Returns:
        The nine GFF3 columns joined by tabs (no trailing newline), or
        ``None`` when the line is blank.

    Raises:
        IndexError: If the row has fewer than nine columns.
        ValueError: If either bound is not an integer.
    """
    if not trna.strip():
        # Blank lines (e.g. a trailing empty line) carry no record.
        return None

    # Strip every field: the report pads columns with spaces, and when the
    # score is the last column it still carries the line's newline, which
    # would otherwise split the GFF record in two.
    cols_tsv = [col.strip() for col in trna.split("\t")]

    first, second = cols_tsv[2], cols_tsv[3]
    if int(first) < int(second):
        start, end, strand = first, second, "+"
    else:
        # Bounds given high-to-low mark a minus-strand hit; GFF3 needs
        # start <= end, so the two coordinates are swapped.
        start, end, strand = second, first, "-"

    cols_gff = [
        cols_tsv[0],
        "tRNAscan",
        "tRNA",
        start,
        end,
        cols_tsv[8],
        strand,
        ".",
        "ID=trna.%s;Anticodon=%s;Codon=tRNA-%s"
        % (cols_tsv[1], cols_tsv[5].lower(), cols_tsv[4]),
    ]
    return "\t".join(cols_gff)


def main():
    """Print the GFF3 version pragma, then one record per input row."""
    # The GFF3 specification spells the pragma with a space before the
    # version number, not a dash.
    print("##gff-version 3")
    for trna in fileinput.input():
        # filelineno() restarts at 1 for each file, so the header of every
        # input file is skipped, not only that of the first one.
        if fileinput.filelineno() <= HEADER_LINES:
            continue
        record = trna_to_gff(trna)
        if record is not None:
            print(record)


if __name__ == "__main__":
    main()