annotate test-data/human_augustus_protein_codingseq_introns_cds_main.gtf @ 0:af307d3285c5 draft

Uploaded
author bgruening
date Sat, 06 Jul 2013 10:07:41 -0400
parents
children f5075dee9d6b
Ignore whitespace changes - Everywhere: Within whitespace: At end of lines:
rev   line source
0
af307d3285c5 Uploaded
bgruening
parents:
diff changeset
1 # This output was generated with AUGUSTUS (version 2.7).
af307d3285c5 Uploaded
bgruening
parents:
diff changeset
2 # AUGUSTUS is a gene prediction tool for eukaryotes written by Mario Stanke (mario.stanke@uni-greifswald.de)
af307d3285c5 Uploaded
bgruening
parents:
diff changeset
3 # and Oliver Keller (keller@cs.uni-goettingen.de).
af307d3285c5 Uploaded
bgruening
parents:
diff changeset
4 # Please cite: Mario Stanke, Mark Diekhans, Robert Baertsch, David Haussler (2008),
af307d3285c5 Uploaded
bgruening
parents:
diff changeset
5 # Using native and syntenically mapped cDNA alignments to improve de novo gene finding
af307d3285c5 Uploaded
bgruening
parents:
diff changeset
6 # Bioinformatics 24: 637-644, doi 10.1093/bioinformatics/btn013
af307d3285c5 Uploaded
bgruening
parents:
diff changeset
7 # No extrinsic information on sequences given.
af307d3285c5 Uploaded
bgruening
parents:
diff changeset
8 # Initialising the parameters ...
af307d3285c5 Uploaded
bgruening
parents:
diff changeset
9 # human version. Using default transition matrix.
af307d3285c5 Uploaded
bgruening
parents:
diff changeset
10 # Looks like /home/bag/projects/galaxy/galaxy-central/database/files/001/dataset_1149.dat is in fasta format.
af307d3285c5 Uploaded
bgruening
parents:
diff changeset
11 # We have hints for 0 sequences and for 0 of the sequences in the input set.
af307d3285c5 Uploaded
bgruening
parents:
diff changeset
12 #
af307d3285c5 Uploaded
bgruening
parents:
diff changeset
13 # ----- prediction on sequence number 1 (length = 9453, name = HS04636) -----
af307d3285c5 Uploaded
bgruening
parents:
diff changeset
14 #
af307d3285c5 Uploaded
bgruening
parents:
diff changeset
15 # Constraints/Hints:
af307d3285c5 Uploaded
bgruening
parents:
diff changeset
16 # (none)
af307d3285c5 Uploaded
bgruening
parents:
diff changeset
17 # Predicted genes for sequence number 1 on both strands
af307d3285c5 Uploaded
bgruening
parents:
diff changeset
18 # start gene g1
af307d3285c5 Uploaded
bgruening
parents:
diff changeset
19 HS04636 AUGUSTUS gene 966 6903 1 + . g1
af307d3285c5 Uploaded
bgruening
parents:
diff changeset
20 HS04636 AUGUSTUS transcript 966 6903 . + . g1.t1
af307d3285c5 Uploaded
bgruening
parents:
diff changeset
21 HS04636 AUGUSTUS intron 1018 1817 . + . transcript_id "g1.t1"; gene_id "g1";
af307d3285c5 Uploaded
bgruening
parents:
diff changeset
22 HS04636 AUGUSTUS intron 1935 2054 . + . transcript_id "g1.t1"; gene_id "g1";
af307d3285c5 Uploaded
bgruening
parents:
diff changeset
23 HS04636 AUGUSTUS intron 2199 2851 . + . transcript_id "g1.t1"; gene_id "g1";
af307d3285c5 Uploaded
bgruening
parents:
diff changeset
24 HS04636 AUGUSTUS intron 2996 3425 . + . transcript_id "g1.t1"; gene_id "g1";
af307d3285c5 Uploaded
bgruening
parents:
diff changeset
25 HS04636 AUGUSTUS intron 3608 4339 . + . transcript_id "g1.t1"; gene_id "g1";
af307d3285c5 Uploaded
bgruening
parents:
diff changeset
26 HS04636 AUGUSTUS intron 4424 4542 . + . transcript_id "g1.t1"; gene_id "g1";
af307d3285c5 Uploaded
bgruening
parents:
diff changeset
27 HS04636 AUGUSTUS intron 4790 5071 . + . transcript_id "g1.t1"; gene_id "g1";
af307d3285c5 Uploaded
bgruening
parents:
diff changeset
28 HS04636 AUGUSTUS intron 5359 5859 . + . transcript_id "g1.t1"; gene_id "g1";
af307d3285c5 Uploaded
bgruening
parents:
diff changeset
29 HS04636 AUGUSTUS intron 6008 6493 . + . transcript_id "g1.t1"; gene_id "g1";
af307d3285c5 Uploaded
bgruening
parents:
diff changeset
30 HS04636 AUGUSTUS CDS 966 1017 . + 0 transcript_id "g1.t1"; gene_id "g1";
af307d3285c5 Uploaded
bgruening
parents:
diff changeset
31 HS04636 AUGUSTUS CDS 1818 1934 . + 2 transcript_id "g1.t1"; gene_id "g1";
af307d3285c5 Uploaded
bgruening
parents:
diff changeset
32 HS04636 AUGUSTUS CDS 2055 2198 . + 2 transcript_id "g1.t1"; gene_id "g1";
af307d3285c5 Uploaded
bgruening
parents:
diff changeset
33 HS04636 AUGUSTUS CDS 2852 2995 . + 2 transcript_id "g1.t1"; gene_id "g1";
af307d3285c5 Uploaded
bgruening
parents:
diff changeset
34 HS04636 AUGUSTUS CDS 3426 3607 . + 2 transcript_id "g1.t1"; gene_id "g1";
af307d3285c5 Uploaded
bgruening
parents:
diff changeset
35 HS04636 AUGUSTUS CDS 4340 4423 . + 0 transcript_id "g1.t1"; gene_id "g1";
af307d3285c5 Uploaded
bgruening
parents:
diff changeset
36 HS04636 AUGUSTUS CDS 4543 4789 . + 0 transcript_id "g1.t1"; gene_id "g1";
af307d3285c5 Uploaded
bgruening
parents:
diff changeset
37 HS04636 AUGUSTUS CDS 5072 5358 . + 2 transcript_id "g1.t1"; gene_id "g1";
af307d3285c5 Uploaded
bgruening
parents:
diff changeset
38 HS04636 AUGUSTUS CDS 5860 6007 . + 0 transcript_id "g1.t1"; gene_id "g1";
af307d3285c5 Uploaded
bgruening
parents:
diff changeset
39 HS04636 AUGUSTUS CDS 6494 6903 . + 2 transcript_id "g1.t1"; gene_id "g1";
af307d3285c5 Uploaded
bgruening
parents:
diff changeset
40 # coding sequence = [atgctcgcccgcgccctgctgctgtgcgcggtcctggcgctcagccatacagcaaatccttgctgttcccacccatgtc
af307d3285c5 Uploaded
bgruening
parents:
diff changeset
41 # aaaaccgaggtgtatgtatgagtgtgggatttgaccagtataagtgcgattgtacccggacaggattctatggagaaaactgctcaacaccggaattt
af307d3285c5 Uploaded
bgruening
parents:
diff changeset
42 # ttgacaagaataaaattatttctgaaacccactccaaacacagtgcactacatacttacccacttcaagggattttggaacgttgtgaataacattcc
af307d3285c5 Uploaded
bgruening
parents:
diff changeset
43 # cttccttcgaaatgcaattatgagttatgtcttgacatccagatcacatttgattgacagtccaccaacttacaatgctgactatggctacaaaagct
af307d3285c5 Uploaded
bgruening
parents:
diff changeset
44 # gggaagccttctctaacctctcctattatactagagcccttcctcctgtgcctgatgattgcccgactcccttgggtgtcaaaggtaaaaagcagctt
af307d3285c5 Uploaded
bgruening
parents:
diff changeset
45 # cctgattcaaatgagattgtggaaaaattgcttctaagaagaaagttcatccctgatccccagggctcaaacatgatgtttgcattctttgcccagca
af307d3285c5 Uploaded
bgruening
parents:
diff changeset
46 # cttcacgcatcagtttttcaagacagatcataagcgagggccagctttcaccaacgggctgggccatggggtggacttaaatcatatttacggtgaaa
af307d3285c5 Uploaded
bgruening
parents:
diff changeset
47 # ctctggctagacagcgtaaactgcgccttttcaaggatggaaaaatgaaatatcagataattgatggagagatgtatcctcccacagtcaaagatact
af307d3285c5 Uploaded
bgruening
parents:
diff changeset
48 # caggcagagatgatctaccctcctcaagtccctgagcatctacggtttgctgtggggcaggaggtctttggtctggtgcctggtctgatgatgtatgc
af307d3285c5 Uploaded
bgruening
parents:
diff changeset
49 # cacaatctggctgcgggaacacaacagagtatgcgatgtgcttaaacaggagcatcctgaatggggtgatgagcagttgttccagacaagcaggctaa
af307d3285c5 Uploaded
bgruening
parents:
diff changeset
50 # tactgataggagagactattaagattgtgattgaagattatgtgcaacacttgagtggctatcacttcaaactgaaatttgacccagaactacttttc
af307d3285c5 Uploaded
bgruening
parents:
diff changeset
51 # aacaaacaattccagtaccaaaatcgtattgctgctgaatttaacaccctctatcactggcatccccttctgcctgacacctttcaaattcatgacca
af307d3285c5 Uploaded
bgruening
parents:
diff changeset
52 # gaaatacaactatcaacagtttatctacaacaactctatattgctggaacatggaattacccagtttgttgaatcattcaccaggcaaattgctggca
af307d3285c5 Uploaded
bgruening
parents:
diff changeset
53 # gggttgctggtggtaggaatgttccacccgcagtacagaaagtatcacaggcttccattgaccagagcaggcagatgaaataccagtcttttaatgag
af307d3285c5 Uploaded
bgruening
parents:
diff changeset
54 # taccgcaaacgctttatgctgaagccctatgaatcatttgaagaacttacaggagaaaaggaaatgtctgcagagttggaagcactctatggtgacat
af307d3285c5 Uploaded
bgruening
parents:
diff changeset
55 # cgatgctgtggagctgtatcctgcccttctggtagaaaagcctcggccagatgccatctttggtgaaaccatggtagaagttggagcaccattctcct
af307d3285c5 Uploaded
bgruening
parents:
diff changeset
56 # tgaaaggacttatgggtaatgttatatgttctcctgcctactggaagccaagcacttttggtggagaagtgggttttcaaatcatcaacactgcctca
af307d3285c5 Uploaded
bgruening
parents:
diff changeset
57 # attcagtctctcatctgcaataacgtgaagggctgtccctttacttcattcagtgttccagatccagagctcattaaaacagtcaccatcaatgcaag
af307d3285c5 Uploaded
bgruening
parents:
diff changeset
58 # ttcttcccgctccggactagatgatatcaatcccacagtactactaaaagaacgttcgactgaactgtag]
af307d3285c5 Uploaded
bgruening
parents:
diff changeset
59 # protein sequence = [MLARALLLCAVLALSHTANPCCSHPCQNRGVCMSVGFDQYKCDCTRTGFYGENCSTPEFLTRIKLFLKPTPNTVHYIL
af307d3285c5 Uploaded
bgruening
parents:
diff changeset
60 # THFKGFWNVVNNIPFLRNAIMSYVLTSRSHLIDSPPTYNADYGYKSWEAFSNLSYYTRALPPVPDDCPTPLGVKGKKQLPDSNEIVEKLLLRRKFIPD
af307d3285c5 Uploaded
bgruening
parents:
diff changeset
61 # PQGSNMMFAFFAQHFTHQFFKTDHKRGPAFTNGLGHGVDLNHIYGETLARQRKLRLFKDGKMKYQIIDGEMYPPTVKDTQAEMIYPPQVPEHLRFAVG
af307d3285c5 Uploaded
bgruening
parents:
diff changeset
62 # QEVFGLVPGLMMYATIWLREHNRVCDVLKQEHPEWGDEQLFQTSRLILIGETIKIVIEDYVQHLSGYHFKLKFDPELLFNKQFQYQNRIAAEFNTLYH
af307d3285c5 Uploaded
bgruening
parents:
diff changeset
63 # WHPLLPDTFQIHDQKYNYQQFIYNNSILLEHGITQFVESFTRQIAGRVAGGRNVPPAVQKVSQASIDQSRQMKYQSFNEYRKRFMLKPYESFEELTGE
af307d3285c5 Uploaded
bgruening
parents:
diff changeset
64 # KEMSAELEALYGDIDAVELYPALLVEKPRPDAIFGETMVEVGAPFSLKGLMGNVICSPAYWKPSTFGGEVGFQIINTASIQSLICNNVKGCPFTSFSV
af307d3285c5 Uploaded
bgruening
parents:
diff changeset
65 # PDPELIKTVTINASSSRSGLDDINPTVLLKERSTEL]
af307d3285c5 Uploaded
bgruening
parents:
diff changeset
66 # end gene g1
af307d3285c5 Uploaded
bgruening
parents:
diff changeset
67 ###
af307d3285c5 Uploaded
bgruening
parents:
diff changeset
68 #
af307d3285c5 Uploaded
bgruening
parents:
diff changeset
69 # ----- prediction on sequence number 2 (length = 2344, name = HS08198) -----
af307d3285c5 Uploaded
bgruening
parents:
diff changeset
70 #
af307d3285c5 Uploaded
bgruening
parents:
diff changeset
71 # Constraints/Hints:
af307d3285c5 Uploaded
bgruening
parents:
diff changeset
72 # (none)
af307d3285c5 Uploaded
bgruening
parents:
diff changeset
73 # Predicted genes for sequence number 2 on both strands
af307d3285c5 Uploaded
bgruening
parents:
diff changeset
74 # start gene g2
af307d3285c5 Uploaded
bgruening
parents:
diff changeset
75 HS08198 AUGUSTUS gene 445 1848 1 + . g2
af307d3285c5 Uploaded
bgruening
parents:
diff changeset
76 HS08198 AUGUSTUS transcript 445 1848 . + . g2.t1
af307d3285c5 Uploaded
bgruening
parents:
diff changeset
77 HS08198 AUGUSTUS intron 583 811 . + . transcript_id "g2.t1"; gene_id "g2";
af307d3285c5 Uploaded
bgruening
parents:
diff changeset
78 HS08198 AUGUSTUS intron 895 1052 . + . transcript_id "g2.t1"; gene_id "g2";
af307d3285c5 Uploaded
bgruening
parents:
diff changeset
79 HS08198 AUGUSTUS intron 1124 1207 . + . transcript_id "g2.t1"; gene_id "g2";
af307d3285c5 Uploaded
bgruening
parents:
diff changeset
80 HS08198 AUGUSTUS intron 1316 1586 . + . transcript_id "g2.t1"; gene_id "g2";
af307d3285c5 Uploaded
bgruening
parents:
diff changeset
81 HS08198 AUGUSTUS intron 1689 1771 . + . transcript_id "g2.t1"; gene_id "g2";
af307d3285c5 Uploaded
bgruening
parents:
diff changeset
82 HS08198 AUGUSTUS CDS 445 582 . + 0 transcript_id "g2.t1"; gene_id "g2";
af307d3285c5 Uploaded
bgruening
parents:
diff changeset
83 HS08198 AUGUSTUS CDS 812 894 . + 0 transcript_id "g2.t1"; gene_id "g2";
af307d3285c5 Uploaded
bgruening
parents:
diff changeset
84 HS08198 AUGUSTUS CDS 1053 1123 . + 1 transcript_id "g2.t1"; gene_id "g2";
af307d3285c5 Uploaded
bgruening
parents:
diff changeset
85 HS08198 AUGUSTUS CDS 1208 1315 . + 2 transcript_id "g2.t1"; gene_id "g2";
af307d3285c5 Uploaded
bgruening
parents:
diff changeset
86 HS08198 AUGUSTUS CDS 1587 1688 . + 2 transcript_id "g2.t1"; gene_id "g2";
af307d3285c5 Uploaded
bgruening
parents:
diff changeset
87 HS08198 AUGUSTUS CDS 1772 1848 . + 2 transcript_id "g2.t1"; gene_id "g2";
af307d3285c5 Uploaded
bgruening
parents:
diff changeset
88 # coding sequence = [atgctgccccctgggactgcgaccctcttgactctgctcctggcagctggctcgctgggccagaagcctcagaggccac
af307d3285c5 Uploaded
bgruening
parents:
diff changeset
89 # gccggcccgcatcccccatcagcaccatccagcccaaggccaattttgatgcgcagcaggagcagggccaccgggccgaggccaccacactgcatgtg
af307d3285c5 Uploaded
bgruening
parents:
diff changeset
90 # gctccccagggcacagccatggctgtcagtaccttccgaaagctggatgggatctgctggcaggtgcgccagctctatggagacacaggggtcctcgg
af307d3285c5 Uploaded
bgruening
parents:
diff changeset
91 # ccgcttcctgcttcaagcccgaggcgcccgaggggctgtgcacgtggttgtcgctgagaccgactaccagagtttcgctgtcctgtacctggagcggg
af307d3285c5 Uploaded
bgruening
parents:
diff changeset
92 # cggggcagctgtcagtgaagctctacgcccgctcgctccctgtgagcgactcggtcctgagtgggtttgagcagcgggtccaggaggcccacctgact
af307d3285c5 Uploaded
bgruening
parents:
diff changeset
93 # gaggaccagatcttctacttccccaagtacggcttctgcgaggctgcagaccagttccacgtcctggacggtgagtgcacagcgggggcaagcatggc
af307d3285c5 Uploaded
bgruening
parents:
diff changeset
94 # ggcgtggtga]
af307d3285c5 Uploaded
bgruening
parents:
diff changeset
95 # protein sequence = [MLPPGTATLLTLLLAAGSLGQKPQRPRRPASPISTIQPKANFDAQQEQGHRAEATTLHVAPQGTAMAVSTFRKLDGIC
af307d3285c5 Uploaded
bgruening
parents:
diff changeset
96 # WQVRQLYGDTGVLGRFLLQARGARGAVHVVVAETDYQSFAVLYLERAGQLSVKLYARSLPVSDSVLSGFEQRVQEAHLTEDQIFYFPKYGFCEAADQF
af307d3285c5 Uploaded
bgruening
parents:
diff changeset
97 # HVLDGECTAGASMAAW]
af307d3285c5 Uploaded
bgruening
parents:
diff changeset
98 # end gene g2
af307d3285c5 Uploaded
bgruening
parents:
diff changeset
99 ###
af307d3285c5 Uploaded
bgruening
parents:
diff changeset
100 # command line:
af307d3285c5 Uploaded
bgruening
parents:
diff changeset
101 # augustus --strand=both --noInFrameStop=false --gff3=off --protein=on --introns=on --start=off --stop=off --cds=on --codingseq=on --singlestrand=false /home/bag/projects/galaxy/galaxy-central/database/files/001/dataset_1149.dat --UTR=off --genemodel=complete --species=human