1
|
1 <tool id="aragorn_trna" name="tRNA and tmRNA" version="0.4">
|
|
2 <description>prediction (Aragorn)</description>
|
0
|
3 <requirements>
|
|
4 <requirement type="package" version="1.2.36">aragorn</requirement>
|
1
|
5 <requirement type="set_environment">TRNAPRED_SCRIPT_PATH</requirement>
|
0
|
6 </requirements>
|
|
7 <command>
|
1
|
8 <![CDATA[
|
|
9 aragorn
|
|
10 $input
|
0
|
11 -gc$genbank_gencode
|
|
12 $tmRNA
|
|
13 $tRNA
|
|
14 $mtRNA
|
|
15 $mam_mtRNA
|
|
16 $topology
|
|
17 -o $output
|
|
18 $secondary_structure
|
1
|
19 $introns;
|
|
20
|
|
21 #if $gff3_output:
|
|
22 aragorn
|
|
23 $input
|
|
24 -gc$genbank_gencode
|
|
25 $tmRNA
|
|
26 $tRNA
|
|
27 $mtRNA
|
|
28 $mam_mtRNA
|
|
29 $topology
|
|
30 -fasta
|
|
31 $introns | python \$TRNAPRED_SCRIPT_PATH/aragorn_out_to_gff3.py > $gff3_output_file;
|
|
32 #end if
|
|
33 ]]>
|
0
|
34 </command>
|
|
35 <inputs>
|
|
36 <param name="input" type="data" format="fasta" label="Genome Sequence"/>
|
|
37 <param name="genbank_gencode" type="select" label="Genetic code">
|
|
38 <option value="1" select="True">1. Standard</option>
|
|
39 <option value="2">2. Vertebrate Mitochondrial</option>
|
|
40 <option value="3">3. Yeast Mitochondrial</option>
|
|
41 <option value="4">4. Mold, Protozoan, and Coelenterate Mitochondrial Code and the Mycoplasma/Spiroplasma Code</option>
|
|
42 <option value="5">5. Invertebrate Mitochondrial</option>
|
|
43 <option value="6">6. Ciliate, Dasycladacean and Hexamita Nuclear Code</option>
|
|
44 <option value="9">9. Echinoderm Mitochondrial</option>
|
|
45 <option value="10">10. Euplotid Nuclear</option>
|
|
46 <option value="11">11. Bacteria and Archaea</option>
|
|
47 <option value="12">12. Alternative Yeast Nuclear</option>
|
|
48 <option value="13">13. Ascidian Mitochondrial</option>
|
|
49 <option value="14">14. Flatworm Mitochondrial</option>
|
|
50 <option value="15">15. Blepharisma Macronuclear</option>
|
|
51 <option value="16">16. Chlorophycean Mitochondrial</option>
|
|
52 <option value="21">21. Trematode Mitochondrial</option>
|
|
53 <option value="22">22. Scenedesmus obliquus mitochondrial</option>
|
|
54 <option value="23">23. Thraustochytrium Mitochondrial</option>
|
|
55 <option value="24">24. Pterobranchia mitochondrial</option>
|
|
56 </param>
|
|
57 <param name="topology" type="select" label="Topology">
|
|
58 <option value="-c">Assume that each sequence has a circular topology</option>
|
|
59 <option value="-l">Assume that each sequence has a linear topology</option>
|
|
60 </param>
|
|
61 <param name='tmRNA' type='boolean' label='Search for tmRNA genes (-m)' truevalue='-m' falsevalue='' checked="true" help='' />
|
|
62 <param name='tRNA' type='boolean' label='Search for tRNA genes (-t)' truevalue='-t' falsevalue='' checked="true" help='' />
|
|
63 <param name='mtRNA' type='boolean' label='Search for Metazoan mitochondrial tRNA genes (-mt)' truevalue='-mt' falsevalue='' checked="false" help='-i switch ignored. Composite Metazoan mitochondrial genetic code used.' />
|
|
64 <param name='mam_mtRNA' type='boolean' label='Search for Mammalian mitochondrial tRNA genes (-mtmam)' truevalue='-mtmam' falsevalue='' checked="false" help='-i switch ignored. -tv switch set. Mammalian mitochondrial genetic code used.' />
|
|
65 <param name='introns' type='boolean' label='Search for tRNA genes with introns in anticodon loop ...' truevalue='-i' falsevalue='' checked="false" help='...with maximum length 3000 bases (-i).' />
|
|
66 <param name='secondary_structure' type='boolean' label='Print out secondary structure (-fasta,-fon)' truevalue='-fasta' falsevalue='-fon' checked="false" help='' />
|
1
|
67 <param name="gff3_output" type='boolean' label='Convert output to GFF3' truevalue='True' falsevalue='' checked="false" help='' />
|
0
|
68 </inputs>
|
|
69 <outputs>
|
|
70 <data name="output" format="fasta">
|
|
71 <change_format>
|
|
72 <when input="secondary_structure" value="true" format="text"/>
|
|
73 </change_format>
|
|
74 </data>
|
1
|
75 <data format="gff3" name="gff3_output_file" >
|
|
76 <filter>gff3_output</filter>
|
|
77 </data>
|
0
|
78 </outputs>
|
|
79 <tests>
|
|
80 <test>
|
|
81 <param name="input" value="trna_arabidopsis.fasta" ftype="fasta" />
|
|
82 <param name="genbank_gencode" value="1" />
|
|
83 <param name="topology" value="-c" />
|
|
84 <param name="tmRNA" value="-m" />
|
|
85 <param name="tRNA" value="-t" />
|
|
86 <param name="mtRNA" value="" />
|
|
87 <param name="mam_mtRNA" value="" />
|
1
|
88 <param name="introns" value="" />
|
0
|
89 <param name="secondary_structure" value="-fon" />
|
1
|
90 <param name="gff3_output" value="True" />
|
0
|
91 <output name="output" file="aragorn_tansl-table-1_tmRNA_tRNA.fasta" ftype="fasta" />
|
1
|
92 <output name="output" file="aragorn_tansl-table-1_tmRNA_tRNA.gff3" ftype="gff3" />
|
0
|
93 </test>
|
|
94 </tests>
|
|
95 <help>
|
1
|
96 <![CDATA[
|
0
|
97
|
|
98 **What it does**
|
|
99
|
|
100 Aragorn_ predicts tRNA (and tmRNA) in nucleotide sequences.
|
|
101
|
|
102 .. _Aragorn: http://mbio-serv2.mbioekol.lu.se/ARAGORN/
|
|
103
|
|
104 -----
|
|
105
|
|
106 **Example**
|
|
107
|
|
108 Suppose you have the following nucleotide sequences::
|
|
109
|
|
110 >SQ Sequence 8667507 BP; 1203558 A; 3121252 C; 3129638 G; 1213059 T; 0 other;
|
|
111 cccgcggagcgggtaccacatcgctgcgcgatgtgcgagcgaacacccgggctgcgcccg
|
|
112 ggtgttgcgctcccgctccgcgggagcgctggcgggacgctgcgcgtcccgctcaccaag
|
|
113 cccgcttcgcgggcttggtgacgctccgtccgctgcgcttccggagttgcggggcttcgc
|
|
114 cccgctaaccctgggcctcgcttcgctccgccttgggcctgcggcgggtccgctgcgctc
|
|
115 ccccgcctcaagggcccttccggctgcgcctccaggacccaaccgcttgcgcgggcctgg
|
|
116 ....
|
|
117
|
|
118 Running this tool can produce a FASTA file with all detected RNAs or a more detailed text file like the following::
|
|
119
|
|
120 c
|
|
121 c
|
|
122 a
|
|
123 g-c
|
|
124 g-c
|
|
125 g-c
|
|
126 c-g
|
|
127 g-c
|
|
128 a-t
|
|
129 t-a ca
|
|
130 t tgacc a
|
|
131 ga a !!!!! g
|
|
132 t ctcg actgg c
|
|
133 g !!!! c tt
|
|
134 g gagc t
|
|
135 aa g g
|
|
136 c-gag
|
|
137 t-a
|
|
138 t-a
|
|
139 c-g
|
|
140 g-c
|
|
141 t c
|
|
142 t a
|
|
143 cac
|
|
144
|
|
145 tRNA-Val(cac)
|
|
146 74 bases, %GC = 58.1
|
|
147 Sequence [6669703,6669776]
|
|
148
|
|
149
|
|
150 tRNA Anticodon Frequency
|
1
|
151 AAA Phe GAA Phe 1 CAA Leu 1 TAA Leu 1
|
|
152 AGA Ser GGA Ser 1 CGA Ser 2 TGA Ser 1
|
|
153 ACA Cys GCA Cys 2 CCA Trp 2 TCA seC
|
|
154 ATA Tyr GTA Tyr 1 CTA Pyl TTA Stop
|
|
155 AAG Leu GAG Leu 3 CAG Leu 1 TAG Leu 2
|
|
156 AGG Pro GGG Pro 2 CGG Pro 2 TGG Pro 2
|
|
157 ACG Arg 1 GCG Arg 2 CCG Arg 1 TCG Arg
|
|
158 ATG His GTG His 2 CTG Gln 2 TTG Gln 1
|
|
159 AAC Val GAC Val 3 CAC Val 2 TAC Val 1
|
|
160 AGC Ala GGC Ala 2 CGC Ala 3 TGC Ala 1
|
|
161 ACC Gly GCC Gly 5 CCC Gly 1 TCC Gly 2
|
|
162 ATC Asp GTC Asp 3 CTC Glu 2 TTC Glu 2
|
|
163 AAT Ile GAT Ile 3 CAT Met 6 TAT Ile
|
|
164 AGT Thr GGT Thr 2 CGT Thr 1 TGT Thr 2
|
|
165 ACT Ser GCT Ser 1 CCT Arg 1 TCT Arg 1
|
|
166 ATT Asn GTT Asn 3 CTT Lys 3 TTT Lys 2
|
0
|
167 Ambiguous: 1
|
|
168
|
|
169 tRNA Codon Frequency
|
1
|
170 TTT Phe TTC Phe 1 TTG Leu 1 TTA Leu 1
|
|
171 TCT Ser TCC Ser 1 TCG Ser 2 TCA Ser 1
|
|
172 TGT Cys TGC Cys 2 TGG Trp 2 TGA seC
|
|
173 TAT Tyr TAC Tyr 1 TAG Pyl TAA Stop
|
|
174 CTT Leu CTC Leu 3 CTG Leu 1 CTA Leu 2
|
|
175 CCT Pro CCC Pro 2 CCG Pro 2 CCA Pro 2
|
|
176 CGT Arg 1 CGC Arg 2 CGG Arg 1 CGA Arg
|
|
177 CAT His CAC His 2 CAG Gln 2 CAA Gln 1
|
|
178 GTT Val GTC Val 3 GTG Val 2 GTA Val 1
|
|
179 GCT Ala GCC Ala 2 GCG Ala 3 GCA Ala 1
|
|
180 GGT Gly GGC Gly 5 GGG Gly 1 GGA Gly 2
|
|
181 GAT Asp GAC Asp 3 GAG Glu 2 GAA Glu 2
|
|
182 ATT Ile ATC Ile 3 ATG Met 6 ATA Ile
|
|
183 ACT Thr ACC Thr 2 ACG Thr 1 ACA Thr 2
|
|
184 AGT Ser AGC Ser 1 AGG Arg 1 AGA Arg 1
|
|
185 AAT Asn AAC Asn 3 AAG Lys 3 AAA Lys 2
|
0
|
186 Ambiguous: 1
|
|
187
|
|
188 Number of tRNA genes = 86
|
|
189 tRNA GC range = 50.0% to 85.1%
|
|
190 Number of tmRNA genes = 1
|
|
191
|
|
192 -------
|
|
193
|
|
194 **References**
|
|
195
|
|
196 Dean Laslett and Bjorn Canback
|
|
197
|
|
198 ARAGORN, a program to detect tRNA genes and tmRNA genes in nucleotide sequences Nucl. Acids Res. (2004) 32(1): 11-16
|
|
199
|
1
|
200 doi:10.1093/nar/gkh152
|
0
|
201
|
1
|
202 ]]>
|
0
|
203 </help>
|
|
204 </tool>
|