comparison TargetFinder.xml @ 1:c9d56748fbde draft default tip

"planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/rna_tools/targetfinder/ commit fe9dd99a14770b6c5f26e24893599acb577e304f"
author rnateam
date Thu, 25 Mar 2021 19:53:15 +0000
parents 773fdd1a02ea
children
comparison
equal deleted inserted replaced
0:773fdd1a02ea 1:c9d56748fbde
1 <tool id="targetfinder" name="Plant small RNA target prediction tool" version="1.7.0"> 1 <tool id='targetfinder' name='TargetFinder' version='1.7.0+galaxy1' profile='20.01'>
2 <requirements> 2 <description>plant small RNA target prediction tool</description>
3 <requirement type="package" version="1.7">targetfinder</requirement> 3 <macros>
4 </requirements> 4 <import>macros.xml</import>
5 </macros>
6 <expand macro='edam' />
7 <expand macro='requirements' />
5 <stdio> 8 <stdio>
6 <exit_code range="1:" /> 9 <exit_code range='1:' />
7 </stdio> 10 </stdio>
8 <command><![CDATA[ 11 <command><![CDATA[
9 targetfinder_threads.pl 12 targetfinder_threads.pl
10 -f $f 13 -f '$f'
11 -d $d 14 -d '$d'
12 -c $c 15 -c $c
16 -p $output_format
13 -t "\${GALAXY_SLOTS:-12}" 17 -t "\${GALAXY_SLOTS:-12}"
14 $r 18 $r
15 -o $output1 19 -o '$output_file'
20
16 ]]></command> 21 ]]></command>
17 <inputs> 22 <inputs>
18 <param label="Input small RNA sequences file" help="(-f) FASTA-format" name="f" type="data" format="fasta" /> 23 <param argument='-f' type='data' format='fasta' label='Input small RNA sequences file' help='FASTA-format' />
19 <param label="Target sequence database file" help="(-d) FASTA-format" name="d" type="data" format="fasta" /> 24 <param argument='-d' type='data' format='fasta' label='Target sequence database file' help='FASTA-format' />
20 <param label="Prediction score cutoff value" help="(-c) DEFAULT = 4" name="c" type="float" value="4.0" /> 25 <param argument='-c' type='float' value='4.0' label='Prediction score cutoff value' help='Predicted targets are printed out if they are equal to or lower than the cutoff score specified. DEFAULT = 4' />
21 <param label="Search reverse strand for targets?" help="(-r) Use this option if the database is genomic DNA." name="r" type="boolean" falsevalue="" truevalue="-r" checked="false" /> 26 <param argument='-c' type='float' value='4.0' label='Prediction score cutoff value' help='Predicted targets are printed out if they are equal to or lower than the cutoff score specified. DEFAULT = 4' />
27 <param argument='-r' type='boolean' falsevalue='' truevalue='-r' checked='false' label='Search reverse strand for targets?' help='Use this option if the database is genomic DNA.' />
28 <param name='output_format' argument='-p' type='select' label='Output format' help='Output format for small RNA-target pairs (Default = classic).' >
29 <option value='classic'>Original TargetFinder base-pair format</option>
30 <option value='gff'>GFF</option>
31 <option value='json'>JavaScript Object Notation (JSON)</option>
32 <option value='table'>Tab-delimited format</option>
33 </param>
22 </inputs> 34 </inputs>
23 <outputs> 35 <outputs>
24 <data name="output1" format="data"/> 36 <data name='output_file' format='txt'>
37 <change_format>
38 <when input="output_format" value="gff" format="gff" />
39 <when input="output_format" value="json" format="json" />
40 <when input="output_format" value="table" format="tabular" />
41 </change_format>
42 </data>
25 </outputs> 43 </outputs>
26 <tests> 44 <tests>
27 <test> 45 <test>
28 <param name="f" value="ath_miRNAs_test.fa"/> 46 <param name='f' value='arabidopsis_thaliana_miRNA.fasta'/>
29 <param name="d" value="Antirrhinum_majus.mRNA.EST.fasta"/> 47 <param name='d' value='arabidopsis_thaliana_mRNA.fasta'/>
30 <param name="r" value=""/> 48 <param name='r' value='false'/>
31 <param name="c" value="4.0"/> 49 <param name='c' value='4.0'/>
32 <param name="t" value="1"/> 50 <param name='output_format' value='classic'/>
33 <output name="output1" file="ath_miRNAs_predicted_targets.txt" compare="contains"/> 51 <output name='output_file' file='targetfinder_test_01.txt' compare='contains'/>
52 </test>
53 <test>
54 <param name='f' value='arabidopsis_thaliana_miRNA.fasta'/>
55 <param name='d' value='arabidopsis_thaliana_mRNA.fasta'/>
56 <param name='r' value='true'/>
57 <param name='c' value='4.0'/>
58 <param name='output_format' value='classic'/>
59 <output name='output_file' file='targetfinder_test_02.txt' compare='contains'/>
60 </test>
61 <test>
62 <param name='f' value='arabidopsis_thaliana_miRNA.fasta'/>
63 <param name='d' value='arabidopsis_thaliana_mRNA.fasta'/>
64 <param name='r' value='false'/>
65 <param name='c' value='6.0'/>
66 <param name='output_format' value='classic'/>
67 <output name='output_file' file='targetfinder_test_03.txt' compare='contains'/>
68 </test>
69 <test>
70 <param name='f' value='arabidopsis_thaliana_miRNA.fasta'/>
71 <param name='d' value='arabidopsis_thaliana_mRNA.fasta'/>
72 <param name='r' value='false'/>
73 <param name='c' value='4.0'/>
74 <param name='output_format' value='classic'/>
75 <output name='output_file' file='targetfinder_test_04.txt' compare='contains'/>
76 </test>
77 <test>
78 <param name='f' value='arabidopsis_thaliana_miRNA.fasta'/>
79 <param name='d' value='arabidopsis_thaliana_mRNA.fasta'/>
80 <param name='r' value='false'/>
81 <param name='c' value='4.0'/>
82 <param name='output_format' value='gff'/>
83 <output name='output_file' file='targetfinder_test_05.gff' compare='contains'/>
84 </test>
85 <test>
86 <param name='f' value='arabidopsis_thaliana_miRNA.fasta'/>
87 <param name='d' value='arabidopsis_thaliana_mRNA.fasta'/>
88 <param name='r' value='false'/>
89 <param name='c' value='4.0'/>
90 <param name='output_format' value='table'/>
91 <output name='output_file' file='targetfinder_test_06.tab' compare='contains'/>
92 </test>
93 <test>
94 <param name='f' value='arabidopsis_thaliana_miRNA.fasta'/>
95 <param name='d' value='arabidopsis_thaliana_mRNA.fasta'/>
96 <param name='r' value='false'/>
97 <param name='c' value='4.0'/>
98 <param name='output_format' value='json'/>
99 <output name='output_file' file='targetfinder_test_07.json' compare='contains' lines_diff='1'/>
100 </test>
101 <test>
102 <param name='f' value='arabidopsis_thaliana_miRNA.fasta'/>
103 <param name='d' value='arabidopsis_thaliana_mRNA.fasta'/>
104 <param name='r' value='true'/>
105 <param name='c' value='6.5'/>
106 <param name='output_format' value='table'/>
107 <output name='output_file' file='targetfinder_test_08.tab' compare='contains'/>
34 </test> 108 </test>
35 </tests> 109 </tests>
36 <help><![CDATA[ 110 <help><![CDATA[
111 .. class:: infomark
112
37 **What it does** 113 **What it does**
38 114
39 TargetFinder will computationally predict small RNA binding sites on target transcripts from a sequence database. 115 TargetFinder will computationally predict small RNA binding sites on target transcripts from a sequence database.
40 116
41 This is done by aligning the input small RNA sequence against all transcripts, 117 This is done by aligning the input small RNA sequence against all transcripts, followed by site scoring using a position-weighted scoring matrix.
42 followed by site scoring using a position-weighted scoring matrix. 118
119 ----
120
121 .. class:: infomark
43 122
44 **Input** 123 **Input**
45 124
46 -f Input small RNA sequences file (FASTA-format). 125 This tool requires two fasta files:
47 126
48 -d Target sequence database file (FASTA-format) 127 ::
49 128
50 **Output** 129 -f Input small RNA sequences file (FASTA-format).
51 130 -d Target sequence database file (FASTA-format)
52 Each predicted target site is printed out separately. 131
53 The output consists of two parts. 132 ----
54 133
55 The first is a description line and the second is a base-pairing diagram of the target and small RNA (query) sequence. 134 .. class:: infomark
56 135
57 The description line contains the query name, the description line from the target sequence database, and the target prediction score. 136 **Original TargetFinder Output**
58 137
59 The base-pairing diagram has the target site sequence on top in 5'-3' orientation and the query sequence on the bottom in 3'-5' orientation. 138
60 139 Each predicted target site is printed out separately.
61 Between the target site sequece and the query sequence are base pair symbols. 140
62 141 The output consists of two parts. The first is a description line and the second is a base-pairing diagram of the target and small RNA (query) sequence. The description line contains the query name, the description line from the target sequence database, and the target prediction score.
63 A ":" (colon) symbol represents an ordinary Watson-Crick base pair, a "." (period) represents a G:U base pair, and a " " (space) represents a mismatch. 142
143 ::
144
145 query=miR399a, target=AT2G33770.1 | Symbol: None | ubiquitin-conjugating enzyme family protein, low similarity to u, score=1.5
146
147
148 The base-pairing diagram has the target site sequence on top in 5'-3' orientation and the query sequence on the bottom in 3'-5' orientation. Between the target site sequece and the query sequence are base pair symbols. A ':' (colon) symbol represents an ordinary Watson-Crick base pair, a '.' (period) represents a G:U base pair, and a ' ' (space) represents a mismatch.
149
150 ::
151
152 target 5' UAGGGCAAAUCUUCUUUGGCA 3'
153 .:::::::::::.::::::::
154 query 3' GUCCCGUUUAGAGGAAACCGU 5'
155
64 156
65 If a small RNA is predicted to target a sequence more than once, each target site will be output as separate output. 157 If a small RNA is predicted to target a sequence more than once, each target site will be output as separate output.
158
159
160 ----
161
162 .. class:: infomark
163
164 **Additional output formats**
165
166 In addition to the output described above ('classic' output), three new output format options were added to TargetFinder.
167
168 Generic Feature Format (GFF3):
169
170 ::
171
172 AT2G33770.1 | Symbols: UBC24 | phosphate 2 | chr2:14277558-14283040 REVERSE LEN targetfinder rna_target 607 627 1.5 + . smallRNA=miR399a;target_seq=UAGGGCAAAUCUUCUUUGGCA;base_pairs=.:::::::::::.::::::::;miR_seq=GUCCCGUUUAGAGGAAACCGU
173 AT2G33770.1 | Symbols: UBC24 | phosphate 2 | chr2:14277558-14283040 REVERSE LEN targetfinder rna_target 740 760 1.5 + . smallRNA=miR399a;target_seq=UAGGGCAUAUCUCCUUUGGCA;base_pairs=.:::::: :::::::::::::;miR_seq=GUCCCGUUUAGAGGAAACCGU
174 AT2G33770.1 | Symbols: UBC24 | phosphate 2 | chr2:14277558-14283040 REVERSE LEN targetfinder rna_target 829 849 1.5 + . smallRNA=miR399a;target_seq=UUGGGCAAAUCUCCUUUGGCA;base_pairs=. :::::::::::::::::::;miR_seq=GUCCCGUUUAGAGGAAACCGU
175
176
177 Tab-deliminated Format:
178
179 ::
180
181 miR399a AT2G33770.1 | Symbols: UBC24 | phosphate 2 | chr2:14277558-14283040 REVERSE LEN 607 627 + 1.5 UAGGGCAAAUCUUCUUUGGCA .:::::::::::.:::::::: GUCCCGUUUAGAGGAAACCGU
182 miR399a AT2G33770.1 | Symbols: UBC24 | phosphate 2 | chr2:14277558-14283040 REVERSE LEN 740 760 + 1.5 UAGGGCAUAUCUCCUUUGGCA .:::::: ::::::::::::: GUCCCGUUUAGAGGAAACCGU
183 miR399a AT2G33770.1 | Symbols: UBC24 | phosphate 2 | chr2:14277558-14283040 REVERSE LEN 829 849 + 1.5 UUGGGCAAAUCUCCUUUGGCA . ::::::::::::::::::: GUCCCGUUUAGAGGAAACCGU
184
185 JavaScript Object Notation Format (JSON):
186
187 ::
188
189 {
190 'miR399a': {
191 'hits' : [
192 {
193 'Target accession': 'AT2G33770.1 | Symbols: UBC24, ATUBC24, PHO2 | phosphate 2 | chr2:14277558-14283040 REVERSE LEN',
194 'Score': '1.5',
195 'Coordinates': '607-627',
196 'Strand': '+',
197 'Target sequence': 'UAGGGCAAAUCUUCUUUGGCA',
198 'Base pairing': '.:::::::::::.::::::::',
199 'amiRNA sequence': 'GUCCCGUUUAGAGGAAACCGU'
200 }
201 ]
202 }
203 }
204
205
206 ----
207
208 .. class:: infomark
209
210 **Method**
211
212 TargetFinder searches for potential miRNA target sites in a FASTA-formated sequence database using three main steps.
213
214
215 1. The small RNA query sequence is aligned to every sequence in the FASTA-formated sequence database using `Smith-Waterman (SW) alignments <https://en.wikipedia.org/wiki/Smith%E2%80%93Waterman_algorithm>`_ implemented in the FASTA package (ssearch35_t).
216 2. The SW alignments are converted into RNA duplexes.
217 3. Each duplex is scored using a position-dependent scoring matrix.
218
219 SW alignments are used to identify the best complementary regions between the small RNA query sequence and every sequence in the FASTA-formated sequence database.
220
66 ]]></help> 221 ]]></help>
67 <citations> 222 <expand macro='citations' />
68 <citation type="doi">10.1016/j.cell.2005.04.004</citation>
69 <citation type="doi">10.1371/journal.pone.0000219</citation>
70 <citation type="doi">10.1007/978-1-60327-005-2_4</citation>
71 </citations>
72 </tool> 223 </tool>
73 224