Mercurial > repos > rnateam > targetfinder
comparison TargetFinder.xml @ 1:c9d56748fbde draft default tip
"planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/rna_tools/targetfinder/ commit fe9dd99a14770b6c5f26e24893599acb577e304f"
author | rnateam |
---|---|
date | Thu, 25 Mar 2021 19:53:15 +0000 |
parents | 773fdd1a02ea |
children |
comparison
equal
deleted
inserted
replaced
0:773fdd1a02ea | 1:c9d56748fbde |
---|---|
1 <tool id="targetfinder" name="Plant small RNA target prediction tool" version="1.7.0"> | 1 <tool id='targetfinder' name='TargetFinder' version='1.7.0+galaxy1' profile='20.01'> |
2 <requirements> | 2 <description>plant small RNA target prediction tool</description> |
3 <requirement type="package" version="1.7">targetfinder</requirement> | 3 <macros> |
4 </requirements> | 4 <import>macros.xml</import> |
5 </macros> | |
6 <expand macro='edam' /> | |
7 <expand macro='requirements' /> | |
5 <stdio> | 8 <stdio> |
6 <exit_code range="1:" /> | 9 <exit_code range='1:' /> |
7 </stdio> | 10 </stdio> |
8 <command><![CDATA[ | 11 <command><![CDATA[ |
9 targetfinder_threads.pl | 12 targetfinder_threads.pl |
10 -f $f | 13 -f '$f' |
11 -d $d | 14 -d '$d' |
12 -c $c | 15 -c $c |
16 -p $output_format | |
13 -t "\${GALAXY_SLOTS:-12}" | 17 -t "\${GALAXY_SLOTS:-12}" |
14 $r | 18 $r |
15 -o $output1 | 19 -o '$output_file' |
20 | |
16 ]]></command> | 21 ]]></command> |
17 <inputs> | 22 <inputs> |
18 <param label="Input small RNA sequences file" help="(-f) FASTA-format" name="f" type="data" format="fasta" /> | 23 <param argument='-f' type='data' format='fasta' label='Input small RNA sequences file' help='FASTA-format' /> |
19 <param label="Target sequence database file" help="(-d) FASTA-format" name="d" type="data" format="fasta" /> | 24 <param argument='-d' type='data' format='fasta' label='Target sequence database file' help='FASTA-format' /> |
20 <param label="Prediction score cutoff value" help="(-c) DEFAULT = 4" name="c" type="float" value="4.0" /> | 25 <param argument='-c' type='float' value='4.0' label='Prediction score cutoff value' help='Predicted targets are printed out if they are equal to or lower than the cutoff score specified. DEFAULT = 4' /> |
21 <param label="Search reverse strand for targets?" help="(-r) Use this option if the database is genomic DNA." name="r" type="boolean" falsevalue="" truevalue="-r" checked="false" /> | 26 <param argument='-c' type='float' value='4.0' label='Prediction score cutoff value' help='Predicted targets are printed out if they are equal to or lower than the cutoff score specified. DEFAULT = 4' /> |
27 <param argument='-r' type='boolean' falsevalue='' truevalue='-r' checked='false' label='Search reverse strand for targets?' help='Use this option if the database is genomic DNA.' /> | |
28 <param name='output_format' argument='-p' type='select' label='Output format' help='Output format for small RNA-target pairs (Default = classic).' > | |
29 <option value='classic'>Original TargetFinder base-pair format</option> | |
30 <option value='gff'>GFF</option> | |
31 <option value='json'>JavaScript Object Notation (JSON)</option> | |
32 <option value='table'>Tab-delimited format</option> | |
33 </param> | |
22 </inputs> | 34 </inputs> |
23 <outputs> | 35 <outputs> |
24 <data name="output1" format="data"/> | 36 <data name='output_file' format='txt'> |
37 <change_format> | |
38 <when input="output_format" value="gff" format="gff" /> | |
39 <when input="output_format" value="json" format="json" /> | |
40 <when input="output_format" value="table" format="tabular" /> | |
41 </change_format> | |
42 </data> | |
25 </outputs> | 43 </outputs> |
26 <tests> | 44 <tests> |
27 <test> | 45 <test> |
28 <param name="f" value="ath_miRNAs_test.fa"/> | 46 <param name='f' value='arabidopsis_thaliana_miRNA.fasta'/> |
29 <param name="d" value="Antirrhinum_majus.mRNA.EST.fasta"/> | 47 <param name='d' value='arabidopsis_thaliana_mRNA.fasta'/> |
30 <param name="r" value=""/> | 48 <param name='r' value='false'/> |
31 <param name="c" value="4.0"/> | 49 <param name='c' value='4.0'/> |
32 <param name="t" value="1"/> | 50 <param name='output_format' value='classic'/> |
33 <output name="output1" file="ath_miRNAs_predicted_targets.txt" compare="contains"/> | 51 <output name='output_file' file='targetfinder_test_01.txt' compare='contains'/> |
52 </test> | |
53 <test> | |
54 <param name='f' value='arabidopsis_thaliana_miRNA.fasta'/> | |
55 <param name='d' value='arabidopsis_thaliana_mRNA.fasta'/> | |
56 <param name='r' value='true'/> | |
57 <param name='c' value='4.0'/> | |
58 <param name='output_format' value='classic'/> | |
59 <output name='output_file' file='targetfinder_test_02.txt' compare='contains'/> | |
60 </test> | |
61 <test> | |
62 <param name='f' value='arabidopsis_thaliana_miRNA.fasta'/> | |
63 <param name='d' value='arabidopsis_thaliana_mRNA.fasta'/> | |
64 <param name='r' value='false'/> | |
65 <param name='c' value='6.0'/> | |
66 <param name='output_format' value='classic'/> | |
67 <output name='output_file' file='targetfinder_test_03.txt' compare='contains'/> | |
68 </test> | |
69 <test> | |
70 <param name='f' value='arabidopsis_thaliana_miRNA.fasta'/> | |
71 <param name='d' value='arabidopsis_thaliana_mRNA.fasta'/> | |
72 <param name='r' value='false'/> | |
73 <param name='c' value='4.0'/> | |
74 <param name='output_format' value='classic'/> | |
75 <output name='output_file' file='targetfinder_test_04.txt' compare='contains'/> | |
76 </test> | |
77 <test> | |
78 <param name='f' value='arabidopsis_thaliana_miRNA.fasta'/> | |
79 <param name='d' value='arabidopsis_thaliana_mRNA.fasta'/> | |
80 <param name='r' value='false'/> | |
81 <param name='c' value='4.0'/> | |
82 <param name='output_format' value='gff'/> | |
83 <output name='output_file' file='targetfinder_test_05.gff' compare='contains'/> | |
84 </test> | |
85 <test> | |
86 <param name='f' value='arabidopsis_thaliana_miRNA.fasta'/> | |
87 <param name='d' value='arabidopsis_thaliana_mRNA.fasta'/> | |
88 <param name='r' value='false'/> | |
89 <param name='c' value='4.0'/> | |
90 <param name='output_format' value='table'/> | |
91 <output name='output_file' file='targetfinder_test_06.tab' compare='contains'/> | |
92 </test> | |
93 <test> | |
94 <param name='f' value='arabidopsis_thaliana_miRNA.fasta'/> | |
95 <param name='d' value='arabidopsis_thaliana_mRNA.fasta'/> | |
96 <param name='r' value='false'/> | |
97 <param name='c' value='4.0'/> | |
98 <param name='output_format' value='json'/> | |
99 <output name='output_file' file='targetfinder_test_07.json' compare='contains' lines_diff='1'/> | |
100 </test> | |
101 <test> | |
102 <param name='f' value='arabidopsis_thaliana_miRNA.fasta'/> | |
103 <param name='d' value='arabidopsis_thaliana_mRNA.fasta'/> | |
104 <param name='r' value='true'/> | |
105 <param name='c' value='6.5'/> | |
106 <param name='output_format' value='table'/> | |
107 <output name='output_file' file='targetfinder_test_08.tab' compare='contains'/> | |
34 </test> | 108 </test> |
35 </tests> | 109 </tests> |
36 <help><![CDATA[ | 110 <help><![CDATA[ |
111 .. class:: infomark | |
112 | |
37 **What it does** | 113 **What it does** |
38 | 114 |
39 TargetFinder will computationally predict small RNA binding sites on target transcripts from a sequence database. | 115 TargetFinder will computationally predict small RNA binding sites on target transcripts from a sequence database. |
40 | 116 |
41 This is done by aligning the input small RNA sequence against all transcripts, | 117 This is done by aligning the input small RNA sequence against all transcripts, followed by site scoring using a position-weighted scoring matrix. |
42 followed by site scoring using a position-weighted scoring matrix. | 118 |
119 ---- | |
120 | |
121 .. class:: infomark | |
43 | 122 |
44 **Input** | 123 **Input** |
45 | 124 |
46 -f Input small RNA sequences file (FASTA-format). | 125 This tool requires two fasta files: |
47 | 126 |
48 -d Target sequence database file (FASTA-format) | 127 :: |
49 | 128 |
50 **Output** | 129 -f Input small RNA sequences file (FASTA-format). |
51 | 130 -d Target sequence database file (FASTA-format) |
52 Each predicted target site is printed out separately. | 131 |
53 The output consists of two parts. | 132 ---- |
54 | 133 |
55 The first is a description line and the second is a base-pairing diagram of the target and small RNA (query) sequence. | 134 .. class:: infomark |
56 | 135 |
57 The description line contains the query name, the description line from the target sequence database, and the target prediction score. | 136 **Original TargetFinder Output** |
58 | 137 |
59 The base-pairing diagram has the target site sequence on top in 5'-3' orientation and the query sequence on the bottom in 3'-5' orientation. | 138 |
60 | 139 Each predicted target site is printed out separately. |
61 Between the target site sequece and the query sequence are base pair symbols. | 140 |
62 | 141 The output consists of two parts. The first is a description line and the second is a base-pairing diagram of the target and small RNA (query) sequence. The description line contains the query name, the description line from the target sequence database, and the target prediction score. |
63 A ":" (colon) symbol represents an ordinary Watson-Crick base pair, a "." (period) represents a G:U base pair, and a " " (space) represents a mismatch. | 142 |
143 :: | |
144 | |
145 query=miR399a, target=AT2G33770.1 | Symbol: None | ubiquitin-conjugating enzyme family protein, low similarity to u, score=1.5 | |
146 | |
147 | |
148 The base-pairing diagram has the target site sequence on top in 5'-3' orientation and the query sequence on the bottom in 3'-5' orientation. Between the target site sequece and the query sequence are base pair symbols. A ':' (colon) symbol represents an ordinary Watson-Crick base pair, a '.' (period) represents a G:U base pair, and a ' ' (space) represents a mismatch. | |
149 | |
150 :: | |
151 | |
152 target 5' UAGGGCAAAUCUUCUUUGGCA 3' | |
153 .:::::::::::.:::::::: | |
154 query 3' GUCCCGUUUAGAGGAAACCGU 5' | |
155 | |
64 | 156 |
65 If a small RNA is predicted to target a sequence more than once, each target site will be output as separate output. | 157 If a small RNA is predicted to target a sequence more than once, each target site will be output as separate output. |
158 | |
159 | |
160 ---- | |
161 | |
162 .. class:: infomark | |
163 | |
164 **Additional output formats** | |
165 | |
166 In addition to the output described above ('classic' output), three new output format options were added to TargetFinder. | |
167 | |
168 Generic Feature Format (GFF3): | |
169 | |
170 :: | |
171 | |
172 AT2G33770.1 | Symbols: UBC24 | phosphate 2 | chr2:14277558-14283040 REVERSE LEN targetfinder rna_target 607 627 1.5 + . smallRNA=miR399a;target_seq=UAGGGCAAAUCUUCUUUGGCA;base_pairs=.:::::::::::.::::::::;miR_seq=GUCCCGUUUAGAGGAAACCGU | |
173 AT2G33770.1 | Symbols: UBC24 | phosphate 2 | chr2:14277558-14283040 REVERSE LEN targetfinder rna_target 740 760 1.5 + . smallRNA=miR399a;target_seq=UAGGGCAUAUCUCCUUUGGCA;base_pairs=.:::::: :::::::::::::;miR_seq=GUCCCGUUUAGAGGAAACCGU | |
174 AT2G33770.1 | Symbols: UBC24 | phosphate 2 | chr2:14277558-14283040 REVERSE LEN targetfinder rna_target 829 849 1.5 + . smallRNA=miR399a;target_seq=UUGGGCAAAUCUCCUUUGGCA;base_pairs=. :::::::::::::::::::;miR_seq=GUCCCGUUUAGAGGAAACCGU | |
175 | |
176 | |
177 Tab-deliminated Format: | |
178 | |
179 :: | |
180 | |
181 miR399a AT2G33770.1 | Symbols: UBC24 | phosphate 2 | chr2:14277558-14283040 REVERSE LEN 607 627 + 1.5 UAGGGCAAAUCUUCUUUGGCA .:::::::::::.:::::::: GUCCCGUUUAGAGGAAACCGU | |
182 miR399a AT2G33770.1 | Symbols: UBC24 | phosphate 2 | chr2:14277558-14283040 REVERSE LEN 740 760 + 1.5 UAGGGCAUAUCUCCUUUGGCA .:::::: ::::::::::::: GUCCCGUUUAGAGGAAACCGU | |
183 miR399a AT2G33770.1 | Symbols: UBC24 | phosphate 2 | chr2:14277558-14283040 REVERSE LEN 829 849 + 1.5 UUGGGCAAAUCUCCUUUGGCA . ::::::::::::::::::: GUCCCGUUUAGAGGAAACCGU | |
184 | |
185 JavaScript Object Notation Format (JSON): | |
186 | |
187 :: | |
188 | |
189 { | |
190 'miR399a': { | |
191 'hits' : [ | |
192 { | |
193 'Target accession': 'AT2G33770.1 | Symbols: UBC24, ATUBC24, PHO2 | phosphate 2 | chr2:14277558-14283040 REVERSE LEN', | |
194 'Score': '1.5', | |
195 'Coordinates': '607-627', | |
196 'Strand': '+', | |
197 'Target sequence': 'UAGGGCAAAUCUUCUUUGGCA', | |
198 'Base pairing': '.:::::::::::.::::::::', | |
199 'amiRNA sequence': 'GUCCCGUUUAGAGGAAACCGU' | |
200 } | |
201 ] | |
202 } | |
203 } | |
204 | |
205 | |
206 ---- | |
207 | |
208 .. class:: infomark | |
209 | |
210 **Method** | |
211 | |
212 TargetFinder searches for potential miRNA target sites in a FASTA-formated sequence database using three main steps. | |
213 | |
214 | |
215 1. The small RNA query sequence is aligned to every sequence in the FASTA-formated sequence database using `Smith-Waterman (SW) alignments <https://en.wikipedia.org/wiki/Smith%E2%80%93Waterman_algorithm>`_ implemented in the FASTA package (ssearch35_t). | |
216 2. The SW alignments are converted into RNA duplexes. | |
217 3. Each duplex is scored using a position-dependent scoring matrix. | |
218 | |
219 SW alignments are used to identify the best complementary regions between the small RNA query sequence and every sequence in the FASTA-formated sequence database. | |
220 | |
66 ]]></help> | 221 ]]></help> |
67 <citations> | 222 <expand macro='citations' /> |
68 <citation type="doi">10.1016/j.cell.2005.04.004</citation> | |
69 <citation type="doi">10.1371/journal.pone.0000219</citation> | |
70 <citation type="doi">10.1007/978-1-60327-005-2_4</citation> | |
71 </citations> | |
72 </tool> | 223 </tool> |
73 | 224 |