comparison rnafold.xml @ 0:d6044fad075f draft

planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/rna_tools/vienna_rna commit 0065dafe7bbd382bb995b28cc4089c9e4f4eeeb9
author rnateam
date Tue, 06 Dec 2016 12:34:44 -0500
parents
children f87325531be8
comparison
equal deleted inserted replaced
-1:000000000000 0:d6044fad075f
1 <tool id="viennarna_rnafold" name="@EXECUTABLE@" version="@VERSION@.0">
2 <description>Calculate minimum free energy secondary structures and partition function of RNAs</description>
3 <macros>
4 <token name="@EXECUTABLE@">RNAfold</token>
5 <import>macros.xml</import>
6 </macros>
7 <expand macro="requirements" />
8 <expand macro="stdio" />
9 <expand macro="version_command" />
10 <command>
11 <![CDATA[
12 #if str($input_source.select_fasta) == "false"
13 #if str($input_source.input_sequence).lstrip()[0] == ">"
14 echo "${input_source.input_sequence}" > "input.fasta" &&
15 #else
16 echo ">Sequence" > "input.fasta" &&
17 echo "${input_source.input_sequence}" >> "input.fasta" &&
18 #end if
19 #end if
20 RNAfold
21 -T $temperature
22 --dangles=$dangling
23 #if $layout_type ==0
24 --layout-type=$general_options.layout_type
25 #end if
26 #if $measelect.mea == "yes":
27 --MEA=$measelect.meavalue
28 #if $measelect.pfScale <> 1.07
29 --pfScale=$measelect.pfScale
30 #end if
31 #else
32 $measelect.pf
33 #if $measelect.pfScale <> 1.07
34 --pfScale=$measelect.pfScale
35 #end if
36 #end if
37 $advancedOptions.noconversion
38 $advancedOptions.gquad
39 $advancedOptions.nolp
40 $advancedOptions.nogu
41 $advancedOptions.noclosinggu
42 $advancedOptions.notetra
43 $advancedOptions.circular
44 #if $advancedOptions.bppmThreshold <> 1e-5
45 --bppmThreshold=$advancedOptions.bppmThreshold
46 #end if
47 #if $advancedOptions.nsp
48 --nsp='$advancedOptions.nsp'
49 #end if
50 #if $advancedOptions.betaScale <> 1.0
51 --betaScale=$advancedOptions.betaScale
52 #end if
53 #if $constraints.maxBPspan <> -1
54 --maxBPspan=$constraints.maxBPspan
55 #end if
56 #if str($constraints.constraintLocation.constraintSelector) == "fromFile"
57 --constraint='$constraints.constraintLocation.constraintsFile'
58 $constraints.constraintLocation.batch
59 $constraints.constraintLocation.canonicalBPonly
60 $constraints.constraintLocation.enforceConstraint
61 #end if
62 #if str($constraints.shapeOption.shapeSelector) == "isUsed"
63 --shape='$constraints.shapeOption.shapeFile'
64 #if str($constraints.shapeOption.shapeMethod.methodSelector) == "W"
65 #set $s="W"
66 --shapeMethod=$s
67 #else if str($constraints.shapeOption.shapeMethod.methodSelector) == "Z"
68 #set $s="Zb"+str($constraints.shapeOption.shapeMethod.b)
69 --shapeMethod=$s
70 #if str($constraints.shapeOption.shapeMethod.shapeConversion.conversionSelector) == "C"
71 #set $c="C"+str($constraints.shapeOption.shapeMethod.shapeConversion.c)
72 --shapeConversion=$c
73 #else if str($constraints.shapeOption.shapeMethod.shapeConversion.conversionSelector) == "L"
74 #set $c="Ls"+str($constraints.shapeOption.shapeMethod.shapeConversion.s)+"i"+ str($constraints.shapeOption.shapeMethod.shapeConversion.i)
75 --shapeConversion=$c
76 #else if str($constraints.shapeOption.shapeMethod.shapeConversion.conversionSelector) == "O"
77 #set $c="Os"+str($constraints.shapeOption.shapeMethod.shapeConversion.s)+"i"+ str($constraints.shapeOption.shapeMethod.shapeConversion.i)
78 --shapeConversion=$c
79 #else
80 #set $c=str($constraints.shapeOption.shapeMethod.shapeConversion.conversionSelector)
81 --shapeConversion=$c
82 #end if
83 #else if str($constraints.shapeOption.shapeMethod.methodSelector) == "D"
84 #set $s="Dm"+str($constraints.shapeOption.shapeMethod.m)+"b"+str($constraints.shapeOption.shapeMethod.b)
85 --shapeMethod=$s
86 #end if
87 #end if
88 #if $constraints.motif
89 --motif='$constraints.motif'
90 #end if
91 <
92 #if str($input_source.select_fasta) == "false"
93 "input.fasta"
94 #else
95 "${input_source.fasta_input}"
96 #end if
97 > '$tabular_file'
98 ]]>
99 </command>
100
101 <inputs>
102 <conditional name="input_source">
103 <param name="select_fasta" type="select" label="Input from FASTA file">
104 <option value="true" selected="true">Use FASTA</option>
105 <option value="false">Provide sequence as text-field</option>
106 </param>
107 <when value="true">
108 <param format="fasta" name="fasta_input" type="data" label="Sequence to fold (FASTA file)"/>
109 </when>
110 <when value="false">
111 <param name="input_sequence" type="text" label="Input sequence"/>
112 </when>
113 </conditional>
114 <param name="temperature" type="float" value="37.0" label="Temperature [°C]" argument="-T"/>
115 <param name="dangling" type="select" label="How to treat dangling end energies" argument="-d">
116 <option value="0">0: ignore dangling ends</option>
117 <option value="1">1: unpaired bases participate in one dangling end only</option>
118 <option value="2" selected="True">2: unpaired bases participate in all dangling ends</option>
119 <option value="3">3: allow coaxial stacking</option>
120 </param>
121 <param name="layout_type" type="select" label="Layout algorithm" argument="--layout_type" >
122 <option value="1" selected="true">Default: Naview layout</option>
123 <option value="0">Simple radial layout</option>
124 </param>
125 <conditional name="measelect">
126 <param name="mea" type="select" label="Calculate Maximum Expected accuracy" argument="--MEA">
127 <option value="no">No</option>
128 <option value="yes">Yes</option>
129 </param>
130 <when value="yes">
131 <param name="meavalue" type="float" value="1.0" label="Gamma Value"/>
132 <param argument="--pfScale" type="float" value="1.07" label="Scaling factor" help="In the calculation of the pf use scale*mfe as an estimate for the ensemble free energy (used to avoid overflows). The default is 1.07, useful values are 1.0 to 1.2. Occasionally needed for long sequences."/>
133 </when>
134 <when value="no">
135 <param name="pf" type="boolean" checked="false" truevalue="--partfunc" falsevalue="" label="Calculate Partition Function" help="--partfunc"/>
136 <param argument="--pfScale" type="float" value="1.07" label="Scaling factor" help="In the calculation of the pf use scale*mfe as an estimate for the ensemble free energy (used to avoid overflows). The default is 1.07, useful values are 1.0 to 1.2. Occasionally needed for long sequences."/>
137 </when>
138 </conditional>
139 <section name="advancedOptions" title="Advanced options">
140 <param name="nolp" type="boolean" truevalue="" falsevalue="--noLP" checked="true" label="Allow lonely base-pairs" help="(--noLP)"/>
141 <param name="nogu" type="boolean" truevalue="" falsevalue="--noGU" checked="true" label="Allow GU pairing" help="--noGU"/>
142 <param name="noclosinggu" type="boolean" truevalue="" falsevalue="--noClosingGU" checked="true" label="Allow GU pairing at the ends" help="Allow pairing of G and U at the ends of helices. --noClosingGU"/>
143 <param name="notetra" type="boolean" truevalue="" falsevalue="--noTetra" checked="true" label="Allow stabilization for loops, hairpins etc." help=" Include special tabulated stabilizing energies for tri-, tetra- and hexaloop hairpins. Mostly for testing. (--noTetra)"/>
144 <param name="noconversion" type="boolean" truevalue="" falsevalue="--noconv" checked="true" label="Convert Thymine to Uracil (T -> U)" help="Avoids confusion with DNA sequences (--noconv)"/>
145 <param name="gquad"
146 type="boolean"
147 truevalue="--gquad"
148 falsevalue=""
149 checked="false"
150 label="Take G Quadruplex formation into account"
151 argument="-g"/>
152 <param name="circular"
153 type="boolean"
154 truevalue="--circ"
155 falsevalue=""
156 checked="false"
157 label="Model as circular RNA structure"
158 argument="--circ"/>
159 <param name="bppmThreshold"
160 type="float"
161 value="1e-5"
162 label="Threshold for base pair probabilities"
163 help="By setting the threshold the base pair probabilities that are included in the output can be varied. By default only those exceeding 1e−5 in probability will be shown as squares in the dot plot. Changing the threshold to any other value allows for increase or decrease of data."
164 argument="--bppmThreshold"/>
165 <param name="nsp"
166 type="text"
167 value=""
168 label="Allow other pairs in addition to the usual AU,GC,and GU pairs."
169 help="Its argument is a comma separated list of additionally allowed pairs. If the first character is '-' then AB will imply that AB and BA are allowed pairs. e.g. RNAfold -nsp -GA will allow GA and AG pairs. Nonstandard pairs are given 0 stacking energy."
170 argument="--nsp"/>
171 <param name="betaScale"
172 type="float"
173 value="1.0"
174 label="Scaling of Boltzman factors"
175 help=" The argument provided with this option enables to scale the thermodynamic temperature used in the Boltzmann factors independently from the temperature used to scale the individual energy contributions of the loop types."
176 argument="--betaScale"/>
177 </section>
178 <section name="constraints" title="Structure constraints">
179 <param name="maxBPspan" type="integer" value="-1" label="Set the maximum base pair span" help="" argument="--maxBPspan"/>
180 <conditional name="constraintLocation">
181 <param name="constraintSelector" type="select" label="Constraints">
182 <!-- <option value="fromInput">The constraints are included in the input file</option> -->
183 <option value="fromFile">The constraints are in a seperate file</option>
184 <option value="none" selected="true">Don't use constraints</option>
185 </param>
186 <!-- <when value="fromInput"></when> -->
187 <when value="none"></when>
188 <when value="fromFile">
189 <param name="constraintsFile" type="data" format="*" label="Constraints file" argument="--constraint"/>
190 <param name="batch" type="boolean" checked="false" truevalue="--batch" falsevalue=""
191 label="Use constraints for all alignment records"
192 help="Usually, constraints provided from input file are only applied to a single sequence alignment. Therefore, RNAalifold will stop its computation and quit after the first input alignment was processed. Using this switch, RNAalifold processes all sequence alignments in the input and applies the same provided constraints to each of them."
193 argument="--batch"/>
194 <param argument="--canonicalBPonly" type="boolean" truevalue="--canonicalBPonly" falsevalue="" checked="false" label="Remove non-canonical base pairs from he structure constraint" />
195 <param argument="--enforceConstraint" type="boolean" truevalue="--enforceConstraint" falsevalue="" checked="false" label="Enforce base pair given by round brackets () in structure constraint" />
196 </when>
197 </conditional>
198 <conditional name="shapeOption">
199 <param name="shapeSelector" type="select" label="Shape reactivity data">
200 <option value="isUsed">Use shape reactivity data</option>
201 <option value="notUsed" selected="true">Don't use shape reactivity data</option>
202 </param>
203 <when value ="isUsed">
204 <param type="data" name="shapeFile" format="shape,*" label="Shape file" argument="--shape"/>
205 <conditional name="shapeMethod">
206 <param name="methodSelector" type="select" label="Shape reactivity data" argument="--shapeMethod">
207 <option value="D" selected="true">D: Convert by using a linear equation according to Deigan et al 2009</option>
208 <option value="Z">Z: Convert SHAPE reactivities to pseudo energies according to Zarringhalam et al 2012.</option>
209 <option value="W">W: Apply a given vector of perturbation energies to unpaired nucleotides according to Washietl et al 2012</option>
210 </param>
211 <when value="D">
212 <param name="m" type="float" value="1.8" label="Slope m"/>
213 <param name="b" type="float" value="-0.6" label="Intercept"/>
214 </when>
215 <when value="Z">
216 <param name="b" type="float" value="-0.6" label="Intercept"/>
217 <conditional name="shapeConversion">
218 <param name="conversionSelector" type="select" label="shape reactivity data">
219 <option value="M">M: Use linear mapping according to Zarringhalam et al</option>
220 <option value="C">C: Use a cutoff−approach to divide into paired and unpaired nucleotides</option>
221 <option value="S">S: Skip the normalizing step since the input data already represents probabilities for being unpaired rather than raw reactivity values</option>
222 <option value="L">L: Use a linear model to convert the reactivity into a probability for being unpaired</option>
223 <option value="O" selected="true">O: Use a linear model to convert the log of the reactivity into a probability for being unpaired</option>
224 </param>
225 <when value="M">
226 </when>
227 <when value="C">
228 <param name="c" type="float" value="0.25" label="Cutoff"/>
229 </when>
230 <when value="S">
231 </when>
232 <when value="L">
233 <param name="s" type="float" value="0.68" label="Slope"/>
234 <param name="i" type="float" value="0.2" label="Intercept"/>
235 </when>
236 <when value="O">
237 <param name="s" type="float" value="1.6" label="Slope s"/>
238 <param name="i" type="float" value="-2.29" label="Intercept"/>
239 </when>
240 </conditional>
241 </when>
242 <when value="W">
243 </when>
244 </conditional>
245 </when>
246 <when value="notUsed">
247 </when>
248 </conditional>
249 <param argument="--motif" type="text" value="" label="Sequence structure energy" help="Specify stabilizing effect of ligand binding to a particular sequence/structure motif. Some ligands binding to RNAs require and/or induce particular sequence and structure motifs. For instance they bind to an interior loop, or small hairpin loop. If for such cases a binding free energy is known, the binding and therefore stabilizing effect of the ligand can be included in the folding recursions. Interior loop motifs are specified as concatenations of 5’ and 3’ motif, separated by an ’&amp;’ character. Energy contributions must be specified in kcal/mol."/>
250 </section>
251 <section name="IDs" title="Naming Conventions">
252 <param name="auto_id"
253 type="boolean" truevalue="--auto-id" falsevalue="" checked="false"
254 label="Automatically generate an ID for each alignment."
255 help="If this flag is active, RNAalifold ignores any IDs retrieved from the input and automatically generates an ID for each alignment."
256 argument="--auto-id"/>
257 <param name="id_prefix"
258 type="text" value="alignment"
259 label="Prefix for automatically generated IDs (as used in output file names)"
260 help="If this parameter is set, each alignment will be prefixed with the provided string. Hence, the output files will obey the following naming scheme: 'prefix_xxxx_ss.ps' (secondary structure plot), 'prefix_xxxx_dp.ps' (dot−plot), 'prefix_xxxx_aln.ps' (annotated alignment), etc. where xxxx is the alignment number beginning with the second alignment in the input. Use this setting in conjunction with the −−continuous−ids flag to assign IDs beginning with the first input alignment."
261 argument="--id-prefix"/>
262 <param name="id_digits"
263 type="integer" value="4" min="1" max="18"
264 label="The number of digits of the counter in automatically generated alignment IDs"
265 help="When alignments IDs are automatically generated, they receive an increasing number, starting with 1. This number will always be left−padded by leading zeros, such that the number takes up a certain width. Using this parameter, the width can be specified to the users need. We allow numbers in the range [1:18]."
266 argument="--id-digits"/>
267 <param name="id_start"
268 type="integer" value="1" min="0"
269 label="First number in automatically generated alignment IDs"
270 help="When alignment IDs are automatically generated, they receive an increasing number, usually starting with 1. Using this parameter, the first number can be specified to the users requirements. Note: negative numbers are not allowed. Note: Setting this parameter implies continuous alignment IDs, i.e. it activates the −−continuous−ids flag.."
271 argument="--id-start"/>
272 </section>
273 </inputs>
274 <outputs>
275 <data format="dbn" name="tabular_file"/>
276 <collection name="sequence_outputs" type="list" label="rna_eps outputs">
277 <discover_datasets pattern="(?P&lt;designation&gt;.+)_ss\.ps" ext="eps" />
278 </collection>
279 <collection name="matrix_outputs" type="list" label="rna_eps outputs">
280 <filter>measelect['pf'] is True</filter>
281 <discover_datasets pattern="(?P&lt;designation&gt;.+)_dp\.ps" ext="rna_eps" visible="true"/>
282 </collection>
283 </outputs>
284 <tests>
285 <test>
286 <param name="select_fasta" value="true" />
287 <param name="fasta_input" value="rnafold_input1.fa"/>
288 <output name="out_file1" file="rnafold_result1.txt"/>
289 </test>
290
291 <test>
292 <param name="select_fasta" value="true" />
293 <param name="fasta_input" value="rnafold_input2.fa"/>
294 <param name="temperature" value="75"/>
295 <output name="out_file1" file="rnafold_result2.txt"/>
296 </test>
297
298 <test>
299 <param name="select_fasta" value="false" />
300 <param name="input_sequence" value="TGGGAATTAGCTCAAATGGTAGAGCGCTCGCTTAGCATGTGAGAGGTAGTGGGATCGATGCCCACATTCTCCA"/>
301 <output name="out_file1" file="rnafold_result3.txt"/>
302 </test>
303 </tests>
304 <help>
305 <![CDATA[
306 **RNAfold**
307
308 The program reads RNA sequences, calculates their minimum free
309 energy (mfe) structure and the mfe structure in dot-bracket notation.
310
311 If the -p option was given it also computes the
312 partition function (pf) and base pairing probability matrix.
313
314 The dot plot of the base pairing probability matrix shows a matrix of squares with area proportional to the pairing
315 probability in the upper right half, and one square for each pair in the
316 minimum free energy structure in the lower left half. For each pair i-j with
317 probability p>10E-6 there is a line of the form
318
319 i j sqrt(p) ubox
320
321 in the PostScript file, so that the pair probabilities can be easily extracted.
322
323 The sequences have to be provided in FASTA format. The first word (max. 42 char) of the FASTA header will be used for output file names. PostScript files "name_ss.ps" and "name_dp.ps" are produced for the structure and dot plot, respectively.
324 The program will read the whole FASTA input file and provide output for each found sequence.
325
326
327 -----
328
329 **Input format**
330
331 RNAfold requires one input file or a plain RNA sequence
332
333 ------
334
335 **Outputs**
336
337 - Secondary structures in dot-bracket notation
338
339 - several possible postscript images bundled together in a tar file
340 - secondary structure for each sequence in the input file
341 - if partition function is calculated (--MEA or --partfunc is set) then also the pairing probabilty matrix is generated for each sequence
342
343 ]]>
344 </help>
345 <expand macro="citations" />
346 </tool>