comparison rnasnp.xml @ 0:327f5721612f draft default tip

planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/rnasnp commit 6e51a331dbeab2786d8df5fd379ae3a63eb61d83
author rnateam
date Tue, 13 Dec 2016 12:31:56 -0500
parents
children
comparison
equal deleted inserted replaced
-1:000000000000 0:327f5721612f
1 <tool id="rnasnp" name="RNAsnp" version="1.2.0">
2 <description> Efficient detection of local RNA secondary structure changes induced by SNPs </description>
3 <!-- Dependency: the rnasnp package, version 1.2. -->
4 <requirements>
5 <requirement type="package" version="1.2">rnasnp</requirement>
6 </requirements>
7 <!-- Exit-code policy: 1 and every negative code are fatal; codes of 2 and above are only reported as warnings. -->
8 <stdio>
9 <exit_code range="1" level="fatal" description="Error occurred. Please check Tool Standard Error" />
10 <exit_code range=":-1" level="fatal" description="Error occurred. Please check Tool Standard Error" />
11 <exit_code range="2:" level="warning" description="Warning: Tool exited with error_code != 0" />
12 </stdio>
13 <!-- Command run to report the RNAsnp version. -->
14 <version_command>RNAsnp --version</version_command>
15 <command>
16 <![CDATA[
17 ## Assemble the RNAsnp call: sequence and mode first, then only the options of the selected mode, then the shared options. Dataset paths are single-quoted for the shell.
18 RNAsnp
19 --seq='$seq'
20 --mode=$mode.mode_selector
21 #if $mode.mode_selector == "1"
22 --snp='$mode.snp'
23 --cutoff=$mode.cutoff
24 --minLen=$mode.minLen
25 #end if
26 #if $mode.mode_selector == "2"
27 --snp='$mode.snp'
28 --winsize=$mode.winsize
29 --span=$mode.span
30 --regionX=$mode.regionX
31 --regionY=$mode.regionY
32 #end if
33 #if $mode.mode_selector == "3"
34 --pvalue1=$mode.pvalue1
35 --pvalue2=$mode.pvalue2
36 --winsizeExt=$mode.winsizeExt
37 #end if
38 --edist=$edist
39 --boltzmannPreFactor=$boltzmannPreFactor
40 --winsizeFold=$mode.winsizeFold
41 > '$outfile'
42
43 ]]>
44 </command>
45 <inputs> <!-- Sequence input, one conditional branch per operating mode, then two options shared by every mode. -->
46 <param argument="--seq" format="txt" type="data" label="Input Sequence File" />
47 <conditional name="mode">
48 <param name="mode_selector" type="select" label="Mode of operation">
49 <option value="1" selected="true">1: Perform global folding by using RNAfold</option>
50 <option value="2">2: Perform local folding by using RNAplfold</option>
51 <option value="3">3: Screen putative structure-disruptive SNPs in an RNA sequence</option>
52 </param>
53 <when value="1">
54 <param argument="--snp" format="txt" type="data" label="List of SNP" help="The list of SNPs to be tested have to be provided in separate lines"/>
55 <param argument="--winsizeFold" type="select" label="Folding windows size" help="Length of flanking sequence on either side of SNP considered for folding. please make sure that the input sequence is at least twice the size of chosen flanking. This restriction is necessary to keep the size of parameter tables for the p-value calculations manageable. In case the input sequence is less than twice the size of chosen flanking, the RNAsnp takes the nts up to the start and end position of the given sequence from the SNP position and perform the analysis.">
56 <option value="100"></option> <option value="150" ></option>
57 <option value="200" selected="true"></option> <option value="250"></option> <option value="300"></option> <option value="350"></option> <option value="400"></option> <option value="450"></option>
58 <option value="500"></option> <option value="600"></option> <option value="650"></option> <option value="700"></option> <option value="750"></option> <option value="800"></option>
59 </param>
60 <!-- NOTE(review): 550 is missing from all three window-size lists; confirm whether RNAsnp accepts it before adding. -->
61 <param argument="--cutoff" type="float" value="0.01" min="0" label="Cut-off" help="Cut-off for the base pair probabilities."/>
62 <param argument="--minLen" type="integer" value="50" min="1" label="Minimum length of the sequence interval" help="The structural difference between wild-type and mutant is computed for all sequence intervals with the selected minimum length" />
63 </when>
64 <when value="2">
65 <param argument="--snp" format="txt" type="data" label="List of SNP" help="The list of SNPs to be tested have to be provided in separate lines"/>
66 <param argument="--winsizeFold" type="select" label="Folding windows size" help="Length of flanking sequence on either side of SNP considered for folding. please make sure that the input sequence is at least twice the size of chosen flanking. This restriction is necessary to keep the size of parameter tables for the p-value calculations manageable. In case the input sequence is less than twice the size of chosen flanking, the RNAsnp takes the nts up to the start and end position of the given sequence from the SNP position and perform the analysis.">
67 <option value="200" selected="true"></option> <option value="250"></option> <option value="300"></option> <option value="350"></option> <option value="400"></option> <option value="450"></option>
68 <option value="500"></option> <option value="600"></option> <option value="650"></option> <option value="700"></option> <option value="750"></option> <option value="800"></option>
69 </param>
70 <!-- NOTE(review): the mode 2 section of the command never reads the cutoff value below; confirm whether it should be passed or the parameter dropped. -->
71 <param argument="--cutoff" type="float" value="0.01" min="0" label="Cut-off" help="Cut-off for the base pair probabilities."/>
72 <param argument="--winsize" type="integer" value="200" min="1" label="Windows size" help="Average the pair probabilities over windows of given size"/>
73 <param argument="--span" type="integer" value="120" min="1" label="Span" help="Set the maximum allowed separation of a base pair to span. i.e. no pairs (i,j) with j-i > L will be allowed."/>
74 <param argument="--regionX" type="integer" value="20" min="1" label="Length of the local structural element that we expect to have an effect" help=""/>
75 <param argument="--regionY" type="integer" value="120" min="1" label="Length of the interval over which the local structural changes are evaluated" help=""/>
76 </when>
77 <when value="3">
78 <param argument="--winsizeFold" type="select" label="Folding windows size" help="Length of flanking sequence on either side of SNP considered for folding. please make sure that the input sequence is at least twice the size of chosen flanking. This restriction is necessary to keep the size of parameter tables for the p-value calculations manageable. In case the input sequence is less than twice the size of chosen flanking, the RNAsnp takes the nts up to the start and end position of the given sequence from the SNP position and perform the analysis.">
79 <option value="200" selected="true"></option> <option value="250"></option> <option value="300"></option> <option value="350"></option> <option value="400"></option> <option value="450"></option>
80 <option value="500"></option> <option value="600"></option> <option value="650"></option> <option value="700"></option> <option value="750"></option> <option value="800"></option>
81 </param>
82 <param argument="--pvalue1" type="float" value="0.4" min="0" label="p-value threshold to filter SNPs that are predicted using Mode 2" help=""/>
83 <param argument="--pvalue2" type="float" value="0.1" min="0" label="p-value threshold to filter SNPs that are predicted using Mode 1" help=""/>
84 <param argument="--winsizeExt" type="integer" value="200" min="1" label="Windows size" help="size of the flanking region on either side of SNP that includes the local window returned by Mode 2. This subsequence is then passed to Mode 1 for re-computation"/>
85 </when>
86 </conditional>
87 <param argument="--edist" type="integer" value="0" min="0" label="Ensemble Euclidean distance" help="compute ensemble Euclidean distance between the distribution of structures between two sequences"/>
88 <param argument="--boltzmannPreFactor" type="float" value="1" label="Boltzmann PreFactor" help="Multiply the Boltzmann factor with a prefactor alpha"/>
89
90 </inputs>
91 <outputs> <!-- Single dataset; the command redirects RNAsnp's standard output into it. -->
92 <data name="outfile" format="tabular" />
93 </outputs>
94 <tests> <!-- One regression test: mode 1 on seq1.txt with snp1.txt, compared against seq1_snp1_mode1.out. Modes 2 and 3 have no test here. -->
95 <test>
96 <param name="seq" value="seq1.txt"/>
97 <conditional name="mode">
98 <param name="mode_selector" value="1"/>
99 <param name="snp" value="snp1.txt"/>
100 </conditional>
101 <output name="outfile" file="seq1_snp1_mode1.out"/>
102 </test>
103 </tests>
104
105 <help>
106 <![CDATA[
107
108 **What it does**
109 Efficient detection of local RNA secondary structure changes induced by SNPs
110
111
112 RNAsnp requires an RNA sequence and optionally a list of SNPs to be analyzed. The effect of SNPs on local RNA secondary structure can be detected in three possible modes:
113
114 Mode 1: The first mode is designed to compute the effect of SNPs by using global folding. This option should be used only for short input sequences, since the base pair probabilities are calculated using RNAfold.
115
116 Mode 2: The second mode is designed to compute the effect of SNPs on large sequences. Here the local base pair probabilities are calculated using RNAplfold (with the parameters -W 200 and -L 120).
117
118 Mode 3: The third mode is the combination of the above two. It is intended to determine the positions of putative structure-disruptive SNPs using either transcript or genome sequence.
119
120
121 **Input**
122
123 Sequence file must contain one sequence (preferably in FASTA format).
124
125 SNP file must contain the list of SNPs that are given in separate lines. The
126 SNPs are described as, wild-type nucleotide followed by nucleotide position
127 followed by mutant nucleotide. In case of multiple SNPs, the SNPs are delimited
128 by the special character "-".
129
130 Example formats:
131 Single SNP: A201G
132 where, A is the wild-type nucleotide in the given sequence, 201 is the sequence
133 position of wild-type nucleotide and G is the mutant (or SNP).
134
135 Multiple SNPs: A201G-U257A-C260G
136 Multiple SNPs (which occur together) are defined next to each other with
137 the delimiter "-" between them.
138
139
140 **Output**
141
142 SNP w Slen GC interval d pvalue1 ewin interval d_max pvalue2
143
144 G1C 200 3344 0.5522 1-46 0.0421 0.0755 200 1-50 0.1581 0.0183
145
146 G7A 200 3344 0.5556 1-43 0.2236 0.0207 200 1-50 0.1570 0.0996
147
148
149 Output details:
150
151 Column 1: details of the screened SNPs
152
153 Column 2: length of the flanking region considered on either side of the SNP to fold
154
155 Column 3: length of the given input sequence
156
157 Column 4: GC percent of the sequence interval considered for folding
158
159 Column 5-7: results of initial screen returned by mode 2
160
161 Column 8: ewin is the length of the flanking region considered on either side of the SNP that also includes the local interval returned by mode 2. This subsequence is then passed to mode 1 to compute the d_max
162
163 Column 9-11: results of final screen returned by mode 1
164
165
166 Note: By default, the ewin(-e) uses the window length of 200. A higher computation speed is achieved if the ewin value is reduced to 100 or 150; however, there will be little difference in the result compared to ewin with 200. In addition, RNAsnp automatically increases the length of ewin if the defined length is not enough to cover the local interval returned by mode 2.
167
168 ]]>
169
170 </help>
171
172 <citations> <!-- One reference, identified by DOI. -->
173 <citation type="doi">10.1002/humu.22273</citation>
174 </citations>
175
176 </tool>