comparison dsCompareCurves.xml @ 7:ef6b589a3715 draft default tip

More documentation to match the Wiki
author gtrichard
date Wed, 07 Aug 2019 11:23:52 -0400
parents
children
comparison
equal deleted inserted replaced
6:a6f0d3b1d891 7:ef6b589a3715
1 <tool id="deepstats_compare_curves" name="dsCompareCurves" version="@WRAPPER_VERSION@.0" profile="18.01">
2 <description>
3 compares multiple genomic scores at multiple regions sets by bootstraps and per-bin distribution test
4 </description>
5 <macros>
6 <token name="@BINARY@">dsCompareCurves</token>
7 <import>deepStats_macros.xml</import>
8 </macros>
9 <expand macro="requirements" />
10 <command>
11 <![CDATA[
12 @BINARY@
13 --input '$input'
14 --output 'output'
15 --comparison '$comparison'
16 --signalName '$signalName'
17 --scoreLabels '$nameLabels.scoreLabels'
18 --regionLabels '$nameLabels.regionLabels'
19
20 #if $scaleRegions.showScaleRegionsOpt == "yes":
21 --firstRegionName '$scaleRegions.firstRegionName'
22 --secondRegionName '$scaleRegions.secondRegionName'
23 #else
24 --firstRegionName '$scaleRegions.firstRegionName'
25 #end if
26
27 --bootstraps '$statsOptions.bootstraps'
28 --bootstrapsCI '$statsOptions.bootstrapsCI'
29 --wilcoxThreshold '$statsOptions.wilcoxThreshold'
30 --bootPlotShareY '$plotOptions.bootPlotShareY'
31 --bootPlotRatio '$plotOptions.bootPlotRatio'
32 --bootPlotWidth '$plotOptions.bootPlotWidth'
33 --bootPlotHeight '$plotOptions.bootPlotHeight'
34 --wilcoxPlotWidth '$plotOptions.wilcoxPlotWidth'
35 --wilcoxPlotHeight '$plotOptions.wilcoxPlotHeight'
36 --CPU '$advancedOptions.CPU'
37
38 #if $fontOptions.showFontOptions == "yes":
39 --font '$fontOptions.font_file'
40 #end if
41
42 #if $colorsOptions.showColorsOptions == "yes":
43 --bootPlotColors '$colorsOptions.bootPlotColors'
44 #end if
45 ]]>
46 </command>
47 <inputs>
48 <param argument="--input" format="tabular" type="data"
49 label="deepTools computeMatrix output file."/>
50
51 <param argument="--comparison" type="select"
52 label="What do you want to compare?">
53 <option value="scores" selected="true">scores</option>
54 <option value="regions">regions</option>
55 </param>
56
57 <param argument="--signalName" type="text" value= "Normalized ATAC-seq counts"
58 label="Name of the genomic signal" help="Name given to the signal on the plots, \n can be added for linebreaks."/>
59
60 <conditional name="scaleRegions">
61 <param name="showScaleRegionsOpt" type="select" label="Which mode was used in deepTools computeMatrix?">
62 <option value="reference-point" selected="true">reference-point</option>
63 <option value="scale-regions">scale-regions</option>
64 </param>
65 <when value="scale-regions">
66 <param argument="--firstRegionName" type="text" value="TSS" size="10"
67 label="Label for the region start"
68 help ="Label shown in the plot
69 for the start of the region. Default is TSS (transcription start site),
70 but could be changed to anything, e.g. &quot;peak start&quot;." />
71 <param argument="--secondRegionName" type="text" value="TES" size="10"
72 label="Label for the region end"
73 help ="Label shown in the plot
74 for the end of the region. Default is TES (transcription end site),
75 but could be changed to anything, e.g. &quot;peak end&quot;." />
76 </when>
77 <when value="reference-point">
78 <param argument="--firstRegionName" type="text" value="TSS"
79 label="Label for the region start"
80 help ="Label shown in the plot
81 for the start of the region. Default is TSS (transcription start site),
82 but could be changed to anything, e.g. &quot;peak start&quot;." />
83 </when>
84 </conditional>
85
86 <section name="nameLabels" title="Customize score and region labels" expanded="false">
87 <param argument="--scoreLabels" optional="true" type="text" value= ""
88 label="Name of the scores" help="For plot display. It must be provided as text seperated
89 by semi-colons, i.e. 'Score A;Score B;Score C' as in the example.">
90 <sanitizer>
91 <valid initial="string.printable"/>
92 </sanitizer>
93 </param>
94
95 <param argument="--regionLabels" optional="true" type="text" value= ""
96 label="Name of the regions" help="For plot display. It must be provided as text seperated
97 by semi-colons, i.e. 'Regions A;Regions B;Regions C' as in the example.">
98 <sanitizer>
99 <valid initial="string.printable"/>
100 </sanitizer>
101 </param>
102 </section>
103
104 <section name="statsOptions" title="Statistics options" expanded="false">
105 <param argument="--bootstraps" type="integer" value="1000"
106 label="--bootstraps" help="Number of bootstraps to perform. Default is 1000,
107 increasing this number will increase the computing time."/>
108 <param argument="--bootstrapsCI" type="float" value="0.95"
109 label="--bootstrapsCI" help="Bootstraps confidence interval. Default is 0.95,
110 increasing this will make the analysis more stringent by increasing the min and max of the shadowed area on the bootstrap plot."/>
111 <param argument="--wilcoxThreshold" type="float" value="0.05"
112 label="--wilcoxThreshold" help="Threshold used to define significant
113 bins on the Wilcoxon rank-sum test plot (grey box). Default is 0.05"/>
114 </section>
115
116 <section name="plotOptions" title="Plotting options" expanded="false">
117 <param argument="--bootPlotShareY" type="select" label="--bootPlotShareY">
118 <option value="TRUE" selected="true">TRUE</option>
119 <option value="FALSE">FALSE</option>
120 </param>
121 <param argument="--bootPlotRatio" type="float" value="0.85" label="--bootPlotRatio"
122 help="Changes the aspect ratio of the plot. A value inferior to 1 results in a wide plot,
123 a value above 1 results in a narrow plot. Default: 0.85."/>
124
125 <param argument="--bootPlotWidth" type="float" value="5.2" label="--bootPlotWidth"
126 help="How large the bootstraps plot should be."/>
127
128 <param argument="--bootPlotHeight" type="float" value="3.7" label="--bootPlotHeight"
129 help="How tall the bootstraps plot should be."/>
130
131 <param argument="--wilcoxPlotWidth" type="float" value="4.6" label="--wilcoxPlotWidth"
132 help="How large the Wilcoxon rank-sum test plot should be."/>
133
134 <param argument="--wilcoxPlotHeight" type="float" value="4.6" label="--wilcoxPlotHeight"
135 help="How tall the Wilcoxon rank-sum test plot should be."/>
136 </section>
137
138 <section name="advancedOptions" title="Computing options" expanded="false">
139 <param argument="--CPU" type="integer" value="4" label="--CPU"
140 help="Number of CPU to use."/>
141 </section>
142
143 <conditional name="fontOptions">
144 <param name="showFontOptions" type="select" label="Customize font?">
145 <option value="No" selected="true">No</option>
146 <option value="Yes">Yes</option>
147 </param>
148 <when value="No"/>
149 <when value="Yes">
150 <param argument="--font" type="file" format="ttf" value=" " label="--font" optional="true"
151 help="Font used for plotting, given a TTF file. Default is usually Helvetica."/>
152 </when>
153 </conditional>
154
155 <conditional name="colorsOptions">
156 <param name="showColorsOptions" type="select" label="Customize colors?">
157 <option value="No" selected="true">No</option>
158 <option value="Yes">Yes</option>
159 </param>
160 <when value="No"/>
161 <when value="Yes">
162 <param argument="--bootPlotColors" type="file" format="tabular" value=" " label="--bootPlotColors"
163 help="Change the bootstraps plot color palette to a user-provided one. The file must
164 be tab-delimited and contain for each line two HTML color codes ( #3366CC #769EF2 ).
165 The first column corresponds to the mean color, the second column corresponds to the
166 color of the bootstrap confidence interval shadowed area. The default color scale
167 contains 6 colors that are color blind friendly using the dichromat R package."/>
168 </when>
169 </conditional>
170
171 </inputs>
172 <outputs>
173 <data format="pdf" name="pdf1" label="${tool.name} on ${on_string}: Bootstrap Plot" from_work_dir="output_bootstraps.pdf"/>
174 <data format="pdf" name="pdf2" label="${tool.name} on ${on_string}: Wilcox Plot" from_work_dir="output_wilcoxon.pdf"/>
175 </outputs>
176 <tests>
177 <test>
178 </test>
179 </tests>
180 <help><![CDATA[
181
182 .. role:: raw-html(raw)
183 :format: html
184
185 .. image:: https://raw.githubusercontent.com/gtrichard/deepStats/master/docs/images/deepStats_logo.png
186 :width: 400
187
188 :raw-html:`<br />`
189
190 dsCompareCurves: Comparing multiple genomic scores at multiple regions sets
191 ===========================================================================
192
193 **deepStats** aims at providing statistical analyses and streamlining the production of high quality, color-blind friendly, and fully customisable plots (up to the fonts!) for your classic genomic datasets (.bed, .bigwig, gene lists). The goal of deepStats is thus to significantly decrease the amount of time spent in Inkscape/Illustrator to get publication ready plots, and decreasing the research time alloted to finding proper statistical analyses for your genomic signals and datasets.
194
195 ``dsCompareCurves`` assesses if multiple genomics signals (ChIP-seq, ATAC-seq, etc as .bigwig files) are significantly different or not for multiple region sets (.bed files), and specifically on which bins. ``dsCompareCurves`` uses two methods to do so: bootstraps and per-bin Bonferroni corrected Wilcoxon Rank-sum tests. The input for ``dsCompareCurves`` comes from deepTools ``computeMatrix --outFileNameMatrix``, that thus must be used prior to ``dsCompareCurves``.
196
197 In a nutshell, ``dsCompareCurves`` is replacing deepTools ``plotProfile``, but with customisable, scalable and publication ready plots, in addition to providing statistical analyses.
198
199 ``dsCompareCurves`` compares regions for each signal (``--comparison regions``), or compares all signals for each region set (``--comparison scores``).
200
201 Concerning the plots and as the other deepStats tools, a lot of parameters can be customized: plot colors (although the basic color scale is color-blind friendly), fonts, plot size and size ratio.
202
203
204 _______________
205
206
207 Example usage
208 -------------
209
210 Below you can find an example of regions comparison.
211
212 We consider two set of regions, conserved genes, and unconserved genes in Drosophila melanogaster. We want to know which histone marks from modENCODE are differentially enriched between these two regions sets.
213
214 Prior to ``dsCompareCurves``, we used **deepTools** ``computeMatrix scale-regions`` with the two bed files as regions, and the three histone marks bigwig tracks as scores. We also added the optional parameter ``outFileNameMatrix`` in order to get the output as a tab-delimited file (.txt).
215
216 For more information about deepTools computeMatrix: https://deeptools.readthedocs.io/en/develop/content/tools/computeMatrix.html
217
218 The latter file `deeptools_computeMatrix_output.txt ` is then used as input for the present tool in "regions" mode, in order to compare the conserved and unconserved genes for each one of the three histone marks scores.
219
220 You can find an image describing the outputs below using the said data set and the parameters used for the same analysis on Galaxy:
221
222 .. class:: bold
223
224 `Example parameters`_
225
226 .. _Example parameters: https://raw.githubusercontent.com/gtrichard/deepStats/master/docs/images/dsCompareCurves_galaxy.png
227
228 :raw-html:`<br />`
229
230 Output description
231 ++++++++++++++++++
232
233 .. image:: https://raw.githubusercontent.com/gtrichard/deepStats/master/docs/images/dsCompareCurves_doc.png
234 :width: 800
235
236 ]]></help>
237 <expand macro="citations" />
238 </tool>