comparison topGO.xml @ 0:aade04e750fa draft default tip

planemo upload
author lnguyen
date Fri, 15 Sep 2017 10:38:28 -0400
parents
children
comparison
equal deleted inserted replaced
-1:000000000000 0:aade04e750fa
1 <tool id="topGO" name="topGO enrichment analysis" version="0.1.0">
2 <requirements>
3 </requirements>
4 <stdio>
5 <exit_code range="1:" />
6 </stdio>
7 <command><![CDATA[
8
9 #if $inputtype.filetype == "file_all":
10 Rscript --vanilla $__tool_directory__/enrichment_v3.R --inputtype tabfile --input '$inputtype.genelist' --ontology '$ontocat' --option '$option' --threshold '$threshold' --correction '$correction' --textoutput '$condtext.textoutput' --barplotoutput '$condbar.barplotoutput' --dotplotoutput '$conddot.dotplotoutput' --column '$inputtype.column' --geneuniverse '$geneuniverse' --header '$inputtype.header'
11 #end if
12
13
14 #if $inputtype.filetype == "copy_paste":
15 Rscript --vanilla $__tool_directory__/enrichment_v3.R --inputtype copypaste --input '$inputtype.genelist' --ontology '$ontocat' --option '$option' --threshold '$threshold' --correction '$correction' --textoutput '$condtext.textoutput' --barplotoutput '$condbar.barplotoutput' --dotplotoutput '$conddot.dotplotoutput' --column c1 --geneuniverse '$geneuniverse' --header None
16
17 #end if
18
19
20
21 ]]></command>
22
23 <inputs>
24 <conditional name="inputtype">
25 <param name="filetype" type="select" label="Select your type of input file" help="The identifiers must be Ensembl gene IDs (e.g : ENSG00000139618). If it is not the case, please use the ID Mapping tool.">
26 <option value="file_all">Input file containing your identifiers</option>
27 <option value="copy_paste">Copy/paste your list of IDs</option>
28 </param>
29 <when value="copy_paste">
30 <param name="genelist" type="text" label="Enter a list of identifiers"/>
31 </when>
32 <when value="file_all">
33 <param name="genelist" type="data" format="txt,tabular" label="Choose an input file" help="This file must imperatively have 1 column filled with IDs consistent with the database that will be used. Please use the MappingIDs component if this is not the case."/>
34 <param name="column" type="text" label="Please specify the column where you would like to apply the comparison (e.g : Enter c1)" value="c1"/>
35
36 <param name="header" type="select" label="Does your file have a header?" multiple="false" optional="false">
37 <option value="TRUE" selected="true">Yes</option>
38 <option value="FALSE" selected="false">No</option>
39 </param>
40 </when>
41 </conditional>
42 <param name="geneuniverse" type="select" label="Select a specie">
43 <option value="org.At.tair.db" >Arabidopsis</option>
44 <option value="org.Ce.eg.db" >C.elegans</option>
45 <option value="org.Dm.eg.db" >Fly</option>
46 <option value="org.Hs.eg.db" selected="true">Human</option>
47 <option value="org.Mm.eg.db" >Mouse</option>
48 <option value="org.Sc.sqd.db" >Yeast</option>
49 </param>
50
51 <param name="ontocat" type="select" label="Ontology category">
52 <option value="BP" >Biological Process</option>
53 <option value="CC" >Cellular Component</option>
54 <option value="MF" >Molecular Function</option>
55 </param>
56
57 <param name="option" type="select" label="Choose the topGO option for your analysis">
58 <option value="classic" >Classic fisher test</option>
59 <option value="elim" selected="true">Elim</option>
60 <option value="weight01" >Weight01</option>
61 <option value="parentchild" >ParentChild</option>
62 </param>
63 <param name="threshold" type="text" label="Enter the p-value threshold level under the form 1e-level wanted (e.g : 1e-3)" value="1e-3"/>
64 <param name="correction" label="Choose a correction for multiple testing" type="select">
65 <option value="none" >None</option>
66 <option value="holm">Holm correction</option>
67 <option value="hochberg" >Hochberg correction</option>
68 <option value="hommel" >Hommel correction</option>
69 <option value="bonferroni" >Bonferroni correction</option>
70 <option value="BH" selected="true">Benjamini and Hochberg</option>
71 <option value="BY" >Benjamini and Yekutieli</option>
72 <option value="fdr" >FDR</option>
73 </param>
74 <conditional name="condtext">
75 <param name="textoutput" type="select" label="Generate a text file for results">
76 <option value="TRUE">Yes</option>
77 <option value="FALSE">No</option>
78 </param>
79 </conditional>
80 <conditional name="condbar">
81 <param name="barplotoutput" type="select" label="Generate a barplot of over-represented GO terms">
82 <option value="TRUE">Yes</option>
83 <option value="FALSE">No</option>
84 </param>
85 </conditional>
86 <conditional name="conddot">
87 <param name="dotplotoutput" type="select" label="Generate a dotplot of over-represented GO terms">
88 <option value="TRUE">Yes</option>
89 <option value="FALSE">No</option>
90 </param>
91 </conditional>
92 </inputs>
93 <outputs>
94
95 <data name="outputtext" format="tabular" label="Text output for topGO analysis" from_work_dir="result.csv">
96 <filter>condtext['textoutput']=="TRUE"</filter>
97 </data>
98
99 <data name="outputbarplot" format="png" label="Barplot output for topGO analysis" from_work_dir="barplot.png">
100 <filter>condbar['barplotoutput']=="TRUE"</filter>
101 </data>
102
103 <data name="outputdotplot" format="png" label="Dotplot output for topGO analysis" from_work_dir="dotplot.png">
104 <filter>conddot['dotplotoutput']=="TRUE"</filter>
105 </data>
106
107 </outputs>
108 <help><![CDATA[
109
110
111 **Galaxy component based on R package topGO.**
112
113 **Input required**
114
115 This component works with Ensembl gene ids (e.g : ENSG0000013618). You can
116 copy/paste these identifiers or supply a tabular file (.csv, .tsv, .txt, .tab)
117 where there are contained.
118
119 **Principle**
120
121 This component provides the GO terms representativity of a gene list in one ontology category (Biological Process "BP", Cellular Component "CC", Molecular Function "MF"). This representativity is evaluated in comparison to the background list of all human genes associated associated with GO terms of the chosen category (BP,CC,MF). This background is given by the R package "org.Hs.eg.db", which is a genome wide association package for **human**.
122
123 **Output**
124
125 Three kind of outputs are available : a textual output, a barplot output and
126 a dotplot output.
127
128 *Textual output* :
129 The text output lists all the GO-terms that were found significant under the specified threshold.
130
131
132 The different fields are as follow :
133
134 - Annotated : number of genes in org.Hs.eg.db which are annotated with the GO-term.
135
136 - Significant : number of genes belonging to your input which are annotated with the GO-term.
137
138 - Expected : show an estimate of the number of genes a node of size Annotated would have if the significant genes were to be randomly selected from the gene universe.
139
140 - pvalues : pvalue obtained after the test
141
142 - ( qvalues : additional column with adjusted pvalues )
143
144
145 **Tests**
146
147 topGO provides a classic fisher test for evaluating if some GO terms are over-represented in your gene list, but other options are also provided (elim, weight01,parentchild). For the merits of each option and their algorithmic descriptions, please refer to topGO manual :
148 https://bioconductor.org/packages/release/bioc/vignettes/topGO/inst/doc/topGO.pdf
149
150 **Multiple testing corrections**
151
152 Furthermore, the following corrections for multiple testing can also be applied :
153 - holm
154 - hochberg
155 - hommel
156 - bonferroni
157 - BH
158 - BY
159 - fdr
160
161
162
163 ]]></help>
164
165 <tests>
166 <test>
167 <conditional name="inputtype">
168 <param name="filetype " value="tabfile"/>
169 <param name="genelist" value="prot_reactome_EGFR_mapped_ensg.txt"/>
170 <param name="column" value="c1"/>
171 <param name="header" value="FALSE"/>
172 </conditional>
173 <param name="ontocat" value="BP"/>
174 <param name="option" value="elim"/>
175 <param name="threshold" value="1e-3"/>
176 <param name="correction" value="BH"/>
177 <conditional name="condtext">
178 <param name="textoutput" value="TRUE"/>
179 </conditional>
180 <conditional name="condbar">
181 <param name="barplotoutput" value="TRUE"/>
182 </conditional>
183 <conditional name="conddot">
184 <param name="dotoutput" value="TRUE"/>
185 </conditional>
186 <param name="geneuniverse" value="org.Hs.eg.db"/>
187 <output name="outputtext" file="Text_output_for_topGO_analysis.txt"/>
188 <output name="outputbarplot" file="Barplot_output_for_topGO_analysis.png"/>
189 <output name="outputdotplot" file="Dotplot_output_for_topGO_analysis.png"/>
190 </test>
191 </tests>
192 </tool>