comparison pathview.xml @ 0:bd99e8fbde97 draft

"planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/pathview commit 438c20a62c01fa4adea6fbb4cb40ae05b4166043"
author iuc
date Mon, 26 Aug 2019 14:42:52 -0400
parents
children 03c13085aecc
comparison
equal deleted inserted replaced
-1:000000000000 0:bd99e8fbde97
1 <tool id="pathview" name="Pathview" version="@VERSION@+@GALAXY_VERSION@">
2 <description>for pathway based data integration and visualization</description>
3 <macros>
4 <token name="@VERSION@">1.24.0</token>
5 <token name="@GALAXY_VERSION@">galaxy0</token>
6 </macros>
7 <requirements>
8 <requirement type="package" version="@VERSION@">bioconductor-pathview</requirement>
9 <requirement type="package" version="3.8.2">bioconductor-org.ag.eg.db</requirement>
10 <requirement type="package" version="3.8.2">bioconductor-org.at.tair.db</requirement>
11 <requirement type="package" version="3.8.2">bioconductor-org.bt.eg.db</requirement>
12 <requirement type="package" version="3.8.2">bioconductor-org.ce.eg.db</requirement>
13 <requirement type="package" version="3.8.2">bioconductor-org.cf.eg.db</requirement>
14 <requirement type="package" version="3.8.2">bioconductor-org.dm.eg.db</requirement>
15 <requirement type="package" version="3.8.2">bioconductor-org.dr.eg.db</requirement>
16 <requirement type="package" version="3.8.2">bioconductor-org.eck12.eg.db</requirement>
17 <requirement type="package" version="3.8.2">bioconductor-org.ecsakai.eg.db</requirement>
18 <requirement type="package" version="3.8.2">bioconductor-org.gg.eg.db</requirement>
19 <requirement type="package" version="3.8.2">bioconductor-org.hs.eg.db</requirement>
20 <requirement type="package" version="3.8.2">bioconductor-org.mm.eg.db</requirement>
21 <requirement type="package" version="3.8.2">bioconductor-org.mmu.eg.db</requirement>
22 <requirement type="package" version="3.8.2">bioconductor-org.pf.plasmo.db</requirement>
23 <requirement type="package" version="3.8.2">bioconductor-org.pt.eg.db</requirement>
24 <requirement type="package" version="3.8.2">bioconductor-org.rn.eg.db</requirement>
25 <requirement type="package" version="3.8.2">bioconductor-org.sc.sgd.db</requirement>
26 <requirement type="package" version="3.8.2">bioconductor-org.ss.eg.db</requirement>
27 <requirement type="package" version="3.8.2">bioconductor-org.xl.eg.db</requirement>
28 <requirement type="package" version="1.6.2">r-optparse</requirement>
29 </requirements>
30 <version_command><![CDATA[
31 echo $(R --version | grep version | grep -v GNU)", pathview version" $(R --vanilla --slave -e "library(pathview); cat(sessionInfo()\$otherPkgs\$pathview\$Version)" 2> /dev/null | grep -v -i "WARNING: ")", optparse version" $(R --vanilla --slave -e "library(optparse); cat(sessionInfo()\$otherPkgs\$optparse\$Version)" 2> /dev/null | grep -v -i "WARNING: ")", dplyr version" $(R --vanilla --slave -e "library(dplyr); cat(sessionInfo()\$otherPkgs\$dplyr\$Version)" 2> /dev/null | grep -v -i "WARNING: ")", ggplot2 version" $(R --vanilla --slave -e "library(ggplot2); cat(sessionInfo()\$otherPkgs\$ggplot2\$Version)" 2> /dev/null | grep -v -i "WARNING: ")
32 ]]></version_command>
33 <command detect_errors="exit_code"><![CDATA[
34 Rscript '$__tool_directory__/pathview.r'
35
36 #if str($pathway.nb) == 'one'
37 --pathway_id '$pathway.one_id'
38 #else
39 --pathway_id_fp '$pathway.tabular'
40 --pathway_id_header $pathway.header
41 #end if
42
43 --species '$species'
44
45 #if str($gene_data.gd) == 'true'
46 --gene_data '$gene_data.tabular'
47 --gd_header $gene_data.header
48 --gene_idtype '$gene_data.idtype'
49 #end if
50
51 #if str($cpd_data.cpd) == 'true'
52 --cpd_data '$cpd_data.tabular'
53 --cpd_header $cpd_data.header
54 --cpd_idtype '$cpd_data.idtype'
55 #end if
56
57 --multi_state $multi_state
58 --match_data $match_data
59
60 --kegg_native $out.kegg_native.out
61 --same_layer $out.kegg_native.same_layer
62 #if str($out.kegg_native.out) == 'TRUE'
63 --map_null $out.kegg_native.map_null
64 #else
65 --split_group $out.kegg_native.split_group
66 --expand_node $out.kegg_native.expand_node
67 --sign_pos $out.kegg_native.sign_pos
68 #end if
69
70 &&
71 ls .
72 ]]></command>
73 <inputs>
74 <conditional name="pathway">
75 <param name="nb" type="select" label="Number of pathways to plot">
76 <option value="one" selected="true">One</option>
77 <option value="multiple">Multiple</option>
78 </param>
79 <when value="one">
80 <param name="one_id" type="text" label="KEGG pathway" help="KEGG pathway ID with 5 digits and without the 3 letter KEGG species code.">
81 <validator type="regex" message="It should be the 5 digits of the KEGG pathway ID.">^(?:\d\d\d\d\d)?$</validator>
82 </param>
83 </when>
84 <when value="multiple">
85 <param name="tabular" type="data" format="tabular" optional="true" label="KEGG pathways" help="A table with one-column with KEGG pathways to plot"/>
86 <param name="header" type="boolean" checked="true" label="Does the file have header (a first line with column names)?"/>
87 </when>
88 </conditional>
89 <param name="species" type="select" label="Species to use">
90 <option value="aga">Anopheles</option>
91 <option value="ath">Arabidopsis</option>
92 <option value="bta">Bovine</option>
93 <option value="cel">Worm</option>
94 <option value="cfa">Canine</option>
95 <option value="dme">Fly</option>
96 <option value="dre">Zebrafish</option>
97 <option value="eco">E coli strain K12</option>
98 <option value="ecs">E coli strain Sakai</option>
99 <option value="gga">Chicken</option>
100 <option value="hsa" selected="true">Human</option>
101 <option value="mmu">Mouse</option>
102 <option value="mcc">Rhesus</option>
103 <option value="pfa">Malaria</option>
104 <option value="ptr">Chimp</option>
105 <option value="rno">Rat</option>
106 <option value="sce">Yeast</option>
107 <option value="ssc">Pig</option>
108 <option value="xla">Xenopus</option>
109 </param>
110 <conditional name="gene_data">
111 <param name="gd" type="select" label="Provide a gene data file?" help="Gene data is a broad concept including genes, transcripts, protein, enzymes and their expression, modifications and any measurable attributes.">
112 <option value="true">Yes</option>
113 <option value="false">No</option>
114 </param>
115 <when value="true">
116 <param name="tabular" type="data" format="tabular" label="Gene data" help="It should be a table with first column being the gene ids and other being information (p-value, fold change, levels, etc) from one or several samples."/>
117 <param name="header" type="boolean" checked="true" label="Does the file have header (a first line with sample names)?"/>
118 <param name="idtype" type="select" label="Format for gene data">
119 <option value="entrez" selected="true">Entrez Gene ID</option>
120 <option value="symbol">Gene Symbol</option>
121 <option value="genename">Gene Name</option>
122 <option value="ensembl">Ensembl Gene ID</option>
123 <option value="ensemblprot">Ensembl Protein ID</option>
124 <option value="ensembltrans">Ensembl Trans ID</option>
125 <option value="unigene">UniGene</option>
126 <option value="uniprot">UniProt</option>
127 <option value="refseq">RefSeq</option>
128 <option value="enzyme">Enzyme</option>
129 <option value="tair">TAIR</option>
130 <option value="prosite">Prosite</option>
131 <option value="orf">ORF</option>
132 </param>
133 </when>
134 <when value="false"/>
135 </conditional>
136 <conditional name="cpd_data">
137 <param name="cpd" type="select" label="Provide a compound data file?" help="compound data is a broad concept including metabolites, drugs, their measurements and attributes.">
138 <option value="true">Yes</option>
139 <option value="false" selected="true">No</option>
140 </param>
141 <when value="true">
142 <param name="tabular" type="data" format="tabular" label="Compound data" help="It should be a table with first column being the gene ids and other being information (p-value, fold change, levels, etc) from one or several samples."/>
143 <param name="header" type="boolean" checked="true" label="Does the file have header (a first line with sample names)?"/>
144 <param name="idtype" type="select" label="Format for compound data">
145 <option value="kegg" selected="true">KEGG (include compound, glycan and drug accessions)</option>
146 </param>
147 </when>
148 <when value="false"/>
149 </conditional>
150 <param name="multi_state" type="boolean" checked="true" label="Should multiple states of gene or compond data be intergrated and plotted in the same graph?" help="Gene or compound nodes will be sliced into multiple pieces corresponding to the number of states in the data" />
151 <param name="match_data" type="boolean" checked="true" label="Are the gene and compound data paired?" help="When let sample sizes of gene and compound be m and n, when m>n, extra columns of NA's (mapped to no color) will be added to make the sample size the same" />
152 <section name="out" title="Output Options" expanded="true">
153 <conditional name="kegg_native">
154 <param name="out" type="select" label="Output for pathway">
155 <option value="TRUE" selected="true">KEGG native</option>
156 <option value="FALSE">Graphviz</option>
157 </param>
158 <when value="TRUE">
159 <param name="same_layer" type="boolean" checked="true" label="Plot on same layer?" help="If yes, node colors will be plotted in the same layer as the pathway graph." />
160 <param name="map_null" type="boolean" checked="true" label="Map the NULL gene or compound data to pathway?" help="When NULL data are mapped, the gene or compound nodes in the pathway will berendered as actually mapped nodes, except with NA-valued color. When NULL data are not mapped, the nodes are rendered as unmapped nodes." />
161 </when>
162 <when value="FALSE">
163 <param name="same_layer" type="boolean" checked="true" label="Plot on same layer?" help="If yes, edge/node type legend will be plotted in the same page." />
164 <param name="split_group" type="boolean" checked="false" label="Split node groups into individual nodes?" help="Each split member nodes inherits all edges from the node group. This option also effects most metabolic pathways even without group nodes defined orginally. For these pathways, genes involved in the same reaction are grouped automatically when converting reactions to edges unless split.group is true." />
165 <param name="expand_node" type="boolean" checked="false" label="Expand multiple-gene nodes into single-gene nodes?" help="Each expanded single-gene nodes inherits all edges from the original multiple-gene node. This option is not effective for most metabolic pathways where it conflits with converting reactions to edges." />
166 <param name="sign_pos" type="select" label="Position of pathview signature">
167 <option value="bottomright" selected="true">Bottom right</option>
168 <option value="bottomleft">Bottom left</option>
169 <option value="topleft">Top left</option>
170 <option value="topright">Top right</option>
171 </param>
172 </when>
173 </conditional>
174 </section>
175 </inputs>
176 <outputs>
177 <data name="one_kegg_native" format="png" from_work_dir="*.pathview.png" label="${tool.name} on ${on_string}: KEGG Pathway (${species}${pathway.one_id})">
178 <filter>pathway['nb'] == 'one'</filter>
179 <filter>out['kegg_native']['out'] == 'TRUE'</filter>
180 </data>
181 <data name="one_graphviz" format="pdf" from_work_dir="*.pathview.pdf" label="${tool.name} on ${on_string}: KEGG Pathway (${species}${pathway.one_id}), Graphviz format">
182 <filter>pathway['nb'] == 'one'</filter>
183 <filter>out['kegg_native']['out'] == 'FALSE'</filter>
184 </data>
185 <collection name="multiple_kegg_native" type="list" label="${tool.name} on ${on_string}: KEGG Pathways">
186 <filter>pathway['nb'] == 'multiple'</filter>
187 <filter>out['kegg_native']['out'] == 'TRUE'</filter>
188 <discover_datasets pattern="(?P&lt;designation&gt;.+)\.pathview\.png" directory="." ext="png"/>
189 </collection>
190 <collection name="multiple_graphviz" type="list" label="${tool.name} on ${on_string}: KEGG Pathways, Graphviz format">
191 <filter>pathway['nb'] == 'multiple'</filter>
192 <filter>out['kegg_native']['out'] == 'FALSE'</filter>
193 <discover_datasets pattern="(?P&lt;designation&gt;.+)\.pathview\.pdf" directory="." ext="pdf"/>
194 </collection>
195 </outputs>
196 <tests>
197 <test>
198 <conditional name="pathway">
199 <param name="nb" value="one" />
200 <param name="one_id" value="00010"/>
201 </conditional>
202 <param name="species" value="dme"/>
203 <conditional name="gene_data">
204 <param name="gd" value="true"/>
205 <param name="tabular" value="gene_data.tabular"/>
206 <param name="header" value="false"/>
207 <param name="idtype" value="ensembl"/>
208 </conditional>
209 <conditional name="cpd_data">
210 <param name="cpd" value="false"/>
211 </conditional>
212 <param name="multi_state" value="true" />
213 <param name="match_data" value="true"/>
214 <section name="out">
215 <conditional name="kegg_native">
216 <param name="out" value="TRUE" />
217 <param name="same_layer" value="true"/>
218 <param name="map_null" value="true"/>
219 </conditional>
220 </section>
221 <output name="one_kegg_native" ftype="png" file="dme00010.png" compare="sim_size" delta="30000"/>
222 </test>
223 <test>
224 <conditional name="pathway">
225 <param name="nb" value="one" />
226 <param name="one_id" value="00010"/>
227 </conditional>
228 <param name="species" value="dme"/>
229 <conditional name="gene_data">
230 <param name="gd" value="true"/>
231 <param name="tabular" value="gene_data.tabular"/>
232 <param name="header" value="false"/>
233 <param name="idtype" value="ensembl"/>
234 </conditional>
235 <conditional name="cpd_data">
236 <param name="cpd" value="false"/>
237 </conditional>
238 <param name="multi_state" value="true" />
239 <param name="match_data" value="true"/>
240 <section name="out">
241 <conditional name="kegg_native">
242 <param name="out" value="FALSE" />
243 <param name="same_layer" value="true"/>
244 <param name="split_group" value="false" />
245 <param name="expand_node" value="false"/>
246 <param name="sign_pos" value="bottomright"/>
247 </conditional>
248 </section>
249 <output name="one_graphviz" ftype="pdf" file="dme00010.pdf" compare="sim_size"/>
250 </test>
251 <test>
252 <conditional name="pathway">
253 <param name="nb" value="multiple" />
254 <param name="tabular" value="pathways.tabular"/>
255 <param name="header" value="false"/>
256 </conditional>
257 <param name="species" value="dme"/>
258 <conditional name="gene_data">
259 <param name="gd" value="true"/>
260 <param name="tabular" value="gene_data.tabular"/>
261 <param name="header" value="false"/>
262 <param name="idtype" value="ensembl"/>
263 </conditional>
264 <conditional name="cpd_data">
265 <param name="cpd" value="false"/>
266 </conditional>
267 <param name="multi_state" value="true" />
268 <param name="match_data" value="true"/>
269 <section name="out">
270 <conditional name="kegg_native">
271 <param name="out" value="TRUE" />
272 <param name="same_layer" value="true"/>
273 <param name="map_null" value="true"/>
274 </conditional>
275 </section>
276 <output_collection name="multiple_kegg_native" count="2">
277 <element name="dme00010" ftype="png" file="dme00010.png" compare="sim_size" delta="30000"/>
278 <element name="dme00480" ftype="png" file="dme00480.png" compare="sim_size" delta="40000"/>
279 </output_collection>
280 </test>
281 <test>
282 <conditional name="pathway">
283 <param name="nb" value="multiple" />
284 <param name="tabular" value="pathways.tabular"/>
285 <param name="header" value="false"/>
286 </conditional>
287 <param name="species" value="dme"/>
288 <conditional name="gene_data">
289 <param name="gd" value="true"/>
290 <param name="tabular" value="gene_data.tabular"/>
291 <param name="header" value="false"/>
292 <param name="idtype" value="ensembl"/>
293 </conditional>
294 <conditional name="cpd_data">
295 <param name="cpd" value="false"/>
296 <param name="tabular" value="cpd_data.tabular"/>
297 <param name="header" value="false"/>
298 <param name="idtype" value="kegg"/>
299 </conditional>
300 <param name="multi_state" value="true" />
301 <param name="match_data" value="true"/>
302 <section name="out">
303 <conditional name="kegg_native">
304 <param name="out" value="FALSE" />
305 <param name="same_layer" value="false"/>
306 <param name="split_group" value="false" />
307 <param name="expand_node" value="false"/>
308 <param name="sign_pos" value="bottomright"/>
309 </conditional>
310 </section>
311 <output_collection name="multiple_graphviz" count="2">
312 <element name="dme00010" ftype="pdf" file="dme00010_cpd.pdf" compare="sim_size"/>
313 <element name="dme00480" ftype="pdf" file="dme00480_cpd.pdf" compare="sim_size"/>
314 </output_collection>
315 </test>
316 </tests>
317 <help><![CDATA[
318
319 .. class:: infomark
320
321 **What it does**
322
323 Pathview is a stand-alone software package for pathway based data integration and visualization.
324
325 This package can be divided into four functional modules: the Downloader, Parser, Mapper andViewer.
326 Mostly importantly, pathview maps and renders user data on relevant pathway graphs.
327
328 Notice that KEGG requires subscription for FTP access since May 2011.
329 However,Pathview downloads individual pathway graphs and data files through API or HTTP access, which is freely available (for academic and non-commerical uses).
330 Pathview uses KEGGgraph (Zhang and Wiemann, 2009) when parsing KEGG xml data files.
331
332
333 Options map closely to the excellent pathview manual_.
334
335 -----
336
337 **Inputs**
338
339 Pathview provides strong support for data integration. It works with:
340
341 - essentially all types of biological data mappable to pathways (gene expression, protein expression, genetic association, metabolite, genomic data, literature, etc)
342 - over 10 types of gene or protein IDs, and 20 types of compound or metabolite IDs
343 - pathways for about 4800 species as well as KEGG orthology
344 - various data attributes and formats, i.e. continuous/discrete data, matrices/vectors, single/multiple samples etc.
345
346 Pathview can be directly used for metagenomic, microbiome or unknown species data when the data are mapped to KEGG ortholog pathways.
347
348 *Pathway ids*
349
350 Either just the name or a table with one column with the different pathway ids to represent.
351
352
353 *Gene data*
354
355 The first input of Pathview is a gene data table. Here gene data is a broad concept including genes, transcripts, protein, enzymes and their expression, modifications and any measurable attributes.
356
357 It should be a table with first column being the gene ids and other being information (p-value, fold change, levels, etc) from one or several samples.
358 The first line can include the sample names.
359
360 Here gene id is a generic concepts, including multiple types of gene, transcript and protein uniquely mappable to KEGG gene IDs. KEGG ortholog IDs are also treated as gene IDs as to handle metagenomic data.
361
362 Example:
363
364 =========== =================
365 FBgn0039155 -4.14844993705661
366 FBgn0003360 -2.99977727873544
367 FBgn0026562 -2.38016404989418
368 FBgn0025111 2.69993883050214
369 FBgn0029167 -2.10506155636758
370 =========== =================
371
372 *Compound data*
373
374 We also frequently want to look at metabolic pathways too. Besides gene nodes, these pathways also have compound nodes.
375 Therefore, we may integrate or visualize both gene data and compound data with metabolic pathways.
376
377 Here compound data is a broad concept including metabolites, drugs, their measurements and attributes.
378
379 The format is similar to the gene data table, except named with IDs mappable to KEGG compound IDs.
380 Over 20 types of IDs included in CHEMBL database can be used here.
381
382 -----
383
384 **Outputs**
385
386 Pathview generates both native KEGG view and Graphviz view for pathways.
387
388 KEGG view keeps all the meta-data on pathways, spacial and temporal information, tissue/cell types, inputs, outputs and connections. This is important for human reading and interpretation of pathway biology.
389
390 .. image:: $PATH_TO_IMAGES/dme00010_native.png
391 :width: 60 %
392
393 Graphviz view provides better control of node and edge attributes, better view of pathway topology, better understanding of the pathway analysis statistics.
394
395 .. image:: $PATH_TO_IMAGES/dme00010_graphviz.png
396 :width: 60 %
397
398 .. _manual: https://bioconductor.org/packages/release/bioc/vignettes/pathview/inst/doc/pathview.pdf
399 .. _KEGG: http://www.genome.jp/kegg
400
401 ]]></help>
402 <citations>
403 <citation type="doi">10.1093/bioinformatics/btt285</citation>
404 </citations>
405 </tool>