comparison humann2.xml @ 0:3d6f37e7e3a8 draft

planemo upload for repository https://github.com/ASaiM/galaxytools/tree/master/tools/humann2/ commit 7aadbbdef6da644837f62ea428cb859eeff34f04-dirty
author bebatut
date Thu, 26 May 2016 10:20:59 -0400
parents
children bcd414bb721b
comparison
equal deleted inserted replaced
-1:000000000000 0:3d6f37e7e3a8
1 <tool id="humann2" name="HUMAnN2" version="0.6.1">
2 <description>to profile presence/absence and abundance of microbial pathways and gene families</description>
3
4 <macros>
5 <import>humann2_macros.xml</import>
6 </macros>
7
8 <expand macro="requirements"/>
9 <expand macro="stdio"/>
10
11 <version_command>
12 <![CDATA[
13 humann2 --version
14 ]]>
15 </version_command>
16
17 <command><![CDATA[
18 `mkdir nucleotide_db`
19
20 &&
21
22 #if $nucleotide_db.nucleotide_db_selector == "history"
23 #for $file in $nucleotide_db.history_nucleotide_db:
24 `cp $file nucleotide_db/$file.name`
25 #end for
26
27 &&
28 #end if
29
30 `mkdir protein_db`
31
32 &&
33
34 #if $protein_db.protein_db_selector == "history"
35 diamond makedb
36 --in $protein_db.history_protein_db
37 --db protein_db/protein_db
38 #end if
39
40 &&
41
42 humann2
43 -i "$input_file"
44
45 #set $metaphlan_option = "-t rel_ab"
46 #if $taxonomic_profile.taxonomic_profile_test == "true":
47 --taxonomic-profile $taxonomic_profile.taxonomic_profile_file
48 #else
49
50 #if $taxonomic_profile.mpa_pkl.mpa_pkl_selector == "cached"
51 #set $mpa_pkl_table = dict([(_[0], _[2]) for _ in $taxonomic_profile.mpa_pkl.cached_mpa_pkl.input.options.tool_data_table.data])
52 #set $mpa_pkl_db = $taxonomic_profile.mpa_pkl.cached_mpa_pkl.value
53 #set $metaphlan_option += " --mpa_pkl " + $mpa_pkl_table[$mpa_pkl_db]
54 #else
55 #set $metaphlan_option += " --mpa_pkl " + $taxonomic_profile.mpa_pkl.history_mpa_pkl
56 #end if
57
58 #if $taxonomic_profile.bowtie2db.bowtie2db_selector == "cached"
59 #set $bowtie2_table = dict([(_[0], _[2]) for _ in $taxonomic_profile.bowtie2db.cached_bowtie2db.input.options.tool_data_table.data])
60 #set $bowtie2db_choice = $taxonomic_profile.bowtie2db.cached_bowtie2db.value
61 #set $metaphlan_option += " --bowtie2db " + $bowtie2_table[$bowtie2db_choice]
62 #else
63 #set $metaphlan_option += " --bowtie2db " + $taxonomic_profile.bowtie2db.history_bowtie2db
64 #end if
65
66 #end if
67
68 --metaphlan-options="$metaphlan_option"
69
70 --evalue $e_value
71 --identity-threshold $identity
72 --prescreen-threshold $prescreen
73
74 --pathways $pathways
75
76 #if $nucleotide_db.nucleotide_db_selector == "cached"
77 --nucleotide-database \${HUMANN2_DIR}/databases/chocophlan
78 #else
79 --nucleotide-database nucleotide_db
80 #end if
81
82 #if $protein_db.protein_db_selector == "cached"
83 --protein-database \${HUMANN2_DIR}/databases/uniref
84 #else
85 --protein-database protein_db
86 #end if
87
88 --threads \${GALAXY_SLOTS:-4}
89
90 --xipe $xipe
91 --minpath $minpath
92 --pick-frames $pick_frames
93
94 -o "output"
95 --output-format $output_format
96 --output-max-decimals $output_max_dec
97 --output-basename "humann2"
98 $remove_statified_output
99 ]]></command>
100
101 <inputs>
102 <param name="input_file" type="data" format="fastq,fasta,sam,bam,biom"
103 label="Input sequence file" help=""/>
104
105 <conditional name="taxonomic_profile">
106 <param name='taxonomic_profile_test' type='select' label="Use a custom taxonomic profile?" help="The file must have been created by MetaPhlan2">
107 <option value="true">Yes</option>
108 <option value="false" selected="true">No</option>
109 </param>
110 <when value="true">
111 <param name="taxonomic_profile_file" type="data" format="tabular,txt" label="Taxonomic profile
112 file" help=""/>
113 </when>
114 <when value="false">
115 <conditional name="mpa_pkl">
116 <param name="mpa_pkl_selector" type="select" label="Metadata for MetaPhlAn2" help="">
117 <option value="cached" selected="true">Locally cached</option>
118 <option value="history">From history</option>
119 </param>
120
121 <when value="cached">
122 <param name="cached_mpa_pkl" label="Cached metadata" type="select">
123 <options from_data_table="metaphlan2_metadata" />
124 </param>
125 </when>
126 <when value="history">
127 <param name="history_mpa_pkl" type="data" format="fasta" label="Metadata from history"/>
128 </when>
129 </conditional>
130
131 <conditional name="bowtie2db">
132 <param name="bowtie2db_selector" type="select" label="BowTie2 database for MetaPhlAn2" help="">
133 <option value="cached" selected="true">Locally cached</option>
134 <option value="history">From history</option>
135 </param>
136
137 <when value="cached">
138 <param name="cached_bowtie2db" label="Cached BowTie2 database" type="select" >
139 <options from_data_table="metaphlan2_bowtie_db" />
140 </param>
141 </when>
142 <when value="history">
143 <param name="history_bowtie2db" type="data" format="fasta" label="BowTie2 database from history"/>
144 </when>
145 </conditional>
146 </when>
147 </conditional>
148
149 <conditional name="nucleotide_db">
150 <param name="nucleotide_db_selector" type="select" label="Nucleotide database" help="">
151 <option value="cached" selected="true">Locally cached</option>
152 <option value="history">From history (as collection)</option>
153 </param>
154
155 <when value="cached"/>
156 <when value="history">
157 <param format="fasta" name="history_nucleotide_db" type="data_collection" collection_type="list" label="Nucleotide database from history" help="Each file must be named: ^[g__].[s__]"/>
158 </when>
159 </conditional>
160
161 <conditional name="protein_db">
162 <param name="protein_db_selector" type="select" label="Protein database" help="">
163 <option value="cached" selected="true">Locally cached</option>
164 <option value="history">From history</option>
165 </param>
166
167 <when value="cached"/>
168 <when value="history">
169 <param name="history_protein_db" type="data" format="fasta" label="Protein database from history" help=""/>
170 </when>
171 </conditional>
172
173 <param name="e_value" type="float" min="0" max="10" value="1" label="E-value threshold to use with the translated search" help="(--evalue)"/>
174 <param name="identity" type="integer" min="0" max="100" value="40" label="Identity threshold for alignments" help="(--identity-threshold)"/>
175 <param name="prescreen" type="float" min="0" max="1" value="0.01" label="Minimum percentage of reads matching a species" help="(--prescreen-threshold)"/>
176
177 <param name='pathways' type="select" label="Database to use for pathway computations" help="(--pathways)">
178 <option value="metacyc" selected="true">MetaCyc</option>
179 <option value="unipathway">UniPathway</option>
180 </param>
181
182 <param name='xipe' type='boolean' checked="false" truevalue='on' falsevalue='off' label="Use xipe computation?" help="(--xipe)"/>
183 <param name='minpath' type='boolean' checked="true" truevalue='on' falsevalue='off' label="Use minpath computation?" help="(--minpath)"/>
184 <param name='pick_frames' type='boolean' checked="true" truevalue='on' falsevalue='off' label="Use pick frames computation?" help="(--pick-frames)"/>
185
186 <param name='output_format' type="select" label="Format of the output files" help="(--output-format)">
187 <option value="tsv" selected="true">TSV</option>
188 <option value="biom">BIOM</option>
189 </param>
190
191 <param name="output_max_dec" type="integer" min="0" max="100" value="10" label="Number of decimals to output" help="(--output-max-decimals)"/>
192 <param name='remove_statified_output' type='boolean' checked="false" truevalue='--remove-stratified-output' falsevalue='' label="Remove stratification from output?" help="(--remove-stratified-output)"/>
193 </inputs>
194
195 <outputs>
196 <data format="tsv" name="gene_families_tsv" from_work_dir="output/humann2_genefamilies.tsv" label="${tool.name} on ${on_string}: Gene families and their abundance" >
197 <filter>output_format == "tsv"</filter>
198 </data>
199 <data format="biom" name="gene_families_biom" from_work_dir="output/humann2_genefamilies.biom" label="${tool.name} on ${on_string}: Gene families and their abundance" >
200 <filter>output_format == "biom"</filter>
201 </data>
202
203 <data format="tsv" name="pathcoverage_tsv" from_work_dir="output/humann2_pathcoverage.tsv" label="${tool.name} on ${on_string}: Pathways and their coverage" >
204 <filter>output_format == "tsv"</filter>
205 </data>
206 <data format="biom" name="pathcoverage_biom" from_work_dir="output/humann2_pathcoverage.biom" label="${tool.name} on ${on_string}: Pathways and their coverage" >
207 <filter>output_format == "biom"</filter>
208 </data>
209
210 <data format="tsv" name="pathabundance_tsv" from_work_dir="output/humann2_pathabundance.tsv" label="${tool.name} on ${on_string}: Pathways and their abundance" >
211 <filter>output_format == "tsv"</filter>
212 </data>
213 <data format="biom" name="pathabundance_biom" from_work_dir="output/humann2_pathabundance.biom" label="${tool.name} on ${on_string}: Pathways and their abundance" >
214 <filter>output_format == "biom"</filter>
215 </data>
216 </outputs>
217
218 <tests>
219 <test>
220 <param name="input_file" value="input_sequences.fasta"/>
221 <param name='taxonomic_profile_test' value="true"/>
222 <param name="taxonomic_profile_file" value="taxonomic_profile.tabular"/>
223 <param name="nucleotide_db_selector" value="history"/>
224 <param name="history_nucleotide_db">
225 <collection type="list">
226 <element name="g__Bacteroides.s__Bacteroides_stercoris.centroids.v0.1.1" ftype="fasta" value="g__Bacteroides.s__Bacteroides_stercoris.centroids.v0.1.1.ffn.gz" />
227 <element name="g__Bacteroides.s__Bacteroides_thetaiotaomicron.centroids.v0.1.1" ftype="fasta" value="g__Bacteroides.s__Bacteroides_thetaiotaomicron.centroids.v0.1.1.ffn.gz" />
228 </collection>
229 </param>
230 <param name="protein_db_selector" value="history"/>
231 <param name="history_protein_db" value="reduced_uniref50.fasta"/>
232 <param name="e_value" value="1"/>
233 <param name="identity" value="40"/>
234 <param name="prescreen" value="0.01"/>
235 <param name='pathways' value="metacyc"/>
236 <param name='xipe' value="false"/>
237 <param name='minpath' value="true"/>
238 <param name='pick_frames' value="true"/>
239 <param name='output_format' value="tsv"/>
240 <param name="output_max_dec" value="10"/>
241 <output name="gene_families_tsv" file="expected_gene_family_abundance.tsv"/>
242 <output name="pathcoverage_tsv" file="expected_pathway_coverage.tsv"/>
243 <output name="pathabundance_tsv" file="expected_pathway_abundance.tsv"/>
244 </test>
245 </tests>
246
247 <help><![CDATA[
248 **What it does**
249
250 HUMAnN is a pipeline for efficiently and accuretly profiling the presence/absence and abundance of microbial pathways in a community from metagenomic or metatranscriptomic sequencing data. `Read more about the tool <http://huttenhower.sph.harvard.edu/humann2/manual>`_.
251
252 This tool corresponds to the main tool in HUMAnN2 pipeline.
253
254 **Inputs**
255
256 The input is a single file corresponding either to filtered shotgun sequencing metagenome file (fastq, fastq.gz, fasta, or fasta.gz format), alignment file (sam, bam or blastm8 format) or gene table file (tsv or biom format).
257
258 A file with a taxonomic profile (obtained with MetaPhlan2) can also be provided to avoid first step of taxonomic profiling needed to select pangenomes in protein database.
259
260 HUMAnN2 uses multiple databases. Locally cached nucleotide or protein databases have to be downloaded database before using them (using the dedicated tool). Custom databases can also be used after upload. Nucleotide database have to be provided as a dataset.
261
262 **Outputs**
263
264 HUMAnN creates three output files:
265
266 - A file with gene families and their abundance
267 - A file with pathways and their abundance
268 - A file with pathways and their coverage
269
270 ]]></help>
271
272 <expand macro="citations"/>
273 </tool>