comparison humann2.xml @ 1:bcd414bb721b draft default tip

planemo upload for repository https://github.com/ASaiM/galaxytools/tree/master/tools/humann2/ commit 79571d981d7d56657699be8aa24a40a36a8d0ab5-dirty
author bebatut
date Thu, 02 Jun 2016 04:23:09 -0400
parents 3d6f37e7e3a8
children
comparison
equal deleted inserted replaced
0:3d6f37e7e3a8 1:bcd414bb721b
23 #for $file in $nucleotide_db.history_nucleotide_db: 23 #for $file in $nucleotide_db.history_nucleotide_db:
24 `cp $file nucleotide_db/$file.name` 24 `cp $file nucleotide_db/$file.name`
25 #end for 25 #end for
26 26
27 && 27 &&
28 #end if 28 #end if
29 29
30 `mkdir protein_db` 30 `mkdir protein_db`
31 31
32 && 32 &&
33 33
34 #if $protein_db.protein_db_selector == "history" 34 #if $protein_db.protein_db_selector == "history"
35 diamond makedb 35 diamond makedb
36 --in $protein_db.history_protein_db 36 --in $protein_db.history_protein_db
37 --db protein_db/protein_db 37 --db protein_db/protein_db
38 &&
38 #end if 39 #end if
39 40
40 && 41 #if $taxonomic_profile.taxonomic_profile_test == "false"
41 42 #if $taxonomic_profile.metaphlan2_db_choice.metaphlan2_db_selector == "history"
42 humann2 43 `mkdir ref_db`
44 &&
45 bowtie2-build $taxonomic_profile.metaphlan2_db_choice.metaphlan2_db_sequences ref_db/ref_db
46 &&
47 python $__tool_directory__/transform_json_to_pkl.py
48 --json_input $metaphlan2_db_metadata
49 --pkl_output ref_db/metadata.pkl
50 &&
51 #end if
52 #end if
53
54 humann2
43 -i "$input_file" 55 -i "$input_file"
44 56
45 #set $metaphlan_option = "-t rel_ab" 57 #set $metaphlan_option = "-t rel_ab"
46 #if $taxonomic_profile.taxonomic_profile_test == "true": 58 #if $taxonomic_profile.taxonomic_profile_test == "true":
47 --taxonomic-profile $taxonomic_profile.taxonomic_profile_file 59 --taxonomic-profile $taxonomic_profile.taxonomic_profile_file
48 #else 60 #else
49 61 #if $taxonomic_profile.metaphlan2_db_choice.metaphlan2_db_selector == "cached"
50 #if $taxonomic_profile.mpa_pkl.mpa_pkl_selector == "cached" 62 #set $table = dict([(_[0], _[2]) for _ in $taxonomic_profile.metaphlan2_db_choice.cached_metaphlan2_db.input.options.tool_data_table.data])
51 #set $mpa_pkl_table = dict([(_[0], _[2]) for _ in $taxonomic_profile.mpa_pkl.cached_mpa_pkl.input.options.tool_data_table.data]) 63 #set $db_choice = $taxonomic_profile.metaphlan2_db_choice.cached_metaphlan2_db.value
52 #set $mpa_pkl_db = $taxonomic_profile.mpa_pkl.cached_mpa_pkl.value 64 #set $metaphlan_option += " --bowtie2db " + $table[$db_choice]
53 #set $metaphlan_option += " --mpa_pkl " + $mpa_pkl_table[$mpa_pkl_db] 65 #set $metaphlan_option += " --mpa_pkl " + $table[$db_choice] + ".pkl"
54 #else 66 #else
55 #set $metaphlan_option += " --mpa_pkl " + $taxonomic_profile.mpa_pkl.history_mpa_pkl 67 #set $metaphlan_option += " --bowtie2db " + ref_db/ref_db
68 #set $metaphlan_option += " --mpa_pkl " + ref_db/metadata.pkl
56 #end if 69 #end if
57
58 #if $taxonomic_profile.bowtie2db.bowtie2db_selector == "cached"
59 #set $bowtie2_table = dict([(_[0], _[2]) for _ in $taxonomic_profile.bowtie2db.cached_bowtie2db.input.options.tool_data_table.data])
60 #set $bowtie2db_choice = $taxonomic_profile.bowtie2db.cached_bowtie2db.value
61 #set $metaphlan_option += " --bowtie2db " + $bowtie2_table[$bowtie2db_choice]
62 #else
63 #set $metaphlan_option += " --bowtie2db " + $taxonomic_profile.bowtie2db.history_bowtie2db
64 #end if
65
66 #end if 70 #end if
67
68 --metaphlan-options="$metaphlan_option" 71 --metaphlan-options="$metaphlan_option"
69 72
70 --evalue $e_value 73 --evalue $e_value
71 --identity-threshold $identity 74 --identity-threshold $identity
72 --prescreen-threshold $prescreen 75 --prescreen-threshold $prescreen
93 96
94 -o "output" 97 -o "output"
95 --output-format $output_format 98 --output-format $output_format
96 --output-max-decimals $output_max_dec 99 --output-max-decimals $output_max_dec
97 --output-basename "humann2" 100 --output-basename "humann2"
98 $remove_statified_output 101 $remove_statified_output
99 ]]></command> 102 ]]></command>
100 103
101 <inputs> 104 <inputs>
102 <param name="input_file" type="data" format="fastq,fasta,sam,bam,biom" 105 <param name="input_file" type="data" format="fastq,fasta,sam,bam,biom"
103 label="Input sequence file" help=""/> 106 label="Input sequence file" help=""/>
104 107
105 <conditional name="taxonomic_profile"> 108 <conditional name="taxonomic_profile">
106 <param name='taxonomic_profile_test' type='select' label="Use a custom taxonomic profile?" help="The file must have been created by MetaPhlan2"> 109 <param name='taxonomic_profile_test' type='select' label="Use a custom taxonomic profile?" help="The file must have been created by MetaPhlan2">
107 <option value="true">Yes</option> 110 <option value="true">Yes</option>
108 <option value="false" selected="true">No</option> 111 <option value="false" selected="true">No</option>
109 </param> 112 </param>
110 <when value="true"> 113 <when value="true">
111 <param name="taxonomic_profile_file" type="data" format="tabular,txt" label="Taxonomic profile 114 <param name="taxonomic_profile_file" type="data" format="tabular,txt" label="Taxonomic profile file" help=""/>
112 file" help=""/>
113 </when> 115 </when>
114 <when value="false"> 116 <when value="false">
115 <conditional name="mpa_pkl"> 117 <conditional name="metaphlan2_db_choice">
116 <param name="mpa_pkl_selector" type="select" label="Metadata for MetaPhlAn2" help=""> 118 <param name="metaphlan2_db_selector" type="select" label="Database with clade-specific marker genes" help="">
117 <option value="cached" selected="true">Locally cached</option> 119 <option value="cached" selected="true">Locally cached</option>
118 <option value="history">From history</option> 120 <option value="history">From history</option>
119 </param> 121 </param>
120 122
121 <when value="cached"> 123 <when value="cached">
122 <param name="cached_mpa_pkl" label="Cached metadata" type="select"> 124 <param name="cached_metaphlan2_db" label="Cached database with clade-specific marker genes" type="select" >
123 <options from_data_table="metaphlan2_metadata" /> 125 <options from_data_table="metaphlan2_db" />
124 </param> 126 </param>
125 </when> 127 </when>
126 <when value="history"> 128 <when value="history">
127 <param name="history_mpa_pkl" type="data" format="fasta" label="Metadata from history"/> 129 <param name="metaphlan2_db_sequences" type="data" format="fasta" label="Database with clade-specific marker genes from history" help="(--bowtie2db)"/>
130 <param name="metaphlan2_db_metadata" type="data" format="json" label="Metadata associate to the database with clade-specific marker genes from history" help="(--mpa_pkl)"/>
128 </when> 131 </when>
129 </conditional> 132 </conditional>
130
131 <conditional name="bowtie2db">
132 <param name="bowtie2db_selector" type="select" label="BowTie2 database for MetaPhlAn2" help="">
133 <option value="cached" selected="true">Locally cached</option>
134 <option value="history">From history</option>
135 </param>
136
137 <when value="cached">
138 <param name="cached_bowtie2db" label="Cached BowTie2 database" type="select" >
139 <options from_data_table="metaphlan2_bowtie_db" />
140 </param>
141 </when>
142 <when value="history">
143 <param name="history_bowtie2db" type="data" format="fasta" label="BowTie2 database from history"/>
144 </when>
145 </conditional>
146 </when> 133 </when>
147 </conditional> 134 </conditional>
148 135
149 <conditional name="nucleotide_db"> 136 <conditional name="nucleotide_db">
150 <param name="nucleotide_db_selector" type="select" label="Nucleotide database" help=""> 137 <param name="nucleotide_db_selector" type="select" label="Nucleotide database" help="For locally cached databases, you need first to execute the tool to download HUMAnN2 databases">
151 <option value="cached" selected="true">Locally cached</option> 138 <option value="cached" selected="true">Locally cached</option>
152 <option value="history">From history (as collection)</option> 139 <option value="history">From history (as collection)</option>
153 </param> 140 </param>
154 141
155 <when value="cached"/> 142 <when value="cached"/>
157 <param format="fasta" name="history_nucleotide_db" type="data_collection" collection_type="list" label="Nucleotide database from history" help="Each file must be named: ^[g__].[s__]"/> 144 <param format="fasta" name="history_nucleotide_db" type="data_collection" collection_type="list" label="Nucleotide database from history" help="Each file must be named: ^[g__].[s__]"/>
158 </when> 145 </when>
159 </conditional> 146 </conditional>
160 147
161 <conditional name="protein_db"> 148 <conditional name="protein_db">
162 <param name="protein_db_selector" type="select" label="Protein database" help=""> 149 <param name="protein_db_selector" type="select" label="Protein database" help="For locally cached databases, you need first to execute the tool to download HUMAnN2 databases">
163 <option value="cached" selected="true">Locally cached</option> 150 <option value="cached" selected="true">Locally cached</option>
164 <option value="history">From history</option> 151 <option value="history">From history</option>
165 </param> 152 </param>
166 153
167 <when value="cached"/> 154 <when value="cached"/>
253 240
254 **Inputs** 241 **Inputs**
255 242
256 The input is a single file corresponding either to filtered shotgun sequencing metagenome file (fastq, fastq.gz, fasta, or fasta.gz format), alignment file (sam, bam or blastm8 format) or gene table file (tsv or biom format). 243 The input is a single file corresponding either to filtered shotgun sequencing metagenome file (fastq, fastq.gz, fasta, or fasta.gz format), alignment file (sam, bam or blastm8 format) or gene table file (tsv or biom format).
257 244
258 A file with a taxonomic profile (obtained with MetaPhlan2) can also be provided to avoid first step of taxonomic profiling needed to select pangenomes in protein database. 245 A file with a taxonomic profile (obtained with MetaPhlan2) can also be provided to avoid first step of taxonomic profiling needed to select pangenomes in protein database. Otherwise, default MetaPhlAn2 or custom databases can be used for taxonomic profiling. For custom databases, a fasta file with marker gene sequences is required and also a json file containing metadata:
259 246
260 HUMAnN2 uses multiple databases. Locally cached nucleotide or protein databases have to be downloaded database before using them (using the dedicated tool). Custom databases can also be used after upload. Nucleotide database have to be provided as a dataset. 247 ::
248
249 {
250 "taxonomy": {
251 "taxonomy of genome1": genome1_length,
252 "taxonomy of genome2": genome2_length,
253 ...
254 }
255 "markers": {
256 "marker1_name": {
257 "clade": the clade that the marker belongs to,
258 "ext": [list of external genomes where the marker appears],
259 "len": length of the marker,
260 "score": score of the marker,
261 "taxon": the taxon of the marker
262 }
263 ...
264 }
265 }
266
267 For functional profiling, HUMAnN2 uses multiple databases. Locally cached nucleotide or protein databases have to be downloaded database before using them (using the dedicated tool). Custom databases can also be used after upload. Nucleotide database have to be provided as a dataset.
261 268
262 **Outputs** 269 **Outputs**
263 270
264 HUMAnN creates three output files: 271 HUMAnN creates three output files:
265 272