comparison bbnorm.xml @ 5:770bceda7785 draft default tip

planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/bbtools commit cd59ba2c349865259b92302a1d70e103b8a5e3cb
author iuc
date Tue, 27 Aug 2024 10:14:11 +0000
parents 1baa4ad1ac2f
children
comparison
equal deleted inserted replaced
4:1baa4ad1ac2f 5:770bceda7785
143 <when value="PE_2files"> 143 <when value="PE_2files">
144 <param name="read1" type="data" format="fastqsanger,fastqsanger.gz" label="Forward reads"/> 144 <param name="read1" type="data" format="fastqsanger,fastqsanger.gz" label="Forward reads"/>
145 <param name="read2" type="data" format="fastqsanger,fastqsanger.gz" label="Reverse reads"/> 145 <param name="read2" type="data" format="fastqsanger,fastqsanger.gz" label="Reverse reads"/>
146 </when> 146 </when>
147 <when value="paired"> 147 <when value="paired">
148 <param name="reads_collection" type="data_collection" format="fastqsanger,fastqsanger.gz" collection_type="paired" label="Collection of forward and reverse reads"/> 148 <param name="reads_collection" type="data_collection" format="fastqsanger,fastqsanger.gz" label="Collection of forward and reverse reads" collection_type="paired"/>
149 </when> 149 </when>
150 </conditional> 150 </conditional>
151 <param argument="target" type="integer" value="100" min="1" label="Target normalization depth" help="All depth parameters control kmer depth, not read depth. For kmer depth Dk, read depth Dr, read length R, and kmer size K: Dr=Dk*(R/(R-K+1))"/> 151 <param argument="target" type="integer" min="1" value="100" label="Target normalization depth" help="All depth parameters control kmer depth, not read depth. For kmer depth Dk, read depth Dr, read length R, and kmer size K: Dr=Dk*(R/(R-K+1))"/>
152 <section name="norm_params" title="Normalization parameters"> 152 <section name="norm_params" title="Normalization parameters">
153 <param argument="maxdepth" type="integer" value="-1" min="-1" label="Reads will not be downsampled when below this depth, even if they are above the target depth." help="All depth parameters control kmer depth, not read depth. For kmer depth Dk, read depth Dr, read length R, and kmer size K: Dr=Dk*(R/(R-K+1))"/> 153 <param argument="maxdepth" type="integer" min="-1" value="-1" label="Reads will not be downsampled when below this depth, even if they are above the target depth." help="All depth parameters control kmer depth, not read depth. For kmer depth Dk, read depth Dr, read length R, and kmer size K: Dr=Dk*(R/(R-K+1))"/>
154 <param argument="mindepth" type="integer" value="5" min="0" label="kmers with depth below this number will not be included when calculating the depth of a read." help="All depth parameters control kmer depth, not read depth. For kmer depth Dk, read depth Dr, read length R, and kmer size K: Dr=Dk*(R/(R-K+1))"/> 154 <param argument="mindepth" type="integer" min="0" value="5" label="kmers with depth below this number will not be included when calculating the depth of a read." help="All depth parameters control kmer depth, not read depth. For kmer depth Dk, read depth Dr, read length R, and kmer size K: Dr=Dk*(R/(R-K+1))"/>
155 <param argument="minkmers" type="integer" value="15" min="0" label="Reads must have at least this many kmers over min depth to be retained."/> 155 <param argument="minkmers" type="integer" min="0" value="15" label="Reads must have at least this many kmers over min depth to be retained."/>
156 <param argument="percentile" type="integer" value="54" min="1" max="100" label="Percentile to infer read depth" help="Read depth is by default inferred from the 54th percentile of kmer depth, but this may be changed to any number 1-100."/> 156 <param argument="percentile" type="integer" min="1" max="100" value="54" label="Percentile to infer read depth" help="Read depth is by default inferred from the 54th percentile of kmer depth, but this may be changed to any number 1-100."/>
157 <param argument="uselowerdepth" type="boolean" checked="true" label="For pairs, use the depth of the lower read as the depth proxy."/> 157 <param argument="uselowerdepth" type="boolean" checked="true" label="For pairs, use the depth of the lower read as the depth proxy."/>
158 <param argument="deterministic" type="boolean" checked="true" label="Generate random numbers deterministically" help="This would ensure identical output between multiple runs. May decrease speed with a huge number of threads."/> 158 <param argument="deterministic" type="boolean" checked="true" label="Generate random numbers deterministically" help="This would ensure identical output between multiple runs. May decrease speed with a huge number of threads."/>
159 <param argument="fixspikes" type="boolean" checked="false" label="Do a slower, high-precision bloom filter lookup of kmers that appear to have an abnormally high depth due to collisions."/> 159 <param argument="fixspikes" type="boolean" checked="false" label="Do a slower, high-precision bloom filter lookup of kmers that appear to have an abnormally high depth due to collisions."/>
160 <param argument="passes" type="integer" value="2" label="Number of passes to perform" help="1 pass is the basic mode. 2 passes allow greater accuracy, error detection, and better control of output depth."/> 160 <param argument="passes" type="integer" value="2" label="Number of passes to perform" help="1 pass is the basic mode. 2 passes allow greater accuracy, error detection, and better control of output depth."/>
161 </section> 161 </section>
162 <section name="hashing_params" title="Hashing parameters"> 162 <section name="hashing_params" title="Hashing parameters">
163 <param argument="k" type="integer" value="31" min="1" label="kmer length" help="Values under 32 are most efficient, but arbitrarily high values are supported."/> 163 <param argument="k" type="integer" min="1" value="31" label="kmer length" help="Values under 32 are most efficient, but arbitrarily high values are supported."/>
164 <param argument="bits" type="select" label="Bits per cell in bloom filter" help="Maximum kmer depth recorded is 2^bits, where bits is the value selected here. Large values decrease accuracy for a fixed amount of memory, so use the lowest number you can that will still capture highest-depth kmers."> 164 <param argument="bits" type="select" label="Bits per cell in bloom filter" help="Maximum kmer depth recorded is 2^bits, where bits is the value selected here. Large values decrease accuracy for a fixed amount of memory, so use the lowest number you can that will still capture highest-depth kmers.">
165 <option value="2">2</option> 165 <option value="2">2</option>
166 <option value="4">4</option> 166 <option value="4">4</option>
167 <option value="8">8</option> 167 <option value="8">8</option>
168 <option value="16" selected="true">16</option> 168 <option value="16" selected="true">16</option>
169 <option value="32">32</option> 169 <option value="32">32</option>
170 </param> 170 </param>
171 <param argument="hashes" type="integer" value="3" min="1" label="Number of times each kmer is hashed and stored." help="Higher is slower. Higher is more accurate if there is enough memory, but less accurate if there is not enough memory."/> 171 <param argument="hashes" type="integer" min="1" value="3" label="Number of times each kmer is hashed and stored." help="Higher is slower. Higher is more accurate if there is enough memory, but less accurate if there is not enough memory."/>
172 <conditional name="prefilter"> 172 <conditional name="prefilter">
173 <param argument="prefilter" type="select" label="Use a prefilter to eliminate low-depth kmers" help="True is slower, but generally more accurate; filters out low-depth kmers from the main hashtable. The prefilter is more memory-efficient because it uses 2-bit cells."> 173 <param argument="prefilter" type="select" label="Use a prefilter to eliminate low-depth kmers" help="True is slower, but generally more accurate; filters out low-depth kmers from the main hashtable. The prefilter is more memory-efficient because it uses 2-bit cells.">
174 <option value="true">Yes</option> 174 <option value="true">Yes</option>
175 <option value="false" selected="true">No</option> 175 <option value="false" selected="true">No</option>
176 </param> 176 </param>
177 <when value="false"/> 177 <when value="false"/>
178 <when value="true"> 178 <when value="true">
179 <param argument="prehashes" type="integer" value="2" min="1" label="Number of hashes for the prefilter"/> 179 <param argument="prehashes" type="integer" min="1" value="2" label="Number of hashes for the prefilter"/>
180 <param argument="prefilterbits" type="integer" value="2" min="1" label="Bits per cell in prefilter"/> 180 <param argument="prefilterbits" type="integer" min="1" value="2" label="Bits per cell in prefilter"/>
181 <param argument="prefiltersize" type="float" value="0.35" min="0" max="1" label="Fraction of memory to allocate for the prefilter."/> 181 <param argument="prefiltersize" type="float" min="0" max="1" value="0.35" label="Fraction of memory to allocate for the prefilter."/>
182 </when> 182 </when>
183 </conditional> 183 </conditional>
184 <param argument="buildpasses" type="integer" value="1" min="1" label="Number of passes" help="More passes can sometimes increase accuracy by iteratively removing low-depth kmers"/> 184 <param argument="buildpasses" type="integer" min="1" value="1" label="Number of passes" help="More passes can sometimes increase accuracy by iteratively removing low-depth kmers"/>
185 <param argument="minq" type="integer" value="6" min="0" label="Ignore kmers containing bases with quality below this threshold"/> 185 <param argument="minq" type="integer" min="0" value="6" label="Ignore kmers containing bases with quality below this threshold"/>
186 <param argument="minprob" type="float" value="0.5" min="0" max="1" label="Ignore kmers with overall probability of correctness below this threshold"/> 186 <param argument="minprob" type="float" min="0" max="1" value="0.5" label="Ignore kmers with overall probability of correctness below this threshold"/>
187 <param argument="rdk" type="boolean" checked="true" label="Remove duplicate kmers" help="When true, a kmer's count will only be incremented once per read pair, even if that kmer occurs more than once."/> 187 <param argument="rdk" type="boolean" checked="true" label="Remove duplicate kmers" help="When true, a kmer's count will only be incremented once per read pair, even if that kmer occurs more than once."/>
188 </section> 188 </section>
189 <section name="error_det_params" title="Error detection parameters"> 189 <section name="error_det_params" title="Error detection parameters">
190 <param argument="hdp" type="integer" value="90" min="0" max="100" label="highdepthpercentile" help="Position in sorted kmer depth array used as proxy of a read's high kmer depth."/> 190 <param argument="hdp" type="integer" min="0" max="100" value="90" label="highdepthpercentile" help="Position in sorted kmer depth array used as proxy of a read's high kmer depth."/>
191 <param argument="ldp" type="integer" value="25" min="0" max="100" label="lowdepthpercentile" help="Position in sorted kmer depth array used as proxy of a read's low kmer depth."/> 191 <param argument="ldp" type="integer" min="0" max="100" value="25" label="lowdepthpercentile" help="Position in sorted kmer depth array used as proxy of a read's low kmer depth."/>
192 <param argument="tossbadreads" type="boolean" checked="false" label="Throw away reads detected as containing errors."/> 192 <param argument="tossbadreads" type="boolean" checked="false" label="Throw away reads detected as containing errors."/>
193 <param argument="requirebothbad" type="boolean" checked="false" label="Only toss bad pairs if both reads are bad."/> 193 <param argument="requirebothbad" type="boolean" checked="false" label="Only toss bad pairs if both reads are bad."/>
194 <param argument="errordetectratio" type="integer" value="125" min="0" label="Error detection ratio" help="Reads with a ratio of at least this much between their high and low depth kmers will be classified as error reads."/> 194 <param argument="errordetectratio" type="integer" min="0" value="125" label="Error detection ratio" help="Reads with a ratio of at least this much between their high and low depth kmers will be classified as error reads."/>
195 <param argument="highthresh" type="integer" value="12" min="0" label="Threshold for high kmer" help="A high kmer at or above this depth is considered non-error."/> 195 <param argument="highthresh" type="integer" min="0" value="12" label="Threshold for high kmer" help="A high kmer at or above this depth is considered non-error."/>
196 <param argument="lowthresh" type="integer" value="3" min="0" label="Threshold for low kmer" help="Kmers at this and below are always considered errors."/> 196 <param argument="lowthresh" type="integer" min="0" value="3" label="Threshold for low kmer" help="Kmers at this and below are always considered errors."/>
197 </section> 197 </section>
198
199 <section name="error_corr_params" title="Error correction parameters"> 198 <section name="error_corr_params" title="Error correction parameters">
200 <conditional name="ecc"> 199 <conditional name="ecc">
201 <param argument="ecc" type="select" label="What should be done with detected errors?" help="Tadpole is now preferred for error correction, as it does a better job."> 200 <param argument="ecc" type="select" label="What should be done with detected errors?" help="Tadpole is now preferred for error correction, as it does a better job.">
202 <option value="true" >Correct errors when possible</option> 201 <option value="true">Correct errors when possible</option>
203 <option value="false" selected="true">Do not attempt to correct errors</option> 202 <option value="false" selected="true">Do not attempt to correct errors</option>
204 </param> 203 </param>
205 <when value="false"/> 204 <when value="false"/>
206 <when value="true"> 205 <when value="true">
207 <param argument="ecclimit" type="integer" value="3" min="1" label="Correct up to this many errors per read." help="If more are detected, the read will remain unchanged."/> 206 <param argument="ecclimit" type="integer" min="1" value="3" label="Correct up to this many errors per read." help="If more are detected, the read will remain unchanged."/>
208 <param argument="errorcorrectratio" type="integer" value="140" min="0" label="Depth ratio" help="Adjacent kmers with a depth ratio of at least this much between them will be classified as an error."/> 207 <param argument="errorcorrectratio" type="integer" min="0" value="140" label="Depth ratio" help="Adjacent kmers with a depth ratio of at least this much between them will be classified as an error."/>
209 <param argument="echighthresh" type="integer" value="22" min="0" label="Threshold for high kmer" help="A kmer at this or above may be considered non-error."/> 208 <param argument="echighthresh" type="integer" min="0" value="22" label="Threshold for high kmer" help="A kmer at this or above may be considered non-error."/>
210 <param argument="eclowthresh" type="integer" value="2" min="0" label="Threshold for low kmer." help="kmers at this depth or below will be considered as errors."/> 209 <param argument="eclowthresh" type="integer" min="0" value="2" label="Threshold for low kmer." help="kmers at this depth or below will be considered as errors."/>
211 <param argument="eccmaxqual" type="integer" value="127" min="0" label="Do not correct bases with quality above this value."/> 210 <param argument="eccmaxqual" type="integer" min="0" value="127" label="Do not correct bases with quality above this value."/>
212 <param argument="meo" type="boolean" checked="false" label="Marks errors by reducing quality value of suspected errors; does not correct anything."/> 211 <param argument="meo" type="boolean" checked="false" label="Marks errors by reducing quality value of suspected errors; does not correct anything."/>
213 <param argument="mue" type="boolean" checked="true" label="Mark errors only on uncorrectable reads."/> 212 <param argument="mue" type="boolean" checked="true" label="Mark errors only on uncorrectable reads."/>
214 <param argument="overlap" type="boolean" checked="false" label="Correct errors by read overlap."/> 213 <param argument="overlap" type="boolean" checked="false" label="Correct errors by read overlap."/>
215 </when> 214 </when>
216 </conditional> 215 </conditional>
217 </section> 216 </section>
218
219 <section name="output_options" title="Output options"> 217 <section name="output_options" title="Output options">
220 <param name="save_discarded_reads" type="boolean" checked="false" label="Save the reads that were eliminated from the input datasets to the history"/> 218 <param name="save_discarded_reads" type="boolean" checked="false" label="Save the reads that were eliminated from the input datasets to the history"/>
221 <param name="save_kmer_hists" type="boolean" checked="false" label="Save the kmer histograms (in tabular format) for the input and output datasets to the history"/> 219 <param name="save_kmer_hists" type="boolean" checked="false" label="Save the kmer histograms (in tabular format) for the input and output datasets to the history"/>
222 </section> 220 </section>
223 </inputs> 221 </inputs>
245 </outputs> 243 </outputs>
246 <tests> 244 <tests>
247 <!-- Single end sequencing --> 245 <!-- Single end sequencing -->
248 <test expect_num_outputs="1"> 246 <test expect_num_outputs="1">
249 <param name="input_type" value="single_end"/> 247 <param name="input_type" value="single_end"/>
250 <param name="read1" ftype="fastqsanger" value="bbnorm/input_R1.fastq"/> 248 <param name="read1" value="bbnorm/input_R1.fastq" ftype="fastqsanger"/>
251 <param name="target" value="4"/> 249 <param name="target" value="4"/>
252 <section name="norm_params"> 250 <section name="norm_params">
253 <param name="deterministic" value="true"/> 251 <param name="deterministic" value="true"/>
254 <param name="mindepth" value="0"/> 252 <param name="mindepth" value="0"/>
255 </section> 253 </section>
256 <output name="output_normalised_R1" ftype="fastqsanger" value="bbnorm/normalised_R1.fastq"/> 254 <output name="output_normalised_R1" ftype="fastqsanger" value="bbnorm/normalised_R1.fastq"/>
257 </test> 255 </test>
258 <!-- Single end sequencing, compressed --> 256 <!-- Single end sequencing, compressed -->
259 <test expect_num_outputs="1"> 257 <test expect_num_outputs="1">
260 <param name="input_type" value="single_end"/> 258 <param name="input_type" value="single_end"/>
261 <param name="read1" ftype="fastqsanger.gz" value="bbnorm/input_R1.fastq.gz"/> 259 <param name="read1" value="bbnorm/input_R1.fastq.gz" ftype="fastqsanger.gz"/>
262 <param name="target" value="4"/> 260 <param name="target" value="4"/>
263 <section name="norm_params"> 261 <section name="norm_params">
264 <param name="deterministic" value="true"/> 262 <param name="deterministic" value="true"/>
265 <param name="mindepth" value="0"/> 263 <param name="mindepth" value="0"/>
266 </section> 264 </section>
267 <output name="output_normalised_R1" ftype="fastqsanger.gz" value="bbnorm/normalised_R1.fastq"/> 265 <output name="output_normalised_R1" ftype="fastqsanger.gz" value="bbnorm/normalised_R1.fastq"/>
268 </test> 266 </test>
269 <!-- PE as an interleaved file --> 267 <!-- PE as an interleaved file -->
270 <test expect_num_outputs="4"> 268 <test expect_num_outputs="4">
271 <param name="input_type" value="PE_1file"/> 269 <param name="input_type" value="PE_1file"/>
272 <param name="read1" ftype="fastqsanger" value="bbnorm/input_interleaved.fastq"/> 270 <param name="read1" value="bbnorm/input_interleaved.fastq" ftype="fastqsanger"/>
273 <param name="target" value="4"/> 271 <param name="target" value="4"/>
274 <section name="norm_params"> 272 <section name="norm_params">
275 <param name="deterministic" value="true"/> 273 <param name="deterministic" value="true"/>
276 <param name="mindepth" value="0"/> 274 <param name="mindepth" value="0"/>
277 </section> 275 </section>
285 <output name="kmer_hist_output" ftype="tabular" file="bbnorm/kmer_hist_output.tabular"/> 283 <output name="kmer_hist_output" ftype="tabular" file="bbnorm/kmer_hist_output.tabular"/>
286 </test> 284 </test>
287 <!-- PE as 2 files --> 285 <!-- PE as 2 files -->
288 <test expect_num_outputs="2"> 286 <test expect_num_outputs="2">
289 <param name="input_type" value="PE_2files"/> 287 <param name="input_type" value="PE_2files"/>
290 <param name="read1" ftype="fastqsanger" value="bbnorm/input_R1.fastq"/> 288 <param name="read1" value="bbnorm/input_R1.fastq" ftype="fastqsanger"/>
291 <param name="read2" ftype="fastqsanger" value="bbnorm/input_R2.fastq"/> 289 <param name="read2" value="bbnorm/input_R2.fastq" ftype="fastqsanger"/>
292 <param name="target" value="4"/> 290 <param name="target" value="4"/>
293 <section name="norm_params"> 291 <section name="norm_params">
294 <param name="deterministic" value="true"/> 292 <param name="deterministic" value="true"/>
295 <param name="mindepth" value="0"/> 293 <param name="mindepth" value="0"/>
296 </section> 294 </section>
388 * The sequencing platform has a very high error rate (ex: ONT) that might mislead this algorithm. 386 * The sequencing platform has a very high error rate (ex: ONT) that might mislead this algorithm.
389 387
390 </help> 388 </help>
391 <expand macro="citations"/> 389 <expand macro="citations"/>
392 </tool> 390 </tool>
393