comparison freebayes.xml @ 16:6d9407020066 draft

Uploaded
author devteam
date Tue, 16 Dec 2014 16:15:43 -0500
parents 59731e950e23
children 4c80a1387285
comparison
equal deleted inserted replaced
15:59731e950e23 16:6d9407020066
1 <?xml version="1.0"?> 1 <?xml version="1.0"?>
2 <tool id="freebayes" name="FreeBayes" version="freebayes-0.9.14"> 2 <tool id="freebayes" name="FreeBayes" version="0.3">
3 <requirements> 3 <requirements>
4 <requirement type="package" version="freebayes-0.9.14_8a407cf5f4">freebayes</requirement> 4 <requirement type="package" version="0.9.18_0059bdf">freebayes</requirement>
5 <requirement type="package" version="0.1.18">samtools</requirement> 5 <requirement type="package" version="0.1.18">samtools</requirement>
6 </requirements> 6 </requirements>
7 <description> - Bayesian genetic variant detector</description> 7 <description> - bayesian genetic variant detector</description>
8 <command> 8 <command>
9 ##set up input files 9 ##set up input files
10 10
11 #set $reference_fasta_filename = "localref.fa" 11 #set $reference_fasta_filename = "localref.fa"
12 12
22 ln -s "${input_bam.input_bam.metadata.bam_index}" "localbam_${bam_count}.bam.bai" &amp;&amp; 22 ln -s "${input_bam.input_bam.metadata.bam_index}" "localbam_${bam_count}.bam.bai" &amp;&amp;
23 #end for 23 #end for
24 24
25 ## Tabixize optional input_varinat_vcf file (for --variant-input option) 25 ## Tabixize optional input_varinat_vcf file (for --variant-input option)
26 26
27 #if ( str( $options_type.options_type_selector ) == 'cline' or str( $options_type.options_type_selector ) == 'full' ) and str( $options_type.optional_inputs.optional_inputs_selector ) == 'set' and str( $options_type.optional_inputs.input_variant_type.input_variant_type_selector ) == "provide_vcf": 27 #if ( str( $options_type.options_type_selector ) == 'cline' or str( $options_type.options_type_selector ) == 'full' ) and $options_type.optional_inputs.optional_inputs_selector and str( $options_type.optional_inputs.input_variant_type.input_variant_type_selector ) == "provide_vcf":
28 ln -s "${options_type.optional_inputs.input_variant_type.input_variant_vcf}" input_variant_vcf.vcf.gz &amp;&amp; 28 ln -s "${options_type.optional_inputs.input_variant_type.input_variant_vcf}" "input_variant_vcf.vcf.gz" &amp;&amp;
29 ln -s "${Tabixized_input}" input_variant_vcf.vcf.gz.tbi &amp;&amp; 29 ln -s "${Tabixized_input}" "input_variant_vcf.vcf.gz.tbi" &amp;&amp;
30 #end if 30 #end if
31 31
32 ##finished setting up inputs 32 ##finished setting up inputs
33 33
34 ##COMMAND LINE STARTS HERE 34 ##COMMAND LINE STARTS HERE
72 --min-alternate-fraction 0 72 --min-alternate-fraction 0
73 --pooled-continuous 73 --pooled-continuous
74 --report-monomorphic 74 --report-monomorphic
75 --standard-filters 75 --standard-filters
76 --min-coverage "${options_type.min_coverage}" 76 --min-coverage "${options_type.min_coverage}"
77 77
78 #elif str( $options_type.options_type_selector ) == "cline": 78 ## Command line direct text entry is not allowed at this time for security reasons
79 79
80 ${options_type.cline} 80 ## #elif str( $options_type.options_type_selector ) == "cline":
81
82 ## ${options_type.cline}
81 83
82 @optional_inputs_outputs@ 84 ## @optional_inputs_outputs@
83 85
84 #elif str( $options_type.options_type_selector ) == "full": 86 #elif str( $options_type.options_type_selector ) == "full":
85 87
86 ##optional inputs and outputs 88 ##optional inputs and outputs
87 89
191 193
192 </command> 194 </command>
193 195
194 <macros> 196 <macros>
195 <token name="@optional_inputs_outputs@"> 197 <token name="@optional_inputs_outputs@">
196 ## This token gets injected in commane in two instances: when options_type.options_type_selector == "full" and "cline" 198 ## This token gets injected in commane in two instances: when options_type.options_type_selector == "full" and "cline" ( cline is not supported at this time )
197 199
198 #if $options_type.optional_inputs.optional_inputs_selector: 200 #if $options_type.optional_inputs.optional_inputs_selector:
199 201
200 #if $options_type.optional_inputs.output_trace_option: 202 #if $options_type.optional_inputs.output_trace_option:
201 --trace "${output_trace}" 203 --trace "${output_trace}"
216 #if $options_type.optional_inputs.A: 218 #if $options_type.optional_inputs.A:
217 --cnv-map "${options_type.optional_inputs.A}" 219 --cnv-map "${options_type.optional_inputs.A}"
218 #end if 220 #end if
219 221
220 #if str( $options_type.optional_inputs.input_variant_type.input_variant_type_selector ) == "provide_vcf": 222 #if str( $options_type.optional_inputs.input_variant_type.input_variant_type_selector ) == "provide_vcf":
221 --variant-input input_variant_vcf.vcf.gz ## input_variant_vcf.vcf.gz is symlinked to a galaxy-generated dataset in "Tabixize optional input_varinat_vcf file" section of the command line above 223 --variant-input "input_variant_vcf.vcf.gz" ## input_variant_vcf.vcf.gz is symlinked to a galaxy-generated dataset in "Tabixize optional input_varinat_vcf file" section of the command line above
222 ${options_type.optional_inputs.input_variant_type.only_use_input_alleles} 224 ${options_type.optional_inputs.input_variant_type.only_use_input_alleles}
223 #end if 225 #end if
224 226
225 #if $options_type.optional_inputs.haplotype_basis_alleles: 227 #if $options_type.optional_inputs.haplotype_basis_alleles:
226 --haplotype-basis-alleles "${options_type.optional_inputs.haplotype_basis_alleles}" 228 --haplotype-basis-alleles "${options_type.optional_inputs.haplotype_basis_alleles}"
280 </param> 282 </param>
281 <when value="cached"> 283 <when value="cached">
282 <repeat name="input_bams" title="Sample BAM file" min="1"> 284 <repeat name="input_bams" title="Sample BAM file" min="1">
283 <param name="input_bam" type="data" format="bam" label="BAM file"> 285 <param name="input_bam" type="data" format="bam" label="BAM file">
284 <validator type="unspecified_build" /> 286 <validator type="unspecified_build" />
285 <validator type="dataset_metadata_in_data_table" table_name="sam_fa_indexes" metadata_name="dbkey" metadata_column="1" message="Sequences are not currently available for the specified build." /> 287 <validator type="dataset_metadata_in_data_table" table_name="fasta_indexes" metadata_name="dbkey" metadata_column="1" message="Sequences are not currently available for the specified build." />
286 </param> 288 </param>
287 </repeat> 289 </repeat>
290
288 <param name="ref_file" type="select" label="Using reference genome"> 291 <param name="ref_file" type="select" label="Using reference genome">
289 <options from_data_table="sam_fa_indexes"> 292 <options from_data_table="fasta_indexes"></options>
290 <!-- <filter type="sam_fa_indexes" key="dbkey" ref="input_bam" column="value"/> does not yet work in a repeat...-->
291 </options>
292 <validator type="no_options" message="A built-in reference genome is not available for the build associated with the selected input file"/> 293 <validator type="no_options" message="A built-in reference genome is not available for the build associated with the selected input file"/>
293 </param> 294 </param>
294 </when> 295 </when>
295 <when value="history"> <!-- FIX ME!!!! --> 296 <when value="history"> <!-- FIX ME!!!! -->
296 <repeat name="input_bams" title="Sample BAM file" min="1"> 297 <repeat name="input_bams" title="Sample BAM file" min="1">
297 <param name="input_bam" type="data" format="bam" label="BAM file" /> 298 <param name="input_bam" type="data" format="bam" label="BAM file" />
298 </repeat> 299 </repeat>
299 <param name="ref_file" type="data" format="fasta" label="Use the folloing dataset as the reference sequence" help="You can upload a FASTA sequence to the history and use it as reference" /> 300 <param name="ref_file" type="data" format="fasta" label="Use the following dataset as the reference sequence" help="You can upload a FASTA sequence to the history and use it as reference" />
300 </when> 301 </when>
301 </conditional> 302 </conditional>
302 303
303 <conditional name="target_limit_type"> 304 <conditional name="target_limit_type">
304 <param name="target_limit_type_selector" type="select" label="Limit variant calling to a set of regions?" help="Sets --targets or --region options"> 305 <param name="target_limit_type_selector" type="select" label="Limit variant calling to a set of regions?" help="Sets --targets or --region options">
324 <option value="simple" selected="True">1:Simple diploid calling</option> 325 <option value="simple" selected="True">1:Simple diploid calling</option>
325 <option value="simple_w_filters">2:Simple diploid calling with filtering and coverage</option> 326 <option value="simple_w_filters">2:Simple diploid calling with filtering and coverage</option>
326 <option value="naive">3:Frequency-based pooled calling</option> 327 <option value="naive">3:Frequency-based pooled calling</option>
327 <option value="naive_w_filters">4:Frequency-based pooled calling with filtering and coverage</option> 328 <option value="naive_w_filters">4:Frequency-based pooled calling with filtering and coverage</option>
328 <option value="full">5:Complete list of all options</option> 329 <option value="full">5:Complete list of all options</option>
330 <!-- We will not alloow command line text boxes at this time
329 <option value="cline">6:Input parameters on the command line</option> 331 <option value="cline">6:Input parameters on the command line</option>
332 -->
330 </param> 333 </param>
331 <when value="full"> 334 <when value="full">
332 335
333 <expand macro="optional_file_inputs" /> <!-- see macros section --> 336 <expand macro="optional_file_inputs" /> <!-- see macros section -->
334 337
501 </when> 504 </when>
502 <when value="naive_w_filters"> 505 <when value="naive_w_filters">
503 <!-- do nothing build command line using haplotype-length 0 min-alternate-count 1 min-alternate-fraction 0 pooled-continuous report-monomorphic standard-filters--> 506 <!-- do nothing build command line using haplotype-length 0 min-alternate-count 1 min-alternate-fraction 0 pooled-continuous report-monomorphic standard-filters-->
504 <param name="min_coverage" type="integer" value="0" label="Require at least this coverage to process a site" help="-! --min-coverage; default=0 " /> 507 <param name="min_coverage" type="integer" value="0" label="Require at least this coverage to process a site" help="-! --min-coverage; default=0 " />
505 </when> 508 </when>
509
510 <!-- We will not allow command line textboxes at this time
506 <when value="cline"> 511 <when value="cline">
507 512
508 <expand macro="optional_file_inputs" /> <!-- see macros section --> 513 <expand macro="optional_file_inputs" />
509 514
510 <param name="cline" size="60" type="text" value="-m 20 -q 30" label="Type command line tags here" help="All paremeters that DO NOT involve filenames can be typed here. Use &quot;Do you want to provide additional inputs?&quot; section above to control input and output files. For full syntax check help section below"> 515 <param name="cline" size="60" type="text" value="-m 20 -q 30" label="Type command line tags here" help="All paremeters that DO NOT involve filenames can be typed here. Use &quot;Do you want to provide additional inputs?&quot; section above to control input and output files. For full syntax check help section below">
511 <sanitizer> 516 <sanitizer>
512 <valid initial="string.printable"> 517 <valid initial="string.printable">
513 <remove value="&apos;"/> 518 <remove value="&apos;"/>
516 <add source="&apos;" target="__sq__"/> 521 <add source="&apos;" target="__sq__"/>
517 </mapping> 522 </mapping>
518 </sanitizer> 523 </sanitizer>
519 </param> 524 </param>
520 </when> 525 </when>
526 -->
521 527
522 </conditional> 528 </conditional>
523 529
524 </inputs> 530 </inputs>
525 <outputs> 531 <outputs>
548 554
549 FreeBayes is a Bayesian genetic variant detector designed to find small polymorphisms, specifically SNPs (single-nucleotide polymorphisms), indels (insertions and deletions), MNPs (multi-nucleotide polymorphisms), and complex events (composite insertion and substitution events) smaller than the length of a short-read sequencing alignment. 555 FreeBayes is a Bayesian genetic variant detector designed to find small polymorphisms, specifically SNPs (single-nucleotide polymorphisms), indels (insertions and deletions), MNPs (multi-nucleotide polymorphisms), and complex events (composite insertion and substitution events) smaller than the length of a short-read sequencing alignment.
550 556
551 See https://github.com/ekg/freebayes for details on FreeBayes. 557 See https://github.com/ekg/freebayes for details on FreeBayes.
552 558
553 This Galaxy instance of FreeBayes corresponds to release 8a407cf5f4416b5eba5bf27ca80144cd5e75bb80 559 This Galaxy instance of FreeBayes corresponds to release 0.9.18
554 560
555 ------ 561 ------
556 562
557 **Description** 563 **Description**
558 564
575 1. *Simple diploid calling*: The simples possible FreeBayes application. Equvalent of using FreeBayes with only a BAM input and no other parameter options. 581 1. *Simple diploid calling*: The simples possible FreeBayes application. Equvalent of using FreeBayes with only a BAM input and no other parameter options.
576 2. *Simple diploid calling with filtering and coverage*: Same as #1 plus two additional options: -0 (standard filters: --min-mapping-quality 30 --min-base-quality 20 --min-supporting-allele-qsum 0 --genotype-varinat-threshold 0) and --min-coverage. 582 2. *Simple diploid calling with filtering and coverage*: Same as #1 plus two additional options: -0 (standard filters: --min-mapping-quality 30 --min-base-quality 20 --min-supporting-allele-qsum 0 --genotype-varinat-threshold 0) and --min-coverage.
577 3. *Frequency-based pooled calling*: This is equivalent to using FreeBayes with the following options: --haplotype-length 0 --min-alternate-count 1 --min-alternate-fraction 0 --pooled-continuous --report-monomorphic. This is the best choice for calling varinats in mixtures such as viral, bacterial, or organellar genomes. 583 3. *Frequency-based pooled calling*: This is equivalent to using FreeBayes with the following options: --haplotype-length 0 --min-alternate-count 1 --min-alternate-fraction 0 --pooled-continuous --report-monomorphic. This is the best choice for calling varinats in mixtures such as viral, bacterial, or organellar genomes.
578 4. *Frequency-based pooled calling with filtering and coverage*: Same as #3 but adds -0 and --min-coverage like in #2. 584 4. *Frequency-based pooled calling with filtering and coverage*: Same as #3 but adds -0 and --min-coverage like in #2.
579 5. *Complete list of all options*: Gives you full control by exposing all FreeBayes options as Galaxy widgets. 585 5. *Complete list of all options*: Gives you full control by exposing all FreeBayes options as Galaxy widgets.
580 6. *Input parameters on the command line*: Similar to the choice above but for those who does not like clicking. Here options can be directly typed into a text box.
581 586
582 ----- 587 -----
583 588
584 **FreeBayes options** 589 **FreeBayes options**
585 590
834 For the underlying tool, please cite `Erik Garrison and Gabor Marth. Haplotype-based variant detection from short-read sequencing &lt;http://arxiv.org/abs/1207.3907&gt;`_. 839 For the underlying tool, please cite `Erik Garrison and Gabor Marth. Haplotype-based variant detection from short-read sequencing &lt;http://arxiv.org/abs/1207.3907&gt;`_.
835 840
836 The initial version of the wrapper was produced by Dan Blankenberg and upgraded by Anton Nekrutenko. 841 The initial version of the wrapper was produced by Dan Blankenberg and upgraded by Anton Nekrutenko.
837 842
838 </help> 843 </help>
844
845 <citations>
846 <citation type="bibtex">@misc{1207.3907,
847 Author = {Erik Garrison},
848 Title = {Haplotype-based variant detection from short-read sequencing},
849 Year = {2012},
850 Eprint = {arXiv:1207.3907},
851 url = {http://arxiv.org/abs/1207.3907},
852 }</citation>
853 </citations>
839 </tool> 854 </tool>