annotate bwa-mem.xml @ 10:6069ffa8b240 draft

planemo upload for repository https://github.com/galaxyproject/tools-devteam/tree/master/tools/bwa commit 653588a3c59eb9965097f87c99e6fca1806365cd
author devteam
date Fri, 08 Jan 2016 17:02:09 -0500
parents 7bee165c3a44
children 546ada4a9f43
Ignore whitespace changes - Everywhere: Within whitespace: At end of lines:
rev   line source
0
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
1 <?xml version="1.0"?>
10
6069ffa8b240 planemo upload for repository https://github.com/galaxyproject/tools-devteam/tree/master/tools/bwa commit 653588a3c59eb9965097f87c99e6fca1806365cd
devteam
parents: 9
diff changeset
2 <tool id="bwa_mem" name="Map with BWA-MEM" version="0.7.12">
2
e29bc5c169bc Uploaded
devteam
parents: 1
diff changeset
3 <description>- map medium and long reads (&gt; 100 bp) against reference genome</description>
0
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
4 <macros>
5
fbf460831036 planemo upload commit d0e3412c58bd3bdc1a483a1e2f7f9c2aa5c87a1f-dirty
devteam
parents: 4
diff changeset
5 <import>read_group_macros.xml</import>
0
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
6 <import>bwa_macros.xml</import>
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
7 </macros>
7
d8c9597bfb09 planemo upload for repository https://github.com/galaxyproject/tools-devteam/tree/master/tools/bwa commit ddb8bdb9d62399f086b06b3469450d0aad2113bd
devteam
parents: 6
diff changeset
8 <expand macro="requirements" />
6
09a7281d24c5 planemo upload commit 00a7926c285bc4a339bd7deebf40b28f39c7d947-dirty
devteam
parents: 5
diff changeset
9 <expand macro="stdio" />
0
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
10 <command>
10
6069ffa8b240 planemo upload for repository https://github.com/galaxyproject/tools-devteam/tree/master/tools/bwa commit 653588a3c59eb9965097f87c99e6fca1806365cd
devteam
parents: 9
diff changeset
11 <![CDATA[
0
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
12 #set $reference_fasta_filename = "localref.fa"
2
e29bc5c169bc Uploaded
devteam
parents: 1
diff changeset
13
0
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
14 #if str( $reference_source.reference_source_selector ) == "history":
10
6069ffa8b240 planemo upload for repository https://github.com/galaxyproject/tools-devteam/tree/master/tools/bwa commit 653588a3c59eb9965097f87c99e6fca1806365cd
devteam
parents: 9
diff changeset
15 ln -s "${reference_source.ref_file}" "${reference_fasta_filename}" &&
2
e29bc5c169bc Uploaded
devteam
parents: 1
diff changeset
16
10
6069ffa8b240 planemo upload for repository https://github.com/galaxyproject/tools-devteam/tree/master/tools/bwa commit 653588a3c59eb9965097f87c99e6fca1806365cd
devteam
parents: 9
diff changeset
17 ## The following shell commands decide which of the BWA indexing algorithms (IS or BWTSW) will be run
6069ffa8b240 planemo upload for repository https://github.com/galaxyproject/tools-devteam/tree/master/tools/bwa commit 653588a3c59eb9965097f87c99e6fca1806365cd
devteam
parents: 9
diff changeset
18 ## depending on the size of the input FASTA dataset
6069ffa8b240 planemo upload for repository https://github.com/galaxyproject/tools-devteam/tree/master/tools/bwa commit 653588a3c59eb9965097f87c99e6fca1806365cd
devteam
parents: 9
diff changeset
19 ( size=`stat -c %s "${reference_source.ref_file}" 2>/dev/null`; ## Linux
6069ffa8b240 planemo upload for repository https://github.com/galaxyproject/tools-devteam/tree/master/tools/bwa commit 653588a3c59eb9965097f87c99e6fca1806365cd
devteam
parents: 9
diff changeset
20 if [ $? -ne 0 ]; then
6069ffa8b240 planemo upload for repository https://github.com/galaxyproject/tools-devteam/tree/master/tools/bwa commit 653588a3c59eb9965097f87c99e6fca1806365cd
devteam
parents: 9
diff changeset
21 size=\$(stat -f %z "${reference_source.ref_file}"); ## OSX
6069ffa8b240 planemo upload for repository https://github.com/galaxyproject/tools-devteam/tree/master/tools/bwa commit 653588a3c59eb9965097f87c99e6fca1806365cd
devteam
parents: 9
diff changeset
22 fi &&
6069ffa8b240 planemo upload for repository https://github.com/galaxyproject/tools-devteam/tree/master/tools/bwa commit 653588a3c59eb9965097f87c99e6fca1806365cd
devteam
parents: 9
diff changeset
23 if [ "\$size" -lt 2000000000 ]; then
6069ffa8b240 planemo upload for repository https://github.com/galaxyproject/tools-devteam/tree/master/tools/bwa commit 653588a3c59eb9965097f87c99e6fca1806365cd
devteam
parents: 9
diff changeset
24 echo "Reference genome size is \$size bytes, generating BWA index with is algorithm";
6069ffa8b240 planemo upload for repository https://github.com/galaxyproject/tools-devteam/tree/master/tools/bwa commit 653588a3c59eb9965097f87c99e6fca1806365cd
devteam
parents: 9
diff changeset
25 bwa index -a is "${reference_fasta_filename}";
6069ffa8b240 planemo upload for repository https://github.com/galaxyproject/tools-devteam/tree/master/tools/bwa commit 653588a3c59eb9965097f87c99e6fca1806365cd
devteam
parents: 9
diff changeset
26 else
6069ffa8b240 planemo upload for repository https://github.com/galaxyproject/tools-devteam/tree/master/tools/bwa commit 653588a3c59eb9965097f87c99e6fca1806365cd
devteam
parents: 9
diff changeset
27 echo "Reference genome size is \$size bytes, generating BWA index with bwtsw algorithm";
6069ffa8b240 planemo upload for repository https://github.com/galaxyproject/tools-devteam/tree/master/tools/bwa commit 653588a3c59eb9965097f87c99e6fca1806365cd
devteam
parents: 9
diff changeset
28 bwa index -a bwtsw "${reference_fasta_filename}";
6069ffa8b240 planemo upload for repository https://github.com/galaxyproject/tools-devteam/tree/master/tools/bwa commit 653588a3c59eb9965097f87c99e6fca1806365cd
devteam
parents: 9
diff changeset
29 fi
6069ffa8b240 planemo upload for repository https://github.com/galaxyproject/tools-devteam/tree/master/tools/bwa commit 653588a3c59eb9965097f87c99e6fca1806365cd
devteam
parents: 9
diff changeset
30 ) &&
0
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
31 #else:
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
32 #set $reference_fasta_filename = str( $reference_source.ref_file.fields.path )
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
33 #end if
2
e29bc5c169bc Uploaded
devteam
parents: 1
diff changeset
34
0
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
35 ## Begin BWA-MEM command line
2
e29bc5c169bc Uploaded
devteam
parents: 1
diff changeset
36
0
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
37 bwa mem
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
38 -t "\${GALAXY_SLOTS:-1}"
2
e29bc5c169bc Uploaded
devteam
parents: 1
diff changeset
39 -v 1 ## Verbosity is set to 1 (errors only)
e29bc5c169bc Uploaded
devteam
parents: 1
diff changeset
40
0
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
41 #if str( $fastq_input.fastq_input_selector ) == "paired_iv": ## For interleaved fastq files set -p option
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
42 -p
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
43 #if str( $fastq_input.iset_stats ): ## check that insert statistics is used
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
44 -I "${fastq_input.iset_stats}"
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
45 #end if
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
46 #end if
2
e29bc5c169bc Uploaded
devteam
parents: 1
diff changeset
47
0
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
48 #if str( $analysis_type.analysis_type_selector ) == "pacbio":
2
e29bc5c169bc Uploaded
devteam
parents: 1
diff changeset
49 -x pacbio
0
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
50 #elif str( $analysis_type.analysis_type_selector ) == "full":
2
e29bc5c169bc Uploaded
devteam
parents: 1
diff changeset
51 #if str( $analysis_type.algorithmic_options.algorithmic_options_selector ) == "set": ## Algorithmic options
0
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
52 -k "${analysis_type.algorithmic_options.k}"
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
53 -w "${analysis_type.algorithmic_options.w}"
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
54 -d "${analysis_type.algorithmic_options.d}"
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
55 -r "${analysis_type.algorithmic_options.r}"
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
56 -y "${analysis_type.algorithmic_options.y}"
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
57 -c "${analysis_type.algorithmic_options.c}"
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
58 -D "${analysis_type.algorithmic_options.D}"
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
59 -W "${analysis_type.algorithmic_options.W}"
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
60 -m "${analysis_type.algorithmic_options.m}"
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
61 ${analysis_type.algorithmic_options.S}
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
62 ${analysis_type.algorithmic_options.P}
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
63 ${analysis_type.algorithmic_options.e}
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
64 #end if
2
e29bc5c169bc Uploaded
devteam
parents: 1
diff changeset
65
e29bc5c169bc Uploaded
devteam
parents: 1
diff changeset
66 #if str( $analysis_type.scoring_options.scoring_options_selector ) == "set": ## Scoring options
0
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
67 -A "${analysis_type.scoring_options.A}"
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
68 -B "${analysis_type.scoring_options.B}"
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
69 -O "${analysis_type.scoring_options.O}"
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
70 -E "${analysis_type.scoring_options.E}"
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
71 -L "${analysis_type.scoring_options.L}"
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
72 -U "${analysis_type.scoring_options.U}"
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
73 #end if
2
e29bc5c169bc Uploaded
devteam
parents: 1
diff changeset
74
e29bc5c169bc Uploaded
devteam
parents: 1
diff changeset
75 #if str( $analysis_type.io_options.io_options_selector ) == "set": ## IO options
0
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
76 -T "${analysis_type.io_options.T}"
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
77 -h "${analysis_type.io_options.h}"
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
78 ${analysis_type.io_options.a}
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
79 ${analysis_type.io_options.C}
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
80 ${analysis_type.io_options.V}
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
81 ${analysis_type.io_options.Y}
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
82 ${analysis_type.io_options.M}
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
83 #end if
2
e29bc5c169bc Uploaded
devteam
parents: 1
diff changeset
84
0
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
85 #end if
2
e29bc5c169bc Uploaded
devteam
parents: 1
diff changeset
86
5
fbf460831036 planemo upload commit d0e3412c58bd3bdc1a483a1e2f7f9c2aa5c87a1f-dirty
devteam
parents: 4
diff changeset
87 ## Handle read group options...
fbf460831036 planemo upload commit d0e3412c58bd3bdc1a483a1e2f7f9c2aa5c87a1f-dirty
devteam
parents: 4
diff changeset
88 @define_read_group_helpers@
fbf460831036 planemo upload commit d0e3412c58bd3bdc1a483a1e2f7f9c2aa5c87a1f-dirty
devteam
parents: 4
diff changeset
89 #if str( $fastq_input.fastq_input_selector ) == "paired":
fbf460831036 planemo upload commit d0e3412c58bd3bdc1a483a1e2f7f9c2aa5c87a1f-dirty
devteam
parents: 4
diff changeset
90 #set $rg_auto_name = $read_group_name_default($fastq_input.fastq_input1, $fastq_input.fastq_input2)
fbf460831036 planemo upload commit d0e3412c58bd3bdc1a483a1e2f7f9c2aa5c87a1f-dirty
devteam
parents: 4
diff changeset
91 #else:
fbf460831036 planemo upload commit d0e3412c58bd3bdc1a483a1e2f7f9c2aa5c87a1f-dirty
devteam
parents: 4
diff changeset
92 #set $rg_auto_name = $read_group_name_default($fastq_input.fastq_input1)
fbf460831036 planemo upload commit d0e3412c58bd3bdc1a483a1e2f7f9c2aa5c87a1f-dirty
devteam
parents: 4
diff changeset
93 #end if
fbf460831036 planemo upload commit d0e3412c58bd3bdc1a483a1e2f7f9c2aa5c87a1f-dirty
devteam
parents: 4
diff changeset
94 @set_use_rg_var@
fbf460831036 planemo upload commit d0e3412c58bd3bdc1a483a1e2f7f9c2aa5c87a1f-dirty
devteam
parents: 4
diff changeset
95 @set_read_group_vars@
fbf460831036 planemo upload commit d0e3412c58bd3bdc1a483a1e2f7f9c2aa5c87a1f-dirty
devteam
parents: 4
diff changeset
96 #if $use_rg
2
e29bc5c169bc Uploaded
devteam
parents: 1
diff changeset
97 @set_rg_string@
e29bc5c169bc Uploaded
devteam
parents: 1
diff changeset
98 -R '$rg_string'
e29bc5c169bc Uploaded
devteam
parents: 1
diff changeset
99 #end if
e29bc5c169bc Uploaded
devteam
parents: 1
diff changeset
100
0
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
101 #if str( $fastq_input.fastq_input_selector ) == "paired":
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
102 #if str( $fastq_input.iset_stats ): ## check that insert statistics is used
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
103 -I "${fastq_input.iset_stats}"
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
104 #end if
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
105
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
106 "${reference_fasta_filename}"
2
e29bc5c169bc Uploaded
devteam
parents: 1
diff changeset
107 "${fastq_input.fastq_input1}" "${fastq_input.fastq_input2}"
e29bc5c169bc Uploaded
devteam
parents: 1
diff changeset
108 #elif str( $fastq_input.fastq_input_selector ) == "paired_collection":
e29bc5c169bc Uploaded
devteam
parents: 1
diff changeset
109 #if str( $fastq_input.iset_stats ): ## check that insert statistics is used
e29bc5c169bc Uploaded
devteam
parents: 1
diff changeset
110 -I "${fastq_input.iset_stats}"
e29bc5c169bc Uploaded
devteam
parents: 1
diff changeset
111 #end if
e29bc5c169bc Uploaded
devteam
parents: 1
diff changeset
112
0
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
113 "${reference_fasta_filename}"
2
e29bc5c169bc Uploaded
devteam
parents: 1
diff changeset
114 "${fastq_input.fastq_input1.forward}" "${fastq_input.fastq_input1.reverse}"
e29bc5c169bc Uploaded
devteam
parents: 1
diff changeset
115 #else:
e29bc5c169bc Uploaded
devteam
parents: 1
diff changeset
116 "${reference_fasta_filename}"
0
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
117 "${fastq_input.fastq_input1}"
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
118 #end if
2
e29bc5c169bc Uploaded
devteam
parents: 1
diff changeset
119
10
6069ffa8b240 planemo upload for repository https://github.com/galaxyproject/tools-devteam/tree/master/tools/bwa commit 653588a3c59eb9965097f87c99e6fca1806365cd
devteam
parents: 9
diff changeset
120 | samtools view -Sb - > temporary_bam_file.bam &&
2
e29bc5c169bc Uploaded
devteam
parents: 1
diff changeset
121
0
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
122 samtools sort -f temporary_bam_file.bam "${bam_output}" ## -f: treat the last argument as the full output file name (no .bam suffix appended)
10
6069ffa8b240 planemo upload for repository https://github.com/galaxyproject/tools-devteam/tree/master/tools/bwa commit 653588a3c59eb9965097f87c99e6fca1806365cd
devteam
parents: 9
diff changeset
123 ]]>
0
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
124 </command>
2
e29bc5c169bc Uploaded
devteam
parents: 1
diff changeset
125
0
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
126 <inputs>
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
127
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
128 <conditional name="reference_source">
4
ac30bfd3e2a8 planemo upload commit a50a3947aebc8a1d11bac39599f4efd8ed9a3bd5
devteam
parents: 2
diff changeset
129 <param name="reference_source_selector" type="select" label="Will you select a reference genome from your history or use a built-in index?" help="Built-ins were indexed using default options. See `Indexes` section of help below">
ac30bfd3e2a8 planemo upload commit a50a3947aebc8a1d11bac39599f4efd8ed9a3bd5
devteam
parents: 2
diff changeset
130 <option value="cached">Use a built-in genome index</option>
ac30bfd3e2a8 planemo upload commit a50a3947aebc8a1d11bac39599f4efd8ed9a3bd5
devteam
parents: 2
diff changeset
131 <option value="history">Use a genome from history and build index</option>
0
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
132 </param>
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
133 <when value="cached">
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
134 <param name="ref_file" type="select" label="Using reference genome" help="Select genome from the list">
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
135 <options from_data_table="bwa_mem_indexes">
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
136 <filter type="sort_by" column="2" />
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
137 <validator type="no_options" message="No indexes are available" />
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
138 </options>
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
139 <validator type="no_options" message="A built-in reference genome is not available for the build associated with the selected input file"/>
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
140 </param>
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
141 </when>
2
e29bc5c169bc Uploaded
devteam
parents: 1
diff changeset
142 <when value="history">
0
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
143 <param name="ref_file" type="data" format="fasta" label="Use the following dataset as the reference sequence" help="You can upload a FASTA sequence to the history and use it as reference" />
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
144 </when>
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
145 </conditional>
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
146 <conditional name="fastq_input">
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
147 <param name="fastq_input_selector" type="select" label="Single or Paired-end reads" help="Select between paired and single end data">
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
148 <option value="paired">Paired</option>
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
149 <option value="single">Single</option>
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
150 <option value="paired_collection">Paired Collection</option>
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
151 <option value="paired_iv">Paired Interleaved</option>
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
152 </param>
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
153 <when value="paired">
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
154 <param name="fastq_input1" type="data" format="fastqsanger" label="Select first set of reads" help="Specify dataset with forward reads"/>
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
155 <param name="fastq_input2" type="data" format="fastqsanger" label="Select second set of reads" help="Specify dataset with reverse reads"/>
7
d8c9597bfb09 planemo upload for repository https://github.com/galaxyproject/tools-devteam/tree/master/tools/bwa commit ddb8bdb9d62399f086b06b3469450d0aad2113bd
devteam
parents: 6
diff changeset
156 <param name="iset_stats" type="text" optional="True" label="Enter mean, standard deviation, max, and min for insert lengths." help="-I; This parameter is only used for paired reads. Only mean is required while sd, max, and min will be inferred. Examples: both &quot;250&quot; and &quot;250,25&quot; will work while &quot;250,,10&quot; will not. See below for details.">
0
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
157 <sanitizer invalid_char="">
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
158 <valid initial="string.digits"><add value=","/> </valid>
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
159 </sanitizer>
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
160 </param>
2
e29bc5c169bc Uploaded
devteam
parents: 1
diff changeset
161 </when>
0
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
162 <when value="single">
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
163 <param name="fastq_input1" type="data" format="fastqsanger" label="Select fastq dataset" help="Specify dataset with single reads"/>
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
164 </when>
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
165 <when value="paired_collection">
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
166 <param name="fastq_input1" format="fastqsanger" type="data_collection" collection_type="paired" label="Select a paired collection" help="See help section for an explanation of dataset collections"/>
7
d8c9597bfb09 planemo upload for repository https://github.com/galaxyproject/tools-devteam/tree/master/tools/bwa commit ddb8bdb9d62399f086b06b3469450d0aad2113bd
devteam
parents: 6
diff changeset
167 <param name="iset_stats" type="text" optional="True" label="Enter mean, standard deviation, max, and min for insert lengths." help="-I; This parameter is only used for paired reads. Only mean is required while sd, max, and min will be inferred. Examples: both &quot;250&quot; and &quot;250,25&quot; will work while &quot;250,,10&quot; will not. See below for details.">
0
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
168 <sanitizer invalid_char="">
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
169 <valid initial="string.digits"><add value=","/> </valid>
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
170 </sanitizer>
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
171 </param>
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
172 </when>
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
173 <when value="paired_iv">
2
e29bc5c169bc Uploaded
devteam
parents: 1
diff changeset
174 <param name="fastq_input1" type="data" format="fastqsanger" label="Select fastq dataset" help="Specify dataset with interleaved reads"/>
7
d8c9597bfb09 planemo upload for repository https://github.com/galaxyproject/tools-devteam/tree/master/tools/bwa commit ddb8bdb9d62399f086b06b3469450d0aad2113bd
devteam
parents: 6
diff changeset
175 <param name="iset_stats" type="text" optional="True" label="Enter mean, standard deviation, max, and min for insert lengths." help="-I; This parameter is only used for paired reads. Only mean is required while sd, max, and min will be inferred. Examples: both &quot;250&quot; and &quot;250,25&quot; will work while &quot;250,,10&quot; will not. See below for details.">
0
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
176 <sanitizer invalid_char="">
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
177 <valid initial="string.digits"><add value=","/> </valid>
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
178 </sanitizer>
2
e29bc5c169bc Uploaded
devteam
parents: 1
diff changeset
179 </param>
0
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
180 </when>
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
181 </conditional>
2
e29bc5c169bc Uploaded
devteam
parents: 1
diff changeset
182
5
fbf460831036 planemo upload commit d0e3412c58bd3bdc1a483a1e2f7f9c2aa5c87a1f-dirty
devteam
parents: 4
diff changeset
183 <expand macro="read_group_conditional" />
2
e29bc5c169bc Uploaded
devteam
parents: 1
diff changeset
184
0
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
185 <conditional name="analysis_type">
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
186 <param name="analysis_type_selector" type="select" label="Select analysis mode">
4
ac30bfd3e2a8 planemo upload commit a50a3947aebc8a1d11bac39599f4efd8ed9a3bd5
devteam
parents: 2
diff changeset
187 <option value="illumina">1.Simple Illumina mode</option>
ac30bfd3e2a8 planemo upload commit a50a3947aebc8a1d11bac39599f4efd8ed9a3bd5
devteam
parents: 2
diff changeset
188 <option value="pacbio">2.PacBio mode (-x pacbio)</option>
ac30bfd3e2a8 planemo upload commit a50a3947aebc8a1d11bac39599f4efd8ed9a3bd5
devteam
parents: 2
diff changeset
189 <option value="full">3.Full list of options</option>
0
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
190 </param>
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
191 <when value="illumina">
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
192 <!-- do nothing -->
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
193 </when>
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
194 <when value="pacbio">
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
195 <!-- do nothing. all magic happens within <command> tag -->
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
196 </when>
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
197 <when value="full">
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
198 <conditional name="algorithmic_options">
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
199 <param name="algorithmic_options_selector" type="select" label="Set algorithmic options?" help="Sets -k, -w, -d, -r, -y, -c, -D, -W, -m, -S, -P, and -e options.">
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
200 <option value="set">Set</option>
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
201 <option value="do_not_set" selected="True">Do not set</option>
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
202 </param>
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
203 <when value="set">
2
e29bc5c169bc Uploaded
devteam
parents: 1
diff changeset
204 <param name="k" type="integer" value="19" label="Minimum seed length" help="-k; default=19"/>
e29bc5c169bc Uploaded
devteam
parents: 1
diff changeset
205 <param name="w" type="integer" value="100" label="Band width for banded alignment" help="-w; default=100"/>
e29bc5c169bc Uploaded
devteam
parents: 1
diff changeset
206 <param name="d" type="integer" value="100" label="Off-diagonal X-dropoff" help="-d; default=100"/>
e29bc5c169bc Uploaded
devteam
parents: 1
diff changeset
207 <param name="r" type="float" value="1.5" label="Look for internal seeds inside a seed longer than -k * THIS VALUE" help="-r; default=1.5; This is a key heuristic parameter for tuning the performance. Larger value yields fewer seeds, which leads to faster alignment speed but lower accuracy" />
e29bc5c169bc Uploaded
devteam
parents: 1
diff changeset
208 <param name="y" type="integer" value="20" label="Seed occurrence for the 3rd round seeding" help="-y; default=20" />
e29bc5c169bc Uploaded
devteam
parents: 1
diff changeset
209 <param name="c" type="integer" value="500" label="Skip seeds with more than that many occurrences" help="-c; default=500"/>
e29bc5c169bc Uploaded
devteam
parents: 1
diff changeset
210 <param name="D" type="float" value="0.5" label="Drop chains shorter than this fraction of the longest overlapping chain" help="-D; default=0.5"/>
e29bc5c169bc Uploaded
devteam
parents: 1
diff changeset
211 <param name="W" type="integer" value="0" label="Discard a chain if seeded bases shorter than THIS VALUE" help="-W; default=0"/>
e29bc5c169bc Uploaded
devteam
parents: 1
diff changeset
212 <param name="m" type="integer" value="50" label="Perform at most this many rounds of mate rescues for each read" help="-m; default=50"/>
e29bc5c169bc Uploaded
devteam
parents: 1
diff changeset
213 <param name="S" type="boolean" truevalue="-S" falsevalue="" label="Skip mate rescue" help="-S"/>
e29bc5c169bc Uploaded
devteam
parents: 1
diff changeset
214 <param name="P" type="boolean" truevalue="-P" falsevalue="" label="Skip pairing; mate rescue performed unless -S also in use" help="-P"/>
e29bc5c169bc Uploaded
devteam
parents: 1
diff changeset
215 <param name="e" type="boolean" truevalue="-e" falsevalue="" label="Discard full-length exact matches" help="-e"/>
0
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
216 </when>
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
217 <when value="do_not_set">
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
218 <!-- do nothing -->
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
219 </when>
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
220 </conditional>
2
e29bc5c169bc Uploaded
devteam
parents: 1
diff changeset
221
0
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
222 <conditional name="scoring_options">
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
223 <param name="scoring_options_selector" type="select" label="Set scoring options?" help="Sets -A, -B, -O, -E, -L, and -U options.">
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
224 <option value="set">Set</option>
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
225 <option value="do_not_set" selected="True">Do not set</option>
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
226 </param>
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
227 <when value="set">
2
e29bc5c169bc Uploaded
devteam
parents: 1
diff changeset
228 <param name="A" type="integer" value="1" label="Score for a sequence match" help="-A; scales options -T, -d, -B, -O, -E, -L, and -U unless overridden; default=1"/>
e29bc5c169bc Uploaded
devteam
parents: 1
diff changeset
229 <param name="B" type="integer" value="4" label="Penalty for a mismatch" help="-B; default=4"/>
e29bc5c169bc Uploaded
devteam
parents: 1
diff changeset
230 <param name="O" type="text" value="6,6" label="Gap open penalties for deletions and insertions" help="-O; default=6,6">
0
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
231 <sanitizer invalid_char="">
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
232 <valid initial="string.digits"><add value=","/> </valid>
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
233 </sanitizer>
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
234 </param>
2
e29bc5c169bc Uploaded
devteam
parents: 1
diff changeset
235 <param name="E" type="text" value="1,1" label="Gap extension penalties; a gap of size k cost &#39;-O + -E*k&#39;. If two numbers are specified, the first is the penalty of extending a deletion and the second for extending an insertion" help="-E; default=1,1">
0
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
236 <sanitizer invalid_char="">
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
237 <valid initial="string.digits"><add value=","/> </valid>
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
238 </sanitizer>
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
239 </param>
2
e29bc5c169bc Uploaded
devteam
parents: 1
diff changeset
240 <param name="L" type="text" value="5,5" label="Penalties for 5&#39;-end and 3&#39;-end clipping" help="-L; default=5,5; When performing Smith-Waterman extension, BWA-MEM keeps track of the best score reaching the end of query. If this score is larger than the best Smith-Waterman score minus the clipping penalty, clipping will not be applied. Note that in this case, the SAM AS tag reports the best Smith-Waterman score; clipping penalty is not deducted">
0
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
241 <sanitizer invalid_char="">
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
242 <valid initial="string.digits"><add value=","/> </valid>
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
243 </sanitizer>
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
244 </param>
2
e29bc5c169bc Uploaded
devteam
parents: 1
diff changeset
245 <param name="U" type="integer" value="17" label="Penalty for an unpaired read pair" help="-U; default=17"/>
0
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
246 </when>
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
247 <when value="do_not_set">
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
248 <!-- do nothing -->
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
249 </when>
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
250 </conditional>
2
e29bc5c169bc Uploaded
devteam
parents: 1
diff changeset
251
0
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
252 <conditional name="io_options">
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
253 <param name="io_options_selector" type="select" label="Set input/output options" help="Sets -T, -h, -a, -C, -V, -Y, and -M options.">
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
254 <option value="set">Set</option>
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
255 <option value="do_not_set" selected="True">Do not set</option>
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
256 </param>
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
257 <when value="set">
2
e29bc5c169bc Uploaded
devteam
parents: 1
diff changeset
258 <param name="T" type="integer" value="30" label="Minimum score to output" help="-T; default=30"/>
e29bc5c169bc Uploaded
devteam
parents: 1
diff changeset
259 <param name="h" type="integer" value="5" label="If there are less than THIS VALUE hits with score &gt;80% of the max score, output them all in the XA tag" help="-h; default=5" />
e29bc5c169bc Uploaded
devteam
parents: 1
diff changeset
260 <param name="a" type="boolean" truevalue="-a" falsevalue="" label="Output all alignments for single-ends or unpaired paired-ends" help="-a; These alignments will be flagged as secondary alignments"/>
e29bc5c169bc Uploaded
devteam
parents: 1
diff changeset
261 <param name="C" type="boolean" truevalue="-C" falsevalue="" label="Append FASTA/FASTQ comment to BAM output" help="-C"/>
e29bc5c169bc Uploaded
devteam
parents: 1
diff changeset
262 <param name="V" type="boolean" truevalue="-V" falsevalue="" label="Output the reference FASTA header in the XR tag" help="-V"/>
e29bc5c169bc Uploaded
devteam
parents: 1
diff changeset
263 <param name="Y" type="boolean" truevalue="-Y" falsevalue="" label="Use soft clipping for supplementary alignments" help="-Y; By default, BWA-MEM uses soft clipping for the primary alignment and hard clipping for supplementary alignments" />
e29bc5c169bc Uploaded
devteam
parents: 1
diff changeset
264 <param name="M" type="boolean" truevalue="-M" falsevalue="" label="Mark shorter split hits of a chimeric alignment in the FLAG field as 'secondary alignment' instead of 'supplementary alignment'" help="-M; For Picard&lt;1.96 compatibility" />
0
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
265 </when>
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
266 <when value="do_not_set">
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
267 <!-- do nothing -->
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
268 </when>
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
269 </conditional>
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
270 </when>
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
271 </conditional>
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
272 </inputs>
2
e29bc5c169bc Uploaded
devteam
parents: 1
diff changeset
273
0
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
274 <outputs>
6
09a7281d24c5 planemo upload commit 00a7926c285bc4a339bd7deebf40b28f39c7d947-dirty
devteam
parents: 5
diff changeset
275 <data format="bam" name="bam_output" label="${tool.name} on ${on_string} (mapped reads in BAM format)">
09a7281d24c5 planemo upload commit 00a7926c285bc4a339bd7deebf40b28f39c7d947-dirty
devteam
parents: 5
diff changeset
276 <expand macro="dbKeyActionsBwaMem" />
09a7281d24c5 planemo upload commit 00a7926c285bc4a339bd7deebf40b28f39c7d947-dirty
devteam
parents: 5
diff changeset
277 </data>
0
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
278 </outputs>
2
e29bc5c169bc Uploaded
devteam
parents: 1
diff changeset
279
0
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
280 <tests>
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
281 <test>
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
282 <param name="reference_source_selector" value="history" />
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
283 <param name="ref_file" ftype="fasta" value="bwa-mem-mt-genome.fa"/>
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
284 <param name="fastq_input_selector" value="paired"/>
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
285 <param name="fastq_input1" ftype="fastqsanger" value="bwa-mem-fastq1.fq"/>
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
286 <param name="fastq_input2" ftype="fastqsanger" value="bwa-mem-fastq2.fq"/>
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
287 <param name="analysis_type_selector" value="illumina"/>
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
288 <output name="bam_output" ftype="bam" file="bwa-mem-test1.bam" lines_diff="2" />
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
289 </test>
2
e29bc5c169bc Uploaded
devteam
parents: 1
diff changeset
290 <test>
e29bc5c169bc Uploaded
devteam
parents: 1
diff changeset
291 <param name="reference_source_selector" value="history" />
e29bc5c169bc Uploaded
devteam
parents: 1
diff changeset
292 <param name="ref_file" ftype="fasta" value="bwa-mem-mt-genome.fa"/>
e29bc5c169bc Uploaded
devteam
parents: 1
diff changeset
293 <param name="fastq_input_selector" value="paired"/>
e29bc5c169bc Uploaded
devteam
parents: 1
diff changeset
294 <param name="fastq_input1" ftype="fastqsanger" value="bwa-mem-fastq1.fq"/>
e29bc5c169bc Uploaded
devteam
parents: 1
diff changeset
295 <param name="fastq_input2" ftype="fastqsanger" value="bwa-mem-fastq2.fq"/>
e29bc5c169bc Uploaded
devteam
parents: 1
diff changeset
296 <param name="rg_selector" value="set"/>
e29bc5c169bc Uploaded
devteam
parents: 1
diff changeset
297 <param name="ID" value="rg1"/>
4
ac30bfd3e2a8 planemo upload commit a50a3947aebc8a1d11bac39599f4efd8ed9a3bd5
devteam
parents: 2
diff changeset
298 <param name="PL" value="CAPILLARY"/>
ac30bfd3e2a8 planemo upload commit a50a3947aebc8a1d11bac39599f4efd8ed9a3bd5
devteam
parents: 2
diff changeset
299 <param name="LB" value="AARDVARK-1" />
2
e29bc5c169bc Uploaded
devteam
parents: 1
diff changeset
300 <param name="analysis_type_selector" value="illumina"/>
e29bc5c169bc Uploaded
devteam
parents: 1
diff changeset
301 <output name="bam_output" ftype="bam" file="bwa-mem-test2.bam" lines_diff="2" />
e29bc5c169bc Uploaded
devteam
parents: 1
diff changeset
302 </test>
0
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
303 </tests>
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
304 <help>
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
305 **What it does**
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
306
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
307 From http://arxiv.org/abs/1303.3997:
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
308
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
309 BWA-MEM is a new alignment algorithm for aligning sequence reads or long query sequences against a large reference genome such as human.
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
310 It automatically chooses between local and end-to-end alignments, supports paired-end reads and performs chimeric alignment.
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
311 The algorithm is robust to sequencing errors and applicable to a wide range of sequence lengths from 70bp to a few megabases.
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
312 For mapping 100bp sequences, BWA-MEM shows better performance than several state-of-art read aligners to date.
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
313
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
314 It is best suited for mapping long (>70 nt) reads against large reference genomes.
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
315
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
316 This Galaxy tool wraps the bwa-mem module of the bwa read mapping tool. The Galaxy implementation takes fastq files as input and produces output in BAM (not SAM) format, which can be further processed using various BAM utilities existing in Galaxy (BAMTools, SAMTools, Picard).
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
317
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
318 -----
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
319
4
ac30bfd3e2a8 planemo upload commit a50a3947aebc8a1d11bac39599f4efd8ed9a3bd5
devteam
parents: 2
diff changeset
320 **Indices: Selecting reference genomes for BWA**
ac30bfd3e2a8 planemo upload commit a50a3947aebc8a1d11bac39599f4efd8ed9a3bd5
devteam
parents: 2
diff changeset
321
ac30bfd3e2a8 planemo upload commit a50a3947aebc8a1d11bac39599f4efd8ed9a3bd5
devteam
parents: 2
diff changeset
322 The Galaxy wrapper for BWA allows you to select between precomputed and user-defined indices for reference genomes using the **Will you select a reference genome from your history or use a built-in index?** flag. This flag has two options:
ac30bfd3e2a8 planemo upload commit a50a3947aebc8a1d11bac39599f4efd8ed9a3bd5
devteam
parents: 2
diff changeset
323
ac30bfd3e2a8 planemo upload commit a50a3947aebc8a1d11bac39599f4efd8ed9a3bd5
devteam
parents: 2
diff changeset
324 1. **Use a built-in genome index** - when selected (this is default), Galaxy provides the user with **Select reference genome index** dropdown. Genomes listed in this dropdown have been pre-indexed with bwa index utility and are ready to be mapped against.
ac30bfd3e2a8 planemo upload commit a50a3947aebc8a1d11bac39599f4efd8ed9a3bd5
devteam
parents: 2
diff changeset
325 2. **Use a genome from the history and build index** - when selected, Galaxy provides the user with **Select reference genome sequence** dropdown. This dropdown is populated by all FASTA formatted files listed in your current history. If your genome of interest is uploaded into history it will be shown there. Selecting a genome from this dropdown will cause Galaxy to first transparently index it using `bwa index` command, and then run mapping with `bwa mem`.
ac30bfd3e2a8 planemo upload commit a50a3947aebc8a1d11bac39599f4efd8ed9a3bd5
devteam
parents: 2
diff changeset
326
ac30bfd3e2a8 planemo upload commit a50a3947aebc8a1d11bac39599f4efd8ed9a3bd5
devteam
parents: 2
diff changeset
327 If your genome of interest is not listed here you have two choices:
ac30bfd3e2a8 planemo upload commit a50a3947aebc8a1d11bac39599f4efd8ed9a3bd5
devteam
parents: 2
diff changeset
328
ac30bfd3e2a8 planemo upload commit a50a3947aebc8a1d11bac39599f4efd8ed9a3bd5
devteam
parents: 2
diff changeset
329 1. Contact galaxy team using **Help->Support** link at the top of the interface and let us know that an index needs to be added
ac30bfd3e2a8 planemo upload commit a50a3947aebc8a1d11bac39599f4efd8ed9a3bd5
devteam
parents: 2
diff changeset
330 2. Upload your genome of interest as a FASTA file to Galaxy history and select the **Use a genome from the history and build index** option.
ac30bfd3e2a8 planemo upload commit a50a3947aebc8a1d11bac39599f4efd8ed9a3bd5
devteam
parents: 2
diff changeset
331
ac30bfd3e2a8 planemo upload commit a50a3947aebc8a1d11bac39599f4efd8ed9a3bd5
devteam
parents: 2
diff changeset
332 -----
ac30bfd3e2a8 planemo upload commit a50a3947aebc8a1d11bac39599f4efd8ed9a3bd5
devteam
parents: 2
diff changeset
333
0
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
334 **Galaxy-specific option**
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
335
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
336 Galaxy allows three levels of control over bwa-mem options provided by the **Select analysis mode** menu option. These are:
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
337
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
338 1. *Simple Illumina mode*: The simplest possible bwa mem application in which it aligns single or paired-end data to reference using default parameters. It is equivalent to the following command: bwa mem &lt;reference index&gt; &lt;fastq dataset1&gt; [fastq dataset2]
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
339 2. *PacBio mode*: The mode adjusted specifically for mapping of long PacBio subreads. Equivalent to the following command: bwa mem -k17 -W40 -r10 -A1 -B1 -O1 -E1 -L0 &lt;reference index&gt; &lt;PacBio dataset in fastq format&gt;
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
340 3. *Full list of options*: Allows access to all options through Galaxy interface.
2
e29bc5c169bc Uploaded
devteam
parents: 1
diff changeset
341
0
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
342 ------
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
343
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
344 **BWA MEM options**
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
345
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
346 Each Galaxy parameter widget corresponds to command line flags listed below:
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
347
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
348 Algorithm options::
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
349
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
350 -k INT minimum seed length [19]
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
351 -w INT band width for banded alignment [100]
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
352 -d INT off-diagonal X-dropoff [100]
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
353 -r FLOAT look for internal seeds inside a seed longer than {-k} * FLOAT [1.5]
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
354 -y INT find MEMs longer than {-k} * {-r} with size less than INT [0]
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
355 -c INT skip seeds with more than INT occurrences [500]
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
356 -D FLOAT drop chains shorter than FLOAT fraction of the longest overlapping chain [0.50]
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
357 -W INT discard a chain if seeded bases shorter than INT [0]
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
358 -m INT perform at most INT rounds of mate rescues for each read [50]
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
359 -S skip mate rescue
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
360 -P skip pairing; mate rescue performed unless -S also in use
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
361 -e discard full-length exact matches
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
362
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
363 Scoring options::
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
364
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
365 -A INT score for a sequence match, which scales options -TdBOELU unless overridden [1]
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
366 -B INT penalty for a mismatch [4]
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
367 -O INT[,INT] gap open penalties for deletions and insertions [6,6]
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
368 -E INT[,INT] gap extension penalty; a gap of size k cost '{-O} + {-E}*k' [1,1]
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
369 -L INT[,INT] penalty for 5'- and 3'-end clipping [5,5]
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
370 -U INT penalty for an unpaired read pair [17]
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
371
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
372 Input/output options::
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
373
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
374 -p first query file consists of interleaved paired-end sequences
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
375 -R STR read group header line such as '@RG\tID:foo\tSM:bar' [null]
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
376
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
377 -v INT verbose level: 1=error, 2=warning, 3=message, 4+=debugging [3]
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
378 -T INT minimum score to output [30]
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
379 -h INT if there are &lt;INT hits with score &gt;80% of the max score, output all in XA [5]
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
380 -a output all alignments for SE or unpaired PE
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
381 -C append FASTA/FASTQ comment to SAM output
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
382 -V output the reference FASTA header in the XR tag
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
383 -Y use soft clipping for supplementary alignments
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
384 -M mark shorter split hits as secondary
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
385
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
386 -I FLOAT[,FLOAT[,INT[,INT]]]
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
387 specify the mean, standard deviation (10% of the mean if absent), max
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
388 (4 sigma from the mean if absent) and min of the insert size distribution.
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
389 FR orientation only. [inferred]
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
390
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
391 @dataset_collections@
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
392
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
393 @RG@
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
394
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
395 @info@
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
396 </help>
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
397 <citations>
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
398 <citation type="doi">10.1093/bioinformatics/btp324</citation>
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
399 <citation type="doi">10.1093/bioinformatics/btp698</citation>
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
400 <citation type="bibtex">@misc{1303.3997,
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
401 Author = {Heng Li},
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
402 Title = {Aligning sequence reads, clone sequences and assembly contigs with BWA-MEM},
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
403 Year = {2013},
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
404 Eprint = {arXiv:1303.3997},
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
405 url = {http://arxiv.org/abs/1303.3997},
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
406 }</citation>
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
407 </citations>
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
408 </tool>