annotate bwa-mem.xml @ 4:ac30bfd3e2a8 draft

planemo upload commit a50a3947aebc8a1d11bac39599f4efd8ed9a3bd5
author devteam
date Thu, 18 Jun 2015 17:35:40 -0400
parents e29bc5c169bc
children fbf460831036
Ignore whitespace changes - Everywhere: Within whitespace: At end of lines:
rev   line source
0
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
1 <?xml version="1.0"?>
4
ac30bfd3e2a8 planemo upload commit a50a3947aebc8a1d11bac39599f4efd8ed9a3bd5
devteam
parents: 2
diff changeset
2 <tool id="bwa_mem" name="Map with BWA-MEM" version="0.2.2">
2
e29bc5c169bc Uploaded
devteam
parents: 1
diff changeset
3 <description>- map medium and long reads (&gt; 100 bp) against reference genome</description>
0
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
4 <macros>
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
5 <import>bwa_macros.xml</import>
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
6 </macros>
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
7 <requirements>
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
8 <requirement type="package" version="0.7.10.039ea20639">bwa</requirement>
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
9 <requirement type="package" version="1.1">samtools</requirement>
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
10 </requirements>
2
e29bc5c169bc Uploaded
devteam
parents: 1
diff changeset
11 <stdio>
e29bc5c169bc Uploaded
devteam
parents: 1
diff changeset
12 <exit_code range="1:" />
e29bc5c169bc Uploaded
devteam
parents: 1
diff changeset
13 </stdio>
0
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
14 <command>
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
15 #set $reference_fasta_filename = "localref.fa"
2
e29bc5c169bc Uploaded
devteam
parents: 1
diff changeset
16
0
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
17 #if str( $reference_source.reference_source_selector ) == "history":
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
18 ln -s "${reference_source.ref_file}" "${reference_fasta_filename}" &amp;&amp;
2
e29bc5c169bc Uploaded
devteam
parents: 1
diff changeset
19
0
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
20 ## The following shell commands decide which of the BWA indexing algorithms (IS or BWTSW) will be run
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
21 ## depending on the size of the input FASTA dataset
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
22 (
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
23 size=`stat -c %s "${reference_fasta_filename}" 2&gt;/dev/null`; ## Linux
2
e29bc5c169bc Uploaded
devteam
parents: 1
diff changeset
24 if [ $? -eq 0 ];
0
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
25 then
2
e29bc5c169bc Uploaded
devteam
parents: 1
diff changeset
26 if [ "\$size" -lt 2000000000 ];
0
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
27 then
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
28 bwa index -a is "${reference_fasta_filename}";
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
29 echo "Generating BWA index with is algorithm";
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
30 else
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
31 bwa index -a bwtsw "${reference_fasta_filename}";
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
32 echo "Generating BWA index with bwtsw algorithm";
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
33 fi;
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
34 fi;
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
35
2
e29bc5c169bc Uploaded
devteam
parents: 1
diff changeset
36 eval \$(stat -s "${reference_fasta_filename}" 2&gt;/dev/null); ## OSX
e29bc5c169bc Uploaded
devteam
parents: 1
diff changeset
37 if [ -n "\$st_size" ];
0
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
38 then
2
e29bc5c169bc Uploaded
devteam
parents: 1
diff changeset
39 if [ "\$st_size" -lt 2000000000 ];
0
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
40 then
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
41 bwa index -a is "${reference_fasta_filename}";
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
42 echo "Generating BWA index with is algorithm";
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
43 else
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
44 bwa index -a bwtsw "${reference_fasta_filename}";
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
45 echo "Generating BWA index with bwtsw algorithm";
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
46 fi;
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
47 fi;
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
48 ) &amp;&amp;
2
e29bc5c169bc Uploaded
devteam
parents: 1
diff changeset
49
0
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
50 #else:
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
51 #set $reference_fasta_filename = str( $reference_source.ref_file.fields.path )
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
52 #end if
2
e29bc5c169bc Uploaded
devteam
parents: 1
diff changeset
53
0
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
54 ## Begin BWA-MEM command line
2
e29bc5c169bc Uploaded
devteam
parents: 1
diff changeset
55
0
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
56 bwa mem
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
57 -t "\${GALAXY_SLOTS:-1}"
2
e29bc5c169bc Uploaded
devteam
parents: 1
diff changeset
58 -v 1 ## Verbosity is set to 1 (errors only)
e29bc5c169bc Uploaded
devteam
parents: 1
diff changeset
59
0
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
60 #if str( $fastq_input.fastq_input_selector ) == "paired_iv": ## For interleaved fastq files set -p option
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
61 -p
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
62 #if str( $fastq_input.iset_stats ): ## check that insert statistics is used
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
63 -I "${fastq_input.iset_stats}"
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
64 #end if
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
65 #end if
2
e29bc5c169bc Uploaded
devteam
parents: 1
diff changeset
66
0
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
67 #if str( $analysis_type.analysis_type_selector ) == "pacbio":
2
e29bc5c169bc Uploaded
devteam
parents: 1
diff changeset
68 -x pacbio
0
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
69 #elif str( $analysis_type.analysis_type_selector ) == "full":
2
e29bc5c169bc Uploaded
devteam
parents: 1
diff changeset
70 #if str( $analysis_type.algorithmic_options.algorithmic_options_selector ) == "set": ## Algorithmic options
0
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
71 -k "${analysis_type.algorithmic_options.k}"
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
72 -w "${analysis_type.algorithmic_options.w}"
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
73 -d "${analysis_type.algorithmic_options.d}"
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
74 -r "${analysis_type.algorithmic_options.r}"
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
75 -y "${analysis_type.algorithmic_options.y}"
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
76 -c "${analysis_type.algorithmic_options.c}"
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
77 -D "${analysis_type.algorithmic_options.D}"
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
78 -W "${analysis_type.algorithmic_options.W}"
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
79 -m "${analysis_type.algorithmic_options.m}"
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
80 ${analysis_type.algorithmic_options.S}
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
81 ${analysis_type.algorithmic_options.P}
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
82 ${analysis_type.algorithmic_options.e}
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
83 #end if
2
e29bc5c169bc Uploaded
devteam
parents: 1
diff changeset
84
e29bc5c169bc Uploaded
devteam
parents: 1
diff changeset
85 #if str( $analysis_type.scoring_options.scoring_options_selector ) == "set": ## Scoring options
0
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
86 -A "${analysis_type.scoring_options.A}"
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
87 -B "${analysis_type.scoring_options.B}"
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
88 -O "${analysis_type.scoring_options.O}"
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
89 -E "${analysis_type.scoring_options.E}"
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
90 -L "${analysis_type.scoring_options.L}"
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
91 -U "${analysis_type.scoring_options.U}"
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
92 #end if
2
e29bc5c169bc Uploaded
devteam
parents: 1
diff changeset
93
e29bc5c169bc Uploaded
devteam
parents: 1
diff changeset
94 #if str( $analysis_type.io_options.io_options_selector ) == "set": ## IO options
0
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
95 -T "${analysis_type.io_options.T}"
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
96 -h "${analysis_type.io_options.h}"
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
97 ${analysis_type.io_options.a}
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
98 ${analysis_type.io_options.C}
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
99 ${analysis_type.io_options.V}
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
100 ${analysis_type.io_options.Y}
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
101 ${analysis_type.io_options.M}
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
102 #end if
2
e29bc5c169bc Uploaded
devteam
parents: 1
diff changeset
103
0
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
104 #end if
2
e29bc5c169bc Uploaded
devteam
parents: 1
diff changeset
105
e29bc5c169bc Uploaded
devteam
parents: 1
diff changeset
106 #if str( $rg.rg_selector ) == "set":
e29bc5c169bc Uploaded
devteam
parents: 1
diff changeset
107 @set_rg_string@
e29bc5c169bc Uploaded
devteam
parents: 1
diff changeset
108 -R '$rg_string'
e29bc5c169bc Uploaded
devteam
parents: 1
diff changeset
109 #end if
e29bc5c169bc Uploaded
devteam
parents: 1
diff changeset
110
0
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
111 #if str( $fastq_input.fastq_input_selector ) == "paired":
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
112 #if str( $fastq_input.iset_stats ): ## check that insert statistics is used
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
113 -I "${fastq_input.iset_stats}"
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
114 #end if
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
115
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
116 "${reference_fasta_filename}"
2
e29bc5c169bc Uploaded
devteam
parents: 1
diff changeset
117 "${fastq_input.fastq_input1}" "${fastq_input.fastq_input2}"
e29bc5c169bc Uploaded
devteam
parents: 1
diff changeset
118 #elif str( $fastq_input.fastq_input_selector ) == "paired_collection":
e29bc5c169bc Uploaded
devteam
parents: 1
diff changeset
119 #if str( $fastq_input.iset_stats ): ## check that insert statistics is used
e29bc5c169bc Uploaded
devteam
parents: 1
diff changeset
120 -I "${fastq_input.iset_stats}"
e29bc5c169bc Uploaded
devteam
parents: 1
diff changeset
121 #end if
e29bc5c169bc Uploaded
devteam
parents: 1
diff changeset
122
0
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
123 "${reference_fasta_filename}"
2
e29bc5c169bc Uploaded
devteam
parents: 1
diff changeset
124 "${fastq_input.fastq_input1.forward}" "${fastq_input.fastq_input1.reverse}"
e29bc5c169bc Uploaded
devteam
parents: 1
diff changeset
125 #else:
e29bc5c169bc Uploaded
devteam
parents: 1
diff changeset
126 "${reference_fasta_filename}"
0
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
127 "${fastq_input.fastq_input1}"
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
128 #end if
2
e29bc5c169bc Uploaded
devteam
parents: 1
diff changeset
129
0
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
130 | samtools view -Sb - > temporary_bam_file.bam &amp;&amp;
2
e29bc5c169bc Uploaded
devteam
parents: 1
diff changeset
131
0
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
132 samtools sort -f temporary_bam_file.bam ${bam_output}
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
133 </command>
2
e29bc5c169bc Uploaded
devteam
parents: 1
diff changeset
134
0
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
135 <inputs>
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
136
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
137 <conditional name="reference_source">
4
ac30bfd3e2a8 planemo upload commit a50a3947aebc8a1d11bac39599f4efd8ed9a3bd5
devteam
parents: 2
diff changeset
138 <param name="reference_source_selector" type="select" label="Will you select a reference genome from your history or use a built-in index?" help="Built-ins were indexed using default options. See `Indexes` section of help below">
ac30bfd3e2a8 planemo upload commit a50a3947aebc8a1d11bac39599f4efd8ed9a3bd5
devteam
parents: 2
diff changeset
139 <option value="cached">Use a built-in genome index</option>
ac30bfd3e2a8 planemo upload commit a50a3947aebc8a1d11bac39599f4efd8ed9a3bd5
devteam
parents: 2
diff changeset
140 <option value="history">Use a genome from history and build index</option>
0
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
141 </param>
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
142 <when value="cached">
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
143 <param name="ref_file" type="select" label="Using reference genome" help="Select genome from the list">
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
144 <options from_data_table="bwa_mem_indexes">
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
145 <filter type="sort_by" column="2" />
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
146 <validator type="no_options" message="No indexes are available" />
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
147 </options>
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
148 <validator type="no_options" message="A built-in reference genome is not available for the build associated with the selected input file"/>
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
149 </param>
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
150 </when>
2
e29bc5c169bc Uploaded
devteam
parents: 1
diff changeset
151 <when value="history">
0
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
152 <param name="ref_file" type="data" format="fasta" label="Use the following dataset as the reference sequence" help="You can upload a FASTA sequence to the history and use it as reference" />
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
153 </when>
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
154 </conditional>
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
155 <conditional name="fastq_input">
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
156 <param name="fastq_input_selector" type="select" label="Single or Paired-end reads" help="Select between paired and single end data">
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
157 <option value="paired">Paired</option>
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
158 <option value="single">Single</option>
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
159 <option value="paired_collection">Paired Collection</option>
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
160 <option value="paired_iv">Paired Interleaved</option>
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
161 </param>
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
162 <when value="paired">
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
163 <param name="fastq_input1" type="data" format="fastqsanger" label="Select first set of reads" help="Specify dataset with forward reads"/>
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
164 <param name="fastq_input2" type="data" format="fastqsanger" label="Select second set of reads" help="Specify dataset with reverse reads"/>
4
ac30bfd3e2a8 planemo upload commit a50a3947aebc8a1d11bac39599f4efd8ed9a3bd5
devteam
parents: 2
diff changeset
165 <param name="iset_stats" type="text" optional="True" size="10" label="Enter mean, standard deviation, max, and min for insert lengths." help="-I; This parameter is only used for paired reads. Only mean is required while sd, max, and min will be inferred. Examples: both &quot;250&quot; and &quot;250,25&quot; will work while &quot;250,,10&quot; will not. See below for details.">
0
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
166 <sanitizer invalid_char="">
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
167 <valid initial="string.digits"><add value=","/> </valid>
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
168 </sanitizer>
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
169 </param>
2
e29bc5c169bc Uploaded
devteam
parents: 1
diff changeset
170 </when>
0
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
171 <when value="single">
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
172 <param name="fastq_input1" type="data" format="fastqsanger" label="Select fastq dataset" help="Specify dataset with single reads"/>
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
173 </when>
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
174 <when value="paired_collection">
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
175 <param name="fastq_input1" format="fastqsanger" type="data_collection" collection_type="paired" label="Select a paired collection" help="See help section for an explanation of dataset collections"/>
4
ac30bfd3e2a8 planemo upload commit a50a3947aebc8a1d11bac39599f4efd8ed9a3bd5
devteam
parents: 2
diff changeset
176 <param name="iset_stats" type="text" optional="True" size="10" label="Enter mean, standard deviation, max, and min for insert lengths." help="-I; This parameter is only used for paired reads. Only mean is required while sd, max, and min will be inferred. Examples: both &quot;250&quot; and &quot;250,25&quot; will work while &quot;250,,10&quot; will not. See below for details.">
0
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
177 <sanitizer invalid_char="">
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
178 <valid initial="string.digits"><add value=","/> </valid>
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
179 </sanitizer>
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
180 </param>
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
181 </when>
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
182 <when value="paired_iv">
2
e29bc5c169bc Uploaded
devteam
parents: 1
diff changeset
183 <param name="fastq_input1" type="data" format="fastqsanger" label="Select fastq dataset" help="Specify dataset with interleaved reads"/>
4
ac30bfd3e2a8 planemo upload commit a50a3947aebc8a1d11bac39599f4efd8ed9a3bd5
devteam
parents: 2
diff changeset
184 <param name="iset_stats" type="text" optional="True" size="10" label="Enter mean, standard deviation, max, and min for insert lengths." help="-I; This parameter is only used for paired reads. Only mean is required while sd, max, and min will be inferred. Examples: both &quot;250&quot; and &quot;250,25&quot; will work while &quot;250,,10&quot; will not. See below for details.">
0
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
185 <sanitizer invalid_char="">
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
186 <valid initial="string.digits"><add value=","/> </valid>
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
187 </sanitizer>
2
e29bc5c169bc Uploaded
devteam
parents: 1
diff changeset
188 </param>
0
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
189 </when>
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
190 </conditional>
2
e29bc5c169bc Uploaded
devteam
parents: 1
diff changeset
191
e29bc5c169bc Uploaded
devteam
parents: 1
diff changeset
192 <expand macro="readgroup_params" />
e29bc5c169bc Uploaded
devteam
parents: 1
diff changeset
193
0
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
194 <conditional name="analysis_type">
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
195 <param name="analysis_type_selector" type="select" label="Select analysis mode">
4
ac30bfd3e2a8 planemo upload commit a50a3947aebc8a1d11bac39599f4efd8ed9a3bd5
devteam
parents: 2
diff changeset
196 <option value="illumina">1.Simple Illumina mode</option>
ac30bfd3e2a8 planemo upload commit a50a3947aebc8a1d11bac39599f4efd8ed9a3bd5
devteam
parents: 2
diff changeset
197 <option value="pacbio">2.PacBio mode (-x pacbio)</option>
ac30bfd3e2a8 planemo upload commit a50a3947aebc8a1d11bac39599f4efd8ed9a3bd5
devteam
parents: 2
diff changeset
198 <option value="full">3.Full list of options</option>
0
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
199 </param>
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
200 <when value="illumina">
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
201 <!-- do nothing -->
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
202 </when>
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
203 <when value="pacbio">
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
204 <!-- do nothing. all magic happens within <command> tag -->
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
205 </when>
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
206 <when value="full">
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
207 <conditional name="algorithmic_options">
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
208 <param name="algorithmic_options_selector" type="select" label="Set algorithmic options?" help="Sets -k, -w, -d, -r, -y, -c, -D, -W, -m, -S, -P, and -e options.">
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
209 <option value="set">Set</option>
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
210 <option value="do_not_set" selected="True">Do not set</option>
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
211 </param>
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
212 <when value="set">
2
e29bc5c169bc Uploaded
devteam
parents: 1
diff changeset
213 <param name="k" type="integer" value="19" label="Minimum seed length" help="-k; default=19"/>
e29bc5c169bc Uploaded
devteam
parents: 1
diff changeset
214 <param name="w" type="integer" value="100" label="Band width for banded alignment" help="-w; default=100"/>
e29bc5c169bc Uploaded
devteam
parents: 1
diff changeset
215 <param name="d" type="integer" value="100" label="Off-diagonal X-dropoff" help="-d; default=100"/>
e29bc5c169bc Uploaded
devteam
parents: 1
diff changeset
216 <param name="r" type="float" value="1.5" label="Look for internal seeds inside a seed longer than -k * THIS VALUE" help="-r; default=1.5; This is a key heuristic parameter for tuning the performance. Larger value yields fewer seeds, which leads to faster alignment speed but lower accuracy" />
e29bc5c169bc Uploaded
devteam
parents: 1
diff changeset
217 <param name="y" type="integer" value="20" label="Seed occurrence for the 3rd round seeding" help="-y; default=20" />
e29bc5c169bc Uploaded
devteam
parents: 1
diff changeset
218 <param name="c" type="integer" value="500" label="Skip seeds with more than that many occurrences" help="-c; default=500"/>
e29bc5c169bc Uploaded
devteam
parents: 1
diff changeset
219 <param name="D" type="float" value="0.5" label="Drop chains shorter than this fraction of the longest overlapping chain" help="-D; default=0.5"/>
e29bc5c169bc Uploaded
devteam
parents: 1
diff changeset
220 <param name="W" type="integer" value="0" label="Discard a chain if seeded bases shorter than THIS VALUE" help="-W; default=0"/>
e29bc5c169bc Uploaded
devteam
parents: 1
diff changeset
221 <param name="m" type="integer" value="50" label="Perform at most this many rounds of mate rescues for each read" help="-m; default=50"/>
e29bc5c169bc Uploaded
devteam
parents: 1
diff changeset
222 <param name="S" type="boolean" truevalue="-S" falsevalue="" label="Skip mate rescue" help="-S"/>
e29bc5c169bc Uploaded
devteam
parents: 1
diff changeset
223 <param name="P" type="boolean" truevalue="-P" falsevalue="" label="Skip pairing; mate rescue performed unless -S also in use" help="-P"/>
e29bc5c169bc Uploaded
devteam
parents: 1
diff changeset
224 <param name="e" type="boolean" truevalue="-e" falsevalue="" label="Discard full-length exact matches" help="-e"/>
0
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
225 </when>
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
226 <when value="do_not_set">
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
227 <!-- do nothing -->
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
228 </when>
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
229 </conditional>
2
e29bc5c169bc Uploaded
devteam
parents: 1
diff changeset
230
0
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
231 <conditional name="scoring_options">
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
232 <param name="scoring_options_selector" type="select" label="Set scoring options?" help="Sets -A, -B, -O, -E, -L, and -U options.">
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
233 <option value="set">Set</option>
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
234 <option value="do_not_set" selected="True">Do not set</option>
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
235 </param>
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
236 <when value="set">
2
e29bc5c169bc Uploaded
devteam
parents: 1
diff changeset
237 <param name="A" type="integer" value="1" label="Score for a sequence match" help="-A; scales options -T, -d, -B, -O, -E, -L, and -U unless overridden; default=1"/>
e29bc5c169bc Uploaded
devteam
parents: 1
diff changeset
238 <param name="B" type="integer" value="4" label="Penalty for a mismatch" help="-B; default=4"/>
e29bc5c169bc Uploaded
devteam
parents: 1
diff changeset
239 <param name="O" type="text" value="6,6" label="Gap open penalties for deletions and insertions" help="-O; default=6,6">
0
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
240 <sanitizer invalid_char="">
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
241 <valid initial="string.digits"><add value=","/> </valid>
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
242 </sanitizer>
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
243 </param>
2
e29bc5c169bc Uploaded
devteam
parents: 1
diff changeset
244 <param name="E" type="text" value="1,1" label="Gap extension penalties; a gap of size k cost &#39;-O + -E*k&#39;. If two numbers are specified, the first is the penalty of extending a deletion and the second for extending an insertion" help="-E; default=1,1">
0
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
245 <sanitizer invalid_char="">
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
246 <valid initial="string.digits"><add value=","/> </valid>
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
247 </sanitizer>
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
248 </param>
2
e29bc5c169bc Uploaded
devteam
parents: 1
diff changeset
249 <param name="L" type="text" value="5,5" label="Penalties for 5&#39;-end and 3&#39;-end clipping" help="-L; default=5,5; When performing Smith-Waterman extension, BWA-MEM keeps track of the best score reaching the end of query. If this score is larger than the best Smith-Waterman score minus the clipping penalty, clipping will not be applied. Note that in this case, the SAM AS tag reports the best Smith-Waterman score; clipping penalty is not deducted">
0
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
250 <sanitizer invalid_char="">
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
251 <valid initial="string.digits"><add value=","/> </valid>
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
252 </sanitizer>
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
253 </param>
2
e29bc5c169bc Uploaded
devteam
parents: 1
diff changeset
254 <param name="U" type="integer" value="17" label="Penalty for an unpaired read pair" help="-U; default=17"/>
0
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
255 </when>
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
256 <when value="do_not_set">
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
257 <!-- do nothing -->
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
258 </when>
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
259 </conditional>
2
e29bc5c169bc Uploaded
devteam
parents: 1
diff changeset
260
0
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
261 <conditional name="io_options">
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
262 <param name="io_options_selector" type="select" label="Set input/output options" help="Sets -T, -h, -a, -C, -V, -Y, and -M options.">
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
263 <option value="set">Set</option>
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
264 <option value="do_not_set" selected="True">Do not set</option>
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
265 </param>
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
266 <when value="set">
2
e29bc5c169bc Uploaded
devteam
parents: 1
diff changeset
267 <param name="T" type="integer" value="30" label="Minimum score to output" help="-T; default=30"/>
e29bc5c169bc Uploaded
devteam
parents: 1
diff changeset
268 <param name="h" type="integer" value="5" label="If there are less than THIS VALUE hits with score &gt;80% of the max score, output them all in the XA tag" help="-h; default=5" />
e29bc5c169bc Uploaded
devteam
parents: 1
diff changeset
269 <param name="a" type="boolean" truevalue="-a" falsevalue="" label="Output all alignments for single-ends or unpaired paired-ends" help="-a; These alignments will be flagged as secondary alignments"/>
e29bc5c169bc Uploaded
devteam
parents: 1
diff changeset
270 <param name="C" type="boolean" truevalue="-C" falsevalue="" label="Append FASTA/FASTQ comment to BAM output" help="-C"/>
e29bc5c169bc Uploaded
devteam
parents: 1
diff changeset
271 <param name="V" type="boolean" truevalue="-V" falsevalue="" label="Output the reference FASTA header in the XR tag" help="-V"/>
e29bc5c169bc Uploaded
devteam
parents: 1
diff changeset
272 <param name="Y" type="boolean" truevalue="-Y" falsevalue="" label="Use soft clipping for supplementary alignments" help="-Y; By default, BWA-MEM uses soft clipping for the primary alignment and hard clipping for supplementary alignments" />
e29bc5c169bc Uploaded
devteam
parents: 1
diff changeset
273 <param name="M" type="boolean" truevalue="-M" falsevalue="" label="Mark shorter split hits of a chimeric alignment in the FLAG field as 'secondary alignment' instead of 'supplementary alignment'" help="-M; For Picard&lt;1.96 compatibility" />
0
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
274 </when>
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
275 <when value="do_not_set">
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
276 <!-- do nothing -->
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
277 </when>
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
278 </conditional>
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
279 </when>
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
280 </conditional>
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
281 </inputs>
2
e29bc5c169bc Uploaded
devteam
parents: 1
diff changeset
282
0
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
283 <outputs>
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
284 <data format="bam" name="bam_output" label="${tool.name} on ${on_string} (mapped reads in BAM format)"/>
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
285 </outputs>
2
e29bc5c169bc Uploaded
devteam
parents: 1
diff changeset
286
0
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
287 <tests>
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
288 <test>
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
289 <param name="reference_source_selector" value="history" />
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
290 <param name="ref_file" ftype="fasta" value="bwa-mem-mt-genome.fa"/>
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
291 <param name="fastq_input_selector" value="paired"/>
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
292 <param name="fastq_input1" ftype="fastqsanger" value="bwa-mem-fastq1.fq"/>
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
293 <param name="fastq_input2" ftype="fastqsanger" value="bwa-mem-fastq2.fq"/>
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
294 <param name="analysis_type_selector" value="illumina"/>
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
295 <output name="bam_output" ftype="bam" file="bwa-mem-test1.bam" lines_diff="2" />
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
296 </test>
2
e29bc5c169bc Uploaded
devteam
parents: 1
diff changeset
297 <test>
e29bc5c169bc Uploaded
devteam
parents: 1
diff changeset
298 <param name="reference_source_selector" value="history" />
e29bc5c169bc Uploaded
devteam
parents: 1
diff changeset
299 <param name="ref_file" ftype="fasta" value="bwa-mem-mt-genome.fa"/>
e29bc5c169bc Uploaded
devteam
parents: 1
diff changeset
300 <param name="fastq_input_selector" value="paired"/>
e29bc5c169bc Uploaded
devteam
parents: 1
diff changeset
301 <param name="fastq_input1" ftype="fastqsanger" value="bwa-mem-fastq1.fq"/>
e29bc5c169bc Uploaded
devteam
parents: 1
diff changeset
302 <param name="fastq_input2" ftype="fastqsanger" value="bwa-mem-fastq2.fq"/>
e29bc5c169bc Uploaded
devteam
parents: 1
diff changeset
303 <param name="rg_selector" value="set"/>
e29bc5c169bc Uploaded
devteam
parents: 1
diff changeset
304 <param name="ID" value="rg1"/>
4
ac30bfd3e2a8 planemo upload commit a50a3947aebc8a1d11bac39599f4efd8ed9a3bd5
devteam
parents: 2
diff changeset
305 <param name="PL" value="CAPILLARY"/>
ac30bfd3e2a8 planemo upload commit a50a3947aebc8a1d11bac39599f4efd8ed9a3bd5
devteam
parents: 2
diff changeset
306 <param name="LB" value="AARDVARK-1" />
2
e29bc5c169bc Uploaded
devteam
parents: 1
diff changeset
307 <param name="analysis_type_selector" value="illumina"/>
e29bc5c169bc Uploaded
devteam
parents: 1
diff changeset
308 <output name="bam_output" ftype="bam" file="bwa-mem-test2.bam" lines_diff="2" />
e29bc5c169bc Uploaded
devteam
parents: 1
diff changeset
309 </test>
0
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
310 </tests>
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
311 <help>
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
312 **What it does**
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
313
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
314 From http://arxiv.org/abs/1303.3997:
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
315
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
316 BWA-MEM is a new alignment algorithm for aligning sequence reads or long query sequences against a large reference genome such as human.
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
317 It automatically chooses between local and end-to-end alignments, supports paired-end reads and performs chimeric alignment.
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
318 The algorithm is robust to sequencing errors and applicable to a wide range of sequence lengths from 70bp to a few megabases.
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
319 For mapping 100bp sequences, BWA-MEM shows better performance than several state-of-art read aligners to date.
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
320
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
321 It is best suited for mapping long (>70 nt) reads against large reference genomes.
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
322
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
323 This Galaxy tool wraps the bwa-mem module of the bwa read mapping tool. The Galaxy implementation takes fastq files as input and produces output in BAM (not SAM) format, which can be further processed using various BAM utilities existing in Galaxy (BAMTools, SAMTools, Picard).
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
324
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
325 -----
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
326
4
ac30bfd3e2a8 planemo upload commit a50a3947aebc8a1d11bac39599f4efd8ed9a3bd5
devteam
parents: 2
diff changeset
327 **Indices: Selecting reference genomes for BWA**
ac30bfd3e2a8 planemo upload commit a50a3947aebc8a1d11bac39599f4efd8ed9a3bd5
devteam
parents: 2
diff changeset
328
ac30bfd3e2a8 planemo upload commit a50a3947aebc8a1d11bac39599f4efd8ed9a3bd5
devteam
parents: 2
diff changeset
329 The Galaxy wrapper for BWA allows you to select between precomputed and user-defined indices for reference genomes using the **Will you select a reference genome from your history or use a built-in index?** flag. This flag has two options:
ac30bfd3e2a8 planemo upload commit a50a3947aebc8a1d11bac39599f4efd8ed9a3bd5
devteam
parents: 2
diff changeset
330
ac30bfd3e2a8 planemo upload commit a50a3947aebc8a1d11bac39599f4efd8ed9a3bd5
devteam
parents: 2
diff changeset
331 1. **Use a built-in genome index** - when selected (this is default), Galaxy provides the user with **Select reference genome index** dropdown. Genomes listed in this dropdown have been pre-indexed with bwa index utility and are ready to be mapped against.
ac30bfd3e2a8 planemo upload commit a50a3947aebc8a1d11bac39599f4efd8ed9a3bd5
devteam
parents: 2
diff changeset
332 2. **Use a genome from the history and build index** - when selected, Galaxy provides the user with **Select reference genome sequence** dropdown. This dropdown is populated by all FASTA formatted files listed in your current history. If your genome of interest is uploaded into history it will be shown there. Selecting a genome from this dropdown will cause Galaxy to first transparently index it using `bwa index` command, and then run mapping with `bwa mem`.
ac30bfd3e2a8 planemo upload commit a50a3947aebc8a1d11bac39599f4efd8ed9a3bd5
devteam
parents: 2
diff changeset
333
ac30bfd3e2a8 planemo upload commit a50a3947aebc8a1d11bac39599f4efd8ed9a3bd5
devteam
parents: 2
diff changeset
334 If your genome of interest is not listed here you have two choices:
ac30bfd3e2a8 planemo upload commit a50a3947aebc8a1d11bac39599f4efd8ed9a3bd5
devteam
parents: 2
diff changeset
335
ac30bfd3e2a8 planemo upload commit a50a3947aebc8a1d11bac39599f4efd8ed9a3bd5
devteam
parents: 2
diff changeset
336 1. Contact galaxy team using **Help->Support** link at the top of the interface and let us know that an index needs to be added
ac30bfd3e2a8 planemo upload commit a50a3947aebc8a1d11bac39599f4efd8ed9a3bd5
devteam
parents: 2
diff changeset
337 2. Upload your genome of interest as a FASTA file to Galaxy history and select the **Use a genome from the history and build index** option.
ac30bfd3e2a8 planemo upload commit a50a3947aebc8a1d11bac39599f4efd8ed9a3bd5
devteam
parents: 2
diff changeset
338
ac30bfd3e2a8 planemo upload commit a50a3947aebc8a1d11bac39599f4efd8ed9a3bd5
devteam
parents: 2
diff changeset
339 -----
ac30bfd3e2a8 planemo upload commit a50a3947aebc8a1d11bac39599f4efd8ed9a3bd5
devteam
parents: 2
diff changeset
340
0
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
341 **Galaxy-specific option**
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
342
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
343 Galaxy allows three levels of control over bwa-mem options provided by the **Select analysis mode** menu option. These are:
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
344
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
345 1. *Simple Illumina mode*: The simplest possible bwa mem application in which it aligns single or paired-end data to reference using default parameters. It is equivalent to the following command: bwa mem &lt;reference index&gt; &lt;fastq dataset1&gt; [fastq dataset2]
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
346 2. *PacBio mode*: The mode adjusted specifically for mapping of long PacBio subreads. Equivalent to the following command: bwa mem -k17 -W40 -r10 -A1 -B1 -O1 -E1 -L0 &lt;reference index&gt; &lt;PacBio dataset in fastq format&gt;
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
347 3. *Full list of options*: Allows access to all options through Galaxy interface.
2
e29bc5c169bc Uploaded
devteam
parents: 1
diff changeset
348
0
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
349 ------
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
350
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
351 **BWA MEM options**
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
352
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
353 Each Galaxy parameter widget corresponds to command line flags listed below:
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
354
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
355 Algorithm options::
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
356
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
357 -k INT minimum seed length [19]
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
358 -w INT band width for banded alignment [100]
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
359 -d INT off-diagonal X-dropoff [100]
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
360 -r FLOAT look for internal seeds inside a seed longer than {-k} * FLOAT [1.5]
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
361 -y INT find MEMs longer than {-k} * {-r} with size less than INT [0]
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
362 -c INT skip seeds with more than INT occurrences [500]
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
363 -D FLOAT drop chains shorter than FLOAT fraction of the longest overlapping chain [0.50]
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
364 -W INT discard a chain if seeded bases shorter than INT [0]
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
365 -m INT perform at most INT rounds of mate rescues for each read [50]
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
366 -S skip mate rescue
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
367 -P skip pairing; mate rescue performed unless -S also in use
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
368 -e discard full-length exact matches
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
369
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
370 Scoring options::
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
371
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
372 -A INT score for a sequence match, which scales options -TdBOELU unless overridden [1]
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
373 -B INT penalty for a mismatch [4]
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
374 -O INT[,INT] gap open penalties for deletions and insertions [6,6]
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
375 -E INT[,INT] gap extension penalty; a gap of size k cost '{-O} + {-E}*k' [1,1]
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
376 -L INT[,INT] penalty for 5'- and 3'-end clipping [5,5]
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
377 -U INT penalty for an unpaired read pair [17]
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
378
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
379 Input/output options::
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
380
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
381 -p first query file consists of interleaved paired-end sequences
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
382 -R STR read group header line such as '@RG\tID:foo\tSM:bar' [null]
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
383
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
384 -v INT verbose level: 1=error, 2=warning, 3=message, 4+=debugging [3]
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
385 -T INT minimum score to output [30]
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
386 -h INT if there are &lt;INT hits with score &gt;80% of the max score, output all in XA [5]
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
387 -a output all alignments for SE or unpaired PE
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
388 -C append FASTA/FASTQ comment to SAM output
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
389 -V output the reference FASTA header in the XR tag
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
390 -Y use soft clipping for supplementary alignments
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
391 -M mark shorter split hits as secondary
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
392
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
393 -I FLOAT[,FLOAT[,INT[,INT]]]
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
394 specify the mean, standard deviation (10% of the mean if absent), max
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
395 (4 sigma from the mean if absent) and min of the insert size distribution.
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
396 FR orientation only. [inferred]
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
397
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
398 @dataset_collections@
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
399
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
400 @RG@
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
401
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
402 @info@
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
403 </help>
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
404 <citations>
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
405 <citation type="doi">10.1093/bioinformatics/btp324</citation>
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
406 <citation type="doi">10.1093/bioinformatics/btp698</citation>
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
407 <citation type="bibtex">@misc{1303.3997,
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
408 Author = {Heng Li},
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
409 Title = {Aligning sequence reads, clone sequences and assembly contigs with BWA-MEM},
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
410 Year = {2013},
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
411 Eprint = {arXiv:1303.3997},
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
412 url = {http://arxiv.org/abs/1303.3997},
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
413 }</citation>
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
414 </citations>
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
415 </tool>