comparison STACKS_procrad.xml @ 0:d6ba40f6c824

first commit
author cmonjeau
date Mon, 24 Aug 2015 09:29:12 +0000
parents
children c9e10e0d6c10
comparison
equal deleted inserted replaced
-1:000000000000 0:d6ba40f6c824
1 <?xml version="1.0"?>
2 <tool id="STACKSprocrad" name="STACKS : Process radtags" force_history_refresh="True" version="1.1.0">
3 <description>Run the STACKS cleaning script</description>
4 <configfiles>
5 <configfile name="input_single">
6 #if str( $options_type.options_type_selector ) == "single":
7 #for $input in $options_type.inputs_single:
8 ${input.display_name}::${input}
9 #end for
10 #end if
11 </configfile>
12 <configfile name="input_paired1">
13 #if str( $options_type.options_type_selector ) == "paired":
14 #for $input in $options_type.inputs_paired1:
15 ${input.display_name}::${input}
16 #end for
17 #end if
18 </configfile>
19 <configfile name="input_paired2">
20 #if str( $options_type.options_type_selector ) == "paired":
21 #for $input in $options_type.inputs_paired2:
22 ${input.display_name}::${input}
23 #end for
24 #end if
25 </configfile>
26 </configfiles>
27 <requirements>
28 <requirement type="package" version="1.18">stacks</requirement>
29 </requirements>
30 <command interpreter="python">
31
32 STACKS_procrad.py
33 --input_type $options_type.options_type_selector
34 #if str( $options_type.options_type_selector ) == "single":
35 --input_single $input_single
36 #else
37 --input_paired1 $input_paired1
38 --input_paired2 $input_paired2
39 #end if
40 --inputype $inputype
41 --barcode $barcode
42 --sample_name $sample_name
43 --output_choice $options_output_infos_selector
44 #if str( $options_output_infos_selector ) != "1":
45 --output_archive $output_archive
46 #end if
47 --input_enzyme $options_enzyme.options_enzyme_selector
48 --enzyme1 $options_enzyme.enzyme
49 #if str( $options_enzyme.options_enzyme_selector ) == "2":
50 --enzyme2 $options_enzyme.enzyme2
51 #end if
52 --outype $outype
53 --qualitenc $options_quality.qualitenc
54 #if $capture:
55 -D
56 #end if
57 --activate_advanced_options $activate_advanced_options
58 -t $options_advanced.truncate
59 #if $options_advanced.discard:
60 -q
61 #end if
62 #if $options_advanced.rescue:
63 -r
64 #end if
65 -w $options_advanced.sliding
66 -s $options_advanced.score
67 #if $options_advanced.remove:
68 -c
69 #end if
70 #if $options_advanced.inline:
71 --inline_null
72 #end if
73 #if $options_advanced.index:
74 --index_null
75 #end if
76 #if $options_advanced.inlinein:
77 --inline_inline
78 #end if
79 #if $options_advanced.indexind:
80 --index_index
81 #end if
82 #if $options_advanced.inlineind:
83 --inline_index
84 #end if
85 #if $options_advanced.indexin:
86 --index_inline
87 #end if
88 --logfile $output
89
90 </command>
91
92 <inputs>
93
94 <conditional name="options_type">
95 <param name="options_type_selector" type="select" label="Single-end or paired-end reads files">
96 <option value="single" selected="True">Single-end files</option>
97 <option value="paired">Paired-end files</option>
98 </param>
99 <when value="single">
100 <param name="inputs_single" format="fastq,fastq.gz" type="data" multiple="true" label="singles-end reads infile(s)" help="input files" />
101 </when>
102 <when value="paired">
103 <param name="inputs_paired1" format="fastq,fastq.gz" type="data" multiple="true" label="paired-end reads infile(s) 1" help="Files must have this syntax : name_R1_001.fastq" />
104 <param name="inputs_paired2" format="fastq,fastq.gz" type="data" multiple="true" label="paired-end reads infile(s) 2" help="Files must have this syntax : name_R2_001.fastq" />
105 </when>
106 </conditional>
107 <param name="inputype" type="select" format="text" label="Inputs format">
108 <option value="fastq" selected="True">fastq</option>
109 <option value="gzfastq">fastq.gz</option>
110 <option value="bustard">Illumina BUSTARD</option>
111 </param>
112 <param name="barcode" type="data" format="tabular,txt" label="Barcode file" help="Barcode file" />
113
114 <param name="sample_name" type="text" value="sample" label="Sample name" help="Precise the sample name if using several NGS runs" />
115
116 <conditional name="options_enzyme">
117 <param name="options_enzyme_selector" type="select" label="Number of enzymes">
118 <option value="1" >One</option>
119 <option value="2">Two</option>
120 </param>
121 <when value="1">
122 <param name="enzyme" type="select" format="text" label="Enzyme" help="provide the restriction enzyme used" >
123 <option value="apeKI">apeKI</option>
124 <option value="bamHI">bamHI</option>
125 <option value="claI">claI</option>
126 <option value="dpnII">dpnII</option>
127 <option value="eaeI">eaeI</option>
128 <option value="ecoRI">ecoRI</option>
129 <option value="ecoT22I">ecoT22I</option>
130 <option value="hindIII">hindIII</option>
131 <option value="mluCI">mluCI</option>
132 <option value="mseI">mseI</option>
133 <option value="mspI">mspI</option>
134 <option value="ndeI">ndeI</option>
135 <option value="nlaIII">nlaIII</option>
136 <option value="notI">notI</option>
137 <option value="nsiI">nsiI</option>
138 <option value="pstI">pstI</option>
139 <option value="sau3AI">sau3AI</option>
140 <option value="sbfI">sbfI</option>
141 <option value="sexAI">sexAI</option>
142 <option value="sgrAI">sgrAI</option>
143 <option value="sphI">sphI</option>
144 <option value="taqI">taqI</option>
145 <option value="xbaI">xbaI</option>
146 </param>
147 </when>
148 <when value="2">
149 <param name="enzyme" type="select" format="text" label="Enzyme" help="provide the restriction enzyme used" >
150 <option value="apeKI">apeKI</option>
151 <option value="bamHI">bamHI</option>
152 <option value="claI">claI</option>
153 <option value="dpnII">dpnII</option>
154 <option value="eaeI">eaeI</option>
155 <option value="ecoRI">ecoRI</option>
156 <option value="ecoT22I">ecoT22I</option>
157 <option value="hindIII">hindIII</option>
158 <option value="mluCI">mluCI</option>
159 <option value="mseI">mseI</option>
160 <option value="mspI">mspI</option>
161 <option value="ndeI">ndeI</option>
162 <option value="nlaIII">nlaIII</option>
163 <option value="notI">notI</option>
164 <option value="nsiI">nsiI</option>
165 <option value="pstI">pstI</option>
166 <option value="sau3AI">sau3AI</option>
167 <option value="sbfI">sbfI</option>
168 <option value="sexAI">sexAI</option>
169 <option value="sgrAI">sgrAI</option>
170 <option value="sphI">sphI</option>
171 <option value="taqI">taqI</option>
172 <option value="xbaI">xbaI</option>
173 </param>
174 <param name="enzyme2" type="select" format="text" label="Second enzyme" help="provide the second restriction enzyme used" >
175 <option value="apeKI">apeKI</option>
176 <option value="bamHI">bamHI</option>
177 <option value="claI">claI</option>
178 <option value="dpnII">dpnII</option>
179 <option value="eaeI">eaeI</option>
180 <option value="ecoRI">ecoRI</option>
181 <option value="ecoT22I">ecoT22I</option>
182 <option value="hindIII">hindIII</option>
183 <option value="mluCI">mluCI</option>
184 <option value="mseI">mseI</option>
185 <option value="mspI">mspI</option>
186 <option value="ndeI">ndeI</option>
187 <option value="nlaIII">nlaIII</option>
188 <option value="notI">notI</option>
189 <option value="nsiI">nsiI</option>
190 <option value="pstI">pstI</option>
191 <option value="sau3AI">sau3AI</option>
192 <option value="sbfI">sbfI</option>
193 <option value="sexAI">sexAI</option>
194 <option value="sgrAI">sgrAI</option>
195 <option value="sphI">sphI</option>
196 <option value="taqI">taqI</option>
197 <option value="xbaI">xbaI</option>
198 </param>
199 </when>
200 </conditional>
201 <param name="capture" type="boolean" label="Capture discarded reads to a file" />
202 <section name="options_quality" title="quality options" expanded="False">
203 <param name="qualitenc" type="select" format="text" label="Quality encoded type" help="specify how quality scores are encoded, 'phred33' (Illumina 1.8+, Sanger, default) or 'phred64' (Illumina 1.3 - 1.5)" >
204 <option value="phred33">phred33</option>
205 <option value="phred64">phred64</option>
206 </param>
207 </section>
208 <param name="activate_advanced_options" type="boolean" label="Activate advanced options" help="advanced options are defined below" />
209 <section name="options_advanced" title="advanced options" expanded="False">
210 <param name="sliding" type="float" value="0.15" label="set the size of the sliding window as a fraction of the read length, between 0 and 1 (default 0.15)" />
211 <param name="score" type="integer" value="10" label="Set the score limit. If the average score within the sliding window drops below this value, the read is discarded (default 10)" />
212 <param name="remove" type="boolean" checked="false" default="false" label="Clean data, remove any read with an uncalled base" />
213 <param name="discard" type="boolean" checked="false" default="false" label="Discard reads with low quality scores"/>
214 <param name="rescue" type="boolean" checked="false" default="false" label="Rescue barcodes and RAD-Tags?"/>
215 <param name="truncate" type="integer" value="-1" label="Truncate final read length to this value" help="default = -1" />
216 <param name="inline" type="boolean" checked="true" default="true" label="Barcode options -> inline_null" help="barcode is inline with sequence, occurs only on single-end read" />
217 <param name="index" type="boolean" checked="false" default="false" label="Barcode options -> index_null" help="barcode is provided in FASTQ header, occurs only on single-end read"/>
218 <param name="inlinein" type="boolean" checked="false" default="false" label="Barcode options -> inline_inline" help="barcode is inline with sequence, occurs on single and paired-end read" />
219 <param name="indexind" type="boolean" checked="false" default="false" label="Barcode options -> index_index" help="barcode is provided in FASTQ header, occurs on single and paired-end read" />
220 <param name="inlineind" type="boolean" checked="false" default="false" label="Barcode options -> inline_index" help="barcode is inline with sequence on single-end read, occurs in FASTQ header for paired-end read" />
221 <param name="indexin" type="boolean" checked="false" default="false" label="Barcode options -> index_inline" help="barcode occurs in FASTQ header for single-end read, is inline with sequence on paired-end read" />
222 </section>
223 <param name="outype" type="select" format="text" label="Output format" help="output type, either 'fastq' or 'fasta' (default fastq)" >
224 <option value="fastq">fastq</option>
225 <option value="fasta">fasta</option>
226 </param>
227
228 <param name="options_output_infos_selector" type="select" label="Output type">
229 <option value="1">Normal (a fastq file by barcode)</option>
230 <option value="2" selected="True">Additional zip archive with all files (Normal + one archive with all fastq files)</option>
231 <option value="3">Only a zip archive with all files (one archive with all fastq files)</option>
232 </param>
233
234 </inputs>
235 <outputs>
236
237 <data format="txt" name="output" label="results.log with ${tool.name} on ${on_string}: demultiplexed and cleaned reads" />
238 <data format="txt" name="additional" label="fast(a/q) file with ${tool.name}" hidden="true">
239 <discover_datasets pattern="__designation_and_ext__" directory="galaxy_outputs" visible="true" />
240 </data>
241 <data format="zip" name="output_archive" label="all_files.zip with ${tool.name} on ${on_string}: demultiplexed and cleaned reads ">
242 <filter>options_output_infos_selector != "1"</filter>
243 </data>
244 <data format="fastq" name="discard_file" label="discard.fastq with ${tool.name} on ${on_string}: demultiplexed and cleaned reads ">
245 <filter>capture</filter>
246 </data>
247
248
249 </outputs>
250
251 <stdio>
252 <exit_code range="1" level="fatal" description="Error in Stacks Process radtag execution" />
253 </stdio>
254
255
256 <help>
257
258 .. class:: infomark
259
260 **What it does**
261
262 This program examines raw reads from an Illumina sequencing run and first, checks that the barcode and the RAD cutsite are intact, and demultiplexes the data. If there are
263 errors in the barcode or the RAD site within a certain allowance process_radtags can correct them. Second, it slides a window down the length of the read and checks the
264 average quality score within the window. If the score drops below 90% probability of being correct (a raw phred score of 10), the read is discarded. This allows for some
265 seqeuncing errors while elimating reads where the sequence is degrading as it is being sequenced. By default the sliding window is 15% of the length of the read, but can be
266 specified on the command line (the threshold and window size can be adjusted).
267 The process_radtags program can:
268 handle data that is barcoded, either inline or using an index, or unbarcoded.
269 use combinatorial barcodes.
270 check and correct for a restriction enzyme cutsite for single or double-digested
271 data.
272 filter adapter sequence while allowing for sequencing error in the adapter pattern.
273 process individual files or whole directories of files.
274 directly read gzipped data
275 filter reads based on Illumina's Chastity filter
276
277 --------
278
279 **Help**
280
281 Input files:
282
283 - FASTQ, FASTA, zip, tar.gz
284
285 - Barcode File Format
286
287 The barcode file is a very simple format : one barcode per line.
288
289 CGATA
290 CGGCG
291 GAAGC
292 GAGAT
293 CGATA
294 CGGCG
295 GAAGC
296 GAGAT
297
298 Combinatorial barcodes are specified, one per column, separated by a tab::
299
300 CGATA ACGTA
301 CGGCG CGTA
302 GAAGC CGTA
303 GAGAT CGTA
304 CGATA AGCA
305 CGGCG AGCA
306 GAAGC AGCA
307 GAGAT AGCA
308
309
310 Instructions to add the functionality of archives management in Galaxy on the `eBiogenouest HUB wiki &lt;https://www.e-biogenouest.org/wiki/ManArchiveGalaxy&gt;`_ .
311
312 --------
313
314
315 **Created by:**
316
317 Stacks was developed by Julian Catchen with contributions from Angel Amores, Paul Hohenlohe, and Bill Cresko
318
319 --------
320
321 **Project links:**
322
323 `STACKS website &lt;http://creskolab.uoregon.edu/stacks/&gt;`_ .
324
325 `STACKS manual &lt;http://creskolab.uoregon.edu/stacks/stacks_manual.pdf&gt;`_ .
326
327 `STACKS google group &lt;https://groups.google.com/forum/#!forum/stacks-users&gt;`_ .
328
329 --------
330
331 **References:**
332
333 -J. Catchen, P. Hohenlohe, S. Bassham, A. Amores, and W. Cresko. Stacks: an analysis tool set for population genomics. Molecular Ecology. 2013.
334
335 -J. Catchen, S. Bassham, T. Wilson, M. Currey, C. O'Brien, Q. Yeates, and W. Cresko. The population structure and recent colonization history of Oregon threespine stickleback determined using restriction-site associated DNA-sequencing. Molecular Ecology. 2013.
336
337 -J. Catchen, A. Amores, P. Hohenlohe, W. Cresko, and J. Postlethwait. Stacks: building and genotyping loci de novo from short-read sequences. G3: Genes, Genomes, Genetics, 1:171-182, 2011.
338
339 -A. Amores, J. Catchen, A. Ferrara, Q. Fontenot and J. Postlethwait. Genome evolution and meiotic maps by massively parallel DNA sequencing: Spotted gar, an outgroup for the teleost genome duplication. Genetics, 188:799'808, 2011.
340
341 -P. Hohenlohe, S. Amish, J. Catchen, F. Allendorf, G. Luikart. RAD sequencing identifies thousands of SNPs for assessing hybridization between rainbow trout and westslope cutthroat trout. Molecular Ecology Resources, 11(s1):117-122, 2011.
342
343 -K. Emerson, C. Merz, J. Catchen, P. Hohenlohe, W. Cresko, W. Bradshaw, C. Holzapfel. Resolving postglacial phylogeography using high-throughput sequencing. Proceedings of the National Academy of Science, 107(37):16196-200, 2010.
344
345 --------
346
347 **Integrated by:**
348
349 Yvan Le Bras and Cyril Monjeaud
350
351 GenOuest Bio-informatics Core Facility
352
353 UMR 6074 IRISA INRIA-CNRS-UR1 Rennes (France)
354
355 support@genouest.org
356
357 If you use this tool in Galaxy, please cite :
358
359 `Y. Le Bras, A. Roult, C. Monjeaud, M. Bahin, O. Quenez, C. Heriveau, A. Bretaudeau, O. Sallou, O. Collin, Towards a Life Sciences Virtual Research Environment : an e-Science initiative in Western France. JOBIM 2013. &lt;https://www.e-biogenouest.org/resources/128&gt;`_
360
361
362
363 </help>
364 <citations>
365 <citation type="doi">10.1111/mec.12354</citation>
366 <citation type="doi">10.1111/mec.12330</citation>
367 <citation type="doi">10.1534/g3.111.000240</citation>
368 <citation type="doi">10.1534/genetics.111.127324</citation>
369 <citation type="doi">10.1111/j.1755-0998.2010.02967.x</citation>
370 <citation type="doi">10.1073/pnas.1006538107</citation>
371
372 <citation type="bibtex">@INPROCEEDINGS{JOBIM2013,
373 author = {Le Bras, Y. and ROULT, A. and Monjeaud, C. and Bahin, M. and Quenez, O. and Heriveau, C. and Bretaudeau, A. and Sallou, O. and Collin, O.},
374 title = {Towards a Life Sciences Virtual Research Environment: An e-Science initiative in Western France},
375 booktitle = {JOBIM 2013 Proceedings},
376 year = {2013},
377 url = {https://www.e-biogenouest.org/resources/128},
378 pages = {97-106}
379 }</citation>
380 </citations>
381 </tool>
382