annotate tools/fastq_paired_unpaired/fastq_paired_unpaired.xml @ 5:b38bbcbd458d draft

v0.1.2 belatedly declare Biopython dependency
author peterjc
date Wed, 05 Aug 2015 11:17:49 -0400
parents 09f9f0e29e47
children f396701fbf32
Ignore whitespace changes - Everywhere: Within whitespace: At end of lines:
rev   line source
5
b38bbcbd458d v0.1.2 belatedly declare Biopython dependency
peterjc
parents: 4
diff changeset
1 <tool id="fastq_paired_unpaired" name="Divide FASTQ file into paired and unpaired reads" version="0.1.2">
4
09f9f0e29e47 v0.0.6 use format_source; v0.0.5 error handling & citation
peterjc
parents:
diff changeset
2 <description>using the read name suffixes</description>
09f9f0e29e47 v0.0.6 use format_source; v0.0.5 error handling & citation
peterjc
parents:
diff changeset
3 <requirements>
5
b38bbcbd458d v0.1.2 belatedly declare Biopython dependency
peterjc
parents: 4
diff changeset
4 <requirement type="package" version="1.65">biopython</requirement>
4
09f9f0e29e47 v0.0.6 use format_source; v0.0.5 error handling & citation
peterjc
parents:
diff changeset
5 <requirement type="python-module">Bio</requirement>
09f9f0e29e47 v0.0.6 use format_source; v0.0.5 error handling & citation
peterjc
parents:
diff changeset
6 </requirements>
09f9f0e29e47 v0.0.6 use format_source; v0.0.5 error handling & citation
peterjc
parents:
diff changeset
7 <stdio>
09f9f0e29e47 v0.0.6 use format_source; v0.0.5 error handling & citation
peterjc
parents:
diff changeset
8 <!-- Anything other than zero is an error -->
09f9f0e29e47 v0.0.6 use format_source; v0.0.5 error handling & citation
peterjc
parents:
diff changeset
9 <exit_code range="1:" />
09f9f0e29e47 v0.0.6 use format_source; v0.0.5 error handling & citation
peterjc
parents:
diff changeset
10 <exit_code range=":-1" />
09f9f0e29e47 v0.0.6 use format_source; v0.0.5 error handling & citation
peterjc
parents:
diff changeset
11 </stdio>
09f9f0e29e47 v0.0.6 use format_source; v0.0.5 error handling & citation
peterjc
parents:
diff changeset
12 <version_command interpreter="python">fastq_paired_unpaired.py --version</version_command>
09f9f0e29e47 v0.0.6 use format_source; v0.0.5 error handling & citation
peterjc
parents:
diff changeset
13 <command interpreter="python">
09f9f0e29e47 v0.0.6 use format_source; v0.0.5 error handling & citation
peterjc
parents:
diff changeset
14 fastq_paired_unpaired.py $input_fastq.extension $input_fastq
09f9f0e29e47 v0.0.6 use format_source; v0.0.5 error handling & citation
peterjc
parents:
diff changeset
15 #if $output_choice_cond.output_choice=="separate"
09f9f0e29e47 v0.0.6 use format_source; v0.0.5 error handling & citation
peterjc
parents:
diff changeset
16 $output_forward $output_reverse
09f9f0e29e47 v0.0.6 use format_source; v0.0.5 error handling & citation
peterjc
parents:
diff changeset
17 #elif $output_choice_cond.output_choice=="interleaved"
09f9f0e29e47 v0.0.6 use format_source; v0.0.5 error handling & citation
peterjc
parents:
diff changeset
18 $output_paired
09f9f0e29e47 v0.0.6 use format_source; v0.0.5 error handling & citation
peterjc
parents:
diff changeset
19 #end if
09f9f0e29e47 v0.0.6 use format_source; v0.0.5 error handling & citation
peterjc
parents:
diff changeset
20 $output_singles
09f9f0e29e47 v0.0.6 use format_source; v0.0.5 error handling & citation
peterjc
parents:
diff changeset
21 </command>
09f9f0e29e47 v0.0.6 use format_source; v0.0.5 error handling & citation
peterjc
parents:
diff changeset
22 <inputs>
09f9f0e29e47 v0.0.6 use format_source; v0.0.5 error handling & citation
peterjc
parents:
diff changeset
23 <param name="input_fastq" type="data" format="fastq" label="FASTQ file to divide into paired and unpaired reads"/>
09f9f0e29e47 v0.0.6 use format_source; v0.0.5 error handling & citation
peterjc
parents:
diff changeset
24 <conditional name="output_choice_cond">
09f9f0e29e47 v0.0.6 use format_source; v0.0.5 error handling & citation
peterjc
parents:
diff changeset
25 <param name="output_choice" type="select" label="How to output paired reads?">
09f9f0e29e47 v0.0.6 use format_source; v0.0.5 error handling & citation
peterjc
parents:
diff changeset
26 <option value="separate">Separate (two FASTQ files, for the forward and reverse reads, in matching order).</option>
09f9f0e29e47 v0.0.6 use format_source; v0.0.5 error handling & citation
peterjc
parents:
diff changeset
27 <option value="interleaved">Interleaved (one FASTQ file, alternating forward read then partner reverse read).</option>
09f9f0e29e47 v0.0.6 use format_source; v0.0.5 error handling & citation
peterjc
parents:
diff changeset
28 </param>
09f9f0e29e47 v0.0.6 use format_source; v0.0.5 error handling & citation
peterjc
parents:
diff changeset
29 <!-- It seems we need these dummy entries here, compare this to indels/indel_sam2interval.xml -->
09f9f0e29e47 v0.0.6 use format_source; v0.0.5 error handling & citation
peterjc
parents:
diff changeset
30 <when value="separate" />
09f9f0e29e47 v0.0.6 use format_source; v0.0.5 error handling & citation
peterjc
parents:
diff changeset
31 <when value="interleaved" />
09f9f0e29e47 v0.0.6 use format_source; v0.0.5 error handling & citation
peterjc
parents:
diff changeset
32 </conditional>
09f9f0e29e47 v0.0.6 use format_source; v0.0.5 error handling & citation
peterjc
parents:
diff changeset
33 </inputs>
09f9f0e29e47 v0.0.6 use format_source; v0.0.5 error handling & citation
peterjc
parents:
diff changeset
34 <outputs>
09f9f0e29e47 v0.0.6 use format_source; v0.0.5 error handling & citation
peterjc
parents:
diff changeset
35 <data name="output_singles" format_source="input_fastq" label="Orphan or single reads"/>
09f9f0e29e47 v0.0.6 use format_source; v0.0.5 error handling & citation
peterjc
parents:
diff changeset
36 <data name="output_forward" format_source="input_fastq" label="Forward paired reads">
09f9f0e29e47 v0.0.6 use format_source; v0.0.5 error handling & citation
peterjc
parents:
diff changeset
37 <filter>output_choice_cond["output_choice"] == "separate"</filter>
09f9f0e29e47 v0.0.6 use format_source; v0.0.5 error handling & citation
peterjc
parents:
diff changeset
38 </data>
09f9f0e29e47 v0.0.6 use format_source; v0.0.5 error handling & citation
peterjc
parents:
diff changeset
39 <data name="output_reverse" format_source="input_fastq" label="Reverse paired reads">
09f9f0e29e47 v0.0.6 use format_source; v0.0.5 error handling & citation
peterjc
parents:
diff changeset
40 <filter>output_choice_cond["output_choice"] == "separate"</filter>
09f9f0e29e47 v0.0.6 use format_source; v0.0.5 error handling & citation
peterjc
parents:
diff changeset
41 </data>
09f9f0e29e47 v0.0.6 use format_source; v0.0.5 error handling & citation
peterjc
parents:
diff changeset
42 <data name="output_paired" format_source="input_fastq" label="Interleaved paired reads">
09f9f0e29e47 v0.0.6 use format_source; v0.0.5 error handling & citation
peterjc
parents:
diff changeset
43 <filter>output_choice_cond["output_choice"] == "interleaved"</filter>
09f9f0e29e47 v0.0.6 use format_source; v0.0.5 error handling & citation
peterjc
parents:
diff changeset
44 </data>
09f9f0e29e47 v0.0.6 use format_source; v0.0.5 error handling & citation
peterjc
parents:
diff changeset
45 </outputs>
09f9f0e29e47 v0.0.6 use format_source; v0.0.5 error handling & citation
peterjc
parents:
diff changeset
46 <tests>
09f9f0e29e47 v0.0.6 use format_source; v0.0.5 error handling & citation
peterjc
parents:
diff changeset
47 <test>
09f9f0e29e47 v0.0.6 use format_source; v0.0.5 error handling & citation
peterjc
parents:
diff changeset
48 <param name="input_fastq" value="sanger-pairs-mixed.fastq" ftype="fastq"/>
09f9f0e29e47 v0.0.6 use format_source; v0.0.5 error handling & citation
peterjc
parents:
diff changeset
49 <param name="output_choice" value="separate"/>
09f9f0e29e47 v0.0.6 use format_source; v0.0.5 error handling & citation
peterjc
parents:
diff changeset
50 <output name="output_singles" file="sanger-pairs-singles.fastq" ftype="fastq"/>
09f9f0e29e47 v0.0.6 use format_source; v0.0.5 error handling & citation
peterjc
parents:
diff changeset
51 <output name="output_forward" file="sanger-pairs-forward.fastq" ftype="fastq"/>
09f9f0e29e47 v0.0.6 use format_source; v0.0.5 error handling & citation
peterjc
parents:
diff changeset
52 <output name="output_reverse" file="sanger-pairs-reverse.fastq" ftype="fastq"/>
09f9f0e29e47 v0.0.6 use format_source; v0.0.5 error handling & citation
peterjc
parents:
diff changeset
53 </test>
09f9f0e29e47 v0.0.6 use format_source; v0.0.5 error handling & citation
peterjc
parents:
diff changeset
54 <test>
09f9f0e29e47 v0.0.6 use format_source; v0.0.5 error handling & citation
peterjc
parents:
diff changeset
55 <param name="input_fastq" value="sanger-pairs-mixed.fastq" ftype="fastq"/>
09f9f0e29e47 v0.0.6 use format_source; v0.0.5 error handling & citation
peterjc
parents:
diff changeset
56 <param name="output_choice" value="interleaved"/>
09f9f0e29e47 v0.0.6 use format_source; v0.0.5 error handling & citation
peterjc
parents:
diff changeset
57 <output name="output_singles" file="sanger-pairs-singles.fastq" ftype="fastq"/>
09f9f0e29e47 v0.0.6 use format_source; v0.0.5 error handling & citation
peterjc
parents:
diff changeset
58 <output name="output_paired" file="sanger-pairs-interleaved.fastq" ftype="fastq"/>
09f9f0e29e47 v0.0.6 use format_source; v0.0.5 error handling & citation
peterjc
parents:
diff changeset
59 </test>
09f9f0e29e47 v0.0.6 use format_source; v0.0.5 error handling & citation
peterjc
parents:
diff changeset
60 </tests>
09f9f0e29e47 v0.0.6 use format_source; v0.0.5 error handling & citation
peterjc
parents:
diff changeset
61 <help>
09f9f0e29e47 v0.0.6 use format_source; v0.0.5 error handling & citation
peterjc
parents:
diff changeset
62
09f9f0e29e47 v0.0.6 use format_source; v0.0.5 error handling & citation
peterjc
parents:
diff changeset
63 **What it does**
09f9f0e29e47 v0.0.6 use format_source; v0.0.5 error handling & citation
peterjc
parents:
diff changeset
64
09f9f0e29e47 v0.0.6 use format_source; v0.0.5 error handling & citation
peterjc
parents:
diff changeset
65 Using the common read name suffix conventions, it divides a FASTQ file into
09f9f0e29e47 v0.0.6 use format_source; v0.0.5 error handling & citation
peterjc
parents:
diff changeset
66 paired reads, and orphan or single reads.
09f9f0e29e47 v0.0.6 use format_source; v0.0.5 error handling & citation
peterjc
parents:
diff changeset
67
09f9f0e29e47 v0.0.6 use format_source; v0.0.5 error handling & citation
peterjc
parents:
diff changeset
68 The input file should be a valid FASTQ file which has been sorted so that
09f9f0e29e47 v0.0.6 use format_source; v0.0.5 error handling & citation
peterjc
parents:
diff changeset
69 any partner forward+reverse reads are consecutive. The output files all
09f9f0e29e47 v0.0.6 use format_source; v0.0.5 error handling & citation
peterjc
parents:
diff changeset
70 preserve this sort order. Pairings are recognised based on standard name
09f9f0e29e47 v0.0.6 use format_source; v0.0.5 error handling & citation
peterjc
parents:
diff changeset
71 suffixes. See below or run the tool with no arguments for more details.
09f9f0e29e47 v0.0.6 use format_source; v0.0.5 error handling & citation
peterjc
parents:
diff changeset
72
09f9f0e29e47 v0.0.6 use format_source; v0.0.5 error handling & citation
peterjc
parents:
diff changeset
73 Any reads where the forward/reverse naming suffix used is not recognised
09f9f0e29e47 v0.0.6 use format_source; v0.0.5 error handling & citation
peterjc
parents:
diff changeset
74 are treated as orphan reads. The tool supports the /1 and /2 convention
09f9f0e29e47 v0.0.6 use format_source; v0.0.5 error handling & citation
peterjc
parents:
diff changeset
75 originally used by Illumina, the .f and .r convention, the Sanger convention
09f9f0e29e47 v0.0.6 use format_source; v0.0.5 error handling & citation
peterjc
parents:
diff changeset
76 (see http://staden.sourceforge.net/manual/pregap4_unix_50.html for details),
09f9f0e29e47 v0.0.6 use format_source; v0.0.5 error handling & citation
peterjc
parents:
diff changeset
77 and the current Illumina convention where the reads get the same identifier
09f9f0e29e47 v0.0.6 use format_source; v0.0.5 error handling & citation
peterjc
parents:
diff changeset
78 with the fragment number in the description, for example:
09f9f0e29e47 v0.0.6 use format_source; v0.0.5 error handling & citation
peterjc
parents:
diff changeset
79
09f9f0e29e47 v0.0.6 use format_source; v0.0.5 error handling & citation
peterjc
parents:
diff changeset
80 * @HWI-ST916:79:D04M5ACXX:1:1101:10000:100326 1:N:0:TGNCCA
09f9f0e29e47 v0.0.6 use format_source; v0.0.5 error handling & citation
peterjc
parents:
diff changeset
81 * @HWI-ST916:79:D04M5ACXX:1:1101:10000:100326 2:N:0:TGNCCA
09f9f0e29e47 v0.0.6 use format_source; v0.0.5 error handling & citation
peterjc
parents:
diff changeset
82
09f9f0e29e47 v0.0.6 use format_source; v0.0.5 error handling & citation
peterjc
parents:
diff changeset
83 Note that this does support multiple forward and reverse reads per template
09f9f0e29e47 v0.0.6 use format_source; v0.0.5 error handling & citation
peterjc
parents:
diff changeset
84 (which is quite common with Sanger sequencing), e.g. this which is sorted
09f9f0e29e47 v0.0.6 use format_source; v0.0.5 error handling & citation
peterjc
parents:
diff changeset
85 alphabetically:
09f9f0e29e47 v0.0.6 use format_source; v0.0.5 error handling & citation
peterjc
parents:
diff changeset
86
09f9f0e29e47 v0.0.6 use format_source; v0.0.5 error handling & citation
peterjc
parents:
diff changeset
87 * WTSI_1055_4p17.p1kapIBF
09f9f0e29e47 v0.0.6 use format_source; v0.0.5 error handling & citation
peterjc
parents:
diff changeset
88 * WTSI_1055_4p17.p1kpIBF
09f9f0e29e47 v0.0.6 use format_source; v0.0.5 error handling & citation
peterjc
parents:
diff changeset
89 * WTSI_1055_4p17.q1kapIBR
09f9f0e29e47 v0.0.6 use format_source; v0.0.5 error handling & citation
peterjc
parents:
diff changeset
90 * WTSI_1055_4p17.q1kpIBR
09f9f0e29e47 v0.0.6 use format_source; v0.0.5 error handling & citation
peterjc
parents:
diff changeset
91
09f9f0e29e47 v0.0.6 use format_source; v0.0.5 error handling & citation
peterjc
parents:
diff changeset
92 or this where the reads already come in pairs:
09f9f0e29e47 v0.0.6 use format_source; v0.0.5 error handling & citation
peterjc
parents:
diff changeset
93
09f9f0e29e47 v0.0.6 use format_source; v0.0.5 error handling & citation
peterjc
parents:
diff changeset
94 * WTSI_1055_4p17.p1kapIBF
09f9f0e29e47 v0.0.6 use format_source; v0.0.5 error handling & citation
peterjc
parents:
diff changeset
95 * WTSI_1055_4p17.q1kapIBR
09f9f0e29e47 v0.0.6 use format_source; v0.0.5 error handling & citation
peterjc
parents:
diff changeset
96 * WTSI_1055_4p17.p1kpIBF
09f9f0e29e47 v0.0.6 use format_source; v0.0.5 error handling & citation
peterjc
parents:
diff changeset
97 * WTSI_1055_4p17.q1kpIBR
09f9f0e29e47 v0.0.6 use format_source; v0.0.5 error handling & citation
peterjc
parents:
diff changeset
98
09f9f0e29e47 v0.0.6 use format_source; v0.0.5 error handling & citation
peterjc
parents:
diff changeset
99 both become:
09f9f0e29e47 v0.0.6 use format_source; v0.0.5 error handling & citation
peterjc
parents:
diff changeset
100
09f9f0e29e47 v0.0.6 use format_source; v0.0.5 error handling & citation
peterjc
parents:
diff changeset
101 * WTSI_1055_4p17.p1kapIBF paired with WTSI_1055_4p17.q1kapIBR
09f9f0e29e47 v0.0.6 use format_source; v0.0.5 error handling & citation
peterjc
parents:
diff changeset
102 * WTSI_1055_4p17.p1kpIBF paired with WTSI_1055_4p17.q1kpIBR
09f9f0e29e47 v0.0.6 use format_source; v0.0.5 error handling & citation
peterjc
parents:
diff changeset
103
09f9f0e29e47 v0.0.6 use format_source; v0.0.5 error handling & citation
peterjc
parents:
diff changeset
104 **References**
09f9f0e29e47 v0.0.6 use format_source; v0.0.5 error handling & citation
peterjc
parents:
diff changeset
105
09f9f0e29e47 v0.0.6 use format_source; v0.0.5 error handling & citation
peterjc
parents:
diff changeset
106 If you use this Galaxy tool in work leading to a scientific publication please
09f9f0e29e47 v0.0.6 use format_source; v0.0.5 error handling & citation
peterjc
parents:
diff changeset
107 cite the following paper:
09f9f0e29e47 v0.0.6 use format_source; v0.0.5 error handling & citation
peterjc
parents:
diff changeset
108
09f9f0e29e47 v0.0.6 use format_source; v0.0.5 error handling & citation
peterjc
parents:
diff changeset
109 Peter J.A. Cock, Björn A. Grüning, Konrad Paszkiewicz and Leighton Pritchard (2013).
09f9f0e29e47 v0.0.6 use format_source; v0.0.5 error handling & citation
peterjc
parents:
diff changeset
110 Galaxy tools and workflows for sequence analysis with applications
09f9f0e29e47 v0.0.6 use format_source; v0.0.5 error handling & citation
peterjc
parents:
diff changeset
111 in molecular plant pathology. PeerJ 1:e167
09f9f0e29e47 v0.0.6 use format_source; v0.0.5 error handling & citation
peterjc
parents:
diff changeset
112 http://dx.doi.org/10.7717/peerj.167
09f9f0e29e47 v0.0.6 use format_source; v0.0.5 error handling & citation
peterjc
parents:
diff changeset
113
09f9f0e29e47 v0.0.6 use format_source; v0.0.5 error handling & citation
peterjc
parents:
diff changeset
114 This tool is available to install into other Galaxy Instances via the Galaxy
09f9f0e29e47 v0.0.6 use format_source; v0.0.5 error handling & citation
peterjc
parents:
diff changeset
115 Tool Shed at http://toolshed.g2.bx.psu.edu/view/peterjc/fastq_paired_unpaired
09f9f0e29e47 v0.0.6 use format_source; v0.0.5 error handling & citation
peterjc
parents:
diff changeset
116 </help>
09f9f0e29e47 v0.0.6 use format_source; v0.0.5 error handling & citation
peterjc
parents:
diff changeset
117 <citations>
09f9f0e29e47 v0.0.6 use format_source; v0.0.5 error handling & citation
peterjc
parents:
diff changeset
118 <citation type="doi">10.7717/peerj.167</citation>
09f9f0e29e47 v0.0.6 use format_source; v0.0.5 error handling & citation
peterjc
parents:
diff changeset
119 </citations>
09f9f0e29e47 v0.0.6 use format_source; v0.0.5 error handling & citation
peterjc
parents:
diff changeset
120 </tool>