annotate sickle.xml @ 9:7939dd56c4b4 draft

Uploaded
author nikhil-joshi
date Sat, 14 Mar 2015 18:19:57 -0400
parents
children
Ignore whitespace changes - Everywhere: Within whitespace: At end of lines:
rev   line source
9
7939dd56c4b4 Uploaded
nikhil-joshi
parents:
diff changeset
1 <tool id="sickle" name="Sickle" version="1.33">
7939dd56c4b4 Uploaded
nikhil-joshi
parents:
diff changeset
2 <description>Windowed Adaptive Trimming of FastQ data</description>
7939dd56c4b4 Uploaded
nikhil-joshi
parents:
diff changeset
3
7939dd56c4b4 Uploaded
nikhil-joshi
parents:
diff changeset
4 <command>
7939dd56c4b4 Uploaded
nikhil-joshi
parents:
diff changeset
5 sickle
7939dd56c4b4 Uploaded
nikhil-joshi
parents:
diff changeset
6
7939dd56c4b4 Uploaded
nikhil-joshi
parents:
diff changeset
7 #if str($readtype.single_or_paired) == "se":
7939dd56c4b4 Uploaded
nikhil-joshi
parents:
diff changeset
8 se -f $input_single -o $output_single
7939dd56c4b4 Uploaded
nikhil-joshi
parents:
diff changeset
9
7939dd56c4b4 Uploaded
nikhil-joshi
parents:
diff changeset
10 #if $input_single.ext == "fastq":
7939dd56c4b4 Uploaded
nikhil-joshi
parents:
diff changeset
11 -t sanger
7939dd56c4b4 Uploaded
nikhil-joshi
parents:
diff changeset
12 #else if $input_single.ext == "fastqsanger":
7939dd56c4b4 Uploaded
nikhil-joshi
parents:
diff changeset
13 -t sanger
7939dd56c4b4 Uploaded
nikhil-joshi
parents:
diff changeset
14 #else if $input_single.ext == "fastqillumina":
7939dd56c4b4 Uploaded
nikhil-joshi
parents:
diff changeset
15 -t illumina
7939dd56c4b4 Uploaded
nikhil-joshi
parents:
diff changeset
16 #else if $input_single.ext == "fastqsolexa":
7939dd56c4b4 Uploaded
nikhil-joshi
parents:
diff changeset
17 -t solexa
7939dd56c4b4 Uploaded
nikhil-joshi
parents:
diff changeset
18 #end if
7939dd56c4b4 Uploaded
nikhil-joshi
parents:
diff changeset
19
7939dd56c4b4 Uploaded
nikhil-joshi
parents:
diff changeset
20 #end if
7939dd56c4b4 Uploaded
nikhil-joshi
parents:
diff changeset
21
7939dd56c4b4 Uploaded
nikhil-joshi
parents:
diff changeset
22 #if str($readtype.single_or_paired) == "pe_combo":
7939dd56c4b4 Uploaded
nikhil-joshi
parents:
diff changeset
23 #if $readtype.output_n:
7939dd56c4b4 Uploaded
nikhil-joshi
parents:
diff changeset
24 pe -c $input_combo -M $output_combo
7939dd56c4b4 Uploaded
nikhil-joshi
parents:
diff changeset
25 #else
7939dd56c4b4 Uploaded
nikhil-joshi
parents:
diff changeset
26 pe -c $input_combo -m $output_combo -s $output_combo_single
7939dd56c4b4 Uploaded
nikhil-joshi
parents:
diff changeset
27 #end if
7939dd56c4b4 Uploaded
nikhil-joshi
parents:
diff changeset
28
7939dd56c4b4 Uploaded
nikhil-joshi
parents:
diff changeset
29 #if $input_combo.ext == "fastq":
7939dd56c4b4 Uploaded
nikhil-joshi
parents:
diff changeset
30 -t sanger
7939dd56c4b4 Uploaded
nikhil-joshi
parents:
diff changeset
31 #else if $input_combo.ext == "fastqsanger":
7939dd56c4b4 Uploaded
nikhil-joshi
parents:
diff changeset
32 -t sanger
7939dd56c4b4 Uploaded
nikhil-joshi
parents:
diff changeset
33 #else if $input_combo.ext == "fastqillumina":
7939dd56c4b4 Uploaded
nikhil-joshi
parents:
diff changeset
34 -t illumina
7939dd56c4b4 Uploaded
nikhil-joshi
parents:
diff changeset
35 #else if $input_combo.ext == "fastqsolexa":
7939dd56c4b4 Uploaded
nikhil-joshi
parents:
diff changeset
36 -t solexa
7939dd56c4b4 Uploaded
nikhil-joshi
parents:
diff changeset
37 #end if
7939dd56c4b4 Uploaded
nikhil-joshi
parents:
diff changeset
38
7939dd56c4b4 Uploaded
nikhil-joshi
parents:
diff changeset
39 #end if
7939dd56c4b4 Uploaded
nikhil-joshi
parents:
diff changeset
40
7939dd56c4b4 Uploaded
nikhil-joshi
parents:
diff changeset
41 #if str($readtype.single_or_paired) == "pe_sep":
7939dd56c4b4 Uploaded
nikhil-joshi
parents:
diff changeset
42 pe -f $input_paired1 -r $input_paired2 -o $output_paired1 -p $output_paired2 -s $output_paired_single
7939dd56c4b4 Uploaded
nikhil-joshi
parents:
diff changeset
43
7939dd56c4b4 Uploaded
nikhil-joshi
parents:
diff changeset
44 #if $input_paired1.ext == "fastq":
7939dd56c4b4 Uploaded
nikhil-joshi
parents:
diff changeset
45 -t sanger
7939dd56c4b4 Uploaded
nikhil-joshi
parents:
diff changeset
46 #else if $input_paired1.ext == "fastqsanger":
7939dd56c4b4 Uploaded
nikhil-joshi
parents:
diff changeset
47 -t sanger
7939dd56c4b4 Uploaded
nikhil-joshi
parents:
diff changeset
48 #else if $input_paired1.ext == "fastqillumina":
7939dd56c4b4 Uploaded
nikhil-joshi
parents:
diff changeset
49 -t illumina
7939dd56c4b4 Uploaded
nikhil-joshi
parents:
diff changeset
50 #else if $input_paired1.ext == "fastqsolexa":
7939dd56c4b4 Uploaded
nikhil-joshi
parents:
diff changeset
51 -t solexa
7939dd56c4b4 Uploaded
nikhil-joshi
parents:
diff changeset
52 #end if
7939dd56c4b4 Uploaded
nikhil-joshi
parents:
diff changeset
53
7939dd56c4b4 Uploaded
nikhil-joshi
parents:
diff changeset
54 #end if
7939dd56c4b4 Uploaded
nikhil-joshi
parents:
diff changeset
55
7939dd56c4b4 Uploaded
nikhil-joshi
parents:
diff changeset
56 #if str($qual_threshold) != "":
7939dd56c4b4 Uploaded
nikhil-joshi
parents:
diff changeset
57 -q $qual_threshold
7939dd56c4b4 Uploaded
nikhil-joshi
parents:
diff changeset
58 #end if
7939dd56c4b4 Uploaded
nikhil-joshi
parents:
diff changeset
59
7939dd56c4b4 Uploaded
nikhil-joshi
parents:
diff changeset
60 #if str($length_threshold) != "":
7939dd56c4b4 Uploaded
nikhil-joshi
parents:
diff changeset
61 -l $length_threshold
7939dd56c4b4 Uploaded
nikhil-joshi
parents:
diff changeset
62 #end if
7939dd56c4b4 Uploaded
nikhil-joshi
parents:
diff changeset
63
7939dd56c4b4 Uploaded
nikhil-joshi
parents:
diff changeset
64 #if $no_five_prime:
7939dd56c4b4 Uploaded
nikhil-joshi
parents:
diff changeset
65 -x
7939dd56c4b4 Uploaded
nikhil-joshi
parents:
diff changeset
66 #end if
7939dd56c4b4 Uploaded
nikhil-joshi
parents:
diff changeset
67
7939dd56c4b4 Uploaded
nikhil-joshi
parents:
diff changeset
68 #if $trunc_n:
7939dd56c4b4 Uploaded
nikhil-joshi
parents:
diff changeset
69 -n
7939dd56c4b4 Uploaded
nikhil-joshi
parents:
diff changeset
70 #end if
7939dd56c4b4 Uploaded
nikhil-joshi
parents:
diff changeset
71
7939dd56c4b4 Uploaded
nikhil-joshi
parents:
diff changeset
72 </command>
7939dd56c4b4 Uploaded
nikhil-joshi
parents:
diff changeset
73
7939dd56c4b4 Uploaded
nikhil-joshi
parents:
diff changeset
74 <inputs>
7939dd56c4b4 Uploaded
nikhil-joshi
parents:
diff changeset
75 <conditional name="readtype">
7939dd56c4b4 Uploaded
nikhil-joshi
parents:
diff changeset
76 <param name="single_or_paired" type="select" optional="false" label="Single-End or Paired-End reads?" help="Note: Sickle will infer the quality type of the file from its datatype. I.e., if the datatype is fastqsanger, then the quality type is sanger. The default is fastqsanger.">
7939dd56c4b4 Uploaded
nikhil-joshi
parents:
diff changeset
77 <option value="se" selected="true">Single-End</option>
7939dd56c4b4 Uploaded
nikhil-joshi
parents:
diff changeset
78 <option value="pe_combo">Paired-End (one interleaved input file)</option>
7939dd56c4b4 Uploaded
nikhil-joshi
parents:
diff changeset
79 <option value="pe_sep">Paired-End (two separate input files)</option>
7939dd56c4b4 Uploaded
nikhil-joshi
parents:
diff changeset
80 </param>
7939dd56c4b4 Uploaded
nikhil-joshi
parents:
diff changeset
81
7939dd56c4b4 Uploaded
nikhil-joshi
parents:
diff changeset
82 <when value="se">
7939dd56c4b4 Uploaded
nikhil-joshi
parents:
diff changeset
83 <param format="fastq, fastqsanger, fastqillumina, fastqsolexa" name="input_single" type="data" optional="false" label="Single-End FastQ Reads"/>
7939dd56c4b4 Uploaded
nikhil-joshi
parents:
diff changeset
84 </when>
7939dd56c4b4 Uploaded
nikhil-joshi
parents:
diff changeset
85
7939dd56c4b4 Uploaded
nikhil-joshi
parents:
diff changeset
86 <when value="pe_combo">
7939dd56c4b4 Uploaded
nikhil-joshi
parents:
diff changeset
87 <param format="fastq, fastqsanger, fastqillumina, fastqsolexa" name="input_combo" type="data" optional="false" label="Paired-End Interleaved FastQ Reads"/>
7939dd56c4b4 Uploaded
nikhil-joshi
parents:
diff changeset
88 <param name="output_n" type="boolean" label="Output only one file with all reads" help="This will output only one file with all the reads, where the reads that did not pass filter will be replaced with a single 'N', rather than discarded."/>
7939dd56c4b4 Uploaded
nikhil-joshi
parents:
diff changeset
89 </when>
7939dd56c4b4 Uploaded
nikhil-joshi
parents:
diff changeset
90
7939dd56c4b4 Uploaded
nikhil-joshi
parents:
diff changeset
91 <when value="pe_sep">
7939dd56c4b4 Uploaded
nikhil-joshi
parents:
diff changeset
92 <param format="fastq, fastqsanger, fastqillumina, fastqsolexa" name="input_paired1" type="data" optional="false" label="Paired-End Forward Strand FastQ Reads"/>
7939dd56c4b4 Uploaded
nikhil-joshi
parents:
diff changeset
93 <param format="fastq, fastqsanger, fastqillumina, fastqsolexa" name="input_paired2" type="data" optional="false" label="Paired-End Reverse Strand FastQ Reads"/>
7939dd56c4b4 Uploaded
nikhil-joshi
parents:
diff changeset
94 </when>
7939dd56c4b4 Uploaded
nikhil-joshi
parents:
diff changeset
95 </conditional>
7939dd56c4b4 Uploaded
nikhil-joshi
parents:
diff changeset
96
7939dd56c4b4 Uploaded
nikhil-joshi
parents:
diff changeset
97 <param name="qual_threshold" value="20" type="integer" optional="true" label="Quality Threshold">
7939dd56c4b4 Uploaded
nikhil-joshi
parents:
diff changeset
98 <validator type="in_range" min="0" message="Minimum value is 0"/>
7939dd56c4b4 Uploaded
nikhil-joshi
parents:
diff changeset
99 </param>
7939dd56c4b4 Uploaded
nikhil-joshi
parents:
diff changeset
100
7939dd56c4b4 Uploaded
nikhil-joshi
parents:
diff changeset
101 <param name="length_threshold" value="20" type="integer" optional="true" label="Length Threshold">
7939dd56c4b4 Uploaded
nikhil-joshi
parents:
diff changeset
102 <validator type="in_range" min="0" message="Minimum value is 0"/>
7939dd56c4b4 Uploaded
nikhil-joshi
parents:
diff changeset
103 </param>
7939dd56c4b4 Uploaded
nikhil-joshi
parents:
diff changeset
104
7939dd56c4b4 Uploaded
nikhil-joshi
parents:
diff changeset
105 <param name="no_five_prime" type="boolean" label="Don't do 5' trimming"/>
7939dd56c4b4 Uploaded
nikhil-joshi
parents:
diff changeset
106 <param name="trunc_n" type="boolean" label="Truncate sequences with Ns at first N position"/>
7939dd56c4b4 Uploaded
nikhil-joshi
parents:
diff changeset
107 </inputs>
7939dd56c4b4 Uploaded
nikhil-joshi
parents:
diff changeset
108
7939dd56c4b4 Uploaded
nikhil-joshi
parents:
diff changeset
109 <outputs>
7939dd56c4b4 Uploaded
nikhil-joshi
parents:
diff changeset
110 <data format_source="input_single" name="output_single" label="Single-End output of ${tool.name} on ${on_string}">
7939dd56c4b4 Uploaded
nikhil-joshi
parents:
diff changeset
111 <filter>(readtype['single_or_paired'] == 'se')</filter>
7939dd56c4b4 Uploaded
nikhil-joshi
parents:
diff changeset
112 </data>
7939dd56c4b4 Uploaded
nikhil-joshi
parents:
diff changeset
113
7939dd56c4b4 Uploaded
nikhil-joshi
parents:
diff changeset
114 <data format_source="input_combo" name="output_combo" label="Paired-End interleaved output of ${tool.name} on ${on_string}">
7939dd56c4b4 Uploaded
nikhil-joshi
parents:
diff changeset
115 <filter>(readtype['single_or_paired'] == 'pe_combo')</filter>
7939dd56c4b4 Uploaded
nikhil-joshi
parents:
diff changeset
116 </data>
7939dd56c4b4 Uploaded
nikhil-joshi
parents:
diff changeset
117
7939dd56c4b4 Uploaded
nikhil-joshi
parents:
diff changeset
118 <data format_source="input_combo" name="output_combo_single" label="Singletons from Paired-End interleaved output of ${tool.name} on ${on_string}">
7939dd56c4b4 Uploaded
nikhil-joshi
parents:
diff changeset
119 <filter>(readtype['single_or_paired'] == 'pe_combo')</filter>
7939dd56c4b4 Uploaded
nikhil-joshi
parents:
diff changeset
120 <filter>(readtype['output_n'] == False)</filter>
7939dd56c4b4 Uploaded
nikhil-joshi
parents:
diff changeset
121 </data>
7939dd56c4b4 Uploaded
nikhil-joshi
parents:
diff changeset
122
7939dd56c4b4 Uploaded
nikhil-joshi
parents:
diff changeset
123 <data format_source="input_paired1" name="output_paired1" label="Paired-End forward strand output of ${tool.name} on ${on_string}">
7939dd56c4b4 Uploaded
nikhil-joshi
parents:
diff changeset
124 <filter>(readtype['single_or_paired'] == 'pe_sep')</filter>
7939dd56c4b4 Uploaded
nikhil-joshi
parents:
diff changeset
125 </data>
7939dd56c4b4 Uploaded
nikhil-joshi
parents:
diff changeset
126
7939dd56c4b4 Uploaded
nikhil-joshi
parents:
diff changeset
127 <data format_source="input_paired2" name="output_paired2" label="Paired-End reverse strand output of ${tool.name} on ${on_string}">
7939dd56c4b4 Uploaded
nikhil-joshi
parents:
diff changeset
128 <filter>(readtype['single_or_paired'] == 'pe_sep')</filter>
7939dd56c4b4 Uploaded
nikhil-joshi
parents:
diff changeset
129 </data>
7939dd56c4b4 Uploaded
nikhil-joshi
parents:
diff changeset
130
7939dd56c4b4 Uploaded
nikhil-joshi
parents:
diff changeset
131 <data format_source="input_paired1" name="output_paired_single" label="Singletons from Paired-End output of ${tool.name} on ${on_string}">
7939dd56c4b4 Uploaded
nikhil-joshi
parents:
diff changeset
132 <filter>(readtype['single_or_paired'] == 'pe_sep')</filter>
7939dd56c4b4 Uploaded
nikhil-joshi
parents:
diff changeset
133 </data>
7939dd56c4b4 Uploaded
nikhil-joshi
parents:
diff changeset
134 </outputs>
7939dd56c4b4 Uploaded
nikhil-joshi
parents:
diff changeset
135
7939dd56c4b4 Uploaded
nikhil-joshi
parents:
diff changeset
136 <help>
7939dd56c4b4 Uploaded
nikhil-joshi
parents:
diff changeset
137 **Sickle - A windowed adaptive trimming tool for FASTQ files using quality**
7939dd56c4b4 Uploaded
nikhil-joshi
parents:
diff changeset
138
7939dd56c4b4 Uploaded
nikhil-joshi
parents:
diff changeset
139 .. class:: infomark
7939dd56c4b4 Uploaded
nikhil-joshi
parents:
diff changeset
140
7939dd56c4b4 Uploaded
nikhil-joshi
parents:
diff changeset
141 **About**
7939dd56c4b4 Uploaded
nikhil-joshi
parents:
diff changeset
142
7939dd56c4b4 Uploaded
nikhil-joshi
parents:
diff changeset
143 Most modern sequencing technologies produce reads that have
7939dd56c4b4 Uploaded
nikhil-joshi
parents:
diff changeset
144 deteriorating quality towards the 3'-end and some towards the 5'-end
7939dd56c4b4 Uploaded
nikhil-joshi
parents:
diff changeset
145 as well. Incorrectly called bases in both regions negatively impact
7939dd56c4b4 Uploaded
nikhil-joshi
parents:
diff changeset
146 assembles, mapping, and downstream bioinformatics analyses.
7939dd56c4b4 Uploaded
nikhil-joshi
parents:
diff changeset
147
7939dd56c4b4 Uploaded
nikhil-joshi
parents:
diff changeset
148 Sickle is a tool that uses sliding windows along with quality and
7939dd56c4b4 Uploaded
nikhil-joshi
parents:
diff changeset
149 length thresholds to determine when quality is sufficiently low to
7939dd56c4b4 Uploaded
nikhil-joshi
parents:
diff changeset
150 trim the 3'-end of reads and also determines when the quality is
7939dd56c4b4 Uploaded
nikhil-joshi
parents:
diff changeset
151 sufficiently high enough to trim the 5'-end of reads. It will also
7939dd56c4b4 Uploaded
nikhil-joshi
parents:
diff changeset
152 discard reads based upon the length threshold. It takes the quality
7939dd56c4b4 Uploaded
nikhil-joshi
parents:
diff changeset
153 values and slides a window across them whose length is 0.1 times the
7939dd56c4b4 Uploaded
nikhil-joshi
parents:
diff changeset
154 length of the read. If this length is less than 1, then the window is
7939dd56c4b4 Uploaded
nikhil-joshi
parents:
diff changeset
155 set to be equal to the length of the read. Otherwise, the window
7939dd56c4b4 Uploaded
nikhil-joshi
parents:
diff changeset
156 slides along the quality values until the average quality in the
7939dd56c4b4 Uploaded
nikhil-joshi
parents:
diff changeset
157 window rises above the threshold, at which point the algorithm
7939dd56c4b4 Uploaded
nikhil-joshi
parents:
diff changeset
158 determines where within the window the rise occurs and cuts the read
7939dd56c4b4 Uploaded
nikhil-joshi
parents:
diff changeset
159 and quality there for the 5'-end cut. Then when the average quality
7939dd56c4b4 Uploaded
nikhil-joshi
parents:
diff changeset
160 in the window drops below the threshold, the algorithm determines
7939dd56c4b4 Uploaded
nikhil-joshi
parents:
diff changeset
161 where in the window the drop occurs and cuts both the read and quality
7939dd56c4b4 Uploaded
nikhil-joshi
parents:
diff changeset
162 strings there for the 3'-end cut. However, if the length of the
7939dd56c4b4 Uploaded
nikhil-joshi
parents:
diff changeset
163 remaining sequence is less than the minimum length threshold, then the
7939dd56c4b4 Uploaded
nikhil-joshi
parents:
diff changeset
164 read is discarded entirely (or replaced with an "N" record). 5'-end
7939dd56c4b4 Uploaded
nikhil-joshi
parents:
diff changeset
165 trimming can be disabled. Sickle also has an option to truncate reads
7939dd56c4b4 Uploaded
nikhil-joshi
parents:
diff changeset
166 with Ns at the first N position.
7939dd56c4b4 Uploaded
nikhil-joshi
parents:
diff changeset
167
7939dd56c4b4 Uploaded
nikhil-joshi
parents:
diff changeset
168 Sickle supports three types of quality values: Illumina, Solexa, and
7939dd56c4b4 Uploaded
nikhil-joshi
parents:
diff changeset
169 Sanger. Note that the Solexa quality setting is an approximation (the
7939dd56c4b4 Uploaded
nikhil-joshi
parents:
diff changeset
170 actual conversion is a non-linear transformation). The end
7939dd56c4b4 Uploaded
nikhil-joshi
parents:
diff changeset
171 approximation is close. Illumina quality refers to qualities encoded
7939dd56c4b4 Uploaded
nikhil-joshi
parents:
diff changeset
172 with the CASAVA pipeline between versions 1.3 and 1.7. Illumina
7939dd56c4b4 Uploaded
nikhil-joshi
parents:
diff changeset
173 quality using CASAVA >= 1.8 is Sanger encoded. The quality value will
7939dd56c4b4 Uploaded
nikhil-joshi
parents:
diff changeset
174 be determined from the datatype of the data, i.e. a fastqsanger datatype
7939dd56c4b4 Uploaded
nikhil-joshi
parents:
diff changeset
175 is assumed to be Sanger encoded.
7939dd56c4b4 Uploaded
nikhil-joshi
parents:
diff changeset
176
7939dd56c4b4 Uploaded
nikhil-joshi
parents:
diff changeset
177 Note that Sickle will remove the 2nd fastq record header (on the "+"
7939dd56c4b4 Uploaded
nikhil-joshi
parents:
diff changeset
178 line) and replace it with simply a "+". This is the default format for
7939dd56c4b4 Uploaded
nikhil-joshi
parents:
diff changeset
179 CASAVA >= 1.8.
7939dd56c4b4 Uploaded
nikhil-joshi
parents:
diff changeset
180
7939dd56c4b4 Uploaded
nikhil-joshi
parents:
diff changeset
181 -----
7939dd56c4b4 Uploaded
nikhil-joshi
parents:
diff changeset
182
7939dd56c4b4 Uploaded
nikhil-joshi
parents:
diff changeset
183 .. class:: infomark
7939dd56c4b4 Uploaded
nikhil-joshi
parents:
diff changeset
184
7939dd56c4b4 Uploaded
nikhil-joshi
parents:
diff changeset
185 **Options**
7939dd56c4b4 Uploaded
nikhil-joshi
parents:
diff changeset
186
7939dd56c4b4 Uploaded
nikhil-joshi
parents:
diff changeset
187 **Single-end**
7939dd56c4b4 Uploaded
nikhil-joshi
parents:
diff changeset
188
7939dd56c4b4 Uploaded
nikhil-joshi
parents:
diff changeset
189 This option takes one single-end input file and outputs one single-end
7939dd56c4b4 Uploaded
nikhil-joshi
parents:
diff changeset
190 output file of reads that passed the filters.
7939dd56c4b4 Uploaded
nikhil-joshi
parents:
diff changeset
191
7939dd56c4b4 Uploaded
nikhil-joshi
parents:
diff changeset
192 **Paired-End (one interleaved input file)**
7939dd56c4b4 Uploaded
nikhil-joshi
parents:
diff changeset
193
7939dd56c4b4 Uploaded
nikhil-joshi
parents:
diff changeset
194 This option takes as input one interleaved paired-end file. If you then
7939dd56c4b4 Uploaded
nikhil-joshi
parents:
diff changeset
195 check the "Output only one file with all reads" checkbox, it will output
7939dd56c4b4 Uploaded
nikhil-joshi
parents:
diff changeset
196 one interleaved file where any read that did not pass filter will be replaced
7939dd56c4b4 Uploaded
nikhil-joshi
parents:
diff changeset
197 with a FastQ record where the sequence is a single "N" and the quality is the
7939dd56c4b4 Uploaded
nikhil-joshi
parents:
diff changeset
198 lowest quality possible for that quality type. This will preserve the paired
7939dd56c4b4 Uploaded
nikhil-joshi
parents:
diff changeset
199 nature of the data. If you leave the checkbox unchecked, it will output two files,
7939dd56c4b4 Uploaded
nikhil-joshi
parents:
diff changeset
200 one interleaved file with all the passed pairs and one singletons file where only
7939dd56c4b4 Uploaded
nikhil-joshi
parents:
diff changeset
201 one of the pair passed filter.
7939dd56c4b4 Uploaded
nikhil-joshi
parents:
diff changeset
202
7939dd56c4b4 Uploaded
nikhil-joshi
parents:
diff changeset
203 **Paired-End (two separate input files)**
7939dd56c4b4 Uploaded
nikhil-joshi
parents:
diff changeset
204
7939dd56c4b4 Uploaded
nikhil-joshi
parents:
diff changeset
205 This option takes two separate (forward and reverse) paired-end files as input.
7939dd56c4b4 Uploaded
nikhil-joshi
parents:
diff changeset
206 The output is three files: Two paired-end files with pairs that passed filter and
7939dd56c4b4 Uploaded
nikhil-joshi
parents:
diff changeset
207 a singletons file where only one of the pair passed filter.
7939dd56c4b4 Uploaded
nikhil-joshi
parents:
diff changeset
208
7939dd56c4b4 Uploaded
nikhil-joshi
parents:
diff changeset
209 **Quality threshold**
7939dd56c4b4 Uploaded
nikhil-joshi
parents:
diff changeset
210
7939dd56c4b4 Uploaded
nikhil-joshi
parents:
diff changeset
211 Input your desired quality threshold. This threshold is phred-scaled, which is typically
7939dd56c4b4 Uploaded
nikhil-joshi
parents:
diff changeset
212 values between 0-41 for FastQ data.
7939dd56c4b4 Uploaded
nikhil-joshi
parents:
diff changeset
213
7939dd56c4b4 Uploaded
nikhil-joshi
parents:
diff changeset
214 **Length threshold**
7939dd56c4b4 Uploaded
nikhil-joshi
parents:
diff changeset
215
7939dd56c4b4 Uploaded
nikhil-joshi
parents:
diff changeset
216 Input your desired length threshold. This is the threshold to determine if a read is kept
7939dd56c4b4 Uploaded
nikhil-joshi
parents:
diff changeset
217 after all the trimming steps are done.
7939dd56c4b4 Uploaded
nikhil-joshi
parents:
diff changeset
218
7939dd56c4b4 Uploaded
nikhil-joshi
parents:
diff changeset
219 **Disable 5-prime trimming**
7939dd56c4b4 Uploaded
nikhil-joshi
parents:
diff changeset
220
7939dd56c4b4 Uploaded
nikhil-joshi
parents:
diff changeset
221 An option to disable trimming the read on the 5-prime end. This trimming trims the read
7939dd56c4b4 Uploaded
nikhil-joshi
parents:
diff changeset
222 if the average quality values dip below the quality threshold at the 5-prime end.
7939dd56c4b4 Uploaded
nikhil-joshi
parents:
diff changeset
223
7939dd56c4b4 Uploaded
nikhil-joshi
parents:
diff changeset
224 **Truncate sequences with Ns**
7939dd56c4b4 Uploaded
nikhil-joshi
parents:
diff changeset
225
7939dd56c4b4 Uploaded
nikhil-joshi
parents:
diff changeset
226 This option will trim a read at the first "N" base in the read after doing quality trimming.
7939dd56c4b4 Uploaded
nikhil-joshi
parents:
diff changeset
227 It is then still subject to the length threshold.
7939dd56c4b4 Uploaded
nikhil-joshi
parents:
diff changeset
228
7939dd56c4b4 Uploaded
nikhil-joshi
parents:
diff changeset
229 -----
7939dd56c4b4 Uploaded
nikhil-joshi
parents:
diff changeset
230
7939dd56c4b4 Uploaded
nikhil-joshi
parents:
diff changeset
231 .. class:: infomark
7939dd56c4b4 Uploaded
nikhil-joshi
parents:
diff changeset
232
7939dd56c4b4 Uploaded
nikhil-joshi
parents:
diff changeset
233 **Citation**
7939dd56c4b4 Uploaded
nikhil-joshi
parents:
diff changeset
234
7939dd56c4b4 Uploaded
nikhil-joshi
parents:
diff changeset
235 Sickle doesn't have a paper, but you can cite it like this::
7939dd56c4b4 Uploaded
nikhil-joshi
parents:
diff changeset
236
7939dd56c4b4 Uploaded
nikhil-joshi
parents:
diff changeset
237 Joshi NA, Fass JN. (2011). Sickle: A sliding-window, adaptive, quality-based trimming tool for FastQ files
7939dd56c4b4 Uploaded
nikhil-joshi
parents:
diff changeset
238 (Version 1.33) [Software]. Available at https://github.com/najoshi/sickle.
7939dd56c4b4 Uploaded
nikhil-joshi
parents:
diff changeset
239
7939dd56c4b4 Uploaded
nikhil-joshi
parents:
diff changeset
240 -----
7939dd56c4b4 Uploaded
nikhil-joshi
parents:
diff changeset
241
7939dd56c4b4 Uploaded
nikhil-joshi
parents:
diff changeset
242 Copyright: Nikhil Joshi
7939dd56c4b4 Uploaded
nikhil-joshi
parents:
diff changeset
243
7939dd56c4b4 Uploaded
nikhil-joshi
parents:
diff changeset
244 http://bioinformatics.ucdavis.edu
7939dd56c4b4 Uploaded
nikhil-joshi
parents:
diff changeset
245
7939dd56c4b4 Uploaded
nikhil-joshi
parents:
diff changeset
246 http://github.com/ucdavis-bioinformatics
7939dd56c4b4 Uploaded
nikhil-joshi
parents:
diff changeset
247
7939dd56c4b4 Uploaded
nikhil-joshi
parents:
diff changeset
248 http://github.com/najoshi
7939dd56c4b4 Uploaded
nikhil-joshi
parents:
diff changeset
249
7939dd56c4b4 Uploaded
nikhil-joshi
parents:
diff changeset
250 </help>
7939dd56c4b4 Uploaded
nikhil-joshi
parents:
diff changeset
251
7939dd56c4b4 Uploaded
nikhil-joshi
parents:
diff changeset
252 </tool>