annotate paired_fastq_filtering.xml @ 34:91996b991991 draft default tip

Uploaded
author petr-novak
date Fri, 16 Feb 2024 15:22:21 +0000
parents f1738f8649b0
children
Ignore whitespace changes - Everywhere: Within whitespace: At end of lines:
rev   line source
23
36c418bca8b2 planemo upload commit 20bdf879b52796d3fb251a20807191ff02084d3c-dirty
petr-novak
parents: 22
diff changeset
1 <tool id="paired_fastq_filtering" name="Preprocessing of FASTQ paired-end reads" version="1.0.0.3">
22
58807b35777a planemo upload commit 20bdf879b52796d3fb251a20807191ff02084d3c-dirty
petr-novak
parents: 10
diff changeset
2 <stdio>
23
36c418bca8b2 planemo upload commit 20bdf879b52796d3fb251a20807191ff02084d3c-dirty
petr-novak
parents: 22
diff changeset
3 <exit_code range="1:" level="fatal" description="Error"/>
22
58807b35777a planemo upload commit 20bdf879b52796d3fb251a20807191ff02084d3c-dirty
petr-novak
parents: 10
diff changeset
4 </stdio>
58807b35777a planemo upload commit 20bdf879b52796d3fb251a20807191ff02084d3c-dirty
petr-novak
parents: 10
diff changeset
5 <description>
58807b35777a planemo upload commit 20bdf879b52796d3fb251a20807191ff02084d3c-dirty
petr-novak
parents: 10
diff changeset
6 Preprocessing of paired-end reads in FASTQ format
58807b35777a planemo upload commit 20bdf879b52796d3fb251a20807191ff02084d3c-dirty
petr-novak
parents: 10
diff changeset
7 including trimming, quality filtering, cutadapt filtering and interlacing. Broken
58807b35777a planemo upload commit 20bdf879b52796d3fb251a20807191ff02084d3c-dirty
petr-novak
parents: 10
diff changeset
8 pairs are discarded.
58807b35777a planemo upload commit 20bdf879b52796d3fb251a20807191ff02084d3c-dirty
petr-novak
parents: 10
diff changeset
9 </description>
58807b35777a planemo upload commit 20bdf879b52796d3fb251a20807191ff02084d3c-dirty
petr-novak
parents: 10
diff changeset
10 <requirements>
58807b35777a planemo upload commit 20bdf879b52796d3fb251a20807191ff02084d3c-dirty
petr-novak
parents: 10
diff changeset
11 <requirement type="package">blast</requirement>
33
f1738f8649b0 planemo upload commit 39094a128ea3dd2c39f4997c6de739c33c07e5f3-dirty
petr-novak
parents: 23
diff changeset
12 <requirement type="package" version="4.4">cutadapt</requirement>
22
58807b35777a planemo upload commit 20bdf879b52796d3fb251a20807191ff02084d3c-dirty
petr-novak
parents: 10
diff changeset
13 <requirement type="package">bioconductor-shortread</requirement>
58807b35777a planemo upload commit 20bdf879b52796d3fb251a20807191ff02084d3c-dirty
petr-novak
parents: 10
diff changeset
14 <requirement type="package">r-optparse</requirement>
58807b35777a planemo upload commit 20bdf879b52796d3fb251a20807191ff02084d3c-dirty
petr-novak
parents: 10
diff changeset
15 </requirements>
58807b35777a planemo upload commit 20bdf879b52796d3fb251a20807191ff02084d3c-dirty
petr-novak
parents: 10
diff changeset
16 <required_files>
58807b35777a planemo upload commit 20bdf879b52796d3fb251a20807191ff02084d3c-dirty
petr-novak
parents: 10
diff changeset
17 <include type="literal" path="paired_fastq_filtering_wrapper.sh"/>
58807b35777a planemo upload commit 20bdf879b52796d3fb251a20807191ff02084d3c-dirty
petr-novak
parents: 10
diff changeset
18 <include type="literal" path="paired_fastq_filtering.R"/>
58807b35777a planemo upload commit 20bdf879b52796d3fb251a20807191ff02084d3c-dirty
petr-novak
parents: 10
diff changeset
19 <include type="literal" path="fasta_interlacer.py"/>
58807b35777a planemo upload commit 20bdf879b52796d3fb251a20807191ff02084d3c-dirty
petr-novak
parents: 10
diff changeset
20 </required_files>
58807b35777a planemo upload commit 20bdf879b52796d3fb251a20807191ff02084d3c-dirty
petr-novak
parents: 10
diff changeset
21 <command>
33
f1738f8649b0 planemo upload commit 39094a128ea3dd2c39f4997c6de739c33c07e5f3-dirty
petr-novak
parents: 23
diff changeset
22 cutadapt --version;
22
58807b35777a planemo upload commit 20bdf879b52796d3fb251a20807191ff02084d3c-dirty
petr-novak
parents: 10
diff changeset
23 bash '$__tool_directory__'/paired_fastq_filtering_wrapper.sh -a ${A} -b ${B} -o
58807b35777a planemo upload commit 20bdf879b52796d3fb251a20807191ff02084d3c-dirty
petr-novak
parents: 10
diff changeset
24 ${paired} -c ${cut_off} -p ${percent_above} -N ${max_n} $rename -G ${png_output}
0
a4cd8608ef6b Uploaded
petr-novak
parents:
diff changeset
25
22
58807b35777a planemo upload commit 20bdf879b52796d3fb251a20807191ff02084d3c-dirty
petr-novak
parents: 10
diff changeset
26 #if $sampling.sequence_sampling :
58807b35777a planemo upload commit 20bdf879b52796d3fb251a20807191ff02084d3c-dirty
petr-novak
parents: 10
diff changeset
27 -n $sampling.sample_size
58807b35777a planemo upload commit 20bdf879b52796d3fb251a20807191ff02084d3c-dirty
petr-novak
parents: 10
diff changeset
28 #end if
0
a4cd8608ef6b Uploaded
petr-novak
parents:
diff changeset
29
22
58807b35777a planemo upload commit 20bdf879b52796d3fb251a20807191ff02084d3c-dirty
petr-novak
parents: 10
diff changeset
30 #if $trimming.sequence_trimming :
58807b35777a planemo upload commit 20bdf879b52796d3fb251a20807191ff02084d3c-dirty
petr-novak
parents: 10
diff changeset
31 -e $trimming.trim_end -s $trimming.trim_start
58807b35777a planemo upload commit 20bdf879b52796d3fb251a20807191ff02084d3c-dirty
petr-novak
parents: 10
diff changeset
32 #end if
0
a4cd8608ef6b Uploaded
petr-novak
parents:
diff changeset
33
22
58807b35777a planemo upload commit 20bdf879b52796d3fb251a20807191ff02084d3c-dirty
petr-novak
parents: 10
diff changeset
34 #if $cutadapt.use_custom :
58807b35777a planemo upload commit 20bdf879b52796d3fb251a20807191ff02084d3c-dirty
petr-novak
parents: 10
diff changeset
35 -C "${cutadapt.custom_options}"
58807b35777a planemo upload commit 20bdf879b52796d3fb251a20807191ff02084d3c-dirty
petr-novak
parents: 10
diff changeset
36 #end if
0
a4cd8608ef6b Uploaded
petr-novak
parents:
diff changeset
37
22
58807b35777a planemo upload commit 20bdf879b52796d3fb251a20807191ff02084d3c-dirty
petr-novak
parents: 10
diff changeset
38 #if $similarity_filtering.include :
58807b35777a planemo upload commit 20bdf879b52796d3fb251a20807191ff02084d3c-dirty
petr-novak
parents: 10
diff changeset
39 -F "${similarity_filtering.filter_database}"
58807b35777a planemo upload commit 20bdf879b52796d3fb251a20807191ff02084d3c-dirty
petr-novak
parents: 10
diff changeset
40 #end if
0
a4cd8608ef6b Uploaded
petr-novak
parents:
diff changeset
41
22
58807b35777a planemo upload commit 20bdf879b52796d3fb251a20807191ff02084d3c-dirty
petr-novak
parents: 10
diff changeset
42 </command>
0
a4cd8608ef6b Uploaded
petr-novak
parents:
diff changeset
43
22
58807b35777a planemo upload commit 20bdf879b52796d3fb251a20807191ff02084d3c-dirty
petr-novak
parents: 10
diff changeset
44 <inputs>
58807b35777a planemo upload commit 20bdf879b52796d3fb251a20807191ff02084d3c-dirty
petr-novak
parents: 10
diff changeset
45 <param format="fastq,fastq.gz" type="data" name="A" label="Left-hand reads"/>
0
a4cd8608ef6b Uploaded
petr-novak
parents:
diff changeset
46
22
58807b35777a planemo upload commit 20bdf879b52796d3fb251a20807191ff02084d3c-dirty
petr-novak
parents: 10
diff changeset
47 <param format="fastq,fastq.gz" type="data" name="B" label="Right-hand reads"/>
0
a4cd8608ef6b Uploaded
petr-novak
parents:
diff changeset
48
22
58807b35777a planemo upload commit 20bdf879b52796d3fb251a20807191ff02084d3c-dirty
petr-novak
parents: 10
diff changeset
49 <conditional name="sampling">
58807b35777a planemo upload commit 20bdf879b52796d3fb251a20807191ff02084d3c-dirty
petr-novak
parents: 10
diff changeset
50 <param name="sequence_sampling" type="boolean" truevalue="true"
58807b35777a planemo upload commit 20bdf879b52796d3fb251a20807191ff02084d3c-dirty
petr-novak
parents: 10
diff changeset
51 falsevalue="false" checked="False" label="Read sampling"/>
58807b35777a planemo upload commit 20bdf879b52796d3fb251a20807191ff02084d3c-dirty
petr-novak
parents: 10
diff changeset
52 <when value="false">
58807b35777a planemo upload commit 20bdf879b52796d3fb251a20807191ff02084d3c-dirty
petr-novak
parents: 10
diff changeset
53 <!-- do nothing here -->
58807b35777a planemo upload commit 20bdf879b52796d3fb251a20807191ff02084d3c-dirty
petr-novak
parents: 10
diff changeset
54 </when>
58807b35777a planemo upload commit 20bdf879b52796d3fb251a20807191ff02084d3c-dirty
petr-novak
parents: 10
diff changeset
55 <when value="true">
58807b35777a planemo upload commit 20bdf879b52796d3fb251a20807191ff02084d3c-dirty
petr-novak
parents: 10
diff changeset
56 <param name="sample_size" type="integer"
58807b35777a planemo upload commit 20bdf879b52796d3fb251a20807191ff02084d3c-dirty
petr-novak
parents: 10
diff changeset
57 label="Sample size (number of pairs)"
58807b35777a planemo upload commit 20bdf879b52796d3fb251a20807191ff02084d3c-dirty
petr-novak
parents: 10
diff changeset
58 help="How many read pairs should be sampled" value="500000"
58807b35777a planemo upload commit 20bdf879b52796d3fb251a20807191ff02084d3c-dirty
petr-novak
parents: 10
diff changeset
59 min="0"/>
58807b35777a planemo upload commit 20bdf879b52796d3fb251a20807191ff02084d3c-dirty
petr-novak
parents: 10
diff changeset
60 </when>
58807b35777a planemo upload commit 20bdf879b52796d3fb251a20807191ff02084d3c-dirty
petr-novak
parents: 10
diff changeset
61 </conditional>
0
a4cd8608ef6b Uploaded
petr-novak
parents:
diff changeset
62
22
58807b35777a planemo upload commit 20bdf879b52796d3fb251a20807191ff02084d3c-dirty
petr-novak
parents: 10
diff changeset
63 <param type="integer" name="cut_off" label="Quality cutoff" value="10" min="0"
58807b35777a planemo upload commit 20bdf879b52796d3fb251a20807191ff02084d3c-dirty
petr-novak
parents: 10
diff changeset
64 help="See below how to correctly set the quality cutoff"/>
58807b35777a planemo upload commit 20bdf879b52796d3fb251a20807191ff02084d3c-dirty
petr-novak
parents: 10
diff changeset
65 <param type="integer" name="percent_above" label="Percent above cutoff" value="95"
58807b35777a planemo upload commit 20bdf879b52796d3fb251a20807191ff02084d3c-dirty
petr-novak
parents: 10
diff changeset
66 min="0"
58807b35777a planemo upload commit 20bdf879b52796d3fb251a20807191ff02084d3c-dirty
petr-novak
parents: 10
diff changeset
67 help="Percentage of bases in the read that must have quality equal to or higher than the cutoff value"/>
0
a4cd8608ef6b Uploaded
petr-novak
parents:
diff changeset
68
22
58807b35777a planemo upload commit 20bdf879b52796d3fb251a20807191ff02084d3c-dirty
petr-novak
parents: 10
diff changeset
69 <conditional name="trimming">
58807b35777a planemo upload commit 20bdf879b52796d3fb251a20807191ff02084d3c-dirty
petr-novak
parents: 10
diff changeset
70 <param name="sequence_trimming" type="boolean" truevalue="true"
58807b35777a planemo upload commit 20bdf879b52796d3fb251a20807191ff02084d3c-dirty
petr-novak
parents: 10
diff changeset
71 falsevalue="false" checked="False" label="Trim reads"/>
58807b35777a planemo upload commit 20bdf879b52796d3fb251a20807191ff02084d3c-dirty
petr-novak
parents: 10
diff changeset
72 <when value="false">
58807b35777a planemo upload commit 20bdf879b52796d3fb251a20807191ff02084d3c-dirty
petr-novak
parents: 10
diff changeset
73 <!-- do nothing here -->
58807b35777a planemo upload commit 20bdf879b52796d3fb251a20807191ff02084d3c-dirty
petr-novak
parents: 10
diff changeset
74 </when>
58807b35777a planemo upload commit 20bdf879b52796d3fb251a20807191ff02084d3c-dirty
petr-novak
parents: 10
diff changeset
75 <when value="true">
58807b35777a planemo upload commit 20bdf879b52796d3fb251a20807191ff02084d3c-dirty
petr-novak
parents: 10
diff changeset
76 <param type="integer" name="trim_start" label="Start position" value="1"
58807b35777a planemo upload commit 20bdf879b52796d3fb251a20807191ff02084d3c-dirty
petr-novak
parents: 10
diff changeset
77 min="1"
58807b35777a planemo upload commit 20bdf879b52796d3fb251a20807191ff02084d3c-dirty
petr-novak
parents: 10
diff changeset
78 help="Reads are trimmed at the specified start"/>
58807b35777a planemo upload commit 20bdf879b52796d3fb251a20807191ff02084d3c-dirty
petr-novak
parents: 10
diff changeset
79 <param type="integer" name="trim_end" label="End position" value="100"
58807b35777a planemo upload commit 20bdf879b52796d3fb251a20807191ff02084d3c-dirty
petr-novak
parents: 10
diff changeset
80 min="1"
58807b35777a planemo upload commit 20bdf879b52796d3fb251a20807191ff02084d3c-dirty
petr-novak
parents: 10
diff changeset
81 help="Reads are trimmed to the specified end position, shorter sequences are discarded"/>
58807b35777a planemo upload commit 20bdf879b52796d3fb251a20807191ff02084d3c-dirty
petr-novak
parents: 10
diff changeset
82 </when>
0
a4cd8608ef6b Uploaded
petr-novak
parents:
diff changeset
83
22
58807b35777a planemo upload commit 20bdf879b52796d3fb251a20807191ff02084d3c-dirty
petr-novak
parents: 10
diff changeset
84 </conditional>
58807b35777a planemo upload commit 20bdf879b52796d3fb251a20807191ff02084d3c-dirty
petr-novak
parents: 10
diff changeset
85 <param name="max_n" type="integer" label="Maximum Ns"
58807b35777a planemo upload commit 20bdf879b52796d3fb251a20807191ff02084d3c-dirty
petr-novak
parents: 10
diff changeset
86 help="Maximal number of Ns allowed in reads" value="0" min="0" max="10"/>
58807b35777a planemo upload commit 20bdf879b52796d3fb251a20807191ff02084d3c-dirty
petr-novak
parents: 10
diff changeset
87
58807b35777a planemo upload commit 20bdf879b52796d3fb251a20807191ff02084d3c-dirty
petr-novak
parents: 10
diff changeset
88 <conditional name="cutadapt">
58807b35777a planemo upload commit 20bdf879b52796d3fb251a20807191ff02084d3c-dirty
petr-novak
parents: 10
diff changeset
89 <param name="use_custom" type="boolean" truevalue="true" falsevalue="false"
58807b35777a planemo upload commit 20bdf879b52796d3fb251a20807191ff02084d3c-dirty
petr-novak
parents: 10
diff changeset
90 checked="False" label="Custom cutadapt options"/>
58807b35777a planemo upload commit 20bdf879b52796d3fb251a20807191ff02084d3c-dirty
petr-novak
parents: 10
diff changeset
91 <when value="false">
58807b35777a planemo upload commit 20bdf879b52796d3fb251a20807191ff02084d3c-dirty
petr-novak
parents: 10
diff changeset
92 <!-- do nothing here -->
58807b35777a planemo upload commit 20bdf879b52796d3fb251a20807191ff02084d3c-dirty
petr-novak
parents: 10
diff changeset
93 </when>
58807b35777a planemo upload commit 20bdf879b52796d3fb251a20807191ff02084d3c-dirty
petr-novak
parents: 10
diff changeset
94 <when value="true">
58807b35777a planemo upload commit 20bdf879b52796d3fb251a20807191ff02084d3c-dirty
petr-novak
parents: 10
diff changeset
95 <param name="custom_options" type="text" area="True" size="8x30"
58807b35777a planemo upload commit 20bdf879b52796d3fb251a20807191ff02084d3c-dirty
petr-novak
parents: 10
diff changeset
96 label="Custom options" help="Consult cutadapt for usage" value="">
58807b35777a planemo upload commit 20bdf879b52796d3fb251a20807191ff02084d3c-dirty
petr-novak
parents: 10
diff changeset
97 <sanitizer sanitize="False"/>
58807b35777a planemo upload commit 20bdf879b52796d3fb251a20807191ff02084d3c-dirty
petr-novak
parents: 10
diff changeset
98 </param>
58807b35777a planemo upload commit 20bdf879b52796d3fb251a20807191ff02084d3c-dirty
petr-novak
parents: 10
diff changeset
99
58807b35777a planemo upload commit 20bdf879b52796d3fb251a20807191ff02084d3c-dirty
petr-novak
parents: 10
diff changeset
100 </when>
58807b35777a planemo upload commit 20bdf879b52796d3fb251a20807191ff02084d3c-dirty
petr-novak
parents: 10
diff changeset
101 </conditional>
0
a4cd8608ef6b Uploaded
petr-novak
parents:
diff changeset
102
22
58807b35777a planemo upload commit 20bdf879b52796d3fb251a20807191ff02084d3c-dirty
petr-novak
parents: 10
diff changeset
103 <conditional name="similarity_filtering">
58807b35777a planemo upload commit 20bdf879b52796d3fb251a20807191ff02084d3c-dirty
petr-novak
parents: 10
diff changeset
104 <param name="include" type="boolean" truevalue="true" falsevalue="false"
58807b35777a planemo upload commit 20bdf879b52796d3fb251a20807191ff02084d3c-dirty
petr-novak
parents: 10
diff changeset
105 checked="False" label="Use similarity search filtering"/>
58807b35777a planemo upload commit 20bdf879b52796d3fb251a20807191ff02084d3c-dirty
petr-novak
parents: 10
diff changeset
106 <when value="false">
58807b35777a planemo upload commit 20bdf879b52796d3fb251a20807191ff02084d3c-dirty
petr-novak
parents: 10
diff changeset
107 <!-- do nothing here -->
58807b35777a planemo upload commit 20bdf879b52796d3fb251a20807191ff02084d3c-dirty
petr-novak
parents: 10
diff changeset
108 </when>
58807b35777a planemo upload commit 20bdf879b52796d3fb251a20807191ff02084d3c-dirty
petr-novak
parents: 10
diff changeset
109 <when value="true">
0
a4cd8608ef6b Uploaded
petr-novak
parents:
diff changeset
110
22
58807b35777a planemo upload commit 20bdf879b52796d3fb251a20807191ff02084d3c-dirty
petr-novak
parents: 10
diff changeset
111 <param name="filter_database" format="fasta" type="data"
58807b35777a planemo upload commit 20bdf879b52796d3fb251a20807191ff02084d3c-dirty
petr-novak
parents: 10
diff changeset
112 label="Sequence filter database"
58807b35777a planemo upload commit 20bdf879b52796d3fb251a20807191ff02084d3c-dirty
petr-novak
parents: 10
diff changeset
113 help="Provide DNA sequences in FASTA format. Reads that have at least 90% similarity over 90% of their length to a sequence in the filter database will be removed. This option is suitable for removing organellar or other contaminating sequences."/>
58807b35777a planemo upload commit 20bdf879b52796d3fb251a20807191ff02084d3c-dirty
petr-novak
parents: 10
diff changeset
114 </when>
58807b35777a planemo upload commit 20bdf879b52796d3fb251a20807191ff02084d3c-dirty
petr-novak
parents: 10
diff changeset
115 </conditional>
0
a4cd8608ef6b Uploaded
petr-novak
parents:
diff changeset
116
22
58807b35777a planemo upload commit 20bdf879b52796d3fb251a20807191ff02084d3c-dirty
petr-novak
parents: 10
diff changeset
117 <param name="rename" type="boolean" truevalue="-R" falsevalue="" checked="True"
58807b35777a planemo upload commit 20bdf879b52796d3fb251a20807191ff02084d3c-dirty
petr-novak
parents: 10
diff changeset
118 label="Rename reads"
58807b35777a planemo upload commit 20bdf879b52796d3fb251a20807191ff02084d3c-dirty
petr-novak
parents: 10
diff changeset
119 help="By default, original read names are used. In case your reads do not follow proper naming scheme to label paired-end mates, use this option. All read pairs must be complete!"/>
58807b35777a planemo upload commit 20bdf879b52796d3fb251a20807191ff02084d3c-dirty
petr-novak
parents: 10
diff changeset
120 </inputs>
0
a4cd8608ef6b Uploaded
petr-novak
parents:
diff changeset
121
a4cd8608ef6b Uploaded
petr-novak
parents:
diff changeset
122
22
58807b35777a planemo upload commit 20bdf879b52796d3fb251a20807191ff02084d3c-dirty
petr-novak
parents: 10
diff changeset
123 <outputs>
58807b35777a planemo upload commit 20bdf879b52796d3fb251a20807191ff02084d3c-dirty
petr-novak
parents: 10
diff changeset
124 <data format="fasta" name="paired"
58807b35777a planemo upload commit 20bdf879b52796d3fb251a20807191ff02084d3c-dirty
petr-novak
parents: 10
diff changeset
125 label="Interlaced paired reads from datasets ${A.hid} and ${B.hid} "/>
58807b35777a planemo upload commit 20bdf879b52796d3fb251a20807191ff02084d3c-dirty
petr-novak
parents: 10
diff changeset
126 <data format="png" name="png_output"
58807b35777a planemo upload commit 20bdf879b52796d3fb251a20807191ff02084d3c-dirty
petr-novak
parents: 10
diff changeset
127 label="Nucleotide composition after filtering of ${A.hid} and ${B.hid} "/>
58807b35777a planemo upload commit 20bdf879b52796d3fb251a20807191ff02084d3c-dirty
petr-novak
parents: 10
diff changeset
128 </outputs>
0
a4cd8608ef6b Uploaded
petr-novak
parents:
diff changeset
129
a4cd8608ef6b Uploaded
petr-novak
parents:
diff changeset
130
22
58807b35777a planemo upload commit 20bdf879b52796d3fb251a20807191ff02084d3c-dirty
petr-novak
parents: 10
diff changeset
131 <tests>
58807b35777a planemo upload commit 20bdf879b52796d3fb251a20807191ff02084d3c-dirty
petr-novak
parents: 10
diff changeset
132 <test>
58807b35777a planemo upload commit 20bdf879b52796d3fb251a20807191ff02084d3c-dirty
petr-novak
parents: 10
diff changeset
133 <param name="A" value="ERR215189_1_part.fastq.gz"/>
58807b35777a planemo upload commit 20bdf879b52796d3fb251a20807191ff02084d3c-dirty
petr-novak
parents: 10
diff changeset
134 <param name="B" value="ERR215189_2_part.fastq.gz"/>
58807b35777a planemo upload commit 20bdf879b52796d3fb251a20807191ff02084d3c-dirty
petr-novak
parents: 10
diff changeset
135 <param name="max_n" value="0"/>
58807b35777a planemo upload commit 20bdf879b52796d3fb251a20807191ff02084d3c-dirty
petr-novak
parents: 10
diff changeset
136 <param name="cut_off" value="10"/>
58807b35777a planemo upload commit 20bdf879b52796d3fb251a20807191ff02084d3c-dirty
petr-novak
parents: 10
diff changeset
137 <param name="percent_above" value="95"/>
58807b35777a planemo upload commit 20bdf879b52796d3fb251a20807191ff02084d3c-dirty
petr-novak
parents: 10
diff changeset
138 <output name="paired" value="paired_output.fasta"/>
58807b35777a planemo upload commit 20bdf879b52796d3fb251a20807191ff02084d3c-dirty
petr-novak
parents: 10
diff changeset
139 <output name="png_output" value="paired_output.png"/>
58807b35777a planemo upload commit 20bdf879b52796d3fb251a20807191ff02084d3c-dirty
petr-novak
parents: 10
diff changeset
140 </test>
58807b35777a planemo upload commit 20bdf879b52796d3fb251a20807191ff02084d3c-dirty
petr-novak
parents: 10
diff changeset
141 </tests>
0
a4cd8608ef6b Uploaded
petr-novak
parents:
diff changeset
142
22
58807b35777a planemo upload commit 20bdf879b52796d3fb251a20807191ff02084d3c-dirty
petr-novak
parents: 10
diff changeset
143 <help>
58807b35777a planemo upload commit 20bdf879b52796d3fb251a20807191ff02084d3c-dirty
petr-novak
parents: 10
diff changeset
144 **What it does**
0
a4cd8608ef6b Uploaded
petr-novak
parents:
diff changeset
145
22
58807b35777a planemo upload commit 20bdf879b52796d3fb251a20807191ff02084d3c-dirty
petr-novak
parents: 10
diff changeset
146 This tool is designed to perform memory-efficient preprocessing of two
58807b35777a planemo upload commit 20bdf879b52796d3fb251a20807191ff02084d3c-dirty
petr-novak
parents: 10
diff changeset
147 fastq files. Output of this tool can be used as input of RepeatExplorer
58807b35777a planemo upload commit 20bdf879b52796d3fb251a20807191ff02084d3c-dirty
petr-novak
parents: 10
diff changeset
148 clustering.
58807b35777a planemo upload commit 20bdf879b52796d3fb251a20807191ff02084d3c-dirty
petr-novak
parents: 10
diff changeset
149 Input files can be gzip-compressed (.gz extension).
58807b35777a planemo upload commit 20bdf879b52796d3fb251a20807191ff02084d3c-dirty
petr-novak
parents: 10
diff changeset
150 Reads are filtered based on the quality, presence of N bases and
58807b35777a planemo upload commit 20bdf879b52796d3fb251a20807191ff02084d3c-dirty
petr-novak
parents: 10
diff changeset
151 adapters. Two input fastq files are processed in parallel. Only complete pairs
58807b35777a planemo upload commit 20bdf879b52796d3fb251a20807191ff02084d3c-dirty
petr-novak
parents: 10
diff changeset
152 are kept. As the input files are processed in chunks, it is required that
58807b35777a planemo upload commit 20bdf879b52796d3fb251a20807191ff02084d3c-dirty
petr-novak
parents: 10
diff changeset
153 paired reads are complete and in the same order in both input files. All
58807b35777a planemo upload commit 20bdf879b52796d3fb251a20807191ff02084d3c-dirty
petr-novak
parents: 10
diff changeset
154 reads which pass the quality filter will be written into output files.
58807b35777a planemo upload commit 20bdf879b52796d3fb251a20807191ff02084d3c-dirty
petr-novak
parents: 10
diff changeset
155 If sampling is specified, only a sample of sequences will be
58807b35777a planemo upload commit 20bdf879b52796d3fb251a20807191ff02084d3c-dirty
petr-novak
parents: 10
diff changeset
156 returned. Cutadapt is run with these options::
0
a4cd8608ef6b Uploaded
petr-novak
parents:
diff changeset
157
22
58807b35777a planemo upload commit 20bdf879b52796d3fb251a20807191ff02084d3c-dirty
petr-novak
parents: 10
diff changeset
158 --anywhere='AATGATACGGCGACCACCGAGATCTACACTCTTTCCCTACACGACGCTCTTCCGATCT'
58807b35777a planemo upload commit 20bdf879b52796d3fb251a20807191ff02084d3c-dirty
petr-novak
parents: 10
diff changeset
159 --anywhere='AGATCGGAAGAGCGTCGTGTAGGGAAAGAGTGTAGATCTCGGTGGTCGCCGTATCATT'
58807b35777a planemo upload commit 20bdf879b52796d3fb251a20807191ff02084d3c-dirty
petr-novak
parents: 10
diff changeset
160 --anywhere='GATCGGAAGAGCACACGTCTGAACTCCAGTCAC'
58807b35777a planemo upload commit 20bdf879b52796d3fb251a20807191ff02084d3c-dirty
petr-novak
parents: 10
diff changeset
161 --anywhere='ATCTCGTATGCCGTCTTCTGCTTG'
58807b35777a planemo upload commit 20bdf879b52796d3fb251a20807191ff02084d3c-dirty
petr-novak
parents: 10
diff changeset
162 --anywhere='CAAGCAGAAGACGGCATACGAGAT'
58807b35777a planemo upload commit 20bdf879b52796d3fb251a20807191ff02084d3c-dirty
petr-novak
parents: 10
diff changeset
163 --anywhere='GTGACTGGAGTTCAGACGTGTGCTCTTCCGATC'
58807b35777a planemo upload commit 20bdf879b52796d3fb251a20807191ff02084d3c-dirty
petr-novak
parents: 10
diff changeset
164 --error-rate=0.05
58807b35777a planemo upload commit 20bdf879b52796d3fb251a20807191ff02084d3c-dirty
petr-novak
parents: 10
diff changeset
165 --times=1 --overlap=15 --discard
0
a4cd8608ef6b Uploaded
petr-novak
parents:
diff changeset
166
a4cd8608ef6b Uploaded
petr-novak
parents:
diff changeset
167
22
58807b35777a planemo upload commit 20bdf879b52796d3fb251a20807191ff02084d3c-dirty
petr-novak
parents: 10
diff changeset
168 **Order of fastq files processing**
0
a4cd8608ef6b Uploaded
petr-novak
parents:
diff changeset
169
22
58807b35777a planemo upload commit 20bdf879b52796d3fb251a20807191ff02084d3c-dirty
petr-novak
parents: 10
diff changeset
170 1. Trimming (optional)
58807b35777a planemo upload commit 20bdf879b52796d3fb251a20807191ff02084d3c-dirty
petr-novak
parents: 10
diff changeset
171 #. Filter by quality
58807b35777a planemo upload commit 20bdf879b52796d3fb251a20807191ff02084d3c-dirty
petr-novak
parents: 10
diff changeset
172 #. Discard single reads, keep complete pairs
58807b35777a planemo upload commit 20bdf879b52796d3fb251a20807191ff02084d3c-dirty
petr-novak
parents: 10
diff changeset
173 #. Cutadapt filtering
58807b35777a planemo upload commit 20bdf879b52796d3fb251a20807191ff02084d3c-dirty
petr-novak
parents: 10
diff changeset
174 #. Discard single reads, keep complete pairs
58807b35777a planemo upload commit 20bdf879b52796d3fb251a20807191ff02084d3c-dirty
petr-novak
parents: 10
diff changeset
175 #. Sampling (optional)
58807b35777a planemo upload commit 20bdf879b52796d3fb251a20807191ff02084d3c-dirty
petr-novak
parents: 10
diff changeset
176 #. Interlacing two fasta files
0
a4cd8608ef6b Uploaded
petr-novak
parents:
diff changeset
177
22
58807b35777a planemo upload commit 20bdf879b52796d3fb251a20807191ff02084d3c-dirty
petr-novak
parents: 10
diff changeset
178 **Quality setting cutoff**
0
a4cd8608ef6b Uploaded
petr-novak
parents:
diff changeset
179
22
58807b35777a planemo upload commit 20bdf879b52796d3fb251a20807191ff02084d3c-dirty
petr-novak
parents: 10
diff changeset
180 To correctly set quality cutoff, you need to know how the quality is encoded in
58807b35777a planemo upload commit 20bdf879b52796d3fb251a20807191ff02084d3c-dirty
petr-novak
parents: 10
diff changeset
181 your fastq file. The default
58807b35777a planemo upload commit 20bdf879b52796d3fb251a20807191ff02084d3c-dirty
petr-novak
parents: 10
diff changeset
182 filtering, which is suitable for Sanger and Illumina 1.8 encoding, is shown below::
0
a4cd8608ef6b Uploaded
petr-novak
parents:
diff changeset
183
a4cd8608ef6b Uploaded
petr-novak
parents:
diff changeset
184
22
58807b35777a planemo upload commit 20bdf879b52796d3fb251a20807191ff02084d3c-dirty
petr-novak
parents: 10
diff changeset
185 Default filtering cutoff
58807b35777a planemo upload commit 20bdf879b52796d3fb251a20807191ff02084d3c-dirty
petr-novak
parents: 10
diff changeset
186 |
58807b35777a planemo upload commit 20bdf879b52796d3fb251a20807191ff02084d3c-dirty
petr-novak
parents: 10
diff changeset
187 |
58807b35777a planemo upload commit 20bdf879b52796d3fb251a20807191ff02084d3c-dirty
petr-novak
parents: 10
diff changeset
188 V
58807b35777a planemo upload commit 20bdf879b52796d3fb251a20807191ff02084d3c-dirty
petr-novak
parents: 10
diff changeset
189 SSSSSSSSSSSSSSSSSSSSSSSSSSSSSSSSSSSSSSSSS.....................................................
58807b35777a planemo upload commit 20bdf879b52796d3fb251a20807191ff02084d3c-dirty
petr-novak
parents: 10
diff changeset
190 ..........................XXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXX......................
58807b35777a planemo upload commit 20bdf879b52796d3fb251a20807191ff02084d3c-dirty
petr-novak
parents: 10
diff changeset
191 ...............................IIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIII......................
58807b35777a planemo upload commit 20bdf879b52796d3fb251a20807191ff02084d3c-dirty
petr-novak
parents: 10
diff changeset
192 .................................JJJJJJJJJJJJJJJJJJJJJJJJJJJJJJJJJJJJJJJ......................
58807b35777a planemo upload commit 20bdf879b52796d3fb251a20807191ff02084d3c-dirty
petr-novak
parents: 10
diff changeset
193 LLLLLLLLLLLLLLLLLLLLLLLLLLLLLLLLLLLLLLLLLL....................................................
58807b35777a planemo upload commit 20bdf879b52796d3fb251a20807191ff02084d3c-dirty
petr-novak
parents: 10
diff changeset
194 !"#$%&amp;'()*+,-./0123456789:;&lt;=&gt;?@ABCDEFGHIJKLMNOPQRSTUVWXYZ[\]^_`abcdefghijklmnopqrstuvwxyz{|}~
58807b35777a planemo upload commit 20bdf879b52796d3fb251a20807191ff02084d3c-dirty
petr-novak
parents: 10
diff changeset
195 | | | | | |
58807b35777a planemo upload commit 20bdf879b52796d3fb251a20807191ff02084d3c-dirty
petr-novak
parents: 10
diff changeset
196 33 59 64 73 104 126
58807b35777a planemo upload commit 20bdf879b52796d3fb251a20807191ff02084d3c-dirty
petr-novak
parents: 10
diff changeset
197 0........................26...31.......40
58807b35777a planemo upload commit 20bdf879b52796d3fb251a20807191ff02084d3c-dirty
petr-novak
parents: 10
diff changeset
198 -5....0........9.............................40
58807b35777a planemo upload commit 20bdf879b52796d3fb251a20807191ff02084d3c-dirty
petr-novak
parents: 10
diff changeset
199 0........9.............................40
58807b35777a planemo upload commit 20bdf879b52796d3fb251a20807191ff02084d3c-dirty
petr-novak
parents: 10
diff changeset
200 3.....9.............................40
58807b35777a planemo upload commit 20bdf879b52796d3fb251a20807191ff02084d3c-dirty
petr-novak
parents: 10
diff changeset
201 0.2......................26...31........41
58807b35777a planemo upload commit 20bdf879b52796d3fb251a20807191ff02084d3c-dirty
petr-novak
parents: 10
diff changeset
202
58807b35777a planemo upload commit 20bdf879b52796d3fb251a20807191ff02084d3c-dirty
petr-novak
parents: 10
diff changeset
203 S - Sanger Phred+33, raw reads typically (0, 40)
58807b35777a planemo upload commit 20bdf879b52796d3fb251a20807191ff02084d3c-dirty
petr-novak
parents: 10
diff changeset
204 X - Solexa Solexa+64, raw reads typically (-5, 40)
58807b35777a planemo upload commit 20bdf879b52796d3fb251a20807191ff02084d3c-dirty
petr-novak
parents: 10
diff changeset
205 I - Illumina 1.3+ Phred+64, raw reads typically (0, 40)
58807b35777a planemo upload commit 20bdf879b52796d3fb251a20807191ff02084d3c-dirty
petr-novak
parents: 10
diff changeset
206 J - Illumina 1.5+ Phred+64, raw reads typically (3, 40)
58807b35777a planemo upload commit 20bdf879b52796d3fb251a20807191ff02084d3c-dirty
petr-novak
parents: 10
diff changeset
207 with 0=unused, 1=unused, 2=Read Segment Quality Control Indicator (bold)
58807b35777a planemo upload commit 20bdf879b52796d3fb251a20807191ff02084d3c-dirty
petr-novak
parents: 10
diff changeset
208 (Note: See discussion above).
58807b35777a planemo upload commit 20bdf879b52796d3fb251a20807191ff02084d3c-dirty
petr-novak
parents: 10
diff changeset
209 L - Illumina 1.8+ Phred+33, raw reads typically (0, 41)
58807b35777a planemo upload commit 20bdf879b52796d3fb251a20807191ff02084d3c-dirty
petr-novak
parents: 10
diff changeset
210
58807b35777a planemo upload commit 20bdf879b52796d3fb251a20807191ff02084d3c-dirty
petr-novak
parents: 10
diff changeset
211 </help>
0
a4cd8608ef6b Uploaded
petr-novak
parents:
diff changeset
212 </tool>
a4cd8608ef6b Uploaded
petr-novak
parents:
diff changeset
213