Mercurial > repos > petr-novak > re_utils
annotate paired_fastq_filtering.xml @ 34:91996b991991 draft default tip
Uploaded
author | petr-novak |
---|---|
date | Fri, 16 Feb 2024 15:22:21 +0000 |
parents | f1738f8649b0 |
children |
rev | line source |
---|---|
23
36c418bca8b2
planemo upload commit 20bdf879b52796d3fb251a20807191ff02084d3c-dirty
petr-novak
parents:
22
diff
changeset
|
1 <tool id="paired_fastq_filtering" name="Preprocessing of FASTQ paired-end reads" version="1.0.0.3"> |
22
58807b35777a
planemo upload commit 20bdf879b52796d3fb251a20807191ff02084d3c-dirty
petr-novak
parents:
10
diff
changeset
|
2 <stdio> |
23
36c418bca8b2
planemo upload commit 20bdf879b52796d3fb251a20807191ff02084d3c-dirty
petr-novak
parents:
22
diff
changeset
|
3 <exit_code range="1:" level="fatal" description="Error"/> |
22
58807b35777a
planemo upload commit 20bdf879b52796d3fb251a20807191ff02084d3c-dirty
petr-novak
parents:
10
diff
changeset
|
4 </stdio> |
58807b35777a
planemo upload commit 20bdf879b52796d3fb251a20807191ff02084d3c-dirty
petr-novak
parents:
10
diff
changeset
|
5 <description> |
58807b35777a
planemo upload commit 20bdf879b52796d3fb251a20807191ff02084d3c-dirty
petr-novak
parents:
10
diff
changeset
|
6 Preprocessing of paired-end reads in FASTQ format |
58807b35777a
planemo upload commit 20bdf879b52796d3fb251a20807191ff02084d3c-dirty
petr-novak
parents:
10
diff
changeset
|
7 including trimming, quality filtering, cutadapt filtering and interlacing. Broken |
58807b35777a
planemo upload commit 20bdf879b52796d3fb251a20807191ff02084d3c-dirty
petr-novak
parents:
10
diff
changeset
|
8 pairs are discarded. |
58807b35777a
planemo upload commit 20bdf879b52796d3fb251a20807191ff02084d3c-dirty
petr-novak
parents:
10
diff
changeset
|
9 </description> |
58807b35777a
planemo upload commit 20bdf879b52796d3fb251a20807191ff02084d3c-dirty
petr-novak
parents:
10
diff
changeset
|
10 <requirements> |
58807b35777a
planemo upload commit 20bdf879b52796d3fb251a20807191ff02084d3c-dirty
petr-novak
parents:
10
diff
changeset
|
11 <requirement type="package">blast</requirement> |
33
f1738f8649b0
planemo upload commit 39094a128ea3dd2c39f4997c6de739c33c07e5f3-dirty
petr-novak
parents:
23
diff
changeset
|
12 <requirement type="package" version="4.4">cutadapt</requirement> |
22
58807b35777a
planemo upload commit 20bdf879b52796d3fb251a20807191ff02084d3c-dirty
petr-novak
parents:
10
diff
changeset
|
13 <requirement type="package">bioconductor-shortread</requirement> |
58807b35777a
planemo upload commit 20bdf879b52796d3fb251a20807191ff02084d3c-dirty
petr-novak
parents:
10
diff
changeset
|
14 <requirement type="package">r-optparse</requirement> |
58807b35777a
planemo upload commit 20bdf879b52796d3fb251a20807191ff02084d3c-dirty
petr-novak
parents:
10
diff
changeset
|
15 </requirements> |
58807b35777a
planemo upload commit 20bdf879b52796d3fb251a20807191ff02084d3c-dirty
petr-novak
parents:
10
diff
changeset
|
16 <required_files> |
58807b35777a
planemo upload commit 20bdf879b52796d3fb251a20807191ff02084d3c-dirty
petr-novak
parents:
10
diff
changeset
|
17 <include type="literal" path="paired_fastq_filtering_wrapper.sh"/> |
58807b35777a
planemo upload commit 20bdf879b52796d3fb251a20807191ff02084d3c-dirty
petr-novak
parents:
10
diff
changeset
|
18 <include type="literal" path="paired_fastq_filtering.R"/> |
58807b35777a
planemo upload commit 20bdf879b52796d3fb251a20807191ff02084d3c-dirty
petr-novak
parents:
10
diff
changeset
|
19 <include type="literal" path="fasta_interlacer.py"/> |
58807b35777a
planemo upload commit 20bdf879b52796d3fb251a20807191ff02084d3c-dirty
petr-novak
parents:
10
diff
changeset
|
20 </required_files> |
58807b35777a
planemo upload commit 20bdf879b52796d3fb251a20807191ff02084d3c-dirty
petr-novak
parents:
10
diff
changeset
|
21 <command> |
33
f1738f8649b0
planemo upload commit 39094a128ea3dd2c39f4997c6de739c33c07e5f3-dirty
petr-novak
parents:
23
diff
changeset
|
22 cutadapt --version; |
22
58807b35777a
planemo upload commit 20bdf879b52796d3fb251a20807191ff02084d3c-dirty
petr-novak
parents:
10
diff
changeset
|
23 bash '$__tool_directory__'/paired_fastq_filtering_wrapper.sh -a ${A} -b ${B} -o |
58807b35777a
planemo upload commit 20bdf879b52796d3fb251a20807191ff02084d3c-dirty
petr-novak
parents:
10
diff
changeset
|
24 ${paired} -c ${cut_off} -p ${percent_above} -N ${max_n} $rename -G ${png_output} |
0 | 25 |
22
58807b35777a
planemo upload commit 20bdf879b52796d3fb251a20807191ff02084d3c-dirty
petr-novak
parents:
10
diff
changeset
|
26 #if $sampling.sequence_sampling : |
58807b35777a
planemo upload commit 20bdf879b52796d3fb251a20807191ff02084d3c-dirty
petr-novak
parents:
10
diff
changeset
|
27 -n $sampling.sample_size |
58807b35777a
planemo upload commit 20bdf879b52796d3fb251a20807191ff02084d3c-dirty
petr-novak
parents:
10
diff
changeset
|
28 #end if |
0 | 29 |
22
58807b35777a
planemo upload commit 20bdf879b52796d3fb251a20807191ff02084d3c-dirty
petr-novak
parents:
10
diff
changeset
|
30 #if $trimming.sequence_trimming : |
58807b35777a
planemo upload commit 20bdf879b52796d3fb251a20807191ff02084d3c-dirty
petr-novak
parents:
10
diff
changeset
|
31 -e $trimming.trim_end -s $trimming.trim_start |
58807b35777a
planemo upload commit 20bdf879b52796d3fb251a20807191ff02084d3c-dirty
petr-novak
parents:
10
diff
changeset
|
32 #end if |
0 | 33 |
22
58807b35777a
planemo upload commit 20bdf879b52796d3fb251a20807191ff02084d3c-dirty
petr-novak
parents:
10
diff
changeset
|
34 #if $cutadapt.use_custom : |
58807b35777a
planemo upload commit 20bdf879b52796d3fb251a20807191ff02084d3c-dirty
petr-novak
parents:
10
diff
changeset
|
35 -C "${cutadapt.custom_options}" |
58807b35777a
planemo upload commit 20bdf879b52796d3fb251a20807191ff02084d3c-dirty
petr-novak
parents:
10
diff
changeset
|
36 #end if |
0 | 37 |
22
58807b35777a
planemo upload commit 20bdf879b52796d3fb251a20807191ff02084d3c-dirty
petr-novak
parents:
10
diff
changeset
|
38 #if $similarity_filtering.include : |
58807b35777a
planemo upload commit 20bdf879b52796d3fb251a20807191ff02084d3c-dirty
petr-novak
parents:
10
diff
changeset
|
39 -F "${similarity_filtering.filter_database}" |
58807b35777a
planemo upload commit 20bdf879b52796d3fb251a20807191ff02084d3c-dirty
petr-novak
parents:
10
diff
changeset
|
40 #end if |
0 | 41 |
22
58807b35777a
planemo upload commit 20bdf879b52796d3fb251a20807191ff02084d3c-dirty
petr-novak
parents:
10
diff
changeset
|
42 </command> |
0 | 43 |
22
58807b35777a
planemo upload commit 20bdf879b52796d3fb251a20807191ff02084d3c-dirty
petr-novak
parents:
10
diff
changeset
|
44 <inputs> |
58807b35777a
planemo upload commit 20bdf879b52796d3fb251a20807191ff02084d3c-dirty
petr-novak
parents:
10
diff
changeset
|
45 <param format="fastq,fastq.gz" type="data" name="A" label="Left-hand reads"/> |
0 | 46 |
22
58807b35777a
planemo upload commit 20bdf879b52796d3fb251a20807191ff02084d3c-dirty
petr-novak
parents:
10
diff
changeset
|
47 <param format="fastq,fastq.gz" type="data" name="B" label="Right-hand reads"/> |
0 | 48 |
22
58807b35777a
planemo upload commit 20bdf879b52796d3fb251a20807191ff02084d3c-dirty
petr-novak
parents:
10
diff
changeset
|
49 <conditional name="sampling"> |
58807b35777a
planemo upload commit 20bdf879b52796d3fb251a20807191ff02084d3c-dirty
petr-novak
parents:
10
diff
changeset
|
50 <param name="sequence_sampling" type="boolean" truevalue="true" |
58807b35777a
planemo upload commit 20bdf879b52796d3fb251a20807191ff02084d3c-dirty
petr-novak
parents:
10
diff
changeset
|
51 falsevalue="false" checked="False" label="Read sampling"/> |
58807b35777a
planemo upload commit 20bdf879b52796d3fb251a20807191ff02084d3c-dirty
petr-novak
parents:
10
diff
changeset
|
52 <when value="false"> |
58807b35777a
planemo upload commit 20bdf879b52796d3fb251a20807191ff02084d3c-dirty
petr-novak
parents:
10
diff
changeset
|
53 <!-- do nothing here --> |
58807b35777a
planemo upload commit 20bdf879b52796d3fb251a20807191ff02084d3c-dirty
petr-novak
parents:
10
diff
changeset
|
54 </when> |
58807b35777a
planemo upload commit 20bdf879b52796d3fb251a20807191ff02084d3c-dirty
petr-novak
parents:
10
diff
changeset
|
55 <when value="true"> |
58807b35777a
planemo upload commit 20bdf879b52796d3fb251a20807191ff02084d3c-dirty
petr-novak
parents:
10
diff
changeset
|
56 <param name="sample_size" type="integer" |
58807b35777a
planemo upload commit 20bdf879b52796d3fb251a20807191ff02084d3c-dirty
petr-novak
parents:
10
diff
changeset
|
57 label="Sample size (number of pairs)" |
58807b35777a
planemo upload commit 20bdf879b52796d3fb251a20807191ff02084d3c-dirty
petr-novak
parents:
10
diff
changeset
|
58 help="How many read pairs should be sampled" value="500000" |
58807b35777a
planemo upload commit 20bdf879b52796d3fb251a20807191ff02084d3c-dirty
petr-novak
parents:
10
diff
changeset
|
59 min="0"/> |
58807b35777a
planemo upload commit 20bdf879b52796d3fb251a20807191ff02084d3c-dirty
petr-novak
parents:
10
diff
changeset
|
60 </when> |
58807b35777a
planemo upload commit 20bdf879b52796d3fb251a20807191ff02084d3c-dirty
petr-novak
parents:
10
diff
changeset
|
61 </conditional> |
0 | 62 |
22
58807b35777a
planemo upload commit 20bdf879b52796d3fb251a20807191ff02084d3c-dirty
petr-novak
parents:
10
diff
changeset
|
63 <param type="integer" name="cut_off" label="Quality cutoff" value="10" min="0" |
58807b35777a
planemo upload commit 20bdf879b52796d3fb251a20807191ff02084d3c-dirty
petr-novak
parents:
10
diff
changeset
|
64 help="See below how to correctly set the quality cutoff"/> |
58807b35777a
planemo upload commit 20bdf879b52796d3fb251a20807191ff02084d3c-dirty
petr-novak
parents:
10
diff
changeset
|
65 <param type="integer" name="percent_above" label="Percent above cutoff" value="95" |
58807b35777a
planemo upload commit 20bdf879b52796d3fb251a20807191ff02084d3c-dirty
petr-novak
parents:
10
diff
changeset
|
66 min="0" |
58807b35777a
planemo upload commit 20bdf879b52796d3fb251a20807191ff02084d3c-dirty
petr-novak
parents:
10
diff
changeset
|
67 help="Percentage of bases in the read that must have quality equal to or higher than the cutoff value"/> |
0 | 68 |
22
58807b35777a
planemo upload commit 20bdf879b52796d3fb251a20807191ff02084d3c-dirty
petr-novak
parents:
10
diff
changeset
|
69 <conditional name="trimming"> |
58807b35777a
planemo upload commit 20bdf879b52796d3fb251a20807191ff02084d3c-dirty
petr-novak
parents:
10
diff
changeset
|
70 <param name="sequence_trimming" type="boolean" truevalue="true" |
58807b35777a
planemo upload commit 20bdf879b52796d3fb251a20807191ff02084d3c-dirty
petr-novak
parents:
10
diff
changeset
|
71 falsevalue="false" checked="False" label="Trim reads"/> |
58807b35777a
planemo upload commit 20bdf879b52796d3fb251a20807191ff02084d3c-dirty
petr-novak
parents:
10
diff
changeset
|
72 <when value="false"> |
58807b35777a
planemo upload commit 20bdf879b52796d3fb251a20807191ff02084d3c-dirty
petr-novak
parents:
10
diff
changeset
|
73 <!-- do nothing here --> |
58807b35777a
planemo upload commit 20bdf879b52796d3fb251a20807191ff02084d3c-dirty
petr-novak
parents:
10
diff
changeset
|
74 </when> |
58807b35777a
planemo upload commit 20bdf879b52796d3fb251a20807191ff02084d3c-dirty
petr-novak
parents:
10
diff
changeset
|
75 <when value="true"> |
58807b35777a
planemo upload commit 20bdf879b52796d3fb251a20807191ff02084d3c-dirty
petr-novak
parents:
10
diff
changeset
|
76 <param type="integer" name="trim_start" label="Start position" value="1" |
58807b35777a
planemo upload commit 20bdf879b52796d3fb251a20807191ff02084d3c-dirty
petr-novak
parents:
10
diff
changeset
|
77 min="1" |
58807b35777a
planemo upload commit 20bdf879b52796d3fb251a20807191ff02084d3c-dirty
petr-novak
parents:
10
diff
changeset
|
78 help="Reads are trimmed at the specified start"/> |
58807b35777a
planemo upload commit 20bdf879b52796d3fb251a20807191ff02084d3c-dirty
petr-novak
parents:
10
diff
changeset
|
79 <param type="integer" name="trim_end" label="End position" value="100" |
58807b35777a
planemo upload commit 20bdf879b52796d3fb251a20807191ff02084d3c-dirty
petr-novak
parents:
10
diff
changeset
|
80 min="1" |
58807b35777a
planemo upload commit 20bdf879b52796d3fb251a20807191ff02084d3c-dirty
petr-novak
parents:
10
diff
changeset
|
81 help="Reads are trimmed to the specified end position, shorter sequences are discarded"/> |
58807b35777a
planemo upload commit 20bdf879b52796d3fb251a20807191ff02084d3c-dirty
petr-novak
parents:
10
diff
changeset
|
82 </when> |
0 | 83 |
22
58807b35777a
planemo upload commit 20bdf879b52796d3fb251a20807191ff02084d3c-dirty
petr-novak
parents:
10
diff
changeset
|
84 </conditional> |
58807b35777a
planemo upload commit 20bdf879b52796d3fb251a20807191ff02084d3c-dirty
petr-novak
parents:
10
diff
changeset
|
85 <param name="max_n" type="integer" label="Maximum Ns" |
58807b35777a
planemo upload commit 20bdf879b52796d3fb251a20807191ff02084d3c-dirty
petr-novak
parents:
10
diff
changeset
|
86 help="Maximal number of Ns allowed in reads" value="0" min="0" max="10"/> |
58807b35777a
planemo upload commit 20bdf879b52796d3fb251a20807191ff02084d3c-dirty
petr-novak
parents:
10
diff
changeset
|
87 |
58807b35777a
planemo upload commit 20bdf879b52796d3fb251a20807191ff02084d3c-dirty
petr-novak
parents:
10
diff
changeset
|
88 <conditional name="cutadapt"> |
58807b35777a
planemo upload commit 20bdf879b52796d3fb251a20807191ff02084d3c-dirty
petr-novak
parents:
10
diff
changeset
|
89 <param name="use_custom" type="boolean" truevalue="true" falsevalue="false" |
58807b35777a
planemo upload commit 20bdf879b52796d3fb251a20807191ff02084d3c-dirty
petr-novak
parents:
10
diff
changeset
|
90 checked="False" label="Custom cutadapt options"/> |
58807b35777a
planemo upload commit 20bdf879b52796d3fb251a20807191ff02084d3c-dirty
petr-novak
parents:
10
diff
changeset
|
91 <when value="false"> |
58807b35777a
planemo upload commit 20bdf879b52796d3fb251a20807191ff02084d3c-dirty
petr-novak
parents:
10
diff
changeset
|
92 <!-- do nothing here --> |
58807b35777a
planemo upload commit 20bdf879b52796d3fb251a20807191ff02084d3c-dirty
petr-novak
parents:
10
diff
changeset
|
93 </when> |
58807b35777a
planemo upload commit 20bdf879b52796d3fb251a20807191ff02084d3c-dirty
petr-novak
parents:
10
diff
changeset
|
94 <when value="true"> |
58807b35777a
planemo upload commit 20bdf879b52796d3fb251a20807191ff02084d3c-dirty
petr-novak
parents:
10
diff
changeset
|
95 <param name="custom_options" type="text" area="True" size="8x30" |
58807b35777a
planemo upload commit 20bdf879b52796d3fb251a20807191ff02084d3c-dirty
petr-novak
parents:
10
diff
changeset
|
96 label="Custom options" help="Consult cutadapt for usage" value=""> |
58807b35777a
planemo upload commit 20bdf879b52796d3fb251a20807191ff02084d3c-dirty
petr-novak
parents:
10
diff
changeset
|
97 <sanitizer sanitize="False"/> |
58807b35777a
planemo upload commit 20bdf879b52796d3fb251a20807191ff02084d3c-dirty
petr-novak
parents:
10
diff
changeset
|
98 </param> |
58807b35777a
planemo upload commit 20bdf879b52796d3fb251a20807191ff02084d3c-dirty
petr-novak
parents:
10
diff
changeset
|
99 |
58807b35777a
planemo upload commit 20bdf879b52796d3fb251a20807191ff02084d3c-dirty
petr-novak
parents:
10
diff
changeset
|
100 </when> |
58807b35777a
planemo upload commit 20bdf879b52796d3fb251a20807191ff02084d3c-dirty
petr-novak
parents:
10
diff
changeset
|
101 </conditional> |
0 | 102 |
22
58807b35777a
planemo upload commit 20bdf879b52796d3fb251a20807191ff02084d3c-dirty
petr-novak
parents:
10
diff
changeset
|
103 <conditional name="similarity_filtering"> |
58807b35777a
planemo upload commit 20bdf879b52796d3fb251a20807191ff02084d3c-dirty
petr-novak
parents:
10
diff
changeset
|
104 <param name="include" type="boolean" truevalue="true" falsevalue="false" |
58807b35777a
planemo upload commit 20bdf879b52796d3fb251a20807191ff02084d3c-dirty
petr-novak
parents:
10
diff
changeset
|
105 checked="False" label="Use similarity search filtering"/> |
58807b35777a
planemo upload commit 20bdf879b52796d3fb251a20807191ff02084d3c-dirty
petr-novak
parents:
10
diff
changeset
|
106 <when value="false"> |
58807b35777a
planemo upload commit 20bdf879b52796d3fb251a20807191ff02084d3c-dirty
petr-novak
parents:
10
diff
changeset
|
107 <!-- do nothing here --> |
58807b35777a
planemo upload commit 20bdf879b52796d3fb251a20807191ff02084d3c-dirty
petr-novak
parents:
10
diff
changeset
|
108 </when> |
58807b35777a
planemo upload commit 20bdf879b52796d3fb251a20807191ff02084d3c-dirty
petr-novak
parents:
10
diff
changeset
|
109 <when value="true"> |
0 | 110 |
22
58807b35777a
planemo upload commit 20bdf879b52796d3fb251a20807191ff02084d3c-dirty
petr-novak
parents:
10
diff
changeset
|
111 <param name="filter_database" format="fasta" type="data" |
58807b35777a
planemo upload commit 20bdf879b52796d3fb251a20807191ff02084d3c-dirty
petr-novak
parents:
10
diff
changeset
|
112 label="Sequence filter database" |
58807b35777a
planemo upload commit 20bdf879b52796d3fb251a20807191ff02084d3c-dirty
petr-novak
parents:
10
diff
changeset
|
113 help="Provide DNA sequences in FASTA format. Reads that have at least 90% similarity over 90% of their length to sequence in the filter database will be removed. This option is suitable for removing organellar or other contaminating sequences."/> |
58807b35777a
planemo upload commit 20bdf879b52796d3fb251a20807191ff02084d3c-dirty
petr-novak
parents:
10
diff
changeset
|
114 </when> |
58807b35777a
planemo upload commit 20bdf879b52796d3fb251a20807191ff02084d3c-dirty
petr-novak
parents:
10
diff
changeset
|
115 </conditional> |
0 | 116 |
22
58807b35777a
planemo upload commit 20bdf879b52796d3fb251a20807191ff02084d3c-dirty
petr-novak
parents:
10
diff
changeset
|
117 <param name="rename" type="boolean" truevalue="-R" falsevalue="" checked="True" |
58807b35777a
planemo upload commit 20bdf879b52796d3fb251a20807191ff02084d3c-dirty
petr-novak
parents:
10
diff
changeset
|
118 label="Rename reads" |
58807b35777a
planemo upload commit 20bdf879b52796d3fb251a20807191ff02084d3c-dirty
petr-novak
parents:
10
diff
changeset
|
119 help="By default, original read names are used. In case your reads do not follow proper naming scheme to label paired-end mates, use this option. All read pairs must be complete!"/> |
58807b35777a
planemo upload commit 20bdf879b52796d3fb251a20807191ff02084d3c-dirty
petr-novak
parents:
10
diff
changeset
|
120 </inputs> |
0 | 121 |
122 | |
22
58807b35777a
planemo upload commit 20bdf879b52796d3fb251a20807191ff02084d3c-dirty
petr-novak
parents:
10
diff
changeset
|
123 <outputs> |
58807b35777a
planemo upload commit 20bdf879b52796d3fb251a20807191ff02084d3c-dirty
petr-novak
parents:
10
diff
changeset
|
124 <data format="fasta" name="paired" |
58807b35777a
planemo upload commit 20bdf879b52796d3fb251a20807191ff02084d3c-dirty
petr-novak
parents:
10
diff
changeset
|
125 label="Interlaced paired reads from datasets ${A.hid} and ${B.hid} "/> |
58807b35777a
planemo upload commit 20bdf879b52796d3fb251a20807191ff02084d3c-dirty
petr-novak
parents:
10
diff
changeset
|
126 <data format="png" name="png_output" |
58807b35777a
planemo upload commit 20bdf879b52796d3fb251a20807191ff02084d3c-dirty
petr-novak
parents:
10
diff
changeset
|
127 label="Nucleotide composition after filtering of ${A.hid} and ${B.hid} "/> |
58807b35777a
planemo upload commit 20bdf879b52796d3fb251a20807191ff02084d3c-dirty
petr-novak
parents:
10
diff
changeset
|
128 </outputs> |
0 | 129 |
130 | |
22
58807b35777a
planemo upload commit 20bdf879b52796d3fb251a20807191ff02084d3c-dirty
petr-novak
parents:
10
diff
changeset
|
131 <tests> |
58807b35777a
planemo upload commit 20bdf879b52796d3fb251a20807191ff02084d3c-dirty
petr-novak
parents:
10
diff
changeset
|
132 <test> |
58807b35777a
planemo upload commit 20bdf879b52796d3fb251a20807191ff02084d3c-dirty
petr-novak
parents:
10
diff
changeset
|
133 <param name="A" value="ERR215189_1_part.fastq.gz"/> |
58807b35777a
planemo upload commit 20bdf879b52796d3fb251a20807191ff02084d3c-dirty
petr-novak
parents:
10
diff
changeset
|
134 <param name="B" value="ERR215189_2_part.fastq.gz"/> |
58807b35777a
planemo upload commit 20bdf879b52796d3fb251a20807191ff02084d3c-dirty
petr-novak
parents:
10
diff
changeset
|
135 <param name="max_n" value="0"/> |
58807b35777a
planemo upload commit 20bdf879b52796d3fb251a20807191ff02084d3c-dirty
petr-novak
parents:
10
diff
changeset
|
136 <param name="cut_off" value="10"/> |
58807b35777a
planemo upload commit 20bdf879b52796d3fb251a20807191ff02084d3c-dirty
petr-novak
parents:
10
diff
changeset
|
137 <param name="percent_above" value="95"/> |
58807b35777a
planemo upload commit 20bdf879b52796d3fb251a20807191ff02084d3c-dirty
petr-novak
parents:
10
diff
changeset
|
138 <!-- name must match the FASTA output declared in the outputs section (data name="paired") --> <output name="paired" value="paired_output.fasta"/> |
58807b35777a
planemo upload commit 20bdf879b52796d3fb251a20807191ff02084d3c-dirty
petr-novak
parents:
10
diff
changeset
|
139 <output name="png_output" value="paired_output.png"/> |
58807b35777a
planemo upload commit 20bdf879b52796d3fb251a20807191ff02084d3c-dirty
petr-novak
parents:
10
diff
changeset
|
140 </test> |
58807b35777a
planemo upload commit 20bdf879b52796d3fb251a20807191ff02084d3c-dirty
petr-novak
parents:
10
diff
changeset
|
141 </tests> |
0 | 142 |
22
58807b35777a
planemo upload commit 20bdf879b52796d3fb251a20807191ff02084d3c-dirty
petr-novak
parents:
10
diff
changeset
|
143 <help> |
58807b35777a
planemo upload commit 20bdf879b52796d3fb251a20807191ff02084d3c-dirty
petr-novak
parents:
10
diff
changeset
|
144 **What it does** |
0 | 145 |
22
58807b35777a
planemo upload commit 20bdf879b52796d3fb251a20807191ff02084d3c-dirty
petr-novak
parents:
10
diff
changeset
|
146 This tool is designed to perform memory-efficient preprocessing of two |
58807b35777a
planemo upload commit 20bdf879b52796d3fb251a20807191ff02084d3c-dirty
petr-novak
parents:
10
diff
changeset
|
147 fastq files. Output of this tool can be used as input of RepeatExplorer |
58807b35777a
planemo upload commit 20bdf879b52796d3fb251a20807191ff02084d3c-dirty
petr-novak
parents:
10
diff
changeset
|
148 clustering. |
58807b35777a
planemo upload commit 20bdf879b52796d3fb251a20807191ff02084d3c-dirty
petr-novak
parents:
10
diff
changeset
|
149 Input files can be gzip-compressed (.gz extension). |
58807b35777a
planemo upload commit 20bdf879b52796d3fb251a20807191ff02084d3c-dirty
petr-novak
parents:
10
diff
changeset
|
150 Reads are filtered based on the quality, presence of N bases and |
58807b35777a
planemo upload commit 20bdf879b52796d3fb251a20807191ff02084d3c-dirty
petr-novak
parents:
10
diff
changeset
|
151 adapters. Two input fastq files are processed in parallel. Only complete pairs |
58807b35777a
planemo upload commit 20bdf879b52796d3fb251a20807191ff02084d3c-dirty
petr-novak
parents:
10
diff
changeset
|
152 are kept. As the input files are processed in chunks, it is required that |
58807b35777a
planemo upload commit 20bdf879b52796d3fb251a20807191ff02084d3c-dirty
petr-novak
parents:
10
diff
changeset
|
153 pair reads are complete and in the same order in both input files. All |
58807b35777a
planemo upload commit 20bdf879b52796d3fb251a20807191ff02084d3c-dirty
petr-novak
parents:
10
diff
changeset
|
154 reads which pass the quality filter will be written into output files. |
58807b35777a
planemo upload commit 20bdf879b52796d3fb251a20807191ff02084d3c-dirty
petr-novak
parents:
10
diff
changeset
|
155 If sampling is specified, only sample of sequences will be |
58807b35777a
planemo upload commit 20bdf879b52796d3fb251a20807191ff02084d3c-dirty
petr-novak
parents:
10
diff
changeset
|
156 returned. Cutadapt is run with these options:: |
0 | 157 |
22
58807b35777a
planemo upload commit 20bdf879b52796d3fb251a20807191ff02084d3c-dirty
petr-novak
parents:
10
diff
changeset
|
158 --anywhere='AATGATACGGCGACCACCGAGATCTACACTCTTTCCCTACACGACGCTCTTCCGATCT' |
58807b35777a
planemo upload commit 20bdf879b52796d3fb251a20807191ff02084d3c-dirty
petr-novak
parents:
10
diff
changeset
|
159 --anywhere='AGATCGGAAGAGCGTCGTGTAGGGAAAGAGTGTAGATCTCGGTGGTCGCCGTATCATT' |
58807b35777a
planemo upload commit 20bdf879b52796d3fb251a20807191ff02084d3c-dirty
petr-novak
parents:
10
diff
changeset
|
160 --anywhere='GATCGGAAGAGCACACGTCTGAACTCCAGTCAC' |
58807b35777a
planemo upload commit 20bdf879b52796d3fb251a20807191ff02084d3c-dirty
petr-novak
parents:
10
diff
changeset
|
161 --anywhere='ATCTCGTATGCCGTCTTCTGCTTG' |
58807b35777a
planemo upload commit 20bdf879b52796d3fb251a20807191ff02084d3c-dirty
petr-novak
parents:
10
diff
changeset
|
162 --anywhere='CAAGCAGAAGACGGCATACGAGAT' |
58807b35777a
planemo upload commit 20bdf879b52796d3fb251a20807191ff02084d3c-dirty
petr-novak
parents:
10
diff
changeset
|
163 --anywhere='GTGACTGGAGTTCAGACGTGTGCTCTTCCGATC' |
58807b35777a
planemo upload commit 20bdf879b52796d3fb251a20807191ff02084d3c-dirty
petr-novak
parents:
10
diff
changeset
|
164 --error-rate=0.05 |
58807b35777a
planemo upload commit 20bdf879b52796d3fb251a20807191ff02084d3c-dirty
petr-novak
parents:
10
diff
changeset
|
165 --times=1 --overlap=15 --discard |
0 | 166 |
167 | |
22
58807b35777a
planemo upload commit 20bdf879b52796d3fb251a20807191ff02084d3c-dirty
petr-novak
parents:
10
diff
changeset
|
168 **Order of fastq files processing** |
0 | 169 |
22
58807b35777a
planemo upload commit 20bdf879b52796d3fb251a20807191ff02084d3c-dirty
petr-novak
parents:
10
diff
changeset
|
170 1. Trimming (optional) |
58807b35777a
planemo upload commit 20bdf879b52796d3fb251a20807191ff02084d3c-dirty
petr-novak
parents:
10
diff
changeset
|
171 #. Filter by quality |
58807b35777a
planemo upload commit 20bdf879b52796d3fb251a20807191ff02084d3c-dirty
petr-novak
parents:
10
diff
changeset
|
172 #. Discard single reads, keep complete pairs |
58807b35777a
planemo upload commit 20bdf879b52796d3fb251a20807191ff02084d3c-dirty
petr-novak
parents:
10
diff
changeset
|
173 #. Cutadapt filtering |
58807b35777a
planemo upload commit 20bdf879b52796d3fb251a20807191ff02084d3c-dirty
petr-novak
parents:
10
diff
changeset
|
174 #. Discard single reads, keep complete pairs |
58807b35777a
planemo upload commit 20bdf879b52796d3fb251a20807191ff02084d3c-dirty
petr-novak
parents:
10
diff
changeset
|
175 #. Sampling (optional) |
58807b35777a
planemo upload commit 20bdf879b52796d3fb251a20807191ff02084d3c-dirty
petr-novak
parents:
10
diff
changeset
|
176 #. Interlacing two fasta files |
0 | 177 |
22
58807b35777a
planemo upload commit 20bdf879b52796d3fb251a20807191ff02084d3c-dirty
petr-novak
parents:
10
diff
changeset
|
178 **Quality setting cutoff** |
0 | 179 |
22
58807b35777a
planemo upload commit 20bdf879b52796d3fb251a20807191ff02084d3c-dirty
petr-novak
parents:
10
diff
changeset
|
180 To correctly set quality cutoff, you need to know how the quality is encoded in |
58807b35777a
planemo upload commit 20bdf879b52796d3fb251a20807191ff02084d3c-dirty
petr-novak
parents:
10
diff
changeset
|
181 your fastq file, default |
58807b35777a
planemo upload commit 20bdf879b52796d3fb251a20807191ff02084d3c-dirty
petr-novak
parents:
10
diff
changeset
|
182 filtering which is suitable for Sanger and Illumina 1.8 encoding is shown below:: |
0 | 183 |
184 | |
22
58807b35777a
planemo upload commit 20bdf879b52796d3fb251a20807191ff02084d3c-dirty
petr-novak
parents:
10
diff
changeset
|
185 Default filtering cutoff |
58807b35777a
planemo upload commit 20bdf879b52796d3fb251a20807191ff02084d3c-dirty
petr-novak
parents:
10
diff
changeset
|
186 | |
58807b35777a
planemo upload commit 20bdf879b52796d3fb251a20807191ff02084d3c-dirty
petr-novak
parents:
10
diff
changeset
|
187 | |
58807b35777a
planemo upload commit 20bdf879b52796d3fb251a20807191ff02084d3c-dirty
petr-novak
parents:
10
diff
changeset
|
188 V |
58807b35777a
planemo upload commit 20bdf879b52796d3fb251a20807191ff02084d3c-dirty
petr-novak
parents:
10
diff
changeset
|
189 SSSSSSSSSSSSSSSSSSSSSSSSSSSSSSSSSSSSSSSSS..................................................... |
58807b35777a
planemo upload commit 20bdf879b52796d3fb251a20807191ff02084d3c-dirty
petr-novak
parents:
10
diff
changeset
|
190 ..........................XXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXX...................... |
58807b35777a
planemo upload commit 20bdf879b52796d3fb251a20807191ff02084d3c-dirty
petr-novak
parents:
10
diff
changeset
|
191 ...............................IIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIII...................... |
58807b35777a
planemo upload commit 20bdf879b52796d3fb251a20807191ff02084d3c-dirty
petr-novak
parents:
10
diff
changeset
|
192 .................................JJJJJJJJJJJJJJJJJJJJJJJJJJJJJJJJJJJJJJJ...................... |
58807b35777a
planemo upload commit 20bdf879b52796d3fb251a20807191ff02084d3c-dirty
petr-novak
parents:
10
diff
changeset
|
193 LLLLLLLLLLLLLLLLLLLLLLLLLLLLLLLLLLLLLLLLLL.................................................... |
58807b35777a
planemo upload commit 20bdf879b52796d3fb251a20807191ff02084d3c-dirty
petr-novak
parents:
10
diff
changeset
|
194 !"#$%&'()*+,-./0123456789:;<=>?@ABCDEFGHIJKLMNOPQRSTUVWXYZ[\]^_`abcdefghijklmnopqrstuvwxyz{|}~ |
58807b35777a
planemo upload commit 20bdf879b52796d3fb251a20807191ff02084d3c-dirty
petr-novak
parents:
10
diff
changeset
|
195 | | | | | | |
58807b35777a
planemo upload commit 20bdf879b52796d3fb251a20807191ff02084d3c-dirty
petr-novak
parents:
10
diff
changeset
|
196 33 59 64 73 104 126 |
58807b35777a
planemo upload commit 20bdf879b52796d3fb251a20807191ff02084d3c-dirty
petr-novak
parents:
10
diff
changeset
|
197 0........................26...31.......40 |
58807b35777a
planemo upload commit 20bdf879b52796d3fb251a20807191ff02084d3c-dirty
petr-novak
parents:
10
diff
changeset
|
198 -5....0........9.............................40 |
58807b35777a
planemo upload commit 20bdf879b52796d3fb251a20807191ff02084d3c-dirty
petr-novak
parents:
10
diff
changeset
|
199 0........9.............................40 |
58807b35777a
planemo upload commit 20bdf879b52796d3fb251a20807191ff02084d3c-dirty
petr-novak
parents:
10
diff
changeset
|
200 3.....9.............................40 |
58807b35777a
planemo upload commit 20bdf879b52796d3fb251a20807191ff02084d3c-dirty
petr-novak
parents:
10
diff
changeset
|
201 0.2......................26...31........41 |
58807b35777a
planemo upload commit 20bdf879b52796d3fb251a20807191ff02084d3c-dirty
petr-novak
parents:
10
diff
changeset
|
202 |
58807b35777a
planemo upload commit 20bdf879b52796d3fb251a20807191ff02084d3c-dirty
petr-novak
parents:
10
diff
changeset
|
203 S - Sanger Phred+33, raw reads typically (0, 40) |
58807b35777a
planemo upload commit 20bdf879b52796d3fb251a20807191ff02084d3c-dirty
petr-novak
parents:
10
diff
changeset
|
204 X - Solexa Solexa+64, raw reads typically (-5, 40) |
58807b35777a
planemo upload commit 20bdf879b52796d3fb251a20807191ff02084d3c-dirty
petr-novak
parents:
10
diff
changeset
|
205 I - Illumina 1.3+ Phred+64, raw reads typically (0, 40) |
58807b35777a
planemo upload commit 20bdf879b52796d3fb251a20807191ff02084d3c-dirty
petr-novak
parents:
10
diff
changeset
|
206 J - Illumina 1.5+ Phred+64, raw reads typically (3, 40) |
58807b35777a
planemo upload commit 20bdf879b52796d3fb251a20807191ff02084d3c-dirty
petr-novak
parents:
10
diff
changeset
|
207 with 0=unused, 1=unused, 2=Read Segment Quality Control Indicator (bold) |
58807b35777a
planemo upload commit 20bdf879b52796d3fb251a20807191ff02084d3c-dirty
petr-novak
parents:
10
diff
changeset
|
208 (Note: See discussion above). |
58807b35777a
planemo upload commit 20bdf879b52796d3fb251a20807191ff02084d3c-dirty
petr-novak
parents:
10
diff
changeset
|
209 L - Illumina 1.8+ Phred+33, raw reads typically (0, 41) |
58807b35777a
planemo upload commit 20bdf879b52796d3fb251a20807191ff02084d3c-dirty
petr-novak
parents:
10
diff
changeset
|
210 |
58807b35777a
planemo upload commit 20bdf879b52796d3fb251a20807191ff02084d3c-dirty
petr-novak
parents:
10
diff
changeset
|
211 </help> |
0 | 212 </tool> |
213 |