comparison fastq_quality_trimmer.xml @ 0:27e997d5c273 draft default tip

"planemo upload for repository https://github.com/ebi-gene-expression-group/container-galaxy-sc-tertiary/tree/develop/tools/qc/fastq_quality_trimmer commit b8f23cd5bce0118cc9aab61253056b596e42a06f"
author ebi-gxa
date Fri, 11 Mar 2022 03:56:00 +0000
parents
children
comparison
equal deleted inserted replaced
-1:000000000000 0:27e997d5c273
1 <tool id="cshl_fastq_quality_trimmer" name="Trim By Quality" profile="18.01" version="0.0.14+galaxy0">
2 <description>Trims reads at the 3'-end based on quality, discarding reads with trimmed length less than threshold.</description>
3 <requirements>
4 <requirement type="package" version="0.0.14">fastx_toolkit</requirement>
5 </requirements>
6 <command><![CDATA[
7 fastq_quality_trimmer
8 -i '$input'
9 -t '$cutoff'
10 -l '$minlen'
11 -Q '$phred'
12 -v
13 -o '$output'
14 ]]></command>
15
16 <inputs>
17 <param name="input" label="Library to clip" argument="-i" type="data" format="fastq,fastqsanger" optional="false" />
18 <param name="cutoff" size="4" type="integer" value="20">
19 <label>Minimum quality score</label>
20 <help>Nucleotides below this quality will be trimmed</help>
21 </param>
22 <param name="minlen" size="4" type="integer" value="1">
23 <label>Minimum sequence length</label>
24 <help>Sequences shorter than this length will be discard. Leave at zero to keep all sequences</help>
25 </param>
26 <param name="phred" label="PHRED Encoding" argument="-Q" type="select" help="PHRED encoding used in the input files">
27 <option value="33" selected="true">33</option>
28 <option value="64">64</option>
29 </param>
30 </inputs>
31
32 <outputs>
33 <data label="${tool.name} on ${on_string}: Trimmed fastq" name="output" format_source="input" />
34 </outputs>
35
36 <tests>
37 <test>
38 <param name="input" value="fastq_quality_trimmer.fastq" ftype="fastq" />
39 <param name="cutoff" value="30"/>
40 <param name="minlen" value="16"/>
41 <param name="phred" value="64"/>
42 <output name="output" md5="5173e32392286a05e1317387cc0d567e" />
43 </test>
44 </tests>
45
46 <help>
47 **What it does**
48
49 This tool scans the sequence from the end for the first nucleotide to possess the specified minimum quality score. It will then trim (remove nucleotides from) the sequence after this position. After trimming, sequences that are shorter than the minimum length are discarded.
50
51 --------
52
53 **Example**
54
55 Input Fasta file (with 20 bases in each sequences)::
56
57 @1
58 TATGGTCAGAAACCATATGC
59 +1
60 40 40 40 40 40 40 40 40 40 40 40 20 19 19 19 19 19 19 19 19
61 @2
62 CAGCGAGGCTTTAATGCCAT
63 +2
64 40 40 40 40 40 40 40 40 30 20 19 20 19 19 19 19 19 19 19 19
65 @3
66 CAGCGAGGCTTTAATGCCAT
67 +3
68 40 40 40 40 40 40 40 40 20 19 19 19 19 19 19 19 19 19 19 19
69
70
71 Trimming with a cutoff of 20, we get the following FASTQ file::
72
73 @1
74 TATGGTCAGAAA
75 +1
76 40 40 40 40 40 40 40 40 40 40 40 20
77 @2
78 CAGCGAGGCTTT
79 +2
80 40 40 40 40 40 40 40 40 30 20 19 20
81 @3
82 CAGCGAGGC
83 +3
84 40 40 40 40 40 40 40 40 20
85
86 Trimming with a cutoff of 20 and a minimum length of 12, we get the following FASTQ file::
87
88 @1
89 TATGGTCAGAAA
90 +1
91 40 40 40 40 40 40 40 40 40 40 40 20
92 @2
93 CAGCGAGGCTTT
94 +2
95 40 40 40 40 40 40 40 40 30 20 19 20
96
97 ------
98
99 This tool is based on `FASTX-toolkit`__ by Assaf Gordon.
100
101 .. __: http://hannonlab.cshl.edu/fastx_toolkit/
102
103 </help>
104 <citations>
105 <citation type="bibtex"><![CDATA[
106 @ARTICLE{Gordon2009,
107 author = {Gordon, A.},
108 title = {fastx_toolkit},
109 year = {2009},
110 publisher = {GitHub},
111 journal = {GitHub repository},
112 howpublished = {\url{https://github.com/agordon/fastx_toolkit}},
113 commit = {ea0ca83ba24dce80c20ca589b838a281fe5deb0c}
114 }]]></citation>
115 </citations>
116 </tool>
117 <!-- FASTX-Quality-Trimmer is part of the FASTX-toolkit, by A.Gordon (gordon@cshl.edu) -->