comparison dorado_trimming.xml @ 0:1957f881bdf4 draft

planemo upload for repository https://github.com/usegalaxy-au/tools-au/tree/master/tools/dorado commit 8f48f7ee85162eeaa9c0247c7bb7d699f84d6ca7
author galaxy-australia
date Mon, 04 Nov 2024 03:27:55 +0000
parents
children 7ff7680fa713
comparison
equal deleted inserted replaced
-1:000000000000 0:1957f881bdf4
1 <tool id="dorado_trimming" name="Dorado adapter and primer trimming" version="@VERSION@+galaxy0" python_template_version="3.5" profile="24.1">
2 <description>for Oxford Nanopore (ONT) DNA reads</description>
3 <macros>
4 <import>macros.xml</import>
5 </macros>
6 <expand macro="xrefs"/>
7 <expand macro="requirements"/>
8 <command detect_errors="exit_code"><![CDATA[
9
10 ln -s '$reads' ./reads
11
12 &&
13
14 dorado trim
15 --verbose
16 --threads "\${GALAXY_SLOTS}"
17 #if $no_trim_primers
18 --no-trim-primers
19 #end if
20 #if $primer_sequences
21 --primer-sequences '$primer_sequences'
22 #end if
23 reads
24 > trimmed.bam
25
26 &&
27
28 dorado summary
29 trimmed.bam
30 > summary.tsv
31
32
33 ]]></command>
34 <inputs>
35 <param name="reads" type="data" format="bam,fastqsanger,unsorted.bam" label="Existing, basecalled DNA dataset" help="Note: this tool does not support trimming adaptors from RNA reads. These need to be removed during basecalling."/>
36 <param argument="--no-trim-primers" type="boolean" label="Don't trim primers" help="This option can be used to prevent the trimming of primer sequences. In this case only adapter sequences will be trimmed."/>
37 <param argument="--primer-sequences" type="data" format="fasta" optional="true" label="Custom primer sequences" help="You can specify an alternative set of primer sequences to search for when trimming by adding a FASTA file containing the primer sequences you want to search for. The record names of the sequences do not matter. Note that if you use this option the normal primer sequences built-in to the dorado software will not be searched for."/>
38 </inputs>
39 <outputs>
40 <data format="unsorted.bam" name="out_bam" label="Reads from ${on_string} trimmed by the ${tool.name} tool" from_work_dir="trimmed.bam"/>
41 <data format="tsv" name="out_tsv" label="${tool.name} sequencing summary for ${on_string}" from_work_dir="summary.tsv"/>
42 </outputs>
43 <tests>
44 <test expect_num_outputs="2">
45 <param name="reads" value="FAL00375_473bf0ed_0.ten_reads.bam"/>
46 <output name="out_bam" ftype="unsorted.bam" file="dorado_trimming_test1.bam"/>
47 <output name="out_tsv" ftype="tsv" file="dorado_trimming_test1.tsv"/>
48 </test>
49 <test expect_num_outputs="2">
50 <param name="reads" value="FAL00375_473bf0ed_0.ten_reads.bam"/>
51 <param name="no_trim_primers" value="True"/>
52 <output name="out_bam" ftype="unsorted.bam" file="dorado_trimming_test2.bam"/>
53 <output name="out_tsv" ftype="tsv" file="dorado_trimming_test2.tsv"/>
54 </test>
55 <test expect_num_outputs="2">
56 <param name="reads" value="lsk109_single_read.fastqsanger.gz" ftype="fastqsanger.gz"/>
57 <param name="primer_sequences" value="custom_primers.fasta.gz" ftype="fasta.gz"/>
58 <output name="out_bam" ftype="unsorted.bam" file="dorado_trimming_test3.bam"/>
59 <output name="out_tsv" ftype="tsv" file="dorado_trimming_test3.tsv"/>
60 </test>
61 </tests>
62 <help><![CDATA[
63 Detect and remove any adapter and/or primer sequences from the beginning
64 and end of DNA reads using Oxford Nanopore’s open source
65 `Dorado <https://github.com/nanoporetech/dorado/>`__ basecaller.
66
67 This tool scans existing, basecalled datasets for adapter and/or primer
68 sequences at either end, and trims any such found sequences.
69
70 **If you have raw (un-basecalled) data, you can trim them during
71 basecalling with the Dorado tool on Galaxy**.
72
73 Note that if you intend to demultiplex the reads later, trimming
74 adapters and primers may result in some portions of the flanking regions
75 of the barcodes being removed, which could interfere with correct
76 demultiplexing.
77
78 The **Don't trim primers** option can be used to prevent the trimming of
79 primer sequences. In this case only adapter sequences will be trimmed.
80
81 The output of will always be unaligned records, regardless of whether
82 the input is aligned/sorted or not.
83
84 Custom primer trimming
85 ----------------------
86
87 The software automatically searches for primer sequences used in Oxford
88 Nanopore kits. However, you can specify an alternative set of primer
89 sequences to search by adding a FASTA file of primer sequences in the
90 **Custom primer sequences** option. The record names of the sequences do
91 not matter. Note that if you use this option the normal primer sequences
92 built-in to the dorado software will not be searched for.
93
94 RNA adapter trimming
95 --------------------
96
97 Adapters for RNA002 and RNA004 kits are automatically trimmed during
98 basecalling. However, unlike in DNA, the RNA adapter cannot be trimmed
99 post-basecalling.
100 ]]></help>
101 <expand macro="citation"/>
102 </tool>