annotate diamond_makedb.xml @ 49:a203fc50858c draft

Uploaded
author p.lucas
date Tue, 04 Jun 2024 15:07:42 +0000
parents 2474240f89ff
children
Ignore whitespace changes - Everywhere: Within whitespace: At end of lines:
rev   line source
42
2474240f89ff Uploaded
p.lucas
parents:
diff changeset
1 <tool id="pl_diamond_makedb" name="PL_Diamond makedb" version="@TOOL_VERSION@+galaxy@VERSION_SUFFIX@" profile="19.01">
2474240f89ff Uploaded
p.lucas
parents:
diff changeset
2 <description>Build database from a FASTA file</description>
2474240f89ff Uploaded
p.lucas
parents:
diff changeset
3 <macros>
2474240f89ff Uploaded
p.lucas
parents:
diff changeset
4 <import>macros.xml</import>
2474240f89ff Uploaded
p.lucas
parents:
diff changeset
5 </macros>
2474240f89ff Uploaded
p.lucas
parents:
diff changeset
6
2474240f89ff Uploaded
p.lucas
parents:
diff changeset
7 <expand macro="stdio" />
2474240f89ff Uploaded
p.lucas
parents:
diff changeset
8 <expand macro="version_command" />
2474240f89ff Uploaded
p.lucas
parents:
diff changeset
9
2474240f89ff Uploaded
p.lucas
parents:
diff changeset
10 <command detect_errors="aggressive">
2474240f89ff Uploaded
p.lucas
parents:
diff changeset
11 <!-- DB has two files, *.dmnd and *.tx -->
2474240f89ff Uploaded
p.lucas
parents:
diff changeset
12 <![CDATA[
2474240f89ff Uploaded
p.lucas
parents:
diff changeset
13 /usr/bin/diamond makedb
2474240f89ff Uploaded
p.lucas
parents:
diff changeset
14 --threads "\${GALAXY_SLOTS:-12}"
2474240f89ff Uploaded
p.lucas
parents:
diff changeset
15 --in '$infile'
2474240f89ff Uploaded
p.lucas
parents:
diff changeset
16 --db ./database
2474240f89ff Uploaded
p.lucas
parents:
diff changeset
17
2474240f89ff Uploaded
p.lucas
parents:
diff changeset
18 #if str($tax_cond.tax_select) == 'yes':
2474240f89ff Uploaded
p.lucas
parents:
diff changeset
19 --taxonmap '$tax_cond.taxonmap'
2474240f89ff Uploaded
p.lucas
parents:
diff changeset
20 --taxonnodes '$tax_cond.taxonnodes'
2474240f89ff Uploaded
p.lucas
parents:
diff changeset
21 --taxonnames '$tax_cond.taxonnames'
2474240f89ff Uploaded
p.lucas
parents:
diff changeset
22 #end if
2474240f89ff Uploaded
p.lucas
parents:
diff changeset
23 ]]>
2474240f89ff Uploaded
p.lucas
parents:
diff changeset
24 </command>
2474240f89ff Uploaded
p.lucas
parents:
diff changeset
25
2474240f89ff Uploaded
p.lucas
parents:
diff changeset
26 <inputs>
2474240f89ff Uploaded
p.lucas
parents:
diff changeset
27 <param name="infile" type="data" format="fasta" label="Input reference file in FASTA format" />
2474240f89ff Uploaded
p.lucas
parents:
diff changeset
28 <conditional name="tax_cond">
2474240f89ff Uploaded
p.lucas
parents:
diff changeset
29 <param name="tax_select" type="select" label="Add taxonomic data?" help="Needs to be supplied in order to provide taxonomy features of the aligner">
2474240f89ff Uploaded
p.lucas
parents:
diff changeset
30 <option value="yes">Yes</option>
2474240f89ff Uploaded
p.lucas
parents:
diff changeset
31 <option value="no" selected="true">No</option>
2474240f89ff Uploaded
p.lucas
parents:
diff changeset
32 </param>
2474240f89ff Uploaded
p.lucas
parents:
diff changeset
33 <when value="yes">
2474240f89ff Uploaded
p.lucas
parents:
diff changeset
34 <param argument="--taxonmap" type="data" format="tabular"
2474240f89ff Uploaded
p.lucas
parents:
diff changeset
35 label="Protein accession to taxid mapping file"
2474240f89ff Uploaded
p.lucas
parents:
diff changeset
36 help="Path to mapping file that maps NCBI protein accession numbers to taxon ids (gzip compressed). This parameter is optional and needs to be supplied in order to provide taxonomy features.
2474240f89ff Uploaded
p.lucas
parents:
diff changeset
37 A custom file following the same format may be supplied here. Note that the first line of this file is assumed to contain headings and will be ignored" />
2474240f89ff Uploaded
p.lucas
parents:
diff changeset
38 <param argument="--taxonnodes" type="data" format="tabular" label="Taxonomy nodes.dmp from NCBI" help="This parameter is optional and needs to be supplied in order to provide taxonomy features" />
2474240f89ff Uploaded
p.lucas
parents:
diff changeset
39 <param argument="--taxonnames" type="data" format="tabular" label="Taxonomy names.dmp from NCBI" help="This parameter is optional and needs to be supplied in order to provide taxonomy features" />
2474240f89ff Uploaded
p.lucas
parents:
diff changeset
40 </when>
2474240f89ff Uploaded
p.lucas
parents:
diff changeset
41 <when value="no"/>
2474240f89ff Uploaded
p.lucas
parents:
diff changeset
42 </conditional>
2474240f89ff Uploaded
p.lucas
parents:
diff changeset
43 </inputs>
2474240f89ff Uploaded
p.lucas
parents:
diff changeset
44
2474240f89ff Uploaded
p.lucas
parents:
diff changeset
45 <outputs>
2474240f89ff Uploaded
p.lucas
parents:
diff changeset
46 <data format="dmnd" name="outfile" from_work_dir="database.dmnd" label="${tool.name} on ${on_string}"/>
2474240f89ff Uploaded
p.lucas
parents:
diff changeset
47 </outputs>
2474240f89ff Uploaded
p.lucas
parents:
diff changeset
48
2474240f89ff Uploaded
p.lucas
parents:
diff changeset
49 <help>
2474240f89ff Uploaded
p.lucas
parents:
diff changeset
50 <![CDATA[
2474240f89ff Uploaded
p.lucas
parents:
diff changeset
51
2474240f89ff Uploaded
p.lucas
parents:
diff changeset
52 .. class:: infomark
2474240f89ff Uploaded
p.lucas
parents:
diff changeset
53
2474240f89ff Uploaded
p.lucas
parents:
diff changeset
54 **What it does**
2474240f89ff Uploaded
p.lucas
parents:
diff changeset
55
2474240f89ff Uploaded
p.lucas
parents:
diff changeset
56 DIAMOND_ is a new alignment tool for aligning short DNA sequencing reads to a protein reference database such as NCBI-NR.
2474240f89ff Uploaded
p.lucas
parents:
diff changeset
57 On Illumina reads of length 100-150bp, in fast mode, DIAMOND is about 20,000 times faster than BLASTX, while reporting
2474240f89ff Uploaded
p.lucas
parents:
diff changeset
58 about 80-90% of all matches that BLASTX finds, with an e-value of at most 1e-5. In sensitive mode, DIAMOND is about 2,500
2474240f89ff Uploaded
p.lucas
parents:
diff changeset
59 times faster than BLASTX, finding more than 94% of all matches.
2474240f89ff Uploaded
p.lucas
parents:
diff changeset
60
2474240f89ff Uploaded
p.lucas
parents:
diff changeset
61 .. _DIAMOND: http://ab.inf.uni-tuebingen.de/software/diamond/
2474240f89ff Uploaded
p.lucas
parents:
diff changeset
62
2474240f89ff Uploaded
p.lucas
parents:
diff changeset
63
2474240f89ff Uploaded
p.lucas
parents:
diff changeset
64 - taxonmap: Path to the mapping file that maps NCBI protein accession numbers to taxon ids (gzip compressed). This parameter is optional, but it must be supplied to enable taxonomy features. The file can be downloaded from NCBI: ftp://ftp.ncbi.nlm.nih.gov/pub/taxonomy/accession2taxid/prot.accession2taxid.gz
2474240f89ff Uploaded
p.lucas
parents:
diff changeset
65
2474240f89ff Uploaded
p.lucas
parents:
diff changeset
66 - taxonnames: Path to the names.dmp file from the NCBI taxonomy. This parameter is optional, but it must be supplied to enable taxonomy features. The file is contained in the taxdmp.zip archive, which can be downloaded from NCBI: ftp://ftp.ncbi.nlm.nih.gov/pub/taxonomy/taxdmp.zip
2474240f89ff Uploaded
p.lucas
parents:
diff changeset
67
2474240f89ff Uploaded
p.lucas
parents:
diff changeset
68 - taxonnodes: Path to the nodes.dmp file from the NCBI taxonomy. This parameter is optional, but it must be supplied to enable taxonomy features. The file is contained in the taxdmp.zip archive, which can be downloaded from NCBI: ftp://ftp.ncbi.nlm.nih.gov/pub/taxonomy/taxdmp.zip
2474240f89ff Uploaded
p.lucas
parents:
diff changeset
69 ]]>
2474240f89ff Uploaded
p.lucas
parents:
diff changeset
70 </help>
2474240f89ff Uploaded
p.lucas
parents:
diff changeset
71
2474240f89ff Uploaded
p.lucas
parents:
diff changeset
72 <expand macro="citations" />
2474240f89ff Uploaded
p.lucas
parents:
diff changeset
73 </tool>