annotate diamond_makedb.xml @ 6:bd12f97bf39d draft

Uploaded table sample
author p.lucas
date Tue, 28 May 2024 12:55:16 +0000
parents f7ebcfa91ab4
children 849e9c51fe6b
Ignore whitespace changes - Everywhere: Within whitespace: At end of lines:
rev   line source
2
f7ebcfa91ab4 Uploaded makedb
p.lucas
parents:
diff changeset
1 <tool id="bg_diamond_makedb" name="Diamond makedb" version="@TOOL_VERSION@+galaxy@VERSION_SUFFIX@" profile="19.01">
f7ebcfa91ab4 Uploaded makedb
p.lucas
parents:
diff changeset
2 <description>Build database from a FASTA file</description>
f7ebcfa91ab4 Uploaded makedb
p.lucas
parents:
diff changeset
3 <macros>
f7ebcfa91ab4 Uploaded makedb
p.lucas
parents:
diff changeset
4 <import>macros.xml</import>
f7ebcfa91ab4 Uploaded makedb
p.lucas
parents:
diff changeset
5 </macros>
f7ebcfa91ab4 Uploaded makedb
p.lucas
parents:
diff changeset
6
f7ebcfa91ab4 Uploaded makedb
p.lucas
parents:
diff changeset
7 <expand macro="stdio" />
f7ebcfa91ab4 Uploaded makedb
p.lucas
parents:
diff changeset
8 <expand macro="version_command" />
f7ebcfa91ab4 Uploaded makedb
p.lucas
parents:
diff changeset
9
f7ebcfa91ab4 Uploaded makedb
p.lucas
parents:
diff changeset
10 <command detect_errors="aggressive">
f7ebcfa91ab4 Uploaded makedb
p.lucas
parents:
diff changeset
11 <!-- DB has two files, *.dmnd and *.tx -->
f7ebcfa91ab4 Uploaded makedb
p.lucas
parents:
diff changeset
12 <![CDATA[
f7ebcfa91ab4 Uploaded makedb
p.lucas
parents:
diff changeset
13 /usr/bin/diamond makedb
f7ebcfa91ab4 Uploaded makedb
p.lucas
parents:
diff changeset
14 --threads "\${GALAXY_SLOTS:-12}"
f7ebcfa91ab4 Uploaded makedb
p.lucas
parents:
diff changeset
15 --in '$infile'
f7ebcfa91ab4 Uploaded makedb
p.lucas
parents:
diff changeset
16 --db ./database
f7ebcfa91ab4 Uploaded makedb
p.lucas
parents:
diff changeset
17
f7ebcfa91ab4 Uploaded makedb
p.lucas
parents:
diff changeset
18 #if str($tax_cond.tax_select) == 'yes':
f7ebcfa91ab4 Uploaded makedb
p.lucas
parents:
diff changeset
19 --taxonmap '$tax_cond.taxonmap'
f7ebcfa91ab4 Uploaded makedb
p.lucas
parents:
diff changeset
20 --taxonnodes '$tax_cond.taxonnodes'
f7ebcfa91ab4 Uploaded makedb
p.lucas
parents:
diff changeset
21 --taxonnames '$tax_cond.taxonnames'
f7ebcfa91ab4 Uploaded makedb
p.lucas
parents:
diff changeset
22 #end if
f7ebcfa91ab4 Uploaded makedb
p.lucas
parents:
diff changeset
23 ]]>
f7ebcfa91ab4 Uploaded makedb
p.lucas
parents:
diff changeset
24 </command>
f7ebcfa91ab4 Uploaded makedb
p.lucas
parents:
diff changeset
25
f7ebcfa91ab4 Uploaded makedb
p.lucas
parents:
diff changeset
26 <inputs>
f7ebcfa91ab4 Uploaded makedb
p.lucas
parents:
diff changeset
27 <param name="infile" type="data" format="fasta" label="Input reference file in FASTA format" />
f7ebcfa91ab4 Uploaded makedb
p.lucas
parents:
diff changeset
28 <conditional name="tax_cond">
f7ebcfa91ab4 Uploaded makedb
p.lucas
parents:
diff changeset
29 <param name="tax_select" type="select" label="Add taxonomic data?" help="Needs to be supplied in order to provide taxonomy features of the aligner">
f7ebcfa91ab4 Uploaded makedb
p.lucas
parents:
diff changeset
30 <option value="yes">Yes</option>
f7ebcfa91ab4 Uploaded makedb
p.lucas
parents:
diff changeset
31 <option value="no" selected="true">No</option>
f7ebcfa91ab4 Uploaded makedb
p.lucas
parents:
diff changeset
32 </param>
f7ebcfa91ab4 Uploaded makedb
p.lucas
parents:
diff changeset
33 <when value="yes">
f7ebcfa91ab4 Uploaded makedb
p.lucas
parents:
diff changeset
34 <param argument="--taxonmap" type="data" format="tabular"
f7ebcfa91ab4 Uploaded makedb
p.lucas
parents:
diff changeset
35 label="Protein accession to taxid mapping file"
f7ebcfa91ab4 Uploaded makedb
p.lucas
parents:
diff changeset
36 help="Path to mapping file that maps NCBI protein accession numbers to taxon ids (gzip compressed). This parameter is optional and needs to be supplied in order to provide taxonomy features.
f7ebcfa91ab4 Uploaded makedb
p.lucas
parents:
diff changeset
37 A custom file following the same format may be supplied here. Note that the first line of this file is assumed to contain headings and will be ignored" />
f7ebcfa91ab4 Uploaded makedb
p.lucas
parents:
diff changeset
38 <param argument="--taxonnodes" type="data" format="tabular" label="Taxonomy nodes.dmp from NCBI" help="This parameter is optional and needs to be supplied in order to provide taxonomy features" />
f7ebcfa91ab4 Uploaded makedb
p.lucas
parents:
diff changeset
39 <param argument="--taxonnames" type="data" format="tabular" label="Taxonomy names.dmp from NCBI" help="This parameter is optional and needs to be supplied in order to provide taxonomy features" />
f7ebcfa91ab4 Uploaded makedb
p.lucas
parents:
diff changeset
40 </when>
f7ebcfa91ab4 Uploaded makedb
p.lucas
parents:
diff changeset
41 <when value="no"/>
f7ebcfa91ab4 Uploaded makedb
p.lucas
parents:
diff changeset
42 </conditional>
f7ebcfa91ab4 Uploaded makedb
p.lucas
parents:
diff changeset
43 </inputs>
f7ebcfa91ab4 Uploaded makedb
p.lucas
parents:
diff changeset
44
f7ebcfa91ab4 Uploaded makedb
p.lucas
parents:
diff changeset
45 <outputs>
f7ebcfa91ab4 Uploaded makedb
p.lucas
parents:
diff changeset
46 <data format="dmnd" name="outfile" from_work_dir="database.dmnd" label="${tool.name} on ${on_string}"/>
f7ebcfa91ab4 Uploaded makedb
p.lucas
parents:
diff changeset
47 </outputs>
f7ebcfa91ab4 Uploaded makedb
p.lucas
parents:
diff changeset
48
f7ebcfa91ab4 Uploaded makedb
p.lucas
parents:
diff changeset
49 <tests>
f7ebcfa91ab4 Uploaded makedb
p.lucas
parents:
diff changeset
50 <test>
f7ebcfa91ab4 Uploaded makedb
p.lucas
parents:
diff changeset
51 <param name="infile" value="db.fasta" ftype="fasta"/>
f7ebcfa91ab4 Uploaded makedb
p.lucas
parents:
diff changeset
52 <output name="outfile" value="db.dmnd" compare="sim_size" delta="2"/>
f7ebcfa91ab4 Uploaded makedb
p.lucas
parents:
diff changeset
53 </test>
f7ebcfa91ab4 Uploaded makedb
p.lucas
parents:
diff changeset
54 <test>
f7ebcfa91ab4 Uploaded makedb
p.lucas
parents:
diff changeset
55 <param name="infile" value="db.fasta" ftype="fasta"/>
f7ebcfa91ab4 Uploaded makedb
p.lucas
parents:
diff changeset
56 <conditional name="tax_cond">
f7ebcfa91ab4 Uploaded makedb
p.lucas
parents:
diff changeset
57 <param name="tax_select" value="yes"/>
f7ebcfa91ab4 Uploaded makedb
p.lucas
parents:
diff changeset
58 <param name="taxonmap" ftype="tabular" value="prot.accession2taxid" />
f7ebcfa91ab4 Uploaded makedb
p.lucas
parents:
diff changeset
59 <param name="taxonnodes" ftype="tabular" value="nodes.dmp" />
f7ebcfa91ab4 Uploaded makedb
p.lucas
parents:
diff changeset
60 <param name="taxonnames" ftype="tabular" value="names.dmp" />
f7ebcfa91ab4 Uploaded makedb
p.lucas
parents:
diff changeset
61 </conditional>
f7ebcfa91ab4 Uploaded makedb
p.lucas
parents:
diff changeset
62 <output name="outfile" value="db-wtax.dmnd" compare="sim_size" delta="2"/>
f7ebcfa91ab4 Uploaded makedb
p.lucas
parents:
diff changeset
63 </test>
f7ebcfa91ab4 Uploaded makedb
p.lucas
parents:
diff changeset
64 </tests>
f7ebcfa91ab4 Uploaded makedb
p.lucas
parents:
diff changeset
65
f7ebcfa91ab4 Uploaded makedb
p.lucas
parents:
diff changeset
66 <help>
f7ebcfa91ab4 Uploaded makedb
p.lucas
parents:
diff changeset
67 <![CDATA[
f7ebcfa91ab4 Uploaded makedb
p.lucas
parents:
diff changeset
68
f7ebcfa91ab4 Uploaded makedb
p.lucas
parents:
diff changeset
69 .. class:: infomark
f7ebcfa91ab4 Uploaded makedb
p.lucas
parents:
diff changeset
70
f7ebcfa91ab4 Uploaded makedb
p.lucas
parents:
diff changeset
71 **What it does**
f7ebcfa91ab4 Uploaded makedb
p.lucas
parents:
diff changeset
72
f7ebcfa91ab4 Uploaded makedb
p.lucas
parents:
diff changeset
73 DIAMOND_ is a new alignment tool for aligning short DNA sequencing reads to a protein reference database such as NCBI-NR.
f7ebcfa91ab4 Uploaded makedb
p.lucas
parents:
diff changeset
74 On Illumina reads of length 100-150bp, in fast mode, DIAMOND is about 20,000 times faster than BLASTX, while reporting
f7ebcfa91ab4 Uploaded makedb
p.lucas
parents:
diff changeset
75 about 80-90% of all matches that BLASTX finds, with an e-value of at most 1e-5. In sensitive mode, DIAMOND is about 2,500
f7ebcfa91ab4 Uploaded makedb
p.lucas
parents:
diff changeset
76 times faster than BLASTX, finding more than 94% of all matches.
f7ebcfa91ab4 Uploaded makedb
p.lucas
parents:
diff changeset
77
f7ebcfa91ab4 Uploaded makedb
p.lucas
parents:
diff changeset
78 .. _DIAMOND: http://ab.inf.uni-tuebingen.de/software/diamond/
f7ebcfa91ab4 Uploaded makedb
p.lucas
parents:
diff changeset
79
f7ebcfa91ab4 Uploaded makedb
p.lucas
parents:
diff changeset
80
f7ebcfa91ab4 Uploaded makedb
p.lucas
parents:
diff changeset
81 - taxonmap: Path to the mapping file that maps NCBI protein accession numbers to taxon ids (gzip compressed). This parameter is optional, but must be supplied to enable taxonomy features. The file can be downloaded from NCBI: ftp://ftp.ncbi.nlm.nih.gov/pub/taxonomy/accession2taxid/prot.accession2taxid.gz
f7ebcfa91ab4 Uploaded makedb
p.lucas
parents:
diff changeset
82
f7ebcfa91ab4 Uploaded makedb
p.lucas
parents:
diff changeset
83 - taxonnames: Path to the names.dmp file from the NCBI taxonomy. This parameter is optional, but must be supplied to enable taxonomy features. The file is contained in the following archive, downloadable from NCBI: ftp://ftp.ncbi.nlm.nih.gov/pub/taxonomy/taxdmp.zip
f7ebcfa91ab4 Uploaded makedb
p.lucas
parents:
diff changeset
84
f7ebcfa91ab4 Uploaded makedb
p.lucas
parents:
diff changeset
85 - taxonnodes: Path to the nodes.dmp file from the NCBI taxonomy. This parameter is optional, but must be supplied to enable taxonomy features. The file is contained in the following archive, downloadable from NCBI: ftp://ftp.ncbi.nlm.nih.gov/pub/taxonomy/taxdmp.zip
f7ebcfa91ab4 Uploaded makedb
p.lucas
parents:
diff changeset
86 ]]>
f7ebcfa91ab4 Uploaded makedb
p.lucas
parents:
diff changeset
87 </help>
f7ebcfa91ab4 Uploaded makedb
p.lucas
parents:
diff changeset
88
f7ebcfa91ab4 Uploaded makedb
p.lucas
parents:
diff changeset
89 <expand macro="citations" />
f7ebcfa91ab4 Uploaded makedb
p.lucas
parents:
diff changeset
90 </tool>