annotate diamond_makedb.xml @ 34:e8835c6844ac draft

Uploaded
author p.lucas
date Tue, 28 May 2024 14:33:09 +0000
parents be17909bcbf0
children
Ignore whitespace changes - Everywhere: Within whitespace: At end of lines:
rev   line source
23
be17909bcbf0 Uploaded
p.lucas
parents:
diff changeset
<tool id="pl_diamond_makedb" name="PL_Diamond makedb" version="@TOOL_VERSION@+galaxy@VERSION_SUFFIX@" profile="19.01">
    <description>Build database from a FASTA file</description>

    <!--
        The @TOOL_VERSION@ and @VERSION_SUFFIX@ tokens and the "stdio",
        "version_command" and "citations" macros expanded below are not defined
        in this file; they are expected to be provided by macros.xml.
    -->
    <macros>
        <import>macros.xml</import>
    </macros>

    <expand macro="stdio" />
    <expand macro="version_command" />

    <!--
        Runs "diamond makedb" on the selected FASTA dataset and writes the
        database under the prefix ./database.
        The thread count is taken from GALAXY_SLOTS and falls back to 12 when
        that variable is unset or empty.
        The three taxonomy options are appended only when the user picked
        "yes" for tax_cond.tax_select; in that case all three datasets are
        passed to diamond.
    -->
    <command detect_errors="aggressive">
        <!-- DB has two files, *.dmnd and *.tx -->
        <![CDATA[
        /usr/bin/diamond makedb
            --threads "\${GALAXY_SLOTS:-12}"
            --in '$infile'
            --db ./database

            #if str($tax_cond.tax_select) == 'yes':
                --taxonmap '$tax_cond.taxonmap'
                --taxonnodes '$tax_cond.taxonnodes'
                --taxonnames '$tax_cond.taxonnames'
            #end if
        ]]>
    </command>

    <inputs>
        <!-- Reference sequences the database is built from. -->
        <param name="infile" type="data" format="fasta" label="Input reference file in FASTA format" />

        <!--
            Taxonomy data is opt-in (default "no"). Choosing "yes" reveals three
            tabular dataset inputs, each of which is referenced by the command
            template above.
        -->
        <conditional name="tax_cond">
            <param name="tax_select" type="select" label="Add taxonomic data?" help="Needs to be supplied in order to provide taxonomy features of the aligner">
                <option value="yes">Yes</option>
                <option value="no" selected="true">No</option>
            </param>
            <when value="yes">
                <!-- The help text is kept on one physical line so no line break or indentation leaks into the attribute value. -->
                <param argument="--taxonmap" type="data" format="tabular"
                       label="Protein accession to taxid mapping file"
                       help="Path to mapping file that maps NCBI protein accession numbers to taxon ids (gzip compressed). This parameter is optional and needs to be supplied in order to provide taxonomy features. A custom file following the same format may be supplied here. Note that the first line of this file is assumed to contain headings and will be ignored" />
                <param argument="--taxonnodes" type="data" format="tabular" label="Taxonomy nodes.dmp from NCBI" help="This parameter is optional and needs to be supplied in order to provide taxonomy features" />
                <param argument="--taxonnames" type="data" format="tabular" label="Taxonomy names.dmp from NCBI" help="This parameter is optional and needs to be supplied in order to provide taxonomy features" />
            </when>
            <when value="no"/>
        </conditional>
    </inputs>

    <outputs>
        <!-- Only database.dmnd is collected from the working directory as the tool output. -->
        <data format="dmnd" name="outfile" from_work_dir="database.dmnd" label="${tool.name} on ${on_string}"/>
    </outputs>

    <tests>
        <!-- Plain database build; tax_select is left at its default ("no"). -->
        <test>
            <param name="infile" value="db.fasta" ftype="fasta"/>
            <output name="outfile" value="db.dmnd" compare="sim_size" delta="2"/>
        </test>
        <!-- Database build with all three taxonomy inputs supplied. -->
        <test>
            <param name="infile" value="db.fasta" ftype="fasta"/>
            <conditional name="tax_cond">
                <param name="tax_select" value="yes"/>
                <param name="taxonmap" ftype="tabular" value="prot.accession2taxid" />
                <param name="taxonnodes" ftype="tabular" value="nodes.dmp" />
                <param name="taxonnames" ftype="tabular" value="names.dmp" />
            </conditional>
            <output name="outfile" value="db-wtax.dmnd" compare="sim_size" delta="2"/>
        </test>
    </tests>

    <!-- The help body is reStructuredText; it is kept at column 0 because indentation is significant there. -->
    <help>
<![CDATA[

.. class:: infomark

**What it does**

DIAMOND_ is a new alignment tool for aligning short DNA sequencing reads to a protein reference database such as NCBI-NR.
On Illumina reads of length 100-150bp, in fast mode, DIAMOND is about 20,000 times faster than BLASTX, while reporting
about 80-90% of all matches that BLASTX finds, with an e-value of at most 1e-5. In sensitive mode, DIAMOND is about 2,500
times faster than BLASTX, finding more than 94% of all matches.

.. _DIAMOND: http://ab.inf.uni-tuebingen.de/software/diamond/


- taxonmap: Path to mapping file that maps NCBI protein accession numbers to taxon ids (gzip compressed). This parameter is optional and needs to be supplied in order to provide taxonomy features. The file can be downloaded from NCBI: ftp://ftp.ncbi.nlm.nih.gov/pub/taxonomy/accession2taxid/prot.accession2taxid.gz

- taxonnames: Path to the names.dmp file from the NCBI taxonomy. This parameter is optional and needs to be supplied in order to provide taxonomy features. The file is contained within this archive downloadable at NCBI: ftp://ftp.ncbi.nlm.nih.gov/pub/taxonomy/taxdmp.zip

- taxonnodes: Path to the nodes.dmp file from the NCBI taxonomy. This parameter is optional and needs to be supplied in order to provide taxonomy features. The file is contained within this archive downloadable at NCBI: ftp://ftp.ncbi.nlm.nih.gov/pub/taxonomy/taxdmp.zip
]]>
    </help>

    <expand macro="citations" />
</tool>