Repository 'diamond'
hg clone https://toolshed.g2.bx.psu.edu/repos/bgruening/diamond

Changeset 1:df7738595640 (2017-02-06)
Previous changeset 0:98037ef3d2a9 (2015-02-08) Next changeset 2:fd14bf35c9fd (2017-02-06)
Commit message:
planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/diamond commit cc80b878817d052398db16574917900ebe15292e
modified:
diamond.xml
diamond_makedb.xml
repository_dependencies.xml
added:
macros.xml
test-data/db.dmnd
test-data/db.fasta
test-data/diamond_results.tabular
test-data/protein.fasta
removed:
tool_dependencies.xml
b
diff -r 98037ef3d2a9 -r df7738595640 diamond.xml
--- a/diamond.xml Sun Feb 08 10:05:26 2015 -0500
+++ b/diamond.xml Mon Feb 06 07:08:25 2017 -0500
[
b'@@ -1,8 +1,11 @@\n-<tool id="bg_diamond" name="Diamond" version="0.1.6.0">\n+<tool id="bg_diamond" name="Diamond" version="@VERSION@">\n     <description>alignment tool for short sequences against a protein database</description>\n-    <requirements>\n-        <requirement type="package" version="0.6.13">diamond</requirement>\n-    </requirements>\n+    <macros>\n+        <import>macros.xml</import>\n+    </macros>\n+    <expand macro="requirements" />\n+    <expand macro="stdio" />\n+    <expand macro="version_command" />\n     <command>\n <![CDATA[\n \n@@ -15,41 +18,57 @@\n     &&\n \n     diamond\n-        $method.method_select\n+        $method_select\n         --threads "\\${GALAXY_SLOTS:-12}"\n         --db ./database\n-        --query $query\n-        --out $blast_output\n-        ##--sam $sam_output\n-        --compress 0\n-        --tmpdir ./\n+        --query \'$query\'\n+        --query-gencode \'$query_gencode\'\n+\n+        #if $output.outfmt == "5"\n+            --outfmt \'5\'\n+            --out \'$blast_xml\'\n+            $output.salltitles\n+        #else if $output.outfmt == "6"\n+            --outfmt \'6\' #echo \' \'.join(str($output.fields).split(\',\'))\n+            --out \'$blast_tabular\'\n+        #else if $output.outfmt == "101"\n+            --outfmt \'101\'\n+            --out \'$sam_output\'\n+            $output.salltitles\n+        #end if\n+\n+        --compress \'0\'\n+        $sensitive\n+        $more_sensitive\n+        --gapopen \'$gapopen\'\n+        --gapextend \'$gapextend\'\n+        --matrix \'$matrix\'\n+        --seg \'$seg\'\n \n         #if str($hit_filter.hit_filter_select) == \'max\':\n-            --max-target-seqs $hit_filter.max\n+            --max-target-seqs \'$hit_filter.max_target_seqs\'\n         #else:\n-            --top $hit_filter.percentage\n+            --top \'$hit_filter.top\'\n         #end if\n \n         #if str($filter_score.filter_score_select) == \'evalue\':\n-            --evalue $filter_score.evalue\n+            --evalue \'$filter_score.evalue\'\n         #else:\n-            --evalue $filter_score.bitscore\n+            --min-score \'$filter_score.min_score\'\n         #end if\n \n-        --id $identity\n-        $sensitive\n-        --gapopen $method.gapopen\n-        --gapextend $method.gapextend\n-        --matrix $matrix\n-        $seg\n-        $salltitles\n-\n+        --id \'$id\'\n+        --query-cover \'$query_cover\'\n+        --block-size \'$block_size\'\n ]]>\n     </command>\n+\n     <inputs>\n-\n-        <param name="query" type="data" format="fasta" label="Input query file in FASTA format" />\n-\n+        <param name="method_select" type="select" label="What do you want to align?" help="(--blastp/--blastx)">\n+            <option value="blastp">Align amino acid query sequences (blastp)</option>\n+            <option value="blastx">Align DNA query sequences (blastx)</option>\n+        </param>\n+        <param argument="--query" type="data" format="fasta,fastq" label="Input query file in FASTA or FASTQ format" />\n         <conditional name="ref_db_source">\n           <param name="db_source" type="select" label="Will you select a reference genome from your history or use a built-in index?" help="Built-ins were indexed using default options">\n             <option value="indexed">Use a built-in index</option>\n@@ -62,90 +81,160 @@\n                 <validator type="no_options" message="No indexes are available for the selected input dataset"/>\n               </options>\n             </param>\n-          </when>  <!-- build-in -->\n+          </when>\n           <when value="history">\n-            <param name="reference_database" type="data" format="diamond_database" label="Select the reference database" />\n-          </when>  <!-- history -->\n+            <param name="reference_database" type="data" format="dmnd" label="Select the reference database" />\n+          </when>\n         </conditional>\n-\n-        <conditional name="method">\n-            <param name="method_select" type="select" label="What do you want to align" help="(--blastp/--blastx)">\n-                <option value="bl'..b'         label="Enable SEG masking of queries" help="(--seg)"/>\n-        <param name="sensitive" type="boolean" truevalue="--sensitive" falsevalue="" checked="false"\n-            label="Enable sensitive mode" help="(--sensitive)"/>\n-    </inputs>\n     <outputs>\n-        <!--data format="sam" name="sam_output"/-->\n-        <data format="tabular" name="blast_output"/>\n+        <data format="xml" name="blast_xml" label="${tool.name} on ${on_string}">\n+            <filter>output["outfmt"] == "5"</filter>\n+        </data>\n+        <data format="tabular" name="blast_tabular" label="${tool.name} on ${on_string}">\n+            <filter>output["outfmt"] == "6"</filter>\n+        </data>\n+        <data format="sam" name="sam_output" label="${tool.name} on ${on_string}">\n+            <filter>output["outfmt"] == "101"</filter>\n+        </data>\n     </outputs>\n+\n     <tests>\n         <test>\n-            <param name="method" value="blastp"/>\n+            <param name="method_select" value="blastp" />\n             <param name="query" value="protein.fasta" ftype="fasta"/>\n-            <param name="reference_database" value="diamond_makedb_result1.dmnd" ftype="diamond_database"/>\n             <param name="db_source" value="history"/>\n-            <output name="blast_output" file="diamond_result1.tabular" ftpye="tabular"/>\n+            <param name="reference_database" value="db.dmnd"/>\n+            <param name="query_gencode" value="1"/>\n+            <param name="outfmt" value="6"/>\n+            <param name="fields" value="qseqid,sseqid,pident,length,mismatch,gapopen,qstart,qend,sstart,send,evalue,bitscore"/>\n+            <param name="sensitive" value=""/>\n+            <param name="more_sensitive" value=""/>\n+            <param name="gapopen" value="11"/>\n+            <param name="gapextend" value="1"/>\n+            <param name="matrix" value="BLOSUM62"/>\n+            <param name="seg" value="yes"/>\n+            <param name="hit_filter_select" value="max"/>\n+            <param name="max_target_seqs" value="25" />\n+            <param name="filter_score_select" value="evalue"/>\n+            <param name="evalue" value="0.001" />\n+            <param name="id" value="0"/>\n+            <param name="query_cover" value="0"/>\n+            <param name="block_size" value="2"/>\n+            <output name="blast_tabular" file="diamond_results.tabular"/>\n         </test>\n     </tests>\n+\n     <help>\n <![CDATA[\n \n-.. class:: infomark\n-\n **What it does**\n \n DIAMOND_ is a new alignment tool for aligning short DNA sequencing reads to a protein reference database such as NCBI-NR.\n@@ -153,8 +242,33 @@\n about 80-90% of all matches that BLASTX finds, with an e-value of at most 1e-5. In sensitive mode, DIAMOND ist about 2,500\n times faster than BLASTX, finding more than 94% of all matches.\n \n+The DIAMOND algorithm is designed for the alignment of large datasets. The algorithm is not efficient for a small number of query sequences or only a single one of them, and speed will be low. BLAST is recommend for small datasets.\n+\n .. _DIAMOND: http://ab.inf.uni-tuebingen.de/software/diamond/\n \n+**Input**\n+\n+Input data is a large protein or nucleotide sequence file.\n+\n+\n+**Output**\n+\n+Diamond gives you a tabular output file with 12 columns:\n+\n+Column \tDescription\n+1 \t    Query Seq-id (ID of your sequence)\n+2 \t    Subject Seq-id (ID of the database hit)\n+3 \t    Percentage of identical matches\n+4 \t    Alignment length\n+5 \t    Number of mismatches\n+6 \t    Number of gap openings\n+7 \t    Start of alignment in query\n+8 \t    End of alignment in query\n+9 \t    Start of alignment in subject (database hit)\n+10 \t    End of alignment in subject (database hit)\n+11 \t    Expectation value (E-value)\n+12 \t    Bit score\n+\n \n Supported values for gap open and gap extend parameters depending on the selected scoring matrix.\n \n@@ -174,7 +288,5 @@\n \n ]]>\n     </help>\n-    <citations>\n-        <citation type="doi">10.1038/nmeth.3176</citation>\n-    </citations>\n+    <expand macro="citations" />\n </tool>\n'
b
diff -r 98037ef3d2a9 -r df7738595640 diamond_makedb.xml
--- a/diamond_makedb.xml Sun Feb 08 10:05:26 2015 -0500
+++ b/diamond_makedb.xml Mon Feb 06 07:08:25 2017 -0500
[
@@ -1,32 +1,38 @@
-<tool id="bg_diamond_makedb" name="Diamond makedb" version="0.6.13">
+<tool id="bg_diamond_makedb" name="Diamond makedb" version="@VERSION@">
     <description>Build database from a FASTA file</description>
-    <requirements>
-        <requirement type="package" version="0.6.13">diamond</requirement>
-    </requirements>
+    <macros>
+        <import>macros.xml</import>
+    </macros>
+
+    <expand macro="requirements" />
+    <expand macro="stdio" />
+    <expand macro="version_command" />
+
     <command>
     <!-- DB has two files, *.dmnd and *.tx -->
 <![CDATA[
-    diamond makedb 
+    diamond makedb
         --threads "\${GALAXY_SLOTS:-12}"
-        --in $infile
+        --in '$infile'
         --db ./database
-    &&
-    mv ./database.dmnd $outfile
 ]]>
     </command>
+
     <inputs>
         <param name="infile" type="data" format="fasta" label="Input reference file in FASTA format" />
     </inputs>
 
     <outputs>
-        <data format="diamond_database" name="outfile" label="Diamond database ${on_string}"/>
+        <data format="dmnd" name="outfile" from_work_dir="database.dmnd" label="${tool.name} on ${on_string}"/>
     </outputs>
+
     <tests>
         <test>
-            <param name="infile" value="protein.fasta" ftype="fasta"/>
-            <output name="outfile" file="diamond_makedb_result1.dmnd" ftpye="diamond_database"/>
+            <param name="infile" value="db.fasta" ftype="fasta"/>
+            <output name="outfile" value="db.dmnd"/>
         </test>
     </tests>
+
     <help>
 <![CDATA[
 
@@ -36,7 +42,7 @@
 
 DIAMOND_ is a new alignment tool for aligning short DNA sequencing reads to a protein reference database such as NCBI-NR.
 On Illumina reads of length 100-150bp, in fast mode, DIAMOND is about 20,000 times faster than BLASTX, while reporting
-about 80-90% of all matches that BLASTX finds, with an e-value of at most 1e-5. In sensitive mode, DIAMOND ist about 2,500
+about 80-90% of all matches that BLASTX finds, with an e-value of at most 1e-5. In sensitive mode, DIAMOND is about 2,500
 times faster than BLASTX, finding more than 94% of all matches.
 
 .. _DIAMOND: http://ab.inf.uni-tuebingen.de/software/diamond/
@@ -44,7 +50,6 @@
 
 ]]>
     </help>
-    <citations>
-        <citation type="doi">10.1038/nmeth.3176</citation>
-    </citations>
+
+    <expand macro="citations" />
 </tool>
b
diff -r 98037ef3d2a9 -r df7738595640 macros.xml
--- /dev/null Thu Jan 01 00:00:00 1970 +0000
+++ b/macros.xml Mon Feb 06 07:08:25 2017 -0500
b
@@ -0,0 +1,24 @@
+<macros>
+    <token name="@VERSION@">0.8.24</token>
+
+    <xml name="requirements">
+        <requirements>
+          <requirement type="package" version="@VERSION@">diamond</requirement>
+        </requirements>
+    </xml>
+
+    <xml name="stdio">
+        <stdio>
+        </stdio>
+    </xml>
+
+    <xml name="version_command">
+        <version_command>diamond version</version_command>
+    </xml>
+
+    <xml name="citations">
+        <citations>
+            <citation type="doi">10.1038/nmeth.3176</citation>
+        </citations>
+    </xml>
+</macros>
b
diff -r 98037ef3d2a9 -r df7738595640 repository_dependencies.xml
--- a/repository_dependencies.xml Sun Feb 08 10:05:26 2015 -0500
+++ b/repository_dependencies.xml Mon Feb 06 07:08:25 2017 -0500
b
@@ -1,4 +1,4 @@
 <?xml version="1.0"?>
 <repositories description="This requires the Diamond data manager.">
-  <repository changeset_revision="ce62d0912b10" name="data_manager_diamond_database_builder" owner="bgruening" toolshed="https://toolshed.g2.bx.psu.edu" />
+    <repository changeset_revision="ce62d0912b10" name="data_manager_diamond_database_builder" owner="bgruening" toolshed="https://toolshed.g2.bx.psu.edu" />
 </repositories>
b
diff -r 98037ef3d2a9 -r df7738595640 test-data/db.dmnd
b
Binary file test-data/db.dmnd has changed
b
diff -r 98037ef3d2a9 -r df7738595640 test-data/db.fasta
--- /dev/null Thu Jan 01 00:00:00 1970 +0000
+++ b/test-data/db.fasta Mon Feb 06 07:08:25 2017 -0500
[
@@ -0,0 +1,6 @@
+>gi|5524211|gb|AAD44166.1| cytochrome b [Elephas maximus maximus]
+LCLYTHIGRNIYYGSYLYSETWNTGIMLLLITMATAFMGYVLPWGQMSFWGATVITNLFSAIPYIGTNLV
+EWIWGGFSVDKATLNRFFAFHFILPFTMVALAGVHLTFLHETGSNNPLGLTSDSDKIPFHPYYTIKDFLG
+LLILILLLLLLALLSPDMLGDPDNHMPADPLNTPLHIKPEWYFLFAYAILRSVPNKLGGVLALFLSIVIL
+GLMPFLHTSKHRSMMLRPLSQALFWTLTMDLLTLTWIGSQPVEYPYTIIGQMASILYFSIILAFLPIAGX
+IENY
b
diff -r 98037ef3d2a9 -r df7738595640 test-data/diamond_results.tabular
--- /dev/null Thu Jan 01 00:00:00 1970 +0000
+++ b/test-data/diamond_results.tabular Mon Feb 06 07:08:25 2017 -0500
b
@@ -0,0 +1,1 @@
+sequence gi|5524211|gb|AAD44166.1| 90.5 284 26 1 1 283 1 284 1.0e-152 521.2
b
diff -r 98037ef3d2a9 -r df7738595640 test-data/protein.fasta
--- /dev/null Thu Jan 01 00:00:00 1970 +0000
+++ b/test-data/protein.fasta Mon Feb 06 07:08:25 2017 -0500
b
@@ -0,0 +1,6 @@
+>sequence
+LCLYTHIGRNIYYGSYLYSETWNTGIMLLLITMATAFMGYVLPWGQMSFWGATVITNLFSAIPYIGTNLV
+EWIWGGFSVDKATLNRFFAFHFILFTMVALAGVHLTFLHETGSNNPLGLTSDSDKIPFHPYYTIKDFLG
+LLILILLLLLLALLSPDMLGDPDNHMPADPLNTPLHIKPEWYFLFAYAILRSVPNKLGGVLALFLSIVIL
+GLMPFLHTSKHRSMMLRPLSQALFWTLTMDLLTLTWIGSQPVEYPYTIIGQMASILYFSIILAFLPIAGX
+IENY
b
diff -r 98037ef3d2a9 -r df7738595640 tool_dependencies.xml
--- a/tool_dependencies.xml Sun Feb 08 10:05:26 2015 -0500
+++ /dev/null Thu Jan 01 00:00:00 1970 +0000
b
@@ -1,6 +0,0 @@
-<?xml version="1.0"?>
-<tool_dependency>
-  <package name="diamond" version="0.6.13">
-      <repository changeset_revision="47c4dfd5aed5" name="package_diamond_0_6_13" owner="iuc" toolshed="https://toolshed.g2.bx.psu.edu" />
-    </package>
-</tool_dependency>