Repository 'khmer_filter_abundance'
hg clone https://toolshed.g2.bx.psu.edu/repos/iuc/khmer_filter_abundance

Changeset 7:8c6433857aa8 (2019-12-18)
Previous changeset 6:dbe616d126b1 (2018-09-07) Next changeset 8:97f65399e30d (2021-03-23)
Commit message:
"planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/khmer commit 7de685f4763d988a5a9abce4a9c2b4714daaf165"
modified:
filter-abund.xml
macros.xml
added:
test-data/test-abund-read-2.fa.gz
b
diff -r dbe616d126b1 -r 8c6433857aa8 filter-abund.xml
--- a/filter-abund.xml Fri Sep 07 10:58:52 2018 -0400
+++ b/filter-abund.xml Wed Dec 18 16:05:31 2019 -0500
[
@@ -1,4 +1,4 @@
-<tool id="khmer_filter_abundance" name="Filter reads" version="@WRAPPER_VERSION@.0">
+<tool id="khmer_filter_abundance" name="khmer: Filter reads" version="@WRAPPER_VERSION@@TOOL_VERSION@">
     <description>
         by minimal k-mer abundance
     </description>
@@ -10,40 +10,36 @@
     <expand macro="stdio" />
     <expand macro="version" />
     <command><![CDATA[
-set -xu &&
-#for $num, $input in enumerate($inputs)
-    ln -s ${input} filter-abund-sequence-${num} &&
-#end for
+set -u &&
+@LINK_SEQUENCES@
 mkdir output && cd output &&
 @BINARY@
 --cutoff=${cutoff}
 ${variable_coverage}
 @THREADS@
 ${input_countgraph_filename}
-../filter-abund-sequence*
+@USE_SEQUENCES@
 ]]>
     </command>
     <inputs>
         <expand macro="input_sequences_filenames" />
-        <param name="variable_coverage" type="boolean" checked="false" truevalue="--variable-coverage" falsevalue=""
+        <param argument="--variable-coverage" name="variable_coverage" type="boolean" checked="false" truevalue="--variable-coverage" falsevalue=""
             label="Variable coverage"
-            help="Only trim when a sequence has high enough coverage; median abundance > 20 (--variable_coverage)" />
-        <param name="cutoff" type="integer" value="2" label="Cutoff"
-            help="Trim at k-mers below this abundance. (--cutoff)" />
+            help="Only trim when a sequence has high enough coverage; median abundance > 20" />
+        <param argument="--cutoff" name="cutoff" type="integer" value="2" label="Cutoff"
+            help="Trim at k-mers below this abundance" />
         <expand macro="input_countgraph_filename" />
     </inputs>
     <outputs>
-        <collection name="filter-abund-sequences" type="list">
-            <discover_datasets pattern="__name__" directory="output" />
-        </collection>
+        <expand macro="output_sequences" extension="abundfilt"/>
     </outputs>
     <tests>
         <test>
             <param name="inputs" value="test-abund-read-2.fa" />
             <param name="input_countgraph_filename"
                 value="test-abund-read-2.oxlicg" ftype="oxlicg" />
-            <output_collection name="filter-abund-sequences" type="list">
-                <element name="filter-abund-sequence-0.abundfilt">
+            <output_collection name="sequences" type="list">
+                <element name="test-abund-read-2.fa">
                     <assert_contents>
                         <has_text text="GGTTGACGGGGCTCAGGG" />
                     </assert_contents>
@@ -55,8 +51,8 @@
             <param name="input_countgraph_filename"
                 value="test-abund-read-2.oxlicg" ftype="oxlicg" />
             <param name="cutoff" value="1" />
-            <output_collection name="filter-abund-sequences" type="list">
-                <element name="filter-abund-sequence-0.abundfilt">
+            <output_collection name="sequences" type="list">
+                <element name="test-abund-read-2.fa">
                     <assert_contents>
                         <has_text text="GGTTGACGGGGCTCAGGG" />
                     </assert_contents>
b
diff -r dbe616d126b1 -r 8c6433857aa8 macros.xml
--- a/macros.xml Fri Sep 07 10:58:52 2018 -0400
+++ b/macros.xml Wed Dec 18 16:05:31 2019 -0500
[
@@ -1,8 +1,10 @@
 <macros>
-    <token name="@WRAPPER_VERSION@">3.0.0a1</token>
+    <token name="@WRAPPER_VERSION@">3.0.0a3</token>
+    <token name="@TOOL_VERSION@">+galaxy1</token>
     <xml name="requirements">
         <requirements>
             <requirement type="package" version="@WRAPPER_VERSION@">khmer</requirement>
+            <yield/>
         </requirements>
     </xml>
     <xml name="version">
@@ -35,7 +37,7 @@
                 <option value="specific">Show</option>
             </param>
             <when value="simple">
-                <param name="tablesize" type="select" label="Sample Type" display="radio">
+                <param argument="" name="tablesize" type="select" label="Sample Type" display="radio">
                     <option value="1e9" selected="true">Microbial Genome</option>
                     <option value="2e9">Animal Transcriptome</option>
                     <option value="4e9">Small Animal Genome or Low-Diversity Metagenome</option>
@@ -43,15 +45,32 @@
                 </param>
             </when>
             <when value="specific">
-                <param name="ksize" type="integer" value="20" label="k-mer size" help="k-mer size to use" />
-                <param name="n_tables" type="integer" min="1" value="4" label="n_tables" help="number of tables to use" />
-                <param name="tablesize_specific" type="text" value="1000000.0"
+                <param argument="--ksize" name="ksize" type="integer" value="20" label="k-mer size" help="k-mer size to use" />
+                <param argument="--n_tables" name="n_tables" type="integer" min="1" value="4" label="n_tables" help="number of tables to use" />
+                <param argument="--max-tablesize" name="tablesize_specific" type="text" value="1000000.0"
                     label="tablesize" help="(--max-tablesize) upper bound on the tablesize to use" />
             </when>
         </conditional>
     </xml>
+    <token name="@LINK_SEQUENCES@">
+<![CDATA[
+#import re
+mkdir input/ &&
+#set gzip=""
+#for $num, $input in enumerate($inputs)
+    ln -s '${input}' 'input/$re.sub("[^\w\-_.]", "_", $input.element_identifier).$input.ext' &&
+    #if $input.ext.endswith(".gz"):
+        #set gzip="--gzip"
+    #end if
+#end for]]></token>
+    <token name="@USE_SEQUENCES@">
+<![CDATA[
+#for $num, $input in enumerate($inputs)
+    '../input/$re.sub("[^\w\-_.]", "_", $input.element_identifier).$input.ext'
+#end for]]></token>
+
     <xml name="input_sequences_filenames">
-        <param  name="inputs" multiple="true" type="data" format="fasta,fastq"
+        <param  name="inputs" multiple="true" type="data" format="fasta,fastq,fasta.gz,fastq.gz"
             label="Sequences in FASTA or FASTQ format"
             help="Put in order of precedence such as longest reads first." />
     </xml>
@@ -66,27 +85,26 @@
     </xml>
     <xml name="abundance-histogram-output">
         <data name="output_histogram_filename" format="txt"
-            label="${tool.name} k-mer abundance histogram. The
+            label="${tool.name} on ${on_string}: k-mer abundance histogram. The
                 columns are: (1) k-mer abundance, (2) k-mer count, (3)
                 cumulative count, (4) fraction of total distinct k-mers." />
     </xml>
-    <xml name="output_sequences">
-        <data name="output" format_source="inputs"
-            label="${tool.name} processed nucleotide sequence file">
-            <discover_datasets pattern="__designation_and_ext__" directory="output" visible="true"/>
-        </data>
+    <xml name="output_sequences" token_extension="">
+        <collection name="sequences" type="list">
+            <discover_datasets pattern="(?P&lt;name&gt;.*)\.(?P&lt;ext&gt;fast[aq](\.gz)?)\.@EXTENSION@" directory="output" />
+        </collection>
     </xml>
     <xml name="output_sequences_single">
         <data name="output" format_source="input_sequence_filename"
-            label="${tool.name} processed nucleotide sequence file" />
+            label="${tool.name} on ${on_string}: processed nucleotide sequence file" />
     </xml>
     <xml name="input_zero">
-        <param name="zero" type="boolean" truevalue="" falsevalue="--no-zero" checked="true"
-            help="Output zero count bins (--no-zero)" />
+        <param argument="--no-zero" name="zero" type="boolean" truevalue="" falsevalue="--no-zero" checked="true"
+            help="Output zero count bins" />
     </xml>
     <xml name="input_bigcount">
-        <param  name="bigcount" type="boolean" truevalue="" falsevalue="--no-bigcount"
-            checked="true" help="Count k-mers past 255 occurences (--no-bigcount)" />
+        <param  argument="--no-bigcount" name="bigcount" type="boolean" truevalue="" falsevalue="--no-bigcount"
+            checked="true" help="Count k-mers past 255 occurences" />
     </xml>
     <token name="@HELP_FOOTER@"><![CDATA[
 (from the khmer project: http://khmer.readthedocs.org/en/v2.0/ )]]></token>
b
diff -r dbe616d126b1 -r 8c6433857aa8 test-data/test-abund-read-2.fa.gz
b
Binary file test-data/test-abund-read-2.fa.gz has changed