Repository 'obi_stat'
hg clone https://toolshed.g2.bx.psu.edu/repos/iuc/obi_stat

Changeset 3:723a93febe89 (2021-05-10)
Previous changeset 2:39320fee9d70 (2019-11-28) Next changeset 4:5f4544915893 (2024-03-20)
Commit message:
"planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/obitools commit 5d3c7a7b3f7d687bb03ef7993ddf1a6507d655bd"
modified:
macros.xml
obistat.xml
test-data/output_ngsfilter_error_3.fastq
test-data/output_ngsfilter_unidentified.fastq
test-data/output_obisort.fastq
added:
test-data/illuminapairedend.output.fastq.gz
test-data/output_ngsfilter_error_3.fastq.gz
test-data/output_obiannotate.fasta.gz
test-data/output_obiclean_advanced.fasta.gz
test-data/output_obigrep_predicat.fasta.gz
test-data/output_obiuniq.fasta.gz
test-data/output_obiuniq_family.fasta.gz
test-data/wolf_small.F.fastq.gz
test-data/wolf_small.R.fastq.gz
b
diff -r 39320fee9d70 -r 723a93febe89 macros.xml
--- a/macros.xml Thu Nov 28 15:51:18 2019 -0500
+++ b/macros.xml Mon May 10 19:37:00 2021 +0000
[
@@ -6,7 +6,8 @@
         </requirements>
     </xml>
 
-    <token name="@TOOL_VERSION@">1.2.11</token>
+    <token name="@TOOL_VERSION@">1.2.13</token>
+    <token name="@PROFILE@">21.01</token>
 
     <xml name="stdio">
         <stdio>
@@ -14,6 +15,80 @@
         </stdio>
     </xml>
 
+    <token name="@INPUT_FORMATS@">fastqsanger,fastqsanger.gz,fastqsolexa,fastqsolexa.gz,fasta,fasta.gz</token>
+    <token name="@GUNZIP_INPUT@"><![CDATA[
+        #if $input.ext.endswith(".gz")
+            gunzip -c '$input' > input &&
+        #else
+            ln -s '$input' input &&
+        #end if
+    ]]></token>
+    <token name="@GZIP_OUTPUT@"><![CDATA[
+        #if $input.ext.endswith(".gz")
+        | gzip -c 
+    #end if
+    ]]></token>
+    
+    <!-- generate galaxy.json to determine output format
+        - by default same as input
+        - if out_format can be specified 
+          - fasta/fastq depending on $out_format (if != "")
+          - or fasta if the tool does not support choosing the output format, e.g. obiuniq which always outputs fasta
+        - gz if $input is zipped 
+    
+        A list of outputs to include in the json can be given by
+        setting a variable $outputs = [...] listing pairs of output names and the actual output
+        (defaults to [("output", $output)])
+    -->
+    <token name="@GENERATE_GALAXY_JSON@"><![CDATA[
+        #import json
+
+        #try:
+            #silent $outputs[0]
+        #except 
+            #set outputs = [("output", $output)]
+        #end try
+
+        #if $input.ext.startswith("fastq")
+            #set ext = "fastqsanger"
+        #else if $input.ext.startswith("fasta")
+            #set ext = "fasta"
+        #end if
+
+        #try
+            #if $out_format == "fasta"
+                #set ext = "fasta"
+            #else if $out_format == "fastq"
+                #set ext = "fastqsanger"
+            #end if
+        #except
+            #set ext = "fasta"
+        #end try
+
+        #if $input.ext.endswith(".gz")
+            #set ext = ext + ".gz"
+        #end if
+
+        #set gxy_json = {}
+        #for oname, o in $outputs
+            #silent gxy_json[oname] = {"ext": ext}
+        #end for
+        && echo '${json.dumps(gxy_json)}' >> galaxy.json
+    ]]></token>
+    
+    <token name="@OUT_FORMAT@"><![CDATA[
+        #if $out_format
+            --${out_format}-output
+        #end if
+    ]]></token>
+    
+    <xml name="out_format_macro">
+        <param name="out_format" type="select" optional="true" label="Output data type" help="For FASTA/Q the the default output type is the same as the input type">
+            <option value="fasta">fasta</option>
+            <option value="fastq">fastq</option>
+        </param>
+    </xml>
+
     <token name="@OBITOOLS_LINK@">
 <![CDATA[
 --------
@@ -105,15 +180,43 @@
         <option value="taxid">taxid</option>
     </xml>
 
-    <xml name="inputtype">
-        <option value="--genbank">genbank</option>
-        <option value="--embl">embl</option>
-        <option value="--sanger">sanger</option>
-        <option value="--solexa">solexa</option>
-        <option value="--ecopcr">ecopcr</option>
-        <option value="--ecopcrdb">ecopcrdb</option>
-        <option value="--fasta" selected="true">fasta</option>
+    <xml name="input_format_options_macro">
+        <section name="input_format_options" title="Input format options" expanded="false">
+            <param name="options_inputtype" type="select"  optional="true" label="Specify the input datatype" help="default: determine automatically (should only be necessay for non FASTA/FASTQ datasets)">
+                <option value="--genbank">genbank</option>
+                <option value="--embl">embl</option>
+                <option value="--sanger">sanger</option>
+                <option value="--solexa">solexa</option>
+                <option value="--ecopcr">ecopcr</option>
+                <option value="--ecopcrdb">ecopcrdb</option>
+                <option value="--fasta">fasta (including obitools fasta extentions)</option>
+                <option value="--raw-fasta">raw fasta (more tolerant format variant)</option>
+            </param>
+            <param name="options_seqtype" type="select" optional="true" label="Specify the sequence datatype" >
+                <option value="--nuc">nucleic</option>
+                <option value="--prot">protein</option>
+            </param>
+        </section>
     </xml>
+    
+    <token name="@INPUT_FORMAT@"><![CDATA[
+        #if $input_format_options.options_inputtype
+            $input_format_options.options_inputtype
+        #else
+            #if $input.ext.startswith("fasta")
+                --fasta
+            #else if $input.ext.startswith("fastqsolexa")
+                ## input file is in fastq nucleic format produced by solexa sequencer
+                --solexa
+            #else
+                ## input file is in sanger fastq nucleic format (standard fastq)
+                --sanger
+            #end if
+        #end if
+        #if $input_format_options.options_seqtype
+            $input_format_options.options_seqtype
+        #end if
+    ]]></token>
 
     <xml name="sanitizer">
         <sanitizer invalid_char="test">
b
diff -r 39320fee9d70 -r 723a93febe89 obistat.xml
--- a/obistat.xml Thu Nov 28 15:51:18 2019 -0500
+++ b/obistat.xml Mon May 10 19:37:00 2021 +0000
[
b'@@ -1,137 +1,147 @@\n-<tool id="obi_stat" name="obistat" version="@TOOL_VERSION@">\r\n-    <description>computes basic statistics for attribute values</description>\r\n-    <macros>\r\n-        <import>macros.xml</import>\r\n-    </macros>\r\n-    <expand macro="requirements"/>\r\n-    <expand macro="stdio"/>\r\n-\r\n-    <command>\r\n-\r\n-        <![CDATA[\r\n-\r\n-        obistat\r\n-        #for $attribute in $catattributes\r\n-            #if str( $attribute.options_attributespe.options_attributespe_selector) == "key"\r\n-                -c \'$attribute.options_attributespe.options_catattribute_selector\'\r\n-            #end if\r\n-            #if str( $attribute.options_attributespe.options_attributespe_selector) == "python"\r\n-                -c \'${attribute.options_attributespe.attribute}\'\r\n-            #end if\r\n-        #end for\r\n-\r\n-        #if str( $options_attribute.options_attributebe_selector) == "yes"\r\n-            #if str( $options_attribute.options_attribute_selector) == "min"\r\n-                -m \'$options_attribute.options_uniq_selector\'\r\n-            #end if\r\n-            #if str( $options_attribute.options_attribute_selector) == "max"\r\n-                -M \'$options_attribute.options_uniq_selector\'\r\n-            #end if\r\n-            #if str( $options_attribute.options_attribute_selector) == "mean"\r\n-                -a \'$options_attribute.options_uniq_selector\'\r\n-            #end if\r\n-            #if str( $options_attribute.options_attribute_selector) == "variance"\r\n-                -v \'$options_attribute.options_uniq_selector\'\r\n-            #end if\r\n-            #if str( $options_attribute.options_attribute_selector) == "std"\r\n-                -s \'$options_attribute.options_uniq_selector\'\r\n-            #end if\r\n-        #end if\r\n-\r\n-        \'$input\' > \'$output\'\r\n-\r\n-        ]]>\r\n-\r\n-\r\n-    </command>\r\n-\r\n-    <inputs>\r\n-        <param name="input" type="data" format="fasta,fastq" label="Input sequences file" />\r\n-\r\n-        <repeat name="catattributes" title="Category attribute" min="0">\r\n-            <conditional name="options_attributespe">\r\n-                <param name="options_attributespe_selector" type="select" label="How would you specify the category attribute key?" >\r\n-                    <option value="key" selected="true">simply by a key of an attribute</option>\r\n-                    <option value="python">by a python expression</option>\r\n-                </param>\r\n-                <when value="python">\r\n-                    <param name="attribute" type="text" label="Regular expression pattern matched against the attributes of the sequence record. the value of this attribute is of the form : key:regular_pattern. The pattern is case sensitive." >\r\n-                        <expand macro="sanitizer"/>\r\n-                    </param>\r\n-                </when>\r\n-                <when value="key">\r\n-                    <param name="options_catattribute_selector" type="select" label="Attribute used to categorize the sequence records" >\r\n-                        <expand macro="attributes"/>\r\n-                    </param>\r\n-                </when>\r\n-            </conditional>\r\n-        </repeat>\r\n-\r\n-        <conditional name="options_attribute">\r\n-            <param name="options_attributebe_selector" type="select" label="Use a specific option" >\r\n-                <option value="None" selected="true">no</option>\r\n-                <option value="yes">yes</option>\r\n-            </param>\r\n-            <when value="yes">\r\n-                <param name="options_attribute_selector" type="select" label="Select your specific option" >\r\n-                    <option value="min" selected="true">min</option>\r\n-                    <option value="max">max</option>\r\n-                    <option value="mean">mean</option>\r\n-                    <option value="variance">variance</option>\r\n-                    <option value="std">standard deviation</option>\r\n-                </param>\r\n-                <param name="options_uniq_selector" type="select" label="A'..b'peat>\n+        <conditional name="options_attribute">\n+            <param name="options_attributebe_selector" type="select" label="Use a specific option" >\n+                <option value="None" selected="true">no</option>\n+                <option value="yes">yes</option>\n+            </param>\n+            <when value="yes">\n+                <param name="options_attribute_selector" type="select" label="Select your specific option" >\n+                    <option value="min" selected="true">min</option>\n+                    <option value="max">max</option>\n+                    <option value="mean">mean</option>\n+                    <option value="variance">variance</option>\n+                    <option value="std">standard deviation</option>\n+                </param>\n+                <param name="options_uniq_selector" type="select" label="Attribute to merge" >\n+                    <expand macro="attributes"/>\n+                </param>\n+            </when>\n+            <when value="None"></when>\n+        </conditional>\n+        <expand macro="input_format_options_macro"/>\n+    </inputs>\n+    <outputs>\n+        <data format="txt" name="output"/>\n+    </outputs>\n+    <tests>\n+        <test>\n+            <param name="input" value="output_obiannotate.fasta" ftype="fasta"/>\n+            <conditional name="catattributes_0|options_attributespe">\n+                <param name="options_attributespe_selector" value="key"/>\n+                <param name="options_catattribute_selector" value="count" />\n+            </conditional>\n+            <conditional name="catattributes_1|options_attributespe">\n+                <param name="options_attributespe_selector" value="key"/>\n+                <param name="options_catattribute_selector" value="merged" />\n+            </conditional>\n+            <conditional name="options_attribute">\n+                <param name="options_attributebe_selector" value="yes"/>\n+                <param name="options_attribute_selector" value="min" />\n+                <param name="options_uniq_selector" value="seq_length" />\n+            </conditional>\n+            <output name="output" file="output_obistat.txt" ftype="txt" sort="True"/>\n+        </test>\n+        <test>\n+            <param name="input" value="output_obiannotate.fasta.gz" ftype="fasta.gz" />\n+            <conditional name="catattributes_0|options_attributespe">\n+                <param name="options_attributespe_selector" value="key"/>\n+                <param name="options_catattribute_selector" value="count" />\n+            </conditional>\n+            <conditional name="catattributes_1|options_attributespe">\n+                <param name="options_attributespe_selector" value="key"/>\n+                <param name="options_catattribute_selector" value="merged" />\n+            </conditional>\n+            <conditional name="options_attribute">\n+                <param name="options_attributebe_selector" value="yes"/>\n+                <param name="options_attribute_selector" value="min" />\n+                <param name="options_uniq_selector" value="seq_length" />\n+            </conditional>\n+            <output name="output" file="output_obistat.txt" ftype="txt" sort="True"/>\n+        </test>\n+    </tests>\n+    <help><![CDATA[\n+\n+.. class:: infomark\n+\n+**What it does**\n+\n+stats computes basic statistics for attribute values of sequence records. The sequence records can be categorized or not using one or several -c options. By default, only the number of sequence records and the total count are computed for each category. Additional statistics can be computed for attribute values in each category, like:\n+\n+\\*  minimum value (-m option)\n+\n+\\*  maximum value (-M option)\n+\n+\\*  mean value (-a option)\n+\n+\\*  variance (-v option)\n+\n+\\*  standard deviation (-s option)\n+\n+The result is a contingency table with the different categories in rows, and the computed statistics in columns.\n+\n+@OBITOOLS_LINK@\n+\n+        ]]>\n+    </help>\n+    <expand macro="citation" />\n+</tool>\n'
b
diff -r 39320fee9d70 -r 723a93febe89 test-data/illuminapairedend.output.fastq.gz
b
Binary file test-data/illuminapairedend.output.fastq.gz has changed
b
diff -r 39320fee9d70 -r 723a93febe89 test-data/output_ngsfilter_error_3.fastq
b
Binary file test-data/output_ngsfilter_error_3.fastq has changed
b
diff -r 39320fee9d70 -r 723a93febe89 test-data/output_ngsfilter_error_3.fastq.gz
b
Binary file test-data/output_ngsfilter_error_3.fastq.gz has changed
b
diff -r 39320fee9d70 -r 723a93febe89 test-data/output_ngsfilter_unidentified.fastq
b
Binary file test-data/output_ngsfilter_unidentified.fastq has changed
b
diff -r 39320fee9d70 -r 723a93febe89 test-data/output_obiannotate.fasta.gz
b
Binary file test-data/output_obiannotate.fasta.gz has changed
b
diff -r 39320fee9d70 -r 723a93febe89 test-data/output_obiclean_advanced.fasta.gz
b
Binary file test-data/output_obiclean_advanced.fasta.gz has changed
b
diff -r 39320fee9d70 -r 723a93febe89 test-data/output_obigrep_predicat.fasta.gz
b
Binary file test-data/output_obigrep_predicat.fasta.gz has changed
b
diff -r 39320fee9d70 -r 723a93febe89 test-data/output_obisort.fastq
--- a/test-data/output_obisort.fastq Thu Nov 28 15:51:18 2019 -0500
+++ b/test-data/output_obisort.fastq Mon May 10 19:37:00 2021 +0000
b
b"@@ -1,172 +1,232 @@\n->HELIUM_000100422_612GNAAXX:7:57:18459:16145#0/2_CONS_SUB_SUB_CMP count=64; merged_sample={'26a_F040644': 64}; obiclean_singletoncount=0; obiclean_internalcount=0; seq_length=99; obiclean_headcount=1; seq_rank=5; obiclean_samplecount=1; obiclean_status={'26a_F040644': 'h'}; obiclean_head=True; \n-ttagccctaaacataaacattcaataaacaagaatgttcgccagagtactactagcaaca\n-gcctgaaactcaaaggacttggcggtgctttacatccct\n->HELIUM_000100422_612GNAAXX:7:22:8540:14708#0/2_CONS_SUB_SUB count=61; merged_sample={'29a_F260619': 30, '15a_F730814': 31}; obiclean_singletoncount=0; obiclean_internalcount=0; seq_length=100; obiclean_headcount=2; seq_rank=4; obiclean_samplecount=2; obiclean_status={'29a_F260619': 'h', '15a_F730814': 'h'}; obiclean_head=True; \n-ttagccctaaacacaagtaattaatataacaaaattattcgccagagtactaccggcaat\n-agcttaaaactcaaaggacttggcggtgctttataccctt\n->HELIUM_000100422_612GNAAXX:7:6:9274:14951#0/2_CONS_SUB_SUB count=46; merged_sample={'13a_F730603': 46}; obiclean_singletoncount=0; obiclean_internalcount=0; seq_length=100; obiclean_headcount=1; seq_rank=8; obiclean_samplecount=1; obiclean_status={'13a_F730603': 'h'}; obiclean_head=True; \n-ctagccttaaacacaaatagttatgcaaacaaaactattcgccagagtactaccggcaat\n-agcttaaaactcaaaggacttggcggtgctttataccctt\n->HELIUM_000100422_612GNAAXX:7:13:5742:9859#0/2_CONS_SUB_SUB count=7; merged_sample={'29a_F260619': 7}; obiclean_singletoncount=1; obiclean_internalcount=0; seq_length=4; obiclean_headcount=0; seq_rank=16; obiclean_samplecount=1; obiclean_status={'29a_F260619': 's'}; obiclean_head=True; \n+@HELIUM_000100422_612GNAAXX:7:57:18459:16145#0/2_CONS_SUB_SUB_CMP count=64; merged_sample={'26a_F040644': 64}; obiclean_singletoncount=0; obiclean_internalcount=0; seq_length=99; obiclean_headcount=1; seq_rank=5; obiclean_samplecount=1; obiclean_status={'26a_F040644': 'h'}; obiclean_head=True; \n+ttagccctaaacataaacattcaataaacaagaatgttcgccagagtactactagcaacagcctgaaactcaaaggacttggcggtgctttacatccct\n++\n+IIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIII\n+@HELIUM_000100422_612GNAAXX:7:22:8540:14708#0/2_CONS_SUB_SUB count=61; merged_sample={'29a_F260619': 30, '15a_F730814': 31}; obiclean_singletoncount=0; obiclean_internalcount=0; seq_length=100; obiclean_headcount=2; seq_rank=4; obiclean_samplecount=2; obiclean_status={'29a_F260619': 'h', '15a_F730814': 'h'}; obiclean_head=True; \n+ttagccctaaacacaagtaattaatataacaaaattattcgccagagtactaccggcaatagcttaaaactcaaaggacttggcggtgctttataccctt\n++\n+IIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIII\n+@HELIUM_000100422_612GNAAXX:7:6:9274:14951#0/2_CONS_SUB_SUB count=46; merged_sample={'13a_F730603': 46}; obiclean_singletoncount=0; obiclean_internalcount=0; seq_length=100; obiclean_headcount=1; seq_rank=8; obiclean_samplecount=1; obiclean_status={'13a_F730603': 'h'}; obiclean_head=True; \n+ctagccttaaacacaaatagttatgcaaacaaaactattcgccagagtactaccggcaatagcttaaaactcaaaggacttggcggtgctttataccctt\n++\n+IIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIII\n+@HELIUM_000100422_612GNAAXX:7:13:5742:9859#0/2_CONS_SUB_SUB count=7; merged_sample={'29a_F260619': 7}; obiclean_singletoncount=1; obiclean_internalcount=0; seq_length=4; obiclean_headcount=0; seq_rank=16; obiclean_samplecount=1; obiclean_status={'29a_F260619': 's'}; obiclean_head=True; \n tttt\n->HELIUM_000100422_612GNAAXX:7:89:10281:5930#0/2_CONS_SUB_SUB_CMP count=3; merged_sample={'29a_F260619': 3}; obiclean_singletoncount=1; obiclean_internalcount=0; seq_length=100; obiclean_headcount=0; seq_rank=6; obiclean_samplecount=1; obiclean_status={'29a_F260619': 's'}; obiclean_head=True; \n-ttagccctaaacacaaataattacacaaacaaaattgttcaccagagtactagcggcaac\n-agcttaaaactcaaaggacttggcggtgctttataccctt\n->HELIUM_000100422_612GNAAXX:7:29:15520:18035#0/2_CONS_SUB_SUB count=2; merged_sample={'29a_F260619': 2}; obiclean_singletoncount=1; obiclean_internalcount=0; seq_length=100; obiclean_headcount=0; seq_rank=7; obiclean_sample"..b"M_000100422_612GNAAXX:7:10:9237:10532#0/2_CONS_SUB_SUB_CMP count=1; merged_sample={'29a_F260619': 1}; obiclean_singletoncount=0; obiclean_internalcount=1; seq_length=100; obiclean_headcount=0; seq_rank=51; obiclean_samplecount=1; obiclean_status={'29a_F260619': 'i'}; obiclean_head=False; \n+ttagccctaaacacaagtaattaatataacaaaataattcgccagagtactaccggcaatagcttaaaactcaaaggacttggcggtgctttataccctt\n++\n+IIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIII\n+@HELIUM_000100422_612GNAAXX:7:7:11998:4462#0/2_CONS_SUB_SUB count=1; merged_sample={'26a_F040644': 1}; obiclean_singletoncount=0; obiclean_internalcount=1; seq_length=99; obiclean_headcount=0; seq_rank=52; obiclean_samplecount=1; obiclean_status={'26a_F040644': 'i'}; obiclean_head=False; \n+ttagccctaaacataaacattcaataaacaagaatgttcgccagagtagtactagcaacagcctgaaactcaaaggacttggcggtgctttacatccct\n++\n+IIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIII\n+@HELIUM_000100422_612GNAAXX:7:111:18277:17779#0/2_CONS_SUB_SUB_CMP count=1; merged_sample={'26a_F040644': 1}; obiclean_singletoncount=1; obiclean_internalcount=0; seq_length=99; obiclean_headcount=0; seq_rank=53; obiclean_samplecount=1; obiclean_status={'26a_F040644': 's'}; obiclean_head=True; \n+ttagccctaaacatagataattttacaacaaaataattcgccagaggactactagcaatagcctgaaactcaaaggacttggcggtgctttacatccct\n++\n+IIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIII\n+@HELIUM_000100422_612GNAAXX:7:3:17077:6562#0/2_CONS_SUB_SUB_CMP count=1; merged_sample={'15a_F730814': 1}; obiclean_singletoncount=0; obiclean_internalcount=1; seq_length=100; obiclean_headcount=0; seq_rank=54; obiclean_samplecount=1; obiclean_status={'15a_F730814': 'i'}; obiclean_head=False; \n+ttagccctaaacacaagtaattaatataacaaaattattcgccagagtactgccggcaatagcttaaaactcaaaggacttggcggtgctttataccctt\n++\n+IIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIII\n+@HELIUM_000100422_612GNAAXX:7:19:4311:13343#0/2_CONS_SUB_SUB_CMP count=1; merged_sample={'26a_F040644': 1}; obiclean_singletoncount=0; obiclean_internalcount=1; seq_length=99; obiclean_headcount=0; seq_rank=55; obiclean_samplecount=1; obiclean_status={'26a_F040644': 'i'}; obiclean_head=False; \n+ttagccctaaacataaacattcaataaacaagaatgttcgccagagtactacgagcaacagcctgaaactcaaaggacttggcggtgctttacatccct\n++\n+IIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIII\n+@HELIUM_000100422_612GNAAXX:7:30:1800:7833#0/2_CONS_SUB_SUB count=1; merged_sample={'15a_F730814': 1}; obiclean_singletoncount=1; obiclean_internalcount=0; seq_length=100; obiclean_headcount=0; seq_rank=56; obiclean_samplecount=1; obiclean_status={'15a_F730814': 's'}; obiclean_head=True; \n+ttagccctaaacacaagacattaatataacgagattaatcgacagagtactaccggctatagcttaaaactcaaaggacttggcggtgctttataccctt\n++\n+IIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIII\n+@HELIUM_000100422_612GNAAXX:7:108:9222:18258#0/2_CONS_SUB_SUB count=1; merged_sample={'13a_F730603': 1}; obiclean_singletoncount=0; obiclean_internalcount=1; seq_length=100; obiclean_headcount=0; seq_rank=57; obiclean_samplecount=1; obiclean_status={'13a_F730603': 'i'}; obiclean_head=False; \n+ctagccttaaacacaaatagttatgcagacaaaactattcgccagagtactaccggcaatagcttaaaactcaaaggacttggcggtgctttataccctt\n++\n+IIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIII\n+@HELIUM_000100422_612GNAAXX:7:38:3005:20881#0/2_CONS_SUB_SUB_CMP count=1; merged_sample={'26a_F040644': 1}; obiclean_singletoncount=0; obiclean_internalcount=1; seq_length=99; obiclean_headcount=0; seq_rank=58; obiclean_samplecount=1; obiclean_status={'26a_F040644': 'i'}; obiclean_head=False; \n+ttagccctaaacatgaacattcaataaacaagaatgttcgccagagtactactagcaacagcctgaaactcaaaggacttggcggtgctttacatccct\n++\n+IIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIII\n"
b
diff -r 39320fee9d70 -r 723a93febe89 test-data/output_obiuniq.fasta.gz
b
Binary file test-data/output_obiuniq.fasta.gz has changed
b
diff -r 39320fee9d70 -r 723a93febe89 test-data/output_obiuniq_family.fasta.gz
b
Binary file test-data/output_obiuniq_family.fasta.gz has changed
b
diff -r 39320fee9d70 -r 723a93febe89 test-data/wolf_small.F.fastq.gz
b
Binary file test-data/wolf_small.F.fastq.gz has changed
b
diff -r 39320fee9d70 -r 723a93febe89 test-data/wolf_small.R.fastq.gz
b
Binary file test-data/wolf_small.R.fastq.gz has changed