Repository 'obi_annotate'
hg clone https://toolshed.g2.bx.psu.edu/repos/iuc/obi_annotate

Changeset 3:f82cefbbcea5 (2021-05-10)
Previous changeset 2:3021b9f5809f (2019-11-28) Next changeset 4:d50dc96e3ce9 (2024-03-20)
Commit message:
"planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/obitools commit 5d3c7a7b3f7d687bb03ef7993ddf1a6507d655bd"
modified:
macros.xml
obiannotate.xml
test-data/output_ngsfilter_error_3.fastq
test-data/output_ngsfilter_unidentified.fastq
test-data/output_obisort.fastq
added:
test-data/illuminapairedend.output.fastq.gz
test-data/output_ngsfilter_error_3.fastq.gz
test-data/output_obiannotate.fasta.gz
test-data/output_obiclean_advanced.fasta.gz
test-data/output_obigrep_predicat.fasta.gz
test-data/output_obiuniq.fasta.gz
test-data/output_obiuniq_family.fasta.gz
test-data/wolf_small.F.fastq.gz
test-data/wolf_small.R.fastq.gz
b
diff -r 3021b9f5809f -r f82cefbbcea5 macros.xml
--- a/macros.xml Thu Nov 28 15:50:43 2019 -0500
+++ b/macros.xml Mon May 10 19:37:25 2021 +0000
[
@@ -6,7 +6,8 @@
         </requirements>
     </xml>
 
-    <token name="@TOOL_VERSION@">1.2.11</token>
+    <token name="@TOOL_VERSION@">1.2.13</token>
+    <token name="@PROFILE@">21.01</token>
 
     <xml name="stdio">
         <stdio>
@@ -14,6 +15,80 @@
         </stdio>
     </xml>
 
+    <token name="@INPUT_FORMATS@">fastqsanger,fastqsanger.gz,fastqsolexa,fastqsolexa.gz,fasta,fasta.gz</token>
+    <token name="@GUNZIP_INPUT@"><![CDATA[
+        #if $input.ext.endswith(".gz")
+            gunzip -c '$input' > input &&
+        #else
+            ln -s '$input' input &&
+        #end if
+    ]]></token>
+    <token name="@GZIP_OUTPUT@"><![CDATA[
+        #if $input.ext.endswith(".gz")
+        | gzip -c 
+    #end if
+    ]]></token>
+    
+    <!-- generate galaxy.json to determine output format
+        - by default same as input
+        - if out_format can be specified 
+          - fasta/fastq depending on $out_format (if != "")
+          - or fasta if the tool does not support choosing the output format, e.g. obiuniq which always outputs fasta
+        - gz if $input is zipped 
+    
+        A list of outputs to include in the json can be given by
+        setting a variable $outputs = [...] listing pairs of output names and the actual output
+        (defaults to [("output", $output)])
+    -->
+    <token name="@GENERATE_GALAXY_JSON@"><![CDATA[
+        #import json
+
+        #try:
+            #silent $outputs[0]
+        #except 
+            #set outputs = [("output", $output)]
+        #end try
+
+        #if $input.ext.startswith("fastq")
+            #set ext = "fastqsanger"
+        #else if $input.ext.startswith("fasta")
+            #set ext = "fasta"
+        #end if
+
+        #try
+            #if $out_format == "fasta"
+                #set ext = "fasta"
+            #else if $out_format == "fastq"
+                #set ext = "fastqsanger"
+            #end if
+        #except
+            #set ext = "fasta"
+        #end try
+
+        #if $input.ext.endswith(".gz")
+            #set ext = ext + ".gz"
+        #end if
+
+        #set gxy_json = {}
+        #for oname, o in $outputs
+            #silent gxy_json[oname] = {"ext": ext}
+        #end for
+        && echo '${json.dumps(gxy_json)}' >> galaxy.json
+    ]]></token>
+    
+    <token name="@OUT_FORMAT@"><![CDATA[
+        #if $out_format
+            --${out_format}-output
+        #end if
+    ]]></token>
+    
+    <xml name="out_format_macro">
+        <param name="out_format" type="select" optional="true" label="Output data type" help="For FASTA/Q the the default output type is the same as the input type">
+            <option value="fasta">fasta</option>
+            <option value="fastq">fastq</option>
+        </param>
+    </xml>
+
     <token name="@OBITOOLS_LINK@">
 <![CDATA[
 --------
@@ -105,15 +180,43 @@
         <option value="taxid">taxid</option>
     </xml>
 
-    <xml name="inputtype">
-        <option value="--genbank">genbank</option>
-        <option value="--embl">embl</option>
-        <option value="--sanger">sanger</option>
-        <option value="--solexa">solexa</option>
-        <option value="--ecopcr">ecopcr</option>
-        <option value="--ecopcrdb">ecopcrdb</option>
-        <option value="--fasta" selected="true">fasta</option>
+    <xml name="input_format_options_macro">
+        <section name="input_format_options" title="Input format options" expanded="false">
+            <param name="options_inputtype" type="select"  optional="true" label="Specify the input datatype" help="default: determine automatically (should only be necessay for non FASTA/FASTQ datasets)">
+                <option value="--genbank">genbank</option>
+                <option value="--embl">embl</option>
+                <option value="--sanger">sanger</option>
+                <option value="--solexa">solexa</option>
+                <option value="--ecopcr">ecopcr</option>
+                <option value="--ecopcrdb">ecopcrdb</option>
+                <option value="--fasta">fasta (including obitools fasta extentions)</option>
+                <option value="--raw-fasta">raw fasta (more tolerant format variant)</option>
+            </param>
+            <param name="options_seqtype" type="select" optional="true" label="Specify the sequence datatype" >
+                <option value="--nuc">nucleic</option>
+                <option value="--prot">protein</option>
+            </param>
+        </section>
     </xml>
+    
+    <token name="@INPUT_FORMAT@"><![CDATA[
+        #if $input_format_options.options_inputtype
+            $input_format_options.options_inputtype
+        #else
+            #if $input.ext.startswith("fasta")
+                --fasta
+            #else if $input.ext.startswith("fastqsolexa")
+                ## input file is in fastq nucleic format produced by solexa sequencer
+                --solexa
+            #else
+                ## input file is in sanger fastq nucleic format (standard fastq)
+                --sanger
+            #end if
+        #end if
+        #if $input_format_options.options_seqtype
+            $input_format_options.options_seqtype
+        #end if
+    ]]></token>
 
     <xml name="sanitizer">
         <sanitizer invalid_char="test">
b
diff -r 3021b9f5809f -r f82cefbbcea5 obiannotate.xml
--- a/obiannotate.xml Thu Nov 28 15:50:43 2019 -0500
+++ b/obiannotate.xml Mon May 10 19:37:25 2021 +0000
[
b'@@ -1,158 +1,175 @@\n-<tool id="obi_annotate" name="obiannotate" version="@TOOL_VERSION@">\r\n-    <description>Adds/Edits sequence record annotations</description>\r\n-    <macros>\r\n-        <import>macros.xml</import>\r\n-    </macros>\r\n-    <expand macro="requirements"/>\r\n-    <expand macro="stdio"/>\r\n-    <command>\r\n-\r\n-        <![CDATA[\r\n-        obiannotate\r\n-        ${seqrank}\r\n-\r\n-        #if $rename_tag.old_name and $rename_tag.new_name\r\n-            -R \'$rename_tag.old_name\':\'$rename_tag.new_name\'\r\n-        #end if\r\n-\r\n-        #if $deletetag_key\r\n-            --delete-tag=\'$deletetag_key\'\r\n-        #end if\r\n-\r\n-        #if $set_tag.key and $set_tag.pythonexpression\r\n-            -S \'$set_tag.key\':\'$set_tag.pythonexpression\'\r\n-        #end if\r\n-\r\n-        #if $taglist\r\n-            --tag-list=\'$taglist\'\r\n-        #end if\r\n-\r\n-        #if $setid_pythonexpression\r\n-            --set-identifier=\'$setid_pythonexpression\'\r\n-        #end if\r\n-\r\n-        #if $pythonexpression\r\n-            --run=\'$pythonexpression\'\r\n-        #end if\r\n-\r\n-        #if $setsequence_pythonexpression\r\n-            --set-sequence=\'$setsequence_pythonexpression\'\r\n-        #end if\r\n-\r\n-        #if $setdefinition_pythonexpression\r\n-            --set-definition=\'$setdefinition_pythonexpression\'\r\n-        #end if\r\n-\r\n-        #if $key_selector.key\r\n-            --keep=\'$key_selector.key\'\r\n-        #end if\r\n-        #if $key_selector.key2\r\n-            --keep=\'$key_selector.key2\'\r\n-        #end if\r\n-        #if $key_selector.key3\r\n-            --keep=\'$key_selector.key3\'\r\n-        #end if\r\n-        #if $key_selector.key4\r\n-            --keep=\'$key_selector.key4\'\r\n-        #end if\r\n-        #if $key_selector.key5\r\n-            --keep=\'$key_selector.key5\'\r\n-        #end if\r\n-\r\n-        ${length}\r\n-        ${clearbool}\r\n-        ${uniqid}\r\n-\r\n-        #if $rankname\r\n-            --with-taxon-at-rank=\'$rankname\'\r\n-        #end if\r\n-\r\n-        #if $mclfile\r\n-            --mcl=\'$mclfile\'\r\n-        #end if\r\n-\r\n-        \'$inputseq\' > \'$output\'\r\n-        ]]>\r\n-\r\n-    </command>\r\n-\r\n-    <inputs>\r\n-        <param name="inputseq" type="data" format="fastq,fasta" label="Input sequences file" />\r\n-        <param name="seqrank" type="boolean" label="Add a new attribute seq_rank" truevalue="--seq-rank" falsevalue="" help="Use this option if you want to add a new attribute named seq_rank to the sequence record indicating its entry number in the sequence file" />\r\n-        <section name="rename_tag" title="Rename attribute" expanded="False">\r\n-            <param name="old_name" type="text" label="old name" optional="true"/>\r\n-            <param name="new_name" type="text" label="new name" optional="true"/>\r\n-        </section>\r\n-        <param name="deletetag_key" type="text" label="Delete attribute" optional="true" help="Use this option if you want to delete attribute named ATTRIBUTE_NAME.When this attribute is missing, the sequence record is skipped and the next one is examined"/>\r\n-\r\n-        <section name="set_tag" title="Create a new attribute" expanded="False">\r\n-            <param name="key" type="text" label="key" optional="true"/>\r\n-            <param name="pythonexpression" type="text" label="python expression" optional="true"/>\r\n-        </section>\r\n-\r\n-        <param name="taglist" type="data" optional="true" format="txt,tabular" label="Use a tag list" help="file containing identifiers of sequences to select" />\r\n-\r\n-        <param name="setid_pythonexpression" type="text" label="Set sequence record identifier with a value" help="Use this option if you want to set sequence record identifier with a value computed from PYTHON_EXPRESSION" />\r\n-\r\n-        <param name="pythonexpression" type="text" label="Run a PYTHON_EXPRESSION on each selected sequence" optional="true" help="Use this option if you want to run a PYTHON_EXPRESSION on each selected sequence"/>\r\n-\r\n-        <param name="setsequence_pythonexpression" type="text" label="Change the sequence itself with a v'..b'thonexpression" type="text" label="Change the sequence itself with a value" help="Use this option if you want to change the sequence itself with a value computed from PYTHON_EXPRESSION"/>\n+\n+        <param name="setdefinition_pythonexpression" type="text" label="Set sequence definition with a value computed" help="Use this option if you want to set sequence definition with a value computed from PYTHON_EXPRESSION"/>\n+\n+        <param name="clearbool" type="boolean" label="Clear all attributes associated to the sequence records" truevalue="--clear" falsevalue="" help="Use this option if you want to clear all attributes associated to the sequence records" />\n+\n+        <section name="key_selector" title="Keep only attribute with key" expanded="False">\n+            <param name="key" type="text" label="key" optional="true" />\n+            <param name="key2" type="text" label="if you want to specify a second key" optional="true" />\n+            <param name="key3" type="text" label="if you want to specify a third key" optional="true" />\n+            <param name="key4" type="text" label="if you want to specify a fourth key" optional="true" />\n+            <param name="key5" type="text" label="if you want to specify a fifth key" optional="true" />\n+        </section>\n+\n+        <param name="length" type="boolean" label="Use the length option?" truevalue="--length" falsevalue="" help="Use this option if you want to add attribute with seq_length as a key and sequence length as a value" />\n+\n+        <param name="rankname" type="text" label="Add taxonomic annotation" help="Use this option if you want to add taxonomic annotation at taxonomic rank RANK_NAME"/>\n+\n+        <param name="mclfile" optional="true" type="data" format="txt,tabular" label="mcl file" help="use this option if you want to add a new attribute containing the number of the cluster the sequence record was assigned to, as indicated in file MCLFILE" />\n+\n+        <param name="uniqid" type="boolean" label="Force sequence record ids to be unique"  truevalue="--uniq-id" falsevalue="" help="Use this option if you want to force sequence record ids to be unique" />\n+        <expand macro="input_format_options_macro"/>\n+        <expand macro="out_format_macro"/>\n+    </inputs>\n+    <outputs>\n+        <data name="output" format="auto"/>\n+    </outputs>\n+    <tests>\n+        <test>\n+            <param name="input" value="output_obiuniq.fasta" ftype="fasta"/>\n+            <section name="key_selector">\n+                <param name="key" value="count" />\n+                <param name="key2" value="merged_sample" />\n+            </section>\n+            <param name="uniqid" value="true" />\n+            <param name="clearbool" value="true" />\n+            <param name="length" value="true" />\n+            <param name="seqrank" value="true" />\n+\n+            <output name="output" file="output_obiannotate.fasta" ftype="fasta"/>\n+        </test>\n+        <test>\n+            <param name="input" value="output_obiuniq.fasta.gz" ftype="fasta.gz"/>\n+            <section name="key_selector">\n+                <param name="key" value="count" />\n+                <param name="key2" value="merged_sample" />\n+            </section>\n+            <param name="uniqid" value="true" />\n+            <param name="clearbool" value="true" />\n+            <param name="length" value="true" />\n+            <param name="seqrank" value="true" />\n+            <output name="output" file="output_obiannotate.fasta.gz" ftype="fasta.gz" decompress="true"/>\n+        </test>\n+        <!-- TODO fastq input test -->\n+    </tests>\n+\n+    <help><![CDATA[\n+\n+.. class:: infomark\n+\n+**What it does**\n+\n+`obiannotate` is the command that allows adding/modifying/removing annotation attributes attached to sequence records.\n+\n+Once such attributes are added, they can be used by the other OBITools commands for filtering purposes or for statistics computing.\n+\n+@OBITOOLS_LINK@\n+\n+]]>\n+\n+    </help>\n+    <expand macro="citation" />\n+</tool>\n'
b
diff -r 3021b9f5809f -r f82cefbbcea5 test-data/illuminapairedend.output.fastq.gz
b
Binary file test-data/illuminapairedend.output.fastq.gz has changed
b
diff -r 3021b9f5809f -r f82cefbbcea5 test-data/output_ngsfilter_error_3.fastq
b
Binary file test-data/output_ngsfilter_error_3.fastq has changed
b
diff -r 3021b9f5809f -r f82cefbbcea5 test-data/output_ngsfilter_error_3.fastq.gz
b
Binary file test-data/output_ngsfilter_error_3.fastq.gz has changed
b
diff -r 3021b9f5809f -r f82cefbbcea5 test-data/output_ngsfilter_unidentified.fastq
b
Binary file test-data/output_ngsfilter_unidentified.fastq has changed
b
diff -r 3021b9f5809f -r f82cefbbcea5 test-data/output_obiannotate.fasta.gz
b
Binary file test-data/output_obiannotate.fasta.gz has changed
b
diff -r 3021b9f5809f -r f82cefbbcea5 test-data/output_obiclean_advanced.fasta.gz
b
Binary file test-data/output_obiclean_advanced.fasta.gz has changed
b
diff -r 3021b9f5809f -r f82cefbbcea5 test-data/output_obigrep_predicat.fasta.gz
b
Binary file test-data/output_obigrep_predicat.fasta.gz has changed
b
diff -r 3021b9f5809f -r f82cefbbcea5 test-data/output_obisort.fastq
--- a/test-data/output_obisort.fastq Thu Nov 28 15:50:43 2019 -0500
+++ b/test-data/output_obisort.fastq Mon May 10 19:37:25 2021 +0000
b
b"@@ -1,172 +1,232 @@\n->HELIUM_000100422_612GNAAXX:7:57:18459:16145#0/2_CONS_SUB_SUB_CMP count=64; merged_sample={'26a_F040644': 64}; obiclean_singletoncount=0; obiclean_internalcount=0; seq_length=99; obiclean_headcount=1; seq_rank=5; obiclean_samplecount=1; obiclean_status={'26a_F040644': 'h'}; obiclean_head=True; \n-ttagccctaaacataaacattcaataaacaagaatgttcgccagagtactactagcaaca\n-gcctgaaactcaaaggacttggcggtgctttacatccct\n->HELIUM_000100422_612GNAAXX:7:22:8540:14708#0/2_CONS_SUB_SUB count=61; merged_sample={'29a_F260619': 30, '15a_F730814': 31}; obiclean_singletoncount=0; obiclean_internalcount=0; seq_length=100; obiclean_headcount=2; seq_rank=4; obiclean_samplecount=2; obiclean_status={'29a_F260619': 'h', '15a_F730814': 'h'}; obiclean_head=True; \n-ttagccctaaacacaagtaattaatataacaaaattattcgccagagtactaccggcaat\n-agcttaaaactcaaaggacttggcggtgctttataccctt\n->HELIUM_000100422_612GNAAXX:7:6:9274:14951#0/2_CONS_SUB_SUB count=46; merged_sample={'13a_F730603': 46}; obiclean_singletoncount=0; obiclean_internalcount=0; seq_length=100; obiclean_headcount=1; seq_rank=8; obiclean_samplecount=1; obiclean_status={'13a_F730603': 'h'}; obiclean_head=True; \n-ctagccttaaacacaaatagttatgcaaacaaaactattcgccagagtactaccggcaat\n-agcttaaaactcaaaggacttggcggtgctttataccctt\n->HELIUM_000100422_612GNAAXX:7:13:5742:9859#0/2_CONS_SUB_SUB count=7; merged_sample={'29a_F260619': 7}; obiclean_singletoncount=1; obiclean_internalcount=0; seq_length=4; obiclean_headcount=0; seq_rank=16; obiclean_samplecount=1; obiclean_status={'29a_F260619': 's'}; obiclean_head=True; \n+@HELIUM_000100422_612GNAAXX:7:57:18459:16145#0/2_CONS_SUB_SUB_CMP count=64; merged_sample={'26a_F040644': 64}; obiclean_singletoncount=0; obiclean_internalcount=0; seq_length=99; obiclean_headcount=1; seq_rank=5; obiclean_samplecount=1; obiclean_status={'26a_F040644': 'h'}; obiclean_head=True; \n+ttagccctaaacataaacattcaataaacaagaatgttcgccagagtactactagcaacagcctgaaactcaaaggacttggcggtgctttacatccct\n++\n+IIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIII\n+@HELIUM_000100422_612GNAAXX:7:22:8540:14708#0/2_CONS_SUB_SUB count=61; merged_sample={'29a_F260619': 30, '15a_F730814': 31}; obiclean_singletoncount=0; obiclean_internalcount=0; seq_length=100; obiclean_headcount=2; seq_rank=4; obiclean_samplecount=2; obiclean_status={'29a_F260619': 'h', '15a_F730814': 'h'}; obiclean_head=True; \n+ttagccctaaacacaagtaattaatataacaaaattattcgccagagtactaccggcaatagcttaaaactcaaaggacttggcggtgctttataccctt\n++\n+IIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIII\n+@HELIUM_000100422_612GNAAXX:7:6:9274:14951#0/2_CONS_SUB_SUB count=46; merged_sample={'13a_F730603': 46}; obiclean_singletoncount=0; obiclean_internalcount=0; seq_length=100; obiclean_headcount=1; seq_rank=8; obiclean_samplecount=1; obiclean_status={'13a_F730603': 'h'}; obiclean_head=True; \n+ctagccttaaacacaaatagttatgcaaacaaaactattcgccagagtactaccggcaatagcttaaaactcaaaggacttggcggtgctttataccctt\n++\n+IIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIII\n+@HELIUM_000100422_612GNAAXX:7:13:5742:9859#0/2_CONS_SUB_SUB count=7; merged_sample={'29a_F260619': 7}; obiclean_singletoncount=1; obiclean_internalcount=0; seq_length=4; obiclean_headcount=0; seq_rank=16; obiclean_samplecount=1; obiclean_status={'29a_F260619': 's'}; obiclean_head=True; \n tttt\n->HELIUM_000100422_612GNAAXX:7:89:10281:5930#0/2_CONS_SUB_SUB_CMP count=3; merged_sample={'29a_F260619': 3}; obiclean_singletoncount=1; obiclean_internalcount=0; seq_length=100; obiclean_headcount=0; seq_rank=6; obiclean_samplecount=1; obiclean_status={'29a_F260619': 's'}; obiclean_head=True; \n-ttagccctaaacacaaataattacacaaacaaaattgttcaccagagtactagcggcaac\n-agcttaaaactcaaaggacttggcggtgctttataccctt\n->HELIUM_000100422_612GNAAXX:7:29:15520:18035#0/2_CONS_SUB_SUB count=2; merged_sample={'29a_F260619': 2}; obiclean_singletoncount=1; obiclean_internalcount=0; seq_length=100; obiclean_headcount=0; seq_rank=7; obiclean_sample"..b"M_000100422_612GNAAXX:7:10:9237:10532#0/2_CONS_SUB_SUB_CMP count=1; merged_sample={'29a_F260619': 1}; obiclean_singletoncount=0; obiclean_internalcount=1; seq_length=100; obiclean_headcount=0; seq_rank=51; obiclean_samplecount=1; obiclean_status={'29a_F260619': 'i'}; obiclean_head=False; \n+ttagccctaaacacaagtaattaatataacaaaataattcgccagagtactaccggcaatagcttaaaactcaaaggacttggcggtgctttataccctt\n++\n+IIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIII\n+@HELIUM_000100422_612GNAAXX:7:7:11998:4462#0/2_CONS_SUB_SUB count=1; merged_sample={'26a_F040644': 1}; obiclean_singletoncount=0; obiclean_internalcount=1; seq_length=99; obiclean_headcount=0; seq_rank=52; obiclean_samplecount=1; obiclean_status={'26a_F040644': 'i'}; obiclean_head=False; \n+ttagccctaaacataaacattcaataaacaagaatgttcgccagagtagtactagcaacagcctgaaactcaaaggacttggcggtgctttacatccct\n++\n+IIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIII\n+@HELIUM_000100422_612GNAAXX:7:111:18277:17779#0/2_CONS_SUB_SUB_CMP count=1; merged_sample={'26a_F040644': 1}; obiclean_singletoncount=1; obiclean_internalcount=0; seq_length=99; obiclean_headcount=0; seq_rank=53; obiclean_samplecount=1; obiclean_status={'26a_F040644': 's'}; obiclean_head=True; \n+ttagccctaaacatagataattttacaacaaaataattcgccagaggactactagcaatagcctgaaactcaaaggacttggcggtgctttacatccct\n++\n+IIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIII\n+@HELIUM_000100422_612GNAAXX:7:3:17077:6562#0/2_CONS_SUB_SUB_CMP count=1; merged_sample={'15a_F730814': 1}; obiclean_singletoncount=0; obiclean_internalcount=1; seq_length=100; obiclean_headcount=0; seq_rank=54; obiclean_samplecount=1; obiclean_status={'15a_F730814': 'i'}; obiclean_head=False; \n+ttagccctaaacacaagtaattaatataacaaaattattcgccagagtactgccggcaatagcttaaaactcaaaggacttggcggtgctttataccctt\n++\n+IIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIII\n+@HELIUM_000100422_612GNAAXX:7:19:4311:13343#0/2_CONS_SUB_SUB_CMP count=1; merged_sample={'26a_F040644': 1}; obiclean_singletoncount=0; obiclean_internalcount=1; seq_length=99; obiclean_headcount=0; seq_rank=55; obiclean_samplecount=1; obiclean_status={'26a_F040644': 'i'}; obiclean_head=False; \n+ttagccctaaacataaacattcaataaacaagaatgttcgccagagtactacgagcaacagcctgaaactcaaaggacttggcggtgctttacatccct\n++\n+IIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIII\n+@HELIUM_000100422_612GNAAXX:7:30:1800:7833#0/2_CONS_SUB_SUB count=1; merged_sample={'15a_F730814': 1}; obiclean_singletoncount=1; obiclean_internalcount=0; seq_length=100; obiclean_headcount=0; seq_rank=56; obiclean_samplecount=1; obiclean_status={'15a_F730814': 's'}; obiclean_head=True; \n+ttagccctaaacacaagacattaatataacgagattaatcgacagagtactaccggctatagcttaaaactcaaaggacttggcggtgctttataccctt\n++\n+IIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIII\n+@HELIUM_000100422_612GNAAXX:7:108:9222:18258#0/2_CONS_SUB_SUB count=1; merged_sample={'13a_F730603': 1}; obiclean_singletoncount=0; obiclean_internalcount=1; seq_length=100; obiclean_headcount=0; seq_rank=57; obiclean_samplecount=1; obiclean_status={'13a_F730603': 'i'}; obiclean_head=False; \n+ctagccttaaacacaaatagttatgcagacaaaactattcgccagagtactaccggcaatagcttaaaactcaaaggacttggcggtgctttataccctt\n++\n+IIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIII\n+@HELIUM_000100422_612GNAAXX:7:38:3005:20881#0/2_CONS_SUB_SUB_CMP count=1; merged_sample={'26a_F040644': 1}; obiclean_singletoncount=0; obiclean_internalcount=1; seq_length=99; obiclean_headcount=0; seq_rank=58; obiclean_samplecount=1; obiclean_status={'26a_F040644': 'i'}; obiclean_head=False; \n+ttagccctaaacatgaacattcaataaacaagaatgttcgccagagtactactagcaacagcctgaaactcaaaggacttggcggtgctttacatccct\n++\n+IIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIII\n"
b
diff -r 3021b9f5809f -r f82cefbbcea5 test-data/output_obiuniq.fasta.gz
b
Binary file test-data/output_obiuniq.fasta.gz has changed
b
diff -r 3021b9f5809f -r f82cefbbcea5 test-data/output_obiuniq_family.fasta.gz
b
Binary file test-data/output_obiuniq_family.fasta.gz has changed
b
diff -r 3021b9f5809f -r f82cefbbcea5 test-data/wolf_small.F.fastq.gz
b
Binary file test-data/wolf_small.F.fastq.gz has changed
b
diff -r 3021b9f5809f -r f82cefbbcea5 test-data/wolf_small.R.fastq.gz
b
Binary file test-data/wolf_small.R.fastq.gz has changed