Repository 'vsearch'
hg clone https://toolshed.g2.bx.psu.edu/repos/iuc/vsearch

Changeset 1:8c4e2933a17a (2015-08-26)
Previous changeset 0:fae6527990af (2015-05-21) Next changeset 2:f29e21388219 (2015-12-17)
Commit message:
planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/vsearch commit 95732e013ec4dfe5dae0b9ed81e9d7710cbaed9d
modified:
clustering.xml
dereplication.xml
sorting.xml
tool_dependencies.xml
vsearch_macros.xml
added:
test-data/clustering_blast6out_result2.tab
test-data/clustering_centroids_result2.fasta
test-data/clustering_centroids_result4.fasta
test-data/clustering_notmatched_result2.fasta
test-data/clustering_uc_result3.uc
test-data/dereplication_result2.fasta
test-data/dereplication_uc_result3.fasta
test-data/sorting_result3.fasta
test-data/sorting_result4.fasta
test-data/sorting_result5.fasta
b
diff -r fae6527990af -r 8c4e2933a17a clustering.xml
--- a/clustering.xml Thu May 21 03:58:09 2015 -0400
+++ b/clustering.xml Wed Aug 26 13:34:22 2015 -0400
[
b'@@ -1,4 +1,4 @@\n-<tool id="vsearch_clustering" name="VSearch clustering" version="@VERSION@.0">\n+<tool id="vsearch_clustering" name="VSearch clustering" version="@VERSION@.1">\n     <description></description>\n     <macros>\n         <import>vsearch_macros.xml</import>\n@@ -10,8 +10,12 @@\n <![CDATA[\n     vsearch\n         @GENERAL@\n-        --cluster_fast "$infile"\n-        ##--cluster_smallmem FILENAME  cluster sequences using a small amount of memory\n+\t\n+\t#if $clustering_mode.clustering_mode_select == \'cluster_fast\':\n+            --cluster_fast "$infile"\n+\t#else if $clustering_mode.clustering_mode_select == \'cluster_smallmem\':\n+            --cluster_smallmem "$infile"\n+        #end if\n         ##--clusters STRING            output each cluster to a separate FASTA file\n \n         #if $maxrejects:\n@@ -23,7 +27,7 @@\n \n         $cons_truncate\n         --id $id\n-        ##--iddef $iddef\n+        --iddef $iddef\n \n         #if \'--msaout\' in str($outputs):\n             --msaout $msaout\n@@ -52,24 +56,33 @@\n         #if $qmask != \'no\':\n             --qmask $qmask\n         #end if\n-        #if $sizein:\n-            --sizein $sizein\n-        #end if\n-        #if $sizeout:\n-            --sizeout $sizeout\n-        #end if\n+        $sizein\n+        $sizeout\n         --strand $strand\n-        --usersort $usersort\n+\t$usersort\n+\t#if $uc:\n+            --uc "$uc_outfile"\n+\t#end if\n \n ]]>\n     </command>\n     <inputs>\n-        <param name="infile" type="data" format="fasta" label="Select your FASTA file" help="(--cluster_fast)" />\n+        <param name="infile" type="data" format="fasta" label="Select your input FASTA file" help="" />\n+        <conditional name="clustering_mode">\n+            <param name="clustering_mode_select" type="select" label="Choose sorting method to use before clustering" help="">\n+                <option value="cluster_fast" default="True">Cluster sequences after sorting by length (--cluster-fast)</option>\n+                <option value="cluster_smallmem">Cluster already sorted sequences (--cluster-smallmem)</option>\n+            </param>\n+            <when value="cluster_fast">\n+            </when>\n+            <when value="cluster_smallmem">\n+          </when>\n+        </conditional>\n+        <param name="usersort" type="boolean" truevalue="--usersort" falsevalue="" checked="False" \n+            label="Indicate that input sequences are not presorted by length" help="(--usersort)"/>\n         <expand macro="id_and_iddef" />\n         <param name="cons_truncate" type="boolean" truevalue="--cons_truncate" falsevalue="" checked="False" \n             label="Do not ignore terminal gaps in MSA for consensus" help="(--cons_truncate)"/>\n-        <param name="usersort" type="boolean" truevalue="--usersort" falsevalue="" checked="False" \n-            label="Indicate that input sequences are presorted" help="(--usersort)"/>\n         <expand macro="qmask" />\n         <expand macro="sizein" />\n         <expand macro="sizeout" />\n@@ -83,6 +96,7 @@\n             <option value="--notmatched">Write non-matching query sequences to separate file</option>\n             <option value="--matched">Write matching query sequences to separate file</option>\n         </expand>\n+        <expand macro="uclust_like_output" />\n \n     </inputs>\n     <outputs>\n@@ -110,6 +124,9 @@\n         <data name="fastapairs" format="fasta" label="${tool.name} on ${on_string}: Query/Target sequences">\n             <filter>\'--fastapairs\' in outputs</filter>\n         </data>\n+        <data name="uc_outfile" format="tabular" label="${tool.name} on ${on_string}: UCLUST like output">\n+            <filter>uc is True</filter>\n+        </data>\n     </outputs>\n     <tests>\n         <test>\n@@ -117,7 +134,7 @@\n             <param name="id" value="0.99"/>\n             <param name="maxaccepts" value="1"/>\n             <param name="maxrejects" value="2"/>\n-            <param name="sizeout" value="--sizeout"/>\n+            <param name="sizeout" value=""/>\n             <param name="outputs'..b't_result2.tab" ftype="tabular" />\n+            <output name="notmatched" file="clustering_notmatched_result2.fasta" ftype="fasta" />\n+        </test>\n+\t<test>\n+            <param name="infile" value="BioMarKs5k.fsa.bz2" ftype="fasta" />\n+            <param name="clustering_mode_select" value="cluster_smallmem"/>\n+            <param name="usersort" value="--usersort"/>\n+            <param name="id" value="0.99"/>\n+            <param name="maxaccepts" value="1"/>\n+            <param name="maxrejects" value="2"/>\n+            <param name="sizeout" value="--sizeout"/>\n+            <param name="outputs" value="--centroids" />\n+            <param name="uc" value="--uc"/>\n+            <output name="centroids" file="clustering_centroids_result2.fasta" ftype="fasta" />\n+            <output name="uc_outfile" file="clustering_uc_result3.uc" ftype="tabular" />\n+        </test>\n+\t<test>\n+            <param name="infile" value="BioMarKs5k.fsa.bz2" ftype="fasta" />\n+            <param name="clustering_mode_select" value="cluster_smallmem"/>\n+            <param name="usersort" value="--usersort"/>\n+            <param name="id" value="0.99"/>\n+            <param name="maxaccepts" value="1"/>\n+            <param name="maxrejects" value="2"/>\n+            <param name="sizeout" value="--sizeout"/>\n+            <param name="outputs" value="--centroids" />\n+            <param name="iddef" value="0"/>\n+            <output name="centroids" file="clustering_centroids_result4.fasta" ftype="fasta" />\n+        </test>\n+\t<test>\n+            <param name="infile" value="BioMarKs5k.fsa.bz2" ftype="fasta" />\n+            <param name="clustering_mode_select" value="cluster_fast"/>\n+            <param name="usersort" value="--usersort"/>\n+            <param name="id" value="0.99"/>\n+            <param name="maxaccepts" value="1"/>\n+            <param name="maxrejects" value="2"/>\n+            <param name="sizeout" value=""/>\n+            <param name="outputs" value="--centroids" />\n+            <param name="qmask" value="none"/>\n+            <output name="centroids" file="clustering_centroids_result1.fasta" ftype="fasta" />\n+        </test>\n     </tests>\n     <help>\n <![CDATA[\n@@ -139,19 +206,21 @@\n \n Clustering options (most searching options also apply)\n   --centroids FILENAME         output centroid sequences to FASTA file\n-  --cluster_fast FILENAME      cluster sequences fast\n-  --cluster_smallmem FILENAME  cluster sequences using a small amount of memory\n+  --cluster_fast FILENAME      cluster sequences after sorting by length\n+  --cluster_size FILENAME      cluster sequences after sorting by abundance\n+  --cluster_smallmem FILENAME  cluster already sorted sequences (see -usersort)\n   --clusters STRING            output each cluster to a separate FASTA file\n   --consout FILENAME           output cluster consensus sequences to FASTA file\n   --cons_truncate              do not ignore terminal gaps in MSA for consensus\n   --id REAL                    reject if identity lower\n   --iddef INT                  id definition, 0-4=CD-HIT,all,int,MBL,BLAST (2)\n-  --msaout FILENAME            output multiple seq. alignments to FASTA file \n-  --qmask                      mask seqs with dust, soft or no method (dust)\n-  --sizein                     read abundance annotation from input\n+  --msaout FILENAME            output multiple seq. alignments to FASTA file\n+  --qmask                      seqs with dust, soft or no method (dust)\n+  --sizein                     propagate abundance annotation from input\n   --sizeout                    write cluster abundances to centroid file\n-  --strand                     cluster using "plus" or "both" strands (plus)\n-  --usersort                   indicate that input sequences are presorted\n+  --strand                     cluster using plus or both strands (plus)\n+  --uc FILENAME                filename for UCLUST-like output\n+  --usersort                   indicate sequences not presorted by length\n \n \n @EXTERNAL_DOCUMENTATION@\n'
b
diff -r fae6527990af -r 8c4e2933a17a dereplication.xml
--- a/dereplication.xml Thu May 21 03:58:09 2015 -0400
+++ b/dereplication.xml Wed Aug 26 13:34:22 2015 -0400
b
@@ -1,4 +1,4 @@
-<tool id="vsearch_dereplication" name="VSearch dereplication" version="@VERSION@.0">
+<tool id="vsearch_dereplication" name="VSearch dereplication" version="@VERSION@.1">
     <description></description>
     <macros>
         <import>vsearch_macros.xml</import>
@@ -18,16 +18,14 @@
             --minuniquesize $minuniquesize
         #end if
         --output $outfile
-        #if $sizein:
-            --sizein $sizein
+        $sizein
+ $sizeout
+        --strand $strand
+        #if $topn:
+            --topn $topn
         #end if
-        #if $sizeout:
-            --sizeout $sizeout
-        #end if
-        --strand $strand
-        --topn $topn
         #if $uc:
-            --uc $uc
+            --uc $uc_outfile
         #end if
 ]]>
     </command>
@@ -45,7 +43,7 @@
     </inputs>
     <outputs>
         <data name="outfile" format="fasta" label="${tool.name} on ${on_string}" />
-        <data name="uc" format="fasta" label="${tool.name} on ${on_string}: UCLUST like output">
+        <data name="uc_outfile" format="fasta" label="${tool.name} on ${on_string}: UCLUST like output">
             <filter>uc is True</filter>
         </data>
     </outputs>
@@ -55,9 +53,28 @@
             <param name="strand" value="both" />
             <param name="minuniquesize" value="1" />
             <param name="maxuniquesize" value="100000" />
+            <param name="topn" value="10000" />
+            <output name="outfile" file="dereplication_result1.fasta" ftype="fasta" />
+        </test>
+        <test>
+            <param name="infile" value="AF091148_first_rep.fsa.bz2" ftype="fasta" />
+            <param name="strand" value="both" />
+            <param name="minuniquesize" value="1" />
+            <param name="maxuniquesize" value="100000" />
+            <param name="sizeout" value="--sizeout"/>
+            <param name="topn" value="" />
+            <output name="outfile" file="dereplication_result2.fasta" ftype="fasta" />
+        </test>
+        <test>
+            <param name="infile" value="AF091148_first_rep.fsa.bz2" ftype="fasta" />
+            <param name="strand" value="both" />
+            <param name="minuniquesize" value="1" />
+            <param name="maxuniquesize" value="100000" />
             <param name="sizeout" value="--sizeout"/>
             <param name="topn" value="10000" />
-            <output name="outfile" file="dereplication_result1.fasta" ftype="fasta" />
+            <param name="uc" value="--uc" />
+            <output name="outfile" file="dereplication_result2.fasta" ftype="fasta" />
+            <output name="uc_outfile" file="dereplication_uc_result3.fasta" ftype="fasta" />
         </test>
     </tests>
     <help>
b
diff -r fae6527990af -r 8c4e2933a17a sorting.xml
--- a/sorting.xml Thu May 21 03:58:09 2015 -0400
+++ b/sorting.xml Wed Aug 26 13:34:22 2015 -0400
[
@@ -1,4 +1,4 @@
-<tool id="vsearch_sorting" name="VSearch sorting" version="@VERSION@.0">
+<tool id="vsearch_sorting" name="VSearch sorting" version="@VERSION@.1">
     <description></description>
     <macros>
         <import>vsearch_macros.xml</import>
@@ -22,9 +22,10 @@
             #end if
         #end if
         --output $outfile
-        #if $sizeout:
-            --sizeout $sizeout
+        #if $relabel:
+            --relabel "$relabel"
         #end if
+        $sizeout
         #if $topn:
             --topn $topn
         #end if
@@ -49,6 +50,8 @@
           </when>
         </conditional>
         <expand macro="topn" />
+        <param name="relabel" type="text" value="" 
+               label="Relabel with this prefix string after sorting" help="(--relabel)"/>
         <param name="sizeout" type="boolean" truevalue="--sizeout" falsevalue="" checked="False" 
             label="Add abundance annotation to output" help="(--sizeout)"/>
     </inputs>
@@ -66,6 +69,24 @@
             <param name="infile" value="db.fasta" ftype="fasta" />
             <output name="outfile" file="sorting_result2.fasta" ftype="fasta" />
         </test>
+        <test>
+            <param name="sorting_mode_select" value="sortbylength"/>
+            <param name="infile" value="db.fasta" ftype="fasta" />
+            <param name="relabel" value="TEST" />
+            <output name="outfile" file="sorting_result3.fasta" ftype="fasta" />
+        </test>
+        <test>
+            <param name="sorting_mode_select" value="sortbylength"/>
+            <param name="infile" value="db.fasta" ftype="fasta" />
+            <param name="sizeout" value="--sizeout" />
+            <output name="outfile" file="sorting_result4.fasta" ftype="fasta" />
+        </test>
+        <test>
+            <param name="sorting_mode_select" value="sortbylength"/>
+            <param name="infile" value="db.fasta" ftype="fasta" />
+            <param name="relabel" value="With spaces" />
+            <output name="outfile" file="sorting_result5.fasta" ftype="fasta" />
+        </test>
     </tests>
     <help>
 <![CDATA[
b
diff -r fae6527990af -r 8c4e2933a17a test-data/clustering_blast6out_result2.tab
--- /dev/null Thu Jan 01 00:00:00 1970 +0000
+++ b/test-data/clustering_blast6out_result2.tab Wed Aug 26 13:34:22 2015 -0400
b
b'@@ -0,0 +1,3624 @@\n+b7ffa8f46cb16542d89dc5293ade2098;size=3629\tb235271fbc8a6c9d990037857189ee9a;size=22254\t99.7\t388\t0\t1\t1\t388\t1\t387\t-1\t0\n+aff14fabb2213686a8bc18bf98edd8fd;size=3501\t7e02ae2e1e404d4e7c6035a6e374d29d;size=20728\t99.7\t375\t0\t1\t1\t375\t1\t374\t-1\t0\n+5bf3b429509ca7b31bbce32fa4d77e33;size=3298\tefbd11c972faa734253f779fc4eb2a64;size=5440\t99.7\t383\t1\t0\t1\t383\t1\t383\t-1\t0\n+8dbb6f1dafe133984c7c7d899a730e1c;size=2722\t78951b2d4ca30531381672a30be0978a;size=3655\t99.5\t381\t2\t0\t1\t381\t1\t381\t-1\t0\n+397a9be0ac23a54c504ad0cd4f86ddb9;size=2689\t4edf10a5e3aa4bd4ed28b1694727a060;size=3078\t99.7\t383\t1\t0\t1\t383\t1\t383\t-1\t0\n+fef76769bd8d3a969b567d6d037a9594;size=2592\t7e02ae2e1e404d4e7c6035a6e374d29d;size=20728\t99.7\t374\t0\t1\t1\t373\t1\t374\t-1\t0\n+dcb878b5e3696aaa3fded2a9f7dea7cd;size=2312\ta9d668eae33f9fd4484585d9fe52b05e;size=8638\t99.5\t384\t2\t0\t1\t384\t1\t385\t-1\t0\n+2cb0faa31a23b37e7a40aa1d4ea12534;size=2194\t39392bbb9626a64e6663c05b70293e7c;size=11535\t99.7\t384\t0\t1\t1\t384\t1\t383\t-1\t0\n+d56b9d19ecd14c245a89c7ac5f10e437;size=2070\t7e02ae2e1e404d4e7c6035a6e374d29d;size=20728\t99.7\t375\t0\t1\t1\t375\t1\t374\t-1\t0\n+585a7f513b67529b955093b393a269bc;size=1982\tb970fcbdd71ad2a333f702c7ecfe7114;size=10907\t99.7\t384\t0\t1\t1\t383\t1\t384\t-1\t0\n+91347cd2230896780f6a8d8ec7a3eb63;size=1899\tea64ae1d6dddc2146105a882229c81bb;size=5125\t99.7\t387\t0\t1\t1\t387\t1\t386\t-1\t0\n+156b1f0da0c6d2b99c93ca960ad238e1;size=1865\t39392bbb9626a64e6663c05b70293e7c;size=11535\t99.7\t383\t0\t1\t1\t382\t1\t383\t-1\t0\n+0da2223146fae1b8f135d4a714ab758a;size=1658\tefbd11c972faa734253f779fc4eb2a64;size=5440\t99.5\t384\t1\t1\t1\t384\t1\t383\t-1\t0\n+e3678986fcd4c8b340dde7edc8769cff;size=1654\tb970fcbdd71ad2a333f702c7ecfe7114;size=10907\t99.5\t383\t2\t0\t1\t383\t1\t384\t-1\t0\n+5b2f9bda94dd54330d8de22256613968;size=1644\tfd9c8703206ef0b3c0fcd3846f26fb50;size=2770\t99.5\t381\t2\t0\t1\t381\t1\t381\t-1\t0\n+f0e31f5fc37262f3a54fe156214ada67;size=1565\t26d2046e1a0f79450d6233ef29aab44e;size=4937\t99.5\t380\t2\t0\t1\t380\t1\t381\t-1\t0\n+09c0939b69af725fcefdeb6c35cdaa5b;size=1498\tb235271fbc8a6c9d990037857189ee9a;size=22254\t99.5\t386\t2\t0\t1\t386\t1\t387\t-1\t0\n+480f81bba6b456e691c9ae3af1944050;size=1476\t7e02ae2e1e404d4e7c6035a6e374d29d;size=20728\t99.7\t375\t0\t1\t1\t375\t1\t374\t-1\t0\n+9edca20763bd11809a3d8f3967db2877;size=1472\t38a1e68923981030900a4744924d4694;size=2491\t99.2\t381\t3\t0\t1\t381\t1\t381\t-1\t0\n+b5ab0dbcb415c673734c5feede1e68c0;size=1402\t7e02ae2e1e404d4e7c6035a6e374d29d;size=20728\t99.5\t374\t0\t2\t1\t372\t1\t374\t-1\t0\n+540b404fd00e9ac0fd64a1013100ff60;size=1396\tb235271fbc8a6c9d990037857189ee9a;size=22254\t99.7\t388\t0\t1\t1\t388\t1\t387\t-1\t0\n+7b06ce2140c60cda9883867bf19fdc70;size=1316\t38a1e68923981030900a4744924d4694;size=2491\t99.5\t381\t2\t0\t1\t381\t1\t381\t-1\t0\n+6182032c31fcc52e80485eb65f57a3b0;size=1283\taecd442213d89e3f43949aee5040a3ed;size=5318\t99.5\t380\t2\t0\t1\t380\t1\t381\t-1\t0\n+4d6c118910206a89191ce805180fe971;size=1205\t0758959c27aa3f623d5484ca0cefb2dc;size=1595\t99.7\t381\t1\t0\t1\t381\t1\t381\t-1\t0\n+d1521a9319e576119236c1d23e84b6ef;size=1202\ta4fcbfbd0bab3615b1357ea94b0abe1b;size=1542\t99.5\t385\t2\t0\t1\t385\t1\t386\t-1\t0\n+f5ee2e1acf1ecc6a1e1f8db80e42c270;size=1201\t39392bbb9626a64e6663c05b70293e7c;size=11535\t99.7\t384\t0\t1\t1\t384\t1\t383\t-1\t0\n+dcf0057c94c92fad51472cd1fef22f5e;size=1172\t721460e46e8804111d74cb730340492f;size=3538\t99.5\t381\t2\t0\t1\t381\t1\t382\t-1\t0\n+b796257549c946cfffa56aceb6cbc95a;size=1166\tda17e1a54e88120e294c7e68e350f47f;size=6062\t99.7\t374\t0\t1\t1\t373\t1\t374\t-1\t0\n+11eb106b385d9b548ae2216ea66ba928;size=1127\ta9d668eae33f9fd4484585d9fe52b05e;size=8638\t99.7\t386\t0\t1\t1\t386\t1\t385\t-1\t0\n+c7ff79b83a3a5a22215e511c751f083b;size=1108\ta3b19115a503e03c27f9577b3e9c673e;size=2708\t99.7\t381\t1\t0\t1\t381\t1\t381\t-1\t0\n+817512aac90b499dbeb9a8c91816a9bf;size=1094\t78951b2d4ca30531381672a30be0978a;size=3655\t99.7\t381\t1\t0\t1\t381\t1\t381\t-1\t0\n+4347ae2e59508730eb759fc73d80cc40;size=1052\tf06d17d4b0138ffa08d4f76dc098b6b1;size=1076\t99.2\t387\t0\t3\t1\t386\t1\t385\t-1\t0\n+2ad33e9d24121dc57113fa22292616ce;size=1048\ta1fe4d26985b4fd62b7bef1949d111f4;size=4547\t99.5\t375\t2\t0\t1\t376\t1\t375\t-1\t0\n+ea0fef204a1066a299a9bf6aeb9fbd8a;size=991\t39392bbb9626a64e6663c05b70293e7c;size=11535\t99.7\t384\t0\t1\t1\t384\t'..b'1\t0\n+8098d0f76e64475d211bdf4bb7c193b5;size=29\tda17e1a54e88120e294c7e68e350f47f;size=6062\t99.5\t375\t0\t2\t1\t374\t1\t374\t-1\t0\n+835fd6c5c54a8651c00b059284ecfd3b;size=29\t9701b75c97af0ba765c88b2014f38e86;size=128\t99.7\t381\t0\t1\t1\t381\t1\t380\t-1\t0\n+839e78cbcaa38d36d86a49e90a7176c4;size=29\te401b165aa34a990ec26b307fb8a93c5;size=1445\t99.7\t382\t0\t1\t1\t382\t1\t381\t-1\t0\n+83b59c5798c4f802422cd674ce8883dc;size=29\t794febe7f0e75cadf7a8117f0026e7df;size=234\t99.7\t381\t1\t0\t1\t381\t1\t381\t-1\t0\n+89ec5bf22b89b5fed88eb5b163685995;size=29\td35654eb7b71f92a7122dd25696b4daa;size=253\t99.7\t383\t1\t0\t1\t383\t1\t383\t-1\t0\n+8d339c62296eca340c7acb045295c05e;size=29\te380031f8f6d7ed53c033b8c5981c084;size=98\t99.7\t382\t0\t1\t1\t382\t1\t381\t-1\t0\n+8f74bedb82f8c3ae32eca1334fa9a2a2;size=29\t367981d8723cf4e3d71baf722702b583;size=955\t99.7\t382\t0\t1\t1\t382\t1\t381\t-1\t0\n+8f97fb55171c8402950a35e8cd45ea60;size=29\t8189c62883b074718aa565dd3a377d32;size=64\t99.5\t384\t2\t0\t1\t384\t1\t384\t-1\t0\n+90fef2cdcb4526d62ccf228cf2f65036;size=29\tc5ffc66b15459f2709fa625c42de4981;size=269\t99.7\t374\t0\t1\t1\t373\t1\t374\t-1\t0\n+948fae47a59f06837b296195e9533481;size=29\tb235271fbc8a6c9d990037857189ee9a;size=22254\t99.7\t387\t1\t0\t1\t387\t1\t387\t-1\t0\n+96e5ebe13592405389371e79097fe24b;size=29\t7e02ae2e1e404d4e7c6035a6e374d29d;size=20728\t99.5\t374\t0\t2\t1\t372\t1\t374\t-1\t0\n+97d07a69c81b8915f910806f49e1dfce;size=29\t9aa859a343f11ef50552680c294ab3d6;size=59\t99.5\t380\t0\t2\t1\t378\t1\t380\t-1\t0\n+9b9e6561b71bacb65b011e11233b558a;size=29\t40ee3d716c5d6182074f0a132734dc08;size=547\t99.7\t381\t0\t1\t1\t380\t1\t381\t-1\t0\n+9cc276e5562b2e067000cb804716cc72;size=29\t1ad5d7db6aa24146e665af7d4d8a5645;size=41\t99.2\t384\t0\t3\t1\t382\t1\t383\t-1\t0\n+9ded02e7fe5ddf955662e0838c9405da;size=29\t3b9c1697cd9fa5e1fb8e2acb74f6880d;size=145\t99.5\t380\t2\t0\t1\t380\t1\t381\t-1\t0\n+a10ef95bf74e767de728aaf250f82216;size=29\tc79afaf32375a47ab67be556fa3b564e;size=41\t99.2\t380\t3\t0\t1\t381\t1\t380\t-1\t0\n+a2d30bb89fe95b2bb2b26190230b6269;size=29\t6b394e36e1bef9a54ee149410df5edd4;size=1366\t99.7\t374\t0\t1\t1\t373\t1\t374\t-1\t0\n+a6b565b23702c4c81f2b9640cd2ed0f5;size=29\t4fd9e532b34b278047b4a588cc98708a;size=1762\t99.5\t382\t0\t2\t1\t382\t1\t380\t-1\t0\n+a8fa1f030499f69b8fb66a5b092f99ed;size=29\t38a1e68923981030900a4744924d4694;size=2491\t99.5\t381\t2\t0\t1\t381\t1\t381\t-1\t0\n+a99f65aa4c312b67b876b0d2b46004a5;size=29\t1c7a4a95f9f23058b6176ae6e7360636;size=99\t99.5\t380\t2\t0\t1\t380\t1\t380\t-1\t0\n+ab0e8a4a8831aef6e2035920bad0af8a;size=29\t165c8aa6c294466e476a628e2d42326e;size=343\t99.7\t380\t1\t0\t1\t380\t1\t380\t-1\t0\n+acb0b77870a486baf4b722a345c5c3be;size=29\t354bfa6c30fdd33ca8b1824f0c386b31;size=243\t99.7\t381\t0\t1\t1\t381\t1\t380\t-1\t0\n+acc5f37521e0eeacfb71521f731c1982;size=29\t7ff818ff14477645d9748f9e80212e1a;size=791\t99.2\t379\t2\t1\t1\t378\t1\t380\t-1\t0\n+b0613a10ff3c5d8f689c7514b929dd97;size=29\t41adb02887726df1852fe9938796a325;size=97\t99.5\t383\t0\t2\t1\t383\t1\t381\t-1\t0\n+b16bd7eaabd549f5a8da90e2876cc4ff;size=29\t980d40447ad2bed74e1a36ff7a2d8362;size=244\t99.2\t382\t2\t1\t1\t382\t1\t382\t-1\t0\n+b24ac35e6510476fadee6eb47569b6bd;size=29\te16848b95cf7309d011c4c97a7bcd2f9;size=1507\t99.2\t369\t3\t0\t1\t369\t1\t369\t-1\t0\n+b2daba5635e59a330b9a233031882bef;size=29\t6d534239f9c5ebd883a72f96e2d21557;size=546\t99.7\t381\t0\t1\t1\t380\t1\t381\t-1\t0\n+b765ebc6c4d8ce8455dd1b24ed76cd62;size=29\ta52196ae2db82d5f270103453bc3a2ac;size=1101\t99.5\t381\t2\t0\t1\t381\t1\t381\t-1\t0\n+ba839876211fb0b6fb9113d05ce8a6b4;size=29\t006eb542c4ddd1086af742069fc840ba;size=294\t99.7\t385\t0\t1\t1\t385\t1\t384\t-1\t0\n+bc04647af93059a38915012d5f17d308;size=29\t1e7bf5b9268da3a50505214ab3a5670f;size=575\t99.4\t361\t0\t2\t1\t359\t1\t361\t-1\t0\n+bca7d1b2f489d827fc22ee3e509e096d;size=29\t99ba81c88f63f83daf290add3918d38b;size=1787\t99.5\t387\t0\t2\t1\t386\t1\t386\t-1\t0\n+bd3a0cff22a32ba782f8df17e8ef6a90;size=29\t5683a4033863e64015d0facb4961a38a;size=1129\t99.5\t380\t1\t1\t1\t379\t1\t380\t-1\t0\n+bd722cae807361199a837719abb82aa5;size=29\t2f5d10970ddf2332d2df676704aa0c78;size=46\t99.5\t383\t1\t1\t1\t382\t1\t383\t-1\t0\n+c5ffb5368376c81f723b6402ca2b84ba;size=29\t1f854f3a83c7c03dc88303978686c39a;size=427\t99.5\t383\t2\t0\t1\t383\t1\t383\t-1\t0\n+c7230827efa17f5f79a837fa1d3d9e9b;size=29\t7ba6b7e87ff4f03a195f5b23b517ecb2;size=104\t99.2\t381\t2\t1\t1\t382\t1\t380\t-1\t0\n'
b
diff -r fae6527990af -r 8c4e2933a17a test-data/clustering_centroids_result2.fasta
--- /dev/null Thu Jan 01 00:00:00 1970 +0000
+++ b/test-data/clustering_centroids_result2.fasta Wed Aug 26 13:34:22 2015 -0400
b
b'@@ -0,0 +1,8256 @@\n+>b235271fbc8a6c9d990037857189ee9a;size=86;\n+AGCTCCAATAGCGTATATTAAAGTTGTTGCAGTTAAAAAGCTCGTAGTTGGATTTCTGGTGCATTCCACTGGCCTATTGG\n+TTAACTCCAACTTGGCTCATTTGGAATACGCCATCTTTAGGCAGACCCGTCGTGGCATTAGGTTGTCGTGATGGTTACGC\n+CTATCGTTTACTGTGAAGAAATTAGGGTGTTCAAAGCAGGCTTATGCCATGAATACGTTAGCATGGAATAATGAGATAGG\n+ATTTCGGTACTATTTTGTTGGTTTGTGTACGGAAATAATGATTAACAGGAACAGTGTTGTGGGTATTCGTATTTCGTTGT\n+CAGAGGTGAAATTCTTGGATTTACGAAAGACGAACGACTGCGAAAGCATTTACCAAGGATGTTTTCA\n+>7e02ae2e1e404d4e7c6035a6e374d29d;size=105;\n+AGCTCCAATAGCGTATACTAATGTTGTTGCAGTTAAAAAGCTCGTAGTCGGATTTCAGTAGGCTCAGTTAAGTCTCTTCT\n+ATTGAGTTCTTTATGGGCCTGCTTCTTTGACAGAAACTTCTATGTTATTCATTTAGCGTGGGTAGCGACTGTCTCTTTTA\n+CTTTGAGAAAATTAGAGTGTTCAAAGCAGGTATTCGCCTGAATATTACTCTTGGAATAATGCTATAAGACTTTGGTTCTA\n+ATGTATTGGTGATTGGGACCAGAGTAATGATTGATAGGGACGGTTGGGGTCTTACGTACTGCAAAGCGAGAGGTGAAATT\n+CTTGGACCTTTGTATGACGAACAACTGCGAAAGCATTGGACTAGGACGTTCCCG\n+>39392bbb9626a64e6663c05b70293e7c;size=94;\n+AGCTCCAATAGCGTATATTAAAGTTGTTGTGGTTAAAAAGCTCGTAGTTGGATCTCGGCGGACTGAGGGCGGTTTGCTTG\n+CTAGTATTACTGCCCTATAGTCCGTAGTTTTGCCAGAGGTTTCGGGGTGCTCTTAATCGAGTGTCCCGGGATGCTGGCAG\n+GTTTACTTTGAAAAAATTAGAGTGCTCAAAGCAGGCTATTACGCCTGAATATTCGTGCATGGAATAATAGAATAGGAAGT\n+CGTTTCTATTTTGTTGGTTTTCGGAAATCGACTTAATGATTAATAGGGACAGTCGGGGGCATTTGTATTCAAACGACAGA\n+GGTGAAATTCTTGGACCGTTTGAAGACAAACTACTGCGAAAGCATTTGCCAAGAATGTTTTCA\n+>b970fcbdd71ad2a333f702c7ecfe7114;size=63;\n+AGCTCCAATAGCGTATATTAAAGTTGTTGCAGTTAAAAAGCTCGTAGTTGGATTTCTGGCAGGAGCGACCGGTCACACAC\n+TCTGTGCGTGAACTTGTGTTGTCTCTGGCCATCCTTGGGGAGATCCTGTTTGGCATTAAGTTGTCGGGCAGGGGATACCC\n+ATCGTTTACTGTGAAAAAATTAGAGTGTTTAAAGCAGGCTTATGCCGTTGAATATATTAGCATGGAATAATAAGATAGGA\n+CTTCGGAACTATTTTGTTGGTTTGCGTTACGAAGTAATGATTAATAGGGACAGTTGGGGGTATTCGTATTTCATTGTCAG\n+AGGTGAAATTCTTGGATTTCTGAAAGACGAACTACTGCGAAAGCATTTACCAAGGATGTTTTCA\n+>a9d668eae33f9fd4484585d9fe52b05e;size=73;\n+AGCTCCAATAGCGTATACTAAAGTTGTTGCGGTTAAAAAGCTCGTAGTTGGATCTTGGAGTGTGAGTGAATGGTCGATCG\n+AAAGATTGTACTGTTCGGCACACTCTTCTCTTCGGTTGCGTGTGTAGTGCCCTTAACTGAGTGCTGCACTCGACCGGAAT\n+TTTTACCTTGAAAAAATTAGAGTGTTCAAAGCAGACCTGATTATGTCTGAATATTCGTGCATGGAATAATAAAATAAGAA\n+CTTGGTTCTATTTTATTGGTTTTCGGAACTCGAGTTAATGATTAAGAGGGACAGACGGGGGCATCCGTACTCTGCCGTTA\n+GAGGTGAAATTCTTGGATCGGCGGAAGACGCGCAACTGCGAAAGCATTTGCCAAGAATGTTTTCT\n+>da17e1a54e88120e294c7e68e350f47f;size=38;\n+AGCTCCAATAGCGTATATTAAAGTTGTTGCAGTTAAAAAGCTCGTAGTTGGATTTCTGGGGGGCGCAGATTGTCCGCAGA\n+CGCGTGTGCAGATGCGCCCTTTCATCCTTCTGTTAACGTCTCTTGACATTCATTTGTTGGTGGCGGGCTCAGATATTTTA\n+CCTTGAGAAAATTAGAGTGTTTCAGGCAGGCTCGCGTCGGAATACATTAGCATGGAATAATAGAATAGGACTCAGTCCTC\n+CTTTGTTGGTTTGAGGGGTCAGAGTAATGGTTAATAGGGATAGTTGGGGGCATTAGTATTTGACTGTCAGAGGTGAAATT\n+CTCGGATTTGTTAAAGACTAACTTATGCGAAAGCATTTGCCAAGGATGTTTTCA\n+>efbd11c972faa734253f779fc4eb2a64;size=70;\n+AGCTCCAATAGCGTATATTAAAGTTGTTGTGGTTAAAAAGCTCGTAGTTGGATCTCAACAGCCTTGAAGCGGTTAACTTT\n+GTAGTTTTACTGCTTTGTAGGCTGTGCTTTTGCTGGAGGTTTAGGGGTGCTCTTGATCGAGTGTCTCTGGATGCCAGCAG\n+GTTTACTTTGAAAAAATTAGAGTGCTCAAAGCAGGCTAAAATGCCTGAATATTCGTGCATGGAATAATAGAATAGGATGT\n+CGATCCTATTTTGTTGGTTTTCGGGACTCGACATAATGATAAATAGGGACAGTCGGGGGCATTTGTATTCAAACGACAGA\n+GGTGAAATTCTTGGACCGTTTGAAGACAAACTACTGCGAAAGCATTTGCCAAGAATGTTTTCA\n+>aecd442213d89e3f43949aee5040a3ed;size=50;\n+AGCTCCAATAGCGTATATTAAAGTTGTTGCAGTTAAAAAGCTCGTAGTTGGACCTCGGAGCAGGTTGATTGGTCCGTCCT\n+GAAGGATGCTGTACTGATCGGTCTGCTCTTCTTCGCGAAGACTCCGTGTGCCCTTAACTGGGTGGGCGAAGGATTCGCGA\n+CGTTTACTTTGAAAAAATTAGAGTGTTCAAAGCAGGCAATCGCTTGGATATCTCAGCATGGAATAATAGAATAGGACTTT\n+GGTCTTATTTTGTTGGTTTCCGAGACCGAAGTAATGATTAATAGGGACAGTTGGGGGCATTCGTATTTCATTGTCAGAGG\n+TGAAATTCTTGGATTTATGAAAGACGAACTACTGCGAAAGCATTTGCCAAGGATGTTTTCA\n+>ea64ae1d6dddc2146105a882229c81bb;size=58;\n+AGCTCCAATAGCGTATATTAAAGTTGTTGCGGTTAAAAAGCTCGTAGTTGGATCTCGGCGGGCAGGGGGTGGTTCGCTCT\n+TCAGCGCTACTGCCCCGCTTTGCCCGTGTGATTGGCGGAGGTTTCGGGGTGCTCTTCGTTGAGTGACTCGGAGCGCCGTC\n+AGGTTTACTTTGAAAAAATTAGAGTGCTCAAAGCAGGCTTTTCACGCTTGAATATTCGTGCATGGAATAATGGAATAGGA\n+ACTCGTTTCTATTTTGTTGGTTTTCGGAAATCGAGTTAATGATTAACAGGGACAATTGGGGGCATTAGTATTCAGACGAC\n+AGAGGTGAAATTCTTGGACCGTCTGAAGACTGACTACTGCGAAAGCATTTGCCAAGAGTGTTTTCA\n+>26d2046e1a0f79450d6233ef29aab44e;size=36;\n+AGCTCCAATAG'..b'ATTCTTGGATCGCAGCAAGACGAACTAACGCGAAAGCATTTGTCAAGAATGTTTTTG\n+>8b580ba225c9ae8df06f925310b59e4e;size=1;\n+AGCTCCAATAGCGTATATTAAAGTTGTTGCAGTTAAAAAGCTCGTAGTCTGAGTCTTGGCCGGCGGTGAGCGTCCGTGGC\n+TGAATTTTTTGGTCGCGCGCATGCGATACCCGCTAGCCATTGTACTTCGGAGGAACACGGCTTGTGCTTTTCATTAAGTG\n+CTCGTGGGATTCCGATAGTTTACTTTGAGAAAAATAGAGTGTTCAAAGCAGGCGTTTTTGCCGTTGAATACATTAGCATG\n+GGATAATGGAATAGGACATTGGTTCTATTTTGTTGGTTTACGGACCGATGTAATGATTAATAGGAACAGTTGGGGACATT\n+TATATTCCATGGCTAGAGGTGAAATTCTTGGATTCATGGAAGATAAACTATTGCGAAAGCATTTGTCAAAGATGTTTTCA\n+>8e9a6185e05151042cc0beaadb77eec0;size=1;\n+AGCTCCGGTAGCGTATATTAAAGTTGTTGCAGTTAAAAAGCTCGTAGTTGGATTTCTGGCATTGCTTTTCAGCTAACCTG\n+CTCGCTAGTCGAGTTTGTGTTTGGTCTGAAGCTGCCATCCTTCCAGAGACCTTGTCATACCCTTCATTGGGCCGTGATAG\n+TGATCTGGAACTTTTACTTTGAAAAAATTAGAGTGTTCAAAGCAGGCGATCTCGCTGTGAATACATTAGCATGGAATAAT\n+AATTTAGGACTTCTGTTCCTATTTTGTTGGTTCTAGGACTGAAGTAATGATTGATAGGGATAGTTGGGGGTGCTCGTATT\n+GAATGGCCAGAGGTGAAATTCTTGGATTCATTCAAGACGAACTTATGCGAAAGCATTCACCAAGGATGTCTTCT\n+>a23d5d75d02581e3115e23a6a2fe031b;size=1;\n+AGCTCCGCCAGTGTATATCTATGCTGCTGCGGTTAAAAAGCTCGTAGTTGGATCTGCGTGCTAGAGACTGGTCCACCTAT\n+GGGTGTGCACTGGATCTCAGCACTGAATCGTTGGTTTTCTCTTTATGCCTTTAACCGGGTGTACTGAGTGACTAACATGT\n+TTACTTTGAAAAAATTAGAGTGCTTAAAACAAGCGATTTGCTTGAATATTCGTGCATGGAATAATAGAATAGGACCTTGG\n+TTCTATTTTGTTGGTTTTCGGAACACAAGGTAATGATTAAGAGGGACAGACGGGGGCATTCATATTTCGACGTTAGAGGT\n+GAAATTCTTGGATCGTCGAAAGATGCACTACTGCGAAAGCATTTGCCAAGAATGTTTTCA\n+>a9a1fbfca4ade41ce328b07594f11688;size=1;\n+AGCTCCAATAGCGTATATTAAAGTTGTTGCGGTTAAAAAGCTCGTAGTTGGATTTCTGTTGAGGACAGCCGGTCCGCACT\n+ATGTGCGTGTATCTGGTTTGGCCTTGGCATCCTCTTGAGGAACGTTTCTGCGCTTAATTGCGTGGAGCGGTATTCAAGAC\n+TTTTACTTTGAGGAAATTAGAGTGTTCACGGCAGGCAAGCGCCTTGAATACATTAGCATGGAATGATAATATAGGATCTT\n+GGTTCTATTTTGTTGGTTTCTAGGGCTAAGGTAATGATTAATAGGGATAATTGGGGGCATTTGTATTAACGCGTCAGAGG\n+TGGAATTCTTGGATTGCGTTACGACAAACTACTGCGAAAGCATTTGCCAAGGATGTTTTCA\n+>aa026d2676cecd33e4a002dbb455ada8;size=1;\n+AGCTCCAATAGCGTATATTAAAGTTGTTGTGGTTAAAAAGCTCGTAGTTGGATCTCGGCGGACTGAGGGCGGTTTGCTTG\n+CTAGTATTACTGCCCTATAGTCCGTAGTTTTGCCAGAGGTTTCGGGTGCTCTTAATCGAGTGTCCCGGGATGCTGGCAGG\n+TTTACTTTGAAAAAAATTAGAGTGCTCAAAGCAGGCTATTACGCCTGAATATTCGTGCATGGAATAATAGAATAGGAAGT\n+CGTTTCTATTTTGTTGGTTTTTCGGAAATCGACTTAATGATTAATAGGGACAGTCGGGGGGCATTTGTATTCAAACGACA\n+GAGGTGAAATTCTTGGACCGTTTGAAGACAAACTACTGCGAAAGCATTTGCCAAGAATGTTTTCA\n+>b0f7bb5e2512ce1b8140fd67d40f0ca2;size=1;\n+AGCTCCAGTAGCGTATATTAAAGTTGTTGCAGTTAAAAAGCTCGTAGTTGGATTTCTGATATTACGCCCTAGTCTGCCGC\n+AAGTTGTGGTTTGTGCTGGTGTGCGTTTATCTTCCTTCTAGAAAGGCTTGTGGCGTCTTTGTGCGTCCACTTGTTCGATC\n+TAGATCTTTTACTTTGAATAAATTAGAGTGTTCAAAGCAGGCAATCGCTGTGAATACATTAGCATGGAATAATAATATAG\n+GACTTCGATTCTATTTTGTTGGTTTTCAGAACGAAGTAATGATTGATAGGGATAGTTGGGGGTGCTAGTATTGGCCGGCT\n+AGAGGTGAAATTCGTATTCGGCTAAGACTAACTTATGCGAAAGCATTCACCAAGGATGTCTTCT\n+>bdaad40d1a72de52eebf25010f5b300f;size=1;\n+AGCTCCAATAGCGTATATTAAAGTTGTTGCGGTTAAAAAGCTCGTAGTTGGATTTCTGCTGAGGATGACCGGTCCGCCCA\n+CTGGGTGAGTATCTGGCTCAGCCTTGGCATCTTCCTGAAGAACGTATCTGCACTTGACTGTGTGGTTCGGTATTTAGGAC\n+ATTTACTTTGAGGAAATTAGAGTGTTTCAAGCAAGCGTACGCCTTGAATACATTAGCATGGAATAATAAGATAGGACCTC\n+AGTCCTATTTTGTTGGTTTCTAGAGCTGAGGTAATGATTGATAGGGATAGTTGGGGGCATTCGTATTTAACTGTCAGAGG\n+TGAAATTCTTGGATTTGTTAAAGACGGACTACTGCGAAAGCATTTGCCAAGGATGTTTTCA\n+>c72b7875fe56dca4f7d9c24360650a25;size=1;\n+AGCTCTAATAGCGTATATTAATGTTGTTGCGGTTAAAAAGCTCGTGGTTGAAAGTGAAGGGTAAAACTGGATCTGGGGAA\n+ACCCATTTGCAGTTATTAGCGCGTTTTAAGGTATTCGGTTTACTTGACTTAATTGTCAAATAAGCTTAACGGATGCCTTG\n+TAGCTACTCTGATAAAATCAGAGTGCTTAAAACAAGCCTTTAAGCTTGTATATTTGTGCATAGTATAGCAAAATATGACC\n+TAAGCTAATAAAGATGGTGATTAGCCGTGGTAATGATTAAAAGGGATTGTCGGAGGCATTTGTATTTGAAAGTGAGAGGT\n+GAAATTCTATGATCTTTCAAAGACAAACTAGCGCGAAAGCATTTGCCAAGTATGTTTTCA\n+>c8403bc529537d14794709f99640ac8f;size=1;\n+AGCTCCAATAGCGTATATTAAAGTTGTTGCAGTTAAAAAGCTCGTAGTTGGACCTCGGAGCAGGTTGATTGGTCCGTCCT\n+GAAGGATGCTGTACTGATCGGTCTGCTCTTCTTCGCGAAGACTCCGTGTGCCCTTAACTGGGTGGGCGAAGGATTCGCGA\n+CGTTTACTTGAAAAAATTGAGTGTTCAAAGCAGGCAATCGCTTGGATATCTCAGCATGGAATAATAGAATAGGACTTTGG\n+TCTTATTTTGTTGGTTTCCGAGACCGAAGTAATGATTAATAGGGACAGTTGGGGGCATTCGTATTTCATTGTCAGAGGTG\n+AAATTCTTGGATTTATGAAAGACGAACTACTGCGAAAGCATTTGCCAAGGATGTTTTCA\n'
b
diff -r fae6527990af -r 8c4e2933a17a test-data/clustering_centroids_result4.fasta
--- /dev/null Thu Jan 01 00:00:00 1970 +0000
+++ b/test-data/clustering_centroids_result4.fasta Wed Aug 26 13:34:22 2015 -0400
b
b'@@ -0,0 +1,7871 @@\n+>b235271fbc8a6c9d990037857189ee9a;size=94;\n+AGCTCCAATAGCGTATATTAAAGTTGTTGCAGTTAAAAAGCTCGTAGTTGGATTTCTGGTGCATTCCACTGGCCTATTGG\n+TTAACTCCAACTTGGCTCATTTGGAATACGCCATCTTTAGGCAGACCCGTCGTGGCATTAGGTTGTCGTGATGGTTACGC\n+CTATCGTTTACTGTGAAGAAATTAGGGTGTTCAAAGCAGGCTTATGCCATGAATACGTTAGCATGGAATAATGAGATAGG\n+ATTTCGGTACTATTTTGTTGGTTTGTGTACGGAAATAATGATTAACAGGAACAGTGTTGTGGGTATTCGTATTTCGTTGT\n+CAGAGGTGAAATTCTTGGATTTACGAAAGACGAACGACTGCGAAAGCATTTACCAAGGATGTTTTCA\n+>7e02ae2e1e404d4e7c6035a6e374d29d;size=117;\n+AGCTCCAATAGCGTATACTAATGTTGTTGCAGTTAAAAAGCTCGTAGTCGGATTTCAGTAGGCTCAGTTAAGTCTCTTCT\n+ATTGAGTTCTTTATGGGCCTGCTTCTTTGACAGAAACTTCTATGTTATTCATTTAGCGTGGGTAGCGACTGTCTCTTTTA\n+CTTTGAGAAAATTAGAGTGTTCAAAGCAGGTATTCGCCTGAATATTACTCTTGGAATAATGCTATAAGACTTTGGTTCTA\n+ATGTATTGGTGATTGGGACCAGAGTAATGATTGATAGGGACGGTTGGGGTCTTACGTACTGCAAAGCGAGAGGTGAAATT\n+CTTGGACCTTTGTATGACGAACAACTGCGAAAGCATTGGACTAGGACGTTCCCG\n+>39392bbb9626a64e6663c05b70293e7c;size=118;\n+AGCTCCAATAGCGTATATTAAAGTTGTTGTGGTTAAAAAGCTCGTAGTTGGATCTCGGCGGACTGAGGGCGGTTTGCTTG\n+CTAGTATTACTGCCCTATAGTCCGTAGTTTTGCCAGAGGTTTCGGGGTGCTCTTAATCGAGTGTCCCGGGATGCTGGCAG\n+GTTTACTTTGAAAAAATTAGAGTGCTCAAAGCAGGCTATTACGCCTGAATATTCGTGCATGGAATAATAGAATAGGAAGT\n+CGTTTCTATTTTGTTGGTTTTCGGAAATCGACTTAATGATTAATAGGGACAGTCGGGGGCATTTGTATTCAAACGACAGA\n+GGTGAAATTCTTGGACCGTTTGAAGACAAACTACTGCGAAAGCATTTGCCAAGAATGTTTTCA\n+>b970fcbdd71ad2a333f702c7ecfe7114;size=64;\n+AGCTCCAATAGCGTATATTAAAGTTGTTGCAGTTAAAAAGCTCGTAGTTGGATTTCTGGCAGGAGCGACCGGTCACACAC\n+TCTGTGCGTGAACTTGTGTTGTCTCTGGCCATCCTTGGGGAGATCCTGTTTGGCATTAAGTTGTCGGGCAGGGGATACCC\n+ATCGTTTACTGTGAAAAAATTAGAGTGTTTAAAGCAGGCTTATGCCGTTGAATATATTAGCATGGAATAATAAGATAGGA\n+CTTCGGAACTATTTTGTTGGTTTGCGTTACGAAGTAATGATTAATAGGGACAGTTGGGGGTATTCGTATTTCATTGTCAG\n+AGGTGAAATTCTTGGATTTCTGAAAGACGAACTACTGCGAAAGCATTTACCAAGGATGTTTTCA\n+>a9d668eae33f9fd4484585d9fe52b05e;size=78;\n+AGCTCCAATAGCGTATACTAAAGTTGTTGCGGTTAAAAAGCTCGTAGTTGGATCTTGGAGTGTGAGTGAATGGTCGATCG\n+AAAGATTGTACTGTTCGGCACACTCTTCTCTTCGGTTGCGTGTGTAGTGCCCTTAACTGAGTGCTGCACTCGACCGGAAT\n+TTTTACCTTGAAAAAATTAGAGTGTTCAAAGCAGACCTGATTATGTCTGAATATTCGTGCATGGAATAATAAAATAAGAA\n+CTTGGTTCTATTTTATTGGTTTTCGGAACTCGAGTTAATGATTAAGAGGGACAGACGGGGGCATCCGTACTCTGCCGTTA\n+GAGGTGAAATTCTTGGATCGGCGGAAGACGCGCAACTGCGAAAGCATTTGCCAAGAATGTTTTCT\n+>da17e1a54e88120e294c7e68e350f47f;size=38;\n+AGCTCCAATAGCGTATATTAAAGTTGTTGCAGTTAAAAAGCTCGTAGTTGGATTTCTGGGGGGCGCAGATTGTCCGCAGA\n+CGCGTGTGCAGATGCGCCCTTTCATCCTTCTGTTAACGTCTCTTGACATTCATTTGTTGGTGGCGGGCTCAGATATTTTA\n+CCTTGAGAAAATTAGAGTGTTTCAGGCAGGCTCGCGTCGGAATACATTAGCATGGAATAATAGAATAGGACTCAGTCCTC\n+CTTTGTTGGTTTGAGGGGTCAGAGTAATGGTTAATAGGGATAGTTGGGGGCATTAGTATTTGACTGTCAGAGGTGAAATT\n+CTCGGATTTGTTAAAGACTAACTTATGCGAAAGCATTTGCCAAGGATGTTTTCA\n+>efbd11c972faa734253f779fc4eb2a64;size=61;\n+AGCTCCAATAGCGTATATTAAAGTTGTTGTGGTTAAAAAGCTCGTAGTTGGATCTCAACAGCCTTGAAGCGGTTAACTTT\n+GTAGTTTTACTGCTTTGTAGGCTGTGCTTTTGCTGGAGGTTTAGGGGTGCTCTTGATCGAGTGTCTCTGGATGCCAGCAG\n+GTTTACTTTGAAAAAATTAGAGTGCTCAAAGCAGGCTAAAATGCCTGAATATTCGTGCATGGAATAATAGAATAGGATGT\n+CGATCCTATTTTGTTGGTTTTCGGGACTCGACATAATGATAAATAGGGACAGTCGGGGGCATTTGTATTCAAACGACAGA\n+GGTGAAATTCTTGGACCGTTTGAAGACAAACTACTGCGAAAGCATTTGCCAAGAATGTTTTCA\n+>aecd442213d89e3f43949aee5040a3ed;size=55;\n+AGCTCCAATAGCGTATATTAAAGTTGTTGCAGTTAAAAAGCTCGTAGTTGGACCTCGGAGCAGGTTGATTGGTCCGTCCT\n+GAAGGATGCTGTACTGATCGGTCTGCTCTTCTTCGCGAAGACTCCGTGTGCCCTTAACTGGGTGGGCGAAGGATTCGCGA\n+CGTTTACTTTGAAAAAATTAGAGTGTTCAAAGCAGGCAATCGCTTGGATATCTCAGCATGGAATAATAGAATAGGACTTT\n+GGTCTTATTTTGTTGGTTTCCGAGACCGAAGTAATGATTAATAGGGACAGTTGGGGGCATTCGTATTTCATTGTCAGAGG\n+TGAAATTCTTGGATTTATGAAAGACGAACTACTGCGAAAGCATTTGCCAAGGATGTTTTCA\n+>ea64ae1d6dddc2146105a882229c81bb;size=62;\n+AGCTCCAATAGCGTATATTAAAGTTGTTGCGGTTAAAAAGCTCGTAGTTGGATCTCGGCGGGCAGGGGGTGGTTCGCTCT\n+TCAGCGCTACTGCCCCGCTTTGCCCGTGTGATTGGCGGAGGTTTCGGGGTGCTCTTCGTTGAGTGACTCGGAGCGCCGTC\n+AGGTTTACTTTGAAAAAATTAGAGTGCTCAAAGCAGGCTTTTCACGCTTGAATATTCGTGCATGGAATAATGGAATAGGA\n+ACTCGTTTCTATTTTGTTGGTTTTCGGAAATCGAGTTAATGATTAACAGGGACAATTGGGGGCATTAGTATTCAGACGAC\n+AGAGGTGAAATTCTTGGACCGTCTGAAGACTGACTACTGCGAAAGCATTTGCCAAGAGTGTTTTCA\n+>26d2046e1a0f79450d6233ef29aab44e;size=45;\n+AGCTCCAATA'..b'\n+GAAATTCTTGGATTTATGAAAGATGAACTTATGCGAAAGCATTTACCAAGGATGTTTTCA\n+>829a92af0a7cb2a6faf53a31f74ac32e;size=1;\n+AGCTCCAATAGCGTATATTAAAGTTGTTGCAGTTAAAAAGCTCGTAGTTGGATTTCTGGCCGGGCACCGATGTCCGCTGA\n+TCGCGTGCGCAGAGGTGCCCCGCCATCCTTCTGTTAACTCAGCCACTGGATTTACTTCCGGGTTGAGGGCTCAGATATTT\n+TACCTTGAGAAAATTAGAGTGTTTCAGGCAGGCTTGCGCCGGAATACATTAGCATGGAATAATGGAATAGGACTTCCGCC\n+TCTTCTGTTGGTCTGAGGGGTGAAAGTAATGATTAATAGGGATAGTTGGGGGCATTAGTACTTAACTGTCAGAGGTGAAA\n+TTCTCGGATTAGTTAAAGACTAACTTATGCGAAAGCATTTGCCAAGGATGTTTTCA\n+>85a816fc48b95e011c25738668ff92f5;size=1;\n+AGCTCCAATAGCGTATATTAAAGTTGTTGCGGTTAAAAAGCTCGTAGTTGGATTTCTGTGGTAGGCAGCCGGTCCACACT\n+ATGTGTGAGTATCTGGTTCGGCTACTGCATCCTCCTGAGGAACGTTGGTGCGCTTCACTGCGTGGCACGGTATTCAGGAC\n+TTTTACTTTGAGGAAATTAGAGTGTTCACGGCAGGCGTTTGCCCTGAATATATTAGCATGGAATAATGATATAGGATCCA\n+CGTCCTATTTTGTTGGTTTCTAGGACGAGGATAATGATTAATAGGGATAATTGGGGGCATTCGTATTAACACGTCAGAGG\n+TGGAATTCTTGGATTGTGTTACGACGAACTACTGCGAAAGCATTTGCCAAGGATGTTTTCA\n+>88ee2d113b38cac2a65f4b8fdefc85e6;size=1;\n+AGCCTTCACAAGCATATACAAATGCTGTTGCGTTTAAAAAGCTCGTAGTTGAATTTGTTGTGTACTGCTCTAAAATCATA\n+CAAAATTGTATGTAAGAGTAAGTAACCATCGTGTTGTCGAGTTTACTTGCGCTTAACTGTGATGAGTTTTTGAGATGTAC\n+GCTTTACTTTGAGAAAATTTGGGTGTTTAAAGCAGCCTTTGGGTGTGAATGCTGTAGCATGGAATAATAGAAAATGACTG\n+TATACCCGTTTGGTTGGTCTTGGGTTATGTAGTAATGATTGAAAAGGACAGGCGGGGACATTCGAATTGTTGCGTTAGAG\n+GTGAAATTCTTGGATCGCAGCAAGACGAACTAACGCGAAAGCATTTGTCAAGAATGTTTTTG\n+>8b580ba225c9ae8df06f925310b59e4e;size=1;\n+AGCTCCAATAGCGTATATTAAAGTTGTTGCAGTTAAAAAGCTCGTAGTCTGAGTCTTGGCCGGCGGTGAGCGTCCGTGGC\n+TGAATTTTTTGGTCGCGCGCATGCGATACCCGCTAGCCATTGTACTTCGGAGGAACACGGCTTGTGCTTTTCATTAAGTG\n+CTCGTGGGATTCCGATAGTTTACTTTGAGAAAAATAGAGTGTTCAAAGCAGGCGTTTTTGCCGTTGAATACATTAGCATG\n+GGATAATGGAATAGGACATTGGTTCTATTTTGTTGGTTTACGGACCGATGTAATGATTAATAGGAACAGTTGGGGACATT\n+TATATTCCATGGCTAGAGGTGAAATTCTTGGATTCATGGAAGATAAACTATTGCGAAAGCATTTGTCAAAGATGTTTTCA\n+>8e9a6185e05151042cc0beaadb77eec0;size=1;\n+AGCTCCGGTAGCGTATATTAAAGTTGTTGCAGTTAAAAAGCTCGTAGTTGGATTTCTGGCATTGCTTTTCAGCTAACCTG\n+CTCGCTAGTCGAGTTTGTGTTTGGTCTGAAGCTGCCATCCTTCCAGAGACCTTGTCATACCCTTCATTGGGCCGTGATAG\n+TGATCTGGAACTTTTACTTTGAAAAAATTAGAGTGTTCAAAGCAGGCGATCTCGCTGTGAATACATTAGCATGGAATAAT\n+AATTTAGGACTTCTGTTCCTATTTTGTTGGTTCTAGGACTGAAGTAATGATTGATAGGGATAGTTGGGGGTGCTCGTATT\n+GAATGGCCAGAGGTGAAATTCTTGGATTCATTCAAGACGAACTTATGCGAAAGCATTCACCAAGGATGTCTTCT\n+>a23d5d75d02581e3115e23a6a2fe031b;size=1;\n+AGCTCCGCCAGTGTATATCTATGCTGCTGCGGTTAAAAAGCTCGTAGTTGGATCTGCGTGCTAGAGACTGGTCCACCTAT\n+GGGTGTGCACTGGATCTCAGCACTGAATCGTTGGTTTTCTCTTTATGCCTTTAACCGGGTGTACTGAGTGACTAACATGT\n+TTACTTTGAAAAAATTAGAGTGCTTAAAACAAGCGATTTGCTTGAATATTCGTGCATGGAATAATAGAATAGGACCTTGG\n+TTCTATTTTGTTGGTTTTCGGAACACAAGGTAATGATTAAGAGGGACAGACGGGGGCATTCATATTTCGACGTTAGAGGT\n+GAAATTCTTGGATCGTCGAAAGATGCACTACTGCGAAAGCATTTGCCAAGAATGTTTTCA\n+>a9a1fbfca4ade41ce328b07594f11688;size=1;\n+AGCTCCAATAGCGTATATTAAAGTTGTTGCGGTTAAAAAGCTCGTAGTTGGATTTCTGTTGAGGACAGCCGGTCCGCACT\n+ATGTGCGTGTATCTGGTTTGGCCTTGGCATCCTCTTGAGGAACGTTTCTGCGCTTAATTGCGTGGAGCGGTATTCAAGAC\n+TTTTACTTTGAGGAAATTAGAGTGTTCACGGCAGGCAAGCGCCTTGAATACATTAGCATGGAATGATAATATAGGATCTT\n+GGTTCTATTTTGTTGGTTTCTAGGGCTAAGGTAATGATTAATAGGGATAATTGGGGGCATTTGTATTAACGCGTCAGAGG\n+TGGAATTCTTGGATTGCGTTACGACAAACTACTGCGAAAGCATTTGCCAAGGATGTTTTCA\n+>b0f7bb5e2512ce1b8140fd67d40f0ca2;size=1;\n+AGCTCCAGTAGCGTATATTAAAGTTGTTGCAGTTAAAAAGCTCGTAGTTGGATTTCTGATATTACGCCCTAGTCTGCCGC\n+AAGTTGTGGTTTGTGCTGGTGTGCGTTTATCTTCCTTCTAGAAAGGCTTGTGGCGTCTTTGTGCGTCCACTTGTTCGATC\n+TAGATCTTTTACTTTGAATAAATTAGAGTGTTCAAAGCAGGCAATCGCTGTGAATACATTAGCATGGAATAATAATATAG\n+GACTTCGATTCTATTTTGTTGGTTTTCAGAACGAAGTAATGATTGATAGGGATAGTTGGGGGTGCTAGTATTGGCCGGCT\n+AGAGGTGAAATTCGTATTCGGCTAAGACTAACTTATGCGAAAGCATTCACCAAGGATGTCTTCT\n+>bdaad40d1a72de52eebf25010f5b300f;size=1;\n+AGCTCCAATAGCGTATATTAAAGTTGTTGCGGTTAAAAAGCTCGTAGTTGGATTTCTGCTGAGGATGACCGGTCCGCCCA\n+CTGGGTGAGTATCTGGCTCAGCCTTGGCATCTTCCTGAAGAACGTATCTGCACTTGACTGTGTGGTTCGGTATTTAGGAC\n+ATTTACTTTGAGGAAATTAGAGTGTTTCAAGCAAGCGTACGCCTTGAATACATTAGCATGGAATAATAAGATAGGACCTC\n+AGTCCTATTTTGTTGGTTTCTAGAGCTGAGGTAATGATTGATAGGGATAGTTGGGGGCATTCGTATTTAACTGTCAGAGG\n+TGAAATTCTTGGATTTGTTAAAGACGGACTACTGCGAAAGCATTTGCCAAGGATGTTTTCA\n'
b
diff -r fae6527990af -r 8c4e2933a17a test-data/clustering_notmatched_result2.fasta
--- /dev/null Thu Jan 01 00:00:00 1970 +0000
+++ b/test-data/clustering_notmatched_result2.fasta Wed Aug 26 13:34:22 2015 -0400
b
b'@@ -0,0 +1,8256 @@\n+>b235271fbc8a6c9d990037857189ee9a;size=22254\n+AGCTCCAATAGCGTATATTAAAGTTGTTGCAGTTAAAAAGCTCGTAGTTGGATTTCTGGTGCATTCCACTGGCCTATTGG\n+TTAACTCCAACTTGGCTCATTTGGAATACGCCATCTTTAGGCAGACCCGTCGTGGCATTAGGTTGTCGTGATGGTTACGC\n+CTATCGTTTACTGTGAAGAAATTAGGGTGTTCAAAGCAGGCTTATGCCATGAATACGTTAGCATGGAATAATGAGATAGG\n+ATTTCGGTACTATTTTGTTGGTTTGTGTACGGAAATAATGATTAACAGGAACAGTGTTGTGGGTATTCGTATTTCGTTGT\n+CAGAGGTGAAATTCTTGGATTTACGAAAGACGAACGACTGCGAAAGCATTTACCAAGGATGTTTTCA\n+>7e02ae2e1e404d4e7c6035a6e374d29d;size=20728\n+AGCTCCAATAGCGTATACTAATGTTGTTGCAGTTAAAAAGCTCGTAGTCGGATTTCAGTAGGCTCAGTTAAGTCTCTTCT\n+ATTGAGTTCTTTATGGGCCTGCTTCTTTGACAGAAACTTCTATGTTATTCATTTAGCGTGGGTAGCGACTGTCTCTTTTA\n+CTTTGAGAAAATTAGAGTGTTCAAAGCAGGTATTCGCCTGAATATTACTCTTGGAATAATGCTATAAGACTTTGGTTCTA\n+ATGTATTGGTGATTGGGACCAGAGTAATGATTGATAGGGACGGTTGGGGTCTTACGTACTGCAAAGCGAGAGGTGAAATT\n+CTTGGACCTTTGTATGACGAACAACTGCGAAAGCATTGGACTAGGACGTTCCCG\n+>39392bbb9626a64e6663c05b70293e7c;size=11535\n+AGCTCCAATAGCGTATATTAAAGTTGTTGTGGTTAAAAAGCTCGTAGTTGGATCTCGGCGGACTGAGGGCGGTTTGCTTG\n+CTAGTATTACTGCCCTATAGTCCGTAGTTTTGCCAGAGGTTTCGGGGTGCTCTTAATCGAGTGTCCCGGGATGCTGGCAG\n+GTTTACTTTGAAAAAATTAGAGTGCTCAAAGCAGGCTATTACGCCTGAATATTCGTGCATGGAATAATAGAATAGGAAGT\n+CGTTTCTATTTTGTTGGTTTTCGGAAATCGACTTAATGATTAATAGGGACAGTCGGGGGCATTTGTATTCAAACGACAGA\n+GGTGAAATTCTTGGACCGTTTGAAGACAAACTACTGCGAAAGCATTTGCCAAGAATGTTTTCA\n+>b970fcbdd71ad2a333f702c7ecfe7114;size=10907\n+AGCTCCAATAGCGTATATTAAAGTTGTTGCAGTTAAAAAGCTCGTAGTTGGATTTCTGGCAGGAGCGACCGGTCACACAC\n+TCTGTGCGTGAACTTGTGTTGTCTCTGGCCATCCTTGGGGAGATCCTGTTTGGCATTAAGTTGTCGGGCAGGGGATACCC\n+ATCGTTTACTGTGAAAAAATTAGAGTGTTTAAAGCAGGCTTATGCCGTTGAATATATTAGCATGGAATAATAAGATAGGA\n+CTTCGGAACTATTTTGTTGGTTTGCGTTACGAAGTAATGATTAATAGGGACAGTTGGGGGTATTCGTATTTCATTGTCAG\n+AGGTGAAATTCTTGGATTTCTGAAAGACGAACTACTGCGAAAGCATTTACCAAGGATGTTTTCA\n+>a9d668eae33f9fd4484585d9fe52b05e;size=8638\n+AGCTCCAATAGCGTATACTAAAGTTGTTGCGGTTAAAAAGCTCGTAGTTGGATCTTGGAGTGTGAGTGAATGGTCGATCG\n+AAAGATTGTACTGTTCGGCACACTCTTCTCTTCGGTTGCGTGTGTAGTGCCCTTAACTGAGTGCTGCACTCGACCGGAAT\n+TTTTACCTTGAAAAAATTAGAGTGTTCAAAGCAGACCTGATTATGTCTGAATATTCGTGCATGGAATAATAAAATAAGAA\n+CTTGGTTCTATTTTATTGGTTTTCGGAACTCGAGTTAATGATTAAGAGGGACAGACGGGGGCATCCGTACTCTGCCGTTA\n+GAGGTGAAATTCTTGGATCGGCGGAAGACGCGCAACTGCGAAAGCATTTGCCAAGAATGTTTTCT\n+>da17e1a54e88120e294c7e68e350f47f;size=6062\n+AGCTCCAATAGCGTATATTAAAGTTGTTGCAGTTAAAAAGCTCGTAGTTGGATTTCTGGGGGGCGCAGATTGTCCGCAGA\n+CGCGTGTGCAGATGCGCCCTTTCATCCTTCTGTTAACGTCTCTTGACATTCATTTGTTGGTGGCGGGCTCAGATATTTTA\n+CCTTGAGAAAATTAGAGTGTTTCAGGCAGGCTCGCGTCGGAATACATTAGCATGGAATAATAGAATAGGACTCAGTCCTC\n+CTTTGTTGGTTTGAGGGGTCAGAGTAATGGTTAATAGGGATAGTTGGGGGCATTAGTATTTGACTGTCAGAGGTGAAATT\n+CTCGGATTTGTTAAAGACTAACTTATGCGAAAGCATTTGCCAAGGATGTTTTCA\n+>efbd11c972faa734253f779fc4eb2a64;size=5440\n+AGCTCCAATAGCGTATATTAAAGTTGTTGTGGTTAAAAAGCTCGTAGTTGGATCTCAACAGCCTTGAAGCGGTTAACTTT\n+GTAGTTTTACTGCTTTGTAGGCTGTGCTTTTGCTGGAGGTTTAGGGGTGCTCTTGATCGAGTGTCTCTGGATGCCAGCAG\n+GTTTACTTTGAAAAAATTAGAGTGCTCAAAGCAGGCTAAAATGCCTGAATATTCGTGCATGGAATAATAGAATAGGATGT\n+CGATCCTATTTTGTTGGTTTTCGGGACTCGACATAATGATAAATAGGGACAGTCGGGGGCATTTGTATTCAAACGACAGA\n+GGTGAAATTCTTGGACCGTTTGAAGACAAACTACTGCGAAAGCATTTGCCAAGAATGTTTTCA\n+>aecd442213d89e3f43949aee5040a3ed;size=5318\n+AGCTCCAATAGCGTATATTAAAGTTGTTGCAGTTAAAAAGCTCGTAGTTGGACCTCGGAGCAGGTTGATTGGTCCGTCCT\n+GAAGGATGCTGTACTGATCGGTCTGCTCTTCTTCGCGAAGACTCCGTGTGCCCTTAACTGGGTGGGCGAAGGATTCGCGA\n+CGTTTACTTTGAAAAAATTAGAGTGTTCAAAGCAGGCAATCGCTTGGATATCTCAGCATGGAATAATAGAATAGGACTTT\n+GGTCTTATTTTGTTGGTTTCCGAGACCGAAGTAATGATTAATAGGGACAGTTGGGGGCATTCGTATTTCATTGTCAGAGG\n+TGAAATTCTTGGATTTATGAAAGACGAACTACTGCGAAAGCATTTGCCAAGGATGTTTTCA\n+>ea64ae1d6dddc2146105a882229c81bb;size=5125\n+AGCTCCAATAGCGTATATTAAAGTTGTTGCGGTTAAAAAGCTCGTAGTTGGATCTCGGCGGGCAGGGGGTGGTTCGCTCT\n+TCAGCGCTACTGCCCCGCTTTGCCCGTGTGATTGGCGGAGGTTTCGGGGTGCTCTTCGTTGAGTGACTCGGAGCGCCGTC\n+AGGTTTACTTTGAAAAAATTAGAGTGCTCAAAGCAGGCTTTTCACGCTTGAATATTCGTGCATGGAATAATGGAATAGGA\n+ACTCGTTTCTATTTTGTTGGTTTTCGGAAATCGAGTTAATGATTAACAGGGACAATTGGGGGCATTAGTATTCAGACGAC\n+AGAGGTGAAATTCTTGGACCGTCTGAAGACTGACTACTGCGAAAGCATTTGCCAAGAGTGTTTTCA\n+>26d2046e1a0f79450d6233ef29aab44e;size=4937'..b'ATTCTTGGATCGCAGCAAGACGAACTAACGCGAAAGCATTTGTCAAGAATGTTTTTG\n+>8b580ba225c9ae8df06f925310b59e4e;size=29\n+AGCTCCAATAGCGTATATTAAAGTTGTTGCAGTTAAAAAGCTCGTAGTCTGAGTCTTGGCCGGCGGTGAGCGTCCGTGGC\n+TGAATTTTTTGGTCGCGCGCATGCGATACCCGCTAGCCATTGTACTTCGGAGGAACACGGCTTGTGCTTTTCATTAAGTG\n+CTCGTGGGATTCCGATAGTTTACTTTGAGAAAAATAGAGTGTTCAAAGCAGGCGTTTTTGCCGTTGAATACATTAGCATG\n+GGATAATGGAATAGGACATTGGTTCTATTTTGTTGGTTTACGGACCGATGTAATGATTAATAGGAACAGTTGGGGACATT\n+TATATTCCATGGCTAGAGGTGAAATTCTTGGATTCATGGAAGATAAACTATTGCGAAAGCATTTGTCAAAGATGTTTTCA\n+>8e9a6185e05151042cc0beaadb77eec0;size=29\n+AGCTCCGGTAGCGTATATTAAAGTTGTTGCAGTTAAAAAGCTCGTAGTTGGATTTCTGGCATTGCTTTTCAGCTAACCTG\n+CTCGCTAGTCGAGTTTGTGTTTGGTCTGAAGCTGCCATCCTTCCAGAGACCTTGTCATACCCTTCATTGGGCCGTGATAG\n+TGATCTGGAACTTTTACTTTGAAAAAATTAGAGTGTTCAAAGCAGGCGATCTCGCTGTGAATACATTAGCATGGAATAAT\n+AATTTAGGACTTCTGTTCCTATTTTGTTGGTTCTAGGACTGAAGTAATGATTGATAGGGATAGTTGGGGGTGCTCGTATT\n+GAATGGCCAGAGGTGAAATTCTTGGATTCATTCAAGACGAACTTATGCGAAAGCATTCACCAAGGATGTCTTCT\n+>a23d5d75d02581e3115e23a6a2fe031b;size=29\n+AGCTCCGCCAGTGTATATCTATGCTGCTGCGGTTAAAAAGCTCGTAGTTGGATCTGCGTGCTAGAGACTGGTCCACCTAT\n+GGGTGTGCACTGGATCTCAGCACTGAATCGTTGGTTTTCTCTTTATGCCTTTAACCGGGTGTACTGAGTGACTAACATGT\n+TTACTTTGAAAAAATTAGAGTGCTTAAAACAAGCGATTTGCTTGAATATTCGTGCATGGAATAATAGAATAGGACCTTGG\n+TTCTATTTTGTTGGTTTTCGGAACACAAGGTAATGATTAAGAGGGACAGACGGGGGCATTCATATTTCGACGTTAGAGGT\n+GAAATTCTTGGATCGTCGAAAGATGCACTACTGCGAAAGCATTTGCCAAGAATGTTTTCA\n+>a9a1fbfca4ade41ce328b07594f11688;size=29\n+AGCTCCAATAGCGTATATTAAAGTTGTTGCGGTTAAAAAGCTCGTAGTTGGATTTCTGTTGAGGACAGCCGGTCCGCACT\n+ATGTGCGTGTATCTGGTTTGGCCTTGGCATCCTCTTGAGGAACGTTTCTGCGCTTAATTGCGTGGAGCGGTATTCAAGAC\n+TTTTACTTTGAGGAAATTAGAGTGTTCACGGCAGGCAAGCGCCTTGAATACATTAGCATGGAATGATAATATAGGATCTT\n+GGTTCTATTTTGTTGGTTTCTAGGGCTAAGGTAATGATTAATAGGGATAATTGGGGGCATTTGTATTAACGCGTCAGAGG\n+TGGAATTCTTGGATTGCGTTACGACAAACTACTGCGAAAGCATTTGCCAAGGATGTTTTCA\n+>aa026d2676cecd33e4a002dbb455ada8;size=29\n+AGCTCCAATAGCGTATATTAAAGTTGTTGTGGTTAAAAAGCTCGTAGTTGGATCTCGGCGGACTGAGGGCGGTTTGCTTG\n+CTAGTATTACTGCCCTATAGTCCGTAGTTTTGCCAGAGGTTTCGGGTGCTCTTAATCGAGTGTCCCGGGATGCTGGCAGG\n+TTTACTTTGAAAAAAATTAGAGTGCTCAAAGCAGGCTATTACGCCTGAATATTCGTGCATGGAATAATAGAATAGGAAGT\n+CGTTTCTATTTTGTTGGTTTTTCGGAAATCGACTTAATGATTAATAGGGACAGTCGGGGGGCATTTGTATTCAAACGACA\n+GAGGTGAAATTCTTGGACCGTTTGAAGACAAACTACTGCGAAAGCATTTGCCAAGAATGTTTTCA\n+>b0f7bb5e2512ce1b8140fd67d40f0ca2;size=29\n+AGCTCCAGTAGCGTATATTAAAGTTGTTGCAGTTAAAAAGCTCGTAGTTGGATTTCTGATATTACGCCCTAGTCTGCCGC\n+AAGTTGTGGTTTGTGCTGGTGTGCGTTTATCTTCCTTCTAGAAAGGCTTGTGGCGTCTTTGTGCGTCCACTTGTTCGATC\n+TAGATCTTTTACTTTGAATAAATTAGAGTGTTCAAAGCAGGCAATCGCTGTGAATACATTAGCATGGAATAATAATATAG\n+GACTTCGATTCTATTTTGTTGGTTTTCAGAACGAAGTAATGATTGATAGGGATAGTTGGGGGTGCTAGTATTGGCCGGCT\n+AGAGGTGAAATTCGTATTCGGCTAAGACTAACTTATGCGAAAGCATTCACCAAGGATGTCTTCT\n+>bdaad40d1a72de52eebf25010f5b300f;size=29\n+AGCTCCAATAGCGTATATTAAAGTTGTTGCGGTTAAAAAGCTCGTAGTTGGATTTCTGCTGAGGATGACCGGTCCGCCCA\n+CTGGGTGAGTATCTGGCTCAGCCTTGGCATCTTCCTGAAGAACGTATCTGCACTTGACTGTGTGGTTCGGTATTTAGGAC\n+ATTTACTTTGAGGAAATTAGAGTGTTTCAAGCAAGCGTACGCCTTGAATACATTAGCATGGAATAATAAGATAGGACCTC\n+AGTCCTATTTTGTTGGTTTCTAGAGCTGAGGTAATGATTGATAGGGATAGTTGGGGGCATTCGTATTTAACTGTCAGAGG\n+TGAAATTCTTGGATTTGTTAAAGACGGACTACTGCGAAAGCATTTGCCAAGGATGTTTTCA\n+>c72b7875fe56dca4f7d9c24360650a25;size=29\n+AGCTCTAATAGCGTATATTAATGTTGTTGCGGTTAAAAAGCTCGTGGTTGAAAGTGAAGGGTAAAACTGGATCTGGGGAA\n+ACCCATTTGCAGTTATTAGCGCGTTTTAAGGTATTCGGTTTACTTGACTTAATTGTCAAATAAGCTTAACGGATGCCTTG\n+TAGCTACTCTGATAAAATCAGAGTGCTTAAAACAAGCCTTTAAGCTTGTATATTTGTGCATAGTATAGCAAAATATGACC\n+TAAGCTAATAAAGATGGTGATTAGCCGTGGTAATGATTAAAAGGGATTGTCGGAGGCATTTGTATTTGAAAGTGAGAGGT\n+GAAATTCTATGATCTTTCAAAGACAAACTAGCGCGAAAGCATTTGCCAAGTATGTTTTCA\n+>c8403bc529537d14794709f99640ac8f;size=29\n+AGCTCCAATAGCGTATATTAAAGTTGTTGCAGTTAAAAAGCTCGTAGTTGGACCTCGGAGCAGGTTGATTGGTCCGTCCT\n+GAAGGATGCTGTACTGATCGGTCTGCTCTTCTTCGCGAAGACTCCGTGTGCCCTTAACTGGGTGGGCGAAGGATTCGCGA\n+CGTTTACTTGAAAAAATTGAGTGTTCAAAGCAGGCAATCGCTTGGATATCTCAGCATGGAATAATAGAATAGGACTTTGG\n+TCTTATTTTGTTGGTTTCCGAGACCGAAGTAATGATTAATAGGGACAGTTGGGGGCATTCGTATTTCATTGTCAGAGGTG\n+AAATTCTTGGATTTATGAAAGACGAACTACTGCGAAAGCATTTGCCAAGGATGTTTTCA\n'
b
diff -r fae6527990af -r 8c4e2933a17a test-data/clustering_uc_result3.uc
--- /dev/null Thu Jan 01 00:00:00 1970 +0000
+++ b/test-data/clustering_uc_result3.uc Wed Aug 26 13:34:22 2015 -0400
b
b'@@ -0,0 +1,6374 @@\n+S\t0\t387\t*\t*\t*\t*\t*\tb235271fbc8a6c9d990037857189ee9a;size=22254\t*\n+S\t1\t374\t*\t*\t*\t*\t*\t7e02ae2e1e404d4e7c6035a6e374d29d;size=20728\t*\n+S\t2\t383\t*\t*\t*\t*\t*\t39392bbb9626a64e6663c05b70293e7c;size=11535\t*\n+S\t3\t384\t*\t*\t*\t*\t*\tb970fcbdd71ad2a333f702c7ecfe7114;size=10907\t*\n+S\t4\t385\t*\t*\t*\t*\t*\ta9d668eae33f9fd4484585d9fe52b05e;size=8638\t*\n+S\t5\t374\t*\t*\t*\t*\t*\tda17e1a54e88120e294c7e68e350f47f;size=6062\t*\n+S\t6\t383\t*\t*\t*\t*\t*\tefbd11c972faa734253f779fc4eb2a64;size=5440\t*\n+S\t7\t381\t*\t*\t*\t*\t*\taecd442213d89e3f43949aee5040a3ed;size=5318\t*\n+S\t8\t386\t*\t*\t*\t*\t*\tea64ae1d6dddc2146105a882229c81bb;size=5125\t*\n+S\t9\t381\t*\t*\t*\t*\t*\t26d2046e1a0f79450d6233ef29aab44e;size=4937\t*\n+S\t10\t375\t*\t*\t*\t*\t*\ta1fe4d26985b4fd62b7bef1949d111f4;size=4547\t*\n+S\t11\t384\t*\t*\t*\t*\t*\t96ba76b9e5bd26447d84901071634c23;size=4384\t*\n+S\t12\t382\t*\t*\t*\t*\t*\tde935b7625d937ebe744b3125cfd1dfc;size=3868\t*\n+S\t13\t376\t*\t*\t*\t*\t*\t7e3fa204e95db351839d719215fba508;size=3689\t*\n+S\t14\t381\t*\t*\t*\t*\t*\t78951b2d4ca30531381672a30be0978a;size=3655\t*\n+H\t0\t388\t99.7\t+\t0\t0\t319MD68M\tb7ffa8f46cb16542d89dc5293ade2098;size=3629\tb235271fbc8a6c9d990037857189ee9a;size=22254\n+S\t15\t382\t*\t*\t*\t*\t*\t721460e46e8804111d74cb730340492f;size=3538\t*\n+H\t1\t375\t99.7\t+\t0\t0\t34MD340M\taff14fabb2213686a8bc18bf98edd8fd;size=3501\t7e02ae2e1e404d4e7c6035a6e374d29d;size=20728\n+S\t16\t385\t*\t*\t*\t*\t*\teec3955a38ab32f15ee315b4c26f9af6;size=3440\t*\n+H\t6\t383\t99.7\t+\t0\t0\t383M\t5bf3b429509ca7b31bbce32fa4d77e33;size=3298\tefbd11c972faa734253f779fc4eb2a64;size=5440\n+S\t17\t383\t*\t*\t*\t*\t*\t4edf10a5e3aa4bd4ed28b1694727a060;size=3078\t*\n+S\t18\t369\t*\t*\t*\t*\t*\t57529eb32f16fd6b0ca316c7d376501f;size=2965\t*\n+S\t19\t386\t*\t*\t*\t*\t*\tbe32a04d8af28ab822f66005c721cc1a;size=2849\t*\n+S\t20\t381\t*\t*\t*\t*\t*\tfd9c8703206ef0b3c0fcd3846f26fb50;size=2770\t*\n+S\t21\t386\t*\t*\t*\t*\t*\t0af8e08a076e300ff906097a4030b9bb;size=2733\t*\n+H\t14\t381\t99.5\t+\t0\t0\t381M\t8dbb6f1dafe133984c7c7d899a730e1c;size=2722\t78951b2d4ca30531381672a30be0978a;size=3655\n+S\t22\t381\t*\t*\t*\t*\t*\ta3b19115a503e03c27f9577b3e9c673e;size=2708\t*\n+H\t17\t383\t99.7\t+\t0\t0\t383M\t397a9be0ac23a54c504ad0cd4f86ddb9;size=2689\t4edf10a5e3aa4bd4ed28b1694727a060;size=3078\n+H\t1\t373\t99.7\t+\t0\t0\t155MI218M\tfef76769bd8d3a969b567d6d037a9594;size=2592\t7e02ae2e1e404d4e7c6035a6e374d29d;size=20728\n+S\t23\t384\t*\t*\t*\t*\t*\t86bdf526074a459b826e641cd6131868;size=2562\t*\n+S\t24\t382\t*\t*\t*\t*\t*\t32a6455756704a5ceca00b9f7beefc0c;size=2516\t*\n+S\t25\t383\t*\t*\t*\t*\t*\t7228f266f04a46bfb85ea74e73546004;size=2508\t*\n+S\t26\t381\t*\t*\t*\t*\t*\t38a1e68923981030900a4744924d4694;size=2491\t*\n+S\t27\t385\t*\t*\t*\t*\t*\t132ced0592418845eee2359a1359672f;size=2452\t*\n+S\t28\t381\t*\t*\t*\t*\t*\t809c29f61330f3ce6c7939cb98b7daa5;size=2440\t*\n+S\t29\t381\t*\t*\t*\t*\t*\t3a6ac67b4b0f35b2c4c7537fef7b8c15;size=2326\t*\n+H\t4\t384\t99.5\t+\t0\t0\t384MI\tdcb878b5e3696aaa3fded2a9f7dea7cd;size=2312\ta9d668eae33f9fd4484585d9fe52b05e;size=8638\n+H\t2\t384\t99.7\t+\t0\t0\t170MD213M\t2cb0faa31a23b37e7a40aa1d4ea12534;size=2194\t39392bbb9626a64e6663c05b70293e7c;size=11535\n+S\t30\t381\t*\t*\t*\t*\t*\t653897d9ba97be73ecdabcf6efed61ca;size=2163\t*\n+S\t31\t386\t*\t*\t*\t*\t*\tbbab8ae32b8c7afaef852b438e6dc70d;size=2148\t*\n+H\t1\t375\t99.7\t+\t0\t0\t285MD89M\td56b9d19ecd14c245a89c7ac5f10e437;size=2070\t7e02ae2e1e404d4e7c6035a6e374d29d;size=20728\n+S\t32\t374\t*\t*\t*\t*\t*\tdb38f1b47bbe57241030f94f3cab84cd;size=2069\t*\n+S\t33\t308\t*\t*\t*\t*\t*\tb4e1bd5eac322b803425414f19938cd6;size=1992\t*\n+H\t3\t383\t99.7\t+\t0\t0\t295MI88M\t585a7f513b67529b955093b393a269bc;size=1982\tb970fcbdd71ad2a333f702c7ecfe7114;size=10907\n+S\t34\t381\t*\t*\t*\t*\t*\t8cf1de80f6c4fb75463e4ec3ee0e36c4;size=1937\t*\n+S\t35\t378\t*\t*\t*\t*\t*\t4084bd8293b08a58e03158d6668952f9;size=1934\t*\n+H\t8\t387\t99.7\t+\t0\t0\t172MD214M\t91347cd2230896780f6a8d8ec7a3eb63;size=1899\tea64ae1d6dddc2146105a882229c81bb;size=5125\n+H\t2\t382\t99.7\t+\t0\t0\t123MI259M\t156b1f0da0c6d2b99c93ca960ad238e1;size=1865\t39392bbb9626a64e6663c05b70293e7c;size=11535\n+S\t36\t386\t*\t*\t*\t*\t*\t99ba81c88f63f83daf290add3918d38b;size=1787\t*\n+S\t37\t374\t*\t*\t*\t*\t*\t40db14c7dc6215a64051a172a8b0fec1;size=1775\t*\n+S\t38\t380\t*\t*\t*\t*\t*\t4fd9e532b34b278047b4a588cc98708a;size=1762\t*\n+S\t39\t382\t*\t*\t*\t*\t*\t750451de425698bad38d5e1c872b2f12;size=1660\t*\n+H\t6\t384'..b'81f68498a73523d1711;size=30\t*\n+C\t1312\t1\t*\t*\t*\t*\t*\t42601e1912a50fef89df8280559ab035;size=30\t*\n+C\t1313\t1\t*\t*\t*\t*\t*\t4585948ca8ce056aafd2a7e42b06ea32;size=30\t*\n+C\t1314\t1\t*\t*\t*\t*\t*\t45b6b0d15ad3b48fdad06d2e0bc9c42a;size=30\t*\n+C\t1315\t1\t*\t*\t*\t*\t*\t48a4508cde004abf97c5c437a32b890b;size=30\t*\n+C\t1316\t1\t*\t*\t*\t*\t*\t52360d4cb2376a3d2a5ed6034728a6fc;size=30\t*\n+C\t1317\t1\t*\t*\t*\t*\t*\t53f76ffe69cbb269ff7a820f46bc8756;size=30\t*\n+C\t1318\t1\t*\t*\t*\t*\t*\t5cd7c6ac35c0f87dcb8c180ec992d3bf;size=30\t*\n+C\t1319\t1\t*\t*\t*\t*\t*\t6028380ec9df2fb137312651bb388e47;size=30\t*\n+C\t1320\t1\t*\t*\t*\t*\t*\t6148a94e658d1196c674f24c94298edd;size=30\t*\n+C\t1321\t1\t*\t*\t*\t*\t*\t6f6743b938ec66f62a6de93b522fb376;size=30\t*\n+C\t1322\t1\t*\t*\t*\t*\t*\t71d0bf30d0c6d9f4d00240044594ce0e;size=30\t*\n+C\t1323\t1\t*\t*\t*\t*\t*\t71db1bb7502a93243aeda2f6fa031e0c;size=30\t*\n+C\t1324\t1\t*\t*\t*\t*\t*\t741e6cd748029a12afb76b918c6d77ce;size=30\t*\n+C\t1325\t1\t*\t*\t*\t*\t*\t7b7e7fff6405e22ad292c692fdc1ab9a;size=30\t*\n+C\t1326\t1\t*\t*\t*\t*\t*\t8073525f69e70ecf9c0b01d4ead746c2;size=30\t*\n+C\t1327\t1\t*\t*\t*\t*\t*\t81be08d11a962aa24c5b379f0afa1a4a;size=30\t*\n+C\t1328\t1\t*\t*\t*\t*\t*\t84c75f81d6462f4f6bdfc1b80cc2863b;size=30\t*\n+C\t1329\t1\t*\t*\t*\t*\t*\t85b0b74ff08f182913b6b2e2b828ab36;size=30\t*\n+C\t1330\t1\t*\t*\t*\t*\t*\t8fbc557181558c713d540dd86ade1cf3;size=30\t*\n+C\t1331\t1\t*\t*\t*\t*\t*\t96c93f6f9819a680fc494c9c0dcbe418;size=30\t*\n+C\t1332\t1\t*\t*\t*\t*\t*\t9925797c99b3b812e7179b59b113490f;size=30\t*\n+C\t1333\t1\t*\t*\t*\t*\t*\t9fd94ba744e5447dd917214d5f333399;size=30\t*\n+C\t1334\t1\t*\t*\t*\t*\t*\ta062133fa6e7c89c011019c2f94fb594;size=30\t*\n+C\t1335\t1\t*\t*\t*\t*\t*\ta779123e689e4c9585c5ef603d765405;size=30\t*\n+C\t1336\t1\t*\t*\t*\t*\t*\tb09df1d089c98349eec50ee5fb192f36;size=30\t*\n+C\t1337\t1\t*\t*\t*\t*\t*\tb84a4c94f511bcd643425530fac83d53;size=30\t*\n+C\t1338\t1\t*\t*\t*\t*\t*\tbd6ec630887dbbad937d8caf082d5b6f;size=30\t*\n+C\t1339\t1\t*\t*\t*\t*\t*\tc27b4d38781ee248676d51f5dc0dd01e;size=30\t*\n+C\t1340\t1\t*\t*\t*\t*\t*\tc9610c2a2222757bd7eddf582979539b;size=30\t*\n+C\t1341\t1\t*\t*\t*\t*\t*\tc9e8d206463c2c1b657e79f4935dc7f7;size=30\t*\n+C\t1342\t1\t*\t*\t*\t*\t*\td26ce0d3dc1674f9f61dac770645b957;size=30\t*\n+C\t1343\t1\t*\t*\t*\t*\t*\td9dd80f66077bd29d1569180753d1ea6;size=30\t*\n+C\t1344\t1\t*\t*\t*\t*\t*\t06ec4b215640a9d44a35861354b60bcf;size=29\t*\n+C\t1345\t1\t*\t*\t*\t*\t*\t09d9016732327d30c3cc7c56bb4f171b;size=29\t*\n+C\t1346\t1\t*\t*\t*\t*\t*\t0f7b2738c163da7592b2ec5b091e430c;size=29\t*\n+C\t1347\t1\t*\t*\t*\t*\t*\t14fe7d71921400066f68568c1ee66f64;size=29\t*\n+C\t1348\t1\t*\t*\t*\t*\t*\t1d70fd34fe06fbe95fba7f655f655758;size=29\t*\n+C\t1349\t1\t*\t*\t*\t*\t*\t20604f8a2c76f83892fd14f7bcfe76df;size=29\t*\n+C\t1350\t1\t*\t*\t*\t*\t*\t26769256ffebeb1a6e0371ac660a25fc;size=29\t*\n+C\t1351\t1\t*\t*\t*\t*\t*\t33715194bd7bd2a7b9a077b741f6cc2e;size=29\t*\n+C\t1352\t1\t*\t*\t*\t*\t*\t38526a0979700335599178945868ce22;size=29\t*\n+C\t1353\t1\t*\t*\t*\t*\t*\t3b8091cb7dc8c56e6be20afafebfec6a;size=29\t*\n+C\t1354\t1\t*\t*\t*\t*\t*\t52a4a2f1371e78d7a7cdfdd999eb3546;size=29\t*\n+C\t1355\t1\t*\t*\t*\t*\t*\t52b4839f784baae85fe516e7c3d3da61;size=29\t*\n+C\t1356\t1\t*\t*\t*\t*\t*\t544588bc8cc3527abda2c1fece847e42;size=29\t*\n+C\t1357\t1\t*\t*\t*\t*\t*\t5d95068a9a0e1cd216427e5ad4e78188;size=29\t*\n+C\t1358\t1\t*\t*\t*\t*\t*\t637f9ec05c3503b7a982f9faf1c4a478;size=29\t*\n+C\t1359\t1\t*\t*\t*\t*\t*\t6b54e906df82703cd0a7241729adb4ef;size=29\t*\n+C\t1360\t1\t*\t*\t*\t*\t*\t748ac5205f48bd0a3a321e1e57163040;size=29\t*\n+C\t1361\t1\t*\t*\t*\t*\t*\t7b50737990725c82d470868ca5f02238;size=29\t*\n+C\t1362\t1\t*\t*\t*\t*\t*\t7dd480e0369ded364a5476b8b5c0a20e;size=29\t*\n+C\t1363\t1\t*\t*\t*\t*\t*\t829a92af0a7cb2a6faf53a31f74ac32e;size=29\t*\n+C\t1364\t1\t*\t*\t*\t*\t*\t85a816fc48b95e011c25738668ff92f5;size=29\t*\n+C\t1365\t1\t*\t*\t*\t*\t*\t88ee2d113b38cac2a65f4b8fdefc85e6;size=29\t*\n+C\t1366\t1\t*\t*\t*\t*\t*\t8b580ba225c9ae8df06f925310b59e4e;size=29\t*\n+C\t1367\t1\t*\t*\t*\t*\t*\t8e9a6185e05151042cc0beaadb77eec0;size=29\t*\n+C\t1368\t1\t*\t*\t*\t*\t*\ta23d5d75d02581e3115e23a6a2fe031b;size=29\t*\n+C\t1369\t1\t*\t*\t*\t*\t*\ta9a1fbfca4ade41ce328b07594f11688;size=29\t*\n+C\t1370\t1\t*\t*\t*\t*\t*\taa026d2676cecd33e4a002dbb455ada8;size=29\t*\n+C\t1371\t1\t*\t*\t*\t*\t*\tb0f7bb5e2512ce1b8140fd67d40f0ca2;size=29\t*\n+C\t1372\t1\t*\t*\t*\t*\t*\tbdaad40d1a72de52eebf25010f5b300f;size=29\t*\n+C\t1373\t1\t*\t*\t*\t*\t*\tc72b7875fe56dca4f7d9c24360650a25;size=29\t*\n+C\t1374\t1\t*\t*\t*\t*\t*\tc8403bc529537d14794709f99640ac8f;size=29\t*\n'
b
diff -r fae6527990af -r 8c4e2933a17a test-data/dereplication_result2.fasta
--- /dev/null Thu Jan 01 00:00:00 1970 +0000
+++ b/test-data/dereplication_result2.fasta Wed Aug 26 13:34:22 2015 -0400
b
@@ -0,0 +1,3 @@
+>97485665bcded44c4d86c131ca714848;size=4;
+gtcgctcctaccgattgaatacgttggtgattgaattggataaagagatatcatcttaaatgatagcaaagcggtaaaca
+tttgtaaactagattatttagaggaaggagaagtcgtaacaaggtttcc
b
diff -r fae6527990af -r 8c4e2933a17a test-data/dereplication_uc_result3.fasta
--- /dev/null Thu Jan 01 00:00:00 1970 +0000
+++ b/test-data/dereplication_uc_result3.fasta Wed Aug 26 13:34:22 2015 -0400
b
@@ -0,0 +1,5 @@
+S 0 129 * * * * * 97485665bcded44c4d86c131ca714848 *
+H 0 129 100.0 * 0 0 * 97485665bcded44c4d86c131ca714848 97485665bcded44c4d86c131ca714848
+H 0 129 100.0 * 0 0 * 97485665bcded44c4d86c131ca714848 97485665bcded44c4d86c131ca714848
+H 0 129 100.0 * 0 0 * 97485665bcded44c4d86c131ca714848 97485665bcded44c4d86c131ca714848
+C 0 4 * * * * * 97485665bcded44c4d86c131ca714848 *
b
diff -r fae6527990af -r 8c4e2933a17a test-data/sorting_result3.fasta
--- /dev/null Thu Jan 01 00:00:00 1970 +0000
+++ b/test-data/sorting_result3.fasta Wed Aug 26 13:34:22 2015 -0400
b
@@ -0,0 +1,48 @@
+>TEST1
+MDVTVVVSTADHANVKRRRRRSHVRNRRARGYKSSRARSARMHGVDVDWDVVRSSVTSVSYSDDTDWAGNWAGS
+>TEST2
+MSRVVTAVASARATGDSGMGYVHATKTADTTTMRVAARDWVTGRSSKDYWSTTGKSGWDSTAVTTASAK
+>TEST3
+MRGTRRGSGGWSGARYAGSVAASDRSDTRATTSAYRHTHAASGARTRAHARHARHRVTVHVVAGVCARV
+>TEST4
+MGVYKCYNKKKVGVAVKRYVTKKSYKTANSNADSYNCRKCCKAKGCCDRYWKTVKNDKCKKGVVVYY
+>TEST5
+MTVSNTVDYTVSGDRSKKDCNRTCGWRDVRCRTKGTGNSTVTVTKARTVDAVKKMKRTTNSDA
+>TEST6
+MVSTRKKNSVYTGRKYGSYHKDDKKYADNKNRKRYVYSVDDAKAKATAKSVD
+>TEST7
+MTGAGTSGKKNTTTHTKCRRCGKSYHTKKKVCSSCGGKSAKRRDYWSKAG
+>TEST8
+MTGSGTSGKKNKTVHVKCRRCGASYHKTKKVCASCGGKSAKRRDYAWKAG
+>TEST9
+MSANNDTGHAAKRTDSRHTCRRCDRGVGKYDNCRCRVARDMGKYS
+>TEST10
+MSANNDTGHAAKRTDSRHTCRRCDRGVGKYDNCRCRVARDMGKYS
+>TEST11
+MSANNDTGHAAKRTDSRHTCRRCDRGVGKYDNCRCRVARDMGKYS
+>TEST12
+MSANNDTGHAAKRTDSRHTCRRCDRGVGKYDNCRCRVARDMGKYS
+>TEST13
+MSSTDTGHATKRTGDCRCGRKGVGKYDWCRCRARGMGRKYK
+>TEST14
+MSTVTGKSRDGYSTTDANNVARHVYSGSHGKRSDVSA
+>TEST15
+MSTYTVRGSARDGKVDANNVARVYSDGSHNKRTTVAA
+>TEST16
+MSTVTGKSRDGYATTDANNVARHVSGSHGKRTDVS
+>TEST17
+MTNAGRSKACDCKRKVGCSRYK
+>TEST18
+MTNAGRSKACDCKRKVGCSRYK
+>TEST19
+MATDSWAAVDAAASRTSYSTS
+>TEST20
+MRVRVDRVGVVGGGTKKRGV
+>TEST21
+KRGAHGKMNGSVKTTMGSGR
+>TEST22
+MSSNATSTGNMNSNHRDSST
+>TEST23
+MAHSDNRDTADYGGAHAA
+>TEST24
+MMDGSDMDDWRDD
b
diff -r fae6527990af -r 8c4e2933a17a test-data/sorting_result4.fasta
--- /dev/null Thu Jan 01 00:00:00 1970 +0000
+++ b/test-data/sorting_result4.fasta Wed Aug 26 13:34:22 2015 -0400
b
@@ -0,0 +1,48 @@
+>sp|Q66125|2B_CMVQ Suppressor of silencing 2b OS=Cucumber mosaic virus (strain Q) GN=ORF2b PE=1 SV=1
+MDVTVVVSTADHANVKRRRRRSHVRNRRARGYKSSRARSARMHGVDVDWDVVRSSVTSVSYSDDTDWAGNWAGS
+>sp|P0DMP9|APOC3_PANTA Apolipoprotein C-III OS=Panthera tigris altaica GN=APOC3 PE=3 SV=1
+MSRVVTAVASARATGDSGMGYVHATKTADTTTMRVAARDWVTGRSSKDYWSTTGKSGWDSTAVTTASAK
+>sp|Q89681|DR4_HHV6U Uncharacterized protein DR4 OS=Human herpesvirus 6A (strain Uganda-1102) GN=DR4L PE=4 SV=1
+MRGTRRGSGGWSGARYAGSVAASDRSDTRATTSAYRHTHAASGARTRAHARHARHRVTVHVVAGVCARV
+>sp|Q91G65|032R_IIV6 Uncharacterized protein 032R OS=Invertebrate iridescent virus 6 GN=IIV6-032R PE=4 SV=1
+MGVYKCYNKKKVGVAVKRYVTKKSYKTANSNADSYNCRKCCKAKGCCDRYWKTVKNDKCKKGVVVYY
+>sp|B3MQ24|ENY2_DROAN Enhancer of yellow 2 transcription factor OS=Drosophila ananassae GN=e(y)2 PE=3 SV=1
+MTVSNTVDYTVSGDRSKKDCNRTCGWRDVRCRTKGTGNSTVTVTKARTVDAVKKMKRTTNSDA
+>sp|P20194|A100_SSV1 Uncharacterized protein A-100 OS=Sulfolobus spindle-shape virus 1 GN=a100 PE=1 SV=1
+MVSTRKKNSVYTGRKYGSYHKDDKKYADNKNRKRYVYSVDDAKAKATAKSVD
+>tr|M0KT65|M0KT65_9EURY 50S ribosomal protein L37e OS=Haloarcula amylolytica JCM 13557 GN=rpl37e PE=3 SV=1
+MTGAGTSGKKNTTTHTKCRRCGKSYHTKKKVCSSCGGKSAKRRDYWSKAG
+>tr|M0MK44|M0MK44_9EURY 50S ribosomal protein L37e OS=Halococcus saccharolyticus DSM 5350 GN=rpl37e PE=3 SV=1
+MTGSGTSGKKNKTVHVKCRRCGASYHKTKKVCASCGGKSAKRRDYAWKAG
+>tr|M0D8K9|M0D8K9_9EURY 30S ribosomal protein S14 type Z OS=Halorubrum terrestre JCM 10247 GN=rps14P PE=3 SV=1
+MSANNDTGHAAKRTDSRHTCRRCDRGVGKYDNCRCRVARDMGKYS
+>tr|M0F5C2|M0F5C2_9EURY 30S ribosomal protein S14 type Z OS=Halorubrum hochstenium ATCC 700873 GN=rps14P PE=3 SV=1
+MSANNDTGHAAKRTDSRHTCRRCDRGVGKYDNCRCRVARDMGKYS
+>tr|M0NIQ6|M0NIQ6_9EURY 30S ribosomal protein S14 type Z OS=Halorubrum lipolyticum DSM 21995 GN=rps14P PE=3 SV=1
+MSANNDTGHAAKRTDSRHTCRRCDRGVGKYDNCRCRVARDMGKYS
+>tr|M0PIT7|M0PIT7_9EURY 30S ribosomal protein S14 type Z OS=Halorubrum arcis JCM 13916 GN=rps14P PE=3 SV=1
+MSANNDTGHAAKRTDSRHTCRRCDRGVGKYDNCRCRVARDMGKYS
+>tr|M0MEH5|M0MEH5_9EURY 30S ribosomal protein S14 type Z OS=Halococcus saccharolyticus DSM 5350 GN=rps14P PE=3 SV=1
+MSSTDTGHATKRTGDCRCGRKGVGKYDWCRCRARGMGRKYK
+>tr|L9WHT8|L9WHT8_9EURY 50S ribosomal protein L18Ae OS=Natronorubrum bangense JCM 10635 GN=rplX PE=3 SV=1
+MSTVTGKSRDGYSTTDANNVARHVYSGSHGKRSDVSA
+>tr|M0KH83|M0KH83_9EURY 50S ribosomal protein L18Ae OS=Haloarcula amylolytica JCM 13557 GN=rplX PE=3 SV=1
+MSTYTVRGSARDGKVDANNVARVYSDGSHNKRTTVAA
+>tr|L9WBT3|L9WBT3_9EURY 50S ribosomal protein L18Ae OS=Natronorubrum sulfidifaciens JCM 14089 GN=rplX PE=3 SV=1
+MSTVTGKSRDGYATTDANNVARHVSGSHGKRTDVS
+>tr|W9PMP6|W9PMP6_FUSOX Uncharacterized protein OS=Fusarium oxysporum f. sp. pisi HDV247 GN=FOVG_07074 PE=4 SV=1
+MTNAGRSKACDCKRKVGCSRYK
+>tr|X0LYM3|X0LYM3_FUSOX Uncharacterized protein OS=Fusarium oxysporum f. sp. vasinfectum 25433 GN=FOTG_17987 PE=4 SV=1
+MTNAGRSKACDCKRKVGCSRYK
+>tr|H3BPV3|H3BPV3_HUMAN ATP-dependent RNA helicase DDX19B OS=Homo sapiens GN=DDX19B PE=4 SV=1
+MATDSWAAVDAAASRTSYSTS
+>tr|H0ACG9|H0ACG9_HALSG Uncharacterized protein OS=Haloredivivus sp. (strain G17) GN=HRED_08116 PE=4 SV=1
+MRVRVDRVGVVGGGTKKRGV
+>tr|N6VV02|N6VV02_9EURY Uncharacterized protein (Fragment) OS=Thermoplasmatales archaeon SCGC AB-539-C06 GN=MBGDC06_00209 PE=4 SV=1
+KRGAHGKMNGSVKTTMGSGR
+>tr|Q53RS6|Q53RS6_HUMAN Putative uncharacterized protein ALS2CR3 (Fragment) OS=Homo sapiens GN=ALS2CR3 PE=4 SV=1
+MSSNATSTGNMNSNHRDSST
+>tr|V9H0X7|V9H0X7_NEUCS Neurospora crassa DNA for RNA polymerase I second-largest subunit OS=Neurospora crassa PE=4 SV=1
+MAHSDNRDTADYGGAHAA
+>tr|Q9BZF8|Q9BZF8_HUMAN NF-E2-related factor 2 (Fragment) OS=Homo sapiens PE=2 SV=1
+MMDGSDMDDWRDD
b
diff -r fae6527990af -r 8c4e2933a17a test-data/sorting_result5.fasta
--- /dev/null Thu Jan 01 00:00:00 1970 +0000
+++ b/test-data/sorting_result5.fasta Wed Aug 26 13:34:22 2015 -0400
b
@@ -0,0 +1,48 @@
+>With spaces1
+MDVTVVVSTADHANVKRRRRRSHVRNRRARGYKSSRARSARMHGVDVDWDVVRSSVTSVSYSDDTDWAGNWAGS
+>With spaces2
+MSRVVTAVASARATGDSGMGYVHATKTADTTTMRVAARDWVTGRSSKDYWSTTGKSGWDSTAVTTASAK
+>With spaces3
+MRGTRRGSGGWSGARYAGSVAASDRSDTRATTSAYRHTHAASGARTRAHARHARHRVTVHVVAGVCARV
+>With spaces4
+MGVYKCYNKKKVGVAVKRYVTKKSYKTANSNADSYNCRKCCKAKGCCDRYWKTVKNDKCKKGVVVYY
+>With spaces5
+MTVSNTVDYTVSGDRSKKDCNRTCGWRDVRCRTKGTGNSTVTVTKARTVDAVKKMKRTTNSDA
+>With spaces6
+MVSTRKKNSVYTGRKYGSYHKDDKKYADNKNRKRYVYSVDDAKAKATAKSVD
+>With spaces7
+MTGAGTSGKKNTTTHTKCRRCGKSYHTKKKVCSSCGGKSAKRRDYWSKAG
+>With spaces8
+MTGSGTSGKKNKTVHVKCRRCGASYHKTKKVCASCGGKSAKRRDYAWKAG
+>With spaces9
+MSANNDTGHAAKRTDSRHTCRRCDRGVGKYDNCRCRVARDMGKYS
+>With spaces10
+MSANNDTGHAAKRTDSRHTCRRCDRGVGKYDNCRCRVARDMGKYS
+>With spaces11
+MSANNDTGHAAKRTDSRHTCRRCDRGVGKYDNCRCRVARDMGKYS
+>With spaces12
+MSANNDTGHAAKRTDSRHTCRRCDRGVGKYDNCRCRVARDMGKYS
+>With spaces13
+MSSTDTGHATKRTGDCRCGRKGVGKYDWCRCRARGMGRKYK
+>With spaces14
+MSTVTGKSRDGYSTTDANNVARHVYSGSHGKRSDVSA
+>With spaces15
+MSTYTVRGSARDGKVDANNVARVYSDGSHNKRTTVAA
+>With spaces16
+MSTVTGKSRDGYATTDANNVARHVSGSHGKRTDVS
+>With spaces17
+MTNAGRSKACDCKRKVGCSRYK
+>With spaces18
+MTNAGRSKACDCKRKVGCSRYK
+>With spaces19
+MATDSWAAVDAAASRTSYSTS
+>With spaces20
+MRVRVDRVGVVGGGTKKRGV
+>With spaces21
+KRGAHGKMNGSVKTTMGSGR
+>With spaces22
+MSSNATSTGNMNSNHRDSST
+>With spaces23
+MAHSDNRDTADYGGAHAA
+>With spaces24
+MMDGSDMDDWRDD
b
diff -r fae6527990af -r 8c4e2933a17a tool_dependencies.xml
--- a/tool_dependencies.xml Thu May 21 03:58:09 2015 -0400
+++ b/tool_dependencies.xml Wed Aug 26 13:34:22 2015 -0400
b
@@ -1,6 +1,6 @@
 <?xml version="1.0"?>
 <tool_dependency>
   <package name="vsearch" version="1.1.3">
-      <repository changeset_revision="c1fc77fac9fb" name="package_vsearch_1_1_3" owner="iuc" toolshed="https://toolshed.g2.bx.psu.edu" />
+      <repository changeset_revision="559454eab468" name="package_vsearch_1_1_3" owner="iuc" toolshed="https://toolshed.g2.bx.psu.edu" />
     </package>
 </tool_dependency>
b
diff -r fae6527990af -r 8c4e2933a17a vsearch_macros.xml
--- a/vsearch_macros.xml Thu May 21 03:58:09 2015 -0400
+++ b/vsearch_macros.xml Wed Aug 26 13:34:22 2015 -0400
b
@@ -31,7 +31,7 @@
     </xml>
     <xml name="qmask">
         <param name="qmask" type="select" label="Mask sequences" help="(--qmask)">
-            <option value="no">No masking</option>
+            <option value="none">No masking</option>
             <option value="dust" selected="True">dust</option>
             <option value="soft">soft</option>
         </param>