Repository 'rdp_multiclassifier'
hg clone https://toolshed.g2.bx.psu.edu/repos/qfab/rdp_multiclassifier

Changeset 0:a73ae72b47aa (2014-05-29)
Commit message:
Uploaded
added:
rdpmulticlassifier/README.txt
rdpmulticlassifier/rdp_multi_classifier.xml
rdpmulticlassifier/rdpmulticlassifier.sh
rdpmulticlassifier/scripts/.svn/all-wcprops
rdpmulticlassifier/scripts/.svn/entries
rdpmulticlassifier/scripts/.svn/text-base/generateOTUtable.py.svn-base
rdpmulticlassifier/scripts/generateOTUtable.py
rdpmulticlassifier/test-data/class_detail.tab
rdpmulticlassifier/test-data/class_hier.tab
rdpmulticlassifier/test-data/otu_table.tab
rdpmulticlassifier/test-data/otuseqs.tab
rdpmulticlassifier/test-data/preotu.tab
rdpmulticlassifier/tool_dependencies.xml
b
diff -r 000000000000 -r a73ae72b47aa rdpmulticlassifier/README.txt
--- /dev/null Thu Jan 01 00:00:00 1970 +0000
+++ b/rdpmulticlassifier/README.txt Thu May 29 02:27:56 2014 -0400
b
@@ -0,0 +1,44 @@
+Galaxy wrappers for RDP Multi Classifier - Assign Taxonomy to OTU Table
+========================================================================
+
+The RDP MultiClassifier allows rapid Assignment of rRNA Sequences into
+the new bacterial taxonomy.
+This version of the RDP MultiClassifier allows the completion of the
+intermediate OTU table generated by the USEARCH - Map Reads to OTUs tool
+of the metagenomics workflow.
+
+
+Requirements
+========================================================================
+
+Java Runtime Environment
+
+
+Installation
+========================================================================
+
+Galaxy will automatically install the RDP MultiClassifier
+
+
+Disclaimer
+========================================================================
+
+This source code is provided by QFAB Bioinformatics "as is", in the hope
+that it will be useful, and any express or implied warranties, including,
+but not limited to, the implied warranties of merchantability and fitness
+for a particular purpose are disclaimed.
+IN NO EVENT SHALL QFAB BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL,
+SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES HOWEVER CAUSED AND ON ANY THEORY
+OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT(INCLUDING
+NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS SOURCE
+CODE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
+
+
+License
+========================================================================
+
+This work by QFAB Bioinformatics (as part of the GVL project
+http://genome.edu.au)
+is licensed under a Creative Commons Attribution-NonCommercial-ShareAlike 4.0
+International License.
+                        
b
diff -r 000000000000 -r a73ae72b47aa rdpmulticlassifier/rdp_multi_classifier.xml
--- /dev/null Thu Jan 01 00:00:00 1970 +0000
+++ b/rdpmulticlassifier/rdp_multi_classifier.xml Thu May 29 02:27:56 2014 -0400
[
@@ -0,0 +1,153 @@
+<tool id="rdpmulticlassifier" name="RDP MultiClassifier" version="1.1">
+  <!-- Galaxy wrapper for rdpmulticlassifier.sh: classifies reads with the RDP MultiClassifier
+       and, when requested, completes the intermediate OTU table with the assigned taxonomy. -->
+  <description>Rapid Assignment of rRNA Sequences into the New Bacterial Taxonomy</description>
+  <!-- Positional arguments: gene, addotutable, input reads, pre-OTU table, confidence cutoff,
+       hierarchy output, assignment output, OTU table output, output format.
+       NULL stands in for the two OTU table arguments when no OTU table is requested. -->
+  <command interpreter="bash">
+       #if $table.addotutable
+         rdpmulticlassifier.sh $gene $table.addotutable $input $otu $conf $hier $assign $otutable $format
+       #else
+         rdpmulticlassifier.sh $gene $table.addotutable $input NULL $conf $hier $assign NULL $format
+       #end if
+  </command>
+  <requirements>
+    <requirement type="package" version="1.1">rdp_multi_classifier_1.1</requirement>
+  </requirements>
+  <inputs>
+    <param name="gene" type="select" label="Select Gene Trainings Model" help="The Multi-Classifier provides two training models: 16S rRNA or Fungal LSU genes.">
+      <option value="16srrna" selected="true">16S rRNA</option>
+      <option value="fungallsu">Fungal LSU</option>
+    </param>
+    <conditional name="table">
+      <!-- "checked" is the attribute that sets a boolean parameter's default state. -->
+      <param name="addotutable" type="boolean" checked="true" label="Select to generate an OTU Table" help="This is to complete the intermediate OTU Table generated by the 'Map Reads to OTU' tool of the metagenomics workflow. The intermediate OTU table and relabelled OTUs output files of the 'Map Reads to OTU' tool will be required." />
+      <when value="true">
+        <param name="input" type="data" format="fasta" label="Relabelled OTU input reads of the 'Map Reads to OTU' tool in FASTA format"/>
+        <param name="otu" type="data" format="tabular" label="PRE OTU table of the 'Map Reads to OTU' tool" />
+      </when>
+      <when value="false">
+        <param name="input" type="data" format="fasta" label="Input reads file in FASTA format"/>
+      </when>
+    </conditional>
+    <!-- min/max enforce the [0-1] range that the help text documents. -->
+    <param name="conf" type="float" value="0.8" min="0" max="1" label="Assignment confidence cutoff" help="Specifies the assignment confidence cutoff used to determine the assignment count in the hierarchical format. Range [0-1], Default is 0.8. For sequences shorter than 250 base pairs, the confidence threshold 50% is recommended to improve classification coverage." />
+    <param name="format" type="select" label="Tab delimited output format" help="Please see the description below on the 'Tab delimited output format' options.">
+      <option value="allrank" selected="true">allrank</option>
+      <option value="fixrank">fixrank</option>
+      <option value="db">db</option>
+    </param>
+  </inputs>
+  <outputs>
+    <data name="hier" format="tabular" label="${tool.name} on ${on_string}:classification_assignment_hierarchical.tab" />
+    <data name="assign" format="tabular" label="${tool.name} on ${on_string}:classification_assignment_details.tab" />
+    <!-- Only produced when the OTU table option is selected. -->
+    <data name="otutable" format="tabular" label="${tool.name} on ${on_string}: OTU_Table.tab" >
+      <filter>table['addotutable']</filter>
+    </data>
+  </outputs>
+  <help>
+===========
+Description
+===========
+
+The RDP MultiClassifier allows rapid Assignment of rRNA sequences into the new bacterial taxonomy.
+This version of the RDP MultiClassifier allows the completion of the intermediate OTU table generated by the USEARCH - 'Map Reads to OTU' tool of the metagenomics workflow.
+
+-----
+
+-----
+Input
+-----
+
+**No OTU Table generation selected:**
+
+A) File of reads in FASTA format.
+
+.. class:: infomark
+
+Input sequences should be at least 50bp for accurate results. Uppercase and lowercase formats are allowed.
+
+**OTU Table generation selected:**
+
+A) Relabelled OTU input reads in FASTA format of the 'Map Reads to OTU' tool.
+
+.. class:: warningmark
+
+Please note the 'relabelled OTU' output of the 'Map Reads to OTU' tool is hidden. To access the hidden output, click on the cog wheel in the upper right corner of the History panel and select 'Include Hidden Datasets'. The output dataset will appear with a dialog box. Follow the instruction in the dialog box and click 'here' to unhide the dataset.
+
+
+B) Pre-OTU Table of the 'Map Reads to OTU' tool in tabular format.
+
+----------
+Parameters
+----------
+
+Gene Trainings Model
+   RDP naive Bayesian Classifier offers two hierarchy models for 16S rRNA and Fungal LSU genes
+
+OTU Table generation
+   For OTU Table generation, check the above checkbox and provide the intermediate OTU table (Pre-OTU Table) and the 'relabelled OTU' input reads of the 'Map Reads to OTU' tool of the metagenomics workflow.
+
+Confidence cutoff
+   Used to determine the assignment count in the hierarchical format. Range[0-1], default is 0.8. For sequences shorter than 250 base pairs, the confidence threshold 50% is recommended to improve classification coverage.
+
+Tab delimited output format
+   a) allrank: outputs the results for all ranks applied for each sequence: seqname, orientation, taxon name, rank, conf, etc
+   b) fixrank: only outputs the results for fixed ranks in order: domain, phylum, class, order, family, genus
+   c) db: outputs the seqname, trainset_no, tax_id, conf
+
+------
+Output
+------
+
+The tool generates 2 or 3 outputs depending on whether 'OTU Table generation' is selected.
+
+**No OTU Table generation selected:**
+
+(A) Sequence count for each taxon in the hierarchy in tab-format: classification_assignment_hierarchical.tab
+
+(B) Sequence-by-sequence classification results including confidence scores at each level of the hierarchy in tab-format: classification_assignment_details.tab
+
+**OTU Table generation selected:**
+
+(A) Sequence count for each taxon in the hierarchy in tab-format: classification_assignment_hierarchical.tab
+
+(B) Sequence-by-sequence classification results including confidence scores at each level of the hierarchy in tab-format: classification_assignment_details.tab
+
+(C) OTU Table in tab-format
+
+-----
+
+=========
+Resources
+=========
+
+RDP_MultiClassifier_Tutorial_
+
+.. _RDP_MultiClassifier_Tutorial: http://rdp.cme.msu.edu/tutorials/classifier/RDPtutorial_MULTICLASSIFIER.html
+
+
+**Wrapper Author**
+
+QFAB Bioinformatics (support@qfab.org)
+
+  </help>
+  <tests>
+    <test>
+      <!-- NOTE(review): the changeset ships test-data/otuseqs.tab but no otuseqs.fasta;
+           confirm which name is intended for the "input" test file. -->
+      <param name="gene" value="16srrna" />
+      <param name="addotutable" value="true" />
+      <param name="input" value="otuseqs.fasta" />
+      <param name="otu" value="preotu.tab" />
+      <param name="conf" value="0.8" />
+      <param name="format" value="fixrank" />
+      <output name="hier" file="class_hier.tab" ftype="tabular" lines_diff="10" />
+      <output name="assign" file="class_detail.tab" ftype="tabular" lines_diff="10" />
+      <output name="otutable" file="otu_table.tab" ftype="tabular" lines_diff="10" />
+    </test>
+  </tests>
+</tool>
+
b
diff -r 000000000000 -r a73ae72b47aa rdpmulticlassifier/rdpmulticlassifier.sh
--- /dev/null Thu Jan 01 00:00:00 1970 +0000
+++ b/rdpmulticlassifier/rdpmulticlassifier.sh Thu May 29 02:27:56 2014 -0400
[
@@ -0,0 +1,39 @@
+#!/bin/bash
+# Wrapper invoked by the Galaxy tool: runs the RDP MultiClassifier on the input reads
+# and, when requested, merges the resulting assignments into the pre-OTU table.
+#
+# Positional arguments:
+#   1 gene             value passed to --gene
+#   2 addotutable      "True" when the OTU table should also be generated
+#   3 input_file       reads handed to the classifier
+#   4 otu_input_file   pre-OTU table (the tool passes NULL when no OTU table is requested)
+#   5 conf             value passed to --conf
+#   6 output_hier      path passed to --hier_outfile
+#   7 output_assign    path passed to --assign_outfile
+#   8 output_otutable  OTU table output path (the tool passes NULL when not requested)
+#   9 format           value passed to --format
+#
+# JAVA_JAR_PATH is not set here; it is expected to name the directory containing MultiClassifier.jar.
+
+gene=$1
+addotutable=$2
+input_file=$3
+otu_input_file=$4
+conf=$5
+output_hier=$6
+output_assign=$7
+output_otutable=$8
+format=$9
+full_path=$(dirname "$0")
+
+# Run the classifier directly instead of through echo `...`, so its output is passed
+# through unmodified and a failure stops the script with the classifier's exit status.
+java -Xmx1g -jar "$JAVA_JAR_PATH/MultiClassifier.jar" --gene="$gene" --conf="$conf" --hier_outfile="$output_hier" --assign_outfile="$output_assign" --format="$format" "$input_file" || exit $?
+
+# The original only matched "True"; "true" is accepted as well in case the boolean
+# is rendered in lower case (NOTE(review): depends on the Galaxy release, confirm).
+case "$addotutable" in
+  True|true)
+    python "$full_path/scripts/generateOTUtable.py" "$output_otutable" "$otu_input_file" "$output_assign" || exit $?
+    ;;
+esac
b
diff -r 000000000000 -r a73ae72b47aa rdpmulticlassifier/scripts/.svn/all-wcprops
--- /dev/null Thu Jan 01 00:00:00 1970 +0000
+++ b/rdpmulticlassifier/scripts/.svn/all-wcprops Thu May 29 02:27:56 2014 -0400
b
@@ -0,0 +1,11 @@
+K 25
+svn:wc:ra_dav:version-url
+V 80
+/svn/projects/!svn/ver/744/10_146_GVL/01_Metagenomics/multiRDPclassifier/scripts
+END
+generateOTUtable.py
+K 25
+svn:wc:ra_dav:version-url
+V 100
+/svn/projects/!svn/ver/746/10_146_GVL/01_Metagenomics/multiRDPclassifier/scripts/generateOTUtable.py
+END
b
diff -r 000000000000 -r a73ae72b47aa rdpmulticlassifier/scripts/.svn/entries
--- /dev/null Thu Jan 01 00:00:00 1970 +0000
+++ b/rdpmulticlassifier/scripts/.svn/entries Thu May 29 02:27:56 2014 -0400
b
@@ -0,0 +1,62 @@
+10
+
+dir
+744
+http://procyon.qfab.org:8080/svn/projects/10_146_GVL/01_Metagenomics/multiRDPclassifier/scripts
+http://procyon.qfab.org:8080/svn/projects
+
+
+
+2013-12-20T01:34:14.208737Z
+744
+a.kunert
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+e042828a-163e-41b9-9f75-8c7748f18e0d
+
+generateOTUtable.py
+file
+746
+
+
+
+2013-12-20T01:36:24.000000Z
+12c0d7cbb1b0dc8580c9b0fb5d598adb
+2013-12-20T01:36:35.680317Z
+746
+a.kunert
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+982
+
b
diff -r 000000000000 -r a73ae72b47aa rdpmulticlassifier/scripts/.svn/text-base/generateOTUtable.py.svn-base
--- /dev/null Thu Jan 01 00:00:00 1970 +0000
+++ b/rdpmulticlassifier/scripts/.svn/text-base/generateOTUtable.py.svn-base Thu May 29 02:27:56 2014 -0400
[
@@ -0,0 +1,34 @@
+# create OTU Table by merging pre otu table with taxonomy assign by
+# rdpmulticlassifier
+# Tab-separated fields:
+# 1=OTU Label, 2=Count, 3=Sequence, 4 and following=Assigned taxonomy by
+# RDP Multi Classifier
+
+import sys, os
+
+OTUtable = sys.argv[1]
+PreOTUtable = sys.argv[2]
+RdpTaxonomy = sys.argv[3]
+
+def merge(output, preotu, tax):
+    writeoutput = open(output, 'w')
+    lookup = {} 
+    with open(tax) as f:
+        for x in f:
+     list = x.split('\t')
+            length = len(list)
+     rest =''
+            for k in range(1, length):
+                item= list[k].replace(' ','') 
+                item= item.replace('\n','')
+             rest = rest+ item + '\t'
+     lookup[list[0]] = rest
+    with open(preotu) as f:
+ for x in f:
+     columns = x.split('\t')
+            otu = columns[0].replace(' ','')         
+            taxonomy = lookup[otu]
+            line = x.replace('\n','')
+     writeoutput.write(line+taxonomy+'\n')
+
+merge(OTUtable, PreOTUtable, RdpTaxonomy)
b
diff -r 000000000000 -r a73ae72b47aa rdpmulticlassifier/scripts/generateOTUtable.py
--- /dev/null Thu Jan 01 00:00:00 1970 +0000
+++ b/rdpmulticlassifier/scripts/generateOTUtable.py Thu May 29 02:27:56 2014 -0400
[
@@ -0,0 +1,41 @@
+# create OTU Table by merging pre otu table with taxonomy assign by
+# rdpmulticlassifier
+# Tab-separated fields:
+# 1=OTU Label, 2=Count, 3=Sequence, 4 and following=Assigned taxonomy by
+# RDP Multi Classifier
+
+import sys, os
+
+OTUtable = sys.argv[1]
+PreOTUtable = sys.argv[2]
+RdpTaxonomy = sys.argv[3]
+
+def merge(output, preotu, tax):
+    """Write ``preotu`` to ``output`` with each row's taxonomy appended.
+
+    ``tax`` is read as tab-separated text: the first field of every line is
+    the lookup key, and the remaining fields (spaces and newlines removed)
+    are re-joined so that each one is followed by a tab.  Every line of
+    ``preotu`` is then written to ``output`` followed by the taxonomy string
+    stored under its first column (spaces removed).
+
+    Raises KeyError when a ``preotu`` row has no entry in ``tax``.
+    """
+    lookup = {}
+    # The output handle is managed by ``with`` so it is flushed and closed even on error.
+    with open(output, 'w') as writeoutput:
+        with open(tax) as f:
+            for x in f:
+                fields = x.split('\t')
+                rest = ''
+                for item in fields[1:]:
+                    rest += item.replace(' ', '').replace('\n', '') + '\t'
+                lookup[fields[0]] = rest
+        with open(preotu) as f:
+            for x in f:
+                otu = x.split('\t')[0].replace(' ', '')
+                if otu not in lookup:
+                    raise KeyError("no taxonomy assignment found for OTU %r" % otu)
+                writeoutput.write(x.replace('\n', '') + lookup[otu] + '\n')
+
+merge(OTUtable, PreOTUtable, RdpTaxonomy)
b
diff -r 000000000000 -r a73ae72b47aa rdpmulticlassifier/test-data/class_detail.tab
--- /dev/null Thu Jan 01 00:00:00 1970 +0000
+++ b/rdpmulticlassifier/test-data/class_detail.tab Thu May 29 02:27:56 2014 -0400
b
b'@@ -0,0 +1,536 @@\n+OTU_1\t\tRoot\trootrank\t1.0\tBacteria\tdomain\t1.0\t"Proteobacteria"\tphylum\t1.0\tGammaproteobacteria\tclass\t1.0\tAlteromonadales\torder\t1.0\tAlteromonadaceae\tfamily\t1.0\tHaliea\tgenus\t1.0\n+OTU_2\t\tRoot\trootrank\t1.0\tBacteria\tdomain\t1.0\t"Proteobacteria"\tphylum\t0.98\tAlphaproteobacteria\tclass\t0.89\tRhizobiales\torder\t0.42\t"Aurantimonadaceae"\tfamily\t0.22\tMartelella\tgenus\t0.22\n+OTU_3\t\tRoot\trootrank\t1.0\tBacteria\tdomain\t1.0\t"Actinobacteria"\tphylum\t1.0\tActinobacteria\tclass\t1.0\tActinobacteridae\tsubclass\t0.98\tActinomycetales\torder\t0.98\tMicrococcineae\tsuborder\t0.57\tMicrobacteriaceae\tfamily\t0.42\tOkibacterium\tgenus\t0.16\n+OTU_4\t\tRoot\trootrank\t1.0\tBacteria\tdomain\t1.0\t"Proteobacteria"\tphylum\t0.99\tAlphaproteobacteria\tclass\t0.96\tRhizobiales\torder\t0.52\t"Aurantimonadaceae"\tfamily\t0.34\tMartelella\tgenus\t0.34\n+OTU_5\t\tRoot\trootrank\t1.0\tBacteria\tdomain\t1.0\tCyanobacteria/Chloroplast\tphylum\t1.0\tCyanobacteria\tclass\t1.0\tFamily 
II\tfamily\t1.0\tGpIIa\tgenus\t1.0\n+OTU_6\t\tRoot\trootrank\t1.0\tBacteria\tdomain\t1.0\t"Actinobacteria"\tphylum\t1.0\tActinobacteria\tclass\t1.0\tActinobacteridae\tsubclass\t1.0\tActinomycetales\torder\t1.0\tMicrococcineae\tsuborder\t0.55\tIntrasporangiaceae\tfamily\t0.28\tOrnithinicoccus\tgenus\t0.19\n+OTU_7\t\tRoot\trootrank\t1.0\tBacteria\tdomain\t1.0\t"Proteobacteria"\tphylum\t1.0\tAlphaproteobacteria\tclass\t1.0\tRhodobacterales\torder\t1.0\tRhodobacteraceae\tfamily\t1.0\tPelagibaca\tgenus\t1.0\n+OTU_8\t\tRoot\trootrank\t1.0\tBacteria\tdomain\t1.0\tOD1\tphylum\t1.0\tOD1_genera_incertae_sedis\tgenus\t1.0\n+OTU_9\t\tRoot\trootrank\t1.0\tBacteria\tdomain\t1.0\t"Proteobacteria"\tphylum\t1.0\tAlphaproteobacteria\tclass\t1.0\tRhizobiales\torder\t0.8\t"Aurantimonadaceae"\tfamily\t0.63\tMartelella\tgenus\t0.63\n+OTU_10\t\tRoot\trootrank\t1.0\tBacteria\tdomain\t1.0\t"Proteobacteria"\tphylum\t1.0\tGammaproteobacteria\tclass\t1.0\tChromatiales\torder\t1.0\tChromatiaceae\tfamily\t1.0\tThiohalocapsa\tgenus\t1.0\n+OTU_11\t\tRoot\trootrank\t1.0\tBacteria\tdomain\t1.0\tSR1\tphylum\t1.0\tSR1_genera_incertae_sedis\tgenus\t1.0\n+OTU_12\t\tRoot\trootrank\t1.0\tBacteria\tdomain\t1.0\t"Actinobacteria"\tphylum\t0.72\tActinobacteria\tclass\t0.72\tAcidimicrobidae\tsubclass\t0.3\tAcidimicrobiales\torder\t0.3\t"Acidimicrobineae"\tsuborder\t0.3\tAcidimicrobiaceae\tfamily\t0.27\tFerrimicrobium\tgenus\t0.16\n+OTU_13\t\tRoot\trootrank\t1.0\tBacteria\tdomain\t1.0\t"Verrucomicrobia"\tphylum\t1.0\tOpitutae\tclass\t1.0\tPuniceicoccales\torder\t1.0\tPuniceicoccaceae\tfamily\t1.0\tCoraliomargarita\tgenus\t1.0\n+OTU_14\t\tRoot\trootrank\t1.0\tBacteria\tdomain\t1.0\t"Proteobacteria"\tphylum\t1.0\tBetaproteobacteria\tclass\t1.0\tBurkholderiales\torder\t1.0\tComamonadaceae\tfamily\t1.0\tHydrogenophaga\tgenus\t0.92\n+OTU_15\t\tRoot\trootrank\t1.0\tBacteria\tdomain\t1.0\t"Proteobacteria"\tphylum\t1.0\tGammaproteobacteria\tclass\t0.99\tMethylococcales\torder\t0.34\tMethylococcaceae\tfamily\t0.34\tMeth
ylosoma\tgenus\t0.28\n+OTU_16\t\tRoot\trootrank\t1.0\tBacteria\tdomain\t1.0\t"Proteobacteria"\tphylum\t1.0\tDeltaproteobacteria\tclass\t1.0\tBdellovibrionales\torder\t1.0\tBacteriovoracaceae\tfamily\t1.0\tBacteriovorax\tgenus\t1.0\n+OTU_17\t\tRoot\trootrank\t1.0\tBacteria\tdomain\t1.0\tOP11\tphylum\t1.0\tOP11_genera_incertae_sedis\tgenus\t1.0\n+OTU_18\t\tRoot\trootrank\t1.0\tBacteria\tdomain\t1.0\t"Proteobacteria"\tphylum\t1.0\tGammaproteobacteria\tclass\t1.0\tMethylococcales\torder\t0.18\tMethylococcaceae\tfamily\t0.18\tMethylococcus\tgenus\t0.14\n+OTU_19\t\tRoot\trootrank\t1.0\tBacteria\tdomain\t1.0\t"Proteobacteria"\tphylum\t1.0\tGammaproteobacteria\tclass\t1.0\tOceanospirillales\torder\t0.68\tOleiphilaceae\tfamily\t0.25\tOleiphilus\tgenus\t0.25\n+OTU_20\t\tRoot\trootrank\t1.0\tBacteria\tdomain\t1.0\t"Proteobacteria"\tphylum\t1.0\tGammaproteobacteria\tclass\t1.0\tChromatiales\torder\t1.0\tChromatiaceae\tfamily\t1.0\tThiodictyon\tgenus\t1.0\n+OTU_21\t\tRoot\trootrank\t1.0\tBacteria\tdomain\t1.0\t"Proteobacteria"\tphylum\t1.0\tGammaproteobacteria\tclass\t1.0\tOceanospirillales\torder\t0.55\tOceanospirillaceae\tfamily\t0.48\tBermanella\tgenus\t0.36\n+OTU_22\t\tRoot\trootrank\t1.0\tBacteria\tdomain\t1.0\t"Proteobacteria"\tphylum\t1.0\tDeltaproteobacteria\tclass\t0.76\tDesulfuromonadales\torder\t0.17\tDesulfuromonadaceae\tfamily\t0.14\tMalonomonas\tgenus\t0.14\n+OTU_23\t\tRoot\trootrank\t1.0\tBacteria\tdomain\t1.0\t"Proteobacteria"\tphylum\t1.0\tAlphaproteo'..b'family\t0.98\tParachlamydia\tgenus\t0.75\n+OTU_514\t\tRoot\trootrank\t1.0\tBacteria\tdomain\t1.0\t"Proteobacteria"\tphylum\t1.0\tAlphaproteobacteria\tclass\t1.0\tRhodobacterales\torder\t1.0\tRhodobacteraceae\tfamily\t1.0\tLabrenzia\tgenus\t0.69\n+OTU_515\t\tRoot\trootrank\t1.0\tBacteria\tdomain\t1.0\tCyanobacteria/Chloroplast\tphylum\t1.0\tChloroplast\tclass\t1.0\tChloroplast\tfamily\t1.0\tChlorophyta\tgenus\t1.0\n+OTU_516\t\tRoot\trootrank\t1.0\tBacteria\tdomain\t1.0\t"Bacteroidetes"\tphylum\t1.0\tFlavobacteri
a\tclass\t1.0\t"Flavobacteriales"\torder\t1.0\tFlavobacteriaceae\tfamily\t1.0\tFlavobacterium\tgenus\t1.0\n+OTU_517\t\tRoot\trootrank\t1.0\tBacteria\tdomain\t1.0\t"Chloroflexi"\tphylum\t0.33\tAnaerolineae\tclass\t0.33\tAnaerolineales\torder\t0.33\tAnaerolineaceae\tfamily\t0.33\tBellilinea\tgenus\t0.25\n+OTU_518\t\tRoot\trootrank\t1.0\tBacteria\tdomain\t1.0\t"Proteobacteria"\tphylum\t1.0\tAlphaproteobacteria\tclass\t1.0\tRhodobacterales\torder\t1.0\tRhodobacteraceae\tfamily\t1.0\tAntarctobacter\tgenus\t0.69\n+OTU_519\t\tRoot\trootrank\t1.0\tBacteria\tdomain\t1.0\tCyanobacteria/Chloroplast\tphylum\t1.0\tChloroplast\tclass\t1.0\tChloroplast\tfamily\t1.0\tCryptomonadaceae\tgenus\t1.0\n+OTU_520\t\tRoot\trootrank\t1.0\tBacteria\tdomain\t1.0\t"Proteobacteria"\tphylum\t1.0\tAlphaproteobacteria\tclass\t1.0\tRhizobiales\torder\t0.64\tMethylocystaceae\tfamily\t0.48\tTerasakiella\tgenus\t0.48\n+OTU_521\t\tRoot\trootrank\t1.0\tBacteria\tdomain\t1.0\tSR1\tphylum\t1.0\tSR1_genera_incertae_sedis\tgenus\t1.0\n+OTU_522\t\tRoot\trootrank\t1.0\tBacteria\tdomain\t1.0\t"Proteobacteria"\tphylum\t1.0\tAlphaproteobacteria\tclass\t1.0\tRhodospirillales\torder\t1.0\tRhodospirillaceae\tfamily\t1.0\tRhodocista\tgenus\t1.0\n+OTU_523\t\tRoot\trootrank\t1.0\tBacteria\tdomain\t1.0\t"Bacteroidetes"\tphylum\t1.0\tFlavobacteria\tclass\t0.8\t"Flavobacteriales"\torder\t0.8\tCryomorphaceae\tfamily\t0.76\tFluviicola\tgenus\t0.59\n+OTU_524\t\tRoot\trootrank\t1.0\tBacteria\tdomain\t1.0\t"Actinobacteria"\tphylum\t1.0\tActinobacteria\tclass\t1.0\tActinobacteridae\tsubclass\t1.0\tBifidobacteriales\torder\t1.0\tBifidobacteriaceae\tfamily\t1.0\tBifidobacterium\tgenus\t1.0\n+OTU_525\t\tRoot\trootrank\t1.0\tBacteria\tdomain\t1.0\t"Proteobacteria"\tphylum\t1.0\tAlphaproteobacteria\tclass\t1.0\tRhodospirillales\torder\t0.69\tRhodospirillaceae\tfamily\t0.68\tPelagibius\tgenus\t0.31\n+OTU_526\t\tRoot\trootrank\t1.0\tBacteria\tdomain\t1.0\t"Proteobacteria"\tphylum\t1.0\tBetaproteobacteria\tclass\t1.0\tNeisseriales\tord
er\t1.0\tNeisseriaceae\tfamily\t1.0\tNeisseria\tgenus\t1.0\n+OTU_527\t\tRoot\trootrank\t1.0\tBacteria\tdomain\t1.0\t"Proteobacteria"\tphylum\t1.0\tDeltaproteobacteria\tclass\t1.0\tBdellovibrionales\torder\t1.0\tBacteriovoracaceae\tfamily\t1.0\tPeredibacter\tgenus\t0.76\n+OTU_528\t\tRoot\trootrank\t1.0\tBacteria\tdomain\t1.0\t"Proteobacteria"\tphylum\t1.0\tAlphaproteobacteria\tclass\t1.0\tRhodobacterales\torder\t1.0\tRhodobacteraceae\tfamily\t1.0\tAlbidovulum\tgenus\t0.4\n+OTU_529\t\tRoot\trootrank\t1.0\tBacteria\tdomain\t1.0\t"Chlorobi"\tphylum\t1.0\t"Chlorobia"\tclass\t1.0\tChlorobiales\torder\t1.0\tChlorobiaceae\tfamily\t1.0\tProsthecochloris\tgenus\t1.0\n+OTU_530\t\tRoot\trootrank\t1.0\tBacteria\tdomain\t1.0\tOD1\tphylum\t0.78\tOD1_genera_incertae_sedis\tgenus\t0.78\n+OTU_531\t\tRoot\trootrank\t1.0\tBacteria\tdomain\t1.0\t"Actinobacteria"\tphylum\t1.0\tActinobacteria\tclass\t1.0\tActinobacteridae\tsubclass\t1.0\tActinomycetales\torder\t1.0\tFrankineae\tsuborder\t1.0\tAcidothermaceae\tfamily\t1.0\tAcidothermus\tgenus\t1.0\n+OTU_532\t\tRoot\trootrank\t1.0\tBacteria\tdomain\t1.0\t"Proteobacteria"\tphylum\t1.0\tAlphaproteobacteria\tclass\t1.0\tRhodobacterales\torder\t1.0\tRhodobacteraceae\tfamily\t1.0\tRhodobacter\tgenus\t1.0\n+OTU_533\t\tRoot\trootrank\t1.0\tBacteria\tdomain\t1.0\t"Proteobacteria"\tphylum\t0.74\tDeltaproteobacteria\tclass\t0.48\tDesulfarculales\torder\t0.1\tDesulfarculaceae\tfamily\t0.1\tDesulfarculus\tgenus\t0.1\n+OTU_534\t\tRoot\trootrank\t1.0\tBacteria\tdomain\t1.0\t"Proteobacteria"\tphylum\t1.0\tAlphaproteobacteria\tclass\t1.0\tRhodobacterales\torder\t1.0\tRhodobacteraceae\tfamily\t1.0\tOceanicola\tgenus\t1.0\n+OTU_535\t\tRoot\trootrank\t1.0\tBacteria\tdomain\t1.0\t"Proteobacteria"\tphylum\t1.0\tGammaproteobacteria\tclass\t1.0\tPseudomonadales\torder\t0.46\tPseudomonadales_incertae_sedis\tfamily\t0.39\tDasania\tgenus\t0.39\n+OTU_536\t\tRoot\trootrank\t1.0\tBacteria\tdomain\t0.99\tOD1\tphylum\t0.37\tOD1_genera_incertae_sedis\tgenus\t0.37\n'
b
diff -r 000000000000 -r a73ae72b47aa rdpmulticlassifier/test-data/class_hier.tab
--- /dev/null Thu Jan 01 00:00:00 1970 +0000
+++ b/rdpmulticlassifier/test-data/class_hier.tab Thu May 29 02:27:56 2014 -0400
b
b'@@ -0,0 +1,388 @@\n+taxid\tlineage\tname\trank\tdataset_105.dat\n+0\tnull\tRoot\tno rank\t536\n+1\tRoot;rootrank;Bacteria;domain;\tBacteria\tdomain\t526\n+841\tRoot;rootrank;Bacteria;domain;"Proteobacteria";phylum;\t"Proteobacteria"\tphylum\t249\n+1501\tRoot;rootrank;Bacteria;domain;"Proteobacteria";phylum;Gammaproteobacteria;class;\tGammaproteobacteria\tclass\t74\n+1520\tRoot;rootrank;Bacteria;domain;"Proteobacteria";phylum;Gammaproteobacteria;class;Alteromonadales;order;\tAlteromonadales\torder\t10\n+1521\tRoot;rootrank;Bacteria;domain;"Proteobacteria";phylum;Gammaproteobacteria;class;Alteromonadales;order;Alteromonadaceae;family;\tAlteromonadaceae\tfamily\t8\n+1529\tRoot;rootrank;Bacteria;domain;"Proteobacteria";phylum;Gammaproteobacteria;class;Alteromonadales;order;Alteromonadaceae;family;Haliea;genus;\tHaliea\tgenus\t6\n+1530\tRoot;rootrank;Bacteria;domain;"Proteobacteria";phylum;Gammaproteobacteria;class;Alteromonadales;order;Alteromonadaceae;family;Marinimicrobium;genus;\tMarinimicrobium\tgenus\t1\n+1526\tRoot;rootrank;Bacteria;domain;"Proteobacteria";phylum;Gammaproteobacteria;class;Alteromonadales;order;Alteromonadaceae;family;Alteromonas;genus;\tAlteromonas\tgenus\t1\n+1551\tRoot;rootrank;Bacteria;domain;"Proteobacteria";phylum;Gammaproteobacteria;class;Alteromonadales;order;Pseudoalteromonadaceae;family;\tPseudoalteromonadaceae\tfamily\t2\n+1553\tRoot;rootrank;Bacteria;domain;"Proteobacteria";phylum;Gammaproteobacteria;class;Alteromonadales;order;Pseudoalteromonadaceae;family;Pseudoalteromonas;genus;\tPseudoalteromonas\tgenus\t2\n+1566\tRoot;rootrank;Bacteria;domain;"Proteobacteria";phylum;Gammaproteobacteria;class;Chromatiales;order;\tChromatiales\torder\t4\n+1567\tRoot;rootrank;Bacteria;domain;"Proteobacteria";phylum;Gammaproteobacteria;class;Chromatiales;order;Chromatiaceae;family;\tChromatiaceae\tfamily\t3\n+1588\tRoot;rootrank;Bacteria;domain;"Proteobacteria";phylum;Gammaproteobacteria;class;Chromatiales;order;Chromatiaceae;family;Thiohalocapsa;gen
us;\tThiohalocapsa\tgenus\t1\n+1586\tRoot;rootrank;Bacteria;domain;"Proteobacteria";phylum;Gammaproteobacteria;class;Chromatiales;order;Chromatiaceae;family;Thiodictyon;genus;\tThiodictyon\tgenus\t1\n+1595\tRoot;rootrank;Bacteria;domain;"Proteobacteria";phylum;Gammaproteobacteria;class;Chromatiales;order;Ectothiorhodospiraceae;family;\tEctothiorhodospiraceae\tfamily\t1\n+1608\tRoot;rootrank;Bacteria;domain;"Proteobacteria";phylum;Gammaproteobacteria;class;Chromatiales;order;Ectothiorhodospiraceae;family;Thiorhodospira;genus;\tThiorhodospira\tgenus\t1\n+-1568\tRoot;rootrank;Bacteria;domain;"Proteobacteria";phylum;Gammaproteobacteria;class;Chromatiales;order;Chromatiaceae;family;unclassified_Chromatiaceae;;\tunclassified_Chromatiaceae\t\t1\n+1668\tRoot;rootrank;Bacteria;domain;"Proteobacteria";phylum;Gammaproteobacteria;class;Legionellales;order;\tLegionellales\torder\t8\n+1669\tRoot;rootrank;Bacteria;domain;"Proteobacteria";phylum;Gammaproteobacteria;class;Legionellales;order;Coxiellaceae;family;\tCoxiellaceae\tfamily\t7\n+1671\tRoot;rootrank;Bacteria;domain;"Proteobacteria";phylum;Gammaproteobacteria;class;Legionellales;order;Coxiellaceae;family;Coxiella;genus;\tCoxiella\tgenus\t6\n+1670\tRoot;rootrank;Bacteria;domain;"Proteobacteria";phylum;Gammaproteobacteria;class;Legionellales;order;Coxiellaceae;family;Aquicella;genus;\tAquicella\tgenus\t1\n+1672\tRoot;rootrank;Bacteria;domain;"Proteobacteria";phylum;Gammaproteobacteria;class;Legionellales;order;Legionellaceae;family;\tLegionellaceae\tfamily\t1\n+1674\tRoot;rootrank;Bacteria;domain;"Proteobacteria";phylum;Gammaproteobacteria;class;Legionellales;order;Legionellaceae;family;Legionella;genus;\tLegionella\tgenus\t1\n+1762\tRoot;rootrank;Bacteria;domain;"Proteobacteria";phylum;Gammaproteobacteria;class;Pseudomonadales;order;\tPseudomonadales\torder\t8\n+1763\tRoot;rootrank;Bacteria;domain;"Proteobacteria";phylum;Gammaproteobacteria;class;Pseudomonadales;order;Moraxellaceae;family;\tMoraxellaceae\tfamily\t3\n+1764\tRo
ot;rootrank;Bacteria;domain;"Proteobacteria";phylum;Gammaproteobacteria;class;Pseudomonadales;order;Moraxellaceae;family;Acinetobacter;gen'..b'ycetes"\tphylum\t2\n+837\tRoot;rootrank;Bacteria;domain;"Planctomycetes";phylum;Phycisphaerae;class;\tPhycisphaerae\tclass\t1\n+838\tRoot;rootrank;Bacteria;domain;"Planctomycetes";phylum;Phycisphaerae;class;Phycisphaerales;order;\tPhycisphaerales\torder\t1\n+839\tRoot;rootrank;Bacteria;domain;"Planctomycetes";phylum;Phycisphaerae;class;Phycisphaerales;order;Phycisphaeraceae;family;\tPhycisphaeraceae\tfamily\t1\n+840\tRoot;rootrank;Bacteria;domain;"Planctomycetes";phylum;Phycisphaerae;class;Phycisphaerales;order;Phycisphaeraceae;family;Phycisphaera;genus;\tPhycisphaera\tgenus\t1\n+825\tRoot;rootrank;Bacteria;domain;"Planctomycetes";phylum;"Planctomycetacia";class;\t"Planctomycetacia"\tclass\t1\n+826\tRoot;rootrank;Bacteria;domain;"Planctomycetes";phylum;"Planctomycetacia";class;Planctomycetales;order;\tPlanctomycetales\torder\t1\n+827\tRoot;rootrank;Bacteria;domain;"Planctomycetes";phylum;"Planctomycetacia";class;Planctomycetales;order;Planctomycetaceae;family;\tPlanctomycetaceae\tfamily\t1\n+-828\tRoot;rootrank;Bacteria;domain;"Planctomycetes";phylum;"Planctomycetacia";class;Planctomycetales;order;Planctomycetaceae;family;unclassified_Planctomycetaceae;;\tunclassified_Planctomycetaceae\t\t1\n+-2165\tRoot;rootrank;Bacteria;domain;"Verrucomicrobia";phylum;unclassified_"Verrucomicrobia";;\tunclassified_"Verrucomicrobia"\t\t1\n+804\tRoot;rootrank;Bacteria;domain;"Gemmatimonadetes";phylum;\t"Gemmatimonadetes"\tphylum\t2\n+805\tRoot;rootrank;Bacteria;domain;"Gemmatimonadetes";phylum;Gemmatimonadetes;class;\tGemmatimonadetes\tclass\t2\n+806\tRoot;rootrank;Bacteria;domain;"Gemmatimonadetes";phylum;Gemmatimonadetes;class;Gemmatimonadales;order;\tGemmatimonadales\torder\t2\n+807\tRoot;rootrank;Bacteria;domain;"Gemmatimonadetes";phylum;Gemmatimonadetes;class;Gemmatimonadales;order;Gemmatimonadaceae;family;\tGemmatimonadaceae\tfamily\t2\
n+808\tRoot;rootrank;Bacteria;domain;"Gemmatimonadetes";phylum;Gemmatimonadetes;class;Gemmatimonadales;order;Gemmatimonadaceae;family;Gemmatimonas;genus;\tGemmatimonas\tgenus\t2\n+667\tRoot;rootrank;Bacteria;domain;"Chlamydiae";phylum;\t"Chlamydiae"\tphylum\t2\n+668\tRoot;rootrank;Bacteria;domain;"Chlamydiae";phylum;Chlamydiae;class;\tChlamydiae\tclass\t2\n+669\tRoot;rootrank;Bacteria;domain;"Chlamydiae";phylum;Chlamydiae;class;Chlamydiales;order;\tChlamydiales\torder\t2\n+673\tRoot;rootrank;Bacteria;domain;"Chlamydiae";phylum;Chlamydiae;class;Chlamydiales;order;Parachlamydiaceae;family;\tParachlamydiaceae\tfamily\t2\n+674\tRoot;rootrank;Bacteria;domain;"Chlamydiae";phylum;Chlamydiae;class;Chlamydiales;order;Parachlamydiaceae;family;Neochlamydia;genus;\tNeochlamydia\tgenus\t1\n+-674\tRoot;rootrank;Bacteria;domain;"Chlamydiae";phylum;Chlamydiae;class;Chlamydiales;order;Parachlamydiaceae;family;unclassified_Parachlamydiaceae;;\tunclassified_Parachlamydiaceae\t\t1\n+1921\tRoot;rootrank;Bacteria;domain;"Tenericutes";phylum;\t"Tenericutes"\tphylum\t1\n+1922\tRoot;rootrank;Bacteria;domain;"Tenericutes";phylum;Mollicutes;class;\tMollicutes\tclass\t1\n+1923\tRoot;rootrank;Bacteria;domain;"Tenericutes";phylum;Mollicutes;class;Acholeplasmatales;order;\tAcholeplasmatales\torder\t1\n+1924\tRoot;rootrank;Bacteria;domain;"Tenericutes";phylum;Mollicutes;class;Acholeplasmatales;order;Acholeplasmataceae;family;\tAcholeplasmataceae\tfamily\t1\n+1925\tRoot;rootrank;Bacteria;domain;"Tenericutes";phylum;Mollicutes;class;Acholeplasmatales;order;Acholeplasmataceae;family;Acholeplasma;genus;\tAcholeplasma\tgenus\t1\n+-2260\tRoot;rootrank;Bacteria;domain;Firmicutes;phylum;unclassified_Firmicutes;;\tunclassified_Firmicutes\t\t1\n+694\tRoot;rootrank;Bacteria;domain;"Chloroflexi";phylum;\t"Chloroflexi"\tphylum\t1\n+-695\tRoot;rootrank;Bacteria;domain;"Chloroflexi";phylum;unclassified_"Chloroflexi";;\tunclassified_"Chloroflexi"\t\t1\n+-2\tRoot;rootrank;Bacteria;domain;unclassified_Bacteria;;\tu
nclassified_Bacteria\t\t49\n+1966\tRoot;rootrank;Archaea;domain;\tArchaea\tdomain\t10\n+2010\tRoot;rootrank;Archaea;domain;"Euryarchaeota";phylum;\t"Euryarchaeota"\tphylum\t10\n+-2011\tRoot;rootrank;Archaea;domain;"Euryarchaeota";phylum;unclassified_"Euryarchaeota";;\tunclassified_"Euryarchaeota"\t\t10\n'
b
diff -r 000000000000 -r a73ae72b47aa rdpmulticlassifier/test-data/otu_table.tab
--- /dev/null Thu Jan 01 00:00:00 1970 +0000
+++ b/rdpmulticlassifier/test-data/otu_table.tab Thu May 29 02:27:56 2014 -0400
b
b'@@ -0,0 +1,536 @@\n+OTU_2\t60\t\tAACGTACGCTGGCGGCACGCCTAACACATGCAAGTCGAACGCAGTAGCAATACTGAGTGGCAAACGGGTGAGTATAATGTGGGAATCTGCCTTTTGGTTTGGAATAACACGGGGAAACTTGTGCTAATACCGAATAAGCCCTTACGGGGAAAGTTTTAACGCCGAAAGATGAGCCTGCACTTGATTAGCTAGTTGGTAAGGTAAAAGCTTACCAAGGCAACGATCAATAGCTGTTCTTAGAGGAAGACCAGCCACATTGGGACTGAGACACGGCCCAGACTCCTACGGGAGGCAGCAGTGGGGAATCTTGCACAATGGgggAAACCCTGATGCAGCGATGCCGCGTGAGTGAAGAGGGCCCTTGGGTTGTAAAACTCTTTCGTCGGGGAAGAAAATGACTGTACCCGAATAAGAAGGTCCGGCTAACTTCGTGCCAGCAGCCGCGGTAATACGAAGGGACCTAGCGTAGTTCGGAATTACTGGGCTTAAAGAGCTCGTAGGTGGTTAAaaaaGTTGATGGTGAAATCCCAAGGCTCAACCTTGGAACTGCCATCAAAACTTtttAGCTAGAGTGTGATAGAGGTAAGTGGAATTTCTAGTGTAGAGGTGAAATTCGTAGATATTAGAAAGAACACCAAATGCGAAGGCAACTTACTGGGTCACTACTGACACTGAGGAGCGAAAGCATGGGTAGCGAAGAGGATTAGATACCCTCGTAGTCCATGCCGTAAACGATGtgtgCTAGACGTTGGAAATatatTtttCAGTGTCGCAGCGAAAGCATTAAGCACACCGCCTGGGGAGTACGACCGCAAGGTTAAAACTCAAATGAATTGACGGGGACCCGCACAAGCAGTGGAGCATGTGGTTTAATTCGAAGATACGCGCAGAACCTTACCAACACTTGACATGTTCGTCGCGAAACTAAGAGATTAGTTttttCAGTTCGGCTGGACGAAACACAGGTGCTGCATGGCTGTCGTCAGCTCGTGTCGTGAGATGTTGGGTTAAGTCCCGCAACGAGCGCAACCCCTACTTTTAGTTGCCACCATTTAGTTGGGCACTTTAAAAGAACTGCCAGTGATAAGCTGGAGGAAGGTGGGGATGACGTCAAGTCCTCATGGCCCTTATGTGTTGGGCTACacacGTGCTACAATGGTACTTACAATGGGATGCAAAGAGGTGACTCTTAGCTAATCCCTAAAATGTACCTCAGTTCGGATTGTACTCTGTAACTCGAGTGCATGAAGCTGGAATTGCTAGTAATCGCGGATCAGCgcgcCGCGGTGAATACGTTCCCGGGTCTTGTACacacCGCCCGTCACACCATGGAAGTTGGTTACACCTTAAGGCAAAGCTTATACCTTTGACTACGGTACGATCAGCAACTGGGGTGAAGTCGTAACAAGGTAGCCGTAGGGGAACCTGCGGCTGGATTACCTCCTTTCTAAGGA\tRoot\trootrank\t1.0\tBacteria\tdomain\t1.0\t"Proteobacteria"\tphylum\t0.98\tAlphaproteobacteria\tclass\t0.89\tRhizobiales\torder\t0.42\t"Aurantimonadaceae"\tfamily\t0.22\tMartelella\tgenus\t0.22\t\n+OTU_1\t4\t\tAGAGTTTGATCCTGGCTCAGATTGAACGCTGGCGGCAGGCCTAACACATGCAAGTCGAGCGCGAAATCTCCTTCGGGAGTGAGTAGAGCGGCGGACGGGTGAGTAACGCGTAGGAATCTACCCAGTGGTGGgggACAACCTGGGGAAACCCAGGCTAATACCGCATACGCCCTACGGgggAAAGCGGgggCTctctTCGGAGACCTCGCGCCATTGGATGAGCCTGCGTTGGATTAGCTAGTTGGTGGGGTAAAGGCCTACCAAGGCGACGATCCATAGCTGGTCTGAGAGGACGATC
AGCCACACTGGGACTGAGACACGGCCCAGACTCCTACGGGAGGCAGCAGTGGGGAATATTGCGCAATGGgggAAACCCTGACGCAGCCATGCCGCGTgtgtgAAGAAGGCTCTAGGGTTGTAAAGCACTTTCAGTAGGGAGAAaaaGCTCATGTTTAATAGATGTGAGTGTTGATGTTACCTACAGAAGAAGCACCGGCTAACTCCGTGCCAGCAGCCGCGGTAATACGGAGGGTGCAAGCGTTAATCGGAATTACTGGGCGTAAAGCgcgcgTAGGCGGTTTGTTAAGTCGGATGTGAAAGCCCCGGGCTCAACCTGGGAATTGCATTCGATACTGATCGACTAGAGTACGAgagagGGAGGTAGAATTCCACGTGTAGCGGTGAAATGCGTAGATATGTGGAGGAATACCGGTGGCGAAGGCGGCCTCCTGGCTCGATACTGACGCTGAGGTGCGAAAGCGTGGGGAGCAAACAGGATTAGATACCCTGGTAGTCCACGCCGTAAACGATGTCAACTAGCCGTTGGGGAACTTGATTCCTTAGTGGCGCAGCTAACGCAATAAGTTGACCGCCTGGGGAGTACGGCCGCAAGGTTAAAACTCAAATGAATTGACGGgggCCCGCACAAGCGGTGGAGCATGTGGTTTAATTCGATGCAACGCGAAGAACCTTACCAGGTCTTGACATCCTGAAAACTTTCCAGAGATGGATTGGTGCCTTCGGGAATTCAGTGACAGGTGCTGCATGGCTGTCGTCAGCTCGTGTCGTGAGATGTTGGGTTAAGTCCCGTAACGAGCGCAACCCTTGTCCTTAGTTGCCAGCACGTAATGGTGGGAACTCTAAGGAGACTGCCGGTGACAAACCGGAGGAAGGTGGGGACGACGTCAAGTCATCATGGCCCTTACGACCTGGGCTACacacGTGCTACAATGGTCGGTACAGACGGCTGCGAACCCGCGAGGgggAGCGAATCCGAGAAAACCGATCGTAGTCCGGATTGGAGTCTGCAACTCGACTCCATGAAGTCGGAATCGCTAGTAATCGCGAATCAGAATGTCGCGGTGAATACGTTCCCGGGCCTTGTACacacCGCCCGTCACACCATGGGAGTGGGTTGCTCCAGAAGTGGTTAGCCTAACCTTAGGGAGGGCGATCACCACGGAGTGATTCATGACTGGGGTGAAGTCGTAACAAGGTAACC\tRoot\trootrank\t1.0\tBacteria\tdomain\t1.0\t"Proteobacteria"\tphylum\t1.0\tGammaproteobacteria\tclass\t1.0\tAlteromonadales\torder\t1.0\tAlteromonadaceae\tfamily\t1.0\tHaliea\tgenus\t1.0\t\n+OTU_3\t3\t\tAGAGTTTGATCATGGCTCAGGACGAACGCTGGCGGCGTGCTTAACACATGCAAGTCGAGCGATGAAGCACCTTCGGGTGTGAATTAGCGGCGAACGGGTGAGGAACACGTGAGAAATCTGCCTTCAACACTGGGATAACTCCGGGAAACCGGGGCTAATACCGGATATGAAACCTGCGGGCATCCGCGGGTTTGGAAAGTTtttCGGTTGAAGATGATCTCGCGGCCTATCAGCTTGTTGGTGAGGTAATGGCTCACCAAGGCAACGACGGGTAGCTGGTCTGAGAGGATGATCAGCCACACTGGGACTGAGACACGGCCCAGACTCCTACGGGAGGCAGCAGTGGGGAATCTTGCGCAATGGGCGAAAGCCTGACGCAGCAACGCCGCGTGCGGGATGAAGGCCTTCGGGTTGTAAACCTCTTTCAGTAGGGAAGAAGCGAAAGTGACGGTACCTGCAGAAGAAGCACCGGCTAACTACGTGCCAGCAGCCGCGGTAATACGTAGGGTGCAAGCGTTGTCCGGATTTATTGGGCGTAAAGAGCTCGTAGGCGGTTAGACACGTCGGATGTGAAAACTGGgggCTCAACCcc
cAGCCTGCATTCGATACGGGAGGACTCGAGGACGGCAGGGGAGACTGGAACTTCTGG'..b'CGGTCGCAAGATTAAAACTCAAAGGAATTGACGGgggCCCGCACAAGCGGTGGAGCATGTGGTTTAATTCGAAGCAACGCGCAGAACCTTACCAACCCTTGACATCCTGTGCTACATGGAgagaTCCATGGTTCCCTTCGGGGACGCAGTGACAGGTGCTGCATGGCTGTCGTCAGCTCGTGTCGTGAGATGTTCGGTTAAGTCCGGCAACGAGCGCAACCCACACCCTTAGTTGCCAGCAGTTCGGCTGGGCACTCTAGGGGAACTGCCCGTGATAAGCGGGAGGAAGGTGTGGATGACGTCAAGTCCTCATGGCCCTTACGGGTTGGGCTACacacGTGCTACAATGGCAGTGACAATGGGTTAATCCCCAAaaaCTGTCTCAGTTCGGATTGTCGTCTGCAACTCGACGGCATGAAGTCGGAATCGCTAGTAATCGCGTAACAGCATGACGCGGTGAATACGTTCCCGGGCCTTGTACacacCGCCCGTCACATCATGGGAGTTGGGTTTACCCGAAGACGGTGCGCCAACCTGTTCGCAGGgggCAGCTGGCCACGGTAGGCTCAGCGACTGGGATGAAGTCGTAACAAGGTAGCCGTAGGGGAACCTGCGGCTGGATCACCTCCTTTCT\tRoot\trootrank\t1.0\tBacteria\tdomain\t1.0\t"Proteobacteria"\tphylum\t1.0\tAlphaproteobacteria\tclass\t1.0\tRhodobacterales\torder\t1.0\tRhodobacteraceae\tfamily\t1.0\tOceanicola\tgenus\t1.0\t\n+OTU_535\t1\t\tCGCTGGCGGCAGGCTTAACACATGCAAGTCGAGCGGTAACAGGGGAGCTTGCTCCCGCTGACGAGCGGCGGACGGGTGAGTAACGCGTAGGAATCTGCCCAATAGTGGgggATAGCCCGGGGAAACTCGGATTAATACCGCATACGCCCTACGGgggAAAGGCCGGGATCTTCGGACCGGTCGCTATTGGATGAGCCTGCGTAAGATTAGCTAGTTGGTAGGGTAAAGGCCTACCAAGGCGACGATCTTTAGCTGGTCTGAGAGGATGATCAGCCACACTGGAACTGAGACACGGTCCAGACTCCTACGGGAGGCAGCAGTGGGGAATATTGGACAATGGgggCAACCCTGATCCAGCCATGCCGCGTgtgtgAAGAAGGCCTTAGGGTTGTAAAGCACTTTAAGTTGGGAGGAAGGCTCTGTAGCTAATATCTGCAGGGATTGACGTTACCAACAGAATAAGCACCGGCTAACTCCGTGCCAGCAGCCGCGGTAATACGGAGGGTGCAAGCGTTAATCGGAATTACTGGGCGTAAAGCgcgcgTAGGCGGTTTGGTAAGTGTGATGTGAAAGCCCAGGGCTTAACCTTGGAACTGCATCACATACTGCCAGGCTAGAGTACGGTAGAGGggggTAGAATTCCACGTGTAGCGGTGAAATGCGTAGAGATGTGGAGGAATACCAGTGGCGAAGGCGGCCcccTGGATCGATACTGACGCTGAGGTGCGAAAGCGTGGGGAGCAAACAGGATTAGATACCCTGGTAGTCCACGCCGTAAACGATGTCAACTAGCCGTTGGAAGGGTAATCCTTTTAGTGGCGCAGCTAACGCTCTAAGTTGACCGCCTGGGGAGTACGGTCGCAAGATTAAAACTCAAATGAATTGACGGgggCCCGCACAAGCGGTGGAGCATGTGGTTTAATTCGACGCAACGCGAAGAACCTTACCTGGTCTTGACATCCTGCGAACTTTCCAGAGATGGATTGGTGCCTTCGGGAGCGCAGTGACAGGTGCTGCATGGCTGTCGTCAGCTCGTGTCGTGAGATGTTGGGTTAAGTCCCGTAACGAGCGCAACCCTTGTCCTTAGTTGCCA
TCATTTAGTTGGGCACTTTAGGGAGACTGCCGGTGACAAACCGGAGGAAGGTGGGGACGACGTCAAGTCATCATGGCCCTTACGACCAGGGCTACacacGTGCTACAATGGAGCGTACAAAGGGTTGCAACCCCGCGAGGGTGAGCTAATCCCATAAAACGTTTCGTAGTCCGGATCGCAGTCTGCAACTCGACTGCGTGAAGTCGGAATCGCTAGTAATCGCGAATCAGAATGTCGCGGTGAATACGTTCCCGGGCCTTGTACacacCGCCCGTCACACCATGGGAGTGGGTTGCAAAAGAAGTGGGTAGCATAACCGCAAGGAGTGCGCTCACCACTTTGTGATTCATGACTGGGGTGAAGTCGTAACAAGGTAACCGTA\tRoot\trootrank\t1.0\tBacteria\tdomain\t1.0\t"Proteobacteria"\tphylum\t1.0\tGammaproteobacteria\tclass\t1.0\tPseudomonadales\torder\t0.46\tPseudomonadales_incertae_sedis\tfamily\t0.39\tDasania\tgenus\t0.39\t\n+OTU_536\t1\t\tGAGTTTGATCCTGGCTCAGGATGAACGCTGGCGGCGTGGATAAGTCATGCAAGTCAAGGgggCTCGCAAGAGCAACCGGCAGACGAGGTAGTAATAAGTAGGTACGTCCCTTCAAGTCACGAATAGCCCGTCGAAAGACGGGGTAATACGCGATAGTCCCTTCGGGGTAAAGATTTATCGCTTGAAGAACGGCCTGCTCGGTATCAGCTAGTTGGCGGTGTAAAAGACCACCAAGGCTATGACGCCTAGGGGAGCTGAGAGGCTGACCcccACCGATGGGACTGAGATACGGCCCATACACCTACGGGTGGCTGCAGACGAGAATATTCCACAATGGACGAAAGTCTGATGGAGCGACGCCGCGTGCAGGATGAAGTTCTTCGGGATGTAAACTGCTTTTATGAGCGAGAAAGTTTATTGATCAGCTCATGAATAAGAGGTTGCTAAACTCGTGCCAGCAGCAGCGGTAATACGAGTGCCTCAAGCGTTATCCGGAATCATTGGGCGTAAAGGGTgtgtAGGTGGTCGCGTTAGTCTTCCGTTAAATTCTTCGGCTCAACCGGgggCATGCGGgggAAACGGCGCGACTTGAGGATGCGAGAGGAAAGCGGAACTCATAGTGTAGCGGTGAAATGCGTTGATATTATGGGGAACACCAAATGCGAAGGCAGCTTTCTGGAGCATCCTGACACTGAAACACGAAAGCGTGGGTAGCGAACGGGATTAGATACCCCGGTAGTCCACGCCCTAAACGATGATCACTAGCTATTCGGAGTATCGACCTCCAAGTGGCGTAGCTAACGCGTTAAGTGATCCGCCTGGGTAGTACGGCCGCAAGGCTAAAACTCAAAGGAATAGACGGGGACTTGCACAAGCGGAGGAACATGTGGTTCAATTCGATGGTAAACGAAaaaCCTTACCAGGGTTGGAAATCAGTTGAGATAGGCAGAAACGTCTATGCCGCAAGGCAATTAGACAGGTGCTGCATGGTCGTCGTCAGTTCGTGGCTTGAGTTGTTCCCTTCAGTGGGGTAACGAACGCAACCcccGTTGCCTGGTATAAGTATCAGGCGAGACTGCCCAGGTTAACTGGGAGGAAGGTGGGGATGACGCCAGATCAGCATGGCCCTTATACCTGGGCCTACacacGTGTTACAATGGCCGACTCACGCGAGGCGAAGAGGAAACTCGGAGCAAATCGTAAaaaGTCGGCCAAGTTCGGATTGAGGGCTGCAACTCGCCCTCATGAAGCGGGATTCGCTAGTAATCGCAGATCAGCATGCTGCGGTGAATACGTTCTCAAGTCTTGTACTCACCGCCCGTCAACTCAAGGGAGCTGGGAATACCCGAAGTCGCCCTTGGGCGCCTAAGGTAAGCTCAGTGACAGGGAGTAA
GTCGTAACAAGGTAACCGT\tRoot\trootrank\t1.0\tBacteria\tdomain\t0.99\tOD1\tphylum\t0.37\tOD1_genera_incertae_sedis\tgenus\t0.37\t\n'
b
diff -r 000000000000 -r a73ae72b47aa rdpmulticlassifier/test-data/otuseqs.tab
--- /dev/null Thu Jan 01 00:00:00 1970 +0000
+++ b/rdpmulticlassifier/test-data/otuseqs.tab Thu May 29 02:27:56 2014 -0400
b
b'@@ -0,0 +1,10558 @@\n+>OTU_1\n+AGAGTTTGATCCTGGCTCAGATTGAACGCTGGCGGCAGGCCTAACACATGCAAGTCGAGCGCGAAATCTCCTTCGGGAGT\n+GAGTAGAGCGGCGGACGGGTGAGTAACGCGTAGGAATCTACCCAGTGGTGGgggACAACCTGGGGAAACCCAGGCTAATA\n+CCGCATACGCCCTACGGgggAAAGCGGgggCTctctTCGGAGACCTCGCGCCATTGGATGAGCCTGCGTTGGATTAGCTA\n+GTTGGTGGGGTAAAGGCCTACCAAGGCGACGATCCATAGCTGGTCTGAGAGGACGATCAGCCACACTGGGACTGAGACAC\n+GGCCCAGACTCCTACGGGAGGCAGCAGTGGGGAATATTGCGCAATGGgggAAACCCTGACGCAGCCATGCCGCGTgtgtg\n+AAGAAGGCTCTAGGGTTGTAAAGCACTTTCAGTAGGGAGAAaaaGCTCATGTTTAATAGATGTGAGTGTTGATGTTACCT\n+ACAGAAGAAGCACCGGCTAACTCCGTGCCAGCAGCCGCGGTAATACGGAGGGTGCAAGCGTTAATCGGAATTACTGGGCG\n+TAAAGCgcgcgTAGGCGGTTTGTTAAGTCGGATGTGAAAGCCCCGGGCTCAACCTGGGAATTGCATTCGATACTGATCGA\n+CTAGAGTACGAgagagGGAGGTAGAATTCCACGTGTAGCGGTGAAATGCGTAGATATGTGGAGGAATACCGGTGGCGAAG\n+GCGGCCTCCTGGCTCGATACTGACGCTGAGGTGCGAAAGCGTGGGGAGCAAACAGGATTAGATACCCTGGTAGTCCACGC\n+CGTAAACGATGTCAACTAGCCGTTGGGGAACTTGATTCCTTAGTGGCGCAGCTAACGCAATAAGTTGACCGCCTGGGGAG\n+TACGGCCGCAAGGTTAAAACTCAAATGAATTGACGGgggCCCGCACAAGCGGTGGAGCATGTGGTTTAATTCGATGCAAC\n+GCGAAGAACCTTACCAGGTCTTGACATCCTGAAAACTTTCCAGAGATGGATTGGTGCCTTCGGGAATTCAGTGACAGGTG\n+CTGCATGGCTGTCGTCAGCTCGTGTCGTGAGATGTTGGGTTAAGTCCCGTAACGAGCGCAACCCTTGTCCTTAGTTGCCA\n+GCACGTAATGGTGGGAACTCTAAGGAGACTGCCGGTGACAAACCGGAGGAAGGTGGGGACGACGTCAAGTCATCATGGCC\n+CTTACGACCTGGGCTACacacGTGCTACAATGGTCGGTACAGACGGCTGCGAACCCGCGAGGgggAGCGAATCCGAGAAA\n+ACCGATCGTAGTCCGGATTGGAGTCTGCAACTCGACTCCATGAAGTCGGAATCGCTAGTAATCGCGAATCAGAATGTCGC\n+GGTGAATACGTTCCCGGGCCTTGTACacacCGCCCGTCACACCATGGGAGTGGGTTGCTCCAGAAGTGGTTAGCCTAACC\n+TTAGGGAGGGCGATCACCACGGAGTGATTCATGACTGGGGTGAAGTCGTAACAAGGTAACC\n+>OTU_2\n+AACGTACGCTGGCGGCACGCCTAACACATGCAAGTCGAACGCAGTAGCAATACTGAGTGGCAAACGGGTGAGTATAATGT\n+GGGAATCTGCCTTTTGGTTTGGAATAACACGGGGAAACTTGTGCTAATACCGAATAAGCCCTTACGGGGAAAGTTTTAAC\n+GCCGAAAGATGAGCCTGCACTTGATTAGCTAGTTGGTAAGGTAAAAGCTTACCAAGGCAACGATCAATAGCTGTTCTTAG\n+AGGAAGACCAGCCACATTGGGACTGAGACACGGCCCAGACTCCTACGGGAGGCAGCAGTGGGGAATCTTGCACAATGGgg\n+gAAACCCTGATGCAGCGATGCCGCGTGAGTGAAGAGGGCCCTTGGGTTGTAAAACTCTTTCGTCGGGG
AAGAAAATGACT\n+GTACCCGAATAAGAAGGTCCGGCTAACTTCGTGCCAGCAGCCGCGGTAATACGAAGGGACCTAGCGTAGTTCGGAATTAC\n+TGGGCTTAAAGAGCTCGTAGGTGGTTAAaaaaGTTGATGGTGAAATCCCAAGGCTCAACCTTGGAACTGCCATCAAAACT\n+TtttAGCTAGAGTGTGATAGAGGTAAGTGGAATTTCTAGTGTAGAGGTGAAATTCGTAGATATTAGAAAGAACACCAAAT\n+GCGAAGGCAACTTACTGGGTCACTACTGACACTGAGGAGCGAAAGCATGGGTAGCGAAGAGGATTAGATACCCTCGTAGT\n+CCATGCCGTAAACGATGtgtgCTAGACGTTGGAAATatatTtttCAGTGTCGCAGCGAAAGCATTAAGCACACCGCCTGG\n+GGAGTACGACCGCAAGGTTAAAACTCAAATGAATTGACGGGGACCCGCACAAGCAGTGGAGCATGTGGTTTAATTCGAAG\n+ATACGCGCAGAACCTTACCAACACTTGACATGTTCGTCGCGAAACTAAGAGATTAGTTttttCAGTTCGGCTGGACGAAA\n+CACAGGTGCTGCATGGCTGTCGTCAGCTCGTGTCGTGAGATGTTGGGTTAAGTCCCGCAACGAGCGCAACCCCTACTTTT\n+AGTTGCCACCATTTAGTTGGGCACTTTAAAAGAACTGCCAGTGATAAGCTGGAGGAAGGTGGGGATGACGTCAAGTCCTC\n+ATGGCCCTTATGTGTTGGGCTACacacGTGCTACAATGGTACTTACAATGGGATGCAAAGAGGTGACTCTTAGCTAATCC\n+CTAAAATGTACCTCAGTTCGGATTGTACTCTGTAACTCGAGTGCATGAAGCTGGAATTGCTAGTAATCGCGGATCAGCgc\n+gcCGCGGTGAATACGTTCCCGGGTCTTGTACacacCGCCCGTCACACCATGGAAGTTGGTTACACCTTAAGGCAAAGCTT\n+ATACCTTTGACTACGGTACGATCAGCAACTGGGGTGAAGTCGTAACAAGGTAGCCGTAGGGGAACCTGCGGCTGGATTAC\n+CTCCTTTCTAAGGA\n+>OTU_3\n+AGAGTTTGATCATGGCTCAGGACGAACGCTGGCGGCGTGCTTAACACATGCAAGTCGAGCGATGAAGCACCTTCGGGTGT\n+GAATTAGCGGCGAACGGGTGAGGAACACGTGAGAAATCTGCCTTCAACACTGGGATAACTCCGGGAAACCGGGGCTAATA\n+CCGGATATGAAACCTGCGGGCATCCGCGGGTTTGGAAAGTTtttCGGTTGAAGATGATCTCGCGGCCTATCAGCTTGTTG\n+GTGAGGTAATGGCTCACCAAGGCAACGACGGGTAGCTGGTCTGAGAGGATGATCAGCCACACTGGGACTGAGACACGGCC\n+CAGACTCCTACGGGAGGCAGCAGTGGGGAATCTTGCGCAATGGGCGAAAGCCTGACGCAGCAACGCCGCGTGCGGGATGA\n+AGGCCTTCGGGTTGTAAACCTCTTTCAGTAGGGAAGAAGCGAAAGTGACGGTACCTGCAGAAGAAGCACCGGCTAACTAC\n+GTGCCAGCAGCCGCGGTAATACGTAGGGTGCAAGCGTTGTCCGGATTTATTGGGCGTAAAGAGCTCGTAGGCGGTTAGAC\n+ACGTCGGATGTGAAAACTGGgggCTCAACCcccAGCCTGCATTCGATACGGGAGGACTCGAGGACGGCAGGGGAGACTGG\n+AACTTCTGGTGTAGCGGTGGAATGCGCAGATATCAGAAAGAACACCAATGGCGAAGGCAGGTCTCTGGGCCGATCCTGAC\n+GCTGAGGAACGAAAGCGTGGGGAGCAAACAGGATTAGATACCCTGGTAGTCCACGCCGTAAACTATGGACGCTAGGTGTG\n+GgggACATTCCACGTTCTCTGCGCCGCAGCTAACGCATTAAGCGTCCCGC
CTGGGGAGTACGACCGCAAGGTTAAAACTC\n+AAAGGAATTGACGGgggCCCG'..b'\n+ACGGAGGgggTTAGCGTTGTTCGGAATTACTGGGCGTAAAGCGCACGTAGGCGGACTATTAAGTCAGGGGTGAAATCCCG\n+GGGCTCAACCCCGGAACTGCCCTTGATACTGGTAGTCTTGAGTTCGAgagagGTGAGTGGAATTCCGAGTGTAGAGGTGA\n+AATTCGTAGATATTCGGAGGAACACCAGTGGCGAAGGCGGCTCACTGGCTCGATACTGACGCTGAGGTGCGAAAGTGTGG\n+GGAGCAAACAGGATTAGATACCCTGGTAGTCCACACCGTAAACGATGAATGCCAGTCGTCGGGTTGCATGCAATTCGGTG\n+ACacacCTAACGGATTAAGCATTCCGCCTGGGGAGTACGGTCGCAAGATTAAAACTCAAAGGAATTGACGGgggCCCGCA\n+CAAGCGGTGGAGCATGTGGTTTAATTCGAAGCAACGCGCAGAACCTTACCAACCCTTGACATCCTGTGCTACATGGAgag\n+aTCCATGGTTCCCTTCGGGGACGCAGTGACAGGTGCTGCATGGCTGTCGTCAGCTCGTGTCGTGAGATGTTCGGTTAAGT\n+CCGGCAACGAGCGCAACCCACACCCTTAGTTGCCAGCAGTTCGGCTGGGCACTCTAGGGGAACTGCCCGTGATAAGCGGG\n+AGGAAGGTGTGGATGACGTCAAGTCCTCATGGCCCTTACGGGTTGGGCTACacacGTGCTACAATGGCAGTGACAATGGG\n+TTAATCCCCAAaaaCTGTCTCAGTTCGGATTGTCGTCTGCAACTCGACGGCATGAAGTCGGAATCGCTAGTAATCGCGTA\n+ACAGCATGACGCGGTGAATACGTTCCCGGGCCTTGTACacacCGCCCGTCACATCATGGGAGTTGGGTTTACCCGAAGAC\n+GGTGCGCCAACCTGTTCGCAGGgggCAGCTGGCCACGGTAGGCTCAGCGACTGGGATGAAGTCGTAACAAGGTAGCCGTA\n+GGGGAACCTGCGGCTGGATCACCTCCTTTCT\n+>OTU_535\n+CGCTGGCGGCAGGCTTAACACATGCAAGTCGAGCGGTAACAGGGGAGCTTGCTCCCGCTGACGAGCGGCGGACGGGTGAG\n+TAACGCGTAGGAATCTGCCCAATAGTGGgggATAGCCCGGGGAAACTCGGATTAATACCGCATACGCCCTACGGgggAAA\n+GGCCGGGATCTTCGGACCGGTCGCTATTGGATGAGCCTGCGTAAGATTAGCTAGTTGGTAGGGTAAAGGCCTACCAAGGC\n+GACGATCTTTAGCTGGTCTGAGAGGATGATCAGCCACACTGGAACTGAGACACGGTCCAGACTCCTACGGGAGGCAGCAG\n+TGGGGAATATTGGACAATGGgggCAACCCTGATCCAGCCATGCCGCGTgtgtgAAGAAGGCCTTAGGGTTGTAAAGCACT\n+TTAAGTTGGGAGGAAGGCTCTGTAGCTAATATCTGCAGGGATTGACGTTACCAACAGAATAAGCACCGGCTAACTCCGTG\n+CCAGCAGCCGCGGTAATACGGAGGGTGCAAGCGTTAATCGGAATTACTGGGCGTAAAGCgcgcgTAGGCGGTTTGGTAAG\n+TGTGATGTGAAAGCCCAGGGCTTAACCTTGGAACTGCATCACATACTGCCAGGCTAGAGTACGGTAGAGGggggTAGAAT\n+TCCACGTGTAGCGGTGAAATGCGTAGAGATGTGGAGGAATACCAGTGGCGAAGGCGGCCcccTGGATCGATACTGACGCT\n+GAGGTGCGAAAGCGTGGGGAGCAAACAGGATTAGATACCCTGGTAGTCCACGCCGTAAACGATGTCAACTAGCCGTTGGA\n+AGGGTAATCCTTTTAGTGGCGCAGCTAACGCTCTAAGTTGACCGCCTGGGGAGTACGGTCGCAAGAT
TAAAACTCAAATG\n+AATTGACGGgggCCCGCACAAGCGGTGGAGCATGTGGTTTAATTCGACGCAACGCGAAGAACCTTACCTGGTCTTGACAT\n+CCTGCGAACTTTCCAGAGATGGATTGGTGCCTTCGGGAGCGCAGTGACAGGTGCTGCATGGCTGTCGTCAGCTCGTGTCG\n+TGAGATGTTGGGTTAAGTCCCGTAACGAGCGCAACCCTTGTCCTTAGTTGCCATCATTTAGTTGGGCACTTTAGGGAGAC\n+TGCCGGTGACAAACCGGAGGAAGGTGGGGACGACGTCAAGTCATCATGGCCCTTACGACCAGGGCTACacacGTGCTACA\n+ATGGAGCGTACAAAGGGTTGCAACCCCGCGAGGGTGAGCTAATCCCATAAAACGTTTCGTAGTCCGGATCGCAGTCTGCA\n+ACTCGACTGCGTGAAGTCGGAATCGCTAGTAATCGCGAATCAGAATGTCGCGGTGAATACGTTCCCGGGCCTTGTACaca\n+cCGCCCGTCACACCATGGGAGTGGGTTGCAAAAGAAGTGGGTAGCATAACCGCAAGGAGTGCGCTCACCACTTTGTGATT\n+CATGACTGGGGTGAAGTCGTAACAAGGTAACCGTA\n+>OTU_536\n+GAGTTTGATCCTGGCTCAGGATGAACGCTGGCGGCGTGGATAAGTCATGCAAGTCAAGGgggCTCGCAAGAGCAACCGGC\n+AGACGAGGTAGTAATAAGTAGGTACGTCCCTTCAAGTCACGAATAGCCCGTCGAAAGACGGGGTAATACGCGATAGTCCC\n+TTCGGGGTAAAGATTTATCGCTTGAAGAACGGCCTGCTCGGTATCAGCTAGTTGGCGGTGTAAAAGACCACCAAGGCTAT\n+GACGCCTAGGGGAGCTGAGAGGCTGACCcccACCGATGGGACTGAGATACGGCCCATACACCTACGGGTGGCTGCAGACG\n+AGAATATTCCACAATGGACGAAAGTCTGATGGAGCGACGCCGCGTGCAGGATGAAGTTCTTCGGGATGTAAACTGCTTTT\n+ATGAGCGAGAAAGTTTATTGATCAGCTCATGAATAAGAGGTTGCTAAACTCGTGCCAGCAGCAGCGGTAATACGAGTGCC\n+TCAAGCGTTATCCGGAATCATTGGGCGTAAAGGGTgtgtAGGTGGTCGCGTTAGTCTTCCGTTAAATTCTTCGGCTCAAC\n+CGGgggCATGCGGgggAAACGGCGCGACTTGAGGATGCGAGAGGAAAGCGGAACTCATAGTGTAGCGGTGAAATGCGTTG\n+ATATTATGGGGAACACCAAATGCGAAGGCAGCTTTCTGGAGCATCCTGACACTGAAACACGAAAGCGTGGGTAGCGAACG\n+GGATTAGATACCCCGGTAGTCCACGCCCTAAACGATGATCACTAGCTATTCGGAGTATCGACCTCCAAGTGGCGTAGCTA\n+ACGCGTTAAGTGATCCGCCTGGGTAGTACGGCCGCAAGGCTAAAACTCAAAGGAATAGACGGGGACTTGCACAAGCGGAG\n+GAACATGTGGTTCAATTCGATGGTAAACGAAaaaCCTTACCAGGGTTGGAAATCAGTTGAGATAGGCAGAAACGTCTATG\n+CCGCAAGGCAATTAGACAGGTGCTGCATGGTCGTCGTCAGTTCGTGGCTTGAGTTGTTCCCTTCAGTGGGGTAACGAACG\n+CAACCcccGTTGCCTGGTATAAGTATCAGGCGAGACTGCCCAGGTTAACTGGGAGGAAGGTGGGGATGACGCCAGATCAG\n+CATGGCCCTTATACCTGGGCCTACacacGTGTTACAATGGCCGACTCACGCGAGGCGAAGAGGAAACTCGGAGCAAATCG\n+TAAaaaGTCGGCCAAGTTCGGATTGAGGGCTGCAACTCGCCCTCATGAAGCGGGATTCGCTAGTAATCGCAGATCAGCAT\n+GCTGCGGTGAATACGTTCTCAAGTCT
TGTACTCACCGCCCGTCAACTCAAGGGAGCTGGGAATACCCGAAGTCGCCCTTG\n+GGCGCCTAAGGTAAGCTCAGTGACAGGGAGTAAGTCGTAACAAGGTAACCGT\n'
b
diff -r 000000000000 -r a73ae72b47aa rdpmulticlassifier/test-data/preotu.tab
--- /dev/null Thu Jan 01 00:00:00 1970 +0000
+++ b/rdpmulticlassifier/test-data/preotu.tab Thu May 29 02:27:56 2014 -0400
b
b'@@ -0,0 +1,536 @@\n+OTU_2\t60\t\tAACGTACGCTGGCGGCACGCCTAACACATGCAAGTCGAACGCAGTAGCAATACTGAGTGGCAAACGGGTGAGTATAATGTGGGAATCTGCCTTTTGGTTTGGAATAACACGGGGAAACTTGTGCTAATACCGAATAAGCCCTTACGGGGAAAGTTTTAACGCCGAAAGATGAGCCTGCACTTGATTAGCTAGTTGGTAAGGTAAAAGCTTACCAAGGCAACGATCAATAGCTGTTCTTAGAGGAAGACCAGCCACATTGGGACTGAGACACGGCCCAGACTCCTACGGGAGGCAGCAGTGGGGAATCTTGCACAATGGgggAAACCCTGATGCAGCGATGCCGCGTGAGTGAAGAGGGCCCTTGGGTTGTAAAACTCTTTCGTCGGGGAAGAAAATGACTGTACCCGAATAAGAAGGTCCGGCTAACTTCGTGCCAGCAGCCGCGGTAATACGAAGGGACCTAGCGTAGTTCGGAATTACTGGGCTTAAAGAGCTCGTAGGTGGTTAAaaaaGTTGATGGTGAAATCCCAAGGCTCAACCTTGGAACTGCCATCAAAACTTtttAGCTAGAGTGTGATAGAGGTAAGTGGAATTTCTAGTGTAGAGGTGAAATTCGTAGATATTAGAAAGAACACCAAATGCGAAGGCAACTTACTGGGTCACTACTGACACTGAGGAGCGAAAGCATGGGTAGCGAAGAGGATTAGATACCCTCGTAGTCCATGCCGTAAACGATGtgtgCTAGACGTTGGAAATatatTtttCAGTGTCGCAGCGAAAGCATTAAGCACACCGCCTGGGGAGTACGACCGCAAGGTTAAAACTCAAATGAATTGACGGGGACCCGCACAAGCAGTGGAGCATGTGGTTTAATTCGAAGATACGCGCAGAACCTTACCAACACTTGACATGTTCGTCGCGAAACTAAGAGATTAGTTttttCAGTTCGGCTGGACGAAACACAGGTGCTGCATGGCTGTCGTCAGCTCGTGTCGTGAGATGTTGGGTTAAGTCCCGCAACGAGCGCAACCCCTACTTTTAGTTGCCACCATTTAGTTGGGCACTTTAAAAGAACTGCCAGTGATAAGCTGGAGGAAGGTGGGGATGACGTCAAGTCCTCATGGCCCTTATGTGTTGGGCTACacacGTGCTACAATGGTACTTACAATGGGATGCAAAGAGGTGACTCTTAGCTAATCCCTAAAATGTACCTCAGTTCGGATTGTACTCTGTAACTCGAGTGCATGAAGCTGGAATTGCTAGTAATCGCGGATCAGCgcgcCGCGGTGAATACGTTCCCGGGTCTTGTACacacCGCCCGTCACACCATGGAAGTTGGTTACACCTTAAGGCAAAGCTTATACCTTTGACTACGGTACGATCAGCAACTGGGGTGAAGTCGTAACAAGGTAGCCGTAGGGGAACCTGCGGCTGGATTACCTCCTTTCTAAGGA\n+OTU_1\t4\t\tAGAGTTTGATCCTGGCTCAGATTGAACGCTGGCGGCAGGCCTAACACATGCAAGTCGAGCGCGAAATCTCCTTCGGGAGTGAGTAGAGCGGCGGACGGGTGAGTAACGCGTAGGAATCTACCCAGTGGTGGgggACAACCTGGGGAAACCCAGGCTAATACCGCATACGCCCTACGGgggAAAGCGGgggCTctctTCGGAGACCTCGCGCCATTGGATGAGCCTGCGTTGGATTAGCTAGTTGGTGGGGTAAAGGCCTACCAAGGCGACGATCCATAGCTGGTCTGAGAGGACGATCAGCCACACTGGGACTGAGACACGGCCCAGACTCCTACGGGAGGCAGCAGTGGGGAATATTGCGCAATGGgggAAACCCTGACGCAGCCATGCCGCGTgtgtgAAGAAGGCTCTAGGGTTGTAAAGCACTTTCAGTAGGGAGAAaaaGCTCATGTTTAATAGATGTGAGTGTTGATGTTACCTACAGAAGAAGCACCGG
CTAACTCCGTGCCAGCAGCCGCGGTAATACGGAGGGTGCAAGCGTTAATCGGAATTACTGGGCGTAAAGCgcgcgTAGGCGGTTTGTTAAGTCGGATGTGAAAGCCCCGGGCTCAACCTGGGAATTGCATTCGATACTGATCGACTAGAGTACGAgagagGGAGGTAGAATTCCACGTGTAGCGGTGAAATGCGTAGATATGTGGAGGAATACCGGTGGCGAAGGCGGCCTCCTGGCTCGATACTGACGCTGAGGTGCGAAAGCGTGGGGAGCAAACAGGATTAGATACCCTGGTAGTCCACGCCGTAAACGATGTCAACTAGCCGTTGGGGAACTTGATTCCTTAGTGGCGCAGCTAACGCAATAAGTTGACCGCCTGGGGAGTACGGCCGCAAGGTTAAAACTCAAATGAATTGACGGgggCCCGCACAAGCGGTGGAGCATGTGGTTTAATTCGATGCAACGCGAAGAACCTTACCAGGTCTTGACATCCTGAAAACTTTCCAGAGATGGATTGGTGCCTTCGGGAATTCAGTGACAGGTGCTGCATGGCTGTCGTCAGCTCGTGTCGTGAGATGTTGGGTTAAGTCCCGTAACGAGCGCAACCCTTGTCCTTAGTTGCCAGCACGTAATGGTGGGAACTCTAAGGAGACTGCCGGTGACAAACCGGAGGAAGGTGGGGACGACGTCAAGTCATCATGGCCCTTACGACCTGGGCTACacacGTGCTACAATGGTCGGTACAGACGGCTGCGAACCCGCGAGGgggAGCGAATCCGAGAAAACCGATCGTAGTCCGGATTGGAGTCTGCAACTCGACTCCATGAAGTCGGAATCGCTAGTAATCGCGAATCAGAATGTCGCGGTGAATACGTTCCCGGGCCTTGTACacacCGCCCGTCACACCATGGGAGTGGGTTGCTCCAGAAGTGGTTAGCCTAACCTTAGGGAGGGCGATCACCACGGAGTGATTCATGACTGGGGTGAAGTCGTAACAAGGTAACC\n+OTU_3\t3\t\tAGAGTTTGATCATGGCTCAGGACGAACGCTGGCGGCGTGCTTAACACATGCAAGTCGAGCGATGAAGCACCTTCGGGTGTGAATTAGCGGCGAACGGGTGAGGAACACGTGAGAAATCTGCCTTCAACACTGGGATAACTCCGGGAAACCGGGGCTAATACCGGATATGAAACCTGCGGGCATCCGCGGGTTTGGAAAGTTtttCGGTTGAAGATGATCTCGCGGCCTATCAGCTTGTTGGTGAGGTAATGGCTCACCAAGGCAACGACGGGTAGCTGGTCTGAGAGGATGATCAGCCACACTGGGACTGAGACACGGCCCAGACTCCTACGGGAGGCAGCAGTGGGGAATCTTGCGCAATGGGCGAAAGCCTGACGCAGCAACGCCGCGTGCGGGATGAAGGCCTTCGGGTTGTAAACCTCTTTCAGTAGGGAAGAAGCGAAAGTGACGGTACCTGCAGAAGAAGCACCGGCTAACTACGTGCCAGCAGCCGCGGTAATACGTAGGGTGCAAGCGTTGTCCGGATTTATTGGGCGTAAAGAGCTCGTAGGCGGTTAGACACGTCGGATGTGAAAACTGGgggCTCAACCcccAGCCTGCATTCGATACGGGAGGACTCGAGGACGGCAGGGGAGACTGGAACTTCTGGTGTAGCGGTGGAATGCGCAGATATCAGAAAGAACACCAATGGCGAAGGCAGGTCTCTGGGCCGATCCTGACGCTGAGGAACGAAAGCGTGGGGAGCAAACAGGATTAGATACCCTGGTAGTCCACGCCGTAAACTATGGACGCTAGGTGTGGgggACATTCCACGTTCTCTGCGCCGCAGCTAACGCATTAAGCGTCCCGCCTGGGGAGTACGACCGCAAGGTTAAAACTCAAAGGAATTGACGGgggCCCGCACAAGCAGCGGAGCATGCGGCTTAATTCGATGCAACGCGAAGAACCTTACCTAGGCTTGACATGCATTGAAAACTGTT
AGAGATAACAGGT'..b'GGCCCTAGGGTCGTAAAGCTCTTTCGCCAGGGATGATAATGACAGTACCTGGTAAAGAAACCCCGGCTAACTCCGTGCCAGCAGCCGCGGTAATACGGAGGgggTTAGCGTTGTTCGGAATTACTGGGCGTAAAGCGCACGTAGGCGGACTATTAAGTCAGGGGTGAAATCCCGGGGCTCAACCCCGGAACTGCCCTTGATACTGGTAGTCTTGAGTTCGAgagagGTGAGTGGAATTCCGAGTGTAGAGGTGAAATTCGTAGATATTCGGAGGAACACCAGTGGCGAAGGCGGCTCACTGGCTCGATACTGACGCTGAGGTGCGAAAGTGTGGGGAGCAAACAGGATTAGATACCCTGGTAGTCCACACCGTAAACGATGAATGCCAGTCGTCGGGTTGCATGCAATTCGGTGACacacCTAACGGATTAAGCATTCCGCCTGGGGAGTACGGTCGCAAGATTAAAACTCAAAGGAATTGACGGgggCCCGCACAAGCGGTGGAGCATGTGGTTTAATTCGAAGCAACGCGCAGAACCTTACCAACCCTTGACATCCTGTGCTACATGGAgagaTCCATGGTTCCCTTCGGGGACGCAGTGACAGGTGCTGCATGGCTGTCGTCAGCTCGTGTCGTGAGATGTTCGGTTAAGTCCGGCAACGAGCGCAACCCACACCCTTAGTTGCCAGCAGTTCGGCTGGGCACTCTAGGGGAACTGCCCGTGATAAGCGGGAGGAAGGTGTGGATGACGTCAAGTCCTCATGGCCCTTACGGGTTGGGCTACacacGTGCTACAATGGCAGTGACAATGGGTTAATCCCCAAaaaCTGTCTCAGTTCGGATTGTCGTCTGCAACTCGACGGCATGAAGTCGGAATCGCTAGTAATCGCGTAACAGCATGACGCGGTGAATACGTTCCCGGGCCTTGTACacacCGCCCGTCACATCATGGGAGTTGGGTTTACCCGAAGACGGTGCGCCAACCTGTTCGCAGGgggCAGCTGGCCACGGTAGGCTCAGCGACTGGGATGAAGTCGTAACAAGGTAGCCGTAGGGGAACCTGCGGCTGGATCACCTCCTTTCT\n+OTU_535\t1\t\tCGCTGGCGGCAGGCTTAACACATGCAAGTCGAGCGGTAACAGGGGAGCTTGCTCCCGCTGACGAGCGGCGGACGGGTGAGTAACGCGTAGGAATCTGCCCAATAGTGGgggATAGCCCGGGGAAACTCGGATTAATACCGCATACGCCCTACGGgggAAAGGCCGGGATCTTCGGACCGGTCGCTATTGGATGAGCCTGCGTAAGATTAGCTAGTTGGTAGGGTAAAGGCCTACCAAGGCGACGATCTTTAGCTGGTCTGAGAGGATGATCAGCCACACTGGAACTGAGACACGGTCCAGACTCCTACGGGAGGCAGCAGTGGGGAATATTGGACAATGGgggCAACCCTGATCCAGCCATGCCGCGTgtgtgAAGAAGGCCTTAGGGTTGTAAAGCACTTTAAGTTGGGAGGAAGGCTCTGTAGCTAATATCTGCAGGGATTGACGTTACCAACAGAATAAGCACCGGCTAACTCCGTGCCAGCAGCCGCGGTAATACGGAGGGTGCAAGCGTTAATCGGAATTACTGGGCGTAAAGCgcgcgTAGGCGGTTTGGTAAGTGTGATGTGAAAGCCCAGGGCTTAACCTTGGAACTGCATCACATACTGCCAGGCTAGAGTACGGTAGAGGggggTAGAATTCCACGTGTAGCGGTGAAATGCGTAGAGATGTGGAGGAATACCAGTGGCGAAGGCGGCCcccTGGATCGATACTGACGCTGAGGTGCGAAAGCGTGGGGAGCAAACAGGATTAGATACCCTGGTAGTCCACGCCGTAAACGATGTCAACTAGCCGTTGGAAGGGTAATCCTTTTAGTGGCGCAGCTAACGCTCTAAGTTGACCGCCTGGGGAGTACGGTCGCAAGATTAAAACTCAAATG
AATTGACGGgggCCCGCACAAGCGGTGGAGCATGTGGTTTAATTCGACGCAACGCGAAGAACCTTACCTGGTCTTGACATCCTGCGAACTTTCCAGAGATGGATTGGTGCCTTCGGGAGCGCAGTGACAGGTGCTGCATGGCTGTCGTCAGCTCGTGTCGTGAGATGTTGGGTTAAGTCCCGTAACGAGCGCAACCCTTGTCCTTAGTTGCCATCATTTAGTTGGGCACTTTAGGGAGACTGCCGGTGACAAACCGGAGGAAGGTGGGGACGACGTCAAGTCATCATGGCCCTTACGACCAGGGCTACacacGTGCTACAATGGAGCGTACAAAGGGTTGCAACCCCGCGAGGGTGAGCTAATCCCATAAAACGTTTCGTAGTCCGGATCGCAGTCTGCAACTCGACTGCGTGAAGTCGGAATCGCTAGTAATCGCGAATCAGAATGTCGCGGTGAATACGTTCCCGGGCCTTGTACacacCGCCCGTCACACCATGGGAGTGGGTTGCAAAAGAAGTGGGTAGCATAACCGCAAGGAGTGCGCTCACCACTTTGTGATTCATGACTGGGGTGAAGTCGTAACAAGGTAACCGTA\n+OTU_536\t1\t\tGAGTTTGATCCTGGCTCAGGATGAACGCTGGCGGCGTGGATAAGTCATGCAAGTCAAGGgggCTCGCAAGAGCAACCGGCAGACGAGGTAGTAATAAGTAGGTACGTCCCTTCAAGTCACGAATAGCCCGTCGAAAGACGGGGTAATACGCGATAGTCCCTTCGGGGTAAAGATTTATCGCTTGAAGAACGGCCTGCTCGGTATCAGCTAGTTGGCGGTGTAAAAGACCACCAAGGCTATGACGCCTAGGGGAGCTGAGAGGCTGACCcccACCGATGGGACTGAGATACGGCCCATACACCTACGGGTGGCTGCAGACGAGAATATTCCACAATGGACGAAAGTCTGATGGAGCGACGCCGCGTGCAGGATGAAGTTCTTCGGGATGTAAACTGCTTTTATGAGCGAGAAAGTTTATTGATCAGCTCATGAATAAGAGGTTGCTAAACTCGTGCCAGCAGCAGCGGTAATACGAGTGCCTCAAGCGTTATCCGGAATCATTGGGCGTAAAGGGTgtgtAGGTGGTCGCGTTAGTCTTCCGTTAAATTCTTCGGCTCAACCGGgggCATGCGGgggAAACGGCGCGACTTGAGGATGCGAGAGGAAAGCGGAACTCATAGTGTAGCGGTGAAATGCGTTGATATTATGGGGAACACCAAATGCGAAGGCAGCTTTCTGGAGCATCCTGACACTGAAACACGAAAGCGTGGGTAGCGAACGGGATTAGATACCCCGGTAGTCCACGCCCTAAACGATGATCACTAGCTATTCGGAGTATCGACCTCCAAGTGGCGTAGCTAACGCGTTAAGTGATCCGCCTGGGTAGTACGGCCGCAAGGCTAAAACTCAAAGGAATAGACGGGGACTTGCACAAGCGGAGGAACATGTGGTTCAATTCGATGGTAAACGAAaaaCCTTACCAGGGTTGGAAATCAGTTGAGATAGGCAGAAACGTCTATGCCGCAAGGCAATTAGACAGGTGCTGCATGGTCGTCGTCAGTTCGTGGCTTGAGTTGTTCCCTTCAGTGGGGTAACGAACGCAACCcccGTTGCCTGGTATAAGTATCAGGCGAGACTGCCCAGGTTAACTGGGAGGAAGGTGGGGATGACGCCAGATCAGCATGGCCCTTATACCTGGGCCTACacacGTGTTACAATGGCCGACTCACGCGAGGCGAAGAGGAAACTCGGAGCAAATCGTAAaaaGTCGGCCAAGTTCGGATTGAGGGCTGCAACTCGCCCTCATGAAGCGGGATTCGCTAGTAATCGCAGATCAGCATGCTGCGGTGAATACGTTCTCAAGTCTTGTACTCACCGCCCGTCAACTCAAGGGAGCTGGGAATACCCGAAGTCGCCCTTGGGCGCCTAAGGTAAGCTCAGTGACAGGG
AGTAAGTCGTAACAAGGTAACCGT\n'
b
diff -r 000000000000 -r a73ae72b47aa rdpmulticlassifier/tool_dependencies.xml
--- /dev/null Thu Jan 01 00:00:00 1970 +0000
+++ b/rdpmulticlassifier/tool_dependencies.xml Thu May 29 02:27:56 2014 -0400
b
@@ -0,0 +1,21 @@
+<?xml version="1.0" encoding="UTF-8"?>
+<!-- Galaxy tool dependency definition: installs the rdp_multi_classifier_1.1 package (version 1.1). -->
+<tool_dependency>
+    <package name="rdp_multi_classifier_1.1" version="1.1">
+        <install version="1.0">
+            <actions>
+                <!-- Step 1: fetch the RDP MultiClassifier 1.1 zip archive from the qfab Bitbucket downloads area. -->
+                <action type="download_by_url">https://bitbucket.org/qfab/metagenomics/downloads/rdp_multiclassifier_1.1.zip</action>
+                <!-- Step 2: relocate rdp_multiclassifier_1.1 from the download into $INSTALL_DIR/multi_classifier. -->
+                <action type="move_file">
+                    <source>rdp_multiclassifier_1.1</source>
+                    <destination>$INSTALL_DIR/multi_classifier</destination>
+                </action>
+                <!-- Step 3: export JAVA_JAR_PATH. NOTE(review): the value assumes move_file placed the source inside the destination directory; confirm against the archive layout. -->
+                <action type="set_environment">
+                    <environment_variable name="JAVA_JAR_PATH" action="set_to">$INSTALL_DIR/multi_classifier/rdp_multiclassifier_1.1</environment_variable>
+                </action>
+            </actions>
+        </install>
+    </package>
+</tool_dependency>