Repository 'orthogroups_tool'
hg clone https://toolshed.g2.bx.psu.edu/repos/abims-sbr/orthogroups_tool

Changeset 0:d33ad52f59bc (2019-02-01)
Commit message:
planemo upload for repository htpps://github.com/abims-sbr/adaptearch commit 3c7982d775b6f3b472f6514d791edcb43cd258a1-dirty
added:
README.rst
macros.xml
orthogroups_tool.xml
scripts/filter_orthofinder.py
scripts/format_transdecoder_headers.sh
static/images/adaptsearch_picture_helps.png
test-data/2_orthogroups_tool.output
test-data/Orthogroups.txt
test-data/filtered_orthogroups/orthogroup_1_3_sequences.fasta
test-data/filtered_orthogroups/orthogroup_2_4_sequences.fasta
test-data/filtered_orthogroups/orthogroup_3_2_sequences.fasta
test-data/filtered_orthogroups/orthogroup_4_3_sequences.fasta
test-data/filtered_orthogroups/orthogroup_5_3_sequences.fasta
test-data/filtered_orthogroups/orthogroup_6_3_sequences.fasta
test-data/filtered_orthogroups/orthogroup_7_2_sequences.fasta
test-data/orthogroups_tool.output
test-data/orthogroups_withParalogs/orthogroup_1_8_sequences_withParalogs.fasta
test-data/orthogroups_withParalogs/orthogroup_2_5_sequences_withParalogs.fasta
test-data/orthogroups_withParalogs/orthogroup_3_3_sequences_withParalogs.fasta
test-data/orthogroups_withParalogs/orthogroup_4_3_sequences_withParalogs.fasta
test-data/orthogroups_withParalogs/orthogroup_5_3_sequences_withParalogs.fasta
test-data/orthogroups_withParalogs/orthogroup_6_3_sequences_withParalogs.fasta
test-data/orthogroups_withParalogs/orthogroup_7_2_sequences_withParalogs.fasta
test-data/output_filterassemblies/AcAcaud_trinity.fasta
test-data/output_filterassemblies/AmAmphi_trinity.fasta
test-data/output_filterassemblies/ApApomp_trinity.fasta
test-data/output_filterassemblies/AsAsp1_trinity.fasta
b
diff -r 000000000000 -r d33ad52f59bc README.rst
--- /dev/null Thu Jan 01 00:00:00 1970 +0000
+++ b/README.rst Fri Feb 01 10:25:10 2019 -0500
b
@@ -0,0 +1,13 @@
+Changelog
+---------
+
+**Version 2.0 - 08/01/2017**
+
+ - Adapted to new TransDecoder headers
+ - Using numpy and pandas
+ - Improved algorithm and added options
+
+**Version 1.0 - 13/04/2017**
+
+ - Functional tests with planemo
+ - beta version
b
diff -r 000000000000 -r d33ad52f59bc macros.xml
--- /dev/null Thu Jan 01 00:00:00 1970 +0000
+++ b/macros.xml Fri Feb 01 10:25:10 2019 -0500
b
@@ -0,0 +1,32 @@
+<macros>
+
+ <xml name="python_required">
+ <requirement type="package" version="2.7">python</requirement>
+ </xml>
+
+    <token name="@HELP_AUTHORS@">
+.. class:: infomark
+
+**Authors**  Eric Fontanillas created version 1 of this pipeline. Victor Mataigne developed version 2.
+
+.. class:: infomark
+
+**Galaxy integration** Julie Baffard and ABiMS TEAM, Roscoff Marine Station
+
+ | Contact support.abims@sb-roscoff.fr for any questions or concerns about the Galaxy implementation of this tool.
+ | Credits : Gildas le Corguillé, Misharl Monsoor
+
+---------------------------------------------------
+
+    </token>
+
+ <xml name="citations">
+ <citations>
+ <citation type="bibtex">Credits : ABIMS team, Roscoff Marine Station</citation>
+ <citation type="bibtex">Contact support.abims@sb-roscoff.fr for any questions or concerns about the Galaxy implementation of this tool.</citation>
+ <citation type="bibtex">Version 1 : Scripts by Eric Fontanillas -- Galaxy integration by Julie Baffard</citation>
+ <citation type="bibtex">Version 2 : improvements by Victor Mataigne, Gildas le Corguillé, Misharl Monsoor</citation>
+ </citations>
+ </xml>
+
+</macros>
b
diff -r 000000000000 -r d33ad52f59bc orthogroups_tool.xml
--- /dev/null Thu Jan 01 00:00:00 1970 +0000
+++ b/orthogroups_tool.xml Fri Feb 01 10:25:10 2019 -0500
[
b'@@ -0,0 +1,167 @@\n+<tool name="Orthogroups_Tool" id="orthogroups_tool" version="1.0.2">\n+\n+    <description>\n+        Writes orthogroups found by OrthoFinder in fasta files (with their sequences).\n+    </description>\n+\n+    <macros>\n+        <import>macros.xml</import>\n+    </macros>\n+\n+    <requirements>\n+        <requirement type="package" version="2.7">python</requirement>\n+        <requirement type="package" version="1.12.0">numpy</requirement>\n+        <requirement type="package" version="0.20.0">pandas</requirement>\n+    </requirements>\n+    \n+    <command>\n+    <![CDATA[        \n+        #set $infiles = ""\n+        #for $input in $inputs_fasta\n+            ln -s \'$input\' \'$input.element_identifier\';\n+            #set $infiles = $infiles + $input.element_identifier + ","\n+        #end for\n+        #set $infiles = $infiles[:-1]\n+\n+        $__tool_directory__/scripts/format_transdecoder_headers.sh \'$orthogroups\' tmp_orthogroups.txt\n+        &&\n+        python $__tool_directory__/scripts/filter_orthofinder.py tmp_orthogroups.txt \'$infiles\' $nbseq               \n+        #if $verbosity=="T":\n+            -v\n+        #end if\n+        #if $paralogs=="T":\n+            -p\n+        #end if\n+\n+        > \'$output\';\n+    ]]> \n+    </command>\n+\n+    <inputs>\n+        <param name="orthogroups" type="data" format="txt" label="Select a file of Orthogroups" help="The output from OrthoFinder, \'Orthogroups.txt\'."/>\n+        <param name="inputs_fasta" type="data" format="fasta" multiple="true" label="Outputs from Filter Assemblies" help="Contains the nucleic sequences to retrieve."/>\n+        <param name="nbseq" type="integer" value="3" label="Minimal number of sequences per orthogroup" help="Drop orthogroups with less than x sequences :" />\n+        <param name="verbosity" type="boolean" checked="True" truevalue="T" falsevalue="F" label="verbosity" help="Turn on this paramater to display an additional summary table 
(computed before the pralogous filtering)" />\n+        <param name="paralogs" type="boolean" checked="False" truevalue="T" falsevalue="F" label="paralogs" help="Turn on this parameter to obtain an additional output (orthogroups files before paralogous filtering)" />\n+    </inputs>\n+\n+    <outputs>\n+        <data format="txt" name="output" label="orthogroups_tool.output" />        \n+        <collection name="orthogroups_fasta" type="list" label="Orthogroups_fasta_files" >\n+            <discover_datasets pattern="__name_and_ext__" directory="filtered_orthogroups" />\n+        </collection>\n+        <collection name="orthogroups_fasta_paralogs" type="list" label="Orthogroups_with_paralogs_fasta_files" >\n+            <discover_datasets pattern="__name_and_ext__" directory="orthogroups_withParalogs" />\n+            <filter>paralogs == True</filter>\n+        </collection>\n+    </outputs>\n+\n+    <tests>\n+        <test>\n+            <param name="orthogroups" value="Orthogroups.txt"/>\n+            <param name="inputs_fasta" value="output_filterassemblies/AcAcaud_trinity.fasta,output_filterassemblies/AmAmphi_trinity.fasta,output_filterassemblies/ApApomp_trinity.fasta,output_filterassemblies/AsAsp1_trinity.fasta"/>\n+            <param name="nbseq" value="2"/>\n+            <param name="verbosity" value="True"/>\n+            <param name="paralogs" value="True"/>\n+            <output name="output" value="orthogroups_tool.output" lines_diff="2"/>\n+            <output_collection name="orthogroups_fasta" type="list">\n+                <element name="orthogroup_1_3_sequences" value="filtered_orthogroups/orthogroup_1_3_sequences.fasta" />\n+                <element name="orthogroup_2_4_sequences" value="filtered_orthogroups/orthogroup_2_4_sequences.fasta" />\n+                <element name="orthogroup_3_2_sequences" value="filtered_orthogroups/orthogroup_3_2_sequences.fasta" />\n+                <element name="orthogroup_4_3_sequences" 
value="filtered_orthogroups/orthogroup_4_3_sequences.fasta" />\n+                <element name="orthogroup_5_3_sequenc'..b'_fasta" value="output_filterassemblies/AcAcaud_trinity.fasta,output_filterassemblies/AmAmphi_trinity.fasta,output_filterassemblies/ApApomp_trinity.fasta,output_filterassemblies/AsAsp1_trinity.fasta"/>\n+            <param name="nbseq" value="2"/>\n+            <param name="verbosity" value="True"/>\n+            <param name="paralogs" value="False"/>\n+            <output name="output" value="2_orthogroups_tool.output" lines_diff="2"/>\n+            <output_collection name="orthogroups_fasta" type="list">\n+                <element name="orthogroup_1_3_sequences" value="filtered_orthogroups/orthogroup_1_3_sequences.fasta" />\n+                <element name="orthogroup_2_4_sequences" value="filtered_orthogroups/orthogroup_2_4_sequences.fasta" />\n+                <element name="orthogroup_3_2_sequences" value="filtered_orthogroups/orthogroup_3_2_sequences.fasta" />\n+                <element name="orthogroup_4_3_sequences" value="filtered_orthogroups/orthogroup_4_3_sequences.fasta" />\n+                <element name="orthogroup_5_3_sequences" value="filtered_orthogroups/orthogroup_5_3_sequences.fasta" />\n+                <element name="orthogroup_6_3_sequences" value="filtered_orthogroups/orthogroup_6_3_sequences.fasta" />\n+                <element name="orthogroup_7_2_sequences" value="filtered_orthogroups/orthogroup_7_2_sequences.fasta" />\n+            </output_collection>\n+        </test>\n+    </tests>\n+\n+    <help>\n+\n+@HELP_AUTHORS@\n+\n+<![CDATA[\n+\n+**Description**\n+\n+This tool takes Orthogroups found by OrthoFinder and proceeds to retrieve nucleic sequences back, then write each orthogroups in its own fasta file.\n+\n+-------------------------------------------\n+\n+**Step 1 : re-writing headers**\n+\n+.. 
class:: warningmark\n+\n+This tool is configured to work within the AdaptSearch toolsuite, which implies a specific format of headers. Indeed, due to the use of external tools (like TransDecoder), the genes IDs might have been modified. A regular expression rewrites all the genes IDs in order to have, for instance, this format : >Pf1004_1/1_1.000_369\n+\n+-------------------------------------------\n+\n+**Step 2 : reading an re-writing orthoGroups from OrthoFinder**\n+\n+OrthoFinder (Emms, D.M. and Kelly, S., 2015) is a fast, accurate and comprehensive analysis tool for comparative genomics. It finds orthologues and orthogroups infers gene trees for all orthogroups and infers a rooted species tree for the species being analysed. OrthoFinder also provides comprehensive statistics for comparative genomic analyses. \n+\n+Our tool focus on the orthogroups.txt file created before gene trees.The script proceeds to split each orthogroup in its own fasta file and, with the use of the output of Filter_Assemblies, to re-associate each ID with its sequence.\n+\n+-------------------------------------------\n+\n+**Inputs and parameters**\n+\n+- File of Orthogroups : the orthogroups.txt file from OrthoFinder.\n+- Output from Filter_Assemblies (either as multiple datasets or dataset collection)\n+- Minimal number of sequences : The orthogroups with less than the specified number won\'t be recorded.\n+- Verbose : If \'Yes\', a supplementary table will be displayed in the outputs (coutings of species and sequences in orthogroups before the removal of paralogs).\n+- Paralogs : if \'Yes\', there will be a supplementary output of orthogroups file, before the removal of paralogs.\n+\n+-------------------------------------------\n+\n+**Outputs**\n+\n+- Dataset collection of fasta files : each file represents an orthogroup, each gene within tthe group has the couple ID-nucleic sequence.\n+- If the --paralogs option is checked : another dataset collection of fasta files with all the 
paralogous genes.\n+- The tool log.\n+\n+---------\n+\n+**The AdaptSearch Pipeline**\n+\n+.. image:: adaptsearch_picture_helps.png\n+\n+Changelog\n+---------\n+\n+**Version 1.0 - 11/01/2018**\n+\n+]]>\n+    </help>\n+\n+    <citations>\n+        <citation type="doi">10.1186/s13059-015-0721-2</citation>\n+    </citations>\n+\n+</tool>\n'
b
diff -r 000000000000 -r d33ad52f59bc scripts/filter_orthofinder.py
--- /dev/null Thu Jan 01 00:00:00 1970 +0000
+++ b/scripts/filter_orthofinder.py Fri Feb 01 10:25:10 2019 -0500
[
b'@@ -0,0 +1,184 @@\n+#!/usr/bin/env python\n+# Commandline : ./filter_orthofinder.py <Orthogroups.txt> <Nb_of_studied_species> <minimal_nb_species_per_group> [-v] [-p]\n+\n+## This script takes an output file of OrthoFinder (Orthogroups.txt), which contains a set of orthogroups,\n+## and rewrite it to split each orthogroup into a single fasta file.\n+\n+import os, string, glob, argparse, csv, itertools\n+import numpy as np\n+import pandas as pd\n+\n+## PART 1 : Make a dictionary of {IDs : sequence}\n+\n+""" Build a hash table with gene IDs and gene sequences from fasta made from input files \n+    Returns a dictionnary """\n+def hashSequences(path):\n+    hashTable = {}\n+    # WARNING : sequences are expected to be on one line. If not, biopython can do it\n+    for file in path:\n+        gene = ""\n+        sequence = ""\n+        with open(file, "r") as origin:\n+            for line1,line2 in itertools.izip_longest(*[origin]*2):\n+                gene=line1.strip("\\r\\n ")\n+                sequence=line2.strip("\\r\\n ")\n+                hashTable[gene] = sequence    \n+\n+    return hashTable\n+\n+## PART 2 : Create orthogroups file (one file per orthogroup)\n+\n+""" Takes a file.txt of orthogroups as parameter and keeps the orthogroups where there are at least args.minspec loci\n+    WARNING : sequences names within the groups must the same as IDs in fasta files from Filter_Assemblies. if not, the \n+    dictionnary will be false. 
That\'s is why the script "format_transdecoder_headers is for.\n+    Returns a 2D list (each list being a list of loci) """\n+def formatAndFilter(orthogroups, mini, nbspecs, hashTable, verbose, paralogs):\n+\n+    """ Builds a 2D array for a summary\n+        Returns a numpy 2D array """\n+    def countings(listOrthogroups, nbcols):\n+        #listOrthogroups.sort().reverse()\n+        #nblines = len(listOrthogroups[0])\n+        nblines = 0    \n+        for group in listOrthogroups:\n+            if len(group) > nblines:\n+                nblines = len(group)\n+        matrix = np.array([[0]*nbcols]*nblines)\n+        # empty lines are avoided : first line of the frame is the line for minimal number of sequences in a group (>=mini)\n+        # for now, this feature diseappear when using numpy arrays and pandas :/\n+\n+        for group in listOrthogroups:\n+            listSpecs = []\n+            for loci in group:\n+                if loci[1:3] not in listSpecs:\n+                    listSpecs.append(loci[1:3])\n+            matrix[len(group)-1][len(listSpecs)-1] += 1\n+\n+        return matrix\n+\n+    """ numpy 2D array in a nice dataframe \n+        Returns a pandas 2D dataframe """\n+    def asFrame(matrix) :\n+        index = [0]*len(matrix)\n+        colnames = [0]*len(matrix[0])\n+        index = [str(i+1)+" seqs" for i in range(len(matrix))]\n+        colnames = [str(i+1)+" sps" for i in range(len(matrix[0]))]\n+        df = pd.DataFrame(matrix, index=index, columns=colnames)\n+        return df # Mettre une selection pour ne renvoyer que les lignes et les colonnes qui somment > 0\n+        #return df.loc[\'4 seqs\':\'9 seqs\'].loc[:,colnames[3:]]\n+        \n+    """ Writes each orthogroup in a fasta file. 
Retrieves sequences with a hash table """\n+    def writeOutputFile(orthogroup, hashTable, i, naming):\n+        length = len(orthogroup)\n+        name =""\n+        if naming: \n+            name="orthogroup_{}_{}_sequences_withParalogs.fasta".format(i, length) \n+        else :\n+            name = "orthogroup_{}_{}_sequences.fasta".format(i, length)\n+        result = open(name, "w")\n+        with result:\n+            for locus in orthogroup:                \n+                result.write("{}\\n".format(locus)) # write geneID. ">%s\\n" before\n+                result.write("{}\\n".format(hashTable[locus])) # write sequence\n+\n+    # FUNCTION\n+\n+    orthogroups = open(orthogroups, "r")\n+    list_orthogroups = []\n+    # STEP 1 - Read file into a list ----------------------------------------------\n+    with orthogroups:\n+        while (1):\n+            group = orthog'..b'iltering -----------------------------------------------\n+    if verbose or paralogs:\n+        list_orthogroups_withpara = []\n+    list_orthogroups_format = []\n+\n+    i,j = 1,1\n+    for group in list_orthogroups:\n+        group = string.split(group, " ") # list of lists\n+        group.sort()\n+        if verbose and len(group) >= mini:\n+            list_orthogroups_withpara.append(group)\n+        if paralogs and len(group) >= mini:\n+            writeOutputFile(group, hashTable, j, True)\n+        j += 1\n+        new_group = []\n+        rang=-1\n+        # Keep only one paralogs per species (1st encounter)\n+        for loci in group:\n+            if rang == -1:\n+                new_group.append(loci)\n+                rang +=1\n+            elif loci[1:3] != new_group[rang][1:3]:\n+                new_group.append(loci)\n+                rang +=1\n+\n+        if len(new_group) >= mini: # Drop too small orthogroups\n+            list_orthogroups_format.append(new_group)\n+            writeOutputFile(new_group, hashTable, i, False)\n+            i += 1\n+    \n+    # STEP 3 
- Print summaries ----------------------------------------------------\n+    if verbose:\n+        print "  Summary before paralogous filtering : \\n"\n+        df1 = asFrame(countings(list_orthogroups_withpara, nbspecs))\n+        print df1.loc[df1.ne(0).any(1),df1.ne(0).any()]\n+        #print "  Summary before paralogous filtering : \\n",countings(list_orthogroups_withpara, nbspecs),"\\n"\n+    print "\\n  Summary after paralogous filtering : \\n"\n+    df2 = asFrame(countings(list_orthogroups_format, nbspecs))\n+    print df2.loc[df2.ne(0).any(1),df2.ne(0).any()]\n+\n+    return len(list_orthogroups_format) #list_orthogroups_no_para\n+\n+## MAIN\n+\n+def main():\n+    parser = argparse.ArgumentParser()\n+    parser.add_argument("files", help="Orthogroups.txt file from OrthoFinder")\n+    parser.add_argument("infiles", help="fasta files used for OrthoFinder (after or before TransDecoder), separated by commas")\n+    parser.add_argument("minspec", type=int, help="Minimal number of species to keep per group")\n+    parser.add_argument("-v", "--verbose", action="store_true", help="Add another summary table : countings before paralogous genes filtering")\n+    parser.add_argument("-p", "--paralogs", action="store_true", help="Proceeds to write orthogroups also before paralogous filtering")\n+    args = parser.parse_args()\n+\n+    print "\\n-This script works on the \'Orthogroups\' file output of Orthofinder to split each orthogroup in a single fasta file."\n+    print "-It also gets rid of orthogroups with less sequences than the number specified by the user." 
\n+\n+    # Build hashtable\n+    print "  Building hashTable IDs/sequences ...\\n"\n+    infiles_good = str.split(args.infiles, ",")\n+    nbspec = len(infiles_good)\n+    #path = glob.glob(\'*.fasta\')\n+    hashTable = hashSequences(infiles_good)\n+\n+    # Open txt file with orthogroups\n+    print "  Reading Orthogroups.txt and writing orthogroups to separated files..."\n+    print "    (Dropping orthogroups of less than {} loci.)\\n".format(args.minspec)\n+    list_orthogroups = formatAndFilter(args.files, args.minspec, nbspec, hashTable, args.verbose, args.paralogs)\n+    print "\\n{} filtered orthogroups have been written in separated files".format(list_orthogroups)\n+\n+    # Move output files in a new directory\n+    if args.paralogs:\n+        os.system("mkdir orthogroups_withParalogs")\n+        path=glob.glob("*_withParalogs.fasta")\n+        for file in path:\n+            os.system("mv {} orthogroups_withParalogs".format(file))\n+\n+    os.system("mkdir filtered_orthogroups")\n+    path = glob.glob("*_sequences.fasta")\n+    for file in path:\n+        os.system("mv {} filtered_orthogroups".format(file))\n+    \n+    print "  \\nFiltered orthogroups are written in the directory \'filtered_orthogroups\'"\n+    if args.paralogs:\n+        print "  \\nFull orthogroups files are written in the directory \'orthogroups_withParalogs\'\\n"\n+\n+if __name__ == "__main__":\n+    main()\n'
b
diff -r 000000000000 -r d33ad52f59bc scripts/format_transdecoder_headers.sh
--- /dev/null Thu Jan 01 00:00:00 1970 +0000
+++ b/scripts/format_transdecoder_headers.sh Fri Feb 01 10:25:10 2019 -0500
[
@@ -0,0 +1,27 @@
+#/bin/bash
+
+# v2 - this script modifies the 'Orthogroups.txt' file in order to make it easily readable by the following script, filter_orthofinder.py
+  #Example :
+    #OG0000001: Gene.117__As119_1/1_1.000_543__g.117__m.117 Gene.157__As170_1/1_1.000_1203__g.157__m.157
+  #Becomes :
+    #As119_1/1_1.000_543 As170_1/1_1.000_1203
+    
+# removes 'OGxxxxxxx: '
+sed -E 's/OG[0-9]{7,}:\s//' $1 > $2
+# removes things like Gene.119__
+sed -i -E 's/Gene\.[0-9]{1,}\_\_/>/g' $2
+# removes things like __g.117__m.117
+sed -i -E 's/\_\_g\.[0-9]{1,}\_\_m\.[0-9]{1,}//g' $2
+
+# Old version
+
+# removes 'OGxxxxxxx '
+#sed -E 's/OG[0-9]{7}:\s//' $1 > $2
+# replace _+_ by (+) because '_' causes bugs
+#sed -i 's/_+_/(+)/g' $2
+# Replaces everything by '>'
+#sed -i -E 's/m\.[0-9]{1,}[^()]+\(\+\)\s*/>/g' $2
+# Removes terminal '(+)'
+#sed -i 's/(+)//g' $2
+# Removes last suite of unwanted numbers, underscore and dash
+#sed -i -E 's/\_[0-9]{1,}-[0-9]{1,}//g' $2
b
diff -r 000000000000 -r d33ad52f59bc static/images/adaptsearch_picture_helps.png
b
Binary file static/images/adaptsearch_picture_helps.png has changed
b
diff -r 000000000000 -r d33ad52f59bc test-data/2_orthogroups_tool.output
--- /dev/null Thu Jan 01 00:00:00 1970 +0000
+++ b/test-data/2_orthogroups_tool.output Fri Feb 01 10:25:10 2019 -0500
b
@@ -0,0 +1,26 @@
+
+-This script works on the 'Orthogroups' file output of Orthofinder to split each orthogroup in a single fasta file.
+-It also gets rid of orthogroups with less sequences than the number specified by the user.
+  Building hashTable IDs/sequences ...
+
+  Reading Orthogroups.txt and writing orthogroups to separated files...
+    (Dropping orthogroups of less than 2 loci.)
+
+  Summary before paralogous filtering : 
+
+        2 sps  3 sps  4 sps
+2 seqs      1      0      0
+3 seqs      1      3      0
+5 seqs      0      0      1
+8 seqs      0      1      0
+
+  Summary after paralogous filtering : 
+
+        2 sps  3 sps  4 sps
+2 seqs      2      0      0
+3 seqs      0      4      0
+4 seqs      0      0      1
+
+7 filtered orthogroups have been written in separated files
+  
+Filtered orthogroups are written in the directory 'filtered_orthogroups'
b
diff -r 000000000000 -r d33ad52f59bc test-data/Orthogroups.txt
--- /dev/null Thu Jan 01 00:00:00 1970 +0000
+++ b/test-data/Orthogroups.txt Fri Feb 01 10:25:10 2019 -0500
b
@@ -0,0 +1,15 @@
+OG0000000: Gene.119__Ac284_1/1_1.000_317__g.119__m.119 Gene.128__Ac297_1/1_1.000_317__g.128__m.128 Gene.140__Ac340_1/1_1.000_334__g.140__m.140 Gene.153__As166_1/1_1.000_1107__g.153__m.153 Gene.16__Am117_1/1_1.000_300__g.16__m.16 Gene.335__As369_1/1_1.000_544__g.335__m.335 Gene.43__Ac95_1/1_1.000_580__g.43__m.43 Gene.1__Am6_1/1_1.000_361__g.1__m.1
+OG0000001: Gene.117__As119_1/1_1.000_543__g.117__m.117 Gene.157__As170_1/1_1.000_1203__g.157__m.157 Gene.159__Ac386_1/1_1.000_378__g.159__m.159 Gene.2__Am7_1/1_1.000_325__g.2__m.2 Gene.9__Ap12_1/1_1.000_582__g.9__m.9
+OG0000002: Gene.21__Ap34_1/1_1.000_337__g.21__m.21 Gene.250__As255_1/1_1.000_648__g.250__m.250 Gene.359__As422_1/1_1.000_636__g.359__m.359
+OG0000003: Gene.129__As137_1/1_1.000_685__g.129__m.129 Gene.48__Ac103_1/1_1.000_315__g.48__m.48 Gene.8__Ap11_1/1_1.000_406__g.8__m.8
+OG0000004: Gene.47__Ac102_1/1_1.000_654__g.47__m.47 Gene.12__Am92_1/1_1.000_509__g.12__m.12 Gene.152__As165_1/1_1.000_684__g.152__m.152
+OG0000005: Gene.50__Ac109_1/1_1.000_333__g.50__m.50 Gene.90__As95_1/1_1.000_729__g.90__m.90 Gene.7__Ap10_1/1_1.000_338__g.7__m.7
+OG0000006: Gene.52__Ac113_1/1_1.000_323__g.52__m.52 Gene.4__Am9_1/1_1.000_360__g.4__m.4
+OG0000007: Gene.13__Am99_1/1_1.000_399__g.13__m.13
+OG0000008: Gene.41__Ap101_1/1_1.000_309__g.41__m.41
+OG0000009: Gene.42__Ap102_1/1_1.000_382__g.42__m.42
+OG0000010: Gene.43__Ap108_1/1_1.000_314__g.43__m.43
+OG0000011: Gene.154__As169_1/1_1.000_945__g.154__m.154
+OG0000012: Gene.11__As16_1/1_1.000_810__g.11__m.11
+OG0000013: Gene.158__As171_1/1_1.000_527__g.158__m.158
+OG0000014: Gene.160__As172_1/1_1.000_393__g.160__m.160
b
diff -r 000000000000 -r d33ad52f59bc test-data/filtered_orthogroups/orthogroup_1_3_sequences.fasta
--- /dev/null Thu Jan 01 00:00:00 1970 +0000
+++ b/test-data/filtered_orthogroups/orthogroup_1_3_sequences.fasta Fri Feb 01 10:25:10 2019 -0500
b
@@ -0,0 +1,6 @@
+>Ac284_1/1_1.000_317
+TGCTTTTTCTGCAATGAGAGCTTCATGCAGCGAAATCGTCTCAACATTCACATGAAGAAAAAGCATGAAAAGGAGAGGGCATTTCCATGTCGATGGCCTGGATGTCACCGCCAGTTCATCTACAAGTCAGAGTACAACCAACACATGCGAGTGCACACAGGTGAGCGTCCATTTCTCTGTGATCTCTGTGGCTATGCAACCAAAACAAAGGTCCAGCTGCGCAGACATGAGAAGTCACACACAGGTGAGAGTAACTACAAGTGCAAGTACTGCACTTATAGTGCGAGTCACAGTTGGGGCCTGAGACGACACATGCG
+>Am117_1/1_1.000_300
+ATTGAATTTATTGGAACGATGATGAATGATGTATGCAATGCCCCTGCCAACCAGTGTACCATATGTTCAAGAATGTTCTCAACTCAGACAGACTTGGTTCAGCACATATCAATCCATACAACAAACTCTAGGTGGCGTTGTGATCTTTGTGGTAGAGGATATACAAAAAGAGATGCCCTTGAAGGTCATATAAATGCCAGGCATACAAACACCCTTCAGTTTGCTTGTACAAAATGTGATTTGGCTTATGCATATAAATCTGCATTACAGAGACACATGAAATATAAACACCCTGACCCA
+>As166_1/1_1.000_1107
+ACCCAGGAGAAAGGGAACTATCAGAGTCACATGTGGGCACAGCATAAAATGCGGATTCACGACAAACAGCGAGTTTTCCAGTGCGACACTTGTGACTACAGCACCGATCGGAAGACCCGATTCACGCAGCACATGGCTTCTCATAATGACATCCGCGCGCACAAGTGTCCGCACTGCGACAAAACATTTGTCGCCAAGACAACGATGAACTCGCACATCAAGTGGGCTCACATGGAGAAAATCCTGCGTTGCGACTACTGCGACCACAAAACAAGCACGCTCAACATGCTGAGAGAGCACGTGCGAATGATGCACACTCACCGTGATGTCAAACCCTACAAGTGCGCCTACTGCGATTATCGGTGCCGTACCAGCGGCAACTGTCGGAAACACTGCATGAATCGACACAAGGATCAGGAGGTCAAGTGGGTACGCGTCTGCGAAAAATACCCGAACAACTCAAAGCCGTTGCTCAGCTTCGAGGCCGGCATGACGGAAAACGGGATTTCCCGGAAAGACTCTCGGACTCAACGGATCTTTCCCTACGAGCAAAACGAGGCGGCACAACCCGTGATCCTGAATAAGTCCCCGGGAAAAAAGTCGCCGGCAAAGGTCCTAGACGTCGAGCCGATGCAAGAAATCCTACCGGTCGTCGTTTCACAGAAACTGGAGAACATGCAAGACCAAGTTGACGCCACGATGATGCAAGTGGAGCGAGATTCCTTCCAAGTTCAACTGCAGCAGCTACAGCTCCAGCAGTCCCAGGCACAGATGCTCCCCCTGCCCCAGAACCAAGCGATCCTTGTGCAACCGGAGACCCAGACCCTACACCAGCTCCTCGGTCAACAAGTGCACACGCTGACCCAGCTCTCAGCAGAGGGGGTATCCCTGGAACAGCCAGTCCAGATGATCCAGCAAACGCACTCCCTCCCACCGCCACCGATGATGACGTCCACAGTTACCCAGCAGTTGCCGGTGGTGACGGGAGCGTCAACGCCCATAGTGGTTTCAGGGGCTGCTCAACTGACGCCGGTCCAGCAGCAGTATCTGCTTCAGTACATGCAACAGCAACAACAACAGCAGCAGCAGATGCAGTTGCAGCATCAC
b
diff -r 000000000000 -r d33ad52f59bc test-data/filtered_orthogroups/orthogroup_2_4_sequences.fasta
--- /dev/null Thu Jan 01 00:00:00 1970 +0000
+++ b/test-data/filtered_orthogroups/orthogroup_2_4_sequences.fasta Fri Feb 01 10:25:10 2019 -0500
b
@@ -0,0 +1,8 @@
+>Ac386_1/1_1.000_378
+ACTCTACCAGTAAACACGTCGGTTAGCGTCGGCGGCTGGGGAGTCGCCGACCCTGATGATCTTTCTGAAGATATGGGCTTACCAACGATCTTACAAAAAGCTCAGTTGTTTGTGGCTGACATCGGCGATTGTGAGGCGGTATATAGTGTTCCCGTCACCGACAACCAGATCTGTATCAAGGATGGCAGCGGAAACACCGAGAAGGGAACGTGCGCAGGTGATGAAGGCGGACCTCTCATGTTTGAAGAAAATGATGTCACCTCTGTGGTTGGAATAATATCATATGGATCTGAAGGAGGATGTGTCGTTGGTGATCCTGCCGTGTTCACAAATGTGGCCAAGTACATCGACTGGATCAAGTATGTGATGGAACACAAC
+>Am7_1/1_1.000_325
+GGGGCCCGGGATGTCGAGGATGTTGTACTCGTAGTTGCTGTGGTTGACGTGGTATTGTTGTTCCTGGCTGTGGCTCCGTTACCACTTGACGTGGCTGTTGTGGTGCTGGTGGAAAAACGACTAGTGGTTGTGTCTGCAACTAATTCCTCGCCTCTAATCAGAATTAATGGACTGTCTGCAATACGAATTCCACGCAGGCTTTTGTCCAATTTGGCAGATTTTTCCTTGCTGGTTATTTTAGGTTCAGTTTTGGTCAAATCCAGTCTGTCACTGATCACACCATACGCCAATCTGCATACTCTCCCATCCTCCAGATCGGAAGAGC
+>Ap12_1/1_1.000_582
+GATGGTGTTGCGCTGTTCTGCTTTCTGCACGCATTTTATCTCGTCAAAACGCAGCCGTTGCTTCTCAGTTTGTTTATGTTTGTTGTTGTTTTGTTTTGTTATTTCCTTTCAAGTCGCCCTGATACAATGCTGTCACATAAACACGAGGTCATCGGACGTTTTCCGTCGATGTCGACATATATATATTTTTCCCCGCTACTTGTCCATCCATCCATCCATTCGTCTACCTGTCTGTCTTCTACGCCGTTCTGGTTGTTGCTGGCGTCTGCTGTAGCAGTCGTTATTGTTGGCGGCGGCGGTGACGTCTCCTCCGTTGGCGTGGACGGCCACAGCTCACAGCGACACCTGTCGGCGTCCGGTGGAGTCGGCTTGTTCCGGTGCCGTTCGACGTCCTGTGCCGAACGCCACCTGGCGACACGCATGCGTTATGACGTCGCCCGGCCGCCATTGAAGTCTCCAGTGATCGGTCCACACACACACACACACAGCTGTAACAATAAAACAGACAAGACACTGGCCTTACTCAGGATACAGTCGCTATTTAATAGATTGGCCTTAGTCCACGTGACCATTTGGGGTCGG
+>As119_1/1_1.000_543
+GGCGAACACCGCCGCCAGAGTTCGAACCCGTTCCGGGATACGCTCAGCGCTGTCGAGGTTCACGTCCACCCGGAGTACGCGCCGAACCCGGACGTGGGCCGGGTCGAGTACAACGACGTGGCTCTGCTCCGCATGGAGCGCATCATCGCCTCGACCATAGCGCACTATCCCATCTGCGCGCCGCCCACCGGCCCCGTCAACCACACGGACGGCATCATATGTGGCTGGGGCTCGAACGACGGCATCGACGGCCGGCCGACGAACGAGCTGCGCTGTACGTATCTGGACTTCCTGCAGAAGGACACCTGCGTACAGGCGTACCCGGACGACCCGCTCGATGACGCCATGTTCTGTACCTTCACGGCCGGCAGGGATGTATGCACTATTGACCGCGGCGGTCCGATAGCCGTGAAGATTGACGGGCTGTTCTATATCCTGGGGATAGCCTCCTGGTCGCCAGGCTGCAGTCAGGGTCCACCGTCCGTGTACATGGATGTCGCCTACTACAAGGACTGGATTGACAGTGTCATGCTCTCAGCAAAA
b
diff -r 000000000000 -r d33ad52f59bc test-data/filtered_orthogroups/orthogroup_3_2_sequences.fasta
--- /dev/null Thu Jan 01 00:00:00 1970 +0000
+++ b/test-data/filtered_orthogroups/orthogroup_3_2_sequences.fasta Fri Feb 01 10:25:10 2019 -0500
b
@@ -0,0 +1,4 @@
+>Ap34_1/1_1.000_337
+AAACAATTAACTGTGTGCACAGAAGGACAGTTTAAATGTGCCAACCATCACTGCATCAGTGCCAGCAGTGTCTGTGACAAATATGATGACTGTGGTGATATGTCAGATGAGATTGGTTGCCATAAAGACAGCAGTGAGGGATGTTCAGTCAATAATGGTGGGTGTGAGCAGAATTGTACTGATTTACCCGACAAGGGTCATGTGTGTCACTGTGACCCCGGTTACATCGTCAATCAGGATGACAAAACATCATGCTCAGACGTTGACGAATGTGCTTCTTGGGGTAACAAATGCTCACAAATCTGTCACAATATCAAAGGTTCCTATAAATGTGCTT
+>As255_1/1_1.000_648
+AACTGTACGACGATGTGTGTGAACACCCCCGGGGCCTTCGAGTGTGTATGTCCGGTCGGCTACCGGCTCAACCAGAACGGCAGCTCGTGTGAAGACCGAAACGAGTGCATTGATGACAACGGCGGGTGTGACCAGTATTGCCTCAACATGCAGGGATCGTATCGTTGCGCATGCGCTCAAGAGAGCGGATACATGCTCTCTACTGATAGCCACAACTGCCTTGTGATTTGTCCAGACCAATTCACCGCCATCAACCAGAACGATACTTGTCTGCAGGTGCAAGGGGCGCGGATGAATACATTCGAGGACGCGGAGGAATATTGTCGACGGTTGCACGCGCAGTCACACCTAGCAACCGTGGAAAGTTCCGGCAAACTTCGGGACATTTCGGCACTTCTACAAGGCACCAACATTACCAGCATTTGGACGGCAGGGAAGTACTGGCGACCAATCAGCGACTTCATATGGATTACGTCATATGACGTCATATCTGGGTTGAATCTGACCAATGCCATTGGGCCGACGTCATTACAGGGCACGTGCGTTGCCTTGACAACCGAAACATCGCAGGACTCACGTCTCATTCCTCAGAACTGTGTTTTTTCTAAACACTTTGCTTGTGAAATTAAATGGAATCGAAATCGCGGA
b
diff -r 000000000000 -r d33ad52f59bc test-data/filtered_orthogroups/orthogroup_4_3_sequences.fasta
--- /dev/null Thu Jan 01 00:00:00 1970 +0000
+++ b/test-data/filtered_orthogroups/orthogroup_4_3_sequences.fasta Fri Feb 01 10:25:10 2019 -0500
b
@@ -0,0 +1,6 @@
+>Ac103_1/1_1.000_315
+TGTTCATGTCATCAAAAACGCATAGTCCACAGAGATCTAAAGGCAGAGAATCTCTTGTTGGACAATGACATGAACATCAAAATAGCTGACTTTGGCTTTAGCAATAGCTTCACACCAGGGAACAAACTAGACACATTCTGTGGTAGTCCACCTTATGCAGCACCAGAATTATTTCAGGGCAAGAAGTATGATGGTCCTGAGGTGGATGTATGGAGCTTAGGTGTAATTCTCTATACTCTAGTCAGTGGCTCATTACCTTTTGATGGTCAAAACCTGAAGGAACTAAGAGAAAGGGTACTGAGAGGGAAGTACAGA
+>Ap11_1/1_1.000_406
+GAGGTACCCAGTGTGGCTGTACCAGGTGTTGTTTCAACCGTGGTACAGGATTCAGCACACAAGATCTTCATTGGTGGTCTACCAAACTACTTGAATGAAGACCAGGTTAAGGAACTGCTGACATCATTTGGTCCCCTGAAGGCCTTTAACTTGGTGAAAGATAGTGCAACTGGACTGTCGAAGGGTTATGCATTCTGTGAATATCTTGATCCTTCCATAACTGATCAGGCCTGTGCTGGCTTAAATGGAATGCAGCTTGGAGACAAAAAGCTAATTGTACAGAGGGCAAGTGTTGGTGCCAAGAATGCCCAAGGCGGGCCCAATGTTTTGCCAGTTCAGCTGCAAATTCCAGGACTTAACATGGCCCAGGTGCAGGGACCAGGTCCTACGACAGAGGTCCTCTGCT
+>As137_1/1_1.000_685
+TATTTGGCCTGTGTACATTTACATTTCAAAATGGCTGCCCAAGCGACTACGGCAAAATATAACGATTTATATGAATTGAAAGAAGAGTTAGGAAAAGGCGCCTTTTCAGTTGTTCGGAGATGTGTACAAAAGACTACCGGATTAGAATTCGCTGCCAAAATCATCAACACAAAAAAATTGTCAGCTCGAGATCACCAGAAATTGGAACGTGAAGCTAGGATCTGTAGATTACTAAAGCATCCAAATATAGTTCGACTCCATGATAGTATACAAGATGAAGGATTCCATTATTTAGTATTCGATTTGGTCACAGGTGGCGAGTTATTTGAAGACATAGTCGCCAGAGAATTCTATAGTGAAGCTGATGCTAGTCACTGCATGCAGCAAATATTAGAGAGTGTAAACTATTGCCACCAAATGGGTATAGTTCATAGGGACTTGAAGCCTGAGAATCTGCTGCTGGCAAGCAAAGCCAAAAATGCTGCTGTGAAACTTGCTGATTTCGGCTTGGCCATCGAAGTACAGGGCGACCAACAAGCATGGTTTGGTTTTGCGGGAACCCCCGGTTACCTGTCACCCGAGGTACTGAGACGAGACCCGTACGGCAAACCGGTGGACGTCTGGGCTTGTGGCGTAATTCTGTACATACTGCTGGTGGGTTACCCGCCGTTCTGGGACGAAGACC
b
diff -r 000000000000 -r d33ad52f59bc test-data/filtered_orthogroups/orthogroup_5_3_sequences.fasta
--- /dev/null Thu Jan 01 00:00:00 1970 +0000
+++ b/test-data/filtered_orthogroups/orthogroup_5_3_sequences.fasta Fri Feb 01 10:25:10 2019 -0500
b
@@ -0,0 +1,6 @@
+>Ac102_1/1_1.000_654
+GACAAAGGCTTGCTGAGTTCAGTAAAGGATTCCATTGTTCAAGGTTTCCAGTGGGGTACACGAGAAGGTCCTCTTTGTGATGAACCAATTCGGAACACAAAGTTTAAGATCCTGGATGCTGTAATAGCATCAGAGCCAATACACAGGGGAGGAGGTCAGGTTATACCAACAGCCAGACGAGTAGCTTACTCTGCATTCCTTATGGCTACACCACGTCTGATGGAACCTTACTTCTTTGTAGAGGTTCAAGCCCCTGCTGATTGTGTCTCTGCTGTATACACTGTATTAGCTCGAAGAAGAGGTCATGTGACAGCTGACGCTCCAATACCAGGTTCTCCAATGTACATCATTAAGGCCTTCATGCCTGCCATAGACTCCTTTGGGTTTGAAACAGATTTAAGAATCCACACACAAGGACAAGCTTTCTGCTTGTCTGTGTTCCACCATTGGCAGATTGTACCTGGTGATCCCTTAGATAAGAGCATAGTCATACGTCCACTGGAACCACAACCAGCCACACACCTGGCGAGAGAGTTTATGATAAAGACTCGTCGCAGAAAGGGGCTTAGTGAAGATGTCAGCATCAACAAATTCTTTGATGATCCTATGTTGTTGGAGCTTGCTAAGCAAGATGTTATGCTTAGTTATGGAATG
+>Am92_1/1_1.000_509
+CTTGCCGGAGTCTTGGATGGAGTTCTGGGTGGTTACCCGGTGTTTCTCATGGCTTCATTCTCATACATTTCTGACATTACTCTACACAGCAATAGATCTTTACGAATTGTTATCCTGGAGGTATGTATCAGTCTCGGGGGAACAATCTCCTATATGGCATCAGGATTACTCATTACTCATCTGAATTTCTTAGGAACATGTATAGTCCTGCATATAATTGTGGTACTAGATCTGGCACTAGTGGCATTTTACTTGCCAGAAACAGTGCAAAAACAAGAGGATATTACATTTTGGACTTTGGATCATTTCAAACAATCTTTCAGAGTGTATTTGGAAGATGAAGGTACTGGCAGAAGAGGACTCTTACTCACATCAATGCTGGTCTTATTAATTCTGTGTCCAGCAGCAATAGGTGAAGATGATGTTCTAGCATTGTTTGTGTTAAATTCTCCAATTTGCTTCACCCCAGATCTTCTTGGATATTACAAAGGAACTTTTTTCTTAGTTGC
+>As165_1/1_1.000_684
+TCCACGCCGTGGTGGGAACCGGATACAGCGACCAAGGCTACGGCACCAAGCACGAGTACGGCCACCAGCAGCAGAGCTACGGATACCACAAACCGAGCAAGTTCTGCTACCAGTGCGCCTACTCGCCGCCCAAGACGTACTACGACAAGAAGGTCGTGGTCGAGAACTATGAGTACGGACAACACAAGCAGGGATACCAACAGGGCGGCTACGGGGACGACAAGAAACAGGGCTATGGCCAGCAGGGCGGCTACCAGAAGAAGACTTACGTGCCGGTGGCGAGGACGGTCTACGGGGGCTGGGACAAGTGTTTCGGCTCGTTCGACCACGTCCAGGCCAAGGAGTTCGGCATCGACGTTTGGGAGTGCCACAGCAACTGCTACGTGCGCAAGGACCCCAACGGAGACCTGTTCCGCGGCTGTTACAAGGGCGAGTATGCGGTGGACCCGCACAAGTACGGCTGTAACCACCAGGCCGGGGCGCTCTGGTGCTTCTGTGAGGGCGACAAGTGTAACAACCAGGACATCGGCTACAACTAACCGTCCCAGCCAATCACAGCCGTCCACACATCTGTTTGTCTGCCAGCAACCAATCACAGTCGTGCTCACAGCTGGCTGCTTACCAGCAGCCAGTCACAGTCACCGATACATCCGTTTGTTTCTGCTTTTAACCAATGGCAGCCGT
b
diff -r 000000000000 -r d33ad52f59bc test-data/filtered_orthogroups/orthogroup_6_3_sequences.fasta
--- /dev/null Thu Jan 01 00:00:00 1970 +0000
+++ b/test-data/filtered_orthogroups/orthogroup_6_3_sequences.fasta Fri Feb 01 10:25:10 2019 -0500
b
@@ -0,0 +1,6 @@
+>Ac109_1/1_1.000_333
+AACTTCCTGTACCTTGTTGGCAATGTTTTCAACCTTCTTAGCGTGCTTGCCAAAATCTTCAAACATACGGCTCATACCGCGGTCAATTCTGTCGATGAGGTTGCTGTGTTCGCCGACCGCCTTGGTCAGATCCAGAGAGGCTTCCTTCAGCTCGCCGATGTCCTTGTCGTGCTGCATGTTGAGGTTGGCACGCTCGCACTGGCCGAGCGACGCGTTGAGCACGCGCACCTCGACCCGCAGCAGCCGGTCGTCGTTGGAGTCGATGCGGCCGTCGAACTCCTCGAACTTCTTGTCGATGAAGTCGAAGACGTCGGCCGCCTCCAGGTGGTGATC
+>Ap10_1/1_1.000_338
+CCATACTCAGCCGCCAAGACCACGGCCCAGGCTGCCACAGATGACCTGAAGAGACGTCAGGAAGAACTGGAGAGGAAGGCTGAGGAACTACAGAGAAAGGAACAGGAATTACAGAGAAACATGGGACACCAAGCCAGGGTGAACAACTTCCCACCACTGCCTGAGAAATGCTGTGTCCAGCCTTGCTTCTATCAAGATTTTGAGCTTGACATCCCATTGGAATTCCAAAGAATTGTAAAAACAGTGTATTATGTGTGGATAGCCTACATATGTCTGTTGATTCTGAATGTACTGGGAACACTGGCCTACTTCATAGCTGCGTCCAAGGCAGGTCATGG
+>As95_1/1_1.000_729
+GTGCAATATCCGAAAATCGCTGTTGGATTGCAAACTATTCCACAAGCCAGTCTTCTCTCGCATCTAATAGGAGACCCTACACTCACATTATATATTATAGCAGCCCACACTCACTATAAAATGCCTAGAGGACGTGGAAAACGCGGTAGTCACAAAGGCGGCCACCGAAAGTTCACGAATGCAGAGGAGTTGAAGCAACAACAGAGTAAACAAGAGAAGGAGAAAGAATGGCGGAAGATGAAGGGTCTGCCGAGCGACGAGTCCGGGGACGAGGACGAGGAGGGCGGAGCAAAAGCCGCGGCCAAAAAAACTGAGGACGCGGAGGAAGATGTCAAATTTGGGGACTCGTCCTCGGAGGAGGAATCATCAGAAGAGGAAGAAGACGCTAAAGCAAAAGGAGTATCACATTTAATAGAGATAGCAAATCCAAATCATCAAGTCACCAAATCTTCCAAGAAAGTGACGGAAATTTCAGGAGACGCCAAAGTGAATCTATCAAGAAGAGAAAAGGAGGAGCTTGCCAAGCAGCAGGCCAAGGTGCAGTACCAGAAGATGCACCTGGAGGGCAAGACGGACGAGGCGCGATCGGACCTGGCTCGCCTGGCGCTGATCCGCAAACAGCGCGAGGACGCCGCCAAGAAAAAGGACGAGGAACGCAAGCAGCGCGAGGCGGCGGCGGCGGAGGCGGAGCAGAAGCTCAAGGACAAGCGTGCGGCCGCCCGGGGCCAA
b
diff -r 000000000000 -r d33ad52f59bc test-data/filtered_orthogroups/orthogroup_7_2_sequences.fasta
--- /dev/null Thu Jan 01 00:00:00 1970 +0000
+++ b/test-data/filtered_orthogroups/orthogroup_7_2_sequences.fasta Fri Feb 01 10:25:10 2019 -0500
b
@@ -0,0 +1,4 @@
+>Ac113_1/1_1.000_323
+TCGATCCTGAAGAGTTCTAACGGAAAGAGGCTGATCCCGATCCCAGCCGACGAGGGATCGTTAGATCCCGATTATGAAAGTCTGAATAAAATAAAGCCATGGAGTCCTGTTGATGACGAGCACATCCGGATGGATGACGTTTCGCGCGAAATGCAACGCATCCACGACAACCTGGAGCGCATGCGTAAGCAGACGATGCTCAACTTCCGGCCGCCGCCTCCACCGCCACCGCCTTTCGATCCCATGATGCCTCAACTACTTCCGGTTCCTCAGTTCACCATGCCGTCGTTTCCGGCTTTGCCGGATCCAATGGCGCCGATGCC
+>Am9_1/1_1.000_360
+AGCCATCAAAGGTTGCTAATCATGTTGAGTTGTATTGTCAAGCATTTCTACTCGAGGCAACCATTAATAATTGAAGTTATCAGTTATATTGTCAACTCAATGGAAAATCAAATGGATTTAATTAAGGAAGGAAGATTTTGTACTTGTAAATCTGCATTTTATTACAAAATGTGTAATAAAATTACAATTCTCAAATGGATTCATATATATGCAAATAAAGGATTTATGAGTTATGATTTAAGAGTTGATCTTTCTTCTAGAAGTTGCATGTACTTGTGTAAACCACTAACAACTACTACTATAAAACTACTTGACATAATTCAAAACTACCGACATATATTCCAAATAAAACTTAGCTCA
b
diff -r 000000000000 -r d33ad52f59bc test-data/orthogroups_tool.output
--- /dev/null Thu Jan 01 00:00:00 1970 +0000
+++ b/test-data/orthogroups_tool.output Fri Feb 01 10:25:10 2019 -0500
b
@@ -0,0 +1,29 @@
+
+-This script works on the 'Orthogroups' file output of Orthofinder to split each orthogroup in a single fasta file.
+-It also gets rid of orthogroups with less sequences than the number specified by the user.
+  Building hashTable IDs/sequences ...
+
+  Reading Orthogroups.txt and writing orthogroups to separated files...
+    (Dropping orthogroups of less than 2 loci.)
+
+  Summary before paralogous filtering : 
+
+        2 sps  3 sps  4 sps
+2 seqs      1      0      0
+3 seqs      1      3      0
+5 seqs      0      0      1
+8 seqs      0      1      0
+
+  Summary after paralogous filtering : 
+
+        2 sps  3 sps  4 sps
+2 seqs      2      0      0
+3 seqs      0      4      0
+4 seqs      0      0      1
+
+7 filtered orthogroups have been written in separated files
+  
+Filtered orthogroups are written in the directory 'filtered_orthogroups'
+  
+Full orthogroups files are written in the directory 'orthogroups_withParalogs'
+
b
diff -r 000000000000 -r d33ad52f59bc test-data/orthogroups_withParalogs/orthogroup_1_8_sequences_withParalogs.fasta
--- /dev/null Thu Jan 01 00:00:00 1970 +0000
+++ b/test-data/orthogroups_withParalogs/orthogroup_1_8_sequences_withParalogs.fasta Fri Feb 01 10:25:10 2019 -0500
b
@@ -0,0 +1,16 @@
+>Ac284_1/1_1.000_317
+TGCTTTTTCTGCAATGAGAGCTTCATGCAGCGAAATCGTCTCAACATTCACATGAAGAAAAAGCATGAAAAGGAGAGGGCATTTCCATGTCGATGGCCTGGATGTCACCGCCAGTTCATCTACAAGTCAGAGTACAACCAACACATGCGAGTGCACACAGGTGAGCGTCCATTTCTCTGTGATCTCTGTGGCTATGCAACCAAAACAAAGGTCCAGCTGCGCAGACATGAGAAGTCACACACAGGTGAGAGTAACTACAAGTGCAAGTACTGCACTTATAGTGCGAGTCACAGTTGGGGCCTGAGACGACACATGCG
+>Ac297_1/1_1.000_317
+CACAATAAGATCCACACCGGCGAGAAGCCATTCAAGTGTCACATATGTGGCAAGGCATTCTCACAAACATCGAACTTGCGTACGCACATCAAGCGGCACACGGGTGAAAAACCACACAAGTGCCACATGTGTGAGAAATGCTTTGGAGATCTTGGCCACCTGCGCACACACCTGCGTAGACATACTGGTGAGAAACCTTTTGTGTGCAGCTTCTGTGGAAAGGGCTTTGTTGACAAGCAGAGCATGCGCAAACATTCTGACAGACATATAAACAAACCAAACCTGATCATCTGTCCTAACGACCAGGTCATCTTTCC
+>Ac340_1/1_1.000_334
+GAGAGACCTTACAGTTGTCCACAGTGTGGCAAGAGCTTCCCCCGTTCTGAAGACTTGAAGATGCACATTCGAACTCATACAGGCCAGAAACCTTATAAGTGCTTAGTCTGTGGGAAGTGTTTCATCAAATCTAGCTACCTGCAAAAGCATGCCAGAATTCACACTGGGGAGAAGCCTTACAAGTGTAGTACCTGTGGCGAGGCCTTTGCCCAGTCGGACATTCTTGCCAAACACATACGAGTTCACACTGGTGAACGTCCTTACTGTTGCACCGTATGTGGCAAAACGTTCACACAGAGTGGGTCACTGTATCATCACATGAAAATGCACAAAC
+>Ac95_1/1_1.000_580
+TGCACACTGTGGTTTGCATTATGTGTCTTCTCTATATGGCTATACAGGAAGAAGCACGCCAAAAAGAAAATGGCAAAGAATGGTAACTCCACAAGTATGTTGCCATCTTTTGCTAGCCATAAGAGTGATGAAGGAAGAAGACAGGAGAATCTGTTCAACTCACTGAATGTACCTAATTACCTCCAGAAAGATGCCAATAACCATGTGGATAACCTGCAACCCGACGTCACAAATGTCGGCAGTGACATGTCAAAACCGGATTCGGGATCCGAGAATCTCTACAACCTGCCGAACATCACCCAGGCGCCGATGAAAACATTCTACCACAAGAACAGCTCCGTGGCCCAGCCGTATGCCACAACGACGCTGATAGCCAACAACCTTAGCAGTCCTCCTGGCGGCGAAAGCGCATTCCGGCCAATACAGCAGGGCTACGTACAACAGCCACACAACGGCAGCGGCTCCAGTGACAGCTGCCAAAAGCCTGACATCAGTACCGACTCGAATCCCGACAACGTCAGGCACAAAACTGGTGGGTGCATCAGTGGTAACGTTCATGGCAATAAGTTGTACCCAGATT
+>Am117_1/1_1.000_300
+ATTGAATTTATTGGAACGATGATGAATGATGTATGCAATGCCCCTGCCAACCAGTGTACCATATGTTCAAGAATGTTCTCAACTCAGACAGACTTGGTTCAGCACATATCAATCCATACAACAAACTCTAGGTGGCGTTGTGATCTTTGTGGTAGAGGATATACAAAAAGAGATGCCCTTGAAGGTCATATAAATGCCAGGCATACAAACACCCTTCAGTTTGCTTGTACAAAATGTGATTTGGCTTATGCATATAAATCTGCATTACAGAGACACATGAAATATAAACACCCTGACCCA
+>Am6_1/1_1.000_361
+ACCACACAATCATCTAGTGAAACATTTACCAAAACACCCTCTGAAACTGTTCGGTCAGAAGAAGACAGTGCTAAAAAGCAGAAAACTTTCATCAAAAGCCCACAGGCAGTTGCTGTATCTGAAGAATCTACAAAAACAAATTTAACTTTTGTTGCTAAATCATCCGACGTTAACAGCAACTCTCCATTATCTACAGTACACCAGGCATCAGGATCAGGAGAAACATTTACCAAAACACCTGTAGAAACTGACCATACGGAACAACCTTCTGGTCAACCAGAACATAAACAGGCCTCCACTGACCTTGTTCCTCCAGAAAGCACCAAAGAACCGCTGATCCATTCTGGTAATGTGCTGGGTT
+>As166_1/1_1.000_1107
+ACCCAGGAGAAAGGGAACTATCAGAGTCACATGTGGGCACAGCATAAAATGCGGATTCACGACAAACAGCGAGTTTTCCAGTGCGACACTTGTGACTACAGCACCGATCGGAAGACCCGATTCACGCAGCACATGGCTTCTCATAATGACATCCGCGCGCACAAGTGTCCGCACTGCGACAAAACATTTGTCGCCAAGACAACGATGAACTCGCACATCAAGTGGGCTCACATGGAGAAAATCCTGCGTTGCGACTACTGCGACCACAAAACAAGCACGCTCAACATGCTGAGAGAGCACGTGCGAATGATGCACACTCACCGTGATGTCAAACCCTACAAGTGCGCCTACTGCGATTATCGGTGCCGTACCAGCGGCAACTGTCGGAAACACTGCATGAATCGACACAAGGATCAGGAGGTCAAGTGGGTACGCGTCTGCGAAAAATACCCGAACAACTCAAAGCCGTTGCTCAGCTTCGAGGCCGGCATGACGGAAAACGGGATTTCCCGGAAAGACTCTCGGACTCAACGGATCTTTCCCTACGAGCAAAACGAGGCGGCACAACCCGTGATCCTGAATAAGTCCCCGGGAAAAAAGTCGCCGGCAAAGGTCCTAGACGTCGAGCCGATGCAAGAAATCCTACCGGTCGTCGTTTCACAGAAACTGGAGAACATGCAAGACCAAGTTGACGCCACGATGATGCAAGTGGAGCGAGATTCCTTCCAAGTTCAACTGCAGCAGCTACAGCTCCAGCAGTCCCAGGCACAGATGCTCCCCCTGCCCCAGAACCAAGCGATCCTTGTGCAACCGGAGACCCAGACCCTACACCAGCTCCTCGGTCAACAAGTGCACACGCTGACCCAGCTCTCAGCAGAGGGGGTATCCCTGGAACAGCCAGTCCAGATGATCCAGCAAACGCACTCCCTCCCACCGCCACCGATGATGACGTCCACAGTTACCCAGCAGTTGCCGGTGGTGACGGGAGCGTCAACGCCCATAGTGGTTTCAGGGGCTGCTCAACTGACGCCGGTCCAGCAGCAGTATCTGCTTCAGTACATGCAACAGCAACAACAACAGCAGCAGCAGATGCAGTTGCAGCATCAC
+>As369_1/1_1.000_544
+ATACCCCACATACGGCAGAGCAGTTTCCTACGGAAGGATGGGGATACCGATCAGCAATCCTTCCGATACCGGTCTTCAGAGGAGCTTATACCAGTACCCAGAGAAAATTATTACTTTTGTGTCACGGGAAACGTGGATAAGATGGGTAAAATCAACAAGGCTGCTGATATCAAACCTGGTGTGAGAGTTTTGACGGCACACACTGGAGAGAAACAACATAAATGTACGTGCAGAATCTGTGGTAAAGGATTATCTCGTCCAGATGCACTTAAATCACACATGTTGATACATACTGGAGAGGGACCACACACATGCACAATATGTGGCAGAGGATTTAGTCAGAAAGGTCGCCTCAAATCACACATGCTGATACACACTGGCGAGAAACCGCACAAGTGCACAATCTGTGGTAATGGATTATCTCGGCCAGATGCACTCAAATCACACATGTTGAGACATACTGGAGAGGGACCACACACATGCACAATATGTGGCAGAGGATTTAGTCAGAAAGGTCGCCTCAAATCACACATGCTGATACACA
b
diff -r 000000000000 -r d33ad52f59bc test-data/orthogroups_withParalogs/orthogroup_2_5_sequences_withParalogs.fasta
--- /dev/null Thu Jan 01 00:00:00 1970 +0000
+++ b/test-data/orthogroups_withParalogs/orthogroup_2_5_sequences_withParalogs.fasta Fri Feb 01 10:25:10 2019 -0500
b
@@ -0,0 +1,10 @@
+>Ac386_1/1_1.000_378
+ACTCTACCAGTAAACACGTCGGTTAGCGTCGGCGGCTGGGGAGTCGCCGACCCTGATGATCTTTCTGAAGATATGGGCTTACCAACGATCTTACAAAAAGCTCAGTTGTTTGTGGCTGACATCGGCGATTGTGAGGCGGTATATAGTGTTCCCGTCACCGACAACCAGATCTGTATCAAGGATGGCAGCGGAAACACCGAGAAGGGAACGTGCGCAGGTGATGAAGGCGGACCTCTCATGTTTGAAGAAAATGATGTCACCTCTGTGGTTGGAATAATATCATATGGATCTGAAGGAGGATGTGTCGTTGGTGATCCTGCCGTGTTCACAAATGTGGCCAAGTACATCGACTGGATCAAGTATGTGATGGAACACAAC
+>Am7_1/1_1.000_325
+GGGGCCCGGGATGTCGAGGATGTTGTACTCGTAGTTGCTGTGGTTGACGTGGTATTGTTGTTCCTGGCTGTGGCTCCGTTACCACTTGACGTGGCTGTTGTGGTGCTGGTGGAAAAACGACTAGTGGTTGTGTCTGCAACTAATTCCTCGCCTCTAATCAGAATTAATGGACTGTCTGCAATACGAATTCCACGCAGGCTTTTGTCCAATTTGGCAGATTTTTCCTTGCTGGTTATTTTAGGTTCAGTTTTGGTCAAATCCAGTCTGTCACTGATCACACCATACGCCAATCTGCATACTCTCCCATCCTCCAGATCGGAAGAGC
+>Ap12_1/1_1.000_582
+GATGGTGTTGCGCTGTTCTGCTTTCTGCACGCATTTTATCTCGTCAAAACGCAGCCGTTGCTTCTCAGTTTGTTTATGTTTGTTGTTGTTTTGTTTTGTTATTTCCTTTCAAGTCGCCCTGATACAATGCTGTCACATAAACACGAGGTCATCGGACGTTTTCCGTCGATGTCGACATATATATATTTTTCCCCGCTACTTGTCCATCCATCCATCCATTCGTCTACCTGTCTGTCTTCTACGCCGTTCTGGTTGTTGCTGGCGTCTGCTGTAGCAGTCGTTATTGTTGGCGGCGGCGGTGACGTCTCCTCCGTTGGCGTGGACGGCCACAGCTCACAGCGACACCTGTCGGCGTCCGGTGGAGTCGGCTTGTTCCGGTGCCGTTCGACGTCCTGTGCCGAACGCCACCTGGCGACACGCATGCGTTATGACGTCGCCCGGCCGCCATTGAAGTCTCCAGTGATCGGTCCACACACACACACACACAGCTGTAACAATAAAACAGACAAGACACTGGCCTTACTCAGGATACAGTCGCTATTTAATAGATTGGCCTTAGTCCACGTGACCATTTGGGGTCGG
+>As119_1/1_1.000_543
+GGCGAACACCGCCGCCAGAGTTCGAACCCGTTCCGGGATACGCTCAGCGCTGTCGAGGTTCACGTCCACCCGGAGTACGCGCCGAACCCGGACGTGGGCCGGGTCGAGTACAACGACGTGGCTCTGCTCCGCATGGAGCGCATCATCGCCTCGACCATAGCGCACTATCCCATCTGCGCGCCGCCCACCGGCCCCGTCAACCACACGGACGGCATCATATGTGGCTGGGGCTCGAACGACGGCATCGACGGCCGGCCGACGAACGAGCTGCGCTGTACGTATCTGGACTTCCTGCAGAAGGACACCTGCGTACAGGCGTACCCGGACGACCCGCTCGATGACGCCATGTTCTGTACCTTCACGGCCGGCAGGGATGTATGCACTATTGACCGCGGCGGTCCGATAGCCGTGAAGATTGACGGGCTGTTCTATATCCTGGGGATAGCCTCCTGGTCGCCAGGCTGCAGTCAGGGTCCACCGTCCGTGTACATGGATGTCGCCTACTACAAGGACTGGATTGACAGTGTCATGCTCTCAGCAAAA
+>As170_1/1_1.000_1203
+CGAGGGTCTGGCACCAAGGACAGTCCAGCCTGTGGACCCAACAAGCCACAGGTTCTGGAGCGGGAGGAGGGAGAGTTCTCCAGCTATGGGTACGAAAGCGACAGGAAATATCTCAACGACATGGACTGTGCCTGGAGGGTTGTGGTAGCCCCTAACATGAGGGCCCATCTGCATTTCATGAATTTCGAACTGGAAGCATCATCGCTGTGTTGTTACGACAAACTTCACATATACGATGGCTACGACGGTACTGCCGAAAAGTTGGGTCTGTACTGTGGCGATGGCACTCCTGGGGACATCACTGGCTCTGGTAACGTCCTCTACGTCGTCCTGAAGACCGACTCGAGTGTTACAGCTGCGGGCTTCCATGCGAGGTTCAGCGGCAAGGAAAAGATGACTCTCGGATCTGGAGGAAATGATAATGTAATGTGTGGAATGCCGTCGATCGACCCTAAGTTCGGCCGGATCGTGGGAGGACAAGAGGCGATTCCGCACTCCTGGCCGTGGCAGATCAGCATGCGGAACAGGAACCACCCGCACACAGACGGCTGGGGACACTGGTGCGGCGGGTCGCTCATACACCCGGACTGGGTCTTGACGGCAGCCCACTGTGTGAATGACAATCCTAACTCGAGCAACTACCGTGTGTTGATTGGAGAGCACAACCGCCACGAGACTGAACTGAGCCAGGTGACCATCAACGTGGAGCGAGTGATCGTCCACGAGTCGTACGGCTATGGTGGCAGATACAACAACGACATAGCCCTGTTCAAGCTGGCCTCGCCCGTGGACTATGCCAGTGAGGTGTCACCCATCTGCCTGCCAGCCAACGACATCCCGCCCAGGACGCTGTGTGTGACGACCGGCTGGGGGGAAACTGAAGGTGCGGGTGACCGGATCAGTCTGCGGCAGGTGCAGGTGCCCATTCTGCCCCGTGCCGAGTGTAACCAGGCCGACTGGTACGGCGGCAGCGTCACCCCGGAGATGATCTGTGCCGGCTACCCCGAGGGCCTCAAAGACTCCTGCCAGGGTGACTCTGGGGGACCTTTCGTGTGTACAACAGGTGGCGCCTGGCAATTGCACGGGATAACGAGCTGGGGCAATGGTTGCGCCGAGGCCAAGAAGCCCGGGGTGTACACCCGAGTGTCAAGATACATCGATTGGATCGAGGAGAAGACTGGAGTGCAGTTCGATGAGCGGATC
b
diff -r 000000000000 -r d33ad52f59bc test-data/orthogroups_withParalogs/orthogroup_3_3_sequences_withParalogs.fasta
--- /dev/null Thu Jan 01 00:00:00 1970 +0000
+++ b/test-data/orthogroups_withParalogs/orthogroup_3_3_sequences_withParalogs.fasta Fri Feb 01 10:25:10 2019 -0500
b
@@ -0,0 +1,6 @@
+>Ap34_1/1_1.000_337
+AAACAATTAACTGTGTGCACAGAAGGACAGTTTAAATGTGCCAACCATCACTGCATCAGTGCCAGCAGTGTCTGTGACAAATATGATGACTGTGGTGATATGTCAGATGAGATTGGTTGCCATAAAGACAGCAGTGAGGGATGTTCAGTCAATAATGGTGGGTGTGAGCAGAATTGTACTGATTTACCCGACAAGGGTCATGTGTGTCACTGTGACCCCGGTTACATCGTCAATCAGGATGACAAAACATCATGCTCAGACGTTGACGAATGTGCTTCTTGGGGTAACAAATGCTCACAAATCTGTCACAATATCAAAGGTTCCTATAAATGTGCTT
+>As255_1/1_1.000_648
+AACTGTACGACGATGTGTGTGAACACCCCCGGGGCCTTCGAGTGTGTATGTCCGGTCGGCTACCGGCTCAACCAGAACGGCAGCTCGTGTGAAGACCGAAACGAGTGCATTGATGACAACGGCGGGTGTGACCAGTATTGCCTCAACATGCAGGGATCGTATCGTTGCGCATGCGCTCAAGAGAGCGGATACATGCTCTCTACTGATAGCCACAACTGCCTTGTGATTTGTCCAGACCAATTCACCGCCATCAACCAGAACGATACTTGTCTGCAGGTGCAAGGGGCGCGGATGAATACATTCGAGGACGCGGAGGAATATTGTCGACGGTTGCACGCGCAGTCACACCTAGCAACCGTGGAAAGTTCCGGCAAACTTCGGGACATTTCGGCACTTCTACAAGGCACCAACATTACCAGCATTTGGACGGCAGGGAAGTACTGGCGACCAATCAGCGACTTCATATGGATTACGTCATATGACGTCATATCTGGGTTGAATCTGACCAATGCCATTGGGCCGACGTCATTACAGGGCACGTGCGTTGCCTTGACAACCGAAACATCGCAGGACTCACGTCTCATTCCTCAGAACTGTGTTTTTTCTAAACACTTTGCTTGTGAAATTAAATGGAATCGAAATCGCGGA
+>As422_1/1_1.000_636
+GGGAAAGCGGGAAACACGTGCCTGGATTACCTGACCATTCATGACGGCGCCAGTGCCACTGCCTCGGAACTCACGAGTGAGCCTCTCTGTGGCACGATACAAGACGAGTTCAACCTGACGACGTCATCAAACCACGTGACCTTCCATTTCATATCGGACACGACAGCCGTATATCGGGGATTTGCCTTTGAATATACAGAGTTCACAATAGCCCCGTGTGACACGACCCAGTTTGAGTGTGACAATGGCATCTGTATCAACATCAACAACGTGTGCGATGACGTCACGCAGTGTGGAGACCGGTCGGACGAGGGCCAATGCTCCATTGATGCGATATTGGCCTCCCAGCGAGGAGACCTACCACTGATTATAGGCTGCAGTGTGGCCGGGCTTATCGTTCTTATCATTATCATAGTCATCATCTACAAGGTGTACCAGTACTACAAGTGGCGTCGCTTCATCAGGCTGAACCAGGAGGTGAGTGTCGACGACCTGTACCAGTACCCGGTCACCGACCTCTACAACCGACACGACATCGGCAAGAAGGGCCGCCGGCCGCCGAACGTCAGCTCCTACTACCGCGCCCCCGCCATGGCCACGCCCTACCACGAGAACGGCGCCTACATCGACGAGATG
b
diff -r 000000000000 -r d33ad52f59bc test-data/orthogroups_withParalogs/orthogroup_4_3_sequences_withParalogs.fasta
--- /dev/null Thu Jan 01 00:00:00 1970 +0000
+++ b/test-data/orthogroups_withParalogs/orthogroup_4_3_sequences_withParalogs.fasta Fri Feb 01 10:25:10 2019 -0500
b
@@ -0,0 +1,6 @@
+>Ac103_1/1_1.000_315
+TGTTCATGTCATCAAAAACGCATAGTCCACAGAGATCTAAAGGCAGAGAATCTCTTGTTGGACAATGACATGAACATCAAAATAGCTGACTTTGGCTTTAGCAATAGCTTCACACCAGGGAACAAACTAGACACATTCTGTGGTAGTCCACCTTATGCAGCACCAGAATTATTTCAGGGCAAGAAGTATGATGGTCCTGAGGTGGATGTATGGAGCTTAGGTGTAATTCTCTATACTCTAGTCAGTGGCTCATTACCTTTTGATGGTCAAAACCTGAAGGAACTAAGAGAAAGGGTACTGAGAGGGAAGTACAGA
+>Ap11_1/1_1.000_406
+GAGGTACCCAGTGTGGCTGTACCAGGTGTTGTTTCAACCGTGGTACAGGATTCAGCACACAAGATCTTCATTGGTGGTCTACCAAACTACTTGAATGAAGACCAGGTTAAGGAACTGCTGACATCATTTGGTCCCCTGAAGGCCTTTAACTTGGTGAAAGATAGTGCAACTGGACTGTCGAAGGGTTATGCATTCTGTGAATATCTTGATCCTTCCATAACTGATCAGGCCTGTGCTGGCTTAAATGGAATGCAGCTTGGAGACAAAAAGCTAATTGTACAGAGGGCAAGTGTTGGTGCCAAGAATGCCCAAGGCGGGCCCAATGTTTTGCCAGTTCAGCTGCAAATTCCAGGACTTAACATGGCCCAGGTGCAGGGACCAGGTCCTACGACAGAGGTCCTCTGCT
+>As137_1/1_1.000_685
+TATTTGGCCTGTGTACATTTACATTTCAAAATGGCTGCCCAAGCGACTACGGCAAAATATAACGATTTATATGAATTGAAAGAAGAGTTAGGAAAAGGCGCCTTTTCAGTTGTTCGGAGATGTGTACAAAAGACTACCGGATTAGAATTCGCTGCCAAAATCATCAACACAAAAAAATTGTCAGCTCGAGATCACCAGAAATTGGAACGTGAAGCTAGGATCTGTAGATTACTAAAGCATCCAAATATAGTTCGACTCCATGATAGTATACAAGATGAAGGATTCCATTATTTAGTATTCGATTTGGTCACAGGTGGCGAGTTATTTGAAGACATAGTCGCCAGAGAATTCTATAGTGAAGCTGATGCTAGTCACTGCATGCAGCAAATATTAGAGAGTGTAAACTATTGCCACCAAATGGGTATAGTTCATAGGGACTTGAAGCCTGAGAATCTGCTGCTGGCAAGCAAAGCCAAAAATGCTGCTGTGAAACTTGCTGATTTCGGCTTGGCCATCGAAGTACAGGGCGACCAACAAGCATGGTTTGGTTTTGCGGGAACCCCCGGTTACCTGTCACCCGAGGTACTGAGACGAGACCCGTACGGCAAACCGGTGGACGTCTGGGCTTGTGGCGTAATTCTGTACATACTGCTGGTGGGTTACCCGCCGTTCTGGGACGAAGACC
b
diff -r 000000000000 -r d33ad52f59bc test-data/orthogroups_withParalogs/orthogroup_5_3_sequences_withParalogs.fasta
--- /dev/null Thu Jan 01 00:00:00 1970 +0000
+++ b/test-data/orthogroups_withParalogs/orthogroup_5_3_sequences_withParalogs.fasta Fri Feb 01 10:25:10 2019 -0500
b
@@ -0,0 +1,6 @@
+>Ac102_1/1_1.000_654
+GACAAAGGCTTGCTGAGTTCAGTAAAGGATTCCATTGTTCAAGGTTTCCAGTGGGGTACACGAGAAGGTCCTCTTTGTGATGAACCAATTCGGAACACAAAGTTTAAGATCCTGGATGCTGTAATAGCATCAGAGCCAATACACAGGGGAGGAGGTCAGGTTATACCAACAGCCAGACGAGTAGCTTACTCTGCATTCCTTATGGCTACACCACGTCTGATGGAACCTTACTTCTTTGTAGAGGTTCAAGCCCCTGCTGATTGTGTCTCTGCTGTATACACTGTATTAGCTCGAAGAAGAGGTCATGTGACAGCTGACGCTCCAATACCAGGTTCTCCAATGTACATCATTAAGGCCTTCATGCCTGCCATAGACTCCTTTGGGTTTGAAACAGATTTAAGAATCCACACACAAGGACAAGCTTTCTGCTTGTCTGTGTTCCACCATTGGCAGATTGTACCTGGTGATCCCTTAGATAAGAGCATAGTCATACGTCCACTGGAACCACAACCAGCCACACACCTGGCGAGAGAGTTTATGATAAAGACTCGTCGCAGAAAGGGGCTTAGTGAAGATGTCAGCATCAACAAATTCTTTGATGATCCTATGTTGTTGGAGCTTGCTAAGCAAGATGTTATGCTTAGTTATGGAATG
+>Am92_1/1_1.000_509
+CTTGCCGGAGTCTTGGATGGAGTTCTGGGTGGTTACCCGGTGTTTCTCATGGCTTCATTCTCATACATTTCTGACATTACTCTACACAGCAATAGATCTTTACGAATTGTTATCCTGGAGGTATGTATCAGTCTCGGGGGAACAATCTCCTATATGGCATCAGGATTACTCATTACTCATCTGAATTTCTTAGGAACATGTATAGTCCTGCATATAATTGTGGTACTAGATCTGGCACTAGTGGCATTTTACTTGCCAGAAACAGTGCAAAAACAAGAGGATATTACATTTTGGACTTTGGATCATTTCAAACAATCTTTCAGAGTGTATTTGGAAGATGAAGGTACTGGCAGAAGAGGACTCTTACTCACATCAATGCTGGTCTTATTAATTCTGTGTCCAGCAGCAATAGGTGAAGATGATGTTCTAGCATTGTTTGTGTTAAATTCTCCAATTTGCTTCACCCCAGATCTTCTTGGATATTACAAAGGAACTTTTTTCTTAGTTGC
+>As165_1/1_1.000_684
+TCCACGCCGTGGTGGGAACCGGATACAGCGACCAAGGCTACGGCACCAAGCACGAGTACGGCCACCAGCAGCAGAGCTACGGATACCACAAACCGAGCAAGTTCTGCTACCAGTGCGCCTACTCGCCGCCCAAGACGTACTACGACAAGAAGGTCGTGGTCGAGAACTATGAGTACGGACAACACAAGCAGGGATACCAACAGGGCGGCTACGGGGACGACAAGAAACAGGGCTATGGCCAGCAGGGCGGCTACCAGAAGAAGACTTACGTGCCGGTGGCGAGGACGGTCTACGGGGGCTGGGACAAGTGTTTCGGCTCGTTCGACCACGTCCAGGCCAAGGAGTTCGGCATCGACGTTTGGGAGTGCCACAGCAACTGCTACGTGCGCAAGGACCCCAACGGAGACCTGTTCCGCGGCTGTTACAAGGGCGAGTATGCGGTGGACCCGCACAAGTACGGCTGTAACCACCAGGCCGGGGCGCTCTGGTGCTTCTGTGAGGGCGACAAGTGTAACAACCAGGACATCGGCTACAACTAACCGTCCCAGCCAATCACAGCCGTCCACACATCTGTTTGTCTGCCAGCAACCAATCACAGTCGTGCTCACAGCTGGCTGCTTACCAGCAGCCAGTCACAGTCACCGATACATCCGTTTGTTTCTGCTTTTAACCAATGGCAGCCGT
b
diff -r 000000000000 -r d33ad52f59bc test-data/orthogroups_withParalogs/orthogroup_6_3_sequences_withParalogs.fasta
--- /dev/null Thu Jan 01 00:00:00 1970 +0000
+++ b/test-data/orthogroups_withParalogs/orthogroup_6_3_sequences_withParalogs.fasta Fri Feb 01 10:25:10 2019 -0500
b
@@ -0,0 +1,6 @@
+>Ac109_1/1_1.000_333
+AACTTCCTGTACCTTGTTGGCAATGTTTTCAACCTTCTTAGCGTGCTTGCCAAAATCTTCAAACATACGGCTCATACCGCGGTCAATTCTGTCGATGAGGTTGCTGTGTTCGCCGACCGCCTTGGTCAGATCCAGAGAGGCTTCCTTCAGCTCGCCGATGTCCTTGTCGTGCTGCATGTTGAGGTTGGCACGCTCGCACTGGCCGAGCGACGCGTTGAGCACGCGCACCTCGACCCGCAGCAGCCGGTCGTCGTTGGAGTCGATGCGGCCGTCGAACTCCTCGAACTTCTTGTCGATGAAGTCGAAGACGTCGGCCGCCTCCAGGTGGTGATC
+>Ap10_1/1_1.000_338
+CCATACTCAGCCGCCAAGACCACGGCCCAGGCTGCCACAGATGACCTGAAGAGACGTCAGGAAGAACTGGAGAGGAAGGCTGAGGAACTACAGAGAAAGGAACAGGAATTACAGAGAAACATGGGACACCAAGCCAGGGTGAACAACTTCCCACCACTGCCTGAGAAATGCTGTGTCCAGCCTTGCTTCTATCAAGATTTTGAGCTTGACATCCCATTGGAATTCCAAAGAATTGTAAAAACAGTGTATTATGTGTGGATAGCCTACATATGTCTGTTGATTCTGAATGTACTGGGAACACTGGCCTACTTCATAGCTGCGTCCAAGGCAGGTCATGG
+>As95_1/1_1.000_729
+GTGCAATATCCGAAAATCGCTGTTGGATTGCAAACTATTCCACAAGCCAGTCTTCTCTCGCATCTAATAGGAGACCCTACACTCACATTATATATTATAGCAGCCCACACTCACTATAAAATGCCTAGAGGACGTGGAAAACGCGGTAGTCACAAAGGCGGCCACCGAAAGTTCACGAATGCAGAGGAGTTGAAGCAACAACAGAGTAAACAAGAGAAGGAGAAAGAATGGCGGAAGATGAAGGGTCTGCCGAGCGACGAGTCCGGGGACGAGGACGAGGAGGGCGGAGCAAAAGCCGCGGCCAAAAAAACTGAGGACGCGGAGGAAGATGTCAAATTTGGGGACTCGTCCTCGGAGGAGGAATCATCAGAAGAGGAAGAAGACGCTAAAGCAAAAGGAGTATCACATTTAATAGAGATAGCAAATCCAAATCATCAAGTCACCAAATCTTCCAAGAAAGTGACGGAAATTTCAGGAGACGCCAAAGTGAATCTATCAAGAAGAGAAAAGGAGGAGCTTGCCAAGCAGCAGGCCAAGGTGCAGTACCAGAAGATGCACCTGGAGGGCAAGACGGACGAGGCGCGATCGGACCTGGCTCGCCTGGCGCTGATCCGCAAACAGCGCGAGGACGCCGCCAAGAAAAAGGACGAGGAACGCAAGCAGCGCGAGGCGGCGGCGGCGGAGGCGGAGCAGAAGCTCAAGGACAAGCGTGCGGCCGCCCGGGGCCAA
b
diff -r 000000000000 -r d33ad52f59bc test-data/orthogroups_withParalogs/orthogroup_7_2_sequences_withParalogs.fasta
--- /dev/null Thu Jan 01 00:00:00 1970 +0000
+++ b/test-data/orthogroups_withParalogs/orthogroup_7_2_sequences_withParalogs.fasta Fri Feb 01 10:25:10 2019 -0500
b
@@ -0,0 +1,4 @@
+>Ac113_1/1_1.000_323
+TCGATCCTGAAGAGTTCTAACGGAAAGAGGCTGATCCCGATCCCAGCCGACGAGGGATCGTTAGATCCCGATTATGAAAGTCTGAATAAAATAAAGCCATGGAGTCCTGTTGATGACGAGCACATCCGGATGGATGACGTTTCGCGCGAAATGCAACGCATCCACGACAACCTGGAGCGCATGCGTAAGCAGACGATGCTCAACTTCCGGCCGCCGCCTCCACCGCCACCGCCTTTCGATCCCATGATGCCTCAACTACTTCCGGTTCCTCAGTTCACCATGCCGTCGTTTCCGGCTTTGCCGGATCCAATGGCGCCGATGCC
+>Am9_1/1_1.000_360
+AGCCATCAAAGGTTGCTAATCATGTTGAGTTGTATTGTCAAGCATTTCTACTCGAGGCAACCATTAATAATTGAAGTTATCAGTTATATTGTCAACTCAATGGAAAATCAAATGGATTTAATTAAGGAAGGAAGATTTTGTACTTGTAAATCTGCATTTTATTACAAAATGTGTAATAAAATTACAATTCTCAAATGGATTCATATATATGCAAATAAAGGATTTATGAGTTATGATTTAAGAGTTGATCTTTCTTCTAGAAGTTGCATGTACTTGTGTAAACCACTAACAACTACTACTATAAAACTACTTGACATAATTCAAAACTACCGACATATATTCCAAATAAAACTTAGCTCA
b
diff -r 000000000000 -r d33ad52f59bc test-data/output_filterassemblies/AcAcaud_trinity.fasta
--- /dev/null Thu Jan 01 00:00:00 1970 +0000
+++ b/test-data/output_filterassemblies/AcAcaud_trinity.fasta Fri Feb 01 10:25:10 2019 -0500
b
b'@@ -0,0 +1,782 @@\n+>Ac1_1/1_1.000_629\n+CCACCACTGGCACAAAGGATTATCAAGGCTCATGACAAAGGTATAAATAAGACATTTTATGGCCAGCTGGTCGGTCGATGTGCTAAGGAGTTGTCTCTGGTGCAGATTAAACTGCTGCCAGAAAAGGTCAGAGAACCAGTCTTAAAGAGATACAAGATCTATGAGGAGAGAAAAAAGCTGGAAAAAATGACACCAGAAGAAAAAGAAGAATACATGAGAAAGAAGAAGGAGGAATACAGAAAGAAGTTAAATGAGATGCTGAAGAACCGAAGACTTGAAAAACACAAACGTTTTGAAGACACCGATTTGGAACTGAAGCCCATTCCAACTCCACGCCTTGTGGAAACTCCTGATGGTCTGGCAAATGAATTGTTTGGTTATGTTGCTATGGTGACTGAATTCATTAGCTGCTACAAAGACCTCTTCACGCCAAAGGATGACAGCACTGTAATCAATGTGACCACAGATGCCCTGATGACCAGCTTAGTGTCTGATGGTAGGCAGTCTGGACCAGTAGCTAACATCCTGACAACATTGCTGCAGACTTTGTTACAGGATGGCATCACAGAGGATTACACAGAGCTCGGTTTGAAGATGTCTGAAATCCCAGTCAACCAGTACACAGCCAG\n+>Ac2_1/1_1.000_896\n+ATGTTAGTAAAAGAGATTAAAGAGTACCGAGAGATAAAAGAGAAGGCTAGAACCTATCTATGTTATATTATAAGTAGTAACCTATCTTATGGTTCAAGCATAAATGAGGAGACTCTTCAAGAGAGTATGGAGATGTTAAAGAGGGCAATCCCAAAGAGTGAGGTCATCTATGTTTTAGATAGCGAAGGGATGCAGATAACAGATAACATATCACAATTCTCTAATCTACATGGTATAAATAAGGGTAAAGATAGGAGTAATCGTTCTTACTACTATAATACAAAAGCACAACATCGTTGTGAAATATCCGACCCTTATCCATCAATAGCGAGTAAACATCTGATTGTTACATCTAGTTTTCCTATTTATGATGAGTTTGATAATCTTCTATACATTATATGTGTAGAGCTTAGTTTGCAAAATATCCTAAGAGTGGTACACCCAAGCTCTGTGGACTCTATGTTTGGAAATGGTAGTAAGGTTGTTTATACAATATTCTCTTTAGCTCTATTTTTTGTGGCTATGCTTCTTTTTGTAAAGGGAATTACAAGTTTTGTGGGGTATGGAATAGATTTCCATAAAGTAGAGATAAATGATATGTTTAAATCGACAATTCTACTTACTCTATCTTTGGCTATTGTTGATTTGGTAAAAGCGATATTTGAAGAGGAGGTTTTAGGAAAAGAGAAGAAGCATGGAGACGGGGATACCCATCAAACTATGGTTAGATTTTTGGGTTCGATTATTATTGCCCTATCTATTGAGGCTTTGATGTTGGTATTTAAATTTGCACTAAATGACCCAAGTCAACTACTCTATGCTGTATATATTATGTTTGGTGTAACAGCTCTGCTTCTTGGTTTATCATACTATCTAAAAGTGAGCCATGATAGTTG\n+>Ac3_1/1_1.000_252\n+ATCTGTAATGTCGTTTACCACACACTGGACACTGATATTTCCGCTCGCCAGTGTGTGGTAAACGATATTACAGATCAGATGTGCTGGCAATCCATATCAGTACACACAGCAGTGAAAAAAATCATAAATGTGACATCTGTGGCAAGGCTTTCTCAAATGCTAGTTATGTCCACGTGCACAAGAAGATGCACAGCAGTGAAAAAGCACACTTGTGTGTTCAGTGTGGGGAGAGGTTTACAAGAGCACAATCAC\n+>Ac4_1/1_1.000_165\n+AAACAATGCAATCCTCTACCATTGCCAAGATATGAAGAACAAGTAAATGGCACATCAACAACAATGATAATAATAAGTGCTAATAACAATAAGAGTAATACAATTACC
ACAATATCTGAGAACAAGGGGCTTAAGCATAGCTATCATTATTTGGGAGGGGAGGAT\n+>Ac5_1/1_1.000_447\n+GCACCGGGATGCGGATTTGCTGACGATATGGCAAAAGCATTGTCAGCGTGCGGAACCTGTTTATGTCACACCACTGGCATCTTCCTGGCCGTCGCAGCCTTCGTTCTGACGGCACTCGGTATTGTCTGCGTCACGCGATCAGCTGACCCGAGCCTTTGGTACAAACTCGGTCTGGGAGCCTTCGCAGTGGCCGGCCTGTTCGCGCTACTTCTCACATGTTACGCCTGCTTCACGATTCACCGAGGTTGGAAGCTGTTCGGGTGCTGTGGCGACTGGACACAAGGGAAGCTTACCGAAAGACAGGCCCCCGTCAACTTGTATGCCACTCGTATCAACCCCAGAACAGATCCAAGGTTAGCTTCTAGACAGACTTCAAAGACCGACTCAGTGCCGGATCGAGGGACGGAAACGAGCGCCAGTCTACCTTCTAATGTTATTGGAATGGTG\n+>Ac6_1/1_1.000_393\n+CAGCCTACCACTGAGAAGAGATACTTCAACATGTCTTACTGGGGTAGAAGTGGTGGTCGTACAGCGGGTGGTAATGCAGGACGTGGTCGTGGCGGCGGCAGCGGCAGTGGCAGTAGTCAAAGTGGTGGTGGCAGCTTTCTACAGGAACGTATCAAAGAGATGAGTGCCCAAGAAAAACTCATTGAGCAGAAGAAAAAGGAAATAGAAGCTAAGCTCCTTGAACAAAAACAGAAGGAACAAGAAAAGGTTCTCTCAAAACTTCAGTCAAAAGCAACTGCTAAGACATCACTTACAAAGATTGGAAAAAGACCTGGTTATGGACGAGGTGGCATATTTAGTACCAAACGTGTGAAGCAAGAGGAGCCAGATGCTGAAACTGACACAACTCCACAG\n+>Ac7_1/1_1.000_614\n+GCACCTAGAATTACCCGAAGTTGCTTGGCAATAGCGACACCTAACGGTCGCCATGATATTTGCAGGAAGAAGGCATGTGGTACCATTGGGAACCGTCAAGCGTTTCCTCAGCCCTGTGGCAGCTGCCCGTCTGCGCCCGTGTTTGACCTTGAGCACCAAGTCACGACCTCTGTGTCCGTGTGGGTGTGCGCCCGCGCGCGCGCTGCCAGGCTCGGTTCAGACACGTTAAGGCACCTTCGTTCCGGTGGCGTTGGAATGGACGCGTTGGTGAGGCACTGGGACACGACCGTGAATCAAACTGGACGGAACCCGGTCTGGCACGCGCCGACACACGCACACACACCGATAGCAGCCGACACGCCGTGGTCCTTGGCTCCGGATTACAACACCCGGCACGGCATCCTCGGAACGGCGTCTCGGCGAAATGGAGAAACGATCCAAGTCAAGTCTTCGTCTACTGATTTGTCTACGGCGACAATGTACAACGGATGGCTGGGATATGTGTACCGCTGTCAAACCGGTCGCAGACGCAGGGGCCGTGCCCAGGACACGAACAGAGACACATTACAGTCACACCTGTCTGGGCCGACCACCCAAACAGTCCCATCGTCCAC\n+>Ac8_1/1_1.000_332\n+ATCAAAGAAGAGCAACATCGAGCTACTGGCACTGGCAATGGAATCCTAATTATAGCAGAAACAAGCACTGGTTGCCTGTTGTCTGGGTCAGCAATTGGTAGTAGAGGTGTTCCTGCTGAAGAAGTTGGGGTCAAAGCAGGACAGATGCTTTTGGATAACTTAGGTCATGGTGGCTGTGTTGATGACTATTTACAAGACCAGCTTATTGTACTGATGGCCTTAGCTAAGGGCACATCACGAGTCAGATGTGGGCCAGTCACATTACACACACAAACGGCCATCGAAGTTGTCAAGATGTTAGCAGAGGTGAATTTCACCATAACACAAGTATC\n+>Ac9_1/1_1.000_303\n+GCCATTCGTCTTAGGAGAAGTTTGTCGTCAGGAAAGA
TACATGAGGCCTGGATTCT'..b'AGAGTTGGACAGAGAATGGCAGAGGATACAGAACATTATAGCTAAACGTAAACATGCAGCAGCTGCTGAGGGCAGTGGTGGAAAGCAGATGAAATTTGTTGAG\n+>Ac379_1/1_1.000_279\n+TTTCTAAACATGTTTCGGGAGGTATCAAAACAGTATTTGGCTATGTGTCCTTTGAAAACCATGAATTTGTCCCACCTGATGATCAATGATTTGACACAACAAAGAGAATTACTTTTAGCAACACTGCAACATCCACTGAGTAAACAGTATCCACCATCTTCACGTTATAGAAGACAGTTCCTCAAATTGATGATCCAGCAGATAGAAGAAAATAGTAATGAAGTCCTGGATGAATTTTACACTGAATACACTGCACTGTTGAATGAAAAAGAATCGGAG\n+>Ac380_1/1_1.000_213\n+ACTATTGCCCACACCGAAGCAGCTTTCTGCGCGTTCAGTGCCACAGTTGTTTATCACAAGGTGATCAAAGCCCATTCAGAAGTGGGGGGGGCCTTCGTTCAAAGGACTCGGGAAGCGACAGACCTCCGTCCGTCAGCGCGATGTGACGAGGCAGAAAGAAGGAACACAGATTTAAACGTAAACACACGGCAGAGAATAATACTGTATGAACGA\n+>Ac381_1/1_1.000_207\n+ACAATTTGGCAAGCAATGGAAACTGACCAAGTCAGAAGCTCTGAGAGAGAAAATGAAACGACAAACTCTCACCAAAGAATGGTTAATAAAGGTTCCACATTTTCCAGTAACCTAACTGAGATAGGCATTGTTATTACCATTAACTCGACTTTCAAACTATTTGCAAATATATCTAGCACAGTGAAAAATAAAATTGAGCGTGTAAGG\n+>Ac382_1/1_1.000_227\n+TTCAGGGCAAGGACTACGGTACGAGTACAGCGCAGTAACAACAACAACAAAGGCGGTCTGTCCAGAGATCAGTGCGCGGGTAACGAGGCCAGCAGTGCATGCATGAGGCATCTGCTTCAACCAGCAGACGCCCAGTATGTCGGATGTGTGTGTGTGTGTGGTTTGTCTATCTGTCTCTGTCTCTCTCTGTGTCAGTGTGTGACACCGGTGATAAGGTCTGGAGGCGG\n+>Ac383_1/1_1.000_135\n+TCAAAGTTTAGCCGGTCATCAAGTTCTTGGCTGCGTGCGCTCTGCTTTGTGCGCCGTTCTAGCATTCATACGAGCGACGAGGCTTGTCAGCTGAGACGACACTTCTCCCTCGCCCATTCACACGCGCAGCGACGA\n+>Ac384_1/1_1.000_174\n+CAAAAACGTTTGCATAAAAATACCGCTACAGGAACTCAGAAGATTTACATAGTTAACTCATCTGTTAAAATAATAATCGAGAACAGATCTTCCGCAATGACCATTTATTCGTTGTCAATACTCCACAAGACAGCACAGATATCACAATCTCACAACGGATGTCATGTGACGGTA\n+>Ac385_1/1_1.000_198\n+TTGGTGTGTTTCAAGGAAAACATCCTTACTATTTTGTTTTCTTTCTGTTTTTGGAAGACTTTTTTTTGTCCCGTTTTTTTATTTGAAATGCTATTGTTTAGTTGTTTAATCAGTAGTCACCTGCGTTTATCAGACGGTCGTAATAGGAACAGGCAAAGAGGTATGCCAGTTTTCACTCTGAGCACCACCTTGTATATT\n+>Ac386_1/1_1.000_378\n+ACTCTACCAGTAAACACGTCGGTTAGCGTCGGCGGCTGGGGAGTCGCCGACCCTGATGATCTTTCTGAAGATATGGGCTTACCAACGATCTTACAAAAAGCTCAGTTGTTTGTGGCTGACATCGGCGATTGTGAGGCGGTATATAGTGTTCCCGTCACCGACAACCAGATCTGTATCAAGGATGGCAGCGGAAACACCGAGAAGGGAACGTGCGCAGGTGATGAAGGCGGAC
CTCTCATGTTTGAAGAAAATGATGTCACCTCTGTGGTTGGAATAATATCATATGGATCTGAAGGAGGATGTGTCGTTGGTGATCCTGCCGTGTTCACAAATGTGGCCAAGTACATCGACTGGATCAAGTATGTGATGGAACACAAC\n+>Ac387_1/1_1.000_553\n+CAGAACAGTGATGTAGATCCTTTGTTTTACCTGGAAGATCGGCTTGATCAGAAGAAGCACCTGCCCCCCAACAAGGCTGCAGGTTACCTTGATCTGAAACATATGGTCTATTATAGGCTGGATAAAGGAATAACAGTACAGATAAGCAGAGCACATGGGCTGTCAGAGGGACTGTATTATGAATGCTTTGCACGTGTGTATCCAGGAGTAAATGCACAAGGGGAGCAAGTCACTGATGAGGGTTATGGCAGAGATGATGAGCAGATGGTGACACTGAAAACAGACATCGACAGCTATCAAGTATCACCACAGTGGAGAGATCCACCAAAGACAATACACCCACATTTGGATCCAAGAACATTCCTGATGTTACAGGTATTTGGTCTGAGTATCAAGTATACAGCTAACCCAGATCACAGTTCACCTGGACAACTTACAGATAAAAATGGAGAAGAGCTGAAACTGCACCCAGAAAACATTATTGGTTGGACAGTGATACCACTGTTTGAGAATATATACAGCTACTCAGGTGAACACCATGTACCACTCTTCA\n+>Ac388_1/1_1.000_336\n+GCCTACCCGCCATCCTACCAGACGTACGACAGGAGGCTGATCGAGGCGTTCAAACCCGTGGCCAGGCCAGTTGTCTATTCGGCCTACGAGACGCCACTCTACAGCCCACTGAAGGAATACGAGCCAGCCAGTGGCTACGGAAGCCAGAGTCGGACGTCCTATCCTGGATCATACTCACTCTTGTCCGCTGTTCGTCGACCAGTTACCTTGTATGACACGCTGACGGATAGCTACATCCCACCTCAGACATACACACCGAACATCTACGACCCATGTAGTACCCTGCCCGAGGGAGACTACTCCCTACAGGGAGACTTCCTTCAACTCTTCCCTGGA\n+>Ac389_1/1_1.000_204\n+GCAACCTTCCACGACCAAACATATCTAGTCGCAGCACTTAAGTGCGCAGATTGCATTCATACAGAGCAAACCGGATACAAACAAGACCAACCACGCGGGTGGCTGGCAGTAGCGTGGCTCAATGACGTATACAGTTCGTGTATTCGGTTATATTTGTCTGGGAGACTTTTGCGAAGGAATTGTTTCATGCATGACAATAAAACG\n+>Ac390_1/1_1.000_342\n+AAATGTTCACAACAACATCTTTCGTTGGATATAAATCAGCTTTTAAACCCGGGAAAGAGGCAGTGTCTACTGTCGTATCAAAGTAGCAAAGGCTCTTCATCTGCGAATGGTGTCGCGATGAGTTTCAAATCAACAGCGGCACCTGAACAGCGCCTAGAACAGCACGTTCCTTCTTCACTACACCATCCCGATAGCACACAAGTGTCTTACGAAAATCACCTATTTTCAAGGCAATCTAGCATAATATTTAATGACAAATTCAGAGCACATGCATTTTCGGAACAAGAAAACGTTACGTTGACTAGGTTATGCCAGGATTTAGCCAGACCAAATGTTCGGTTG\n+>Ac391_1/1_1.000_337\n+CTGCTGCTGTGGATCGGCTCGATCCTGTTCGGCTTCTCGATGGGCCCGATGATCCCGACCATGATATCCTGCGCCAACCTGTACCTACCTCTGGAAGGCGCGTCCGTGTCTTTGATGTTCTTCAATCTGGCACTGGGCTCCATGTGTTACCAGTACTTCGCCGGCTACCTGTACGACATGTACGGCCCGACGGTCCACATGTCCATCGTCCTCGGCTACTGCATCACGACCACGTGCGCCATGGCCGTCATGTGCGCCCTTCTCAGAAACAGAGACAATCGATTTCAAA
ACAGATCCGCCGGTGACGTCATCGAGCAGGACGTCACCGCCAACGGAA\n'
b
diff -r 000000000000 -r d33ad52f59bc test-data/output_filterassemblies/AmAmphi_trinity.fasta
--- /dev/null Thu Jan 01 00:00:00 1970 +0000
+++ b/test-data/output_filterassemblies/AmAmphi_trinity.fasta Fri Feb 01 10:25:10 2019 -0500
b
b'@@ -0,0 +1,254 @@\n+>Am1_1/1_1.000_262\n+GAAGAAGTATTAGATAGACTTTCTGCAGAGGAAATTAAACACATCTTACTGAACCAACTGAGAAACCAGGATTCAAAACCAGTTGTTGCACTTGGTATCCTGTTCCCCCGCGTGTCATATCCATATCTAGGTGAACAGCATTGCGTCAGATGTCACATGACATTCAATTCGAGATCTCAGACGCCATGTTTATTACGTCATCCAACCAAAGCAGTGTCAAAGTTTAAACAAAGTCCCACAGGAGCACATTTTCACTGTCGTG\n+>Am2_1/1_1.000_279\n+CTGAAATGGAAGAAGGAAGTAAAGCAGGCAGTGCAAAAGTATTGGTTACAGGAACTGAAAAATGAGGCCAGATATAAAACGACATTGGCATACCTAGATGTAAGCGATTGCCAACCAGGCCTGATGCATAATGTCTGGAGGAGAACACCACTCAACAAGGCAGCTGTACTGCAGGCTAACATCAGAGCACAATTACTTGTAGGTCGATATCCACTGCAGGACCAAGCAAATAAGTTTAATAAAACCAACCATAAGTGCCCAATATGCAAGGTAAATGAC\n+>Am3_1/1_1.000_141\n+ATGTCAACAATCTGGACGTTAATACCAAATAGTGAACAAACATTCTGTTATATAACTAAGCATGAACAAATTAACATTGTAAAAAAAACAGTTGAGTCATGGCTCATAAAGTCAGGTATAATTGATATTTATTTGGATGAC\n+>Am4_1/1_1.000_144\n+ACAGTTCTAAATAGCATTCGCCAAATGATATTGAAAGCATATTTTATGAATAGTGGTTCACAGATGAAAGATCATTATTGGGAACCCGTTCCAGCTTTTGTAGATCATTTTGTTCTTGCTATAGATCATCGACCCAGAATACAA\n+>Am5_1/1_1.000_224\n+TACTGCTGTCGAAGTGATGGCGCTTGGAACAGTGTGATAACCTTGCCTACAAATAGGCCATTCTATTTGCTCAGATACACAAGTCAATGTCAGCTGGTGAAAGGAATGAAAGTCAGAAGGGAAGTATTCTACTGGGATAATGAAGATATTAACAATATTGATTACACTACAGGATATCACCCGTATGAAGATGGAGGCAGATACAACCATAAACTACATTATTG\n+>Am6_1/1_1.000_361\n+ACCACACAATCATCTAGTGAAACATTTACCAAAACACCCTCTGAAACTGTTCGGTCAGAAGAAGACAGTGCTAAAAAGCAGAAAACTTTCATCAAAAGCCCACAGGCAGTTGCTGTATCTGAAGAATCTACAAAAACAAATTTAACTTTTGTTGCTAAATCATCCGACGTTAACAGCAACTCTCCATTATCTACAGTACACCAGGCATCAGGATCAGGAGAAACATTTACCAAAACACCTGTAGAAACTGACCATACGGAACAACCTTCTGGTCAACCAGAACATAAACAGGCCTCCACTGACCTTGTTCCTCCAGAAAGCACCAAAGAACCGCTGATCCATTCTGGTAATGTGCTGGGTT\n+>Am7_1/1_1.000_325\n+GGGGCCCGGGATGTCGAGGATGTTGTACTCGTAGTTGCTGTGGTTGACGTGGTATTGTTGTTCCTGGCTGTGGCTCCGTTACCACTTGACGTGGCTGTTGTGGTGCTGGTGGAAAAACGACTAGTGGTTGTGTCTGCAACTAATTCCTCGCCTCTAATCAGAATTAATGGACTGTCTGCAATACGAATTCCACGCAGGCTTTTGTCCAATTTGGCAGATTTTTCCTTGCTGGTTATTTTAGGTTCAGTTTTGGTCAAATCCAGTCTGTCACTGATCACACCATACGCCAATCTGCATACTCTCCCATCCTCCAGATCGGAAGAGC\n+>Am8_1/1_1.000_144\n+GTATTAATAAAAGGACAAGACTATTATTTAATACCAAGAAATCTGGCCTTAAT
AAGCATGGTTGCTTATATCATAAGCATGGTAAATCACATTGTGTTTTCCATGTGTTTACCCATCAGATGTAAAAATATTCTGCATGAAATA\n+>Am9_1/1_1.000_360\n+AGCCATCAAAGGTTGCTAATCATGTTGAGTTGTATTGTCAAGCATTTCTACTCGAGGCAACCATTAATAATTGAAGTTATCAGTTATATTGTCAACTCAATGGAAAATCAAATGGATTTAATTAAGGAAGGAAGATTTTGTACTTGTAAATCTGCATTTTATTACAAAATGTGTAATAAAATTACAATTCTCAAATGGATTCATATATATGCAAATAAAGGATTTATGAGTTATGATTTAAGAGTTGATCTTTCTTCTAGAAGTTGCATGTACTTGTGTAAACCACTAACAACTACTACTATAAAACTACTTGACATAATTCAAAACTACCGACATATATTCCAAATAAAACTTAGCTCA\n+>Am10_1/1_1.000_318\n+AGCAACTTTGCCACCACCACCACCACCAACAATAACAACAACAGCTGCAACACCGCGACCAATAACAACAACAACACTGGTAACACTAACCACGTCACCACCAGAAATAACATCTTCACAACCATCACCAACACTACCATTAACTCAACTTATAACAATAACAACACCTCAAGTGTTGCTACCTACATCACTCAAAACAATTACAACAACATCAGAATCGCCTTCGACACATACACAAGCAACAATTTCAACAACTTTTGTGCCACAAATATCTGCCACAACAGTCCATTCAGCTCCCCCTACCTCACCACTCACTAC\n+>Am11_1/1_1.000_207\n+ATTTTTTGTAGATATTTTTATCTATTTACATTTCTATCTTTATTTCTCCCTACGACCGAAGGCCTCAAAGAGCATATGATTTATTTCTGTCCATTTATCGACCGTGCGTCTGTCTGTCCATCCGCCTCCCTTCCACAAACAGCTGCCGCTACTGTTATATTTAAAGTTTTCTGGTATCGCTTAGTCCGTTTTCTGGTATCGCTTGGT\n+>Am12_1/1_1.000_120\n+ATAAAGTGGGCCATACAAAGTGAGACCTTACACATATATGAATGTCTAAATTGTCCTATGTTGTCCCATTTAACATGTTTAGTTTGTGGTATTTTTCAAACAAATATAACATGGGGTTTG\n+>Am13_1/1_1.000_264\n+ACAACTCCTCCAATAGTACTACCAGCTTGTCAGGGTGAACCAGATGGTAATGCACCTGATCCTGACTCGTGCTCACGATATGTAGTATGTCTCAATCAGGAACCGGTTAATGACTATCCATGTGATCCAAGTACCTTCTTCAACGACCTACCCGAGTACAGGGAATGTACAGACCCAGACCTACTGAGCAATGAGCGATATTTTGAGTGTTTTGGAATCACAAAGCGACCTACTGCAGCCATTGAATCTACTTCAGTAGCCCAA\n+>Am14_1/1_1.000_153\n+TACTTTCCTGAAATTAGTTCTAATGGTTTCATTGTGATGACAAAGTTTAATATGTCAAGCATAATAAACTTGATTGTGTTTTTCCACCTCAGCAGTCATTTATACATTTTATTGAATGTAGAGGGTGTTGAGACATTCAGTGTTGTTATACTT\n+>Am15_1/1_1.000_241\n+AAAACTACCATTTTGTATTCCACCACTGACATGGATAGCCCCAAGCCACCCACCCATACCATATCAAGGTTTGTGGGTAGAGGAATGGACAACAGTGTATATCTAATTCTAGGAGTTGTATTTCTGGTGGTGATTGTTGTGGTTGTTACAGTTATTCTGTTTATCAGTTTTAACAGAAGGAAAAAGAACAGCGAGTCTTCATCATCAAATCTTATATGCACCAGTAAAAATTATCCCCAAG\n+>Am16_1/1_1.000_298\n+CATTTTTTTTATTTTTCAACTGGTACTCATTATCCAGGAACAGTACT
ACTCAAGTACCAAAATATCAAAGAAACACAATG'..b'ACATCCAGA\n+>Am112_1/1_1.000_195\n+TACCTTGTCCTGAGGGGGCGACATACGCGAGGTCAACACGCCCGGGCCGACCATCACTCCGAGACCACATTCACCTCTCGTGACACAGGTTCACTAGATCGTTTTGATATGCAAAGTATTTATCTCGCACATAACGATGACATACTGATCGAATTTTGTCACAGAAAACACACATGTACCAAAAATGATCACAAA\n+>Am113_1/1_1.000_362\n+AATGTGTTCACGAGCCCCGGGGCCCTAATACCCTCTACATGCCTGTCCCCGTTTGGTACAATGGGCGACTCATTTTGTGCCCTACCGCCCTCAGAATCACGCTGGAACGGTATGTCACAAATGTCTCAGATGGCAACTGGAAATAGCTTGTTCGGCAAGCAAGGTTTTGGCCAAGGTTTCCCTGCCCATATGAACATGAACATGAACGGTCTGGGGGGTGCAGGAAATATGGGACTTGGAAATGGACTTTGTTCAACGCCTCCAGGCAATACTTCTATGTATTCACATCCCTATGGCGTCACATCTACGTGTGATACGTCACTAACCAATGGCTCAGTGACGTCATCAGTTGCCACTGGAAT\n+>Am114_1/1_1.000_255\n+GAAATAATGTCAAATTTCGAAAAAAGAAGAAAAAAAATACAAATGTTCATCTCACCAGAAGCTCGTAATTGTATACATGTAGACCTAGTTCATTTAATGAGACACATCATGTACCTGTATTTTTTTGGTGTATGGTATTTGAAAACAAAAAGAAAACAGTTTTTTATCAACATACATTGTATATATATTTATAATATGCATCTAGGAGAAACAGTTTGTTTACTGAAGAATAAATGTAAAATAGGTAGTGAAGGT\n+>Am115_1/1_1.000_261\n+CCCTCTGGTGATCACATGACTCTCTCCAGTGCTTCCAGCAGCACTATGCTGTTACCTCGTACCACCACCATGCCGATCTCGTGCTTCTCTCCACTCTTCGTCTCCTCCACGGCCTCGTCAATGACCAGGTTCATGAACGGGTCGAACCCTCGCAGCGTGCCGGTCACCAGACGGCTGCCATTCAGGCGCAAGGTCAGCCTCTTGTCCATGTACTTCTTCAACTCTGGCGGATGTGCTTTAATCTCCGAAAATCACCATGAG\n+>Am116_1/1_1.000_183\n+TATCAATTTATATTATCAATCTCACCATTAATTGAAACTACACACAAGTTGAGGTACAACAGATTTATATCTATCTACATATATCCACACCTGGATGATGAATCCTATTATAAAAACGTAATTACAGTAGATGTACTGTCATACATGTGGAATTGGGTTACATCAATTCTATCCAAAATAGTA\n+>Am117_1/1_1.000_300\n+ATTGAATTTATTGGAACGATGATGAATGATGTATGCAATGCCCCTGCCAACCAGTGTACCATATGTTCAAGAATGTTCTCAACTCAGACAGACTTGGTTCAGCACATATCAATCCATACAACAAACTCTAGGTGGCGTTGTGATCTTTGTGGTAGAGGATATACAAAAAGAGATGCCCTTGAAGGTCATATAAATGCCAGGCATACAAACACCCTTCAGTTTGCTTGTACAAAATGTGATTTGGCTTATGCATATAAATCTGCATTACAGAGACACATGAAATATAAACACCCTGACCCA\n+>Am118_1/1_1.000_279\n+AATGGCTTAAGAAGATCTGCTATGTCAAGTCTGCATGAAAGACGCAAACCTGGCCGAGAGTTTGTTACGTTTTTACTTGTTTGTAATATTGCTATGATGGGATTGAACACTTTTGAAGTACTGCGCTCTGATGCCAACCCTGTCTCATTAATATTTTATGGCAACTTAGCCTGGAATATTGTCACACATATTACTACGCCATTTGCTATTTTCTA
CAGGTTCCATTCTGTAGTATGTCTAGCTACAGTTTGGCAAGGCGCATATAAACTGAAATTCCAC\n+>Am119_1/1_1.000_263\n+CGTGGAGGACCAAAGACCTGGACTGTGACGAAAGGTCCACGCTGGATAATCGTTGATGCAGTGTCCAACAATGGTTTCATCCCTGGAGCGAATTTAATGTTCCAGTCAAAATCAACTGGTGACTACCACGAGGAAATGGATGGGCCAAGATTTCAAAAGTGGTTTCAAGAGCAGTTACTACCGAATTTGCCGCAAAGGGCTGTAGTTGTTATGGATAACGCCTCTTACCACAGTGTGGAAACTGATGATACAAAAATCCCTTC\n+>Am120_1/1_1.000_187\n+ACTATGGATGGGATTAGAAGTAACACTTTCTATGGACATTCTATGAAGGGAAATGCTTTTACAACTAAGGTGATCATGATGGATGGAGAAGTTAGGTTTTGGAAACTATTCAGCTTCTTATGGATAATTATGACCACTGATATTGCTTTAGGACAAGAGAGTTTTCAAAAAGCATCATTGGAATGTA\n+>Am121_1/1_1.000_180\n+CAAGAATCTGTGACTGGTAAATTCTGTAATACAAATGTAGTAGAGTGTTATTGTATTCTTTGTAATTCTGGTGCTATAGAACATGTATTTCACTTTCTTTTTGATCGTTCCATTTATCAAAATGAAAGAATTATTTTTTACAGAGTCAACTATGTCCAGATTTTAACATTTTTTAGTAAC\n+>Am122_1/1_1.000_276\n+TTTACATTTTTAATAGCTAACAAATGTCACAAATTCATAAGTTTAACAAGCAAGGTATGTTTCCTCTATGAAGCTAGGAAACACCCCCAAAGTGGTCATTTTTGCTTAAAAGAATGGTACCTTATATTCCATTTGACATCTTTTAAACCTACAAAGAAATGTGTAAATGAAGTAATAGGATGTGGGATCCAGTCCATTAGTCATTTAGACCTTTATCACATGTTTATGTCAGTTGATATGTCAATGAACATTAAACAACTGCTCATGAATACTCTG\n+>Am123_1/1_1.000_144\n+TGTGCATTTTCTGTGTTCACAAATGGTTTTCTTGGTCAATGTTTCCAAGATTTGATCATCCACAAAAATGATCATGTTTCAATTTTATATTTGACAATTATTTTCACTCGGTCCATTCATATTAAAAGGCAAAAACCGAAACCA\n+>Am124_1/1_1.000_165\n+CATACATTTGTTAATTTACCAGAGCAATTTCACAAAGATTCCATGTCCAATTTAGTAAGTATTTTTCTGAATTTCAATGTATTACATATTTATGACCATACATTTTTTTACCAAGGCACTCAAACTCAGTTCATCACTCAAAATAGAGAAGGTAACAAACAAACC\n+>Am125_1/1_1.000_210\n+ATTATACATTGTAAAGTATTTTGGAAGGGCAGTGTACATGCAATGTTATTACATAGTCTATATTTTAATCACATGTTGTTAAAAGTAAAGTTGCAGATAGTAAATAGTGTCCCTGCTTATCTTGTGCACATAACAAAATCATATCTGACCTGTTTTATCTACATAATTTTGATGAATGCAAATAACACCTTTATCATTGACCCCCGGCAT\n+>Am126_1/1_1.000_237\n+AATGGTTTCAAATGGGAAAAGGACAGCAATTCCTTTTTCTCCTTAGCTATGAATAGTCCAGGTATTAAGCAAAAAATCGCAGAACTACGCCTAGCGAAATTGGATAATCAAGAAATCGATATCAACAAATATTATCAACAGATAGTTGATATCATTATTGAATCAGCTAACTCTGTTCTAAAGAAAAAAAAATCCAACACACATAAAAAAAAAACGAAAATGGTCCGACCCGAATTG\n+>Am127_1/1_1.000_108\n+TGGGGTCCTCATCCATCCGTTCCCACCCACTTAATTCACT
TACATTTATTTCAGCAGATTTCCCATTCCCTTAGGACCTCATCCATATCCAGGGCTCCTGATGCCTGG\n'
b
diff -r 000000000000 -r d33ad52f59bc test-data/output_filterassemblies/ApApomp_trinity.fasta
--- /dev/null Thu Jan 01 00:00:00 1970 +0000
+++ b/test-data/output_filterassemblies/ApApomp_trinity.fasta Fri Feb 01 10:25:10 2019 -0500
b
b'@@ -0,0 +1,216 @@\n+>Ap1_1/1_1.000_168\n+GGTCGCCTTATAAAAACCAATCCGAAACAGTTTTCCTTTGAAACGTGCCAAAAACCAAAAACATACTTCAAATCTTCCAGTGTCTGTTATAAAGGGGTGAGCGTAGAGAGGGCACTTGTGAGATTGGTGTCTGGGTTAAAGATTTTGCCAAAAAGCGATTGCTTGGTT\n+>Ap2_1/1_1.000_174\n+ATACTCAGGCACACAGCATTTGTCGTACTAGGCGAGAGAGAGAGAGGAACGACTAATTGCAACCACGATTACGTTACATTTGTTTACAAACCAAACGTACTGGCGTCGAAGATAATTAAGAGGAAGCTGACTGAATGCGATTGGCGTTGGTCTACGGGTTTGAGTTCTATTATA\n+>Ap3_1/1_1.000_546\n+GCCATGCAGTACACTGGACTTCTGTTATTCTGTTTGTTTGCCTTGACGGCAGCCAAACCCGCGGAAGACCTTCAAATGCTCATCCGAGCCCTGCTCCATGAAATAGAAGAGGAAGGTGAACTCCAAGAGCGAGGCATTGGCGCCGTGAAGTATGGTGGAACGAACGTTGGAGAAGACTACGTCGAGGTGAAGGTGATCAGGAACATGGAGGAAGTGAAGGCCGACCAGAAGAGCCACAAGCCACTCTACTCTCTTATATACGGCAAAGGAACCCACGATCCGAATTCCTCTCAACATTCGCTTACTTCCTGGACCTGGAGCCAACTGGATAAGTGTCAGAACGGTGCAGAGGGATGTTTCATGATCAGAAATCTGAAGCCAAACACCGAATACTGGTTCCAATTAGAAGTTCAGATGTGGATCAATGGAGCATATGAATACATCGAGAGCAGGAAGGATGTTGAACAGATCAGGACGAAGGGAAGACAGGAGAACGCACCATGGATGTCTTCAAAAAGTTACAAACCTGACGCAGACATTCGTACC\n+>Ap4_1/1_1.000_294\n+ATTTCTGAGGGGGCGCCACCAGTTGTCGTAGTTTCGATCACCAGGCAGCCTCGGCGCGAGTCAGTTCCTTGCTCCGACGACTTGGTTCAATCCATCCACCTCGTCGTTGAAGATGGCTACAAACGAGCAACCCGGCCGTCACCACTCATCAGAGCAGGACGACGGACAATTATTCGATGGCACAGGGCAGTGGGAAGACGACTATCTGTTTATAGCATGGCAGTGCGCAGAAGGCTTCGGAGGTGTGCTGGCTTTGACATCGACAGGGTTAAGCCATTGGCCTCACCAGGCCAA\n+>Ap5_1/1_1.000_271\n+AATCTACTGACAGATACCTGGAACGAGATGCAGGTCAAGTGGTCGTGTTGTGGTGTGGATGGCTACTCCGACTGGACGCAAGCTGAAGGTCTGGCCACGGGTCACTACGTGCCGCAGTCCTGCTGTCAGAACACGATGAGTACAAGCTGCACGTCACAGAACAACCCGACACTGTGGTGGCAAAAGGGCTGTCTCGGAGAGCTGAAGTACCGCCTGAAGGAGAACCTGTACATCATCGGAGTGATTGGCATCTCCGTCGGCGTGGTGCAGG\n+>Ap6_1/1_1.000_390\n+GAGAACGTGTTAGCTTCACACTGTCCGGTTGGCTTGTCCTCCACACGCTACTGGCAAAGCGAAATGGCTGACCTTCCACCTGGAGATGCTGAGAGAGGAAAGAAGATATTTATCCAGAGATGTGCCCACTGCCACTCTGTGGAAGCTGGTGGAAAACACAAACAAGGACCAAACCTTCATGGCTTCATTGGTCGTAAAACAGGACAAGCTCCTGGCTATACCTTTACAGAGGCAAACCTAAAGAAAGGTATTATTTGGGACAAGGAAACCCTTGACATCTACTTAGAGAACCCAAAGAAGTACATACCTGGAACAAAGATGATCTTTCCAGGTCTTAAAAAGAAGGCAGACAGAGCTGATCTGATTGCTTACTTAGAGGAATCC
ACAAAA\n+>Ap7_1/1_1.000_421\n+TTCGTAATGAATCTTTTTGACTGGTATTCCGCAGGATACTCAATAATTATTGTCGCATTCTTCGAAGTTATCGCCATTTCTTGGATATACGGTCTCCAACGGTTCAAGAAGGACATTCAGATGATGGTTGGCAAGGGGCGATGGATCAATGCTAGTTTCTATTACTACTGGTATCCTACTTGGTTTATCATCAGTCCAGCTTTGATGCTGTACATCCTGGTTACCATGAGCATGCAGTTCGCACCAATAACGTACGGGGGTAGCATCAGCTACCCAAGCTACGCTGACGGCATTGGCTTTCTGATGGTTGGCCTCGCCTTGATCTACCTCCCAGTTCTCGCCATGATTGAATATTGCAAAGCTCATGGTTTTTTCAGCACGATGCAAAAGATCCTGCGACCGAAGCCTGATTGGGGTCCGG\n+>Ap8_1/1_1.000_417\n+GCGAAAACTGGTTTTAACACAAATAATTGTTACAGTACCAGGTTTCGGAACACGTTTGCATATAACCAGCGAGAGTGGTGCTCAGTTCTGTTATGTATGACAGTCCTTCTCCTCAACATGCAACGGAAGCGAGCACTTCCATCATCACATTTGTCAATAAATACTGCATGGTACTCCGGCCAGGGTGAACAGGAAGAAAGACTGATTGTCAGCACTCGTGCATGCTCACCAACACACACACACACATCCTCACATGTATGCACACGCACACGCAGGCCAAAACACACTAACACGCACACAGGCTCAAGAATGTTTATTAGACATAGTAGTAGTAGTAGTTGTCATTCAACTCGAACAACGAGTCGCCTATCACTAGGCATCATCTTTCTGTGGGCAAACCGTGGACCGATCAGACAG\n+>Ap9_1/1_1.000_470\n+TTGGAAGAAGAAATAGAAGAATTAATGCATGAGAATGATGATGAAGATGGAGTTGAAGTTGAAAAATCAAAAGATAAACATGAAAGTGTGGAAAGGGCTGAGAAGAGAGGCAGCAATAAAAATGATGTAAAACATGATGAGAAGGATAGAAGTAAAGACAACAAAGAAAATGAGTTAGGTCAGATTAAGGAAGTAGAAGATATGGGTCCTAGTGTTGATAGGAGTGAGAATGAACGTGAAGCAGTTGGGAAGGGAATCAAATCAGAACAGGAAGGGTCTGGTTCTAAAGCCAACAAACACCAGGTATCACCAACAAATCAGGGTTGTTCTCACACAACCAATGAGAGTGAGAAGAAAGAACCCTCACACCCTAGGAGTCAGTCTCAACAGGACAGTGATGATGATGATGGGGAGGGTGAGACATTGCATGAGAAGAGTTCATCTGAAGGGGATGATGAAGGGAATCAAAT\n+>Ap10_1/1_1.000_338\n+CCATACTCAGCCGCCAAGACCACGGCCCAGGCTGCCACAGATGACCTGAAGAGACGTCAGGAAGAACTGGAGAGGAAGGCTGAGGAACTACAGAGAAAGGAACAGGAATTACAGAGAAACATGGGACACCAAGCCAGGGTGAACAACTTCCCACCACTGCCTGAGAAATGCTGTGTCCAGCCTTGCTTCTATCAAGATTTTGAGCTTGACATCCCATTGGAATTCCAAAGAATTGTAAAAACAGTGTATTATGTGTGGATAGCCTACATATGTCTGTTGATTCTGAATGTACTGGGAACACTGGCCTACTTCATAGCTGCGTCCAAGGCAGGTCATGG\n+>Ap11_1/1_1.000_406\n+GAGGTACCCAGTGTGGCTGTACCAGGTGTTGTTTCAACCGTGGTACAGGATTCAGCACACAAGATCTTCATTGGTGGTCTACCAAACTACTTGAATGAAGACCAGGTTAAGGAACTGCTGACATCATTTGGTCCCCTGAAGGCCTTTAACTTGGTGAAAGATAGTGCAACTGGACTGTCGAAGGGTTATGCATTCTGTGAATATCTTGATCCTTCCATAACTGATC
AGGCCTGTGCTGGCTTAAATGGA'..b'ACGCTAGATGCCCTTCAGAATGACATTGACACACTAGAAGCTGAGAAAGCCG\n+>Ap94_1/1_1.000_282\n+TGGATTGGTGACAATAAAATTGCTGCTATTGGTGTTCATGGTAGCCGGTATGTGACCAGCCATGGCTTGGCACTGAACTGTAACACGGATCTGTCTTGGTTTGATCATATCGTTCCTTGTGGATTGGAAGGGAAAGGAGTCACGTCACTGAGCAAAGAAACCGGTCGCACTGTGACCATCGAGGACGCAACGAAACCATTTATTGAATCGTTTGCTGAACACTTCCACTGCACGCTTGAAGATAAAGACACTTCATTGATCTATGAAAAAATACAGAAAACG\n+>Ap95_1/1_1.000_183\n+TCACCTATAGCATCTCTAGGACATACCATGCTTCACTGTGACACTTGGCAGGCCTTCTCATCACAAGTCACTCGGCTATTACATCACACACTACAAACACAGATTTCACATTATAGCATGAACACTGATGTACAGCTTGGCCAGCTGAATAGCACGTCCAAGGCAAGTGAGTCAGGATTGCTT\n+>Ap96_1/1_1.000_156\n+ATGTTTTGTTTGTGGAAAAATAACATCCACTCATTTTGCATTGTACACCCATTGTGCAAGATTGTCTCATTCTGTATTTATATATGTCGTCTGTATGTTATATGTCAGGCTGCCATTGTAAGCAATATCCCGAAGTTGTCATTTTGCCGTAGTTTA\n+>Ap97_1/1_1.000_156\n+ACAGATGAGTTCAGTCGAGGAGGCGGTCCATGCACTGATGGCCCTTCACAACATAGAGCTGGGCAACTCGAGCCACCTTCGTGTGTCATTCACCAAATCAGTGATCTAATATGTTTGGGTCTCCACACTCCATCTCTCAAACATTCCACCCACAAC\n+>Ap98_1/1_1.000_273\n+ATTGTTAAAATAAATGAGGCTGAAAACCAAGTAGTAGTAGATATTGGTAGAAAAAATGAGGCTATTATGTCTCTTGACCAGATAAGAGATGAAGATGGCAATATTATGTTTAATATCGGAGATACAATTCCAGTTGTTATTACAAAAAGAAATGGAGAAAGAGTTAGTATCTCATATGAGTTAGCAGAAAAGAGAATAGCACTATCTGAGTTTATCGATGAGTATGATGATGAAGAAGAGTATATAGTAGAGGGTGTAATTGTTCGTAAAAAT\n+>Ap99_1/1_1.000_210\n+GACACTCCCAGTCAGATGTCAGACAGGACTGACAGTGATGAAGCTTATGATTTAATTACAACAGATGAAGTAATGGAATCATTATCTGAGCCCGTGCCAGACCCAAATTTGGATTTTCATCCCACTATCACCCTGGAACAGATTGAGTCAGGTGTATGCTTGTGTCCCCTAGAGCCATGGGTCAGTGCTGGTAGATTGTATGCTGTGCCT\n+>Ap100_1/1_1.000_246\n+TCATGCAATCCACATTGTGAACACTGCAATTTACTTGTGCTCAACACATCTGCCTTTAAAGCAACCAGCATAAAAACTGCACTTCAAGCATGCAACAACAACAATATGGAAGGAGACTTTGCAATAATTGTGCAAGTCACAGCAATTTCGTTCTGCATTCATTTGAAGGTTTGCTGTCACAGACATGAGCAAACTCACCAAGTAAACACTCCCAGTGGTACCATGACAAAGTCCACCTCTGATGTG\n+>Ap101_1/1_1.000_309\n+GTGTGTGTGTGTGTCTGTGCACGGTGTGTGTGTGTGTGTGCCACGTGCAAACTATGTACATGGTGCGTACCAAAAGAAAAACTTCTCAAACACAACGGTCCTCCTATAGACCACAACGACCCGACAACAAAACAAAACCTTGGTCATTTCATATCCAGAACGATTTGGAAGCTGAACTCGTCGCTTTCAAACTGTAACCATTCGCCTCGTAC
ACATAATCATTCGTCTCCGTCCTCGCCAGGAGAGTTCAAGTTTACAGTCAACAACGAAGATAAAGGAATATTTGTATGTCAGATAAAGGTTGAGCAA\n+>Ap102_1/1_1.000_382\n+ACAGATGAATATGATCCTCAGCGGCCAAATGACTATGAGAGTTACATCAAAATGCGTAAAGACCAAAGGCAGAGAGAACGTGAAGAGGAGAGGAAAAGAGAACTGGAGGAAAGGGAAAAGAGACGCCGTGAGCGACACAGAGATGAATATGACAGTGATGAGGATGATGAGTTTAACAGGAAAAGAAGAAGAAGCAGAAGGGATGATGATGATGACCACAGAAGAAGTTCGGAGCACAAAGCTAGAGGTGCTGCAATAGCTCCACCACAGTCACTGATTGAGTCCAGTAAGCCAGACCCAAAAGAAGTTTCTCTGCCTCAACCAGAGAACAAGCTAACCTTGAACACTGGAGAGTATGGTGGAGGATTCAGTGTTGGCAAAG\n+>Ap103_1/1_1.000_274\n+GACGATCTAAACATGGGTTCGTATTTAACGTTAGCGTCATCTATTTGTTTCCAGAATTCCGTCTCATCCTTAGGTGGCTTGAATGCAGTACGACGGAGGTCTTCCGATATATTTACGACGGATGAACTTGAAGCCAGGTTAGTTCCCGAACCAGAGCTCATCATTGTGGTTTCTTGTGCGTCGCTGGGTGGCAGTGATGTTGATAATTGTGAGTTATTCGACCTCACTCTTTGCGAAATTGATATCACTGAACCTGATACCACTGAACTTTGTG\n+>Ap104_1/1_1.000_215\n+AATGCCAAGGATCTCTCTCTGTCCAAGGAGCAGCGTGTGGAAATCCTCAGCGAGGTGATGGAGGACACCGGTTTCGGTCGGATTAAGGAGTTCAAGGAGGCGTACAGCGAGGCGCTGAAGGAGAGTGTCTCGCACAAGGACAACGACAGTGGCAAGGACGACGACCACAACGACAAGGAAAACATGGGTGACGACATGCTGCCGAATTCAGAGCC\n+>Ap105_1/1_1.000_215\n+TTTTTTTTTCTAAATTTTGTCCTCTTAATTTCCACGTTCTCAACCACCGGCACTGCGACAACGCTTAACTACGCCAATCCGTCGTTACAAGTGAAACCGAAACCAGAACCGAAACAACGGAACGAAGAAAACCCGACCTGGGGCGGTCTGCCGTCAGTGCTTCTTCTATTACTAAAATCGATCGTATTAATTAATGTGCGAATATTACAAACACA\n+>Ap106_1/1_1.000_219\n+CTTGCTTTTAAGGCCGTCAGAGCCCAACAAGTTGGTGTGAAGCCTGAAGACGTGGAAAAGGTTGAAAAAGGAGAACTGATCCATGACAGCATGGAAGAGCAAGATTCAGGGAGTGCACAGGACACAGCACAAGATGATATGAATGATGTCGATGAGGAAGATGAAGAAGCAGTTAAGCAGAAGAGGAAGGAGTCTAAAAACAAGAAGCGTAAAAAGAAG\n+>Ap107_1/1_1.000_158\n+ATATCAGCATTTAACGGTAATCGGACAACTGAGATAGCGGCTTGGAACCATAAATATCAGAAAACAGACAACAGAATGAATTACCTGACGACTCCACAGTATTACACTAACGTGAGTTATTGGTATCCTTATTCCGTACAAGGTGTCGCTGATCCAAC\n+>Ap108_1/1_1.000_314\n+CTAGATGACATGGACATCTTTAACTCTCCTCCACTTGGCATCTTCAGTGTAATCAGAAAGATGCCTGATGCAGCAGAGCTGGAGAAGACAATGTCATTGTATGATCGCATACAGAGGGATTTAGAGTTAGCTGAAATGACTTATCCACCTCAAAATGCCTTTGAGGAATGGTCAAGATGGACAAAGGAGGGCAAGATGTGGATTTATCCTGTAGATAATGAACAAGGAATGGAAGAGGAAGCCAATGTTGGTTTCCAT
GAACATGTCTTCTTGGACCACATGCTGGAAGACTTCCCAAAACGTGGCCCTGTACG\n'
b
diff -r 000000000000 -r d33ad52f59bc test-data/output_filterassemblies/AsAsp1_trinity.fasta
--- /dev/null Thu Jan 01 00:00:00 1970 +0000
+++ b/test-data/output_filterassemblies/AsAsp1_trinity.fasta Fri Feb 01 10:25:10 2019 -0500
b
b'@@ -0,0 +1,866 @@\n+>As1_1/1_1.000_270\n+AGCATTGTCCGTGTTGCGCGGGTCGTCGACGTAACCTCGGTACACCTCAGCGTGCCCGGCCATCTGGTGCGTGAGCCGCTTGAAGACGACTCTCGCCGGCGGCTGCTTGCTGTCCAGCGTCATGCTCTCGAACGCCTTGATCCAGGACTCCTTGACACTGGTCACGGGGTCCTTGCCGCTCCGCCCGAACGCCTGCACGAGGGGGGGGGGGTAGGAAAAATAAGCACATGGATTATGGGAATGTATGCACGATATAATTATTTATTTGAT\n+>As2_1/1_1.000_225\n+ATCACGCCCCCTGTCGTGGACAACAGGCTAGCCCATTGTAATGGGAAATCTACAGTGGTAAACAAACTGATATACAATATAACCAATATGTATATATATATAACAGATATGGAGACTGATCATAAAATCAACGATTCACTTTTAGGATTAGTCATGTTTGTTGGAGTCAAATACTTGTGTATAAATTATCATTGCGATCAATCAATTCAGCCTCATTTCAGCGAC\n+>As3_1/1_1.000_596\n+TGTGCGTCGGTGCCGGACTGCAGGCTGTTGTTTGTCGGGAGCACCTCCGGAGTCATCAGTGTCATCAACACCAAGTTCAACCAGAGCAAGCAAAGCCACCTGCAGGTGTTCGGCCACAAAACCTGCCTGTACGGCCATTCCGGGGCCGTCACAGCCTTCTCCGTGTGCAGTCCCTTCAGCATCCTCGTGTCGGCCAGCAGGGACCGGTCGCTCATCATATGGGACCTCAACAGGCTTTCCTACGTGCGATCGATCACGGACCACCGCAACCCTGTACACACTGTTGCCGCTAGCGACACCCTGGGTGACATAGCTTCCGTTAGCCATACAGACCACGGGAGCTGCCTGATGCTGCACACCATCAACGGGGAACATGTCAAAAGTATCGAGTGCGAGGAGCTGGTCCTGTGCTTGACGTTCTCCACGGCCCCCGAGGGCCGATCGGTCAACGTCATCGCCGGAGGACTGAGCAGTGGCACCATACGGTTGTGGAGTTCCTGGGACCTCAATCCAGTGCGAGATATTTGCTCAGACAAATTCACCCACCCCATTGTGAGCGTGGTGTTCACACACGACTGCAAGAGACTGTTCGCCGA\n+>As4_1/1_1.000_546\n+ACACCCGACAGAAACTTCTCGAGAAGGGGATTGGAGATTCCATGGTCTTGGAGTCTGCTGATGTCGTCACCGACGTTGCCATTACCAACAAGGACGATGAAGGCCAGATCAGATGGCCCAGCTAAGCTTGGGTCAAGGAGCGCCATCAGGTGTCCATGTCCCTTGTGCGGTAGATATATCTATCGGGGTGAGATGCTCATAGTTGTGTCCCGATGTTGTTCCATTAGACTGACTTCTACTGGAGGACCACAAACTGTGTGCGAGCCTGGGTTACCTCCATTATATGTTGGTGGCTTCAGGTTTGCGATGTCTTTGACTTTCTCGATTTCGTGTGTTCCGCCCAACCTAGACTGTGACACTGTAGCACGCAAATGGACACTGTTTGAAGATGCGCCAACGGGCACAACGAATGATTTGTACGGGGCAAAAGTCGGTTTCTGCTGCAGTTCTTCATATATGTCGGTAGAATCCAACGTTTTCGTTTCTTCAAATGAGTCATGTTGGTCGACTCGAACCCGCAGTGTAATGCTCAGAGGTTGTCTTAAT\n+>As5_1/1_1.000_240\n+TTTGTTATTGTCGTATCTGAAGCCATTGTTTGGATTTATAGCTTAGATGTCAAATTAGTCGCCCTGTCTGATCTGTTTACTATTGTTTGTTATTGTTGCCATGGTTACAAAAACTACTCGATGGTGCTGCTAACAAGTGTGAAAACTGTGCTGTGTACAAAGTTATATATATCCCAGTTACCCGGACCCTCCTGCTTATCAATACAGCCTATAGCCGAAGTTTC
CTGGTTGCTAAAGTTG\n+>As6_1/1_1.000_276\n+AGAGTCGCTGGCGCTTTACTGCCGACAGCTCAGGAAGCTGAGTCTCAAGGCGTGCGAGGCCGTCACCGACCGCGGTCTAATGCTGCTGGCCCACAAGTGCCGGGGGCTGCAGCAGCTCAACGTACAACACTGCCAGCTGACCGTGGACACCTACAGGGCCCTCAAACGATGCTGCAAGCGCTGTATCATCGAGCACACAAACCCGGGCTTCTACTGATGTCACAACGGCCACGAGGTCACTGGAATGACTTCATCCGTGTGAATAAAATAAACCAT\n+>As7_1/1_1.000_352\n+TTCGAGATTTTTTTAGAAATGCAAATTTCGCGAAACAAATACATCGCTAAAAATTATACAATTACAGTAGATTGTTTTCTATTGGTGTGCAAAGATTACAATCAAACACAATTATACAAGGTTTCAGAAAGACTCGGCATGTGTGCACACAGAATACCAACCACGGTGGCAAAATGCAACTCAACAATCAATATAATGGAGAGAAAAAACAAACAGGCTACGAAACATTCCTATATTACAGGAAGAAAATACCACAATGAAAACCTCCATAAGATTATAGCCATGTGTATCCATAGAAAAGCAGGAGTGGAAGCCATATTACAGTGGTCTGCTACACGTCATGGACGATGGA\n+>As8_1/1_1.000_255\n+ACCGCCAACAAGGCGCTGGACAAGGCCCGCGCCAAAAACAAGGACGTGGCCCAGGCTGAATCTGCCCAACAGACGTCGAGTACGAAATTTGATAAGATATCTGACACAGCAAAGCAAGAACTGACTGACTTCAAAGCCAGACGAATACAGCACTTCCGGAAAAACTTAGTGGACATAGCCGAACTAGAACTGAAACATGCTAGGGCCCAAGTTCAGCTTTTACGAAATGTCATCAGCTCAATAAAGGAGGACTCC\n+>As9_1/1_1.000_267\n+GGCCAACTCAACCATGTCGAGGTAGCAGCGTACCTACACTCCGAAGATCGCAAACGACACACCGTGGAAGAAGACCTAGAGGAATATGATAGACTGGCTGAGACATTGATGAGTTTTGAGGATACCAATAACGATGGGCTAGTTACACAGGCGGAATATGGAAGATCAGTTTATCCTGAGCTAAAGAAATTTGTCGAAACGGTGGCCGCAGCAGATCTGGAATCCGGTGGAATGTCCACTTTACCGCGTATCCCTGATGATCTGAAA\n+>As10_1/1_1.000_279\n+GGCGCAGGCGTTGCTGGTGTTGGCGCAGGCGTTGCTGGTGTAGGAGCAGGCGTCGCTGGTGTAGGCGCTGGTGTTGGCGTGGATGGCGTCGGTGGCATGGGGGTTGGTGTCGGCGTTGGCGCGGCAATCGTGGAGGTCGTGAAGGCCGGAGTGGTCTGGGCAGACGTAAACTGCACCATTCCGATCAATTTTTTTGTCCTGAAGACTCGTAAGGAAATTGGCCTGTCAAGTCTTTTCTTTCAAACGAGTCTGAAAGAAATAAGACATAATTTTGAAAGA\n+>As11_1/1_1.000_183\n+GCAAACTTAAATTTCTTGAAACTGAACCCGAACACATCAGTTGAGACCTATATATATCACGCACTTAGTATTACAAAAGATATTAAGCGCCGCTGTACAAACATAATACAGAGCATAAGGCGCCTACGATTGTTCCACACGTTATTTACCATTGAACTTACAAATAACTTAGGCTTTGCCAAT\n+>As12_1/1_1.000_450\n+CGAACACCACAGCGCCCTCTAGTGAACCTGGAGCAGGTCCGGCTTGACTCGGAGACTGTACATTTTGTTGTAGTAGATCATGTTCTCTTCGATGGCCTGCAGCACGTGCTTGGGCAGGTTGGGCATCACGTTGGGACTCTTGGGCTTGGTGGCCGAGGGCTGGAAGGTCTTGGATGTGAGCACGCCCTCGAACCAGGGCAT
CCACTCTTGGAACATCTGCAGGTCC'..b'TGGTGCTCGGGACGATCACGTGGTCACATATGTAATTACATCATTTGGTCTTCTCTTGGTCGATTGTTTCTTTTGTGGGTAACGTGTTCTTCTCCTGGGTTTCGGTTTTCTTCAGTTTGGTCTTGTCAAACTGCGATACCTCGTCCATATCAGGCTTGTCACCCATGT\n+>As424_1/1_1.000_708\n+CTGATCGACTCGCAGAAAGGCGATATTCCTGTGGCTGTCTTGAGGCCGTCCGTCATCCTGTCCTCGGTGAAAGAACCCATTCCAGGGTGGATGGATGGTTTATCGGGTGCAAACGCCGCTTCTGCTTTGCAAGGCCAAGGTCTACTCAGAATCATGTTGGGACGCAACGCCAACCTGGCACAAATCATTCCTGTCGACATTGTCGCCAACACGTCCATCGTCGCTGGATGGAAACTAGCCAAGGATAAACCAAACACTACATTCGTCGTCAACATCACATCAGGAAATGTTAATCCCATTCTTTGGGGAGATGTCTTTGGATATGGAGCCGTCCAACAGCACAAGTACCCGTCCAAGAGAGTGATCCGCCCTCCAGTACACGTCATGTTCACATCTAGTCTATGGTGGAGACGATTCCTGACTGTCTTTGATCACTATGTTCCTGGCATGTTCTTCGATATATGCACACTGTTGACAGGACGAATGCCGACGTACTTGTTAAGTCTTAAAGGCGTGCTGCGATTCTCATACGCCACAGAGTACTTCTCATATGGCCACTGGAACTTCGAACAAACGAACATCAACGCTTTATGTGAAGATATGACACACTACGAAAGGAAGGTGTTCAACTGCGATGTACGCACTGTGGTGTGGAAAGATTTCGTAGCGGACTGGTGGTTTGGTACCAAGCGCAGATCGGAAGAGCAC\n+>As425_1/1_1.000_363\n+TACAAGGATTTTTATAGAACAATCAAGATGAAGATTTTTGTCTACCTTTCGTTGATGTGTCTTCTGCTTTGCATAATAGTGACGCCTGTCATCTCCGGCTCGTCGTTACCAAGGCGACGCGAGACGCTGGCGCTGTTCCGGGGGTTCCTCTGTTACCTGAAGGGAGAGTCGTTACAAGACTGCCGAGAAGATGAAGACATCACGAATGTTATAAACAGCATAACGGGAGATATTCGGGAGAACCTTGGCGATGAACGACCTGTCACGCTGTCCAAGGAGCCTTCAGTACTGCGCTCCGACTTCCCTCGCCCGCCCCAGGGCACCCGCAAACGGGATGCCTTCTACAGCGACTGGAAGCGGAAG\n+>As426_1/1_1.000_189\n+ATGAAGATATTTGGGTTCTGTATAGTCTGGTCAATCTGTGAGATTTTATGGCTCAACCCACCACAAATTGCAACACAATCTTTTAGTGTTTTTTCATATCATAAAGGTGTCCTTATGAACATACTAAGAATCACGGAAAATCTACGTAGAAGAAGTTCACTTTTTTGCCAAAATGCAAGATGGCCGCCA\n+>As427_1/1_1.000_301\n+CGTTTGATCTGTCAGACGATCTTGTTCTCATCCGGAACTGTTTTGCTAATCTCGCAGATATATCCGGTGAATGAGCGTTTATCTTCATCCACCACTCCCACATATCCGTTTCGTGGCAACTTCGTTGATCCCCGGAGTTTGAGAACGACGATGGCCACTATAGCCAAAGCCAGGCCGCTTGTTATACCGGCGACAACAGACACGTGTAATATCCAGGCAGGATATCCGTTGAGGCCTGGTGACGTCCTGTTGGAATCCCCAACGACACCTGTGAGATTTATGCCGACCAGTGGACTACTCG\n+>As428_1/1_1.000_132\n+CATCTTGAAATAAATAGTCTAATCATGTTACCTGACCAAATAAGCAGAGTTGTTACTTACACTGTTTCAATATTGAATGTGCAGTGTTATGAGAATGCTGATAGATACGTG
TGGGTACTTATTGATCTCTCG\n+>As429_1/1_1.000_342\n+ACCTGTTTTCAAATGCCAAAAAAATACATTGTGAAAATAGTTGCTACTTTCTTAATAAGTAATTATTCTATCGATGCATCAACACAAGTCCTCAATGGTATGTACGGACATACATCATGTACATACGTTCACAAATATCACAATACTGGGTATGTTCCATGCAGACCAATGTCCAAGACGAGATTGTTGCCCCGTGGATCCGAAATGTCCCCGTCGATATATCGATTACCTGTAGTTTTCTACCGATATCCCATGAAGAGGGATGTAATAACATTCAGTATTCTGTCGAATCGGCTACCATACCATGGGTATGTCTATTTGATAGTTAACGCTGTATACATG\n+>As430_1/1_1.000_612\n+AGCGTCTTCAGCAGCGGGTTTTCCTCCCCTATCTCGGGCCCTGGGTCACCTACATGTAGCGATGACCACACGGCGGATGCATCGGGACTCCTGTCAGGACGTCACCTACCCTCCGAAGACAATCCGCACGCATCTGCCGATGAAGAGAAGCAGGTATCAGATAGTGAACAGGTCCATATGAAAGAAGATTCTGGAATTCTGTCACCGATTCATTCTTCTAGTCGTGGTGTTGATATTGATGAACACATGGGCGCCTGTCAAACTCCCCAATTCGCTATAGACGGAACAGATTTGATCTCGCACGATTCGCCGCCAATATCAAAGTCACCTCATTTTTCTATGTCTTCTCCAGTTTCCCCAGTCGAGCATGTTCATCTCGGCTCCTCAGGCTCCGAACATTCGGGAACTTCGTCGACGTCCAGCTTGGAGCACACTTCAATCATAGCGTGCCCCAAAAAGCGACTGCAATCAACGTTCATGGAGGACAAGGACCGTGAATATGTGTCCAGTGAAAAACCTGCAGGGGATTCGCATTTCGACAGCGGCTTCGCAGACAAAAATGTCACAAGTGACTTGGAAGTTACGGGTTTGATCCAGGCGTCCAAGATCGAA\n+>As431_1/1_1.000_577\n+TGGCTGCAGGGGATCGGCCAGTGGCTCGGGACGGCGTGCGCCGCCGTGATGTTCGTGCCGCTTCTCTACCCGCTCCGGCTGACCAGCTCCTACGAGTATCTGGAGATGAGGTTCCAGAGTCGAACTGTGAGGCTGTGCGGTACGTTACTCCTGGTTATAGGACAGCTGTCATACATGGGTGTATGCATCTACTCGCCGGCAACAGCTCTGGAAGCAGTTACCGGGTTTCCTGAAACGGCCAGTATTGTTCTCGGCTCAGTCGTTGCTGGTATTTACTCCTTACTGGGAGGAATGAAAGCCTCAATCTGGATCGGAGCCGGTCAAGCTATTATCATGTTGTTCGGAACACTCGTAGCCATTATAAAGCCCTGTATAGATCACCCCGATGGCATCGCCGGTCTATGGGAAATTAACGAAGATACCCGACGACTGGACATGTGGAACTTTGACCCGAACCCCCTGATCCGCCACACGTTCTGGACTCTGGTGGTGGGTAACTTTGTGACGTGGCTCAACACATACGGTCCCAACCAGGCGACCGTTCAGCGCTACTGCTCGGTGACCAGCATGAGGAAAG\n+>As432_1/1_1.000_183\n+CCAGATCAGCATGCTCCTCTGCATGTTATTGTACGCACGTTTTGTAAGTGCACACATACAACAATACCGTCACTGTTACTCAGCATATATAAAATAATTTGTCCGAAGTTATTAATCTATCGAATAAATTCAATCAAAATGCGCACAGTTATATATTTGAATACTTCTAGGTTAAACAGATTA\n+>As433_1/1_1.000_183\n+GACATCCTTCATCCCTCGGCTTTCCGACTAGCAACAGGTAGATTTTCAGTTGTCACGAGACTTTCAGGGCTAGTGACGATAGTGTTCGGTTTATCCATGTATCCAGCTTACTTCCACAGCTCCTGCGAGCGGTCG
ACATTAGCACAACATGACGCCTGGTGTGCCTTCTCGAATCATCCTCAC\n'