Repository 'cherry_pick_fasta'
hg clone https://toolshed.g2.bx.psu.edu/repos/artbio/cherry_pick_fasta

Changeset 1:ea8fde9c6f82 (2019-10-09)
Previous changeset 0:e3aee4ba49c6 (2017-10-15) Next changeset 2:321cad0eb507 (2021-03-16)
Commit message:
"planemo upload for repository https://github.com/ARTbio/tools-artbio/tree/master/tools/cherry_pick_fasta commit f527add7e7bace30b8bc67524ff1da1bf920ec29"
modified:
cherry_pick_fasta.py
cherry_pick_fasta.xml
test-data/input.fa
added:
test-data/output_termlist.fa
test-data/output_termlist_without.fa
test-data/output_without.fa
test-data/termlist.txt
b
diff -r e3aee4ba49c6 -r ea8fde9c6f82 cherry_pick_fasta.py
--- a/cherry_pick_fasta.py Sun Oct 15 13:26:45 2017 -0400
+++ b/cherry_pick_fasta.py Wed Oct 09 18:48:17 2019 -0400
[
@@ -12,27 +12,78 @@
         description="Cherry pick fasta sequences")
     the_parser.add_argument('--input', action="store", type=str,
                             help="input fasta file")
+    the_parser.add_argument('--searchfor', action="store", type=str,
+                            help="with, without, or withlist, withoutlist")
     the_parser.add_argument('--query-string', dest="query_string",
                             action="store", type=str,
-                            help="header containing the string will be\
-                                  extracted as well as the corresponding\
-                                  sequence")
+                            help="headers containing the string will be \
+                                  extracted or excluded as well as the \
+                                  corresponding sequence")
+    the_parser.add_argument('--query-file', dest="query_file",
+                            action="store", type=str,
+                            help="headers containing any of the strings provided in the \
+                                  text file (1 string per line) will be \
+                                  extracted or excluded as well as the \
+                                  corresponding sequence")
+
     the_parser.add_argument(
         '--output', action="store", type=str, help="output fasta file")
     args = the_parser.parse_args()
     return args
 
 
+def parse_fasta_with(query, FastaListe):
+    """Return the fasta records that contain at least one query string.
+
+    query -- a single search string, or a list of search strings
+    FastaListe -- list of fasta records, each one being the header line
+                  followed by the sequence lines, without the leading ">"
+
+    The substring test is applied to the whole record text. Records are
+    returned in input order, and a record is returned only once even when
+    several query strings match it.
+    """
+    if not isinstance(query, list):
+        query = [query]
+    # any() stops at the first matching term, so a record that matches
+    # several terms is not appended once per term.
+    return [sequence for sequence in FastaListe
+            if any(string in sequence for string in query)]
+
+
+def complement_fasta(fullfasta, subfasta):
+    """Return the records of fullfasta that are not present in subfasta.
+
+    The order of fullfasta is kept so that the written output is
+    reproducible; a plain set difference returns the records in
+    arbitrary order.
+    """
+    excluded = set(subfasta)
+    return [sequence for sequence in fullfasta if sequence not in excluded]
+
+
+def getquerylist(file):
+    """Return the search terms listed in a text file, one term per line.
+
+    Trailing whitespace is stripped from each line. Blank lines are
+    skipped: an empty term is a substring of every record and would
+    therefore match the whole fasta file.
+    """
+    # the context manager closes the file once the terms are read
+    with open(file, 'r') as handle:
+        stripped = (line.rstrip() for line in handle)
+        return [term for term in stripped if term]
+
+
 def __main__():
     """ main function """
     args = Parser()
-    search_term = args.query_string
+    searchterm = args.query_string
     CrudeFasta = open(args.input, "r").read()
     Output = open(args.output, "w")
-    FastaListe = CrudeFasta.split(">")
-    for sequence in FastaListe:
-        if search_term in sequence:
-            Output.write(">%s\n" % sequence.rstrip())
+    # [1:] drops whatever precedes the first ">" (an empty string when the
+    # file starts with a header). Each record keeps its own trailing
+    # newline, so joining the records with ">" restores the fasta layout.
+    # NOTE(review): when no record is selected, a lone ">" is still written.
+    FastaListe = CrudeFasta.split(">")[1:]
+    # single search term given with --query-string
+    if args.query_string:
+        if args.searchfor == 'with':
+            contList = parse_fasta_with(searchterm, FastaListe)
+            contFasta = ">%s" % ">".join(contList)
+            Output.write(contFasta)
+        elif args.searchfor == 'without':
+            notcontList = complement_fasta(FastaListe,
+                                           parse_fasta_with(searchterm,
+                                                            FastaListe))
+            notcontFasta = ">%s" % ">".join(notcontList)
+            Output.write(notcontFasta)
+    # list of search terms read from the --query-file text file
+    if args.query_file:
+        searchlist = getquerylist(args.query_file)
+        if args.searchfor == 'with':
+            contList = parse_fasta_with(searchlist, FastaListe)
+            contFasta = ">%s" % ">".join(contList)
+            Output.write(contFasta)
+        elif args.searchfor == 'without':
+            notcontList = complement_fasta(FastaListe, parse_fasta_with(
+                                           searchlist, FastaListe))
+            notcontFasta = ">%s" % ">".join(notcontList)
+            Output.write(notcontFasta)
     Output.close()
 
 
b
diff -r e3aee4ba49c6 -r ea8fde9c6f82 cherry_pick_fasta.xml
--- a/cherry_pick_fasta.xml Sun Oct 15 13:26:45 2017 -0400
+++ b/cherry_pick_fasta.xml Wed Oct 09 18:48:17 2019 -0400
b
@@ -1,44 +1,94 @@
-<tool id="cherry_pick_fasta" name="Pick Fasta sequences" version="1.0.0">
-  <description>with header satisfying a query string</description>
+<tool id="cherry_pick_fasta" name="Pick Fasta sequences" version="2.0.0">
+  <description>with header satisfying a string query</description>
   <command interpreter="python">cherry_pick_fasta.py
                                    --input $input
-                                   --query-string "$query"
+                                   --searchfor '$search.searchfor'
+                                   #if $search.options_selector == 'single':
+                                       --query-string '$search.query'
+                                   #else:
+                                       --query-file '$search.query'
+                                   #end if
                                    --output $output
   </command>
 
   <inputs>
-    <param name="query" type="text" size="30" value="" label="Select sequences with this string in their header" help="exemple: gi|40557596">
-    <sanitizer>
-        <valid initial="string.printable">
-          <remove value="&quot;"/>
-          <remove value="\"/>
-        </valid>
-        <mapping initial="none">
-          <add source="&quot;" target="\&quot;"/>
-          <add source="\" target="\\"/>
-        </mapping>
-      </sanitizer>
-    </param>
-    <param format="fasta" label="Source file" name="input" type="data" />
+    <param name="input" type="data" format="fasta" label="Source file" help="Fasta file to parse" />
+
+    <conditional name="search">
+        <param name="options_selector" type="select" display="radio" label="by single term or file of terms">
+            <option value="single" selected="True">single term</option>
+            <option value="textdataset">terms in a text dataset</option>
+        </param>
+        <when value="single">
+            <param name="query" type="text" size="30" value="" label="Search string" help="exemple: gi|40557596">
+                <sanitizer>
+                    <valid initial="string.printable">
+                        <remove value="&quot;"/>
+                        <remove value="\"/>
+                    </valid>
+                    <mapping initial="none">
+                        <add source="&quot;" target="\&quot;"/>
+                        <add source="\" target="\\"/>
+                    </mapping>
+                </sanitizer>
+            </param>
+            <param name="searchfor" type="select" label="retrieve sequences whose headers contain or do not contain the search string">
+                <option value="with" selected="true">contain</option>
+                <option value="without">do not contain</option>
+            </param>
+        </when>
+        <when value="textdataset">
+            <param name="query" type="data" format="txt" label="term dataset" help="a list of term to search for, one term per line" />
+            <param name="searchfor" type="select" label="retrieve sequences whose headers contain or do not contain the search list">
+                <option value="with" selected="true">contain</option>
+                <option value="without">do not contain</option>
+            </param>
+        </when>
+    </conditional>
   </inputs>
   <outputs>
-    <data name="output" format="fasta" label="${tool.name} on ${on_string} including '${query.value}' in header" />
+    <data name="output" format="fasta" label="Fasta sequences ${search.searchfor.value} ${search.options_selector} term(s) in header" />
   </outputs>
   <tests>
     <test>
         <param ftype="fasta" name="input" value="input.fa" />
+        <!-- <param name="options_selector" value="textdataset" /> -->
         <param name="query" value="gi|81971654" />
+        <param name="searchfor" value="with" />
         <output name="output" ftype="fasta" file="output.fa" />
     </test>
+    <test>
+        <param ftype="fasta" name="input" value="input.fa" />
+        <!-- <param name="options_selector" value="textdataset" /> -->
+        <param name="query" value="RNA" />
+        <param name="searchfor" value="without" />
+        <output name="output" ftype="fasta" file="output_without.fa" />
+    </test>
+    <test>
+        <param ftype="fasta" name="input" value="input.fa" />
+        <param name="options_selector" value="textdataset" />
+        <param name="query" ftype="txt" value="termlist.txt" />
+        <param name="searchfor" value="without" />
+        <output name="output" ftype="fasta" file="output_termlist.fa" />
+    </test>
+    <test>
+        <param ftype="fasta" name="input" value="input.fa" />
+        <param name="options_selector" value="textdataset" />
+        <param name="query" ftype="txt" value="termlist.txt" />
+        <param name="searchfor" value="without" />
+        <output name="output" ftype="fasta" file="output_termlist_without.fa" />
+    </test>
   </tests>
+
   <help>
 **What it does**
 
-This tool retrieves nucleotide/peptide sequences from a fasta file whose headers match a given query string.
+This tool retrieves nucleotide/peptide sequences from a fasta file whose headers match
+or do not match a given string.
 
-It is Copyright © 2015 `CNRS and University Pierre et Marie Curie`_ and is released under the `MIT license`_.
+It is Copyright © 2019 `CNRS and Sorbonne-Université`_ and is released under the `MIT license`_.
 
-.. _CNRS and University Pierre et Marie Curie: http://www.upmc.fr/en/index.html
+.. _CNRS and Sorbonne-Université: http://www.sorbonne-universite.fr/en
 .. _MIT license: http://opensource.org/licenses/MIT
 
   </help>
b
diff -r e3aee4ba49c6 -r ea8fde9c6f82 test-data/input.fa
--- a/test-data/input.fa Sun Oct 15 13:26:45 2017 -0400
+++ b/test-data/input.fa Wed Oct 09 18:48:17 2019 -0400
b
b'@@ -107,7 +107,6 @@\n ACTGTGCGTCCAAAAGAGGCTTATCGTCTAGTCGAAGAAGGATCAACCGGCAATAAGCAG\n TATCGTTTGGACAAAACGAAAACCAAAGGAGCTATCGATCTCGATGTGTACGAATTCGTG\n CGC\n-\n >gi|21321709|ref|NP_647481.1|_nonstructural_polyprotein__Cricket_paralysis_virus--Locus_65_Transcript_2/2_Confidence_0.333_Length_1324_hit1_IdMatch=43.5,AligLength=446,E-val=1e-119\n CTTGAGGATACTTTACCAGGTATGGTCGAGCACGTTACGCTCGTAGCACAAAATACATCC\n GCGTCAGCCAAGGTGTTATCTGACGAGTTGATCAAATCAATGCTTTGCATTGTTTTGATT\n@@ -217,7 +216,6 @@\n GGAGATTGTGGTGCCTTGCTGGTAGCACAAAATCATGCAATTGTGAGGAAAATATTTGCA\n ATGCATATAGCAGGTGCGGAAGAAAATGGCTATGCTTGTCCAATCAATCAGGAAATGTTA\n G\n-\n >gi|8895507|gb|AAF80998.1|_nonstructural_polyprotein__cricket_paralysis_virus--Locus_65_Transcript_2/2_Confidence_0.333_Length_1324_hit1_IdMatch=43.5,AligLength=446,E-val=1e-119\n CTTGAGGATACTTTACCAGGTATGGTCGAGCACGTTACGCTCGTAGCACAAAATACATCC\n GCGTCAGCCAAGGTGTTATCTGACGAGTTGATCAAATCAATGCTTTGCATTGTTTTGATT\n@@ -327,7 +325,6 @@\n GGAGATTGTGGTGCCTTGCTGGTAGCACAAAATCATGCAATTGTGAGGAAAATATTTGCA\n ATGCATATAGCAGGTGCGGAAGAAAATGGCTATGCTTGTCCAATCAATCAGGAAATGTTA\n G\n-\n >gi|798547303|gb|AKA63265.1|_nonstructural_polyprotein__Cricket_paralysis_virus--Locus_63_Transcript_2/2_Confidence_0.333_Length_343_hit1_IdMatch=53.45,AligLength=116,E-val=4e-32\n ACACAGTCCACAGTCCGAAGACCAAAGCGTTGGATAGGACACGAATACACAGATGAAACG\n AAAACAGGCGAGGCTGCGCCCTATCGGACATTGGAAGAAGTCCGTTTCCTTAAAAGAGGG\n@@ -385,21931 +382,117 @@\n TGGAAGAAGTCCGTTTCCTTAAAAGAGGGTTCAGAATGGATCACCTCTTGTGTCGGTGGG\n TAGCTCCTTTGAAGAAGGATGTCATCTACGAAATGCTTAATTGGACGCGCAAAGGGATTA\n 
ACCCAGATGATGTGACGATGATGATCATTGATACAGCATTTAGGGAGATCTCTTATCACG\n-GAAGGGAAGCTTTCGAGAAGCTGCGAGGGCAGATACTTGAGCAGCGGGATGTGTTGGTTG\n-AATATCCTCAA\n->gi|798547303|gb|AKA63265.1|_nonstructural_polyprotein__Cricket_paralysis_virus--Locus_50_Transcript_1/1_Confidence_0.000_Length_1442_hit1_IdMatch=25.51,AligLength=537,E-val=1e-49\n-GAATTCGTGCGCATGCAAAGAATAAATGACCACCCTTCGGGTTGGAAAGCTACGGATGAA\n-GTATATGGCTATGCAGAGTTCTCGAAACTAATGTGTGCTGAATGGAAGAGAAGGAAGACA\n-GAACATCAGAATACTGTTGACTTCCTTAAGAAGTATGCAGAGCGACCCTTCGAGACCAAC\n-CCCGGACCAGTGGAGGATATCCCAATAAGACACGATGATGTCGAGCAGGGGGTAGAAGCG\n-CAGATGGGTCGAGATGCAGATTGGTTTAACAATGACATAGCGGAACGTATAGCGCGTGGA\n-CAGGATATTACTGATATCTTGTATGAGTATGCTGAAGATGACGAGTTGCATGAGGATTAC\n-ATGGCTTACAAGAAACAGCAGGCCCAGCCTAGTAAGTGGGACAAATACGCGCGCCGTCTC\n-GAAAGTGCAATTACGGAAGGAAAGAATTTCCTTGCCCGTGTGGTTTCAAAAATAGCCAGC\n-GTCATTCGGGAGAACCCATATTTGACCATGATGGCAACTGTGGGGAGCGTTCTCGCTCTG\n-TATGGAGCTATGCGTTGGTTTTCGAAAGGAGTAACGGAGACTTTTGACGCTGAAGAAGTT\n-ACTATTCCCAACGAAACCAAGGTAGAGAACGTTGTGCGTACGGAGGGTTTTGAATCTTAC\n-GACCATCGGACTCCGCGCGCTCATCGAGCCAACAGGCAATATGTGCGAGCTGAGGCGATG\n-ATAGATGAAACAGGGTACCTGGTAGCCAACAACAAAGTCACTGGCAACACGTATCGAATG\n-TGTATCAAGAGGGATCCTGATGATTTGGTCGTTGGAAACGCTGTGTTTATCACAGGGTGG\n-ACGCTCCTCATACCGTACCACTTCGTTTGTGGACTGGCGGGACGGAGAATAGCTGCTGAT\n-TCCATCGTGACTTTGTCAAAGCCAGGCTTGGATAAGATTATTGAATTCCCGTTGTCACGA\n-ATCTTCCGATACGATACCTCACCAGATGGTTTTACCACTAGTGAGTATTGTGCTCGAATG\n-GAACATGAAGATGGAGAATTGGTTGATGCCATCCTGGTAAACCTGCATGGTTTGGGAGTG\n-CGAATCCATCCTGACCTCCGGGGAAAAATTGTGACGGTACGAGACCAAGCGCACCTGAGT\n-ACGACATTTCATGCGATTCTCACAACGATGTCCAGGAAGCCACCACTAACAACGTCACAA\n-CAAGTGGTAAAAGGGGTCAAGCCAATGGATAAAATCCTGCACATCAATTTACCAGTTGGG\n-GACAAAACAACGCAATACACCCAACGTGACTGTTACAAGTATTATTCCGTAACGGTCGTT\n-GGAGATTGTGGTGCCTTGCTGGTAGCACAAAATCATGCAATTGTGAGGAAAATATTTGCA\n-ATGCATATAGCAGGTGCGGAAGAAAATGGCTATGCTTGTCCAATCAATCAGGAAATGTTA\n-G\n->gi|798547303|gb|AKA63265.1|_nonstructural_polyprotein__Cricket_paralysis_virus--Locus_65_Transcript_1/2_Confidence_0.667_Length_1344_hit1_IdMatch=43.68,AligLengt
h=451,E-val=2e-123\n-TAGATAAGGTTTGCTCATTTCTTGAGGATGCTTTACCAGGTATGGTCGAGCACGTTACGC\n-TCGTAGCACAAAATACATCCGCGTCAGCCAAGGTGTTATCTGACGAGTTGATCAAATCAA\n-TGCTTTGCATTGTTTTGATTTGCTTGTTGATTGAAACCAAGTTCTATAAGACCGCTTTCG\n-CGGTACTTATAGTGGTTGCTCTACGTGTTTTCGGGTACAGTGAGCAAATAATTGAGACAG\n-CTATGGACATGTATCGCGTAATTAGGGCTCCAAAGGCTCAAGGTAATATGGAAGATGTCG\n-TTTTCCATCCGTGGTTGAACACGTGTGGAAAGTTGATTTTCCTACTTATCGCTGTCCTGT\n-GTCTCAAGAAATTACCAGGAAAGAACGACGTAGACACTTTCATGCGCAGGCTCGACAGCT\n-TACCCAAAGCTGTTAAGGGTGCGACACAACTACATGAATGGGTGTCAAAATACTTCGATC\n'..b'AAAACATCTGCAGTATTATCGA\n+AATCAAGACGAGGTTTGGAAGCGCTTGAAGCATCTGAATATAGAAGCATCAATCGTGTTG\n+AACGAGCGTTAGAGATGGTACTCAAATTAGTTCAAAGACAACAAAATGATAGAAGACAAC\n+GAGCGATAGCAGGCGAACCAAATTCCATTCTATTACTGACCCTTGTTTATTATGTTATCT\n+TATCGGCTATGTACGCCATGTCGACAGATGCAGCTCAAGGTAAACAGGTTGGTAATTCAA\n+TGGACCTTCAAGACTTGTTATTCGCGACAACTCAGACGGACACGCTTGTGTCATCAATTG\n+ATATTGTAGGTATGGATGCTTCTGTGCAGTCAATAACTACTGAGTTGTCAAATATTATCT\n+GTCTTGAAGTGACGCGTGGTTTACCTGAATCACAAATTGGACCATTTACAGGCGGTATGA\n+AGCGTCTTCTGCAACTAAGTGATGAACCTGGTGGAGCGTGGAAGCAGGTTGAGATGTATG\n+TATCAGGTACACTTGAGGCCGTGGTATTCGAAGGTAGTCATGCACTAACATCAACTACTT\n+ACGAGAGTAAGATTTTTGGAAGTGTTAAGAACTATGCGGGTACGTATCCCTCAGGTAGAG\n+CTGACACGTCGTCACATCACACTAAGGTTTTGGAAGGTGCGACCCGTGGTAATGAAATGC\n+GAAGAAGAACGGATGAGCGAATCGTGCACCATGCGTCGACGATTGTAATGTCACGTAATA\n+TGGGTGATGATAAGTCAGACGTATACACAGGATCATTTCCAAATGTTATATCACAATTAG\n+TGAGCGATAAAGATGTACTCGCACAATTGGGTTTTAAGACAGATGCAGATCTCTCGAGTC\n+ACAACGGAGAATTCTTGCAACAACATGTATGTAGAGGAAGGCTAGTCGGAAAACCATCAC\n+GTATATCAATAGGCACAGTAGAGCATCGTAAAGAGAAGGTTCGGATGCATGAAGCATGTC\n+AAGAACTTCTATCTATTATGGATGACCTAATTGTGCGTATTAGAGATACCGAGGGCTTGA\n+AGATGATGATCTTCTCGTTTGCTATACATTGCATTAATAGTATTGTATTAAACATTGCGA\n+AAGTTGATCTTGCCGCTATAATATCGAAATTGACTTCAAATAATTTGCGTACATATGTAT\n+ATCCTACGAAAGATGAACATGCTTTTCAGCTCGTTAGATTGTATTTTCCATTGATGTGGT\n+TCTTTATGCATAAAGGTGGTGAATTACCAGCTTATCCAATTGAACGGGTTGATGGTACTT\n+ATACAGATGACGAGTCGGTGTACACTGTGCGAGGTGAATACAAACGAAGATTGATGTTTG\n+ATATTATAGGTATTGATAAAATTGAGAAATTTGGTGACGCCATTTTCAGAAATAATCACT
\n+GCTTTGATATCGGTTTGAACGCTGCTGATGCCATCATTAAGCTGAAGATAACGGATCTAC\n+CGAAGGAAATGAGAAGTGAAACGCTCGAGCATGGTATCATATCAAATCTAGCGAAAAATT\n+TAGAGTCATTCGGCAATGCTATGTCTAAGGAAGCTTCACTTCAAGCGAAACTCAGGATTG\n+AAAATGAACTTGCAGGTGTTAGGAGCGTAACTCAGACAAATGAAGTTGTCGTTGGAAGAG\n+GAAAGATAGCAAAAGTCCCAAAAAGTATTGTATACGCACATCGAACTGAAGCACAACTTG\n+AACAGATATTAATGACAAGAGAGTCGGATAATGAAGAGCGACCAATGATATCAAAGCGAA\n+TGCTTGATCACATCGCTTCACTATCGTTTCATCATGTTGTTAATGTCAAGACAACGGATA\n+AGTTACACTTGTATTACTTCTATCCTAGTGGCGATGCCCTAGTTTACGGTAATCATGCAA\n+AATACACTGAACATTTCGAATTAGCTCCACCTATGTGGTATTTGTCACCTTCATGGCGTT\n+TATATGGCCTATTAGGTACAGCGTCACAGACACGTGGTGACTTACTTCGACAAATTAATT\n+GGCTAAAAGGTAAATATGGAACGTTTAAGCTTGATGACGAGAAGATCCGTTATGGATATG\n+ATGTTATCTGGCGAAAGAACAGACATCTGCTTAATGACTACATGACAATGATCGGAGCAT\n+CACCACATCTTGAAAACTTGCTTAAGAGCATCTTTCGTTTGATGGATAGATGGGGTACTT\n+ATCGTTATGATTACATTCAAACACCGAGGAATATTTTCTTTATCTCAGACAATCCATTAG\n+TCGCTGAACAGAACATTATCTTCGCTGCAGATGGTGACGAGATAACTAGGCCCTTACAGG\n+TAATTGTCGGCTATCTACATATACTTGCGCAT\n+>gi|722158941|ref|YP_009104379.1|_RNA-dependent_RNA_polymerase__Fako_virus--Locus_27_Transcript_6/7_Confidence_0.333_Length_1626_hit1_IdMatch=21.78,AligLength=473,E-val=8e-19\n+CTCGCTCATGTCAAGAACTTCTATCTATTATGGATGACCTAATTGTGCGTATTAGAGATA\n+CCGAGGGCTTGAAGATGATGATCTTCTCGTTTGCTATACATTGCATTAATAGTATTGTAT\n+TAAACATTGCGAAAGTTGATCTTGCCGCTATAATATCGAAATTGACTTCAAATAATTTGC\n+GTACATATGTATATCCTACGAAAGATGAACATGCTTTTCAGCTCGTTAGATTGTATTTTC\n+CATTGATGTGGTTCTTTATGCATAAAGGTGGTGAATTACCAGCTTATCCAATTGAACGGG\n+TTGATGGTACTTATACAGATGACGAGTCGGTGTACACTGTGCGAGGTGAATACAAACGAA\n+GATTGATGTTTGATATTATAGGTATTGATAAAATTGAGAAATTTGGTGACGCCATTTTCA\n+GAAATAATCACTGCTTTGATATCGGTTTGAACGCTGCTGATGCCATCATTAAGCTGAAGA\n+TAACGGATCTACCGAAGGAAATGAGAAGTGAAACGCTCGAGCATGGTATCATATCAAATC\n+TAGCGAAAAATTTAGAGTCATTCGGCAATGCTATGTCTAAGGAAGCTTCACTTCAAGCGA\n+AACTCAGGATTGAAAATGAACTTGCAGGTGTTAGGAGCGTAACTCAGACAAATGAAGTTG\n+TCGTTGGAAGAGGAAAGATAGCAAAAGTCCCAAAAAGTATTGTATACGCACATCGAACTG\n+AAGCACAACTTGAACAGATATTAATGACAAGAGAGTCGGATAATGAAGAGCGACCAATGA\n+TATCAAAGCGAATGCTTGATC
ACATCGCTTCACTATCGTTTCATCATGTTGTTAATGTCA\n+AGACAACGGATAAGTTACACTTGTATTACTTCTATCCTAGTGGCGATGCCCTAGTTTACG\n+GTAATCATGCAAAATACACTGAACATTTCGAATTAGCTCCACCTATGTGGTATTTGTCAC\n+CTTCATGGCGTTTATATGGCCTATTAGGTACAGCGTCACAGACACGTGGTGACTTACTTC\n+GACAAATTAATTGGCTAAAAGGTAAATATGGAACGTTTAAGCTTGATGACGAGAAGATCC\n+GTTATGGATATGATGTTATCTGGCGAAAGAACAGACATCTGCTTAATGACTACATGACAA\n+TGATCGGAGCATCACCACATCTTGAAAACTTGCTTAAGAGCATCTTTCGTTTGATGGATA\n+GATGGGGTACTTATCGTTATGATTACATTCAAACACCGAGGAATATTTTCTTTATCTCAG\n+ACAATCCATTAGTCGCTGAACAGAACATTATCTTCGCTGCAGATGGTGACGAGATAACTA\n+GGCCCTTACAGGTAATTGTCGGCTATCTACATATACTTGCGCAT\n'
b
diff -r e3aee4ba49c6 -r ea8fde9c6f82 test-data/output_termlist.fa
--- /dev/null Thu Jan 01 00:00:00 1970 +0000
+++ b/test-data/output_termlist.fa Wed Oct 09 18:48:17 2019 -0400
b
b'@@ -0,0 +1,5187 @@\n+>gi|157065140|gb|ABV04399.1|_p3__Heliothis_armigera_cypovirus_5--Locus_27_Transcript_6/7_Confidence_0.333_Length_1626_hit1_IdMatch=24.9,AligLength=494,E-val=2e-33\n+CTCCTCGCTCATGTCAAGAACTTCTATCTATTATGGATGACCTAATTGTGCGTATTAGAG\n+ATACCGAGGGCTTGAAGATGATGATCTTCTCGTTTGCTATACATTGCATTAATAGTATTG\n+TATTAAACATTGCGAAAGTTGATCTTGCCGCTATAATATCGAAATTGACTTCAAATAATT\n+TGCGTACATATGTATATCCTACGAAAGATGAACATGCTTTTCAGCTCGTTAGATTGTATT\n+TTCCATTGATGTGGTTCTTTATGCATAAAGGTGGTGAATTACCAGCTTATCCAATTGAAC\n+GGGTTGATGGTACTTATACAGATGACGAGTCGGTGTACACTGTGCGAGGTGAATACAAAC\n+GAAGATTGATGTTTGATATTATAGGTATTGATAAAATTGAGAAATTTGGTGACGCCATTT\n+TCAGAAATAATCACTGCTTTGATATCGGTTTGAACGCTGCTGATGCCATCATTAAGCTGA\n+AGATAACGGATCTACCGAAGGAAATGAGAAGTGAAACGCTCGAGCATGGTATCATATCAA\n+ATCTAGCGAAAAATTTAGAGTCATTCGGCAATGCTATGTCTAAGGAAGCTTCACTTCAAG\n+CGAAACTCAGGATTGAAAATGAACTTGCAGGTGTTAGGAGCGTAACTCAGACAAATGAAG\n+TTGTCGTTGGAAGAGGAAAGATAGCAAAAGTCCCAAAAAGTATTGTATACGCACATCGAA\n+CTGAAGCACAACTTGAACAGATATTAATGACAAGAGAGTCGGATAATGAAGAGCGACCAA\n+TGATATCAAAGCGAATGCTTGATCACATCGCTTCACTATCGTTTCATCATGTTGTTAATG\n+TCAAGACAACGGATAAGTTACACTTGTATTACTTCTATCCTAGTGGCGATGCCCTAGTTT\n+ACGGTAATCATGCAAAATACACTGAACATTTCGAATTAGCTCCACCTATGTGGTATTTGT\n+CACCTTCATGGCGTTTATATGGCCTATTAGGTACAGCGTCACAGACACGTGGTGACTTAC\n+TTCGACAAATTAATTGGCTAAAAGGTAAATATGGAACGTTTAAGCTTGATGACGAGAAGA\n+TCCGTTATGGATATGATGTTATCTGGCGAAAGAACAGACATCTGCTTAATGACTACATGA\n+CAATGATCGGAGCATCACCACATCTTGAAAACTTGCTTAAGAGCATCTTTCGTTTGATGG\n+ATAGATGGGGTACTTATCGTTATGATTACATTCAAACACCGAGGAATATTTTCTTTATCT\n+CAGACAATCCATTAGTCGCTGAACAGAACATTATCTTCGCTGCAGATGGTGACGAGATAA\n+CTAGGCCCTTACAGGTAATTGTCGGCTATCTACATATACTTGCGCATATTAATACGATTT\n+TTACACGACCACAAGTAAAGTTAACTGAGCATCTTATTGAATATATGCATCAGCGAGCTG\n+TACATACAGGAAGGTCG\n+>gi|584614105|gb|AHJ14783.1|_VP3__Orgyia_pseudotsugata_cypovirus_5--Locus_27_Transcript_1/7_Confidence_0.444_Length_3872_hit1_IdMatch=28.76,AligLength=1217,E-val=4e-139\n+GTGGTATAGCTCTCAGCGCTACGGTTATAGTACCTCAGAGTATTTTGAAGCCACCACCTT\n+TCAACGAGAAAGACTGGCCTTTGAATGAAGACGAGAGTATGTTCAG
TGCCTCGCGCAAGT\n+ATAATTACATGATAAATACTAGTACGTTGAGCCTTTATGGTTCGAGGGAAAGTTTAGTCG\n+GTAAAGCAATATACGGTTTATATACTGATGAGCAATCACAGTCACGCTTCAGGACAGTAT\n+GGCATCAAATAATGGCAAGTGTCTACGCACTAGACGATTATCTAGGTCATACTAACCATC\n+CAGTTCGTGCAGTGTTGGCACAGTTAAACTTAGACAAAGGATTACCATTCAAGGAAACTG\n+CTGAAGGTATTGACTTAACAGAGGCGGTTGAAAAAGGAATTGATTCGAGTACATTACTAC\n+CATCAATATTATATATGTTGATCTCAGTATCGTGCGATATCTGTTTCGGAATTTCAACTG\n+AAGTTGAAGGTGCCTTTACGATCAATCATTATCTTAATCTAGCACAGCATGATTACGCGG\n+ATGAGAAGTTACGAATTAAGTCGGCATGTCGTAATTGGTTTGCACAAGCATTGAGTAAAC\n+TAGACGTCATAGCTTACCCAGTTTATAACAATCAGCTCGAGATCATCGACCTAAAGTATG\n+TACATGGTAAAGAGCCAAAGTATGTAAGCACATTACATGAAAAAGTTGCCGAATCACGTC\n+AACGTAAGCTGTCAAAATACCCATACTTACTGGAATATATTGATAGGTCACGTAAAGCGA\n+AAACGGTGGAGGAATTAATCCATAGACTTTTAGTGATGAATGCACTTTCAAACGACCGCT\n+CTTTCTATAAAACACGGACGGAATTATCATTAGACGCGGCGGTAAAATCAGAGGTGCGAG\n+AGCACTTAGTTAGTGCTCCGGTCGCTAAATTGATTGACCCTCAGTCTAATCGAATCTATC\n+AGAAGTACTTTATTAGAGAAAGGAATGAAGCAATGTACTATGCTCAACAGTACTTATTAA\n+GCTTTGTCCCAGCATTGATCCAACAACTGAGCAAAACCAACTTTGATGAGGAATGGTTAC\n+GATTTTTAACCACATCTTCACCTGGAGTCAAATTACCTCAAGAAACGCTAGACAGCCTGA\n+GTAAAACATCTGCAGTATTATCGAAATCAAGACGAGGTTTGGAAGCGCTTGAAGCATCTG\n+AATATAGAAGCATCAATCGTGTTGAACGAGCGTTAGAGATGGTACTCAAATTAGTTCAAA\n+GACAACAAAATGATAGAAGACAACGAGCGATAGCAGGCGAACCAAATTCCATTCTATTAC\n+TGACCCTTGTTTATTATGTTATCTTATCGGCTATGTACGCCATGTCGACAGATGCAGCTC\n+AAGGTAAACAGGTTGGTAATTCAATGGACCTTCAAGACTTGTTATTCGCGACAACTCAGA\n+CGGACACGCTTGTGTCATCAATTGATATTGTAGGTATGGATGCTTCTGTGCAGTCAATAA\n+CTACTGAGTTGTCAAATATTATCTGTCTTGAAGTGACGCGTGGTTTACCTGAATCACAAA\n+TTGGACCATTTACAGGCGGTATGAAGCGTCTTCTGCAACTAAGTGATGAACCTGGTGGAG\n+CGTGGAAGCAGGTTGAGATGTATGTATCAGGTACACTTGAGGCCGTGGTATTCGAAGGTA\n+GTCATGCACTAACATCAACTACTTACGAGAGTAAGATTTTTGGAAGTGTTAAGAACTATG\n+CGGGTACGTATCCCTCAGGTAGAGCTGACACGTCGTCACATCACACTAAGGTTTTGGAAG\n+GTGCGACCCGTGGTAATGAAATGCGAAGAAGAACGGATGAGCGAATCGTGCACCATGCGT\n+CGACGATTGTAATGTCACGTAATATGGGTGATGATAAGTCAGACGTATACACAGGATCAT\n+TTCCAAATGTTATATCACAATTAGTGAGCGATAAAGATGTACTCGCACAATTGGGTTTTA\n+AGACAGATGCAGATCTCTCGAGTCACAACG
GAGAATTCTTGCAACAACATGTATGTAGAG\n+GAAGGCTAGTCGGAAAACCATCACGTATAT'..b'TTTCGTTTGATGGATAGATGGG\n+GTACTTATCGTTATGATTACATTCAAACACCGAGGAATATTTTCTTTATCTCAGACAATC\n+CATTAGTCGCTGAACAGAACATTATCTTCGCTGCAGATGGTGACGAGATAACTAGGCCCT\n+TACAGGTAATTGTCGGCTATCTACATATACTTGCGCATATTAATACGATTTTTACACGAC\n+CACAAGTAAAGTTAACTGAGCATCTTATTGAATATATGCATCAGCGAGCTGTACAT\n+>gi|330688232|gb|AEC32894.1|_RNA-dependent_RNA_polymerase__Rice_ragged_stunt_virus--Locus_27_Transcript_2/7_Confidence_0.333_Length_3860_hit1_IdMatch=24.94,AligLength=1199,E-val=1e-81\n+GGTTACTCACGACTATGCCACCATTGGTGACAGAATTCGCTGGAGTAGACTGTTGTGGTA\n+TAGCTCTCAGCGCTACGGTTATAGTACCTCAGAGTATTTTGAAGCCACCACCTTTCAACG\n+AGAAAGACTGGCCTTTGAATGAAGACGAGAGTATGTTCAGTGCCTCGCGCAAGTATAATT\n+ACATGATAAATACTAGTACGTTGAGCCTTTATGGTTCGAGGGAAAGTTTAGTCGGTAAAG\n+CAATATACGGTTTATATACTGATGAGCAATCACAGTCACGCTTCAGGACAGTATGGCATC\n+AAATAATGGCAAGTGTCTACGCACTAGACGATTATCTAGGTCATACTAACCATCCAGTTC\n+GTGCAGTGTTGGCACAGTTAAACTTAGACAAAGGATTACCATTCAAGGAAACTGCTGAAG\n+GTATTGACTTAACAGAGGCGGTTGAAAAAGGAATTGATTCGAGTACATTACTACCATCAA\n+TATTATATATGTTGATCTCAGTATCGTGCGATATCTGTTTCGGAATTTCAACTGAAGTTG\n+AAGGTGCCTTTACGATCAATCATTATCTTAATCTAGCACAGCATGATTACGCGGATGAGA\n+AGTTACGAATTAAGTCGGCATGTCGTAATTGGTTTGCACAAGCATTGAGTAAACTAGACG\n+TCATAGCTTACCCAGTTTATAACAATCAGCTCGAGATCATCGACCTAAAGTATGTACATG\n+GTAAAGAGCCAAAGTATGTAAGCACATTACATGAAAAAGTTGCCGAATCACGTCAACGTA\n+AGCTGTCAAAATACCCATACTTACTGGAATATATTGATAGGTCACGTAAAGCGAAAACGG\n+TGGAGGAATTAATCCATAGACTTTTAGTGATGAATGCACTTTCAAACGACCGCTCTTTCT\n+ATAAAACACGGACGGAATTATCATTAGACGCGGCGGTAAAATCAGAGGTGCGAGAGCACT\n+TAGTTAGTGCTCCGGTCGCTAAATTGATTGACCCTCAGTCTAATCGAATCTATCAGAAGT\n+ACTTTATTAGAGAAAGGAATGAAGCAATGTACTATGCTCAACAGTACTTATTAAGCTTTG\n+TCCCAGCATTGATCCAACAACTGAGCAAAACCAACTTTGATGAGGAATGGTTACGATTTT\n+TAACCACATCTTCACCTGGAGTCAAATTACCTCAAGAAACGCTAGACAGCCTGAGTAAAA\n+CATCTGCAGTATTATCGAAATCAAGACGAGGTTTGGAAGCGCTTGAAGCATCTGAATATA\n+GAAGCATCAATCGTGTTGAACGAGCGTTAGAGATGGTACTCAAATTAGTTCAAAGACAAC\n+AAAATGATAGAAGACAACGAGCGATAGCAGGCGAACCAAATTCCATTCTATTACTGACCC\n+TTGTTTATTATGTTATCTTATCGG
CTATGTACGCCATGTCGACAGATGCAGCTCAAGGTA\n+AACAGGTTGGTAATTCAATGGACCTTCAAGACTTGTTATTCGCGACAACTCAGACGGACA\n+CGCTTGTGTCATCAATTGATATTGTAGGTATGGATGCTTCTGTGCAGTCAATAACTACTG\n+AGTTGTCAAATATTATCTGTCTTGAAGTGACGCGTGGTTTACCTGAATCACAAATTGGAC\n+CATTTACAGGCGGTATGAAGCGTCTTCTGCAACTAAGTGATGAACCTGGTGGAGCGTGGA\n+AGCAGGTTGAGATGTATGTATCAGGTACACTTGAGGCCGTGGTATTCGAAGGTAGTCATG\n+CACTAACATCAACTACTTACGAGAGTAAGATTTTTGGAAGTGTTAAGAACTATGCGGGTA\n+CGTATCCCTCAGGTAGAGCTGACACGTCGTCACATCACACTAAGGTTTTGGAAGGTGCGA\n+CCCGTGGTAATGAAATGCGAAGAAGAACGGATGAGCGAATCGTGCACCATGCGTCGACGA\n+TTGTAATGTCACGTAATATGGGTGATGATAAGTCAGACGTATACACAGGATCATTTCCAA\n+ATGTTATATCACAATTAGTGAGCGATAAAGATGTACTCGCACAATTGGGTTTTAAGACAG\n+ATGCAGATCTCTCGAGTCACAACGGAGAATTCTTGCAACAACATGTATGTAGAGGAAGGC\n+TAGTCGGAAAACCATCACGTATATCAATAGGCACAGTAGAGCATCGTAAAGAGAAGGTTC\n+GGATGCATGAAGCATGTCAAGAACTTCTATCTATTATGGATGACCTAATTGTGCGTATTA\n+GAGATACCGAGGGCTTGAAGATGATGATCTTCTCGTTTGCTATACATTGCATTAATAGTA\n+TTGTATTAAACATTGCGAAAGTTGATCTTGCCGCTATAATATCGAAATTGACTTCAAATA\n+ATTTGCGTACATATGTATATCCTACGAAAGATGAACATGCTTTTCAGCTCGTTAGATTGT\n+ATTTTCCATTGATGTGGTTCTTTATGCATAAAGGTGGTGAATTACCAGCTTATCCAATTG\n+AACGGGTTGATGGTACTTATACAGATGACGAGTCGGTGTACACTGTGCGAGGTGAATACA\n+AACGAAGATTGATGTTTGATATTATAGGTATTGATAAAATTGAGAAATTTGGTGACGCCA\n+TTTTCAGAAATAATCACTGCTTTGATATCGGTTTGAACGCTGCTGATGCCATCATTAAGC\n+TGAAGATAACGGATCTACCGAAGGAAATGAGAAGTGAAACGCTCGAGCATGGTATCATAT\n+CAAATCTAGCGAAAAATTTAGAGTCATTCGGCAATGCTATGTCTAAGGAAGCTTCACTTC\n+AAGCGAAACTCAGGATTGAAAATGAACTTGCAGGTGTTAGGAGCGTAACTCAGACAAATG\n+AAGTTGTCGTTGGAAGAGGAAAGATAGCAAAAGTCCCAAAAAGTATTGTATACGCACATC\n+GAACTGAAGCACAACTTGAACAGATATTAATGACAAGAGAGTCGGATAATGAAGAGCGAC\n+CAATGATATCAAAGCGAATGCTTGATCACATCGCTTCACTATCGTTTCATCATGTTGTTA\n+ATGTCAAGACAACGGATAAGTTACACTTGTATTACTTCTATCCTAGTGGCGATGCCCTAG\n+TTTACGGTAATCATGCAAAATACACTGAACATTTCGAATTAGCTCCACCTATGTGGTATT\n+TGTCACCTTCATGGCGTTTATATGGCCTATTAGGTACAGCGTCACAGACACGTGGTGACT\n+TACTTCGACAAATTAATTGGCTAAAAGGTAAATATGGAACGTTTAAGCTTGATGACGAGA\n+AGATCCGTTATGGATATGATGTTATCTGGCGAAAGAACAGACATCTGCTTAATGACTACA\n+TGACAATG
ATCGGAGCATCACCACATCTTGAAAACTTGCTTAAGAGCATCTTTCGTTTGA\n+TGGATAGATGGGGTACTTATCGTTATGATTACATTCAAACACCGAGGAATATTTTCTTTA\n+TCTCAGACAAT\n'
b
diff -r e3aee4ba49c6 -r ea8fde9c6f82 test-data/output_termlist_without.fa
--- /dev/null Thu Jan 01 00:00:00 1970 +0000
+++ b/test-data/output_termlist_without.fa Wed Oct 09 18:48:17 2019 -0400
b
b'@@ -0,0 +1,5187 @@\n+>gi|157065140|gb|ABV04399.1|_p3__Heliothis_armigera_cypovirus_5--Locus_27_Transcript_6/7_Confidence_0.333_Length_1626_hit1_IdMatch=24.9,AligLength=494,E-val=2e-33\n+CTCCTCGCTCATGTCAAGAACTTCTATCTATTATGGATGACCTAATTGTGCGTATTAGAG\n+ATACCGAGGGCTTGAAGATGATGATCTTCTCGTTTGCTATACATTGCATTAATAGTATTG\n+TATTAAACATTGCGAAAGTTGATCTTGCCGCTATAATATCGAAATTGACTTCAAATAATT\n+TGCGTACATATGTATATCCTACGAAAGATGAACATGCTTTTCAGCTCGTTAGATTGTATT\n+TTCCATTGATGTGGTTCTTTATGCATAAAGGTGGTGAATTACCAGCTTATCCAATTGAAC\n+GGGTTGATGGTACTTATACAGATGACGAGTCGGTGTACACTGTGCGAGGTGAATACAAAC\n+GAAGATTGATGTTTGATATTATAGGTATTGATAAAATTGAGAAATTTGGTGACGCCATTT\n+TCAGAAATAATCACTGCTTTGATATCGGTTTGAACGCTGCTGATGCCATCATTAAGCTGA\n+AGATAACGGATCTACCGAAGGAAATGAGAAGTGAAACGCTCGAGCATGGTATCATATCAA\n+ATCTAGCGAAAAATTTAGAGTCATTCGGCAATGCTATGTCTAAGGAAGCTTCACTTCAAG\n+CGAAACTCAGGATTGAAAATGAACTTGCAGGTGTTAGGAGCGTAACTCAGACAAATGAAG\n+TTGTCGTTGGAAGAGGAAAGATAGCAAAAGTCCCAAAAAGTATTGTATACGCACATCGAA\n+CTGAAGCACAACTTGAACAGATATTAATGACAAGAGAGTCGGATAATGAAGAGCGACCAA\n+TGATATCAAAGCGAATGCTTGATCACATCGCTTCACTATCGTTTCATCATGTTGTTAATG\n+TCAAGACAACGGATAAGTTACACTTGTATTACTTCTATCCTAGTGGCGATGCCCTAGTTT\n+ACGGTAATCATGCAAAATACACTGAACATTTCGAATTAGCTCCACCTATGTGGTATTTGT\n+CACCTTCATGGCGTTTATATGGCCTATTAGGTACAGCGTCACAGACACGTGGTGACTTAC\n+TTCGACAAATTAATTGGCTAAAAGGTAAATATGGAACGTTTAAGCTTGATGACGAGAAGA\n+TCCGTTATGGATATGATGTTATCTGGCGAAAGAACAGACATCTGCTTAATGACTACATGA\n+CAATGATCGGAGCATCACCACATCTTGAAAACTTGCTTAAGAGCATCTTTCGTTTGATGG\n+ATAGATGGGGTACTTATCGTTATGATTACATTCAAACACCGAGGAATATTTTCTTTATCT\n+CAGACAATCCATTAGTCGCTGAACAGAACATTATCTTCGCTGCAGATGGTGACGAGATAA\n+CTAGGCCCTTACAGGTAATTGTCGGCTATCTACATATACTTGCGCATATTAATACGATTT\n+TTACACGACCACAAGTAAAGTTAACTGAGCATCTTATTGAATATATGCATCAGCGAGCTG\n+TACATACAGGAAGGTCG\n+>gi|584614105|gb|AHJ14783.1|_VP3__Orgyia_pseudotsugata_cypovirus_5--Locus_27_Transcript_1/7_Confidence_0.444_Length_3872_hit1_IdMatch=28.76,AligLength=1217,E-val=4e-139\n+GTGGTATAGCTCTCAGCGCTACGGTTATAGTACCTCAGAGTATTTTGAAGCCACCACCTT\n+TCAACGAGAAAGACTGGCCTTTGAATGAAGACGAGAGTATGTTCAG
TGCCTCGCGCAAGT\n+ATAATTACATGATAAATACTAGTACGTTGAGCCTTTATGGTTCGAGGGAAAGTTTAGTCG\n+GTAAAGCAATATACGGTTTATATACTGATGAGCAATCACAGTCACGCTTCAGGACAGTAT\n+GGCATCAAATAATGGCAAGTGTCTACGCACTAGACGATTATCTAGGTCATACTAACCATC\n+CAGTTCGTGCAGTGTTGGCACAGTTAAACTTAGACAAAGGATTACCATTCAAGGAAACTG\n+CTGAAGGTATTGACTTAACAGAGGCGGTTGAAAAAGGAATTGATTCGAGTACATTACTAC\n+CATCAATATTATATATGTTGATCTCAGTATCGTGCGATATCTGTTTCGGAATTTCAACTG\n+AAGTTGAAGGTGCCTTTACGATCAATCATTATCTTAATCTAGCACAGCATGATTACGCGG\n+ATGAGAAGTTACGAATTAAGTCGGCATGTCGTAATTGGTTTGCACAAGCATTGAGTAAAC\n+TAGACGTCATAGCTTACCCAGTTTATAACAATCAGCTCGAGATCATCGACCTAAAGTATG\n+TACATGGTAAAGAGCCAAAGTATGTAAGCACATTACATGAAAAAGTTGCCGAATCACGTC\n+AACGTAAGCTGTCAAAATACCCATACTTACTGGAATATATTGATAGGTCACGTAAAGCGA\n+AAACGGTGGAGGAATTAATCCATAGACTTTTAGTGATGAATGCACTTTCAAACGACCGCT\n+CTTTCTATAAAACACGGACGGAATTATCATTAGACGCGGCGGTAAAATCAGAGGTGCGAG\n+AGCACTTAGTTAGTGCTCCGGTCGCTAAATTGATTGACCCTCAGTCTAATCGAATCTATC\n+AGAAGTACTTTATTAGAGAAAGGAATGAAGCAATGTACTATGCTCAACAGTACTTATTAA\n+GCTTTGTCCCAGCATTGATCCAACAACTGAGCAAAACCAACTTTGATGAGGAATGGTTAC\n+GATTTTTAACCACATCTTCACCTGGAGTCAAATTACCTCAAGAAACGCTAGACAGCCTGA\n+GTAAAACATCTGCAGTATTATCGAAATCAAGACGAGGTTTGGAAGCGCTTGAAGCATCTG\n+AATATAGAAGCATCAATCGTGTTGAACGAGCGTTAGAGATGGTACTCAAATTAGTTCAAA\n+GACAACAAAATGATAGAAGACAACGAGCGATAGCAGGCGAACCAAATTCCATTCTATTAC\n+TGACCCTTGTTTATTATGTTATCTTATCGGCTATGTACGCCATGTCGACAGATGCAGCTC\n+AAGGTAAACAGGTTGGTAATTCAATGGACCTTCAAGACTTGTTATTCGCGACAACTCAGA\n+CGGACACGCTTGTGTCATCAATTGATATTGTAGGTATGGATGCTTCTGTGCAGTCAATAA\n+CTACTGAGTTGTCAAATATTATCTGTCTTGAAGTGACGCGTGGTTTACCTGAATCACAAA\n+TTGGACCATTTACAGGCGGTATGAAGCGTCTTCTGCAACTAAGTGATGAACCTGGTGGAG\n+CGTGGAAGCAGGTTGAGATGTATGTATCAGGTACACTTGAGGCCGTGGTATTCGAAGGTA\n+GTCATGCACTAACATCAACTACTTACGAGAGTAAGATTTTTGGAAGTGTTAAGAACTATG\n+CGGGTACGTATCCCTCAGGTAGAGCTGACACGTCGTCACATCACACTAAGGTTTTGGAAG\n+GTGCGACCCGTGGTAATGAAATGCGAAGAAGAACGGATGAGCGAATCGTGCACCATGCGT\n+CGACGATTGTAATGTCACGTAATATGGGTGATGATAAGTCAGACGTATACACAGGATCAT\n+TTCCAAATGTTATATCACAATTAGTGAGCGATAAAGATGTACTCGCACAATTGGGTTTTA\n+AGACAGATGCAGATCTCTCGAGTCACAACG
GAGAATTCTTGCAACAACATGTATGTAGAG\n+GAAGGCTAGTCGGAAAACCATCACGTATAT'..b'TTTCGTTTGATGGATAGATGGG\n+GTACTTATCGTTATGATTACATTCAAACACCGAGGAATATTTTCTTTATCTCAGACAATC\n+CATTAGTCGCTGAACAGAACATTATCTTCGCTGCAGATGGTGACGAGATAACTAGGCCCT\n+TACAGGTAATTGTCGGCTATCTACATATACTTGCGCATATTAATACGATTTTTACACGAC\n+CACAAGTAAAGTTAACTGAGCATCTTATTGAATATATGCATCAGCGAGCTGTACAT\n+>gi|330688232|gb|AEC32894.1|_RNA-dependent_RNA_polymerase__Rice_ragged_stunt_virus--Locus_27_Transcript_2/7_Confidence_0.333_Length_3860_hit1_IdMatch=24.94,AligLength=1199,E-val=1e-81\n+GGTTACTCACGACTATGCCACCATTGGTGACAGAATTCGCTGGAGTAGACTGTTGTGGTA\n+TAGCTCTCAGCGCTACGGTTATAGTACCTCAGAGTATTTTGAAGCCACCACCTTTCAACG\n+AGAAAGACTGGCCTTTGAATGAAGACGAGAGTATGTTCAGTGCCTCGCGCAAGTATAATT\n+ACATGATAAATACTAGTACGTTGAGCCTTTATGGTTCGAGGGAAAGTTTAGTCGGTAAAG\n+CAATATACGGTTTATATACTGATGAGCAATCACAGTCACGCTTCAGGACAGTATGGCATC\n+AAATAATGGCAAGTGTCTACGCACTAGACGATTATCTAGGTCATACTAACCATCCAGTTC\n+GTGCAGTGTTGGCACAGTTAAACTTAGACAAAGGATTACCATTCAAGGAAACTGCTGAAG\n+GTATTGACTTAACAGAGGCGGTTGAAAAAGGAATTGATTCGAGTACATTACTACCATCAA\n+TATTATATATGTTGATCTCAGTATCGTGCGATATCTGTTTCGGAATTTCAACTGAAGTTG\n+AAGGTGCCTTTACGATCAATCATTATCTTAATCTAGCACAGCATGATTACGCGGATGAGA\n+AGTTACGAATTAAGTCGGCATGTCGTAATTGGTTTGCACAAGCATTGAGTAAACTAGACG\n+TCATAGCTTACCCAGTTTATAACAATCAGCTCGAGATCATCGACCTAAAGTATGTACATG\n+GTAAAGAGCCAAAGTATGTAAGCACATTACATGAAAAAGTTGCCGAATCACGTCAACGTA\n+AGCTGTCAAAATACCCATACTTACTGGAATATATTGATAGGTCACGTAAAGCGAAAACGG\n+TGGAGGAATTAATCCATAGACTTTTAGTGATGAATGCACTTTCAAACGACCGCTCTTTCT\n+ATAAAACACGGACGGAATTATCATTAGACGCGGCGGTAAAATCAGAGGTGCGAGAGCACT\n+TAGTTAGTGCTCCGGTCGCTAAATTGATTGACCCTCAGTCTAATCGAATCTATCAGAAGT\n+ACTTTATTAGAGAAAGGAATGAAGCAATGTACTATGCTCAACAGTACTTATTAAGCTTTG\n+TCCCAGCATTGATCCAACAACTGAGCAAAACCAACTTTGATGAGGAATGGTTACGATTTT\n+TAACCACATCTTCACCTGGAGTCAAATTACCTCAAGAAACGCTAGACAGCCTGAGTAAAA\n+CATCTGCAGTATTATCGAAATCAAGACGAGGTTTGGAAGCGCTTGAAGCATCTGAATATA\n+GAAGCATCAATCGTGTTGAACGAGCGTTAGAGATGGTACTCAAATTAGTTCAAAGACAAC\n+AAAATGATAGAAGACAACGAGCGATAGCAGGCGAACCAAATTCCATTCTATTACTGACCC\n+TTGTTTATTATGTTATCTTATCGG
CTATGTACGCCATGTCGACAGATGCAGCTCAAGGTA\n+AACAGGTTGGTAATTCAATGGACCTTCAAGACTTGTTATTCGCGACAACTCAGACGGACA\n+CGCTTGTGTCATCAATTGATATTGTAGGTATGGATGCTTCTGTGCAGTCAATAACTACTG\n+AGTTGTCAAATATTATCTGTCTTGAAGTGACGCGTGGTTTACCTGAATCACAAATTGGAC\n+CATTTACAGGCGGTATGAAGCGTCTTCTGCAACTAAGTGATGAACCTGGTGGAGCGTGGA\n+AGCAGGTTGAGATGTATGTATCAGGTACACTTGAGGCCGTGGTATTCGAAGGTAGTCATG\n+CACTAACATCAACTACTTACGAGAGTAAGATTTTTGGAAGTGTTAAGAACTATGCGGGTA\n+CGTATCCCTCAGGTAGAGCTGACACGTCGTCACATCACACTAAGGTTTTGGAAGGTGCGA\n+CCCGTGGTAATGAAATGCGAAGAAGAACGGATGAGCGAATCGTGCACCATGCGTCGACGA\n+TTGTAATGTCACGTAATATGGGTGATGATAAGTCAGACGTATACACAGGATCATTTCCAA\n+ATGTTATATCACAATTAGTGAGCGATAAAGATGTACTCGCACAATTGGGTTTTAAGACAG\n+ATGCAGATCTCTCGAGTCACAACGGAGAATTCTTGCAACAACATGTATGTAGAGGAAGGC\n+TAGTCGGAAAACCATCACGTATATCAATAGGCACAGTAGAGCATCGTAAAGAGAAGGTTC\n+GGATGCATGAAGCATGTCAAGAACTTCTATCTATTATGGATGACCTAATTGTGCGTATTA\n+GAGATACCGAGGGCTTGAAGATGATGATCTTCTCGTTTGCTATACATTGCATTAATAGTA\n+TTGTATTAAACATTGCGAAAGTTGATCTTGCCGCTATAATATCGAAATTGACTTCAAATA\n+ATTTGCGTACATATGTATATCCTACGAAAGATGAACATGCTTTTCAGCTCGTTAGATTGT\n+ATTTTCCATTGATGTGGTTCTTTATGCATAAAGGTGGTGAATTACCAGCTTATCCAATTG\n+AACGGGTTGATGGTACTTATACAGATGACGAGTCGGTGTACACTGTGCGAGGTGAATACA\n+AACGAAGATTGATGTTTGATATTATAGGTATTGATAAAATTGAGAAATTTGGTGACGCCA\n+TTTTCAGAAATAATCACTGCTTTGATATCGGTTTGAACGCTGCTGATGCCATCATTAAGC\n+TGAAGATAACGGATCTACCGAAGGAAATGAGAAGTGAAACGCTCGAGCATGGTATCATAT\n+CAAATCTAGCGAAAAATTTAGAGTCATTCGGCAATGCTATGTCTAAGGAAGCTTCACTTC\n+AAGCGAAACTCAGGATTGAAAATGAACTTGCAGGTGTTAGGAGCGTAACTCAGACAAATG\n+AAGTTGTCGTTGGAAGAGGAAAGATAGCAAAAGTCCCAAAAAGTATTGTATACGCACATC\n+GAACTGAAGCACAACTTGAACAGATATTAATGACAAGAGAGTCGGATAATGAAGAGCGAC\n+CAATGATATCAAAGCGAATGCTTGATCACATCGCTTCACTATCGTTTCATCATGTTGTTA\n+ATGTCAAGACAACGGATAAGTTACACTTGTATTACTTCTATCCTAGTGGCGATGCCCTAG\n+TTTACGGTAATCATGCAAAATACACTGAACATTTCGAATTAGCTCCACCTATGTGGTATT\n+TGTCACCTTCATGGCGTTTATATGGCCTATTAGGTACAGCGTCACAGACACGTGGTGACT\n+TACTTCGACAAATTAATTGGCTAAAAGGTAAATATGGAACGTTTAAGCTTGATGACGAGA\n+AGATCCGTTATGGATATGATGTTATCTGGCGAAAGAACAGACATCTGCTTAATGACTACA\n+TGACAATG
ATCGGAGCATCACCACATCTTGAAAACTTGCTTAAGAGCATCTTTCGTTTGA\n+TGGATAGATGGGGTACTTATCGTTATGATTACATTCAAACACCGAGGAATATTTTCTTTA\n+TCTCAGACAAT\n'
b
diff -r e3aee4ba49c6 -r ea8fde9c6f82 test-data/output_without.fa
--- /dev/null Thu Jan 01 00:00:00 1970 +0000
+++ b/test-data/output_without.fa Wed Oct 09 18:48:17 2019 -0400
b
b'@@ -0,0 +1,2310 @@\n+>gi|157065140|gb|ABV04399.1|_p3__Heliothis_armigera_cypovirus_5--Locus_27_Transcript_6/7_Confidence_0.333_Length_1626_hit1_IdMatch=24.9,AligLength=494,E-val=2e-33\n+CTCCTCGCTCATGTCAAGAACTTCTATCTATTATGGATGACCTAATTGTGCGTATTAGAG\n+ATACCGAGGGCTTGAAGATGATGATCTTCTCGTTTGCTATACATTGCATTAATAGTATTG\n+TATTAAACATTGCGAAAGTTGATCTTGCCGCTATAATATCGAAATTGACTTCAAATAATT\n+TGCGTACATATGTATATCCTACGAAAGATGAACATGCTTTTCAGCTCGTTAGATTGTATT\n+TTCCATTGATGTGGTTCTTTATGCATAAAGGTGGTGAATTACCAGCTTATCCAATTGAAC\n+GGGTTGATGGTACTTATACAGATGACGAGTCGGTGTACACTGTGCGAGGTGAATACAAAC\n+GAAGATTGATGTTTGATATTATAGGTATTGATAAAATTGAGAAATTTGGTGACGCCATTT\n+TCAGAAATAATCACTGCTTTGATATCGGTTTGAACGCTGCTGATGCCATCATTAAGCTGA\n+AGATAACGGATCTACCGAAGGAAATGAGAAGTGAAACGCTCGAGCATGGTATCATATCAA\n+ATCTAGCGAAAAATTTAGAGTCATTCGGCAATGCTATGTCTAAGGAAGCTTCACTTCAAG\n+CGAAACTCAGGATTGAAAATGAACTTGCAGGTGTTAGGAGCGTAACTCAGACAAATGAAG\n+TTGTCGTTGGAAGAGGAAAGATAGCAAAAGTCCCAAAAAGTATTGTATACGCACATCGAA\n+CTGAAGCACAACTTGAACAGATATTAATGACAAGAGAGTCGGATAATGAAGAGCGACCAA\n+TGATATCAAAGCGAATGCTTGATCACATCGCTTCACTATCGTTTCATCATGTTGTTAATG\n+TCAAGACAACGGATAAGTTACACTTGTATTACTTCTATCCTAGTGGCGATGCCCTAGTTT\n+ACGGTAATCATGCAAAATACACTGAACATTTCGAATTAGCTCCACCTATGTGGTATTTGT\n+CACCTTCATGGCGTTTATATGGCCTATTAGGTACAGCGTCACAGACACGTGGTGACTTAC\n+TTCGACAAATTAATTGGCTAAAAGGTAAATATGGAACGTTTAAGCTTGATGACGAGAAGA\n+TCCGTTATGGATATGATGTTATCTGGCGAAAGAACAGACATCTGCTTAATGACTACATGA\n+CAATGATCGGAGCATCACCACATCTTGAAAACTTGCTTAAGAGCATCTTTCGTTTGATGG\n+ATAGATGGGGTACTTATCGTTATGATTACATTCAAACACCGAGGAATATTTTCTTTATCT\n+CAGACAATCCATTAGTCGCTGAACAGAACATTATCTTCGCTGCAGATGGTGACGAGATAA\n+CTAGGCCCTTACAGGTAATTGTCGGCTATCTACATATACTTGCGCATATTAATACGATTT\n+TTACACGACCACAAGTAAAGTTAACTGAGCATCTTATTGAATATATGCATCAGCGAGCTG\n+TACATACAGGAAGGTCG\n+>gi|584614105|gb|AHJ14783.1|_VP3__Orgyia_pseudotsugata_cypovirus_5--Locus_27_Transcript_1/7_Confidence_0.444_Length_3872_hit1_IdMatch=28.76,AligLength=1217,E-val=4e-139\n+GTGGTATAGCTCTCAGCGCTACGGTTATAGTACCTCAGAGTATTTTGAAGCCACCACCTT\n+TCAACGAGAAAGACTGGCCTTTGAATGAAGACGAGAGTATGTTCAG
TGCCTCGCGCAAGT\n+ATAATTACATGATAAATACTAGTACGTTGAGCCTTTATGGTTCGAGGGAAAGTTTAGTCG\n+GTAAAGCAATATACGGTTTATATACTGATGAGCAATCACAGTCACGCTTCAGGACAGTAT\n+GGCATCAAATAATGGCAAGTGTCTACGCACTAGACGATTATCTAGGTCATACTAACCATC\n+CAGTTCGTGCAGTGTTGGCACAGTTAAACTTAGACAAAGGATTACCATTCAAGGAAACTG\n+CTGAAGGTATTGACTTAACAGAGGCGGTTGAAAAAGGAATTGATTCGAGTACATTACTAC\n+CATCAATATTATATATGTTGATCTCAGTATCGTGCGATATCTGTTTCGGAATTTCAACTG\n+AAGTTGAAGGTGCCTTTACGATCAATCATTATCTTAATCTAGCACAGCATGATTACGCGG\n+ATGAGAAGTTACGAATTAAGTCGGCATGTCGTAATTGGTTTGCACAAGCATTGAGTAAAC\n+TAGACGTCATAGCTTACCCAGTTTATAACAATCAGCTCGAGATCATCGACCTAAAGTATG\n+TACATGGTAAAGAGCCAAAGTATGTAAGCACATTACATGAAAAAGTTGCCGAATCACGTC\n+AACGTAAGCTGTCAAAATACCCATACTTACTGGAATATATTGATAGGTCACGTAAAGCGA\n+AAACGGTGGAGGAATTAATCCATAGACTTTTAGTGATGAATGCACTTTCAAACGACCGCT\n+CTTTCTATAAAACACGGACGGAATTATCATTAGACGCGGCGGTAAAATCAGAGGTGCGAG\n+AGCACTTAGTTAGTGCTCCGGTCGCTAAATTGATTGACCCTCAGTCTAATCGAATCTATC\n+AGAAGTACTTTATTAGAGAAAGGAATGAAGCAATGTACTATGCTCAACAGTACTTATTAA\n+GCTTTGTCCCAGCATTGATCCAACAACTGAGCAAAACCAACTTTGATGAGGAATGGTTAC\n+GATTTTTAACCACATCTTCACCTGGAGTCAAATTACCTCAAGAAACGCTAGACAGCCTGA\n+GTAAAACATCTGCAGTATTATCGAAATCAAGACGAGGTTTGGAAGCGCTTGAAGCATCTG\n+AATATAGAAGCATCAATCGTGTTGAACGAGCGTTAGAGATGGTACTCAAATTAGTTCAAA\n+GACAACAAAATGATAGAAGACAACGAGCGATAGCAGGCGAACCAAATTCCATTCTATTAC\n+TGACCCTTGTTTATTATGTTATCTTATCGGCTATGTACGCCATGTCGACAGATGCAGCTC\n+AAGGTAAACAGGTTGGTAATTCAATGGACCTTCAAGACTTGTTATTCGCGACAACTCAGA\n+CGGACACGCTTGTGTCATCAATTGATATTGTAGGTATGGATGCTTCTGTGCAGTCAATAA\n+CTACTGAGTTGTCAAATATTATCTGTCTTGAAGTGACGCGTGGTTTACCTGAATCACAAA\n+TTGGACCATTTACAGGCGGTATGAAGCGTCTTCTGCAACTAAGTGATGAACCTGGTGGAG\n+CGTGGAAGCAGGTTGAGATGTATGTATCAGGTACACTTGAGGCCGTGGTATTCGAAGGTA\n+GTCATGCACTAACATCAACTACTTACGAGAGTAAGATTTTTGGAAGTGTTAAGAACTATG\n+CGGGTACGTATCCCTCAGGTAGAGCTGACACGTCGTCACATCACACTAAGGTTTTGGAAG\n+GTGCGACCCGTGGTAATGAAATGCGAAGAAGAACGGATGAGCGAATCGTGCACCATGCGT\n+CGACGATTGTAATGTCACGTAATATGGGTGATGATAAGTCAGACGTATACACAGGATCAT\n+TTCCAAATGTTATATCACAATTAGTGAGCGATAAAGATGTACTCGCACAATTGGGTTTTA\n+AGACAGATGCAGATCTCTCGAGTCACAACG
GAGAATTCTTGCAACAACATGTATGTAGAG\n+GAAGGCTAGTCGGAAAACCATCACGTATAT'..b'CCAAAAAGTATTGTATACGCACATCGAA\n+CTGAAGCACAACTTGAACAGATATTAATGACAAGAGAGTCGGATAATGAAGAGCGACCAA\n+TGATATCAAAGCGAATGCTTGATCACATCGCTTCACTATCGTTTCATCATGTTGTTAATG\n+TCAAGACAACGGATAAGTTACACTTGTATTACTTCTATCCTAGTGGCGATGCCCTAGTTT\n+ACGGTAATCATGCAAAATACACTGAACATTTCGAATTAGCTCCACCTATGTGGTATTTGT\n+CACCTTCATGGCGTTTATATGGCCTATTAGGTACAGCGTCACAGACACGTGGTGACTTAC\n+TTCGACAAATTAATTGGCTAAAAGGTAAATATGGAACGTTTAAGCTTGATGACGAGAAGA\n+TCCGTTATGGATATGATGTTATCTGGCGAAAGAACAGACATCTGCTTAATGACTACATGA\n+CAATGATCGGAGCATCACCACATCTTGAAAACTTGCTTAAGAGCATCTTTCGTTTGATGG\n+ATAGATGGGGTACTTATCGTTATGATTACATTCAAACACCGAGGAATATTTTCTTTATCT\n+CAGACAATCCATTAGTCGCTGAACAGAACATTATCTTCGCTGCAGATGGTGACGAGATAA\n+CTAGGCCCTTACAGGTAATTGTCGGCTATCTACATATACTTGCGCATATTAATACGATTT\n+TTACACGACCACAAGTAAAGTTAACTGAGCATCTTATTGAATATATGCATCAGCGAGCTG\n+TACATACAGGAAGGTCG\n+>gi|798547250|gb|AKA63263.1|_nonstructural_polyprotein__Cricket_paralysis_virus--Locus_63_Transcript_2/2_Confidence_0.333_Length_343_hit1_IdMatch=53.45,AligLength=116,E-val=4e-32\n+ACACAGTCCACAGTCCGAAGACCAAAGCGTTGGATAGGACACGAATACACAGATGAAACG\n+AAAACAGGCGAGGCTGCGCCCTATCGGACATTGGAAGAAGTCCGTTTCCTTAAAAGAGGG\n+TTCAGAATGGATCACCTCTTGTGTCGGTGGGTAGCTCCTTTGAAGAAGGATGTCATCTAC\n+GAAATGCTTAATTGGACGCGCAAAGGGATTAACCCAGATGATGTGACGATGATGATCATT\n+GATACAGCATTTAGGGAGATCTCTTATCACGGAAGGGAAGCTTTCGAGAAGCTGCGAGGG\n+CAGATACTTGAGCAGCGGGATGTGTTGGTTGAATATCCTCAA\n+>gi|798547250|gb|AKA63263.1|_nonstructural_polyprotein__Cricket_paralysis_virus--Locus_63_Transcript_1/2_Confidence_0.333_Length_1607_hit1_IdMatch=54.29,AligLength=536,E-val=0.0\n+CTAGAATCACAGCTCAGATGAGTTTTGAGGCACCGAAGGACGCAATTGAAGGACCGTGTC\n+AAACCCCGGAAGGATTGTTCGCCCCTATTGGCAAAGCGCCGATAGGCGTAGGGATGTCCA\n+CCAAGACGGCTATACGACCTTCACGCTTGTATGGAAGAATAACTAAACCGACAACTGCAC\n+CATCATACTTGGGTAAAGACGCGCTTTATCGTGGATTGACCAAGTGTGGTGTTCGCACAG\n+TTAATATTCAACCAGAATACATAGACGCAGCGGCGAATGACGTCGCACGCTATGTGTTAA\n+ACCAGCATGTTGGTCACGTGGATAGGGAACGATACACACGTATATTGTCGTACGAGGAGG\n+CTGTTAAGGGCGTGCCGTACGATGAT
TTCATGAAGTCAGTGACTCGAGTCACTTCCCCTG\n+GTTACCCCTATTGCTTGGATACTGGAAACATGCCAGGGAAAAGCAAATGGATGGGGCTCG\n+AACAAGATTTCGATATGACAAGTCCAGCTGCTTTGGCTTTGAGGAAAGATGTTGAAAGTT\n+TGTTGGAAGATTGCAAAAATGGCTTAGTCCGTGATGTGGTGTTTGTCGACACTCTCAAGG\n+ATGAAAGGCGCGAGCTGATAAAGGTGGAAGCAAAGAAGACTCGAGTCTTTTCTGCTGGAC\n+CACAGCATTTTGTAATAGCTTTCCGGCAATACTTTCTTCCATTCTCTGCCTGGGTCATGC\n+ATAACAGAATCGAAAACGAAGTAGCCGTTGGAACAAACCCCTTCTCAATGGATTGGCACA\n+ACATTGCTGTGCGTATGCGTAGTAAAGGGAGACACATTATTGCTGGAGATTTTAGCAATT\n+TTGATGGATCCCTCAACGCCCAAGTTCTCTGGACAATATTTTGGAAGATATTTGTCCCGT\n+GGCTTAATGATATTGAACCACTTGGTACACCCAAGAATGAGGAGAATCTGCGGGTCTGCA\n+CGAGTCTATGGACGCACTTGGTGCACTCCGTGCACATTTGTGGAGATAACTTGTACATGT\n+GGACACATTCTCAACCATCGGGCAATCCCTTCACGGTGATAATCAATAGTTTGTATAACT\n+CAGTTATCATGCGTGTCGTGTGGCAATACATAATGGCGAAAGAAGAACCTAAGTTACGCA\n+CAATGAACCATTTCAATCAACATGTTGCTATGGTTTCATATGGTGATGACAATCTACTTA\n+ACATCTCGGAAGGGGTAATTGATATCTTCAACCAACTTACCATCTCGGAAGCCATGCGTT\n+GGATAGGACACGAATACACAGATGAAACGAAAACAGGCGAGGCTGCGCCCTATCGGACAT\n+TGGAAGAAGTCCGTTTCCTTAAAAGAGGGTTCAGAATGGATCACCTCTTGTGTCGGTGGG\n+TAGCTCCTTTGAAGAAGGATGTCATCTACGAAATGCTTAATTGGACGCGCAAAGGGATTA\n+ACCCAGATGATGTGACGATGATGATCATTGATACAGCATTTAGGGAGATCTCTTATCACG\n+GAAGGGAAGCTTTCGAGAAGCTGCGAGGGCAGATACTTGAGCAGCGGGATGTGTTGGTTG\n+AATATCCTCAA\n+>gi|2388673|gb|AAC58807.1|_replicase_polyprotein__Drosophila_C_virus--Locus_50_Transcript_1/1_Confidence_0.000_Length_1442_hit1_IdMatch=35.5,AligLength=231,E-val=2e-37\n+AACACGTATCGAATGTGTATCAAGAGGGATCCTGATGATTTGGTCGTTGGAAACGCTGTG\n+TTTATCACAGGGTGGACGCTCCTCATACCGTACCACTTCGTTTGTGGACTGGCGGGACGG\n+AGAATAGCTGCTGATTCCATCGTGACTTTGTCAAAGCCAGGCTTGGATAAGATTATTGAA\n+TTCCCGTTGTCACGAATCTTCCGATACGATACCTCACCAGATGGTTTTACCACTAGTGAG\n+TATTGTGCTCGAATGGAACATGAAGATGGAGAATTGGTTGATGCCATCCTGGTAAACCTG\n+CATGGTTTGGGAGTGCGAATCCATCCTGACCTCCGGGGAAAAATTGTGACGGTACGAGAC\n+CAAGCGCACCTGAGTACGACATTTCATGCGATTCTCACAACGATGTCCAGGAAGCCACCA\n+CTAACAACGTCACAACAAGTGGTAAAAGGGGTCAAGCCAATGGATAAAATCCTGCACATC\n+AATTTACCAGTTGGGGACAAAACAACGCAATACACCCAACGTGACTGTTACAAGTATTAT\n+TCCGTAACGGTCGTT
GGAGATTGTGGTGCCTTGCTGGTAGCACAAAATCATGCAATTGTG\n+AGGAAAATATTTGCAATGCATATAGCAGGTGCGGAAGAAAATGGCTATGCTTGTCCAATC\n+AATCAGGAAATGTTAG\n'
b
diff -r e3aee4ba49c6 -r ea8fde9c6f82 test-data/termlist.txt
--- /dev/null Thu Jan 01 00:00:00 1970 +0000
+++ b/test-data/termlist.txt Wed Oct 09 18:48:17 2019 -0400
b
@@ -0,0 +1,3 @@
+Locus_65_
+Locus_63_
+Pro--Locus_50