Repository 'blast_to_scaffold'
hg clone https://toolshed.g2.bx.psu.edu/repos/artbio/blast_to_scaffold

Changeset 0:7d96b28eec49 (2017-10-15)
Next changeset 1:be61d0d0d622 (2021-03-10)
Commit message:
planemo upload for repository https://github.com/ARTbio/tools-artbio/tree/master/tools/blast_to_scaffold commit 48a4098045106f363e92357949b32617a2e868c1
added:
blast_to_scaffold.py
blast_to_scaffold.xml
test-data/assembly.fa
test-data/blast.tab
test-data/contigs.fa
test-data/guideSequence.fa
b
diff -r 000000000000 -r 7d96b28eec49 blast_to_scaffold.py
--- /dev/null Thu Jan 01 00:00:00 1970 +0000
+++ b/blast_to_scaffold.py Sun Oct 15 12:52:40 2017 -0400
[
@@ -0,0 +1,140 @@
+#!/usr/bin/env python
+import argparse
+
+
+def insert_newlines(string, every=60):
+    '''
+    Wrap a string into fixed-width lines.
+
+    The string is cut into consecutive pieces of `every` characters (the
+    last piece may be shorter) and the pieces are joined with newlines.
+    No trailing newline is appended; an empty string gives an empty string.
+    '''
+    pieces = (string[start:start + every]
+              for start in range(0, len(string), every))
+    return '\n'.join(pieces)
+
+
+def getseq(fastadict, transcript, up, down, orientation="direct"):
+    '''
+    Extract a sub-sequence from a dictionary of sequences.
+
+    fastadict: dictionary mapping sequence names to sequence strings
+    transcript: name (key of fastadict) of the sequence to cut
+    up, down: 1-based, inclusive start and end coordinates of the slice
+    orientation: "direct" returns the slice unchanged; any other value
+                 returns its reverse complement
+
+    The reverse complement accepts upper and lower case nucleotides as
+    well as IUPAC ambiguity codes, and preserves the letter case.
+    A KeyError is raised for an unknown sequence name or for a character
+    which is not a nucleotide code.
+    '''
+    def reverse(seq):
+        # each base at index i is complemented by the letter at index i
+        bases = "ACGTURYSWKMBDHVN"
+        pairs = "TGCAAYRSWMKVHDBN"
+        revdict = dict(zip(bases + bases.lower(), pairs + pairs.lower()))
+        return "".join(revdict[i] for i in reversed(seq))
+    # blast coordinates are 1-based and inclusive, python slices are not
+    pickseq = fastadict[transcript][up-1:down]
+    if orientation == "direct":
+        return pickseq
+    return reverse(pickseq)
+
+
+def Parser(argv=None):
+    '''
+    Build the command line parser and parse the arguments.
+
+    argv: optional list of argument strings; when None (the default)
+          argparse reads the arguments from the command line
+
+    Returns the argparse namespace with the attributes sequences,
+    guideSequence, blast_tab, output, scaffold_prefix and scaffold_suffix.
+    The four file arguments are required, so that a missing one is
+    reported as a usage error instead of failing later when the file is
+    opened. The two scaffold header arguments stay optional.
+    '''
+    the_parser = argparse.ArgumentParser(
+        description="Generate DNA scaffold from blastn or tblastx "
+                    "alignment of Contigs")
+    the_parser.add_argument('--sequences', action="store", type=str,
+                            required=True,
+                            help="input sequence file in fasta format")
+    the_parser.add_argument('--guideSequence', action="store", type=str,
+                            required=True,
+                            help="the reference sequence to guide the "
+                                 "scaffold assembly in fasta format")
+    the_parser.add_argument('--blast-tab', dest="blast_tab", action="store",
+                            type=str, required=True,
+                            help="13-columns tabular blastn or tblastx output")
+    the_parser.add_argument('--output', action="store", type=str,
+                            required=True,
+                            help="output file path, fasta format")
+    the_parser.add_argument('--scaffold_prefix', action="store", type=str,
+                            help="the prefix that will be used for the "
+                                 "header of the fasta scaffold")
+    the_parser.add_argument('--scaffold_suffix', action="store", type=str,
+                            help="the suffix that will be used for the "
+                                 "header of the fasta scaffold")
+    return the_parser.parse_args(argv)
+
+
+def blatnInfo(file):
+    '''
+    Parse a tabular blast output file.
+
+    Each alignment is returned as a list of strings
+    [query name, query start, query stop, subject start, subject stop],
+    taken from columns 1 and 7 to 10 of the blast table. Empty lines and
+    comment lines starting with "#" are skipped; a line with less than
+    10 columns raises a ValueError.
+
+    The alignments are sorted on subject start in descending order. The
+    coordinates are still strings at that point, so the comparison is
+    lexicographic ("5" sorts after "30"), not numeric.
+    '''
+    blastlist = []
+    with open(file, "r") as f:
+        for number, line in enumerate(f, 1):
+            fields = line.split()
+            if not fields or fields[0].startswith("#"):
+                continue
+            if len(fields) < 10:
+                raise ValueError(
+                    "line %d of %s: expected at least 10 columns, found %d"
+                    % (number, file, len(fields)))
+            blastlist.append([fields[0]] + fields[6:10])
+    # NOTE(review): updateGuide applies the alignments in this order and
+    # later ones overwrite earlier ones, so switching to a numeric sort
+    # would change the assembly - confirm before changing the key.
+    blastlist.sort(key=lambda x: x[3], reverse=True)
+    return blastlist
+
+
+def myContigs(file):
+    '''
+    Read a fasta file into a dictionary.
+
+    Keys are the complete header lines without the leading ">", values
+    are the sequences with their lines joined together. When a header
+    occurs several times, the last record is kept.
+
+    Only the end-of-line characters are removed from each line, so that a
+    file without a final newline does not lose its last nucleotide and
+    files with Windows line endings do not keep a carriage return.
+    A ValueError is raised if sequence data precede the first header.
+    '''
+    pieces = {}
+    header = None
+    with open(file, "r") as f:
+        for line in f:
+            line = line.rstrip("\r\n")
+            if line.startswith(">"):
+                header = line[1:]
+                pieces[header] = []
+            elif header is not None:
+                pieces[header].append(line)
+            elif line.strip():
+                raise ValueError(
+                    "%s: sequence data found before the first fasta header"
+                    % file)
+    # join once per record rather than growing a string line by line
+    return dict((name, "".join(lines)) for name, lines in pieces.items())
+
+
+def myGuide(file):
+    '''
+    Read the guide fasta file into a coordinate dictionary.
+
+    Returns a dictionary mapping each 1-based position to the nucleotide
+    found at that position, converted to lower case. Header lines are
+    skipped and the numbering is not reset between records, so a file
+    with several records is read as one continuous sequence.
+
+    Only the end-of-line characters are removed from each line, so that a
+    file without a final newline does not lose its last nucleotide.
+    '''
+    Guide = {}
+    coordinate = 0
+    with open(file, "r") as f:
+        for line in f:
+            if line.startswith(">"):
+                continue
+            for nucleotide in line.rstrip("\r\n"):
+                coordinate += 1
+                Guide[coordinate] = nucleotide.lower()
+    return Guide
+
+
+def updateGuide(blastlist, GuideDict, ContigsDict):
+    '''
+    Patch the guide, in place, with the aligned parts of the contigs.
+
+    blastlist is a list of alignments, each one being a list with
+    element [0] : name of the blasted Contig
+    element [1] : queryStart of the alignment to the reference
+    element [2] : queryStop of the alignment to the reference
+    element [3] : subjectStart of the alignment to the reference
+    element [4] : subjectStop of the alignment to the reference
+
+    For every alignment, the guide positions covered by the subject
+    interval are removed and the aligned contig slice is written from the
+    lowest subject coordinate onwards. When subjectStart is greater than
+    subjectStop the contig slice is reverse complemented first.
+    Alignments are applied in list order, later ones overwrite earlier
+    ones. Nothing is returned.
+    '''
+    for hit in blastlist:
+        contig_name = hit[0]
+        query_from = int(hit[1])
+        query_to = int(hit[2])
+        subject_from = int(hit[3])
+        subject_to = int(hit[4])
+        strand = "direct"
+        if subject_from > subject_to:
+            # minus strand hit: put the subject interval in ascending order
+            subject_from, subject_to = subject_to, subject_from
+            strand = "reverse"
+        replacement = getseq(ContigsDict, contig_name, query_from, query_to,
+                             strand)
+        for position in range(subject_from, subject_to + 1):
+            # positions already missing from the guide are simply ignored
+            GuideDict.pop(position, None)
+        for offset, base in enumerate(replacement):
+            GuideDict[subject_from + offset] = base
+
+def finalAssembly(GuideDict, outputfile, prefix, suffix):
+    '''
+    Write the scaffold to a fasta file.
+
+    GuideDict: dictionary mapping positions to nucleotides; the sequence
+               is rebuilt by reading the positions in ascending order
+    outputfile: path of the fasta file to write
+    prefix, suffix: inserted in the fasta header, which reads
+                    ">Scaffold_from_<prefix>_guided_by_<suffix>"
+
+    The sequence is wrapped by insert_newlines before being written. The
+    file is opened in a with block so that it is closed even if a write
+    fails.
+    '''
+    finalSequence = insert_newlines(
+        "".join(GuideDict[key] for key in sorted(GuideDict)))
+    with open(outputfile, "w") as Out:
+        Out.write(">Scaffold_from_%s_guided_by_%s\n" % (prefix, suffix))
+        Out.write("%s\n" % finalSequence)
+
+
+def __main__():
+    '''
+    Run the scaffolding from the command line arguments: load the
+    contigs, the guide sequence and the blast alignments, patch the guide
+    with the aligned contigs and write the resulting scaffold.
+    '''
+    options = Parser()
+    contigs = myContigs(options.sequences)
+    guide = myGuide(options.guideSequence)
+    alignments = blatnInfo(options.blast_tab)
+    updateGuide(alignments, guide, contigs)
+    finalAssembly(guide, options.output, options.scaffold_prefix,
+                  options.scaffold_suffix)
+
+
+if __name__ == "__main__":
+    __main__()
b
diff -r 000000000000 -r 7d96b28eec49 blast_to_scaffold.xml
--- /dev/null Thu Jan 01 00:00:00 1970 +0000
+++ b/blast_to_scaffold.xml Sun Oct 15 12:52:40 2017 -0400
b
@@ -0,0 +1,49 @@
+<tool id="blast2scaffold" name="blast_to_scaffold" version="1.0.0">
+<description>Generate DNA scaffold from blastn or tblastx alignment of Contigs</description>
+<requirements>
+</requirements>
+<!-- the scaffold header is built from the history names of the two fasta inputs -->
+<command interpreter="python">
+        blast_to_scaffold.py --sequences "$sequences"
+                             --guideSequence "$guideSequence"
+                             --blast-tab "$blast_tab"
+                             --output "$output"
+                             --scaffold_prefix "$sequences.element_identifier"
+                             --scaffold_suffix "$guideSequence.element_identifier"
+</command>
+<inputs>
+<param name="sequences" type="data" format="fasta" label="Select a fasta contigs file"/>
+<param name="guideSequence" type="data" format="fasta" label="Select the fasta guide sequence for scaffolding"/>
+<param name="blast_tab"  type="data" format="tabular" label="Select a blastn or tblastx output from your history" help="must have 13 columns with column 13 containing the subject length, other columns are standard"/>
+
+</inputs>
+<outputs>
+ <data format="fasta" name="output"/>
+</outputs>
+
+
+<tests>
+  <test>
+    <param name="sequences" value="contigs.fa" ftype="fasta"/>
+    <param name="blast_tab" value="blast.tab" ftype="tabular"/>
+    <!-- the guide is a fasta file, matching the format of the guideSequence input -->
+    <param name="guideSequence" value="guideSequence.fa" ftype="fasta"/>
+    <output name="output" file="assembly.fa" ftype="fasta"/>
+  </test>
+</tests>
+
+
+<help>
+
+
+**What it Does**
+This tool starts from DNA contigs that aligned to a subject DNA sequence through blastn or tblastx.
+The contigs must be provided in fasta format. The blastn or tblastx output must be tabular, the 12 standard columns plus column 13 with the length of the blastn or tblastx subject.
+The sequence used to BLAST (blastn or tblastx) the contigs must be provided to serve as a guide to the final assembly.
+The final assembly is a DNA sequence.
+Nucleotides of the guide sequence which were not covered by contigs are in small letters in the output assembly.
+
+
+**Attribution**
+This Galaxy tool was created by drosofff@gmail.com on 5/01/2016
+</help>
+
+</tool>
b
diff -r 000000000000 -r 7d96b28eec49 test-data/assembly.fa
--- /dev/null Thu Jan 01 00:00:00 1970 +0000
+++ b/test-data/assembly.fa Sun Oct 15 12:52:40 2017 -0400
b
b'@@ -0,0 +1,207 @@\n+>Scaffold_from_contigs.fa_guided_by_guideSequence.fa\n+gcaaaaaggcccctgggGGGGGGTTAATGAGTACTGGAAAAAGAAGCGCGAGATACCACT\n+TCGCTGATTATGCTGATTCTGGTATTAAGGATTAGTAGAGTATCGGAAGTGCCGAAGGGA\n+ATAATGCTGGTCCGTTGTAAACAGGATACTTATGAGACCTCTTAACAGAAACTTTGAGCA\n+AACAACAAATAAACGAACAAAAAGAGTTATACATTGAACTTGAAAAAAATCAATGTCTTT\n+TATTTAGACTGATTTATATTGGTCTTTATAATCGTAAGGAATAATTCTCATCTAATGATA\n+TCGATGTAAAATGTATCATTCTAGCTATTCAATTATATTAATTGAGCTTAGCATCTGATT\n+AAATTTATTATAAAATAATATTTAATCCCCATCTTTGCAAGATGGAAACTCTCAATAAAT\n+CAGGAGTATAATAGATTTAAACCCTCACACTGAATCACGAGTATAAACAGATTCAAATAT\n+GATTAACAATCAAACAAACAAAAAGGGACCACAACTAGAGAGAGTACATTTTGGTAGTGC\n+GCAGGTTGTGGGAAAAAGTACCAAACGACGACAACGCGGAACCAAATTTGACATTGAATA\n+TACTGTTAAAAGGAACGATGCACCAAAAGAGCAGAAATTCTTAGTTTCAGAAATTTTTGA\n+TGAAAAGTTGGATAAACAAATAAAATATGAGAAGAAGCAAAATCATACTTTTATTAAACC\n+GAAATTAAATTTAGTTACTAGAGAAGAACAACACGTGACTAAGAAGGTTTTAAGAGGTAA\n+AGAACGAGCTGCAACTCATGCTTTTATGAAGGAAATGGTTGAATCTAACAAGATACAACC\n+TAGTTGGAATGTCGAATACGAAAAAGAAATAGATGAGGTTGATCTATTTTTTATGAAGAA\n+GAAAACCAAACCTTTCTCAGGTTTTTCTATTAAGGAATTAAGAGATAGTCTAATTGTGCA\n+GTCAGACGATAAAAACATGGCACAGCCAACCGTGATGAGTTCAACCAATGAAATTGTTAC\n+ACCCCGTGAGGAGATAAGCGTTTCTGCTATCTCTGAACAACTGGCATCCTTGATGGAGAG\n+AGTTGATAAACTCGAGAAGATGAATGCTGCTTTGGAGGAAGAAAACAAGCAGCTAAAGAA\n+AGAGAGAGAGGCGACTATTAAGTCAGTTAAGAAAGAGGCAAAGAGGACTAAACAAGAGAA\n+GCCTCAGATTGCGAAGAAAACGCAACACAAGAGTTTAGGAGTAAATCTTAAAATCACCAA\n+GACCAAAGTAGTTGGTCAGGAACAATGTTTGGAAATTGAAAATACTCAGCATAAGAAATT\n+TGTTGAGAAGCCAAGCATGCCATCCAAAGTGAGCAAGAAGATGAAGGGACAACAGTTGAA\n+AAAGACTATTCGTACTTGGTATGAATTTGATCCCTCTAAACTCGTTCAGCATCAAAAAGA\n+AGTGTTGAACAGTGTTGTTACCAACACAACCTTCGCAGATAAAGTCCGTGAAACTGGTAT\n+ACCTAAACAAAAGATTAGGTATACTGCAAAACCACCAGCAGAGGAGAAGAGGAGTATCCA\n+TTTCTATGGTTATAAGCCAAAAGGAATCCCTAACAAAGTTTGGTGGAATTGGGTCACCAC\n+TGGCACAGCTATGGACGCTTATGAAAAAGCTGACCATTATCTGTATCACCAATTTAAACG\n+AGAAATGATGGTATACAGAAATAAATGGGTCAAGTTTAGTAAGGAGTTCAATCCGTACCT\n+ATCGGAACCGAAAATGGTATGGGAAGAGAATACATGGGAATATGAATATAAAACAGACGT\n+TCCCTACAATTTTATTCTCAAATGGCGCCAGTT
AGTGCAGACCTACAAGCCTAACACACC\n+AATCCAGGCTGATTGGTACAAAATCTCGCAGAAACAACAATGTTAATTGAAGTTTTCATT\n+AATTCTTTGTTGCAAAATCTAGGTATCATGATGTCTTTCCGTGACCTAGTGGCGAGCCCA\n+TGGATATTGCTAGTAATAGCTATACCCTTGTGTGCATTTGCCAGTTCAGCGTCTATGGTT\n+AGGGAGATGCTTTTCCGTCATAAAATTACAGAAAATATTTTAAAAGGAACAGGAGTAGAA\n+GAATTGTTTAatccattcgggataattattaaataTTTCCTTTATTTTGCAATTTTGTAT\n+GCTTTTATTAAATATATTAGAAATAACATTAACGTAATAACAGAGAAAGTTAATTTTATA\n+CGGAGAATAGTATCGAACCCAACTGGAACAACAGGACGTAGAGGTGTGTTAGGGCGATGT\n+GTAGAACAAATCATAGAATATCCAACATTCTTTATCACGATGGTCTACGAACTACAGCAA\n+ATTAAGAACAAAAAAGATCTTATCTCGAAAATTACGATGATAAGTAGTATTCTCAAGTTA\n+CCACTTGGTATTTGGGAAAGTACTGTAGGACGGATGCTAGATCGACCGGCGATAGAAGGA\n+ACAGAAGAAATGTTGGAAGATGTTCTACCTATGGTAGCAATGGGATTGACGATTACAAAG\n+ACTCAAATTGGAGATGTTCCAGTTGAAAGTTTTCTTGTGAATTTGGACCGTAATCAAAAG\n+GCTTGCGAAAATATAATAAAACGTATGCAGCCGTTGATGATTAAAATGGGAATGATGAAA\n+GATAGTTCATATGATACTATTTTGCAAGTTGCAAAAGAAGTTAATGAATTATCGGAAGCG\n+GAAACATGGATGAAAACAACGCTCAAATTAAACCCAAATGAGTTCTTACAAACACAAGGG\n+GCTGTAAGAGTTGGCGAAATCAGGGAAAAAGTTGCAACTTTGAGAAATAAGTTAAACACT\n+TTGCAAACGAAAGAACTTCGATCAGATAAAGTAGTAACAGAGTGCCAAAAACATCTGGCA\n+TCACTCGAAGTGCTACTTATTGAAGTTAAGGTGTTAGAGAACAGTAACCAAACCCGAGTA\n+AAACCCGTAGGAGTTACCATACAAGGCGAAAAACAAATCGGAAAGACAAACCTCGTAGCA\n+ATCCTCTCAAGAAAAGTGTGCGAGTATGTTCAGGAACATGGCGATATTTCTTTTAGAAAC\n+GCTACTAAATGGACAACTTGGTCTAGGCAGTGCAGAGATGAATTTGATACAGGATACACC\n+GGACAAGAAATAACTTACGTAGATGATGCCTTTCAACAAAAAGACAACAAGGATCATTTG\n+ATGTGGTTTACTTTTATTTCTAATACAGCAGTGGGAACAAACCAAGCTGATTTGAAACAA\n+AAAGGTTTACCATACAGAAGTAAGTTGGTGTTTACGACCTGTAACAAGTTGCCGGACAAA\n+AGCGTAACGATTGAGGATATCGAAGCATTACATGCTCGATTCCCTCATACAATTTGCTTG\n+AGGAGGAACAAGAACAAAATGCCAAAACGAGGAGCGATTGACGAGAGCTATGACTGGGTC\n+GATTTTTATTACGGACCAATGTCGAAAGCCGTCAGCGCTATTGGAAGCAACACGACCAGC\n+ACGCTAAAAACCATGTCTTTGAGTGAAATAGTGAAGATAATTGGAGATGATTTGATTATT\n+CAAAATAATTTCTATAACTCCACTATTAAAGATGTGGGAATCACCGGACAAGAACAAATG\n+GATGGAGCGCAATTAGAAAGAAGACAACGAATGCGCGAATTGAGGGATCACTTGTTGAGA\n+ATCCGCCCAGGAGACGAAAACATGCCTTTCCTTGATGAAACATTTGAGTTGAATAGCCGA\n+CCTATCCAGACAGATGA
GAAATTTATACCGCTCAAAGATAACTTAGATGAAGAAGTTATG\n+TATGGCGGTATTTCAGATCA'..b'+ACAGATTAACACCCTTGCCACAACATTAAACGAGCTTGATCAAACTACGAAAGACTCCTT\n+AGACACGTTGAACACAACAACAGAATCTCTTAGTAAACAAGTATTATTTAATACTGATGA\n+GATTACCGTGTTAAAGGTAGACGTAGCAACCGTCACACAAAAACAACAGGACGTAGAACA\n+TTCACTTGTGACAATGAAAGATGAGATAGGAGAATTGCACATATCAGTGAATGCCAATGC\n+TAACTCCATTGAGGCATTACGCACCAGAATTGCCGCGCTAGAGGTTAGAGATGTAGGACC\n+GTGGGTTTTGAAAAACAGAATTTACAAATTCGTGATCAATATGCCAAATGGAACTACTCG\n+CTATACTACAATATACTTTTTCGCCGATGTATATTATAGCACTGGAGTAAGAGCAGCACC\n+TACAAATGCGGGAACAACTACAAGCATATTGACGATTACTTCGTTGACAACATCATATAG\n+TTTGGCTAACGTCCCCGTTTTAAAAGGTGTACCTTATAGAGTCAATGGTTACTTTGCTAA\n+CGGAAATAGTATCGAAGATATAACCGGAAGCACGTCAGTGATTTACGACTCTATGTAAAC\n+CGGACATGACATGTCTATGACACGACATTAAACTGTCAGAACCTGTTTGGTTAACACAGA\n+GAGATTAACCGCAAGACGAGTATGCAGAATCCAACACAAACCATGCATATATACGACATG\n+CCCCTACGCGTCATCGCTGGCCTGTCAACCCTTGCCAAAACAACTGAAGAAGACGACAAC\n+ACCTCAACTGGAATAGTAGTTAGTGAAGTAGGAGAGCCACAAGTGGTCGACCATCCAGCA\n+TGGATTGATCCCTTTGTTGCTTATCAATTGCGAGCTCCACGTAAAAACATCACACCAGAT\n+TTTATATTTGGTCGAGCCGATATTGGTAATGCGTTTAGTGCTTTCTTACCGCGCCGCTTT\n+TCTGCTCCAGCAGTAGGAACCCGACTTGTGATAGACCCTGTTTTCACTTACCAACAGAAA\n+ACGGTGCTAGGACTATATAATTATTTCCATGCGGATTTTTATTATATAGTGCATGTTCCA\n+GCACCCTTGGGAACAGGTATCTATCTGAAGATCTATGCTCCTGAATTTGACACTACAACC\n+GTAACACGAGGAATTCGGTTTAAGCCAAGTGCATCTCCAACAATTGCACTTTCAGTCCCT\n+TGGAGCAACGATCTATCGACCGTAGAAACATCCGTAGGTCGAGTCGGACAGAGTGGAGGG\n+AGTATTGTTATCGAAACTATCGAAGATAACAGTAACGAGACGGTCAACACCCCACTCAGC\n+ATCACCGTTTGGTGTTGCATGGCGAATATTAAAGCCACAGGCTACAAAAATGCGGATACG\n+TCAGCTTACAACGAAAAAGGCATGAACTTTGTCCCAGTTCCAGTGCCAAAGCCGCCCGTT\n+CCCCCAACAAAACCAATTATGGGCGAGGAACAAGCTGACAATGAAGTTACAGCCGAAGGT\n+GGTAAACTTGTACAGGAATTGGTTTACGACCATTCTGCGATTCCTGTAGCGCCAGTCGTC\n+GAAACACAAGCAGAACAGCCGGAAGTCCCAGTTTCATCAGTGGCAACGCGAAAGAACGAT\n+ACGGGACATTTGGCAACAAAGTGGTATGATTTCGCCAAAATCAGTCTGTCAAACCCAGCT\n+AACATGAACTGGACCACGCTAACCATAGACCCGTACAACAATGTTACATTGTCTAGAGAT\n+GGTGAGTCGATGGTCCTACCATGGAGGCGAAATGTTTGGACAACCGGATCGAAAAGTATT\n+GGATATATCCGAACGATGGTTGCACAAATTAACATACC
ACGCCCGCCGCAGATCAGTGGA\n+GTGCTCGAAGTTAAAGATTCAATCAATAACTCAAGTATTTCACTGGTAGAATTTGGAGGA\n+AAAGTAGAGATTCCAATTATTCCGAAGGTTATGAACGGACTAGTAACAAGTGCTAGTTTG\n+CCAAGGCATAGACTAAACCCATGGATGAGAACCGCCGAAAGTAAGGTTGAATTGCAATAT\n+CGAATTATTGCTTTTAATCGAACTAGCGACATTGCTGACCTTAACGTTAGCGTTTTGTTG\n+CGACCTGGCGATTCGCAATTCCAATTGCCGATGAAACCTGACAATAGTGTGGATACACGT\n+CATTTTGAGCTTGTTGAAGCTTTAATGTACCACTACGATAGCCTCCGAATTCGAGGAGAA\n+GAACAGAGTCTGCCAGAAAATGCACCTAATGCAGTTTCAAACCCTCAGCAGTTCATTACA\n+CCCGCAACCGCTCTAAGTGCCGAAGAATATAATGTGCACGAGGCGTTGGGTGAAACTGAG\n+GAGTTGGAGCTGGATGAATTTCCGGTTCTGGTGTTCAAGGGAAATGTTCCCGTTGACTCA\n+GTGACGTCCATTCCTTTGGACCTCGCAACTATATACGACTTTGCTTGGGACGGAGAGCAG\n+AATGCAATTTCTCAGAAATTTCAGCGTTTTGCTCATCTGATACCGAAAAGCGCAGGTGGT\n+TTTGGCCCAGTGATTGGTAATTATACTATCACGGCTAACCTCCCCACCGGTGTAGCAGGT\n+CGTATTCTGCACAATTGTCTCCCAGGAGATTGTGTAGATCTAGCAGTATCGAGAATTTTT\n+GGCTTGAAGAGCCTTCTCGGTGTTGCAGGAACAGCAGTTTCAGCCATTGGTGGCCCACTC\n+CTTAACGGTTTGGTTAACACCGCAGCGCCTATCCTTAGTGGAGCAGCGCACGCCATTGGT\n+GGAAATGTTGTAGGAGGACTGGCTGATGCAGTGATCGACATTGGATCTAATTTGCTGACG\n+CCAAAAGAAAAAGAACAACCAAGCGCAAATTCAAGCGCGATTTCTGGAGATATTCCGATT\n+TCGCGTTTTGTAGAGATGCTCAAGTATGTCAAGGAGAATTACCAGGATAATCCTGTGTTC\n+CCGACTTTACTTGTTGAACCACAAAACTTCATCTCAAACGCAATGACCGCACTCAAAACA\n+ATTCCAATTGAGGTCTTTGCCAACATGCGCAATGTGAAAGTTGAACGAAATTTGTTCGAC\n+CGAACGGTTGTTCCAACTGTGAAGGAAGCTACTCTAGCTGATATTGTCATACCTAATCAT\n+ATGTATGGCTATATTCTCCGAGACTTCCTCCAAAACAAACGAGCGTTTCAATCTGGGACC\n+AAACAAAATGTGTACTTTCAGCAGTTTCTAACTGTTCTATCTCAACGTAATACCCGTACA\n+CATATTACGCTCAACGACATCACAAGTTGCTCTATTGATAGTGAGTCGATTGCAAACAAA\n+ATAGAGAGAGTAAAACGCTACTTGAGTGCAAACTCGAGTGGGGAGACCACGGAAGAATTT\n+TCGCGAACAGACACCGGTCTGCTACCTACTACGACCCGCAAAATCGTATTAGGTGAAAGT\n+AAACGCAGGACGGAACGAAACGTAGCAGAAACTGTTTTCCCTTCCGTGAGGCAGTAGATT\n+AAATCCAAAACTCGCCATGTGCGCGTCTCAGAAACTAATTTTTAAAATTGGTTTGCGCGT\n+ATGGTTAAAAAGTCACATTAAATATGAGGATGGTCGCTATAATTTTCTAGCAGAAGATTA\n+TAAAGGACGGTGTGATGATGTTTTGGAGCCCGCACTGGGTGTGGGTTCGTAGTGCTAGCA\n+ATTGCAACTTTTCCTGAAAGTTAATACCTATAGTTTATAGGAGAAAAATTAACATTTATT\n+GAGAATATCTGTGCAAACGACT
CCCCACGCGGGGAGTAGTGGAATCTTGATAAACAGGTT\n+TTTTAAGCTTTTGCGTTTCCGAAAGGGTTACTCTGGCTGAACCAGCAGTTTTTATAACTG\n+TGGGTAGCCCCTCGGAAAATCAGGTTTGC\n'
b
diff -r 000000000000 -r 7d96b28eec49 test-data/blast.tab
--- /dev/null Thu Jan 01 00:00:00 1970 +0000
+++ b/test-data/blast.tab Sun Oct 15 12:52:40 2017 -0400
b
@@ -0,0 +1,7 @@
+Contig1 gi|402295620|gb|JX220408.1|_Nora_virus_isolate_FR1,_complete_genome 100.00 2113 0 0 1 2113 4248 2136 0.0  3811 12333
+Contig2 gi|402295620|gb|JX220408.1|_Nora_virus_isolate_FR1,_complete_genome 99.89 1745 2 0 1 1745 366 2110 0.0  3139 12333
+Contig3 gi|402295620|gb|JX220408.1|_Nora_virus_isolate_FR1,_complete_genome 98.78 164 0 1 1 164 377 216 4e-80   284 12333
+Contig4 gi|402295620|gb|JX220408.1|_Nora_virus_isolate_FR1,_complete_genome 99.92 2476 2 0 1 2476 5145 7620 0.0  4457 12333
+Contig5 gi|402295620|gb|JX220408.1|_Nora_virus_isolate_FR1,_complete_genome 99.89 4714 1 2 6 4715 12333 7620 0.0  8473 12333
+Contig6 gi|402295620|gb|JX220408.1|_Nora_virus_isolate_FR1,_complete_genome 99.89 894 1 0 1 894 4235 5128 0.0  1608 12333
+Contig7 gi|402295620|gb|JX220408.1|_Nora_virus_isolate_FR1,_complete_genome 99.10 222 0 1 1 222 237 18 2e-111   389 12333
b
diff -r 000000000000 -r 7d96b28eec49 test-data/contigs.fa
--- /dev/null Thu Jan 01 00:00:00 1970 +0000
+++ b/test-data/contigs.fa Sun Oct 15 12:52:40 2017 -0400
b
b'@@ -0,0 +1,216 @@\n+>Contig1\n+TTTTGCTAAAGCTAAATCAACTATATCTGTTTCCATCAGACTCAGTTCATCGTTCACGAA\n+ATTTTTGATTTGATCGTAAACTGTTTCATATGAATTCGCTGATGTCGATGGAATTTCATC\n+CATATCGATCAATTTATTCTCTTGCAACATTCGTTTGGCCGCGATCAACTGCAAACCTGT\n+AAAAGGATTAACTCTAATTTTGACTTTCGTCGTAACTAGATTTTCTGCTGCTCCTTCTAC\n+ACATTCGGTGATGTACCTTCCTAACCAAGCACTGAAAGTTTCTGTTTTGTTAATACACAT\n+GGAATTAATGAGATTCCACGCTCTATAACTCAACATATTACTTCTCACGTGATTTAGTGT\n+AGTTAAAGGTTCAACACCTAGCTCTCGCGACTCAACATCATAGCCTTCTAAACTCCTTTC\n+GATGATATTATCAAATCTAGTTAACAACTGATCTGAAATACCGCCATACATAACTTCTTC\n+ATCTAAGTTATCTTTGAGCGGTATAAATTTCTCATCTGTCTGGATAGGTCGGCTATTCAA\n+CTCAAATGTTTCATCAAGGAAAGGCATGTTTTCGTCTCCTGGGCGGATTCTCAACAAGTG\n+ATCCCTCAATTCGCGCATTCGTTGTCTTCTTTCTAATTGCGCTCCATCCATTTGTTCTTG\n+TCCGGTGATTCCCACATCTTTAATAGTGGAGTTATAGAAATTATTTTGAATAATCAAATC\n+ATCTCCAATTATCTTCACTATTTCACTCAAAGACATGGTTTTTAGCGTGCTGGTCGTGTT\n+GCTTCCAATAGCGCTGACGGCTTTCGACATTGGTCCGTAATAAAAATCGACCCAGTCATA\n+GCTCTCGTCAATCGCTCCTCGTTTTGGCATTTTGTTCTTGTTCCTCCTCAAGCAAATTGT\n+ATGAGGGAATCGAGCATGTAATGCTTCGATATCCTCAATCGTTACGCTTTTGTCCGGCAA\n+CTTGTTACAGGTCGTAAACACCAACTTACTTCTGTATGGTAAACCTTTTTGTTTCAAATC\n+AGCTTGGTTTGTTCCCACTGCTGTATTAGAAATAAAAGTAAACCACATCAAATGATCCTT\n+GTTGTCTTTTTGTTGAAAGGCATCATCTACGTAAGTTATTTCTTGTCCGGTGTATCCTGT\n+ATCAAATTCATCTCTGCACTGCCTAGACCAAGTTGTCCATTTAGTAGCGTTTCTAAAAGA\n+AATATCGCCATGTTCCTGAACATACTCGCACACTTTTCTTGAGAGGATTGCTACGAGGTT\n+TGTCTTTCCGATTTGTTTTTCGCCTTGTATGGTAACTCCTACGGGTTTTACTCGGGTTTG\n+GTTACTGTTCTCTAACACCTTAACTTCAATAAGTAGCACTTCGAGTGATGCCAGATGTTT\n+TTGGCACTCTGTTACTACTTTATCTGATCGAAGTTCTTTCGTTTGCAAAGTGTTTAACTT\n+ATTTCTCAAAGTTGCAACTTTTTCCCTGATTTCGCCAACTCTTACAGCCCCTTGTGTTTG\n+TAAGAACTCATTTGGGTTTAATTTGAGCGTTGTTTTCATCCATGTTTCCGCTTCCGATAA\n+TTCATTAACTTCTTTTGCAACTTGCAAAATAGTATCATATGAACTATCTTTCATCATTCC\n+CATTTTAATCATCAACGGCTGCATACGTTTTATTATATTTTCGCAAGCCTTTTGATTACG\n+GTCCAAATTCACAAGAAAACTTTCAACTGGAACATCTCCAATTTGAGTCTTTGTAATCGT\n+CAATCCCATTGCTACCATAGGTAGAACATCTTCCAACATTTCTTCTGTTCCTTCTATCGC\n+CGGTCGATCTAGCATCCGTCCTACAGTACTTTCCCAAATACCAAGTGGTAACTTGAGAAT\n+ACTACTTATCATCG
TAATTTTCGAGATAAGATCTTTTTTGTTCTTAATTTGCTGTAGTTC\n+GTAGACCATCGTGATAAAGAATGTTGGATATTCTATGATTTGTTCTACACATCGCCCTAA\n+CACACCTCTACGTCCTGTTGTTCCAGTTGGGTTCGATACTATTCTCCGTATAAAATTAAC\n+TTTCTCTGTTATTACGTTAATGTTATTTCTAATATATTTAATAAAAGCATACAAAATTGC\n+AAAATAAAGGAAA\n+>Contig2\n+TATTATAAAATAATATTTAATCCCCATCTTTGCAAGATGGAAACTCTCAATAAATCAGGA\n+GTATAATAGATTTAAACCCTCACACTGAATCACGAGTATAAACAGATTCAAATATGATTA\n+ACAATCAAACAAACAAAAAGGGACCACAACTAGAGAGAGTACATTTTGGTAGTGCGCAGG\n+TTGTGGGAAAAAGTACCAAACGACGACAACGCGGAACCAAATTTGACATTGAATATACTG\n+TTAAAAGGAACGATGCACCAAAAGAGCAGAAATTCTTAGTTTCAGAAATTTTTGATGAAA\n+AGTTGGATAAACAAATAAAATATGAGAAGAAGCAAAATCATACTTTTATTAAACCGAAAT\n+TAAATTTAGTTACTAGAGAAGAACAACACGTGACTAAGAAGGTTTTAAGAGGTAAAGAAC\n+GAGCTGCAACTCATGCTTTTATGAAGGAAATGGTTGAATCTAACAAGATACAACCTAGTT\n+GGAATGTCGAATACGAAAAAGAAATAGATGAGGTTGATCTATTTTTTATGAAGAAGAAAA\n+CCAAACCTTTCTCAGGTTTTTCTATTAAGGAATTAAGAGATAGTCTAATTGTGCAGTCAG\n+ACGATAAAAACATGGCACAGCCAACCGTGATGAGTTCAACCAATGAAATTGTTACACCCC\n+GTGAGGAGATAAGCGTTTCTGCTATCTCTGAACAACTGGCATCCTTGATGGAGAGAGTTG\n+ATAAACTCGAGAAGATGAATGCTGCTTTGGAGGAAGAAAACAAGCAGCTAAAGAAAGAGA\n+GAGAGGCGACTATTAAGTCAGTTAAGAAAGAGGCAAAGAGGACTAAACAAGAGAAGCCTC\n+AGATTGCGAAGAAAACGCAACACAAGAGTTTAGGAGTAAATCTTAAAATCACCAAGACCA\n+AAGTAGTTGGTCAGGAACAATGTTTGGAAATTGAAAATACTCAGCATAAGAAATTTGTTG\n+AGAAGCCAAGCATGCCATCCAAAGTGAGCAAGAAGATGAAGGGACAACAGTTGAAAAAGA\n+CTATTCGTACTTGGTATGAATTTGATCCCTCTAAACTCGTTCAGCATCAAAAAGAAGTGT\n+TGAACAGTGTTGTTACCAACACAACCTTCGCAGATAAAGTCCGTGAAACTGGTATACCTA\n+AACAAAAGATTAGGTATACTGCAAAACCACCAGCAGAGGAGAAGAGGAGTATCCATTTCT\n+ATGGTTATAAGCCAAAAGGAATCCCTAACAAAGTTTGGTGGAATTGGGTCACCACTGGCA\n+CAGCTATGGACGCTTATGAAAAAGCTGACCATTATCTGTATCACCAATTTAAACGAGAAA\n+TGATGGTATACAGAAATAAATGGGTCAAGTTTAGTAAGGAGTTCAATCCGTACCTATCGG\n+AACCGAAAATGGTATGGGAAGAGAATACATGGGAATATGAATATAAAACAGACGTTCCCT\n+ACAATTTTATTCTCAAATGGCGCCAGTTAGTGCAGACCTACAAGCCTAACACACCAATCC\n+AGGCTGATTGGTACAAAATCTCGCAGAAACAACAATGTTAATTGAAGTTTTCATTAATTC\n+TTTGTTGCAAAATCTAGGTATCATGATGTCTTTCCGTGACCTAGTGGCGAGCCCATGGAT\n+ATTGCTAGTAATAGCTATACCCTTGTGTGCATTT
GCCAGTTCAGCGTCTATGGTTAGGGA\n+GATGCTTTTCCGTCATAAAATTACAGAAAATATTTTAAA'..b'TGAGTTATTGATTGAATCTTTAACTTCGAGCACTCCACTGATCTGCGGCGGGCGTGGTA\n+TGTTAATTTGTGCAACCATCGTTCGGATATATCCAATACTTTTCGATCCGGTTGTCCAAA\n+CATTTCGCCTCCATGGTAGGACCATCGACTCACCATCTCTAGACAATGTAACATTGTTGT\n+ACGGGTCTATGGTTAGCGTGGTCCAGTTCATGTTAGCTGGGTTTGACAGACTGATTTTGG\n+CGAAATCATACCACTTTGTTGCCAAATGTCCCGTATCGTTCTTTCGCGTTGCCACTGATG\n+AAACTGGGACTTCCGGCTGTTCTGCTTGTGTTTCGACGACTGGCGCTACAGGAATCGCAG\n+AATGGTCGTAAACCAATTCCTGTACAAGTTTACCACCTTCGGCTGTAACTTCATTGTCAG\n+CTTGTTCCTCGCCCATAATTGGTTTTGTTGGGGGAACGGGCGGCTTTGGCACTGGAACTG\n+GGACAAAGTTCATGCCTTTTTCGTTGTAAGCTGACGTATCCGCATTTTTGTAGCCTGTGG\n+CTTTAATATTCGCCATGCAACACCAAACGGTGATGCTGAGTGGGGTGTTGACCGTCTCGT\n+TACTGTTATCTTCGATAGTTTCGATAACAATACTCCCTCCACTCTGTCCGACTCGACCTA\n+CGGATGTTTCTACGGTCGATAGATCGTTGCTCCAAGGGACTGAAAGTGCAATTGTTGGAG\n+ATGCACTTGGCTTAAACCGAATTCCTCGTGTTACGGTTGTAGTGTCAAATTCAGGAGCAT\n+AGATCTTCAGATAGATACCTGTTCCCAAGGGTGCTGGAACATGCACTATATAATAAAAAT\n+CCGCATGGAAATAATTATATAGTCCTAGCACCGTTTTCTGTTGGTAAGTGAAAACAGGGT\n+CTATCACAAGTCGGGTTCCTACTGCTGGAGCAGAAAAGCGGCGCGGTAAGAAAGCACTAA\n+ACGCATTACCAATATCGGCTCGACCAAATATAAAATCTGGTGTGATGTTTTTACGTGGAG\n+CTCGCAATTGATAAGCAACAAAGGGATCAATCCATGCTGGATGGTCGACCACTTGTGGCT\n+CTCCTACTTCACTAACTACTATTCCAGTTGAGGTGTTGTCGTCTTCTTCAGTTGTTTTGG\n+CAAGGGTTGACAGGCCAGCGATGACGCGTAGGGGCATGTCGTATATATGCATGGTTTGTG\n+TTGGATTCTGCATACTCGTCTTGCGGTTAATCTCTCTGTGTTAACCAAACAGGTTCTGAC\n+AGTTTAATGTCGTGTCATAGACATGTCATGTCCGGTTTACATAGAGTCGTAAATCACTGA\n+CGTGCTTCCGGTTATATCTTCGATACTATTTCCGTTAGCAAAGTAACCATTGACTCTATA\n+AGGTACACCTTTTAAAACGGGGACGTTAGCCAAACTATATGATGTTGTCAACGAAGTAAT\n+CGTCAATATGCTTGTAGTTGTTCCCGCATTTGTAGGTGCTGCTCTTACTCCAGTGCTATA\n+ATATACATCGGCGAAAAAGTATATTGTAGTATAGCGAGTAGTTCCATTTGGCATATTGAT\n+CACGAATTTGTAAATTCTGTTTTTCAAAACCCACGGTCCTACATCTCTAACCTCTAGCGC\n+GGCAATTCTGGTGCGTAATGCCTCAATGGAGTTAGCATTGGCATTCACTGATATGTGCAA\n+TTCTCCTATCTCATCTTTCATTGTCACAAGTGAATGTTCTACGTCCTGTTGTTTTTGTGT\n+GACGGTTGCTACGTCTACCTTTAACACGGTAATCTCATCAGTATTAAATAATACTTGTTT\n+ACTAAGAGATTCTGTTGTTGTGTTCAACGTGTCTAAGG
AGTCTTTCGTAGTTTGATCAAG\n+CTCGTTTAATGTTGTGGCAAGGGTGTTAATCTGTTTTGCCTGTTGACTTGTTGTTGTGGT\n+TAATTTGTCAACTTCTGAATTCATTTCTACCAATGCTGTATTGATATTAACGAATTGTTC\n+TTCATTTCGAGCTTGATTGTTGTCAACTACTTTAGCTAAACCGTCAAGTTGCAGTTTTTG\n+TTGATCGAGCTGGGTCTTTACTGCTGTTACTGAAGATTGAATTGACTTAATCTCAGTAAC\n+CTCGTTCTCGTCTAAAACGGTGAAAAGAGTGGTGTTCTGATCAAAGATCTCCTCTTTTAA\n+TGCCATAATAACGATTACAGAATTTTTGGAAAGTAACTTCCCAGCTCGTATTCAACAATA\n+CTGCTAATGCTCCATTCAAGGTTCTATTTGTACCACATTTTAGCTTTTGACAAAGCTCAT\n+TGTAATACTCCTCACCCCAAAGAGCGGCTTCGATCAACTGTTCTTGCACGAGATTTACCC\n+ACACAGTTATCTGATCTTCGCGGATATCAGTCCATACAAACGGTCCTTCAATAGATCGTT\n+GTAGTAATGGAGCTAAAACCATACCGTTTTCTAACTTAAATCCTCTTTTCAAGAATTGTA\n+GGTTTTCAAAAGAAGTAAATGGCTTCTCTTCTCCATCCTTTGAACCTGGTGTCATGATAT\n+GTCCTGTAGCATTTAGTACATCTCGATAAGTACAATAATTATACTTATCCTTATACTCAT\n+CGCTAACGCTTTTTATAATATCATCACCAAACGCGACGCTCGAGACATTCTGTCGGTAAT\n+CCCACAGTGATCTTAGGCCGGTTGTCTTCACCCACGCATACAAACCATAAATATCGTTCG\n+CCAGGCAATTATCAATTGTAGTAGTATAACTACCA\n+>Contig6\n+TAGCTTTAGCAAAAATTAGCTTATCGCAAATCCGAGGCAACATCAAGAGATCAACCTGGC\n+TGGACGTAAATGATTGGATATTAGCTTTGAAACATAAAATTTCAGGAAAAAGCTTTGCCA\n+AACATATGGATCTGTATCCTAGCTCGCTAGATTCTTTTCTTCTTACACTCAAAGATTGGG\n+AGGTTGAAGACCGTATAAAGTTTAACTCTATTTACAAGCAAAAGGTATTGTTTGTTCAAT\n+CTAGATTTTCACTTTACTGTTGGTCTCCTTTTATATCTCGTGGAACACGATTTGTGAAAG\n+TGACTTCTCAGTTTAGAGAGTTAGTGGATAAGTTAGAAACTGGCATTCTATTCCATGAAA\n+TAAAATCGGTTACAAATGGAATTAGATGGTTAGGAGGAGCAGGGAACAATGGACACGTTG\n+GAGAAAGAGTAAGAGTTATTGCTCATACAGCCCAATTTCCGAAAAAGAGTTACCCTCAGA\n+ATGGATTCCCTATAAACGAAGAACTACATAGGGAATGGATCCAACTTGTTATGAACTCGG\n+ACTATAAGTATCACTCACTTATAGGAGAAGAAAAAGTAAATATTCTTTGGAACCTTATTA\n+GGCTCCAACCTCAACATGAGGTGGAGAATTTTAAGGTTTACTTAGAAGATTTGCAGGCGT\n+CCCCGCCGAAAACTGGGACAATTTGTGCAAAAGTAGTGAATGATATAAAAGCCGAAGTAA\n+CTTCAAGTTATAGGCAATTTAACAATTACTACACTCGTTTAACAAAAGATGGTATGCACA\n+CACTTTTATCAATGCTTTCTAGGATAGGTGTTCCAATTTCAGATTATTGGAATGACCTTC\n+TTGTCGACAAAGCGCCAGCTATTACAGCGGTTACTGTTGGAGCAATAACAAGTT\n+>Contig7\n+AAGACATTGATTTTTTTCAAGTTCAATGTATAACTCTTTTTGTTCGTTTATTTGTTGTTT\n+GCTCAAAGTTTCTGTTAAGAGGTCTCATAAG
TATCCTGTTTACAACGGACCAGCATTATT\n+CCCTTCGGCACTTCCGATACTCTACTAATCCTTAATACCAGAATCAGCATAATCAGCGAA\n+GTGGTATCTCGCGCTTCTTTTTCCAGTACTCATTAACCCCCC\n'
b
diff -r 000000000000 -r 7d96b28eec49 test-data/guideSequence.fa
--- /dev/null Thu Jan 01 00:00:00 1970 +0000
+++ b/test-data/guideSequence.fa Sun Oct 15 12:52:40 2017 -0400
b
b'@@ -0,0 +1,178 @@\n+>gi|402295620|gb|JX220408.1|_Nora_virus_isolate_FR1,_complete_genome\n+GCAAAAAGGCCCCTGGGGGGGGGTTAATGAGTACTGGAAAAAGAAGCGCGAGATACCACTTCGCTGATTA\n+TGCTGATTCTGGTATTAAGGATTAGTAGAGTATCGGAAGTGCCGAAGGGAATAATGCTGGTCCGTTGTAA\n+ACAGGATACTTATGAGACCTCTTAACAGAAACTTTGAGCAAACAACAAATAAACGAACAAAAAGAGTTAT\n+ACATTGAACTTGAAAAATCAATGTCTTTTATTTAGACTGATTTATATTGGTCTTTATAATCGTAAGGAAT\n+AATTCTCATCTAATGATATCGATGTAAAATGTATCATTCTAGCTATTCAATTATATTAATTGAGCTTAGC\n+ATCTGATTAAATTATTATTATAAAATAATATTTAATCCCCATCTTTGCAAGATGGAAACTCTCAATAAAT\n+CAGGAGTATAATAGATTTAAACCCTCACACTGAATCACGAGTATAAACAGATTCAAATATGATTAACAAT\n+CAAACAAACAAAAAGGGACCACAACTAGAGAGAGTACATTTTGGTAGTGCGCAGGTTGTGGGAAAAAGTA\n+CCAAACGACGACAACGCGGAACCAAATTTGACATTGAATATACTGTTAAAAGGAACGATGCACCAAAAGA\n+GCAGAAATTCTTAGTTTCAGAAATTTTTGATGAAAAGTTGGATAAACAAATAAAATATGAGAAGAAGCAA\n+AATCATACTTTTATTAAACCGAAATTAAATTTAGTTACTAGAGAAGAACAACACGTGACTAAGAAGGTTT\n+TAAGAGGTAAAGAACGAGCTGCAACTCATGCTTTTATGAAGGAAATGGTTGAATCTAACAAGATACAACC\n+TAGTTGGAATGTCGAATACGAAAAAGAAATAGATGAGGTTGATCTATTTTTTATGAAGAAGAAAACCAAA\n+CCTTTCTCAGGTTTTTCTATTAAGGAATTAAGAGATAGTCTAATTGTGCAGTCAGACGATAAAAACATGG\n+CACAGCCAACCGTGATGAGTTCAACCAATGAAATTGTTACACCCCGTGAGGAGATAAGCGTTTCTGCTAT\n+CTCTGAACAACTGGCATCCTTGATGGAGAGAGTTGATAAACTCGAGAAGATGAATGCTGCTTTGGAGGAA\n+GAAAACAAGCAGCTAAAGAAAGAGAGAGAGGCGACTATTAAGTCAGTTAAGAAAGAGGCAAAGAGGACTA\n+AACAAGAGAAGCCTCAGATTGCGAAGAAAACGCAACACAAGAGTTTAGGAGTAAATCTTAAAATCACCAA\n+GACCAAAGTAGTTGGTCAGGAACAATGTTTGGAAATTGAAAATACTCAGCATAAGAAATTTGTTGAGAAG\n+CCAAGCATGCCATCCAAAGTGAGCAAGAAGATGAAGGGACAACAGTTGAAAAAGACTATTCGTACTTGGT\n+ATGAATTTGATCCCTCTAAACTCGTTCAGCATCAAAAAGAAGTGTTGAACAGTGTTGTTACTAACACAAC\n+CTTCGCAGATAAAGTCCGTGAAACTGGTATACCTAAACAAAAGATTAGGTATACTGCAAAACCACCAGCA\n+GAGGAGAAGAGGAGTATCCATTTCTATGGTTATAAGCCAAAAGGAATCCCTAACAAAGTTTGGTGGAATT\n+GGGTCACCACTGGCACAGCTATGGACGCTTATGAAAAAGCTGACCATTATCTGTATCACCAATTTAAACG\n+AGAAATGATGGTATACAGAAATAAATGGGTCAAGTTTAGTAAGGAGTTCAATCCGTACCTATCGGAACCG\n+AAAATGGTATGGGAAGAGAATACATGGGAATATGAATATAAAACAGACGTTCCCTACAATTTTATTCTCA\n+AATGGCGCC
AGTTAGTGCAGACCTACAAGCCTAACACACCAATCCAGGCTGATTGGTACAAAATCTCGCA\n+GAAACAACAATGTTAATTGAAGTTTTCATTAATTCTTTGTTGCAAAATCTAGGTATCATGATGTCTTTCC\n+GTGACCTAGTGGCGAGCCCATGGATACTGCTAGTAATAGCTATACCCTTGTGTGCATTTGCCAGTTCAGC\n+GTCTATGGTTAGGGAGATGCTTTTCCGTCATAAAATTACAGAAAATATTTTAAAAGGAACAGGAGTAGAA\n+GAATTGTTTAATCCATTCGGGATAATTATTAAATATTTCCTTTATTTTGCAATTTTGTATGCTTTTATTA\n+AATATATTAGAAATAACATTAACGTAATAACAGAGAAAGTTAATTTTATACGGAGAATAGTATCGAACCC\n+AACTGGAACAACAGGACGTAGAGGTGTGTTAGGGCGATGTGTAGAACAAATCATAGAATATCCAACATTC\n+TTTATCACGATGGTCTACGAACTACAGCAAATTAAGAACAAAAAAGATCTTATCTCGAAAATTACGATGA\n+TAAGTAGTATTCTCAAGTTACCACTTGGTATTTGGGAAAGTACTGTAGGACGGATGCTAGATCGACCGGC\n+GATAGAAGGAACAGAAGAAATGTTGGAAGATGTTCTACCTATGGTAGCAATGGGATTGACGATTACAAAG\n+ACTCAAATTGGAGATGTTCCAGTTGAAAGTTTTCTTGTGAATTTGGACCGTAATCAAAAGGCTTGCGAAA\n+ATATAATAAAACGTATGCAGCCGTTGATGATTAAAATGGGAATGATGAAAGATAGTTCATATGATACTAT\n+TTTGCAAGTTGCAAAAGAAGTTAATGAATTATCGGAAGCGGAAACATGGATGAAAACAACGCTCAAATTA\n+AACCCAAATGAGTTCTTACAAACACAAGGGGCTGTAAGAGTTGGCGAAATCAGGGAAAAAGTTGCAACTT\n+TGAGAAATAAGTTAAACACTTTGCAAACGAAAGAACTTCGATCAGATAAAGTAGTAACAGAGTGCCAAAA\n+ACATCTGGCATCACTCGAAGTGCTACTTATTGAAGTTAAGGTGTTAGAGAACAGTAACCAAACCCGAGTA\n+AAACCCGTAGGAGTTACCATACAAGGCGAAAAACAAATCGGAAAGACAAACCTCGTAGCAATCCTCTCAA\n+GAAAAGTGTGCGAGTATGTTCAGGAACATGGCGATATTTCTTTTAGAAACGCTACTAAATGGACAACTTG\n+GTCTAGGCAGTGCAGAGATGAATTTGATACAGGATACACCGGACAAGAAATAACTTACGTAGATGATGCC\n+TTTCAACAAAAAGACAACAAGGATCATTTGATGTGGTTTACTTTTATTTCTAATACAGCAGTGGGAACAA\n+ACCAAGCTGATTTGAAACAAAAAGGTTTACCATACAGAAGTAAGTTGGTGTTTACGACCTGTAACAAGTT\n+GCCGGACAAAAGCGTAACGATTGAGGATATCGAAGCATTACATGCTCGATTCCCTCATACAATTTGCTTG\n+AGGAGGAACAAGAACAAAATGCCAAAACGAGGAGCGATTGACGAGAGCTATGACTGGGTCGATTTTTATT\n+ACGGACCAATGTCGAAAGCCGTCAGCGCTATTGGAAGCAACACGACCAGCACGCTAAAAACCATGTCTTT\n+GAGTGAAATAGTGAAGATAATTGGAGATGATTTGATTATTCAAAATAATTTCTATAACTCCACTATTAAA\n+GATGTGGGAATCACCGGACAAGAACAAATGGATGGAGCGCAATTAGAAAGAAGACAACGAATGCGCGAAT\n+TGAGGGATCACTTGTTGAGAATCCGCCCAGGAGACGAAAACATGCCTTTCCTTGATGAAACATTTGAGTT\n+GAATAGCCGACCTATCCAGACAGATGAGAAATTTATAC
CGCTCAAAGATAACTTAGATGAAGAAGTTATG\n+TATGGCGGTATTTCAGATCAGT'..b'GTCAACAGGCAAAACAGATTAAC\n+ACCCTTGCCACAACATTAAACGAGCTTGATCAAACTACGAAAGACTCCTTAGACACGTTGAACACAACAA\n+CAGAATCTCTTAGTAAACAAGTATTATTTAATACTGATGAGATTACCGTGTTAAAGGTAGACGTAGCAAC\n+CGTCACACAAAAACAACAGGACGTAGAACATTCACTTGTGACAATGAAAGATGAGATAGGAGAATTGCAC\n+ATATCAGTGAATGCCAATGCTAACTCCATTGAGGCATTACGCACCAGAATTGCCGCGCTAGAGGTTAGAG\n+ATGTAGGACCGTGGGTTTTGAAAAACAGAATTTACAAATTCGTGATCAATATGCCAAATGGAACTACTCG\n+CTATACTACAATATACTTTTTCGCCGATGTATATTATAGCACTGGAGTAAGAGCAGCACCTACAAATGCG\n+GGAACAACTACAAGCATATTGACGATTACTTCGTTGACAACATCATATAGTTTGGCTAACGTCCCCGTTT\n+TAAAAGGTGTACCTTATAGAGTCAATGGTTACTTTGCTAACGGAAATAGTATCGAAGATATAACCGGAAG\n+CACGTCAGTGATTTACGACTCTATGTAAAAACCGGACATGACATGTCTATGACACGACATTAAACTGTCA\n+GAACCTGTTTGGTTAACACAGAGAGATTAACCGCAAGACGAGTATGCAGAATCCAACACAAACCATGCAT\n+ATATACGACATGCCCCTACGCGTCATCGCTGGCCTGTCAACCCTTGCCAAAACAACTGAAGAAGACGACA\n+ACACCTCAACTGGAATAGTAGTTAGTGAAGTAGGAGAGCCACAAGTGGTCGACCATCCAGCATGGATTGA\n+TCCCTTTGTTGCTTATCAATTGCGAGCTCCACGTAAAAACATCACACCAGATTTTATATTTGGTCGAGCC\n+GATATTGGTAATGCGTTTAGTGCTTTCTTACCGCGCCGCTTTTCTGCTCCAGCAGTAGGAACCCGACTTG\n+TGATAGACCCTGTTTTCACTTACCAACAGAAAACGGTGCTAGGACTATATAATTATTTCCATGCGGATTT\n+TTATTATATAGTGCATGTTCCAGCACCCTTGGGAACAGGTATCTATCTGAAGATCTATGCTCCTGAATTT\n+GACACTACAACCGTAACACGAGGAATTCGGTTTAAGCCAAGTGCATCTCCAACAATTGCACTTTCAGTCC\n+CTTGGAGCAACGATCTATCGACCGTAGAAACATCCGTAGGTCGAGTCGGACAGAGTGGAGGGAGTATTGT\n+TATCGAAACTATCGAAGATAACAGTAACGAGACGGTCAACACCCCACTCAGCATCACCGTTTGGTGTTGC\n+ATGGCGAACATTAAAGCCACAGGCTACAAAAATGCGGATACGTCAGCTTACAACGAAAAAGGCATGAACT\n+TTGTCCCAGTTCCAGTGCCAAAGCCGCCCGTTCCCCCAACAAAACCAATTATGGGCGAGGAACAAGCTGA\n+CAATGAAGTTACAGCCGAAGGTGGTAAACTTGTACAGGAATTGGTTTACGACCATTCTGCGATTCCTGTA\n+GCGCCAGTCGTCGAAACACAAGCAGAACAGCCGGAAGTCCCAGTTTCATCAGTGGCAACGCGAAAGAACG\n+ATACGGGACATTTGGCAACAAAGTGGTATGATTTCGCCAAAATCAGTCTGTCAAACCCAGCTAACATGAA\n+CTGGACCACGCTAACCATAGACCCGTACAACAATGTTACATTGTCTAGAGATGGTGAGTCGATGGTCCTA\n+CCATGGAGGCGAAATGTTTGGACAACCGGATCGAAAAGTATTGGATATATCCGAACGATGGTTGCACAAA\n+TTAACATACCACGC
CCGCCGCAGATCAGTGGAGTGCTCGAAGTTAAAGATTCAATCAATAACTCAAGTAT\n+TTCACTGGTAGAATTTGGAGGAAAAGTAGAGATTCCAATTATTCCGAAGGTTATGAACGGACTAGTAACA\n+AGTGCTAGTTTGCCAAGGCATAGACTAAACCCATGGATGAGAACCGCCGAAAGTAAGGTTGAATTGCAAT\n+ATCGAATTATTGCTTTTAATCGAACTAGCGACATTGCTGACCTTAACGTTAGCGTTTTGTTGCGACCTGG\n+CGATTCGCAATTCCAATTGCCGATGAAACCTGACAATAGTGTGGATACACGTCATTTTGAGCTTGTTGAA\n+GCTTTAATGTACCACTACGATAGCCTCCGAATTCGAGGAGAAGAACAGAGTCTGCCAGAAAATGCACCTA\n+ATGCAGTTTCAAACCCTCAGCAGTTCATTACACCCGCAACCGCTCTAAGTGCCGAAGAATATAATGTGCA\n+CGAGGCGTTGGGTGAAACTGAGGAGTTGGAGCTGGATGAATTTCCGGTTCTGGTGTTCAAGGGAAATGTT\n+CCCGTTGACTCAGTGACGTCCATTCCTTTGGACCTCGCAACTATATACGACTTTGCTTGGGACGGAGAGC\n+AGAATGCAATTTCTCAGAAATTTCAGCGTTTTGCTCATCTGATACCGAAAAGCGCAGGTGGTTTTGGCCC\n+AGTGATTGGTAATTATACTATCACGGCTAACCTCCCCACCGGTGTAGCAGGTCGTATTCTGCACAATTGT\n+CTCCCAGGAGATTGTGTAGATCTAGCAGTATCGAGAATTTTTGGCTTGAAGAGCCTTCTCGGTGTTGCAG\n+GAACAGCAGTTTCAGCCATTGGTGGCCCACTCCTTAACGGTTTGGTTAACACCGCAGCGCCTATCCTTAG\n+TGGAGCAGCGCACGCCATTGGTGGAAATGTTGTAGGAGGACTGGCTGATGCAGTGATCGACATTGGATCT\n+AATTTGCTGACGCCAAAAGAAAAAGAACAACCAAGCGCAAATTCAAGCGCGATTTCTGGAGATATTCCGA\n+TTTCGCGTTTTGTAGAGATGCTCAAGTATGTCAAGGAGAATTACCAGGATAATCCTGTGTTCCCGACTTT\n+ACTTGTTGAACCACAAAACTTCATCTCAAACGCAATGACCGCACTCAAAACAATTCCAATTGAGGTCTTT\n+GCCAACATGCGCAATGTGAAAGTTGAACGAAATTTGTTCGACCGAACGGTTGTTCCAACTGTGAAGGAAG\n+CTACTCTAGCTGATATTGTCATACCTAATCATATGTATGGCTATATTCTCCGAGACTTCCTCCAAAACAA\n+ACGAGCGTTTCAATCTGGGACCAAACAAAATGTGTACTTTCAGCAGTTTCTAACTGTTCTATCTCAACGT\n+AATACCCGTACACATATTACGCTCAACGACATCACAAGTTGCTCTATTGATAGTGAGTCGATTGCAAACA\n+AAATAGAGAGAGTAAAACGCTACTTGAGTGCAAACTCGAGTGGGGAGACCACGGAAGAATTTTCGCGAAC\n+AGACACCGGTCTGCTACCTACTACGACCCGCAAAATCGTATTAGGTGAAAGTAAACGCAGGACGGAACGA\n+AACGTAGCAGAAACTGTTTTCCCTTCCGTGAGGCAGTAGATTAAATCCAAAACTCGCCATGTGCGCGTCT\n+CAGAAACTAATTTTTAAAATTGGTTTGCGCGTATGGTTAAAAAGAGTCACATTAAATATGAGGATGGTCG\n+CTATAATTTTCTAGCAGAAGATTATAAAGGACGGTGTGATGATGTTTTGGAGCCCGCACTGGGTGTGGGT\n+TCGTAGTGCTAGCAATTGCAACTTTTCCTGAAAGTTAATACCTATAGTTTATAGGAGAAAAATTAACATT\n+TATTGAGAATATCTGTGCAAACGACTCCCCACGCGGGGAGTAG
TGGAATCTTGATAAACAGGTTTTTTAA\n+GCTTTTGCGTTTCCGAAAGGGTTACTCTGGCTGAACCAGCAGTTTTTATAACTGTGGGTAGCCCCTCGGA\n+AAATCAGGTTTGC\n'