Next changeset 1:be61d0d0d622 (2021-03-10) |
Commit message:
planemo upload for repository https://github.com/ARTbio/tools-artbio/tree/master/tools/blast_to_scaffold commit 48a4098045106f363e92357949b32617a2e868c1 |
added:
blast_to_scaffold.py blast_to_scaffold.xml test-data/assembly.fa test-data/blast.tab test-data/contigs.fa test-data/guideSequence.fa |
b |
diff -r 000000000000 -r 7d96b28eec49 blast_to_scaffold.py --- /dev/null Thu Jan 01 00:00:00 1970 +0000 +++ b/blast_to_scaffold.py Sun Oct 15 12:52:40 2017 -0400 |
[ |
#!/usr/bin/env python
"""Build a DNA scaffold by pasting BLAST-aligned contigs onto a guide.

The guide sequence is loaded as a position -> nucleotide mapping in lower
case. Each BLAST hit then replaces the guide positions it covers with the
aligned part of the contig, so guide letters that remain in lower case in
the output are the ones no contig covered.
"""
import argparse


# IUPAC nucleotide codes and their complements, position by position.
_IUPAC = "ACGTUNRYSWKMBDHV"
_IUPAC_COMPLEMENT = "TGCAANYRSWMKVHDB"
# Complement lookup for both cases; the case of each base is preserved.
_COMPLEMENT = dict(zip(_IUPAC + _IUPAC.lower(),
                       _IUPAC_COMPLEMENT + _IUPAC_COMPLEMENT.lower()))


def insert_newlines(string, every=60):
    """Return *string* wrapped into lines of at most *every* characters."""
    return '\n'.join(string[i:i+every]
                     for i in range(0, len(string), every))


def getseq(fastadict, transcript, up, down, orientation="direct"):
    """Return the 1-based, inclusive slice [up, down] of a sequence.

    fastadict   -- mapping of sequence name to sequence string
    transcript  -- name of the sequence to slice
    up, down    -- 1-based inclusive start and end coordinates
    orientation -- "direct" returns the slice as is; any other value
                   returns its reverse complement

    Complementing covers the IUPAC codes in both cases. Characters with
    no known complement (e.g. gaps) are kept unchanged instead of raising
    KeyError.
    """
    pickseq = fastadict[transcript][up-1:down]
    if orientation == "direct":
        return pickseq
    return "".join(_COMPLEMENT.get(base, base) for base in reversed(pickseq))


def Parser():
    """Parse the command line and return the argparse namespace."""
    the_parser = argparse.ArgumentParser(
        description="Generate DNA scaffold from blastn or tblastx alignment"
                    " of Contigs")
    # The four file paths are required: without them the script can only
    # fail later with an unhelpful TypeError from open(None).
    the_parser.add_argument('--sequences', action="store", type=str,
                            required=True,
                            help="input sequence file in fasta format")
    the_parser.add_argument('--guideSequence', action="store", type=str,
                            required=True,
                            help="the reference sequence to guide the"
                                 " scaffold assembly in fasta format")
    the_parser.add_argument('--blast-tab', dest="blast_tab", action="store",
                            type=str, required=True,
                            help="13-columns tabular blastn or tblastx output")
    the_parser.add_argument('--output', action="store", type=str,
                            required=True,
                            help="output file path, fasta format")
    the_parser.add_argument('--scaffold_prefix', action="store", type=str,
                            help="the prefix that will be used for the header"
                                 " of the fasta scaffold")
    the_parser.add_argument('--scaffold_suffix', action="store", type=str,
                            help="the suffix that will be used for the header"
                                 " of the fasta scaffold")
    args = the_parser.parse_args()
    return args


def blatnInfo(file):
    """Read a tabular BLAST file and return its hits as a sorted list.

    Each hit is [query name, query start, query stop, subject start,
    subject stop] (columns 1 and 7-10), with every item kept as a string.
    Blank lines and lines starting with '#' are skipped.

    Raises ValueError when a data line has fewer than 10 columns.
    """
    blastlist = []
    with open(file, "r") as f:
        for number, line in enumerate(f, 1):
            fields = line.rstrip().split()
            if not fields or fields[0].startswith("#"):
                continue
            if len(fields) < 10:
                raise ValueError(
                    "%s, line %d: expected at least 10 columns, found %d"
                    % (file, number, len(fields)))
            blastlist.append([fields[0]] + fields[6:10])
    # NOTE(review): subject starts are compared as strings here, so the
    # order is lexicographic ("366" sorts before "12333" in descending
    # order). This is kept on purpose because the order decides which
    # contig wins where hits overlap; confirm whether a numeric sort was
    # intended before changing it.
    blastlist.sort(key=lambda x: x[3], reverse=True)
    return blastlist


def myContigs(file):
    """Read a fasta file into a dict of header -> sequence.

    The key is the whole header line without the leading '>' and without
    trailing whitespace. Line endings are stripped explicitly, so files
    with CRLF endings or without a final newline are read completely.

    Raises ValueError when sequence data appears before the first header.
    """
    chunks = {}
    header = None
    with open(file, "r") as f:
        for line in f:
            line = line.rstrip()
            if line.startswith(">"):
                header = line[1:]
                # A repeated header restarts its sequence.
                chunks[header] = []
            elif header is None:
                if line:
                    raise ValueError(
                        "%s: sequence data found before the first fasta"
                        " header" % file)
            else:
                chunks[header].append(line)
    return dict((name, "".join(parts)) for name, parts in chunks.items())


def myGuide(file):
    """Read a fasta guide into a dict of 1-based position -> nucleotide.

    Header lines are ignored and every nucleotide is stored in lower case.
    Positions keep counting across header lines, so a file with several
    records is loaded as one continuous sequence.
    """
    Guide = {}
    coordinate = 0
    with open(file, "r") as f:
        for line in f:
            if line.startswith(">"):
                continue
            # rstrip() rather than line[:-1]: the last line may lack a
            # newline, and slicing would then drop a real nucleotide.
            for nucleotide in line.rstrip():
                coordinate += 1
                Guide[coordinate] = nucleotide.lower()
    return Guide


def updateGuide(blastlist, GuideDict, ContigsDict):
    """Overwrite guide positions with the aligned contig sequences.

    blastlist is a list of lists with
    element [0] : name of the blasted Contig
    element [1] : queryStart of the alignment (on the contig)
    element [2] : queryStop of the alignment (on the contig)
    element [3] : subjectStart of the alignment (on the reference)
    element [4] : subjectStop of the alignment (on the reference)

    GuideDict is modified in place. Hits are applied in list order, so a
    later hit overwrites an earlier one where they overlap.

    A start greater than its stop marks the minus strand. The contig
    slice is reverse-complemented when exactly one of query and subject
    is on the minus strand.
    """
    for fields in blastlist:
        seqHeader = fields[0]
        queryStart, queryStop, subjectStart, subjectStop = (
            int(value) for value in fields[1:5])
        reverse = False
        if queryStart > queryStop:
            # tblastx reports minus-frame queries with start > stop; left
            # as is, the slice would be empty and the guide region would
            # be deleted without anything being inserted.
            queryStart, queryStop = queryStop, queryStart
            reverse = not reverse
        if subjectStart > subjectStop:
            subjectStart, subjectStop = subjectStop, subjectStart
            reverse = not reverse
        orientation = "reverse" if reverse else "direct"
        sequence = getseq(ContigsDict, seqHeader, queryStart, queryStop,
                          orientation)
        # Clear the covered span first: an aligned contig shorter than
        # the span must not leave stale guide letters behind.
        for i in range(subjectStart, subjectStop+1):
            GuideDict.pop(i, None)
        # NOTE(review): letters are placed one per position from
        # subjectStart with no gap handling, so an alignment containing
        # indels shifts or overruns the span; confirm this is acceptable.
        for i, nucleotide in enumerate(sequence, subjectStart):
            GuideDict[i] = nucleotide


def finalAssembly(GuideDict, outputfile, prefix, suffix):
    """Write the scaffold to *outputfile* as a single fasta record.

    Nucleotides are written in increasing position order, wrapped at the
    insert_newlines default width. The header is
    ">Scaffold_from_<prefix>_guided_by_<suffix>".
    """
    finalSequence = insert_newlines(
        "".join(GuideDict[key] for key in sorted(GuideDict)))
    # The context manager closes the file even if a write fails.
    with open(outputfile, "w") as Out:
        Out.write(">Scaffold_from_%s_guided_by_%s\n" % (prefix, suffix))
        Out.write("%s\n" % finalSequence)


def __main__():
    """Run the pipeline: load inputs, apply the hits, write the scaffold."""
    args = Parser()
    ContigsDict = myContigs(args.sequences)
    GuideDict = myGuide(args.guideSequence)
    blastlist = blatnInfo(args.blast_tab)
    updateGuide(blastlist, GuideDict, ContigsDict)
    finalAssembly(GuideDict, args.output, args.scaffold_prefix,
                  args.scaffold_suffix)


if __name__ == "__main__":
    __main__()
b |
diff -r 000000000000 -r 7d96b28eec49 blast_to_scaffold.xml --- /dev/null Thu Jan 01 00:00:00 1970 +0000 +++ b/blast_to_scaffold.xml Sun Oct 15 12:52:40 2017 -0400 |
b |
<!-- Galaxy wrapper for blast_to_scaffold.py: builds a DNA scaffold from
     contigs aligned to a guide sequence with blastn or tblastx. -->
<tool id="blast2scaffold" name="blast_to_scaffold" version="1.0.0">
<description>Generate DNA scaffold from blastn or tblastx alignment of Contigs</description>
<requirements>
</requirements>
<!-- Values are single-quoted so the shell does not interpret them; this
     matters for the dataset names passed as scaffold prefix and suffix. -->
<command interpreter="python">
        blast_to_scaffold.py --sequences '$sequences'
                             --guideSequence '$guideSequence'
                             --blast-tab '$blast_tab'
                             --output '$output'
                             --scaffold_prefix '$sequences.element_identifier'
                             --scaffold_suffix '$guideSequence.element_identifier'
</command>
<inputs>
<param name="sequences" type="data" format="fasta" label="Select a fasta contigs file"/>
<param name="guideSequence" type="data" format="fasta" label="Select the fasta guide sequence for scaffolding"/>
<param name="blast_tab" type="data" format="tabular" label="Select a blastn or tblastx output from your history" help="must have 13 columns with column 13 containing the subject length, other columns are standard"/>

</inputs>
<outputs>
    <data format="fasta" name="output"/>
</outputs>


<tests>
    <test>
        <param name="sequences" value="contigs.fa" ftype="fasta"/>
        <param name="blast_tab" value="blast.tab" ftype="tabular"/>
        <!-- The guide is a fasta file and the input only accepts fasta. -->
        <param name="guideSequence" value="guideSequence.fa" ftype="fasta"/>
        <output name="output" file="assembly.fa" ftype="fasta"/>
    </test>
</tests>


<help>


**What it Does**

This tool starts from DNA contigs that aligned to a subject DNA sequence through blastn or tblastx.
The contigs must be provided in fasta format. The blastn or tblastx output must be tabular, the 12 standard columns plus column 13 with the length of the blastn or tblastx subject.
The sequence used to BLAST (blastn or tblastx) the contigs must be provided to serve as a guide to the final assembly.
The final assembly is a DNA sequence.
Nucleotides of the guide sequence which were not covered by contigs are in small letters in the output assembly.


**Attribution**

This Galaxy tool was created by drosofff@gmail.com on 5/01/2016
</help>

</tool>
b |
diff -r 000000000000 -r 7d96b28eec49 test-data/assembly.fa --- /dev/null Thu Jan 01 00:00:00 1970 +0000 +++ b/test-data/assembly.fa Sun Oct 15 12:52:40 2017 -0400 |
b |
b'@@ -0,0 +1,207 @@\n+>Scaffold_from_contigs.fa_guided_by_guideSequence.fa\n+gcaaaaaggcccctgggGGGGGGTTAATGAGTACTGGAAAAAGAAGCGCGAGATACCACT\n+TCGCTGATTATGCTGATTCTGGTATTAAGGATTAGTAGAGTATCGGAAGTGCCGAAGGGA\n+ATAATGCTGGTCCGTTGTAAACAGGATACTTATGAGACCTCTTAACAGAAACTTTGAGCA\n+AACAACAAATAAACGAACAAAAAGAGTTATACATTGAACTTGAAAAAAATCAATGTCTTT\n+TATTTAGACTGATTTATATTGGTCTTTATAATCGTAAGGAATAATTCTCATCTAATGATA\n+TCGATGTAAAATGTATCATTCTAGCTATTCAATTATATTAATTGAGCTTAGCATCTGATT\n+AAATTTATTATAAAATAATATTTAATCCCCATCTTTGCAAGATGGAAACTCTCAATAAAT\n+CAGGAGTATAATAGATTTAAACCCTCACACTGAATCACGAGTATAAACAGATTCAAATAT\n+GATTAACAATCAAACAAACAAAAAGGGACCACAACTAGAGAGAGTACATTTTGGTAGTGC\n+GCAGGTTGTGGGAAAAAGTACCAAACGACGACAACGCGGAACCAAATTTGACATTGAATA\n+TACTGTTAAAAGGAACGATGCACCAAAAGAGCAGAAATTCTTAGTTTCAGAAATTTTTGA\n+TGAAAAGTTGGATAAACAAATAAAATATGAGAAGAAGCAAAATCATACTTTTATTAAACC\n+GAAATTAAATTTAGTTACTAGAGAAGAACAACACGTGACTAAGAAGGTTTTAAGAGGTAA\n+AGAACGAGCTGCAACTCATGCTTTTATGAAGGAAATGGTTGAATCTAACAAGATACAACC\n+TAGTTGGAATGTCGAATACGAAAAAGAAATAGATGAGGTTGATCTATTTTTTATGAAGAA\n+GAAAACCAAACCTTTCTCAGGTTTTTCTATTAAGGAATTAAGAGATAGTCTAATTGTGCA\n+GTCAGACGATAAAAACATGGCACAGCCAACCGTGATGAGTTCAACCAATGAAATTGTTAC\n+ACCCCGTGAGGAGATAAGCGTTTCTGCTATCTCTGAACAACTGGCATCCTTGATGGAGAG\n+AGTTGATAAACTCGAGAAGATGAATGCTGCTTTGGAGGAAGAAAACAAGCAGCTAAAGAA\n+AGAGAGAGAGGCGACTATTAAGTCAGTTAAGAAAGAGGCAAAGAGGACTAAACAAGAGAA\n+GCCTCAGATTGCGAAGAAAACGCAACACAAGAGTTTAGGAGTAAATCTTAAAATCACCAA\n+GACCAAAGTAGTTGGTCAGGAACAATGTTTGGAAATTGAAAATACTCAGCATAAGAAATT\n+TGTTGAGAAGCCAAGCATGCCATCCAAAGTGAGCAAGAAGATGAAGGGACAACAGTTGAA\n+AAAGACTATTCGTACTTGGTATGAATTTGATCCCTCTAAACTCGTTCAGCATCAAAAAGA\n+AGTGTTGAACAGTGTTGTTACCAACACAACCTTCGCAGATAAAGTCCGTGAAACTGGTAT\n+ACCTAAACAAAAGATTAGGTATACTGCAAAACCACCAGCAGAGGAGAAGAGGAGTATCCA\n+TTTCTATGGTTATAAGCCAAAAGGAATCCCTAACAAAGTTTGGTGGAATTGGGTCACCAC\n+TGGCACAGCTATGGACGCTTATGAAAAAGCTGACCATTATCTGTATCACCAATTTAAACG\n+AGAAATGATGGTATACAGAAATAAATGGGTCAAGTTTAGTAAGGAGTTCAATCCGTACCT\n+ATCGGAACCGAAAATGGTATGGGAAGAGAATACATGGGAATATGAATATAAAACAGACGT\n+TCCCTACAATTTTATTCTCAAATGGCGCCAGTT
AGTGCAGACCTACAAGCCTAACACACC\n+AATCCAGGCTGATTGGTACAAAATCTCGCAGAAACAACAATGTTAATTGAAGTTTTCATT\n+AATTCTTTGTTGCAAAATCTAGGTATCATGATGTCTTTCCGTGACCTAGTGGCGAGCCCA\n+TGGATATTGCTAGTAATAGCTATACCCTTGTGTGCATTTGCCAGTTCAGCGTCTATGGTT\n+AGGGAGATGCTTTTCCGTCATAAAATTACAGAAAATATTTTAAAAGGAACAGGAGTAGAA\n+GAATTGTTTAatccattcgggataattattaaataTTTCCTTTATTTTGCAATTTTGTAT\n+GCTTTTATTAAATATATTAGAAATAACATTAACGTAATAACAGAGAAAGTTAATTTTATA\n+CGGAGAATAGTATCGAACCCAACTGGAACAACAGGACGTAGAGGTGTGTTAGGGCGATGT\n+GTAGAACAAATCATAGAATATCCAACATTCTTTATCACGATGGTCTACGAACTACAGCAA\n+ATTAAGAACAAAAAAGATCTTATCTCGAAAATTACGATGATAAGTAGTATTCTCAAGTTA\n+CCACTTGGTATTTGGGAAAGTACTGTAGGACGGATGCTAGATCGACCGGCGATAGAAGGA\n+ACAGAAGAAATGTTGGAAGATGTTCTACCTATGGTAGCAATGGGATTGACGATTACAAAG\n+ACTCAAATTGGAGATGTTCCAGTTGAAAGTTTTCTTGTGAATTTGGACCGTAATCAAAAG\n+GCTTGCGAAAATATAATAAAACGTATGCAGCCGTTGATGATTAAAATGGGAATGATGAAA\n+GATAGTTCATATGATACTATTTTGCAAGTTGCAAAAGAAGTTAATGAATTATCGGAAGCG\n+GAAACATGGATGAAAACAACGCTCAAATTAAACCCAAATGAGTTCTTACAAACACAAGGG\n+GCTGTAAGAGTTGGCGAAATCAGGGAAAAAGTTGCAACTTTGAGAAATAAGTTAAACACT\n+TTGCAAACGAAAGAACTTCGATCAGATAAAGTAGTAACAGAGTGCCAAAAACATCTGGCA\n+TCACTCGAAGTGCTACTTATTGAAGTTAAGGTGTTAGAGAACAGTAACCAAACCCGAGTA\n+AAACCCGTAGGAGTTACCATACAAGGCGAAAAACAAATCGGAAAGACAAACCTCGTAGCA\n+ATCCTCTCAAGAAAAGTGTGCGAGTATGTTCAGGAACATGGCGATATTTCTTTTAGAAAC\n+GCTACTAAATGGACAACTTGGTCTAGGCAGTGCAGAGATGAATTTGATACAGGATACACC\n+GGACAAGAAATAACTTACGTAGATGATGCCTTTCAACAAAAAGACAACAAGGATCATTTG\n+ATGTGGTTTACTTTTATTTCTAATACAGCAGTGGGAACAAACCAAGCTGATTTGAAACAA\n+AAAGGTTTACCATACAGAAGTAAGTTGGTGTTTACGACCTGTAACAAGTTGCCGGACAAA\n+AGCGTAACGATTGAGGATATCGAAGCATTACATGCTCGATTCCCTCATACAATTTGCTTG\n+AGGAGGAACAAGAACAAAATGCCAAAACGAGGAGCGATTGACGAGAGCTATGACTGGGTC\n+GATTTTTATTACGGACCAATGTCGAAAGCCGTCAGCGCTATTGGAAGCAACACGACCAGC\n+ACGCTAAAAACCATGTCTTTGAGTGAAATAGTGAAGATAATTGGAGATGATTTGATTATT\n+CAAAATAATTTCTATAACTCCACTATTAAAGATGTGGGAATCACCGGACAAGAACAAATG\n+GATGGAGCGCAATTAGAAAGAAGACAACGAATGCGCGAATTGAGGGATCACTTGTTGAGA\n+ATCCGCCCAGGAGACGAAAACATGCCTTTCCTTGATGAAACATTTGAGTTGAATAGCCGA\n+CCTATCCAGACAGATGA
GAAATTTATACCGCTCAAAGATAACTTAGATGAAGAAGTTATG\n+TATGGCGGTATTTCAGATCA'..b'+ACAGATTAACACCCTTGCCACAACATTAAACGAGCTTGATCAAACTACGAAAGACTCCTT\n+AGACACGTTGAACACAACAACAGAATCTCTTAGTAAACAAGTATTATTTAATACTGATGA\n+GATTACCGTGTTAAAGGTAGACGTAGCAACCGTCACACAAAAACAACAGGACGTAGAACA\n+TTCACTTGTGACAATGAAAGATGAGATAGGAGAATTGCACATATCAGTGAATGCCAATGC\n+TAACTCCATTGAGGCATTACGCACCAGAATTGCCGCGCTAGAGGTTAGAGATGTAGGACC\n+GTGGGTTTTGAAAAACAGAATTTACAAATTCGTGATCAATATGCCAAATGGAACTACTCG\n+CTATACTACAATATACTTTTTCGCCGATGTATATTATAGCACTGGAGTAAGAGCAGCACC\n+TACAAATGCGGGAACAACTACAAGCATATTGACGATTACTTCGTTGACAACATCATATAG\n+TTTGGCTAACGTCCCCGTTTTAAAAGGTGTACCTTATAGAGTCAATGGTTACTTTGCTAA\n+CGGAAATAGTATCGAAGATATAACCGGAAGCACGTCAGTGATTTACGACTCTATGTAAAC\n+CGGACATGACATGTCTATGACACGACATTAAACTGTCAGAACCTGTTTGGTTAACACAGA\n+GAGATTAACCGCAAGACGAGTATGCAGAATCCAACACAAACCATGCATATATACGACATG\n+CCCCTACGCGTCATCGCTGGCCTGTCAACCCTTGCCAAAACAACTGAAGAAGACGACAAC\n+ACCTCAACTGGAATAGTAGTTAGTGAAGTAGGAGAGCCACAAGTGGTCGACCATCCAGCA\n+TGGATTGATCCCTTTGTTGCTTATCAATTGCGAGCTCCACGTAAAAACATCACACCAGAT\n+TTTATATTTGGTCGAGCCGATATTGGTAATGCGTTTAGTGCTTTCTTACCGCGCCGCTTT\n+TCTGCTCCAGCAGTAGGAACCCGACTTGTGATAGACCCTGTTTTCACTTACCAACAGAAA\n+ACGGTGCTAGGACTATATAATTATTTCCATGCGGATTTTTATTATATAGTGCATGTTCCA\n+GCACCCTTGGGAACAGGTATCTATCTGAAGATCTATGCTCCTGAATTTGACACTACAACC\n+GTAACACGAGGAATTCGGTTTAAGCCAAGTGCATCTCCAACAATTGCACTTTCAGTCCCT\n+TGGAGCAACGATCTATCGACCGTAGAAACATCCGTAGGTCGAGTCGGACAGAGTGGAGGG\n+AGTATTGTTATCGAAACTATCGAAGATAACAGTAACGAGACGGTCAACACCCCACTCAGC\n+ATCACCGTTTGGTGTTGCATGGCGAATATTAAAGCCACAGGCTACAAAAATGCGGATACG\n+TCAGCTTACAACGAAAAAGGCATGAACTTTGTCCCAGTTCCAGTGCCAAAGCCGCCCGTT\n+CCCCCAACAAAACCAATTATGGGCGAGGAACAAGCTGACAATGAAGTTACAGCCGAAGGT\n+GGTAAACTTGTACAGGAATTGGTTTACGACCATTCTGCGATTCCTGTAGCGCCAGTCGTC\n+GAAACACAAGCAGAACAGCCGGAAGTCCCAGTTTCATCAGTGGCAACGCGAAAGAACGAT\n+ACGGGACATTTGGCAACAAAGTGGTATGATTTCGCCAAAATCAGTCTGTCAAACCCAGCT\n+AACATGAACTGGACCACGCTAACCATAGACCCGTACAACAATGTTACATTGTCTAGAGAT\n+GGTGAGTCGATGGTCCTACCATGGAGGCGAAATGTTTGGACAACCGGATCGAAAAGTATT\n+GGATATATCCGAACGATGGTTGCACAAATTAACATACC
ACGCCCGCCGCAGATCAGTGGA\n+GTGCTCGAAGTTAAAGATTCAATCAATAACTCAAGTATTTCACTGGTAGAATTTGGAGGA\n+AAAGTAGAGATTCCAATTATTCCGAAGGTTATGAACGGACTAGTAACAAGTGCTAGTTTG\n+CCAAGGCATAGACTAAACCCATGGATGAGAACCGCCGAAAGTAAGGTTGAATTGCAATAT\n+CGAATTATTGCTTTTAATCGAACTAGCGACATTGCTGACCTTAACGTTAGCGTTTTGTTG\n+CGACCTGGCGATTCGCAATTCCAATTGCCGATGAAACCTGACAATAGTGTGGATACACGT\n+CATTTTGAGCTTGTTGAAGCTTTAATGTACCACTACGATAGCCTCCGAATTCGAGGAGAA\n+GAACAGAGTCTGCCAGAAAATGCACCTAATGCAGTTTCAAACCCTCAGCAGTTCATTACA\n+CCCGCAACCGCTCTAAGTGCCGAAGAATATAATGTGCACGAGGCGTTGGGTGAAACTGAG\n+GAGTTGGAGCTGGATGAATTTCCGGTTCTGGTGTTCAAGGGAAATGTTCCCGTTGACTCA\n+GTGACGTCCATTCCTTTGGACCTCGCAACTATATACGACTTTGCTTGGGACGGAGAGCAG\n+AATGCAATTTCTCAGAAATTTCAGCGTTTTGCTCATCTGATACCGAAAAGCGCAGGTGGT\n+TTTGGCCCAGTGATTGGTAATTATACTATCACGGCTAACCTCCCCACCGGTGTAGCAGGT\n+CGTATTCTGCACAATTGTCTCCCAGGAGATTGTGTAGATCTAGCAGTATCGAGAATTTTT\n+GGCTTGAAGAGCCTTCTCGGTGTTGCAGGAACAGCAGTTTCAGCCATTGGTGGCCCACTC\n+CTTAACGGTTTGGTTAACACCGCAGCGCCTATCCTTAGTGGAGCAGCGCACGCCATTGGT\n+GGAAATGTTGTAGGAGGACTGGCTGATGCAGTGATCGACATTGGATCTAATTTGCTGACG\n+CCAAAAGAAAAAGAACAACCAAGCGCAAATTCAAGCGCGATTTCTGGAGATATTCCGATT\n+TCGCGTTTTGTAGAGATGCTCAAGTATGTCAAGGAGAATTACCAGGATAATCCTGTGTTC\n+CCGACTTTACTTGTTGAACCACAAAACTTCATCTCAAACGCAATGACCGCACTCAAAACA\n+ATTCCAATTGAGGTCTTTGCCAACATGCGCAATGTGAAAGTTGAACGAAATTTGTTCGAC\n+CGAACGGTTGTTCCAACTGTGAAGGAAGCTACTCTAGCTGATATTGTCATACCTAATCAT\n+ATGTATGGCTATATTCTCCGAGACTTCCTCCAAAACAAACGAGCGTTTCAATCTGGGACC\n+AAACAAAATGTGTACTTTCAGCAGTTTCTAACTGTTCTATCTCAACGTAATACCCGTACA\n+CATATTACGCTCAACGACATCACAAGTTGCTCTATTGATAGTGAGTCGATTGCAAACAAA\n+ATAGAGAGAGTAAAACGCTACTTGAGTGCAAACTCGAGTGGGGAGACCACGGAAGAATTT\n+TCGCGAACAGACACCGGTCTGCTACCTACTACGACCCGCAAAATCGTATTAGGTGAAAGT\n+AAACGCAGGACGGAACGAAACGTAGCAGAAACTGTTTTCCCTTCCGTGAGGCAGTAGATT\n+AAATCCAAAACTCGCCATGTGCGCGTCTCAGAAACTAATTTTTAAAATTGGTTTGCGCGT\n+ATGGTTAAAAAGTCACATTAAATATGAGGATGGTCGCTATAATTTTCTAGCAGAAGATTA\n+TAAAGGACGGTGTGATGATGTTTTGGAGCCCGCACTGGGTGTGGGTTCGTAGTGCTAGCA\n+ATTGCAACTTTTCCTGAAAGTTAATACCTATAGTTTATAGGAGAAAAATTAACATTTATT\n+GAGAATATCTGTGCAAACGACT
CCCCACGCGGGGAGTAGTGGAATCTTGATAAACAGGTT\n+TTTTAAGCTTTTGCGTTTCCGAAAGGGTTACTCTGGCTGAACCAGCAGTTTTTATAACTG\n+TGGGTAGCCCCTCGGAAAATCAGGTTTGC\n' |
b |
diff -r 000000000000 -r 7d96b28eec49 test-data/blast.tab --- /dev/null Thu Jan 01 00:00:00 1970 +0000 +++ b/test-data/blast.tab Sun Oct 15 12:52:40 2017 -0400 |
b |
@@ -0,0 +1,7 @@ +Contig1 gi|402295620|gb|JX220408.1|_Nora_virus_isolate_FR1,_complete_genome 100.00 2113 0 0 1 2113 4248 2136 0.0 3811 12333 +Contig2 gi|402295620|gb|JX220408.1|_Nora_virus_isolate_FR1,_complete_genome 99.89 1745 2 0 1 1745 366 2110 0.0 3139 12333 +Contig3 gi|402295620|gb|JX220408.1|_Nora_virus_isolate_FR1,_complete_genome 98.78 164 0 1 1 164 377 216 4e-80 284 12333 +Contig4 gi|402295620|gb|JX220408.1|_Nora_virus_isolate_FR1,_complete_genome 99.92 2476 2 0 1 2476 5145 7620 0.0 4457 12333 +Contig5 gi|402295620|gb|JX220408.1|_Nora_virus_isolate_FR1,_complete_genome 99.89 4714 1 2 6 4715 12333 7620 0.0 8473 12333 +Contig6 gi|402295620|gb|JX220408.1|_Nora_virus_isolate_FR1,_complete_genome 99.89 894 1 0 1 894 4235 5128 0.0 1608 12333 +Contig7 gi|402295620|gb|JX220408.1|_Nora_virus_isolate_FR1,_complete_genome 99.10 222 0 1 1 222 237 18 2e-111 389 12333 |
b |
diff -r 000000000000 -r 7d96b28eec49 test-data/contigs.fa --- /dev/null Thu Jan 01 00:00:00 1970 +0000 +++ b/test-data/contigs.fa Sun Oct 15 12:52:40 2017 -0400 |
b |
b'@@ -0,0 +1,216 @@\n+>Contig1\n+TTTTGCTAAAGCTAAATCAACTATATCTGTTTCCATCAGACTCAGTTCATCGTTCACGAA\n+ATTTTTGATTTGATCGTAAACTGTTTCATATGAATTCGCTGATGTCGATGGAATTTCATC\n+CATATCGATCAATTTATTCTCTTGCAACATTCGTTTGGCCGCGATCAACTGCAAACCTGT\n+AAAAGGATTAACTCTAATTTTGACTTTCGTCGTAACTAGATTTTCTGCTGCTCCTTCTAC\n+ACATTCGGTGATGTACCTTCCTAACCAAGCACTGAAAGTTTCTGTTTTGTTAATACACAT\n+GGAATTAATGAGATTCCACGCTCTATAACTCAACATATTACTTCTCACGTGATTTAGTGT\n+AGTTAAAGGTTCAACACCTAGCTCTCGCGACTCAACATCATAGCCTTCTAAACTCCTTTC\n+GATGATATTATCAAATCTAGTTAACAACTGATCTGAAATACCGCCATACATAACTTCTTC\n+ATCTAAGTTATCTTTGAGCGGTATAAATTTCTCATCTGTCTGGATAGGTCGGCTATTCAA\n+CTCAAATGTTTCATCAAGGAAAGGCATGTTTTCGTCTCCTGGGCGGATTCTCAACAAGTG\n+ATCCCTCAATTCGCGCATTCGTTGTCTTCTTTCTAATTGCGCTCCATCCATTTGTTCTTG\n+TCCGGTGATTCCCACATCTTTAATAGTGGAGTTATAGAAATTATTTTGAATAATCAAATC\n+ATCTCCAATTATCTTCACTATTTCACTCAAAGACATGGTTTTTAGCGTGCTGGTCGTGTT\n+GCTTCCAATAGCGCTGACGGCTTTCGACATTGGTCCGTAATAAAAATCGACCCAGTCATA\n+GCTCTCGTCAATCGCTCCTCGTTTTGGCATTTTGTTCTTGTTCCTCCTCAAGCAAATTGT\n+ATGAGGGAATCGAGCATGTAATGCTTCGATATCCTCAATCGTTACGCTTTTGTCCGGCAA\n+CTTGTTACAGGTCGTAAACACCAACTTACTTCTGTATGGTAAACCTTTTTGTTTCAAATC\n+AGCTTGGTTTGTTCCCACTGCTGTATTAGAAATAAAAGTAAACCACATCAAATGATCCTT\n+GTTGTCTTTTTGTTGAAAGGCATCATCTACGTAAGTTATTTCTTGTCCGGTGTATCCTGT\n+ATCAAATTCATCTCTGCACTGCCTAGACCAAGTTGTCCATTTAGTAGCGTTTCTAAAAGA\n+AATATCGCCATGTTCCTGAACATACTCGCACACTTTTCTTGAGAGGATTGCTACGAGGTT\n+TGTCTTTCCGATTTGTTTTTCGCCTTGTATGGTAACTCCTACGGGTTTTACTCGGGTTTG\n+GTTACTGTTCTCTAACACCTTAACTTCAATAAGTAGCACTTCGAGTGATGCCAGATGTTT\n+TTGGCACTCTGTTACTACTTTATCTGATCGAAGTTCTTTCGTTTGCAAAGTGTTTAACTT\n+ATTTCTCAAAGTTGCAACTTTTTCCCTGATTTCGCCAACTCTTACAGCCCCTTGTGTTTG\n+TAAGAACTCATTTGGGTTTAATTTGAGCGTTGTTTTCATCCATGTTTCCGCTTCCGATAA\n+TTCATTAACTTCTTTTGCAACTTGCAAAATAGTATCATATGAACTATCTTTCATCATTCC\n+CATTTTAATCATCAACGGCTGCATACGTTTTATTATATTTTCGCAAGCCTTTTGATTACG\n+GTCCAAATTCACAAGAAAACTTTCAACTGGAACATCTCCAATTTGAGTCTTTGTAATCGT\n+CAATCCCATTGCTACCATAGGTAGAACATCTTCCAACATTTCTTCTGTTCCTTCTATCGC\n+CGGTCGATCTAGCATCCGTCCTACAGTACTTTCCCAAATACCAAGTGGTAACTTGAGAAT\n+ACTACTTATCATCG
TAATTTTCGAGATAAGATCTTTTTTGTTCTTAATTTGCTGTAGTTC\n+GTAGACCATCGTGATAAAGAATGTTGGATATTCTATGATTTGTTCTACACATCGCCCTAA\n+CACACCTCTACGTCCTGTTGTTCCAGTTGGGTTCGATACTATTCTCCGTATAAAATTAAC\n+TTTCTCTGTTATTACGTTAATGTTATTTCTAATATATTTAATAAAAGCATACAAAATTGC\n+AAAATAAAGGAAA\n+>Contig2\n+TATTATAAAATAATATTTAATCCCCATCTTTGCAAGATGGAAACTCTCAATAAATCAGGA\n+GTATAATAGATTTAAACCCTCACACTGAATCACGAGTATAAACAGATTCAAATATGATTA\n+ACAATCAAACAAACAAAAAGGGACCACAACTAGAGAGAGTACATTTTGGTAGTGCGCAGG\n+TTGTGGGAAAAAGTACCAAACGACGACAACGCGGAACCAAATTTGACATTGAATATACTG\n+TTAAAAGGAACGATGCACCAAAAGAGCAGAAATTCTTAGTTTCAGAAATTTTTGATGAAA\n+AGTTGGATAAACAAATAAAATATGAGAAGAAGCAAAATCATACTTTTATTAAACCGAAAT\n+TAAATTTAGTTACTAGAGAAGAACAACACGTGACTAAGAAGGTTTTAAGAGGTAAAGAAC\n+GAGCTGCAACTCATGCTTTTATGAAGGAAATGGTTGAATCTAACAAGATACAACCTAGTT\n+GGAATGTCGAATACGAAAAAGAAATAGATGAGGTTGATCTATTTTTTATGAAGAAGAAAA\n+CCAAACCTTTCTCAGGTTTTTCTATTAAGGAATTAAGAGATAGTCTAATTGTGCAGTCAG\n+ACGATAAAAACATGGCACAGCCAACCGTGATGAGTTCAACCAATGAAATTGTTACACCCC\n+GTGAGGAGATAAGCGTTTCTGCTATCTCTGAACAACTGGCATCCTTGATGGAGAGAGTTG\n+ATAAACTCGAGAAGATGAATGCTGCTTTGGAGGAAGAAAACAAGCAGCTAAAGAAAGAGA\n+GAGAGGCGACTATTAAGTCAGTTAAGAAAGAGGCAAAGAGGACTAAACAAGAGAAGCCTC\n+AGATTGCGAAGAAAACGCAACACAAGAGTTTAGGAGTAAATCTTAAAATCACCAAGACCA\n+AAGTAGTTGGTCAGGAACAATGTTTGGAAATTGAAAATACTCAGCATAAGAAATTTGTTG\n+AGAAGCCAAGCATGCCATCCAAAGTGAGCAAGAAGATGAAGGGACAACAGTTGAAAAAGA\n+CTATTCGTACTTGGTATGAATTTGATCCCTCTAAACTCGTTCAGCATCAAAAAGAAGTGT\n+TGAACAGTGTTGTTACCAACACAACCTTCGCAGATAAAGTCCGTGAAACTGGTATACCTA\n+AACAAAAGATTAGGTATACTGCAAAACCACCAGCAGAGGAGAAGAGGAGTATCCATTTCT\n+ATGGTTATAAGCCAAAAGGAATCCCTAACAAAGTTTGGTGGAATTGGGTCACCACTGGCA\n+CAGCTATGGACGCTTATGAAAAAGCTGACCATTATCTGTATCACCAATTTAAACGAGAAA\n+TGATGGTATACAGAAATAAATGGGTCAAGTTTAGTAAGGAGTTCAATCCGTACCTATCGG\n+AACCGAAAATGGTATGGGAAGAGAATACATGGGAATATGAATATAAAACAGACGTTCCCT\n+ACAATTTTATTCTCAAATGGCGCCAGTTAGTGCAGACCTACAAGCCTAACACACCAATCC\n+AGGCTGATTGGTACAAAATCTCGCAGAAACAACAATGTTAATTGAAGTTTTCATTAATTC\n+TTTGTTGCAAAATCTAGGTATCATGATGTCTTTCCGTGACCTAGTGGCGAGCCCATGGAT\n+ATTGCTAGTAATAGCTATACCCTTGTGTGCATTT
GCCAGTTCAGCGTCTATGGTTAGGGA\n+GATGCTTTTCCGTCATAAAATTACAGAAAATATTTTAAA'..b'TGAGTTATTGATTGAATCTTTAACTTCGAGCACTCCACTGATCTGCGGCGGGCGTGGTA\n+TGTTAATTTGTGCAACCATCGTTCGGATATATCCAATACTTTTCGATCCGGTTGTCCAAA\n+CATTTCGCCTCCATGGTAGGACCATCGACTCACCATCTCTAGACAATGTAACATTGTTGT\n+ACGGGTCTATGGTTAGCGTGGTCCAGTTCATGTTAGCTGGGTTTGACAGACTGATTTTGG\n+CGAAATCATACCACTTTGTTGCCAAATGTCCCGTATCGTTCTTTCGCGTTGCCACTGATG\n+AAACTGGGACTTCCGGCTGTTCTGCTTGTGTTTCGACGACTGGCGCTACAGGAATCGCAG\n+AATGGTCGTAAACCAATTCCTGTACAAGTTTACCACCTTCGGCTGTAACTTCATTGTCAG\n+CTTGTTCCTCGCCCATAATTGGTTTTGTTGGGGGAACGGGCGGCTTTGGCACTGGAACTG\n+GGACAAAGTTCATGCCTTTTTCGTTGTAAGCTGACGTATCCGCATTTTTGTAGCCTGTGG\n+CTTTAATATTCGCCATGCAACACCAAACGGTGATGCTGAGTGGGGTGTTGACCGTCTCGT\n+TACTGTTATCTTCGATAGTTTCGATAACAATACTCCCTCCACTCTGTCCGACTCGACCTA\n+CGGATGTTTCTACGGTCGATAGATCGTTGCTCCAAGGGACTGAAAGTGCAATTGTTGGAG\n+ATGCACTTGGCTTAAACCGAATTCCTCGTGTTACGGTTGTAGTGTCAAATTCAGGAGCAT\n+AGATCTTCAGATAGATACCTGTTCCCAAGGGTGCTGGAACATGCACTATATAATAAAAAT\n+CCGCATGGAAATAATTATATAGTCCTAGCACCGTTTTCTGTTGGTAAGTGAAAACAGGGT\n+CTATCACAAGTCGGGTTCCTACTGCTGGAGCAGAAAAGCGGCGCGGTAAGAAAGCACTAA\n+ACGCATTACCAATATCGGCTCGACCAAATATAAAATCTGGTGTGATGTTTTTACGTGGAG\n+CTCGCAATTGATAAGCAACAAAGGGATCAATCCATGCTGGATGGTCGACCACTTGTGGCT\n+CTCCTACTTCACTAACTACTATTCCAGTTGAGGTGTTGTCGTCTTCTTCAGTTGTTTTGG\n+CAAGGGTTGACAGGCCAGCGATGACGCGTAGGGGCATGTCGTATATATGCATGGTTTGTG\n+TTGGATTCTGCATACTCGTCTTGCGGTTAATCTCTCTGTGTTAACCAAACAGGTTCTGAC\n+AGTTTAATGTCGTGTCATAGACATGTCATGTCCGGTTTACATAGAGTCGTAAATCACTGA\n+CGTGCTTCCGGTTATATCTTCGATACTATTTCCGTTAGCAAAGTAACCATTGACTCTATA\n+AGGTACACCTTTTAAAACGGGGACGTTAGCCAAACTATATGATGTTGTCAACGAAGTAAT\n+CGTCAATATGCTTGTAGTTGTTCCCGCATTTGTAGGTGCTGCTCTTACTCCAGTGCTATA\n+ATATACATCGGCGAAAAAGTATATTGTAGTATAGCGAGTAGTTCCATTTGGCATATTGAT\n+CACGAATTTGTAAATTCTGTTTTTCAAAACCCACGGTCCTACATCTCTAACCTCTAGCGC\n+GGCAATTCTGGTGCGTAATGCCTCAATGGAGTTAGCATTGGCATTCACTGATATGTGCAA\n+TTCTCCTATCTCATCTTTCATTGTCACAAGTGAATGTTCTACGTCCTGTTGTTTTTGTGT\n+GACGGTTGCTACGTCTACCTTTAACACGGTAATCTCATCAGTATTAAATAATACTTGTTT\n+ACTAAGAGATTCTGTTGTTGTGTTCAACGTGTCTAAGG
AGTCTTTCGTAGTTTGATCAAG\n+CTCGTTTAATGTTGTGGCAAGGGTGTTAATCTGTTTTGCCTGTTGACTTGTTGTTGTGGT\n+TAATTTGTCAACTTCTGAATTCATTTCTACCAATGCTGTATTGATATTAACGAATTGTTC\n+TTCATTTCGAGCTTGATTGTTGTCAACTACTTTAGCTAAACCGTCAAGTTGCAGTTTTTG\n+TTGATCGAGCTGGGTCTTTACTGCTGTTACTGAAGATTGAATTGACTTAATCTCAGTAAC\n+CTCGTTCTCGTCTAAAACGGTGAAAAGAGTGGTGTTCTGATCAAAGATCTCCTCTTTTAA\n+TGCCATAATAACGATTACAGAATTTTTGGAAAGTAACTTCCCAGCTCGTATTCAACAATA\n+CTGCTAATGCTCCATTCAAGGTTCTATTTGTACCACATTTTAGCTTTTGACAAAGCTCAT\n+TGTAATACTCCTCACCCCAAAGAGCGGCTTCGATCAACTGTTCTTGCACGAGATTTACCC\n+ACACAGTTATCTGATCTTCGCGGATATCAGTCCATACAAACGGTCCTTCAATAGATCGTT\n+GTAGTAATGGAGCTAAAACCATACCGTTTTCTAACTTAAATCCTCTTTTCAAGAATTGTA\n+GGTTTTCAAAAGAAGTAAATGGCTTCTCTTCTCCATCCTTTGAACCTGGTGTCATGATAT\n+GTCCTGTAGCATTTAGTACATCTCGATAAGTACAATAATTATACTTATCCTTATACTCAT\n+CGCTAACGCTTTTTATAATATCATCACCAAACGCGACGCTCGAGACATTCTGTCGGTAAT\n+CCCACAGTGATCTTAGGCCGGTTGTCTTCACCCACGCATACAAACCATAAATATCGTTCG\n+CCAGGCAATTATCAATTGTAGTAGTATAACTACCA\n+>Contig6\n+TAGCTTTAGCAAAAATTAGCTTATCGCAAATCCGAGGCAACATCAAGAGATCAACCTGGC\n+TGGACGTAAATGATTGGATATTAGCTTTGAAACATAAAATTTCAGGAAAAAGCTTTGCCA\n+AACATATGGATCTGTATCCTAGCTCGCTAGATTCTTTTCTTCTTACACTCAAAGATTGGG\n+AGGTTGAAGACCGTATAAAGTTTAACTCTATTTACAAGCAAAAGGTATTGTTTGTTCAAT\n+CTAGATTTTCACTTTACTGTTGGTCTCCTTTTATATCTCGTGGAACACGATTTGTGAAAG\n+TGACTTCTCAGTTTAGAGAGTTAGTGGATAAGTTAGAAACTGGCATTCTATTCCATGAAA\n+TAAAATCGGTTACAAATGGAATTAGATGGTTAGGAGGAGCAGGGAACAATGGACACGTTG\n+GAGAAAGAGTAAGAGTTATTGCTCATACAGCCCAATTTCCGAAAAAGAGTTACCCTCAGA\n+ATGGATTCCCTATAAACGAAGAACTACATAGGGAATGGATCCAACTTGTTATGAACTCGG\n+ACTATAAGTATCACTCACTTATAGGAGAAGAAAAAGTAAATATTCTTTGGAACCTTATTA\n+GGCTCCAACCTCAACATGAGGTGGAGAATTTTAAGGTTTACTTAGAAGATTTGCAGGCGT\n+CCCCGCCGAAAACTGGGACAATTTGTGCAAAAGTAGTGAATGATATAAAAGCCGAAGTAA\n+CTTCAAGTTATAGGCAATTTAACAATTACTACACTCGTTTAACAAAAGATGGTATGCACA\n+CACTTTTATCAATGCTTTCTAGGATAGGTGTTCCAATTTCAGATTATTGGAATGACCTTC\n+TTGTCGACAAAGCGCCAGCTATTACAGCGGTTACTGTTGGAGCAATAACAAGTT\n+>Contig7\n+AAGACATTGATTTTTTTCAAGTTCAATGTATAACTCTTTTTGTTCGTTTATTTGTTGTTT\n+GCTCAAAGTTTCTGTTAAGAGGTCTCATAAG
TATCCTGTTTACAACGGACCAGCATTATT\n+CCCTTCGGCACTTCCGATACTCTACTAATCCTTAATACCAGAATCAGCATAATCAGCGAA\n+GTGGTATCTCGCGCTTCTTTTTCCAGTACTCATTAACCCCCC\n' |
b |
diff -r 000000000000 -r 7d96b28eec49 test-data/guideSequence.fa --- /dev/null Thu Jan 01 00:00:00 1970 +0000 +++ b/test-data/guideSequence.fa Sun Oct 15 12:52:40 2017 -0400 |
b |
b'@@ -0,0 +1,178 @@\n+>gi|402295620|gb|JX220408.1|_Nora_virus_isolate_FR1,_complete_genome\n+GCAAAAAGGCCCCTGGGGGGGGGTTAATGAGTACTGGAAAAAGAAGCGCGAGATACCACTTCGCTGATTA\n+TGCTGATTCTGGTATTAAGGATTAGTAGAGTATCGGAAGTGCCGAAGGGAATAATGCTGGTCCGTTGTAA\n+ACAGGATACTTATGAGACCTCTTAACAGAAACTTTGAGCAAACAACAAATAAACGAACAAAAAGAGTTAT\n+ACATTGAACTTGAAAAATCAATGTCTTTTATTTAGACTGATTTATATTGGTCTTTATAATCGTAAGGAAT\n+AATTCTCATCTAATGATATCGATGTAAAATGTATCATTCTAGCTATTCAATTATATTAATTGAGCTTAGC\n+ATCTGATTAAATTATTATTATAAAATAATATTTAATCCCCATCTTTGCAAGATGGAAACTCTCAATAAAT\n+CAGGAGTATAATAGATTTAAACCCTCACACTGAATCACGAGTATAAACAGATTCAAATATGATTAACAAT\n+CAAACAAACAAAAAGGGACCACAACTAGAGAGAGTACATTTTGGTAGTGCGCAGGTTGTGGGAAAAAGTA\n+CCAAACGACGACAACGCGGAACCAAATTTGACATTGAATATACTGTTAAAAGGAACGATGCACCAAAAGA\n+GCAGAAATTCTTAGTTTCAGAAATTTTTGATGAAAAGTTGGATAAACAAATAAAATATGAGAAGAAGCAA\n+AATCATACTTTTATTAAACCGAAATTAAATTTAGTTACTAGAGAAGAACAACACGTGACTAAGAAGGTTT\n+TAAGAGGTAAAGAACGAGCTGCAACTCATGCTTTTATGAAGGAAATGGTTGAATCTAACAAGATACAACC\n+TAGTTGGAATGTCGAATACGAAAAAGAAATAGATGAGGTTGATCTATTTTTTATGAAGAAGAAAACCAAA\n+CCTTTCTCAGGTTTTTCTATTAAGGAATTAAGAGATAGTCTAATTGTGCAGTCAGACGATAAAAACATGG\n+CACAGCCAACCGTGATGAGTTCAACCAATGAAATTGTTACACCCCGTGAGGAGATAAGCGTTTCTGCTAT\n+CTCTGAACAACTGGCATCCTTGATGGAGAGAGTTGATAAACTCGAGAAGATGAATGCTGCTTTGGAGGAA\n+GAAAACAAGCAGCTAAAGAAAGAGAGAGAGGCGACTATTAAGTCAGTTAAGAAAGAGGCAAAGAGGACTA\n+AACAAGAGAAGCCTCAGATTGCGAAGAAAACGCAACACAAGAGTTTAGGAGTAAATCTTAAAATCACCAA\n+GACCAAAGTAGTTGGTCAGGAACAATGTTTGGAAATTGAAAATACTCAGCATAAGAAATTTGTTGAGAAG\n+CCAAGCATGCCATCCAAAGTGAGCAAGAAGATGAAGGGACAACAGTTGAAAAAGACTATTCGTACTTGGT\n+ATGAATTTGATCCCTCTAAACTCGTTCAGCATCAAAAAGAAGTGTTGAACAGTGTTGTTACTAACACAAC\n+CTTCGCAGATAAAGTCCGTGAAACTGGTATACCTAAACAAAAGATTAGGTATACTGCAAAACCACCAGCA\n+GAGGAGAAGAGGAGTATCCATTTCTATGGTTATAAGCCAAAAGGAATCCCTAACAAAGTTTGGTGGAATT\n+GGGTCACCACTGGCACAGCTATGGACGCTTATGAAAAAGCTGACCATTATCTGTATCACCAATTTAAACG\n+AGAAATGATGGTATACAGAAATAAATGGGTCAAGTTTAGTAAGGAGTTCAATCCGTACCTATCGGAACCG\n+AAAATGGTATGGGAAGAGAATACATGGGAATATGAATATAAAACAGACGTTCCCTACAATTTTATTCTCA\n+AATGGCGCC
AGTTAGTGCAGACCTACAAGCCTAACACACCAATCCAGGCTGATTGGTACAAAATCTCGCA\n+GAAACAACAATGTTAATTGAAGTTTTCATTAATTCTTTGTTGCAAAATCTAGGTATCATGATGTCTTTCC\n+GTGACCTAGTGGCGAGCCCATGGATACTGCTAGTAATAGCTATACCCTTGTGTGCATTTGCCAGTTCAGC\n+GTCTATGGTTAGGGAGATGCTTTTCCGTCATAAAATTACAGAAAATATTTTAAAAGGAACAGGAGTAGAA\n+GAATTGTTTAATCCATTCGGGATAATTATTAAATATTTCCTTTATTTTGCAATTTTGTATGCTTTTATTA\n+AATATATTAGAAATAACATTAACGTAATAACAGAGAAAGTTAATTTTATACGGAGAATAGTATCGAACCC\n+AACTGGAACAACAGGACGTAGAGGTGTGTTAGGGCGATGTGTAGAACAAATCATAGAATATCCAACATTC\n+TTTATCACGATGGTCTACGAACTACAGCAAATTAAGAACAAAAAAGATCTTATCTCGAAAATTACGATGA\n+TAAGTAGTATTCTCAAGTTACCACTTGGTATTTGGGAAAGTACTGTAGGACGGATGCTAGATCGACCGGC\n+GATAGAAGGAACAGAAGAAATGTTGGAAGATGTTCTACCTATGGTAGCAATGGGATTGACGATTACAAAG\n+ACTCAAATTGGAGATGTTCCAGTTGAAAGTTTTCTTGTGAATTTGGACCGTAATCAAAAGGCTTGCGAAA\n+ATATAATAAAACGTATGCAGCCGTTGATGATTAAAATGGGAATGATGAAAGATAGTTCATATGATACTAT\n+TTTGCAAGTTGCAAAAGAAGTTAATGAATTATCGGAAGCGGAAACATGGATGAAAACAACGCTCAAATTA\n+AACCCAAATGAGTTCTTACAAACACAAGGGGCTGTAAGAGTTGGCGAAATCAGGGAAAAAGTTGCAACTT\n+TGAGAAATAAGTTAAACACTTTGCAAACGAAAGAACTTCGATCAGATAAAGTAGTAACAGAGTGCCAAAA\n+ACATCTGGCATCACTCGAAGTGCTACTTATTGAAGTTAAGGTGTTAGAGAACAGTAACCAAACCCGAGTA\n+AAACCCGTAGGAGTTACCATACAAGGCGAAAAACAAATCGGAAAGACAAACCTCGTAGCAATCCTCTCAA\n+GAAAAGTGTGCGAGTATGTTCAGGAACATGGCGATATTTCTTTTAGAAACGCTACTAAATGGACAACTTG\n+GTCTAGGCAGTGCAGAGATGAATTTGATACAGGATACACCGGACAAGAAATAACTTACGTAGATGATGCC\n+TTTCAACAAAAAGACAACAAGGATCATTTGATGTGGTTTACTTTTATTTCTAATACAGCAGTGGGAACAA\n+ACCAAGCTGATTTGAAACAAAAAGGTTTACCATACAGAAGTAAGTTGGTGTTTACGACCTGTAACAAGTT\n+GCCGGACAAAAGCGTAACGATTGAGGATATCGAAGCATTACATGCTCGATTCCCTCATACAATTTGCTTG\n+AGGAGGAACAAGAACAAAATGCCAAAACGAGGAGCGATTGACGAGAGCTATGACTGGGTCGATTTTTATT\n+ACGGACCAATGTCGAAAGCCGTCAGCGCTATTGGAAGCAACACGACCAGCACGCTAAAAACCATGTCTTT\n+GAGTGAAATAGTGAAGATAATTGGAGATGATTTGATTATTCAAAATAATTTCTATAACTCCACTATTAAA\n+GATGTGGGAATCACCGGACAAGAACAAATGGATGGAGCGCAATTAGAAAGAAGACAACGAATGCGCGAAT\n+TGAGGGATCACTTGTTGAGAATCCGCCCAGGAGACGAAAACATGCCTTTCCTTGATGAAACATTTGAGTT\n+GAATAGCCGACCTATCCAGACAGATGAGAAATTTATAC
CGCTCAAAGATAACTTAGATGAAGAAGTTATG\n+TATGGCGGTATTTCAGATCAGT'..b'GTCAACAGGCAAAACAGATTAAC\n+ACCCTTGCCACAACATTAAACGAGCTTGATCAAACTACGAAAGACTCCTTAGACACGTTGAACACAACAA\n+CAGAATCTCTTAGTAAACAAGTATTATTTAATACTGATGAGATTACCGTGTTAAAGGTAGACGTAGCAAC\n+CGTCACACAAAAACAACAGGACGTAGAACATTCACTTGTGACAATGAAAGATGAGATAGGAGAATTGCAC\n+ATATCAGTGAATGCCAATGCTAACTCCATTGAGGCATTACGCACCAGAATTGCCGCGCTAGAGGTTAGAG\n+ATGTAGGACCGTGGGTTTTGAAAAACAGAATTTACAAATTCGTGATCAATATGCCAAATGGAACTACTCG\n+CTATACTACAATATACTTTTTCGCCGATGTATATTATAGCACTGGAGTAAGAGCAGCACCTACAAATGCG\n+GGAACAACTACAAGCATATTGACGATTACTTCGTTGACAACATCATATAGTTTGGCTAACGTCCCCGTTT\n+TAAAAGGTGTACCTTATAGAGTCAATGGTTACTTTGCTAACGGAAATAGTATCGAAGATATAACCGGAAG\n+CACGTCAGTGATTTACGACTCTATGTAAAAACCGGACATGACATGTCTATGACACGACATTAAACTGTCA\n+GAACCTGTTTGGTTAACACAGAGAGATTAACCGCAAGACGAGTATGCAGAATCCAACACAAACCATGCAT\n+ATATACGACATGCCCCTACGCGTCATCGCTGGCCTGTCAACCCTTGCCAAAACAACTGAAGAAGACGACA\n+ACACCTCAACTGGAATAGTAGTTAGTGAAGTAGGAGAGCCACAAGTGGTCGACCATCCAGCATGGATTGA\n+TCCCTTTGTTGCTTATCAATTGCGAGCTCCACGTAAAAACATCACACCAGATTTTATATTTGGTCGAGCC\n+GATATTGGTAATGCGTTTAGTGCTTTCTTACCGCGCCGCTTTTCTGCTCCAGCAGTAGGAACCCGACTTG\n+TGATAGACCCTGTTTTCACTTACCAACAGAAAACGGTGCTAGGACTATATAATTATTTCCATGCGGATTT\n+TTATTATATAGTGCATGTTCCAGCACCCTTGGGAACAGGTATCTATCTGAAGATCTATGCTCCTGAATTT\n+GACACTACAACCGTAACACGAGGAATTCGGTTTAAGCCAAGTGCATCTCCAACAATTGCACTTTCAGTCC\n+CTTGGAGCAACGATCTATCGACCGTAGAAACATCCGTAGGTCGAGTCGGACAGAGTGGAGGGAGTATTGT\n+TATCGAAACTATCGAAGATAACAGTAACGAGACGGTCAACACCCCACTCAGCATCACCGTTTGGTGTTGC\n+ATGGCGAACATTAAAGCCACAGGCTACAAAAATGCGGATACGTCAGCTTACAACGAAAAAGGCATGAACT\n+TTGTCCCAGTTCCAGTGCCAAAGCCGCCCGTTCCCCCAACAAAACCAATTATGGGCGAGGAACAAGCTGA\n+CAATGAAGTTACAGCCGAAGGTGGTAAACTTGTACAGGAATTGGTTTACGACCATTCTGCGATTCCTGTA\n+GCGCCAGTCGTCGAAACACAAGCAGAACAGCCGGAAGTCCCAGTTTCATCAGTGGCAACGCGAAAGAACG\n+ATACGGGACATTTGGCAACAAAGTGGTATGATTTCGCCAAAATCAGTCTGTCAAACCCAGCTAACATGAA\n+CTGGACCACGCTAACCATAGACCCGTACAACAATGTTACATTGTCTAGAGATGGTGAGTCGATGGTCCTA\n+CCATGGAGGCGAAATGTTTGGACAACCGGATCGAAAAGTATTGGATATATCCGAACGATGGTTGCACAAA\n+TTAACATACCACGC
CCGCCGCAGATCAGTGGAGTGCTCGAAGTTAAAGATTCAATCAATAACTCAAGTAT\n+TTCACTGGTAGAATTTGGAGGAAAAGTAGAGATTCCAATTATTCCGAAGGTTATGAACGGACTAGTAACA\n+AGTGCTAGTTTGCCAAGGCATAGACTAAACCCATGGATGAGAACCGCCGAAAGTAAGGTTGAATTGCAAT\n+ATCGAATTATTGCTTTTAATCGAACTAGCGACATTGCTGACCTTAACGTTAGCGTTTTGTTGCGACCTGG\n+CGATTCGCAATTCCAATTGCCGATGAAACCTGACAATAGTGTGGATACACGTCATTTTGAGCTTGTTGAA\n+GCTTTAATGTACCACTACGATAGCCTCCGAATTCGAGGAGAAGAACAGAGTCTGCCAGAAAATGCACCTA\n+ATGCAGTTTCAAACCCTCAGCAGTTCATTACACCCGCAACCGCTCTAAGTGCCGAAGAATATAATGTGCA\n+CGAGGCGTTGGGTGAAACTGAGGAGTTGGAGCTGGATGAATTTCCGGTTCTGGTGTTCAAGGGAAATGTT\n+CCCGTTGACTCAGTGACGTCCATTCCTTTGGACCTCGCAACTATATACGACTTTGCTTGGGACGGAGAGC\n+AGAATGCAATTTCTCAGAAATTTCAGCGTTTTGCTCATCTGATACCGAAAAGCGCAGGTGGTTTTGGCCC\n+AGTGATTGGTAATTATACTATCACGGCTAACCTCCCCACCGGTGTAGCAGGTCGTATTCTGCACAATTGT\n+CTCCCAGGAGATTGTGTAGATCTAGCAGTATCGAGAATTTTTGGCTTGAAGAGCCTTCTCGGTGTTGCAG\n+GAACAGCAGTTTCAGCCATTGGTGGCCCACTCCTTAACGGTTTGGTTAACACCGCAGCGCCTATCCTTAG\n+TGGAGCAGCGCACGCCATTGGTGGAAATGTTGTAGGAGGACTGGCTGATGCAGTGATCGACATTGGATCT\n+AATTTGCTGACGCCAAAAGAAAAAGAACAACCAAGCGCAAATTCAAGCGCGATTTCTGGAGATATTCCGA\n+TTTCGCGTTTTGTAGAGATGCTCAAGTATGTCAAGGAGAATTACCAGGATAATCCTGTGTTCCCGACTTT\n+ACTTGTTGAACCACAAAACTTCATCTCAAACGCAATGACCGCACTCAAAACAATTCCAATTGAGGTCTTT\n+GCCAACATGCGCAATGTGAAAGTTGAACGAAATTTGTTCGACCGAACGGTTGTTCCAACTGTGAAGGAAG\n+CTACTCTAGCTGATATTGTCATACCTAATCATATGTATGGCTATATTCTCCGAGACTTCCTCCAAAACAA\n+ACGAGCGTTTCAATCTGGGACCAAACAAAATGTGTACTTTCAGCAGTTTCTAACTGTTCTATCTCAACGT\n+AATACCCGTACACATATTACGCTCAACGACATCACAAGTTGCTCTATTGATAGTGAGTCGATTGCAAACA\n+AAATAGAGAGAGTAAAACGCTACTTGAGTGCAAACTCGAGTGGGGAGACCACGGAAGAATTTTCGCGAAC\n+AGACACCGGTCTGCTACCTACTACGACCCGCAAAATCGTATTAGGTGAAAGTAAACGCAGGACGGAACGA\n+AACGTAGCAGAAACTGTTTTCCCTTCCGTGAGGCAGTAGATTAAATCCAAAACTCGCCATGTGCGCGTCT\n+CAGAAACTAATTTTTAAAATTGGTTTGCGCGTATGGTTAAAAAGAGTCACATTAAATATGAGGATGGTCG\n+CTATAATTTTCTAGCAGAAGATTATAAAGGACGGTGTGATGATGTTTTGGAGCCCGCACTGGGTGTGGGT\n+TCGTAGTGCTAGCAATTGCAACTTTTCCTGAAAGTTAATACCTATAGTTTATAGGAGAAAAATTAACATT\n+TATTGAGAATATCTGTGCAAACGACTCCCCACGCGGGGAGTAG
TGGAATCTTGATAAACAGGTTTTTTAA\n+GCTTTTGCGTTTCCGAAAGGGTTACTCTGGCTGAACCAGCAGTTTTTATAACTGTGGGTAGCCCCTCGGA\n+AAATCAGGTTTGC\n' |