Mercurial > repos > devteam > megablast_xml_parser
changeset 0:03ca082aeb2e draft
Imported from capsule None
author | devteam |
---|---|
date | Mon, 19 May 2014 12:33:19 -0400 |
parents | |
children | fbff957a3655 |
files | megablast_xml_parser.py megablast_xml_parser.xml repository_dependencies.xml test-data/megablast_xml_parser_test1.gz test-data/megablast_xml_parser_test1_out.tabular |
diffstat | 5 files changed, 245 insertions(+), 0 deletions(-) [+] |
line wrap: on
line diff
#!/usr/bin/env python
"""Convert BLAST XML output into a tab-delimited table.

Usage: megablast_xml_parser.py <blast_output.xml> <output.tabular>

One line is written per <Hsp> element.  Each line holds the query name,
the query length, the subject name, the subject length and then the text
of every HSP child element listed in HSP_TAGS, in that order.
"""

import sys
import os
import re

if sys.version_info[:2] >= (2, 5):
    try:
        # C-accelerated parser; this alias was removed in Python 3.9.
        import xml.etree.cElementTree as ElementTree
    except ImportError:
        import xml.etree.ElementTree as ElementTree
else:
    # Legacy fallback kept from the original script for interpreters that
    # ship without xml.etree; "eggs" must be imported before pkg_resources.
    from galaxy import eggs
    import pkg_resources
    pkg_resources.require("elementtree")
    from elementtree import ElementTree

# Child elements of <Hsp> that are written, in this order, after the four
# leading query/subject columns.
HSP_TAGS = (
    "Hsp_bit-score",
    "Hsp_evalue",
    "Hsp_query-from",
    "Hsp_query-to",
    "Hsp_hit-from",
    "Hsp_hit-to",
    "Hsp_query-frame",
    "Hsp_hit-frame",
    "Hsp_identity",
    "Hsp_align-len",
    "Hsp_qseq",
    "Hsp_hseq",
    "Hsp_midline",
)


def stop_err(msg):
    """Write *msg* to stderr and terminate with a non-zero exit status."""
    sys.stderr.write("%s\n" % msg)
    # A bare sys.exit() would report success (status 0) for a failed run.
    sys.exit(1)


def _subject_name(hit_id):
    """Return the column-3 subject name for the text of a <Hit_id> element.

    Ids starting with "gi" are reduced to their second pipe-separated
    field.  Any other id, an id without a second field, or a missing id
    (None) is returned unchanged instead of raising.
    """
    if hit_id is not None and hit_id.startswith("gi"):
        parts = hit_id.split("|")
        if len(parts) > 1:
            return parts[1]
    return hit_id


def _write_iteration(iteration, outfile):
    """Write one tab-delimited line to *outfile* per <Hsp> in *iteration*."""
    query = iteration.findtext("Iteration_query-def")
    query_len = iteration.findtext("Iteration_query-len")
    for hit in iteration.findall("Iteration_hits/Hit"):
        subject = _subject_name(hit.findtext("Hit_id"))
        subject_len = hit.findtext("Hit_len")
        for hsp in hit.findall("Hit_hsps/Hsp"):
            fields = [query, query_len, subject, subject_len]
            fields.extend(hsp.findtext(tag) for tag in HSP_TAGS)
            # "%s" keeps the original rendering of absent elements ("None").
            outfile.write("\t".join("%s" % field for field in fields) + "\n")


def __main__():
    """Parse the XML file named by argv[1] and write the table to argv[2].

    Exits through stop_err() when arguments are missing, when the input
    cannot be opened or its first element cannot be parsed (in which case
    the output file is never opened), or when an error occurs while the
    remaining input is being processed.
    """
    if len(sys.argv) < 3:
        stop_err("Usage: megablast_xml_parser.py <blast_output.xml> <output.tabular>")
    source, destination = sys.argv[1], sys.argv[2]

    try:
        context = iter(ElementTree.iterparse(source, events=("start", "end")))
        # The first event carries the document's root element.
        event, root = next(context)
    except Exception:
        stop_err("Invalid data format.")

    with open(destination, "w") as outfile:
        try:
            for event, elem in context:
                if event == "end" and elem.tag == "Iteration":
                    _write_iteration(elem, outfile)
                    # Drop processed nodes so the tree does not keep growing.
                    root.clear()
                    elem.clear()
        except Exception:
            stop_err("The input data is malformed, or there is more than one dataset in the input file. Error: %s" % sys.exc_info()[1])


if __name__ == "__main__":
    __main__()
--- /dev/null Thu Jan 01 00:00:00 1970 +0000 +++ b/megablast_xml_parser.xml Mon May 19 12:33:19 2014 -0400 @@ -0,0 +1,60 @@ +<tool id="megablast_xml_parser" name="Parse blast XML output" version="1.0.0"> +<description></description> +<command interpreter="python">megablast_xml_parser.py $input1 $output1</command> +<inputs> + <param name="input1" type="data" format="blastxml" label="Megablast XML output" /> +</inputs> +<outputs> + <data name="output1" format="tabular"/> +</outputs> +<tests> + <test> + <param name="input1" value="megablast_xml_parser_test1.gz" ftype="blastxml" /> + <output name="output1" file="megablast_xml_parser_test1_out.tabular" ftype="tabular" /> + </test> +</tests> +<help> + +**What it does** + +This tool processes the XML output of any NCBI blast tool (if you run your own blast jobs, the XML output can be generated with the **-m 7** option). + +----- + +**Output fields** + +This tool returns tab-delimited output with the following fields:: + + Description Example + ----------------------------------------- ----------------- + + 1. Name of the query sequence Seq1 + 2. Length of the query sequence 30 + 3. Name of target sequence gnl|BL_ORD_ID|0 + 4. Length of target sequence 5528445 + 5. Alignment bit score 59.96 + 6. E-value 8.38112e-11 + 7. Start of alignment within query 1 + 8. End of alignment within query 30 + 9. Start of alignment within target 5436010 + 10. End of alignment within target 5436039 + 11. Query frame 1 + 12. Target frame 1 + 13. Number of identical bases within 29 + the alignment + 14. Alignment length 30 + 15. Aligned portion (sequence) of query CGGACAGCGCCGCCACCAACAAAGCCACCA + 16. Aligned portion (sequence) of target CGGACAGCGCCGCCACCAACAAAGCCATCA + 17. Midline indicating positions of ||||||||||||||||||||||||||| || + matches within the alignment + +------ + +.. class:: infomark + +Note that this form of output does not contain alignment identity value. 
However, it can be computed by dividing the number of identical bases within the alignment (Field 13) by the alignment length (Field 14) using *Text Manipulation->Compute* tool + + + +</help> +</tool>
--- /dev/null Thu Jan 01 00:00:00 1970 +0000 +++ b/repository_dependencies.xml Mon May 19 12:33:19 2014 -0400 @@ -0,0 +1,4 @@ +<?xml version="1.0"?> +<repositories> + <repository changeset_revision="de11e1a921c4" name="blast_datatypes" owner="devteam" toolshed="http://toolshed.g2.bx.psu.edu" /> +</repositories>
--- /dev/null Thu Jan 01 00:00:00 1970 +0000 +++ b/test-data/megablast_xml_parser_test1_out.tabular Mon May 19 12:33:19 2014 -0400 @@ -0,0 +1,103 @@ +0_0.666667 30 gnl|BL_ORD_ID|0 5528445 59.96 8.38112e-11 1 30 5436010 5436039 1 1 30 30 CGGACAGCGCCGCCACCAACAAAGCCACCA CGGACAGCGCCGCCACCAACAAAGCCACCA |||||||||||||||||||||||||||||| +1_0.600000 30 gnl|BL_ORD_ID|0 5528445 59.96 8.38112e-11 1 30 696993 697022 1 1 30 30 AAAACACCGGATGCTCCGGCGCTGGCAGAT AAAACACCGGATGCTCCGGCGCTGGCAGAT |||||||||||||||||||||||||||||| +2_0.400000 30 gnl|BL_ORD_ID|0 5528445 59.96 8.38112e-11 1 30 4100018 4100047 1 1 30 30 TTTGCTTTTAGTACACCGGATTCAGAACCA TTTGCTTTTAGTACACCGGATTCAGAACCA |||||||||||||||||||||||||||||| +3_0.566667 30 gnl|BL_ORD_ID|0 5528445 59.96 8.38112e-11 30 1 2305844 2305873 1 -1 30 30 CCGTCCAGAAAGGTGTATTCATGGGGACGG CCGTCCAGAAAGGTGTATTCATGGGGACGG |||||||||||||||||||||||||||||| +4_0.766667 30 gnl|BL_ORD_ID|0 5528445 59.96 8.38112e-11 1 30 3457901 3457930 1 1 30 30 CACGCTACGTGCGCCCCCGCCCAGAAGGCG CACGCTACGTGCGCCCCCGCCCAGAAGGCG |||||||||||||||||||||||||||||| +5_0.533333 30 gnl|BL_ORD_ID|0 5528445 59.96 8.38112e-11 30 1 1264131 1264160 1 -1 30 30 GCACTTAACCCGCTTCGGCGGGTTTTGTTT GCACTTAACCCGCTTCGGCGGGTTTTGTTT |||||||||||||||||||||||||||||| +5_0.533333 30 gnl|BL_ORD_ID|0 5528445 59.96 8.38112e-11 30 1 1636485 1636514 1 -1 30 30 GCACTTAACCCGCTTCGGCGGGTTTTGTTT GCACTTAACCCGCTTCGGCGGGTTTTGTTT |||||||||||||||||||||||||||||| +5_0.533333 30 gnl|BL_ORD_ID|0 5528445 59.96 8.38112e-11 1 30 2318694 2318723 1 1 30 30 AAACAAAACCCGCCGAAGCGGGTTAAGTGC AAACAAAACCCGCCGAAGCGGGTTAAGTGC |||||||||||||||||||||||||||||| +5_0.533333 30 gnl|BL_ORD_ID|0 5528445 59.96 8.38112e-11 1 30 2777043 2777072 1 1 30 30 AAACAAAACCCGCCGAAGCGGGTTAAGTGC AAACAAAACCCGCCGAAGCGGGTTAAGTGC |||||||||||||||||||||||||||||| +6_0.533333 30 gnl|BL_ORD_ID|0 5528445 59.96 8.38112e-11 1 30 1185124 1185153 1 1 30 30 TAAGCCGTTACTGGCAGCAAGTGCAGGCAA TAAGCCGTTACTGGCAGCAAGTGCAGGCAA |||||||||||||||||||||||||||||| +7_0.400000 30 gnl|BL_ORD_ID|0 5528445 
59.96 8.38112e-11 1 30 2458203 2458232 1 1 30 30 TGAATTTACCGTTATCTATCTTGCCTGCCT TGAATTTACCGTTATCTATCTTGCCTGCCT |||||||||||||||||||||||||||||| +9_0.400000 30 gnl|BL_ORD_ID|0 5528445 59.96 8.38112e-11 1 30 5286666 5286695 1 1 30 30 GCGTTTTGCTAAACTTCTGCCGGAATATAA GCGTTTTGCTAAACTTCTGCCGGAATATAA |||||||||||||||||||||||||||||| +10_0.500000 30 gnl|BL_ORD_ID|0 5528445 59.96 8.38112e-11 1 30 2787672 2787701 1 1 30 30 AAAGAGGCGAGCAGAGTAAAACGCAGGCAA AAAGAGGCGAGCAGAGTAAAACGCAGGCAA |||||||||||||||||||||||||||||| +12_0.700000 30 gnl|BL_ORD_ID|0 5528445 59.96 8.38112e-11 1 30 4116145 4116174 1 1 30 30 GCGGACGATCTTCACGGTCGCCACGCGGAC GCGGACGATCTTCACGGTCGCCACGCGGAC |||||||||||||||||||||||||||||| +13_0.533333 30 gnl|BL_ORD_ID|0 5528445 59.96 8.38112e-11 1 30 5442351 5442380 1 1 30 30 TTCTTGTTGGATGGCATACTCCGGCAGCCA TTCTTGTTGGATGGCATACTCCGGCAGCCA |||||||||||||||||||||||||||||| +14_0.666667 30 gnl|BL_ORD_ID|0 5528445 59.96 8.38112e-11 1 30 4626492 4626521 1 1 30 30 ACCCCGATATCGTCGCAGGCGTTGCCGCAC ACCCCGATATCGTCGCAGGCGTTGCCGCAC |||||||||||||||||||||||||||||| +15_0.666667 30 gnl|BL_ORD_ID|0 5528445 59.96 8.38112e-11 1 30 346897 346926 1 1 30 30 GGCTGCTGTCTCCGCTGGAAGAGGCGCTTC GGCTGCTGTCTCCGCTGGAAGAGGCGCTTC |||||||||||||||||||||||||||||| +15_0.666667 30 gnl|BL_ORD_ID|0 5528445 59.96 8.38112e-11 30 1 1466536 1466565 1 -1 30 30 GAAGCGCCTCTTCCAGCGGAGACAGCAGCC GAAGCGCCTCTTCCAGCGGAGACAGCAGCC |||||||||||||||||||||||||||||| +15_0.666667 30 gnl|BL_ORD_ID|0 5528445 59.96 8.38112e-11 1 30 1750132 1750161 1 1 30 30 GGCTGCTGTCTCCGCTGGAAGAGGCGCTTC GGCTGCTGTCTCCGCTGGAAGAGGCGCTTC |||||||||||||||||||||||||||||| +15_0.666667 30 gnl|BL_ORD_ID|0 5528445 59.96 8.38112e-11 1 30 1908046 1908075 1 1 30 30 GGCTGCTGTCTCCGCTGGAAGAGGCGCTTC GGCTGCTGTCTCCGCTGGAAGAGGCGCTTC |||||||||||||||||||||||||||||| +15_0.666667 30 gnl|BL_ORD_ID|0 5528445 59.96 8.38112e-11 1 30 2279107 2279136 1 1 30 30 GGCTGCTGTCTCCGCTGGAAGAGGCGCTTC GGCTGCTGTCTCCGCTGGAAGAGGCGCTTC |||||||||||||||||||||||||||||| +15_0.666667 30 gnl|BL_ORD_ID|0 5528445 
59.96 8.38112e-11 1 30 2813407 2813436 1 1 30 30 GGCTGCTGTCTCCGCTGGAAGAGGCGCTTC GGCTGCTGTCTCCGCTGGAAGAGGCGCTTC |||||||||||||||||||||||||||||| +15_0.666667 30 gnl|BL_ORD_ID|0 5528445 59.96 8.38112e-11 1 30 3939162 3939191 1 1 30 30 GGCTGCTGTCTCCGCTGGAAGAGGCGCTTC GGCTGCTGTCTCCGCTGGAAGAGGCGCTTC |||||||||||||||||||||||||||||| +15_0.666667 30 gnl|BL_ORD_ID|0 5528445 59.96 8.38112e-11 1 30 4656510 4656539 1 1 30 30 GGCTGCTGTCTCCGCTGGAAGAGGCGCTTC GGCTGCTGTCTCCGCTGGAAGAGGCGCTTC |||||||||||||||||||||||||||||| +16_0.566667 30 gnl|BL_ORD_ID|0 5528445 59.96 8.38112e-11 1 30 2595157 2595186 1 1 30 30 ATGTCCTGATCGAGCGGCGTTTTACCGACC ATGTCCTGATCGAGCGGCGTTTTACCGACC |||||||||||||||||||||||||||||| +17_0.533333 30 gnl|BL_ORD_ID|0 5528445 59.96 8.38112e-11 1 30 717743 717772 1 1 30 30 GGTGTTGAGTGTCCAGGTAATACGCTCTCG GGTGTTGAGTGTCCAGGTAATACGCTCTCG |||||||||||||||||||||||||||||| +19_0.566667 30 gnl|BL_ORD_ID|0 5528445 59.96 8.38112e-11 1 30 1237938 1237967 1 1 30 30 GTTGTAAGCGTCAGAACCGATGCGGTCGGT GTTGTAAGCGTCAGAACCGATGCGGTCGGT |||||||||||||||||||||||||||||| +20_0.566667 30 gnl|BL_ORD_ID|0 5528445 59.96 8.38112e-11 1 30 4792054 4792083 1 1 30 30 CGACATCCTGTAGGCTGGCTTCAATGCGAC CGACATCCTGTAGGCTGGCTTCAATGCGAC |||||||||||||||||||||||||||||| +21_0.733333 30 gnl|BL_ORD_ID|0 5528445 59.96 8.38112e-11 1 30 269757 269786 1 1 30 30 GGGAAGGCTGACGGGCGTCCACACCACGGC GGGAAGGCTGACGGGCGTCCACACCACGGC |||||||||||||||||||||||||||||| +21_0.733333 30 gnl|BL_ORD_ID|0 5528445 59.96 8.38112e-11 1 30 274007 274036 1 1 30 30 GGGAAGGCTGACGGGCGTCCACACCACGGC GGGAAGGCTGACGGGCGTCCACACCACGGC |||||||||||||||||||||||||||||| +22_0.566667 30 gnl|BL_ORD_ID|0 5528445 59.96 8.38112e-11 1 30 2706426 2706455 1 1 30 30 CGGTATTCCTCAGTTCTCGCTGCATGCCTG CGGTATTCCTCAGTTCTCGCTGCATGCCTG |||||||||||||||||||||||||||||| +23_0.600000 30 gnl|BL_ORD_ID|0 5528445 59.96 8.38112e-11 1 30 1512107 1512136 1 1 30 30 TTGCCGTTACGCACCACGCCTTCAGTAGCG TTGCCGTTACGCACCACGCCTTCAGTAGCG |||||||||||||||||||||||||||||| +24_0.733333 30 gnl|BL_ORD_ID|0 5528445 
59.96 8.38112e-11 1 30 2032108 2032137 1 1 30 30 CGCGGGCGCACCACGTCGCTGCTGCTGTTC CGCGGGCGCACCACGTCGCTGCTGCTGTTC |||||||||||||||||||||||||||||| +25_0.266667 30 gnl|BL_ORD_ID|0 5528445 59.96 8.38112e-11 1 30 1343811 1343840 1 1 30 30 TTTTGGGAAAACTAAATACGCATCAAAAAT TTTTGGGAAAACTAAATACGCATCAAAAAT |||||||||||||||||||||||||||||| +26_0.566667 30 gnl|BL_ORD_ID|0 5528445 59.96 8.38112e-11 1 30 3112551 3112580 1 1 30 30 CAACGAGGCGCTACCGAGTTGTTCAATGCG CAACGAGGCGCTACCGAGTTGTTCAATGCG |||||||||||||||||||||||||||||| +28_0.666667 30 gnl|BL_ORD_ID|0 5528445 59.96 8.38112e-11 1 30 4405442 4405471 1 1 30 30 CGCTCAATCTGCTCGCGCCTGGCTGGCGTT CGCTCAATCTGCTCGCGCCTGGCTGGCGTT |||||||||||||||||||||||||||||| +29_0.700000 30 gnl|BL_ORD_ID|0 5528445 59.96 8.38112e-11 1 30 3600547 3600576 1 1 30 30 CTCGTCCGGCGGGCGGTTTTGCCGACAAGG CTCGTCCGGCGGGCGGTTTTGCCGACAAGG |||||||||||||||||||||||||||||| +32_0.600000 30 gnl|BL_ORD_ID|0 5528445 59.96 8.38112e-11 1 30 1435670 1435699 1 1 30 30 TGAGGATGGTCCTCTGACTCTGCAGGCGCA TGAGGATGGTCCTCTGACTCTGCAGGCGCA |||||||||||||||||||||||||||||| +33_0.300000 30 gnl|BL_ORD_ID|0 5528445 59.96 8.38112e-11 1 30 3788178 3788207 1 1 30 30 TAGTAACCCTTTAATAAGATTGTCGATTAG TAGTAACCCTTTAATAAGATTGTCGATTAG |||||||||||||||||||||||||||||| +34_0.533333 30 gnl|BL_ORD_ID|0 5528445 59.96 8.38112e-11 1 30 484499 484528 1 1 30 30 TGATGTTAAATGCATGGCACCTGCCGGTGC TGATGTTAAATGCATGGCACCTGCCGGTGC |||||||||||||||||||||||||||||| +35_0.466667 30 gnl|BL_ORD_ID|0 5528445 59.96 8.38112e-11 1 30 2250064 2250093 1 1 30 30 ACTGCTTTGCCGAGATATTCGAGGTTAACC ACTGCTTTGCCGAGATATTCGAGGTTAACC |||||||||||||||||||||||||||||| +36_0.433333 30 gnl|BL_ORD_ID|0 5528445 59.96 8.38112e-11 1 30 3698178 3698207 1 1 30 30 TGTTGGCAACATGGCGAGCGTAATCAATTA TGTTGGCAACATGGCGAGCGTAATCAATTA |||||||||||||||||||||||||||||| +38_0.533333 30 gnl|BL_ORD_ID|0 5528445 59.96 8.38112e-11 1 30 4242501 4242530 1 1 30 30 GCAGCAGGATCGGATCGAACTCTGGTTTCT GCAGCAGGATCGGATCGAACTCTGGTTTCT |||||||||||||||||||||||||||||| +39_0.400000 30 gnl|BL_ORD_ID|0 5528445 
59.96 8.38112e-11 1 30 3683151 3683180 1 1 30 30 TAATGCGGCATTCTCCTGATTTATTGTCAC TAATGCGGCATTCTCCTGATTTATTGTCAC |||||||||||||||||||||||||||||| +41_0.566667 30 gnl|BL_ORD_ID|0 5528445 59.96 8.38112e-11 1 30 789086 789115 1 1 30 30 AGCTGACGGTCAGCAGGGATACTTCCTGCA AGCTGACGGTCAGCAGGGATACTTCCTGCA |||||||||||||||||||||||||||||| +42_0.566667 30 gnl|BL_ORD_ID|0 5528445 59.96 8.38112e-11 1 30 1714771 1714800 1 1 30 30 GCAGTGACTACATCCGCGAGGTGAATGTGG GCAGTGACTACATCCGCGAGGTGAATGTGG |||||||||||||||||||||||||||||| +43_0.466667 30 gnl|BL_ORD_ID|0 5528445 59.96 8.38112e-11 1 30 4272582 4272611 1 1 30 30 GCTTTTTCCAGCATCAACGCCACTGAACAA GCTTTTTCCAGCATCAACGCCACTGAACAA |||||||||||||||||||||||||||||| +44_0.433333 30 gnl|BL_ORD_ID|0 5528445 59.96 8.38112e-11 1 30 5481023 5481052 1 1 30 30 AAAGTGGTAGATAACGTGGTGCAGACTATG AAAGTGGTAGATAACGTGGTGCAGACTATG |||||||||||||||||||||||||||||| +45_0.500000 30 gnl|BL_ORD_ID|0 5528445 59.96 8.38112e-11 30 1 1271829 1271858 1 -1 30 30 ATCCGCGATAAGGTCATCCGGTATCAGGAA ATCCGCGATAAGGTCATCCGGTATCAGGAA |||||||||||||||||||||||||||||| +45_0.500000 30 gnl|BL_ORD_ID|0 5528445 59.96 8.38112e-11 30 1 1357952 1357981 1 -1 30 30 ATCCGCGATAAGGTCATCCGGTATCAGGAA ATCCGCGATAAGGTCATCCGGTATCAGGAA |||||||||||||||||||||||||||||| +45_0.500000 30 gnl|BL_ORD_ID|0 5528445 59.96 8.38112e-11 1 30 2310674 2310703 1 1 30 30 TTCCTGATACCGGATGACCTTATCGCGGAT TTCCTGATACCGGATGACCTTATCGCGGAT |||||||||||||||||||||||||||||| +45_0.500000 30 gnl|BL_ORD_ID|0 5528445 59.96 8.38112e-11 1 30 2769319 2769348 1 1 30 30 TTCCTGATACCGGATGACCTTATCGCGGAT TTCCTGATACCGGATGACCTTATCGCGGAT |||||||||||||||||||||||||||||| +45_0.500000 30 gnl|BL_ORD_ID|0 5528445 59.96 8.38112e-11 1 30 2991293 2991322 1 1 30 30 TTCCTGATACCGGATGACCTTATCGCGGAT TTCCTGATACCGGATGACCTTATCGCGGAT |||||||||||||||||||||||||||||| +46_0.466667 30 gnl|BL_ORD_ID|0 5528445 59.96 8.38112e-11 1 30 1080570 1080599 1 1 30 30 ACCTGTACCCCAGGACCATGGTACATTTAT ACCTGTACCCCAGGACCATGGTACATTTAT |||||||||||||||||||||||||||||| +46_0.466667 30 gnl|BL_ORD_ID|0 
5528445 59.96 8.38112e-11 1 30 1476177 1476206 1 1 30 30 ACCTGTACCCCAGGACCATGGTACATTTAT ACCTGTACCCCAGGACCATGGTACATTTAT |||||||||||||||||||||||||||||| +47_0.533333 30 gnl|BL_ORD_ID|0 5528445 59.96 8.38112e-11 1 30 2887871 2887900 1 1 30 30 ACAATGCAACCAGACCAGCCCGGATCGATA ACAATGCAACCAGACCAGCCCGGATCGATA |||||||||||||||||||||||||||||| +49_0.433333 30 gnl|BL_ORD_ID|0 5528445 59.96 8.38112e-11 1 30 4152853 4152882 1 1 30 30 CGTTATACGGAACAACATTTAACTCCAGCG CGTTATACGGAACAACATTTAACTCCAGCG |||||||||||||||||||||||||||||| +50_0.466667 30 gnl|BL_ORD_ID|0 5528445 59.96 8.38112e-11 1 30 3568677 3568706 1 1 30 30 TTGCTGTTGCCATCGCTTTTCAGGACATAC TTGCTGTTGCCATCGCTTTTCAGGACATAC |||||||||||||||||||||||||||||| +51_0.533333 30 gnl|BL_ORD_ID|0 5528445 59.96 8.38112e-11 1 30 3739788 3739817 1 1 30 30 CGACGGTATCGGTACGCAGATTGTGATGGA CGACGGTATCGGTACGCAGATTGTGATGGA |||||||||||||||||||||||||||||| +52_0.366667 30 gnl|BL_ORD_ID|0 5528445 59.96 8.38112e-11 1 30 3789407 3789436 1 1 30 30 ATGAGCATCAACATCGAAATCTCAAACCAA ATGAGCATCAACATCGAAATCTCAAACCAA |||||||||||||||||||||||||||||| +54_0.400000 30 gnl|BL_ORD_ID|0 5528445 59.96 8.38112e-11 1 30 3161991 3162020 1 1 30 30 GTATTCTTCATTGATTTGTAAGCGGGTACC GTATTCTTCATTGATTTGTAAGCGGGTACC |||||||||||||||||||||||||||||| +55_0.466667 30 gnl|BL_ORD_ID|0 5528445 59.96 8.38112e-11 1 30 4384753 4384782 1 1 30 30 AAGCGCTGTTCAACATAAATTGGCTGACGG AAGCGCTGTTCAACATAAATTGGCTGACGG |||||||||||||||||||||||||||||| +56_0.433333 30 gnl|BL_ORD_ID|0 5528445 59.96 8.38112e-11 1 30 2915787 2915816 1 1 30 30 AACCGTCAGCTCTTTACGCAATATTTTGCC AACCGTCAGCTCTTTACGCAATATTTTGCC |||||||||||||||||||||||||||||| +57_0.566667 30 gnl|BL_ORD_ID|0 5528445 59.96 8.38112e-11 1 30 294604 294633 1 1 30 30 CGCGAAATCCTCGACGTCCAGGCACGTATT CGCGAAATCCTCGACGTCCAGGCACGTATT |||||||||||||||||||||||||||||| +58_0.300000 30 gnl|BL_ORD_ID|0 5528445 59.96 8.38112e-11 1 30 1553483 1553512 1 1 30 30 GTTATCCATTAAAATAGATCGGATCGATAT GTTATCCATTAAAATAGATCGGATCGATAT |||||||||||||||||||||||||||||| +59_0.300000 30 gnl|BL_ORD_ID|0 
5528445 59.96 8.38112e-11 1 30 1351506 1351535 1 1 30 30 AAAATCTGCATATCATGATAAGAGTGGTTA AAAATCTGCATATCATGATAAGAGTGGTTA |||||||||||||||||||||||||||||| +59_0.300000 30 gnl|BL_ORD_ID|0 5528445 59.96 8.38112e-11 30 1 2997458 2997487 1 -1 30 30 TAACCACTCTTATCATGATATGCAGATTTT TAACCACTCTTATCATGATATGCAGATTTT |||||||||||||||||||||||||||||| +61_0.366667 30 gnl|BL_ORD_ID|0 5528445 59.96 8.38112e-11 1 30 1987157 1987186 1 1 30 30 TCAGTTTGAAAGCTTTGTCAGCCGTTTTTT TCAGTTTGAAAGCTTTGTCAGCCGTTTTTT |||||||||||||||||||||||||||||| +62_0.366667 30 gnl|BL_ORD_ID|0 5528445 59.96 8.38112e-11 1 30 1667830 1667859 1 1 30 30 AATCCTAAACCTAGGAATGCCAGAATATCT AATCCTAAACCTAGGAATGCCAGAATATCT |||||||||||||||||||||||||||||| +63_0.566667 30 gnl|BL_ORD_ID|0 5528445 59.96 8.38112e-11 30 1 231418 231447 1 -1 30 30 TGGCATAAGCCAGCTTGACTGCGAGCGTGA TGGCATAAGCCAGCTTGACTGCGAGCGTGA |||||||||||||||||||||||||||||| +63_0.566667 30 gnl|BL_ORD_ID|0 5528445 59.96 8.38112e-11 1 30 3516862 3516891 1 1 30 30 TCACGCTCGCAGTCAAGCTGGCTTATGCCA TCACGCTCGCAGTCAAGCTGGCTTATGCCA |||||||||||||||||||||||||||||| +63_0.566667 30 gnl|BL_ORD_ID|0 5528445 59.96 8.38112e-11 1 30 4226650 4226679 1 1 30 30 TCACGCTCGCAGTCAAGCTGGCTTATGCCA TCACGCTCGCAGTCAAGCTGGCTTATGCCA |||||||||||||||||||||||||||||| +63_0.566667 30 gnl|BL_ORD_ID|0 5528445 59.96 8.38112e-11 30 1 4808457 4808486 1 -1 30 30 TGGCATAAGCCAGCTTGACTGCGAGCGTGA TGGCATAAGCCAGCTTGACTGCGAGCGTGA |||||||||||||||||||||||||||||| +63_0.566667 30 gnl|BL_ORD_ID|0 5528445 59.96 8.38112e-11 30 1 4904735 4904764 1 -1 30 30 TGGCATAAGCCAGCTTGACTGCGAGCGTGA TGGCATAAGCCAGCTTGACTGCGAGCGTGA |||||||||||||||||||||||||||||| +63_0.566667 30 gnl|BL_ORD_ID|0 5528445 59.96 8.38112e-11 30 1 5048915 5048944 1 -1 30 30 TGGCATAAGCCAGCTTGACTGCGAGCGTGA TGGCATAAGCCAGCTTGACTGCGAGCGTGA |||||||||||||||||||||||||||||| +63_0.566667 30 gnl|BL_ORD_ID|0 5528445 59.96 8.38112e-11 30 1 5089922 5089951 1 -1 30 30 TGGCATAAGCCAGCTTGACTGCGAGCGTGA TGGCATAAGCCAGCTTGACTGCGAGCGTGA |||||||||||||||||||||||||||||| +64_0.500000 30 
gnl|BL_ORD_ID|0 5528445 59.96 8.38112e-11 1 30 5440369 5440398 1 1 30 30 GAGATGACGGTTGCAGAGTCATGCGTTTGA GAGATGACGGTTGCAGAGTCATGCGTTTGA |||||||||||||||||||||||||||||| +65_0.533333 30 gnl|BL_ORD_ID|0 5528445 59.96 8.38112e-11 1 30 3963858 3963887 1 1 30 30 TCTGGATCACGCGCAAACACTGGCTATCGT TCTGGATCACGCGCAAACACTGGCTATCGT |||||||||||||||||||||||||||||| +66_0.466667 30 gnl|BL_ORD_ID|0 5528445 59.96 8.38112e-11 1 30 4142497 4142526 1 1 30 30 TCTGCTTTAGCAAACAGAGTGTGGTCACGA TCTGCTTTAGCAAACAGAGTGTGGTCACGA |||||||||||||||||||||||||||||| +67_0.400000 30 gnl|BL_ORD_ID|0 5528445 59.96 8.38112e-11 1 30 3532236 3532265 1 1 30 30 GCCTTTTGTCTGATCATCCACAATAATGAC GCCTTTTGTCTGATCATCCACAATAATGAC |||||||||||||||||||||||||||||| +68_0.566667 30 gnl|BL_ORD_ID|0 5528445 59.96 8.38112e-11 1 30 779994 780023 1 1 30 30 GAAGGATAGTTGGTCAGCAACACCAGCGGC GAAGGATAGTTGGTCAGCAACACCAGCGGC |||||||||||||||||||||||||||||| +70_0.466667 30 gnl|BL_ORD_ID|0 5528445 59.96 8.38112e-11 1 30 1317239 1317268 1 1 30 30 TGGTGTTCAGCATCTCAACGGTAATTCGCT TGGTGTTCAGCATCTCAACGGTAATTCGCT |||||||||||||||||||||||||||||| +71_0.533333 30 gnl|BL_ORD_ID|0 5528445 59.96 8.38112e-11 1 30 5080463 5080492 1 1 30 30 CAGGATGCAAACTGCCGGGAGATCCAGTTA CAGGATGCAAACTGCCGGGAGATCCAGTTA |||||||||||||||||||||||||||||| +72_0.533333 30 gnl|BL_ORD_ID|0 5528445 59.96 8.38112e-11 1 30 3605409 3605438 1 1 30 30 AACTGGAAGGGCTTGGGATGACACAACAGC AACTGGAAGGGCTTGGGATGACACAACAGC |||||||||||||||||||||||||||||| +73_0.500000 30 gnl|BL_ORD_ID|0 5528445 59.96 8.38112e-11 1 30 3280815 3280844 1 1 30 30 TTTAAGCGCCAACCAGGCTTCTTTGGTTGC TTTAAGCGCCAACCAGGCTTCTTTGGTTGC |||||||||||||||||||||||||||||| +75_0.533333 30 gnl|BL_ORD_ID|0 5528445 59.96 8.38112e-11 1 30 2230266 2230295 1 1 30 30 ATAACCCTCTGCAACCGCCGCTTCAGCAAA ATAACCCTCTGCAACCGCCGCTTCAGCAAA |||||||||||||||||||||||||||||| +76_0.600000 30 gnl|BL_ORD_ID|0 5528445 59.96 8.38112e-11 1 30 462631 462660 1 1 30 30 TGAAGCCGTACAACGGGCGCTGGAATTCGC TGAAGCCGTACAACGGGCGCTGGAATTCGC |||||||||||||||||||||||||||||| +77_0.700000 30 
gnl|BL_ORD_ID|0 5528445 59.96 8.38112e-11 1 30 2939076 2939105 1 1 30 30 GAGCTGCAACGCGGTCAGCCAGCTGGCGGT GAGCTGCAACGCGGTCAGCCAGCTGGCGGT |||||||||||||||||||||||||||||| +78_0.566667 30 gnl|BL_ORD_ID|0 5528445 59.96 8.38112e-11 1 30 5422053 5422082 1 1 30 30 CGGAGTATCCGTTCCCCAACGACAAGCATC CGGAGTATCCGTTCCCCAACGACAAGCATC |||||||||||||||||||||||||||||| +79_0.500000 30 gnl|BL_ORD_ID|0 5528445 59.96 8.38112e-11 1 30 4387420 4387449 1 1 30 30 AATACCGGGAAGAGACAACGGGGTCTCTTT AATACCGGGAAGAGACAACGGGGTCTCTTT |||||||||||||||||||||||||||||| +81_0.433333 30 gnl|BL_ORD_ID|0 5528445 59.96 8.38112e-11 1 30 1037150 1037179 1 1 30 30 ATTAATGTTGCCGGCACAACATAATAGGGC ATTAATGTTGCCGGCACAACATAATAGGGC |||||||||||||||||||||||||||||| +82_0.500000 30 gnl|BL_ORD_ID|0 5528445 59.96 8.38112e-11 1 30 1182188 1182217 1 1 30 30 ACTGGGTTGCTCTGAACAAGAAAGGCGCTA ACTGGGTTGCTCTGAACAAGAAAGGCGCTA |||||||||||||||||||||||||||||| +83_0.533333 30 gnl|BL_ORD_ID|0 5528445 59.96 8.38112e-11 1 30 5430210 5430239 1 1 30 30 CGCCAGGGACGTATCGCGTCGATATCTATT CGCCAGGGACGTATCGCGTCGATATCTATT |||||||||||||||||||||||||||||| +84_0.533333 30 gnl|BL_ORD_ID|0 5528445 59.96 8.38112e-11 1 30 310995 311024 1 1 30 30 TGCTCGTTCCCGTCGTGATGAAGCTCGAAA TGCTCGTTCCCGTCGTGATGAAGCTCGAAA |||||||||||||||||||||||||||||| +85_0.500000 30 gnl|BL_ORD_ID|0 5528445 59.96 8.38112e-11 1 30 4174173 4174202 1 1 30 30 AGGAAAGCAAACAACACGACCACCATCAGC AGGAAAGCAAACAACACGACCACCATCAGC |||||||||||||||||||||||||||||| +86_0.566667 30 gnl|BL_ORD_ID|0 5528445 59.96 8.38112e-11 1 30 163690 163719 1 1 30 30 GGCAACGCAGGCGCATGATTCTGCTTGGAA GGCAACGCAGGCGCATGATTCTGCTTGGAA |||||||||||||||||||||||||||||| +88_0.533333 30 gnl|BL_ORD_ID|0 5528445 59.96 8.38112e-11 1 30 3071785 3071814 1 1 30 30 CGTACCGGGCTGAAAGTAGAAGAGCGTTTC CGTACCGGGCTGAAAGTAGAAGAGCGTTTC |||||||||||||||||||||||||||||| +90_0.466667 30 gnl|BL_ORD_ID|0 5528445 59.96 8.38112e-11 1 30 692131 692160 1 1 30 30 ATCACCGTTTCGCTAACCGGTACGTTTAAC ATCACCGTTTCGCTAACCGGTACGTTTAAC |||||||||||||||||||||||||||||| +91_0.566667 30 
gnl|BL_ORD_ID|0 5528445 59.96 8.38112e-11 1 30 3307050 3307079 1 1 30 30 TTCGCCCGGCAAGCTTACCCAACGCTTATC TTCGCCCGGCAAGCTTACCCAACGCTTATC |||||||||||||||||||||||||||||| +94_0.466667 30 gnl|BL_ORD_ID|0 5528445 59.96 8.38112e-11 1 30 1813009 1813038 1 1 30 30 CCACGGTGATATCTGGTGCCATACTGATAA CCACGGTGATATCTGGTGCCATACTGATAA |||||||||||||||||||||||||||||| +96_0.533333 30 gnl|BL_ORD_ID|0 5528445 59.96 8.38112e-11 1 30 573782 573811 1 1 30 30 TTGCCGGGAAGAGAGATATCAATGGCAGGC TTGCCGGGAAGAGAGATATCAATGGCAGGC |||||||||||||||||||||||||||||| +97_0.566667 30 gnl|BL_ORD_ID|0 5528445 59.96 8.38112e-11 1 30 3570563 3570592 1 1 30 30 TGCGCCGCCGGATTGTTGCTCAACATGCTT TGCGCCGCCGGATTGTTGCTCAACATGCTT |||||||||||||||||||||||||||||| +98_0.366667 30 gnl|BL_ORD_ID|0 5528445 59.96 8.38112e-11 1 30 4545136 4545165 1 1 30 30 AACGCGCTAACCGCCAATAATAACAAAATT AACGCGCTAACCGCCAATAATAACAAAATT ||||||||||||||||||||||||||||||