#!/usr/bin/env python

# Provenance (HG changeset patch this script was uploaded in):
#   User greg
#   Date 1670856178 0
#   Node ID b6794f4cb1c615bea2d2fd3cf17b178e8a4577a0
#
# Tool Shed metadata (.shed.yml) from the same changeset:
#   name: bam_to_psl
#   owner: greg
#   description: Converts a BAM or SAM dataset to PSL format
#   long_description: Converts a BAM or SAM dataset to PSL format
#   categories:
#   - Convert Formats
#   remote_repository_url: https://github.com/gregvonkuster/galaxy_tools/tree/master/tools/convert_formats/bam_to_psl
#   homepage_url: https://github.com/gregvonkuster/galaxy_tools
#   type: unrestricted

# This code is very loosely based on
# the FusionCatcher sam2psl script here:
# https://github.com/ndaniel/fusioncatcher/blob/master/bin/sam2psl.py

import argparse
import sys

# CIGAR operation codes accepted by parse_cigar().
_CIGAR_OPS = frozenset('MIDNSHP=X')


def _cigar_error(cigar):
    """Abort the program with the script's standard CIGAR error message."""
    sys.exit("Error: unknown CIGAR: %s\n" % str(cigar))


def parse_cigar(c):
    """Split a CIGAR string into ``(operation, length)`` pairs.

    The string is upper-cased before parsing.

    Returns:
        A tuple ``(ops, mismatches_x)`` where ``ops`` is a list of
        ``(operation, length)`` tuples in CIGAR order and ``mismatches_x``
        is the summed length of all ``X`` operations.

    Raises:
        SystemExit: if the string contains an unknown character, an
            operation without a preceding length, or a trailing length
            that is not followed by an operation.
    """
    ops = []
    digits = ''
    mismatches_x = 0
    c = c.upper()
    for ch in c:
        if '0' <= ch <= '9':
            digits += ch
        elif ch in _CIGAR_OPS and digits:
            length = int(digits)
            ops.append((ch, length))
            if ch == 'X':
                mismatches_x += length
            digits = ''
        else:
            # Unknown character, or an operation with no length before it
            # (previously this surfaced as a bare ValueError from int('')).
            _cigar_error(c)
    if digits:
        # A length with no operation after it was previously dropped silently.
        _cigar_error(c)
    return (ops, mismatches_x)


def blocks(cigar, ig=0):
    """Walk a CIGAR string and collect the aligned blocks and counters.

    Hard clipping is treated like soft clipping: it advances the index
    on the read and is included in ``seq_len``.

    Args:
        cigar: CIGAR string.
        ig: 0-based reference position at which the alignment starts.

    Returns:
        An 11-tuple ``(rr, rg, match, mismatch, mismatch_clip, mismatch_x,
        insert_ref, insert_ref_count, insert_query, insert_query_count,
        seq_len)`` where ``rr`` / ``rg`` are lists of half-open
        ``(start, end)`` intervals on the read / reference, one per
        ``M`` or ``=`` operation.

    Raises:
        SystemExit: propagated from parse_cigar() for a malformed CIGAR.
    """
    ir = 0  # index on the read
    rr = []  # block intervals on the read
    rg = []  # block intervals on the reference
    match = 0
    mismatch_clip = 0
    insert_query = 0
    insert_query_count = 0
    insert_ref = 0
    insert_ref_count = 0
    # Sum of the lengths of the M/I/S/=/X operations (plus H, see above).
    seq_len = 0
    (cig, mismatch_x) = parse_cigar(cigar)
    # parse_cigar() has already summed every X operation, so the loop below
    # must not add them again (doing so reported each X mismatch twice).
    mismatch = mismatch_x
    for op, length in cig:
        if op in ('S', 'H'):
            ir += length
            mismatch_clip += length
            seq_len += length
        elif op == 'I':
            ir += length
            # NOTE(review): inserted bases are also counted as mismatches;
            # kept as in the original - confirm this is intended.
            mismatch += length
            insert_query += length
            insert_query_count += 1
            seq_len += length
        elif op == 'X':
            # NOTE(review): an X run advances both indexes but is not part
            # of any block, so it splits the surrounding blocks; kept as in
            # the original - confirm this is intended.
            ir += length
            ig += length
            seq_len += length
        elif op in ('M', '='):
            rr.append((ir, ir + length))
            rg.append((ig, ig + length))
            ir += length
            ig += length
            match += length
            seq_len += length
        elif op in ('D', 'N'):
            ig += length
            insert_ref += length
            insert_ref_count += 1
        # 'P' (padding) consumes neither the read nor the reference, so it
        # changes nothing here.
    return (rr, rg, match, mismatch, mismatch_clip, mismatch_x, insert_ref, insert_ref_count, insert_query, insert_query_count, seq_len)


def get_psl(sam, lens):
    """Convert one SAM alignment record to the 21 PSL columns.

    Args:
        sam: list of the tab-separated fields of a SAM alignment line.
        lens: dict mapping reference name to reference length (from the
            ``@SQ`` header lines); unknown references get length 0.

    Returns:
        A list of 21 strings (the PSL columns), or ``None`` when the
        record cannot be converted: fewer than 10 fields, a non-numeric
        FLAG, the unmapped flag (0x4) set, or ``*`` as read name,
        reference name or CIGAR.

    Raises:
        SystemExit: propagated from parse_cigar() for a malformed CIGAR.
    """
    # Fields up to SEQ (index 9) are read below; shorter lines previously
    # raised IndexError.
    if not sam or len(sam) < 10 or not sam[1].isdigit():
        return None
    flag = int(sam[1])
    if flag & 0x4 or sam[2] == '*' or sam[5] == '*' or sam[0] == '*':
        return None
    # Initialize psl_items to those
    # that constitute a PSL empty line.
    psl_items = ['0', '0', '0', '0', '0', '0', '0', '0', '+', 's', '0', '0', '0', 'r', '0', '0', '0', '0', ',', ',', ',']
    # Reference (target) sequence length.
    psl_items[14] = lens.get(sam[2], 0)
    # Reference name.
    psl_items[13] = sam[2]
    # Read name.
    psl_items[9] = sam[0]
    # Strand.
    psl_items[8] = '-' if flag & 0x10 else '+'
    # Start position (SAM POS is 1-based, PSL is 0-based).
    psl_items[15] = int(sam[3]) - 1
    (interval_query, interval_ref, match, mismatch, mismatch_clip, mismatch_x, insert_ref, insert_ref_count, insert_query, insert_query_count, seq_len) = blocks(sam[5], ig=psl_items[15])
    # Read sequence length.
    if sam[9] != '*' and 'H' not in sam[5].upper():
        psl_items[10] = len(sam[9])
    else:
        # SEQ is absent or hard clipped, so use the length
        # derived from the CIGAR operations instead.
        psl_items[10] = seq_len
    psl_items[4] = insert_query_count
    psl_items[5] = insert_query
    psl_items[6] = insert_ref_count
    psl_items[7] = insert_ref
    # Matches and mismatches as counted from the CIGAR string. (The NM:i /
    # nM:i tag used to be parsed here but its value was never used.)
    psl_items[0] = match
    psl_items[1] = mismatch
    if interval_query:
        psl_items[11] = interval_query[0][0]
        psl_items[12] = interval_query[-1][1]
        psl_items[16] = interval_ref[-1][1]
        psl_items[17] = len(interval_query)
        # BLAT always gives the coordinates as
        # everything is mapped on the forward
        # strand.
        psl_items[18] = ','.join([str(e[1] - e[0]) for e in interval_query]) + ','
        psl_items[19] = ','.join([str(e[0]) for e in interval_query]) + ','
        psl_items[20] = ','.join([str(e[0]) for e in interval_ref]) + ','
    # A list (rather than a one-shot map iterator) can be joined, indexed
    # and compared by the caller.
    return [str(item) for item in psl_items]


def _sq_name_and_length(fields):
    """Return ``(SN, LN)`` from the tag fields of an @SQ line, in any order.

    Either element is ``None`` when the corresponding tag is missing.
    """
    name = None
    length = None
    for field in fields:
        if field.startswith('SN:'):
            name = field[3:]
        elif field.startswith('LN:'):
            length = int(field[3:])
    return (name, length)


def to_psl(input_file, psl_file):
    """Convert a SAM file to PSL format.

    Reference lengths are collected from the ``@SQ`` header lines; every
    alignment line that get_psl() can convert is written to ``psl_file``
    as one tab-separated PSL line.

    Args:
        input_file: path of the SAM file to read.
        psl_file: path of the PSL file to write (overwritten).
    """
    header = dict()
    with open(input_file, 'r') as fin, open(psl_file, 'w') as fou:
        for sam_line in fin:
            sam_line = sam_line.rstrip('\r\n')
            if not sam_line:
                continue
            sam_items = sam_line.split('\t')
            if sam_items[0].startswith('@'):
                if sam_items[0].startswith('@SQ'):
                    # The SN and LN tags may appear in any order.
                    (name, length) = _sq_name_and_length(sam_items[1:])
                    if name is not None and length is not None:
                        header[name] = length
                continue
            psl_items = get_psl(sam_items, header)
            if psl_items is not None:
                fou.write('%s\n' % '\t'.join(psl_items))


if __name__ == '__main__':

    parser = argparse.ArgumentParser()

    # Both paths are needed; without required=True a missing option only
    # failed later inside open(None).
    parser.add_argument("--input_file", action="store", dest="input_file", required=True, help="Input file in SAM format.")
    parser.add_argument("--output_file", action="store", dest="output_file", required=True, help="Output file in PSL format.")

    args = parser.parse_args()

    to_psl(args.input_file, args.output_file)

# Tool help text (bam_to_psl.xml, which also references macros.xml) from the
# same changeset:
#   **What it does**
#   Converts a BAM or SAM dataset to PSL format - https://genome.ucsc.edu/FAQ/FAQformat.html#format2.
+ + + + diff -r 000000000000 -r b6794f4cb1c6 macros.xml --- /dev/null Thu Jan 01 00:00:00 1970 +0000 +++ b/macros.xml Mon Dec 12 14:42:58 2022 +0000 @@ -0,0 +1,17 @@ + + 1.16.1 + 0 + 21.01 + + + samtools + python + + + + + 10.1101/011650 + + + + diff -r 000000000000 -r b6794f4cb1c6 test-data/input_1.sam --- /dev/null Thu Jan 01 00:00:00 1970 +0000 +++ b/test-data/input_1.sam Mon Dec 12 14:42:58 2022 +0000 @@ -0,0 +1,162 @@ +@HD VN:1.4 SQ:sorted SO:coordinate +@SQ SN:chr1 LN:1626 +chr1-106 0 chr1 4 99 125=1X8=1X52=1X12= * 0 0 TCATGATTTCTTACCTATTAGTGGTTGAACATCGTGATATGTATGTTGACGGCCATAAGGCTGCTTCTTGTTGTCGATAGAACTTCATGTGCCTGTAAAACGAAGCGGTAAAAATTTTTATTTTTCTTCTCACTGCTGTTACTCCAGCTTCTTCGGCACAAGTACCAACCAGAACGTGAAAAAGCGTACTGCGTGTAGCG ??A??BBBDDBDDBDDGFGGGFHHHHI6IFFHH?FIHCHHIHIEHIHGFHGIIIFGHIHGCHIHHIFAIHHIIGIHEHIHIBBHIGIGFFHFHFHFEIFEHHIHHHI=FHG>HGHHHGE?EG*EE?EEEGGFGEFGGGGGGE@GGEEAEGDGED(GEEAG??E(FGG +chr1-99 0 chr1 14 99 101=1X98= * 0 0 TTACCTATTAGTGGTTGAACATCGTGATATGTATGTTGACGGCCATAAGGCTGCTTCTTGTTGTCGATAGAACTTCATGTGCCTGTAAAACGAAGCGGTAACAATTTTTATTTTTTTTCTCACTTCTGTTACTCCAGCTTCTTCGGCACAAGTACCAACCAGAACGTGAAAAAGCGTCCTGCGTGTAGCGTTTATGTTGG ?????BBBDDDDDDDBDGGFGFIHCIHFHIHIIIEH9IHHHFFFI.HIIHHHIBAIIH@FFH5FAEICIAHHGIHDI5BHHHIBH?IGHIHHGHIHHHHHH7IIHH?HHDDHHD,:DHFHHHFDEFGHH*FG4FGG +chr1-160 0 chr1 48 99 183=1X16= * 0 0 GTTGACGGCCATAAGGCTGCTTCTTGTTGTCGATAGAACTTCATGTGCCTGTAAAACGAAGCGGTAAAAATTTTTATTTTTTTTCTCACTTCTGTTACTCCAGCTTCTTCGGCACAAGTACCAACCAGAACGTGAAAAAGCGTCCTGCGTGTAGCGTTTATGTTGGTTTCATGGTTTTGTCTATCTTTATCGCTTTTACC ?A?9?BB?@D@DDDEBFGGGGGIHHIIIFEFIIHIHHGHHIHIHHIIIHHHFIDIFIHFFIHCIIIDFFHHFFHIHHHFIIHCIHIEHHHIGIIBHIEIDHHGIDDGHHHHHEHGHGGG3HFFHEFFCGFEE;GEDGGGFFE9G?FGGBCG?FGGGEEGGGDEGGGGGGGGGBEEFEG;EFEGGGGGGGCGGGGE'8EGG:GECGGGEFGG*:EGGCEF +chr1-121 16 chr1 79 99 200= * 0 0 GATAGAACTTCATGTGCCTGTAAAACGAAGCGGTAAAAATTTTTATTTTTTTTCTCACTTCTGTTACTCCAGCTTCTTCGGCACAAGTACCAACCAGAACGTGAAAAAGCGTCCTGCGTGTAGCGTTTATGTTGGTTTCATGGTTTTGTCTAACTTTATCGCTTTTACCGTCTTTCCAGAAATTGTTCCAAGTATCGGCT 
EEE/DFE?CA:GEE?EDGF;GGG0EGGGGEFE:GG?E?:GGGFG@FGCGGEGEH?G+FDEEGGIGG;GEEBHG7HHG.HEHFGHHGGHEHHGH?H?FHHGHCIHHIDFHHHCH.FGGI-IIHHIIFHIIHHEHAHGHHHFDIICIHGHDHHIIHHIGFHIIHIGHIIHHIH>IHIFHI@FGCG>?BDDDBBDBBB??AA? +chr1-89 16 chr1 109 99 200= * 0 0 CGGTAAAAATTTTTATTTTTTTTCTCACTTCTGTTACTCCAGCTTCTTCGGCACAAGTACCAACCAGAACGTGAAAAAGCGTCCTGCGTGTAGCGTTTATGTTGGTTTCATGGTTTTGTCTAACTTTATCGCTTTTACCGTCTTTCCAGAAATTGTTCCAAGTATCGGCTTGTTTACGAATTAAATCGAAGTTACCGTCT GGFE8FFGGGFGEEEGGEE:CEGEFFGGEEGEG*GEGG.DEECFF:FGCAAGGFGG4EG)FGGEEEFEAG,HGC9HHFGFFG;BGGH5HHGDHGI=DHGF@IIIFHGH@IGFFHFHHIHIHIFHGGIIHHHFHFHIHHEIIIIIIHIIHIHIIIIHIFHHIFIIHFIIHHIIII/IICFGGGCFBDDDDDDABB?A??A? +chr1-14 16 chr1 111 99 200= * 0 0 GTAAAAATTTTTATTTTTTTTCTCACTTCTGTTACTCCAGCTTCTTCGGCACAAGTACCAACCAGAACGTGAAAAAGCGTCCTGCGTGTAGCGTTTATGTTGGTTTCATGGTTTTGTCTAACTTTATCGCTTTTACCGTCTTTCCAGAAATTGTTCCAAGTATCGGCTTGTTTACGAATTAAATCGAAGTTACCGTCTTT CEGG?F/CEG?AGGCGEGGGGGG,GGGGGEGEDCGGEE??GEGAEFGFGCDGHAIHFCIEAFFF>DDDDD5DBBB?5?AGGGEFGAEGG?GCGGGGGGEGFAGG'GE;GEE>G?B=FEEFEGGGGGG;EB;GCGEH*@GHFEHGGHH=HFHGBHEHGGIHIGFFHFEDHHIHHCIHIHEFFCHHGIIIHHFII4@HHIF5IIHFDHGIECIIIIHHGEIIIFIEHGHH=HHHIEIHHFIGHCHHHHIHFFCGGFDDD5DDDBBBB???A? +chr1-85 16 chr1 125 99 6=1X193= * 0 0 TTTTTTACTCACTTCTGTTACTCCAGCTTCTTCGGCACAAGTACCAACCAGAACGTGAAAAAGCGTCCTGCGTGTAGCGTTTATGTTGGTTTCATGGTTTTGTCTAACTTTATCGCTTTTACCGTCTTTCCAGAAATTGTTCCAAGTATCGGCTTGTTTACGAATTAAATCGAAGTTACCGTCTTTCCAGAAATTGTTCC EG:GEE.EGHHHHEHFFCHEHHHHEHHGHHIDHIHEIHHHIIIHIHIDHDHIHHIIIHHHIAHH=AIHIHHFIGIIIHIIIIIHHHHEHHEH;HHIHGIHIFFCHH;CGGGFDD?DG:;GE?GGG:FGDEFGG1?< +chr1-102 16 chr1 136 99 200= * 0 0 CTTCTGTTACTCCAGCTTCTTCGGCACAAGTACCAACCAGAACGTGAAAAAGCGTCCTGCGTGTAGCGTTTATGTTGGTTTCATGGTTTTGTCTAACTTTATCGCTTTTACCGTCTTTCCAGAAATTGTTCCAAGTATCGGCTTGTTTACGAATTAAATCGAAGTTACCGTCTTTCCAGAAATTGTTCCAAGTATCGGCT 8GEE*EAGAEEGF9GE8D6?GA;FGEG?GAEGG??CBGFFGCGC*GEGEG:EEGGGFEGBEEGGIEGGAEHGDHH@EFHCGFFHEG=FEFHHGGCGEFHHDIHDHHFEIHIIEIHIGIIIIEH=FIIHEII>GFIHHIH7H8FGHI=HIIGIIHHHIIIDHIFIIFFHHHICHHFI6HFGGGFFDDDDD.DDB4B??A?? 
+chr1-29 0 chr1 137 99 200= * 0 0 TTCTGTTACTCCAGCTTCTTCGGCACAAGTACCAACCAGAACGTGAAAAAGCGTCCTGCGTGTAGCGTTTATGTTGGTTTCATGGTTTTGTCTAACTTTATCGCTTTTACCGTCTTTCCAGAAATTGTTCCAAGTATCGGCTTGTTTACGAATTAAATCGAAGTTACCGTCTTTCCAGAAATTGTTCCAAGTATCGGCTT ?????B?BDDDBDDB-GFFEFFHHHHHHIHIHIHEHFGHCIIGHEHHIIII@FGHIIIFHFEEDHFIIHCIFICIIHHHHHHHHHIGHHHEIHG*FHH,AHHFHIDHGH=HHGCG?HHGGEHFHIFBGCBGHHHGI?;EG@?GFD@GAGCGBG18GECEGE2FEG?E:CGGEGEGGFE/EGGFEGFE?GGG8GCEGEGGF +chr1-92 16 chr1 143 99 65=1X134= * 0 0 TACTCCAGCTTCTTCGGCACAAGTACCAACCAGAACGTGAAAAAGCGTCCTGCGTGTAGCGTTTAAGTTGGTTTCATGGTTTTGTCTAACTTTATCGCTTTTACCGTCTTTCCAGAAATTGTTCCAAGTATCGGCTTGTTTACGAATTAAATCGAAGTTACCGTCTTTCCAGAAATTGTTCCAAGTATCGGCTTGTTTAC EG;FG0IFGEIHHD>HHHIH@HIIIDIGFIHIFFHHIIFIIGFGGGGBDDDDDDEBBBA???? +chr1-139 0 chr1 149 99 117=1X82= * 0 0 AGCTTCTTCGGCACAAGTACCAACCAGAACGTGAAAAAGCGTCCTGCGTGTAGCGTTTATGTTGGTTTCATGGTTTTGTCTAACTTTATCGCTTTTACCGTCTTTCCAGAAATTGTTGCAAGTATCGGCTTGTTTACGAATTAAATCGAAGTTACCGTCTTTCCAGAAATTGTTCCAAGTATCGGCTTGTTTACGAATTA ??,?ABBBDEDBDHHHHDHHGFGFC,GHHHHFGHEDGFEFEFGEIEHGEGGG@EEDEGG?FGF@GGEEEFGG6FG5GGGCGF>GGE0;:*CGGGGEG*GGFFFF(EGG +chr1-84 0 chr1 164 99 57=1X100=1X41= * 0 0 AGTACCAACCAGAACGTGAAAAAGCGTCCTGCGTGTAGCGTTTATGTTGGTTTCATGTTTTTGTCTAACTTTATCGCTTTTACCGTCTTTCCAGAAATTGTTCCAAGTATCGGCTTGTTTACGAATTAAATCGAAGTTACCGTCTTTCCAGAAATTGTCCCAAGTATCGGCTTGTTTACGAATTAAATCGAAGTGGACTG BEHIA?IFHIICHHHHIHGIIEEFGADFGGDGFG?'GFE?EGEFGEEEGGEGGGAGGEEGEGGGGGGCECEGAG;G* +chr1-125 0 chr1 170 99 200= * 0 0 AACCAGAACGTGAAAAAGCGTCCTGCGTGTAGCGTTTATGTTGGTTTCATGGTTTTGTCTAACTTTATCGCTTTTACCGTCTTTCCAGAAATTGTTCCAAGTATCGGCTTGTTTACGAATTAAATCGAAGTTACCGTCTTTCCAGAAATTGTTCCAAGTATCGGCTTGTTTACGAATTAAATCGAAGTGGACTGCTGGCG ????ABB@BDD@@DDDGGGFDGHIHIIHIHIHHHIE=IHHHFHHIGIIIIADHHIIEHHGGHEHEIHIFHIHFIHIHIIEGHEFIFIIFHFIHF+FGGGDDBDDDDDBBB,=?A? 
+chr1-53 0 chr1 211 99 134=1X1=1X63= * 0 0 TGGTTTCATGGTTTTGTCTAACTTTATCGCTTTTACCGTCTTTCCAGAAATTGTTCCAAGTATCGGCTTGTTTACGAATTAAATCGAAGTTACCGTCTTTCCAGAAATTGTTCCAAGTATCGGCTTGTTTACGACTGAAATCGAAGTGGACTGCTGGCGTTATAACGCCTTTACCGTCTTTCCAGAAATTGTTCCAAGTA A??A?BBBDBBD?DBDCFGFGGFIIHHHHIIHHFHEBHIHHIIIH8HHH9IEIIAIHHGIHIH-BIEEFIIIIHHFHIIIIHDIHEHHIIHHIIHIHHC.HHHEHFGCD=C*GEHHFGGEGDGF@HFHFFHGEG,G,EGCEHBGD*GGFEG*FEEGEGEGCEGF:GD;G?EE=EEEE?GGEGGGAEFE:GCDEGGEEGEE +chr1-105 0 chr1 226 99 200= * 0 0 GTCTAACTTTATCGCTTTTACCGTCTTTCCAGAAATTGTTCCAAGTATCGGCTTGTTTACGAATTAAATCGAAGTTACCGTCTTTCCAGAAATTGTTCCAAGTATCGGCTTGTTTACGAATTAAATCGAAGTGGACTGCTGGCGTTATAACGCCTTTACCGTCTTTCCAGAAATTGTTCCAAGTATCGGCTTGTTTACGA ???A?B@@DEDD@DDDCGFGFGIFH?HIHEIFIG.HIFHHFCHGHIIHHCHEIHHHHIEIII:IF=EIGIHHIIIFHHIGHGHHHI+DHEIH@IHF7HDFFHHBAHFHIDIHGGADD@EHEEEEEGGEEGFG>EGCGIGGAGDGEEGFE'EGDFGEDFGFBC8DEGEAGEGGA8EEEAGGA?EEGEGGGEE6GEE??GEG +chr1-127 16 chr1 245 99 97=1X102= * 0 0 ACCGTCTTTCCAGAAATTGTTCCAAGTATCGGCTTGTTTACGAATTAAATCGAAGTTACCGTCTTTCCAGAAATTGTTCCAAGTATCGGCTTGTTTAAGAATTAAATCGAAGTGGACTGCTGGCGTTATAACGCCTTTACCGTCTTTCCAGAAATTGTTCCAAGTATCGGCTTGTTTACGAATTAAATCGAAGGAAGCGG FECGGGGFGEEEFEC?GGGFGGFGGG(E4;GGEGAEGECFGGAEGEECEG.=@GGEGGFEGEF7GGDDEDFFEH'F.GDDHEGHDHHFFFHHGHHHH*HHIHHIIHGIIIHICIBIHHHIIFIIBIIIDHH-HBH+HHEIIIIFHHHIHGIDEIIHIHHDIGHIHFIIHHCHHFII@CGFEGFGBDEDDADEB@BA???A +chr1-147 0 chr1 270 99 64=1X135= * 0 0 GTATCGGCTTGTTTACGAATTAAATCGAAGTTACCGTCTTTCCAGAAATTGTTCCAAGTATCGGTTTGTTTACGAATTAAATCGAAGTGGACTGCTGGCGTTATAACGCCTTTACCGTCTTTCCAGAAATTGTTCCAAGTATCGGCTTGTTTACGAATTAAATCGAAGGAAGCGGTAAAAATTTTTATTTTTTTTCTCAC ?=A?ABBBDDBDBADBFFFGGGIHHIFEHHHIIGHIIGDICFHHHAHIFIIIIHFFHHHIIIHH+IFIAHHEH5HICIHGIGFHIHIDIEIHIHGIEHHFIHGHHHHHHDHGGI6EFHF@HEHHGBGHGF@GHFEEEGGGHGEEGFGGEG9DCG8GGGGGEGECEGFFFEFF4GGGEFGGEGGGFGFFGCC8)GEEEGGG +chr1-83 0 chr1 271 99 200= * 0 0 
TATCGGCTTGTTTACGAATTAAATCGAAGTTACCGTCTTTCCAGAAATTGTTCCAAGTATCGGCTTGTTTACGAATTAAATCGAAGTGGACTGCTGGCGTTATAACGCCTTTACCGTCTTTCCAGAAATTGTTCCAAGTATCGGCTTGTTTACGAATTAAATCGAAGGAAGCGGTAAAAATTTTTATTTTTTTTCTCACT ??AAA=B@DDDDDDBDFGFG>GIHCIHHH9IIHIIHIGHIFHDIGHIIF?HGIGIIFFGHF?HIIFEHHIFIFGHHHGEIGICECIDGIHIFHF3FHEHIIIHCECHHGHHHGHHGGHHGFGGHHG-FHGEGGHGG9FGECC?GGGEEGAGEGF>GE?CBGFGFFGEFDGHE???/8EEGFCCEGE:6EECEG?GEG=GA +chr1-36 0 chr1 272 99 123=1X76= * 0 0 ATCGGCTTGTTTACGAATTAAATCGAAGTTACCGTCTTTCCAGAAATTGTTCCAAGTATCGGCTTGTTTACGAATTAAATCGAAGTGGACTGCTGGCGTTATAACGCCTTTACCGTCTTTCCACAAATTGTTCCAAGTATCGGCTTGTTTACGAATTAAATCGAAGGAAGCGGTAAAAATTTTTATTTTTTTTCTCACTT ???IHIIHHHHHF-HC/HIFFIFHAIHCIHHIIHGEFFIIHHCEIFGICIIIIHGI?GGGGCDDA@BDDDBABAA??? +chr1-136 0 chr1 280 99 200= * 0 0 GTTTACGAATTAAATCGAAGTTACCGTCTTTCCAGAAATTGTTCCAAGTATCGGCTTGTTTACGAATTAAATCGAAGTGGACTGCTGGCGTTATAACGCCTTTACCGTCTTTCCAGAAATTGTTCCAAGTATCGGCTTGTTTACGAATTAAATCGAAGGAAGCGGTAAAAATTTTTATTTTTTTTCTCACTTCTGTTACT ????ABBADD*HEHHFHHECHIHGDGHIIIFHII8HIHIIIH5I?=DHIFHHIFIFHHHH?HGGIHH,IHIIHIIIHIIFHFHIIHH-HGFIHIIII8CG?GEGDDDBDDDDBA??A??? +chr1-78 0 chr1 303 99 200= * 0 0 CCGTCTTTCCAGAAATTGTTCCAAGTATCGGCTTGTTTACGAATTAAATCGAAGTGGACTGCTGGCGTTATAACGCCTTTACCGTCTTTCCAGAAATTGTTCCAAGTATCGGCTTGTTTACGAATTAAATCGAAGGAAGCGGTAAAAATTTTTATTTTTTTTCTCACTTCTGTTACTCCAGCTTCTTCGGCATGGTTTTG ?AA????BDBGF.IIEIIIIEIHIIIIIEIIHIFGIHFIEFIHFHFHH-FEDFHDCHICHHI5HFGGHHFHIE4IIFGFFHHHI.HIHGIFIIFFCHHHIHFHHFHHGHHHFF@EEGBHH;>GHEA=GGGGEGEEEHGGGGFECGGFCGE;GFGGG1GFGFEAFGFGGFFFE*GFGF8GCEGGGGGGGFCF +chr1-111 16 chr1 315 99 130=1X69= * 0 0 AAATTGTTCCAAGTATCGGCTTGTTTACGAATTAAATCGAAGTGGACTGCTGGCGTTATAACGCCTTTACCGTCTTTCCAGAAATTGTTCCAAGTATCGGCTTGTTTACGAATTAAATCGAAGGAAGCGGAAAAAATTTTTATTTTTTTTCTCACTTCTGTTACTCCAGCTTCTTCGGCATGGTTTTGTCTAACTTTATC GG?GEE?GFGEECGGGGGEGFGGCEG;CGAC8FGFEGEG8FFGFGGEAEGAEAGBEGG*GGFFFHEEIHIHIGCIHHIEHHIIFCHHHHHH.HIBHIHHHHHIIIIHIHHIGICIHFA8HGGGECGEDDADDDIHIHFHEHHIGHHHHHHH+IFHIIHHGHEHCDHHIIIGFECIICDHIHEHIHIHHHHIF>IHHIHHHIFHH-IGHHGHIIHHIHIIEHIII;CGFGF@DBDBDBE>BB??=,? 
+chr1-146 16 chr1 351 99 200= * 0 0 TCGAAGTGGACTGCTGGCGTTATAACGCCTTTACCGTCTTTCCAGAAATTGTTCCAAGTATCGGCTTGTTTACGAATTAAATCGAAGGAAGCGGTAAAAATTTTTATTTTTTTTCTCACTTCTGTTACTCCAGCTTCTTCGGCATGGTTTTGTCTAACTTTATCGCTGGTTAGTTTCTTCACGCTTACCGTCTTTCCAGA GG*2GC?EGGCEEIIFIGGFFFFDD@DBIHFHIFHIFGBICHEHEFHIHHH5HFHIHHIFIDHHGBHHHHCHDFIFHH+IAHIHIHHFIHHIHDHHFIFHHFIHHIHHFHHFGHHFDFG2HBHFEEEFEF.GGHFEGEEEEAGGGGEGCGG=GGFC?GGEEGB?GGFG8GGEGGCGEEGFEGGDFAEGGA(CGAE +chr1-81 0 chr1 366 99 200= * 0 0 GGCGTTATAACGCCTTTACCGTCTTTCCAGAAATTGTTCCAAGTATCGGCTTGTTTACGAATTAAATCGAAGGAAGCGGTAAAAATTTTTATTTTTTTTCTCACTTCTGTTACTCCAGCTTCTTCGGCATGGTTTTGTCTAACTTTATCGCTGGTTAGTTTCTTCACGCTTACCGTCTTTCCAGAAATTGTTCCAAGTAT ?5A?A??B@DDDDDDDCFGFFGIHFCHFHIHIIHHIHHHHCHFHH8IHHHIHHHIHHHIFFFAFHHI5-HHCIIHFIFHFIHIFIHIH?HHGHHHFFHFFIIFHHHBHIHHH?HIHEHGEEDG8H@ECFGEFFGEEEEGE?GACEBAFGGGCGEDGFFG*?CEGGGGE=GGCFGEGGFEGIFF?IF-I?HIIEHIIHIHEHHHIFIIIB,IIH@?FEHIFHHIHIEFFFGFGDD@DDDEBBBB?A??? +chr1-48 0 chr1 385 99 200= * 0 0 CGTCTTTCCAGAAATTGTTCCAAGTATCGGCTTGTTTACGAATTAAATCGAAGGAAGCGGTAAAAATTTTTATTTTTTTTCTCACTTCTGTTACTCCAGCTTCTTCGGCATGGTTTTGTCTAACTTTATCGCTGGTTAGTTTCTTCACGCTTACCGTCTTTCCAGAAATTGTTCCAAGTATCGGCTTGTTTACGAATTAA IFIHIIHIIIIEFFE?GIGFHHH8HHIHIAHHFFIEIGIIFIIHIIHGIIHFFIFIHFGGFIHH=HH6IHHDFHHFFCHEH=G?HHHFHCHDHFGH=E,HGGB@CGEFGGGGHCGGGGEGGGGGEFGFGGEGEGGFEA:A=GGGGG??G;EGC;IHCCIIIIIIFIIIAHAGHFHEFIIGI@G,BDGEFFIIIHHEFHIFIIHEDCFHICHHEIHF,IHFFECEHHGIIEFHBHHEHDHHEBFFIHHIHHEB?EEHHGGHGHGGGF4FGF?GGECGEGGCGGEG:FFG?EGGEEGGGGFFEGEGGFFCE?EGGGGG?EGCGG?GAGG:GEF( +chr1-8 0 chr1 396 99 99=1X100= * 0 0 AAATTGTTCCAAGTATCGGCTTGTTTACGAATTAAATCGAAGGAAGCGGTAAAAATTTTTATTTTTTTTCTCACTTCTGTTACTCCAGCTTCTTCGGCAAGGTTTTGTCTAACTTTATCGCTGGTTAGTTTCTTCACGCTTACCGTCTTTCCAGAAATTGTTCCAAGTATCGGCTTGTTTACGAATTAAATCGAAGTAGA 9????BB8DBBED?DDAGFFFGIIIAHHIFIIHHHHFHHIHIIIIIHIH-GIIAHHCII+CHIH-HEFIIEFHA5HIHHHHIEHIHBIHIIHHI0HFEHBIIFH.F.HHGBHBEHHH7HD1GGGEGEGG=GG6HE;EEGCGGGGBGGGGE;GGGECEGGAGEGGECGGFGGEFGCGEGG+CGG=E?EGG6GEEGCGG4GE +chr1-140 16 chr1 399 99 96=1X103= * 0 0 
TTGTTCCAAGTATCGGCTTGTTTACGAATTAAATCGAAGGAAGCGGTAAAAATTTTTATTTTTTTTCTCACTTCTGTTACTCCAGCTTCTTCGGCAGGGTTTTGTCTAACTTTATCGCTGGTTAGTTTCTTCACGCTTACCGTCTTTCCAGAAATTGTTCCAAGTATCGGCTTGTTTACGAATTAAATCGAAGTAGAACT EGGCGC<*GEGGCA6-GGGEEGGEGF:GG??EAG?GEGEEDFGCEEEEEGE(GFECGGGEHFBFEFEHFHG<=EHHHF@F7HHHHFGGI?FHFHFF+GFGHHEAHHIHGFHGFGFEHHFHIHGIIIBHHIFIDHEIFHI=*HCAIIIIIHFIIHIAHHHIIHHHHHIFIHIIHHCIAHGGGGGG@DDDDDBD9>B?A??? +chr1-109 0 chr1 404 99 200= * 0 0 CCAAGTATCGGCTTGTTTACGAATTAAATCGAAGGAAGCGGTAAAAATTTTTATTTTTTTTCTCACTTCTGTTACTCCAGCTTCTTCGGCATGGTTTTGTCTAACTTTATCGCTGGTTAGTTTCTTCACGCTTACCGTCTTTCCAGAAATTGTTCCAAGTATCGGCTTGTTTACGAATTAAATCGAAGTAGAACTTCATG ?????B?9EFHHHGGHGGFHG=HHHHHFF?H6EHGBHIFGHFF+FCEGGHGFDEGHHHGFHHFIHGFHIHC=FIHHHHIFHHIHHHGHFHIIHIIIHHHIHDFHHHIGIHHFI=AIHHHHGDIHHHHHIHIIIIIDHFIHHHFFHHF-HHFGGGEGDDDDDDBDBBBA???? +chr1-126 0 chr1 440 99 200= * 0 0 AGCGGTAAAAATTTTTATTTTTTTTCTCACTTCTGTTACTCCAGCTTCTTCGGCATGGTTTTGTCTAACTTTATCGCTGGTTAGTTTCTTCACGCTTACCGTCTTTCCAGAAATTGTTCCAAGTATCGGCTTGTTTACGAATTAAATCGAAGTAGAACTTCATGTGCCTGTAAAACGAAGCGGTAAAAATTTTTATTTTT ??????BBDDDDDEBDFG?B>FIHHFC;HHGEIHHHIFHH:GFHGHIHEIHFHHHIIHIFI+HIHIHFIIHIEIHHCHIFHHHIEIHIHGFHGHFIFHIFHHFHEH+FCHHGGHEHHHGF7HHFFBCGGBHEGAGGGG9GGFEEFGHEEGGEEGGGGGFGGEGFFGEEGEEEGGGFCGGFEGGGFGGEECGEGG/AFEF? 
+chr1-122 0 chr1 444 99 176=1X23= * 0 0 GTAAAAATTTTTATTTTTTTTCTCACTTCTGTTACTCCAGCTTCTTCGGCATGGTTTTGTCTAACTTTATCGCTGGTTAGTTTCTTCACGCTTACCGTCTTTCCAGAAATTGTTCCAAGTATCGGCTTGTTTACGAATTAAATCGAAGTAGAACTTCATGTGCCTGTAAAACGAAGAGGTAAAAATTTTTATTTTTTTTC ????FIIICEHCH7IGIIDHHHFGIIH>EDIIIHIDHI=HIHHFHHHFGHHI=IEIHH-HIIGHH5HIHHGHDIHHFDHHHFHHIHHFCHHHHEF?EHHHHDFH3BFEECHHEEGEGEGGHFGGG0GH*GGGGEFGEG?G0GGEECG=FE/EGG:GGGGGEGE9GGGEGG9GGGECG8EE +chr1-128 0 chr1 465 99 200= * 0 0 CTCACTTCTGTTACTCCAGCTTCTTCGGCATGGTTTTGTCTAACTTTATCGCTGGTTAGTTTCTTCACGCTTACCGTCTTTCCAGAAATTGTTCCAAGTATCGGCTTGTTTACGAATTAAATCGAAGTAGAACTTCATGTGCCTGTAAAACGAAGCGGTAAAAATTTTTATTTTTTTTCTCACTTCTGTTACTCCAGCTT ?9???BAABDEDDDDDGGFGFEIHIBIHIIHHIIH@GIHHCGHIIFHIIIHGIFIIGHEFHHHFHIFHHHDHIHHIHIHHI+IIFHHH7HHHGFHHCHGHFHF=HHHHHFHGFHCGDHHDFGGGHBFHHGGCEGDBFGGACFFFEGGEEGGGGBEFEGFAG;EGGF0EEGFGD86FGGG1GFGFGA8GGF8GGEEFGFGC +chr1-158 16 chr1 472 99 48=1X151= * 0 0 CTGTTACTCCAGCTTCTTCGGCATGGTTTTGTCTAACTTTATCGCTGGGTAGTTTCTTCACGCTTACCGTCTTTCCAGAAATTGTTCCAAGTATCGGCTTGTTTACGAATTAAATCGAAGTAGAACTTCATGTGCCTGTAAAACGAAGCGGTAAAAATTTTTATTTTTTTTCTCACTTCTGTTACTCCAGCTTCTTCGGC EF?EE:.60FGE6EGAEE*GE:G*+GGAEECGC;EE4EEGFEGGGEBF0GCE;GEGFEGEABEG2H1FHHHGGEGEFEFGHEDEFHH@FH+FCHHH5DHGFHIFIHIHHDHHIGGGHEB-IHHHHIDIIIH=IGGFFIFIFFHHIFFHHHHECIHIIHGIIEIHEHIHIAHIHFHFIIGFFGGFGIICAIHIIIIHDIEFAIHHHHHHIIHEHIFHIIHIIIIHHHCHHFIH>HIHIH5IFHIHH4IFIHIIFHHHGHHIHFHHHHGGIGBDIHHGHHHHEHHFFCBHGFGFGBEEGGGF5GG*GFFGEEFFGCGEEGB'FGEBGGEFE/=EGGEEEGGG?F::GGEGGFGEEEFEE*EGGEEAC?EEEG?ADGGGE8BBG8;DGEGFEHII=IHIIHHIHCAIH@HGFIHI>IFHHDHHHGEHFHFE?IIHIIHDIIHFII=IHFHEHIHIAIGGHHHHFF*IEHBDGGFDFFH7HED,HHHFBHI9HDIHIHHHBDIHHHI@HHFIDIFIIFFIHIIEIHIIIHFIHFHIHHIII*IIIIIHECFIIIIIHHHG6IFHCHFHICHHCFHHEHFFHGCGF;GHGEEGEGEEDFHCGG*GGGGCFGFEEGGGGGGFG;EAGFFG*F6G?:E:G0CEGGFEEFDC>:G*?GAGEGGE +chr1-5 16 chr1 496 99 200= * 0 0 GGTTTTGTCTAACTTTATCGCTGGTTAGTTTCTTCACGCTTACCGTCTTTCCAGAAATTGTTCCAAGTATCGGCTTGTTTACGAATTAAATCGAAGTAGAACTTCATGTGCCTGTAAAACGAAGCGGTAAAAATTTTTATTTTTTTTCTCACTTCTGTTACTCCAGCTTCTTCGGCACAAGTACCAACCAGAACGTGAAA 
G0*F:C*GGG*GG>D6EGEGEGE:FFGGGGGEGGGAEAG?GGFGGGGGDFEEEGEGGG:E.GGGFFEDEHGHDHE@FDEH@G:GHHHGHEHEGFHFEFHFHHHCHDIHAHIHIHIHIHIHIHIFBGHIHIHIAHF;AGIHIHIHHGHHIHIHHHHFIHFIIEH>HIGHHHIHIHICHEGF7F>FDEE@D@BDBBBA???? +chr1-49 16 chr1 501 99 200= * 0 0 TGTCTAACTTTATCGCTGGTTAGTTTCTTCACGCTTACCGTCTTTCCAGAAATTGTTCCAAGTATCGGCTTGTTTACGAATTAAATCGAAGTAGAACTTCATGTGCCTGTAAAACGAAGCGGTAAAAATTTTTATTTTTTTTCTCACTTCTGTTACTCCAGCTTCTTCGGCACAAGTACCAACCAGAACGTGAAAAAGCG CAGGEGEGGGEGE?GGECE4GGCGG?BGEFGEGGEG:GEEFGE'FEEDGEGGE:CEGGG8GGGGEGAE0EGFC0FGEGG +chr1-33 0 chr1 528 99 174=1X25= * 0 0 TTCACGCTTACCGTCTTTCCAGAAATTGTTCCAAGTATCGGCTTGTTTACGAATTAAATCGAAGTAGAACTTCATGTGCCTGTAAAACGAAGCGGTAAAAATTTTTATTTTTTTTCTCACTTCTGTTACTCCAGCTTCTTCGGCACAAGTACCAACCAGAACGTGAAAAAGCGTTCTGCGTGTAGCGTTTATGTTGGTTT ?5A??BBBDDDDDBDDGGFGFGHIIIIHIIHHIHIHGFIIHHGHIHHIDIGHIIDIHCEHIH=IIIFFIIEHHHIHG7EHHGEFFDEFGEEGGHHHCIEHIIFFHH?HH5EFDGHIIHI)DHIHHEHHBHIIHC=?HCH+DHFF?HBHFIHFHGHIHFGHHFGFFGG+GB,GHEHH82GEIEGFGEFEG)GGFEE/ECG/AGCFEF+E;:CGEGF=EGECG?:EFE +chr1-95 16 chr1 606 99 64=1X5=1X129= * 0 0 CCTGTAAAACGAAGCGGTAAAAATTTTTATTTTTTTTCTCACTTCTGTTACTCCAGCTTCTTCGACACAATTACCAACCAGAACGTGAAAAAGCGTCCTGCGTGTAGCGTTTATGTTGGTTTCATGGTTTTGTCTAACTTTATCGCTTTTACCGTCTTTCCAGAAATTGTTCCAAGTATCGGCTTGTTTACGAATTAAAT (?GGE;GGG:GEGEFECC?AG?GGGGEAEGGEGGGE?G'GEFGEDEE?FGC*EEEGEGF>GGEFGHEFFF*HEECBHEHGGHHHHGBFHHHGDGDFHHHHFHHDHIEHHAHIIGHHHHHHHFFIIGIIHIIEFII;FCIIDHDGIGAIIHHIFIIDIE@HHIFFIIHHIHIIIIFIHIGEEFGDBD?DDBBD@BB?A,?? 
+chr1-123 0 chr1 609 99 189=1X10= * 0 0 GTAAAACGAAGCGGTAAAAATTTTTATTTTTTTTCTCACTTCTGTTACTCCAGCTTCTTCGGCACAAGTACCAACCAGAACGTGAAAAAGCGTCCTGCGTGTAGCGTTTATGTTGGTTTCATGGTTTTGTCTAACTTTATCGCTTTTACCGTCTTTCCAGAAATTGTTCCAAGTATCGGCTTGTTTACGGATTAAATCGA ??AAAB?BII5HHFEHHHFIFGIIHIHHHHFHIGIHIHHHDHEHIFEHHGFIHFHFF>HHF@FCFEHEGGHGEHFDEGG3IGIGCFGEGGE/GGBDGGEFFEEGEGGFEFGEEFGG?G;GGEGEGGGGG>EEEF*GCGAEEGGGE +chr1-23 0 chr1 622 99 122=1X77= * 0 0 GTAAAAATTTTTATTTTTTTTCTCACTTCTGTTACTCCAGCTTCTTCGGCACAAGTACCAACCAGAACGTGAAAAAGCGTCCTGCGTGTAGCGTTTATGTTGGTTTCATGGTTTTGTCTAACGTTATCGCTTTTACCGTCTTTCCAGAAATTGTTCCAAGTATCGGCTTGTTTACGAATTAAATCGAAGTTACCGTCTTT ,?AAABBBDDDDDBB@FGGGGFIHFFIIIHIIIIHIGHIHIHIHH=H+IDIIHIFIICHHHHFHFIHHFDAEHIHIIIII=IIHHIGH/I7HFFEH;HIFHIG?HH3HHIHHHGGFFHHFGH,H@DDBG:EEHGEGGEGFEEEEGGGEGEGECG:EGEEFEGGEFEIHHI?IHIIIHHEHFG@8.IIFIIIIIIIHHIHHHFFIGAICHIHEHHHIIIFEFFCFBDDBDDBDB??????? +chr1-59 16 chr1 657 99 194=1X5= * 0 0 TCCAGCTTCTTCGGCACAAGTACCAACCAGAACGTGAAAAAGCGTCCTGCGTGTAGCGTTTATGTTGGTTTCATGGTTTTGTCTAACTTTATCGCTTTTACCGTCTTTCCAGAAATTGTTCCAAGTATCGGCTTGTTTACGAATTAAATCGAAGTTACCGTCTTTCCAGAAATTGTTCCAAGTATCGGCTTGTTAACGAA EG*GG'?GGGCEGG*GE;E+A:GEEEFECGCG,*FGEFGEGEE?EGFFGE;GGFG.DG?FGCB2GHFHHD?F@FGHHEFCGGHHFDHHHHGHHDHHBFHHBHIFHFHIHIEIFIIHGIFDHGEIBHIIEDHIHHIHHHIIHHAHHIHFHIIIFIIHFIGHIIDIFDIIDHIIIGEHFHFGGFDGDDBD@DBEB-B?,??= +chr1-2 16 chr1 658 99 15=1X184= * 0 0 CCAGCTTCTTCGGCAAAAGTACCAACCAGAACGTGAAAAAGCGTCCTGCGTGTAGCGTTTATGTTGGTTTCATGGTTTTGTCTAACTTTATCGCTTTTACCGTCTTTCCAGAAATTGTTCCAAGTATCGGCTTGTTTACGAATTAAATCGAAGTTACCGTCTTTCCAGAAATTGTTCCAAGTATCGGCTTGTTTACGAAT EGF(EDGGGEFGEFF1AF?G<:A6G?DFEGEFEE*EEGE*G*EEE(GEE9G9F/G*GEDGE;F:GE=FGEGGGEFHGHHFGGEGEGHHHEGGFDIGHHHFHHDHHHEEGFECGIIHHHHHIFHIHFIH>FDCIHHHFI8FIHHIFDI0IGEDHFDGFHFIHHIFHHHAIIIIEHEFHHGGGGGFED?BHGHEG>/H?FEEG*EGFEEE?G?EFGEG*GGGEGC=GD-GGEEEEGEGGFA9CEEG?GF?GE<:CEA?FC>EFE +chr1-118 0 chr1 678 99 200= * 0 0 
ACCAACCAGAACGTGAAAAAGCGTCCTGCGTGTAGCGTTTATGTTGGTTTCATGGTTTTGTCTAACTTTATCGCTTTTACCGTCTTTCCAGAAATTGTTCCAAGTATCGGCTTGTTTACGAATTAAATCGAAGTTACCGTCTTTCCAGAAATTGTTCCAAGTATCGGCTTGTTTACGAATTAAATCGAAGTGGACTGCTG ?????BB?DDBDBDDDFAGF;FEHIHFIHHFIDIAHEHHIIIHIHHHIH?EHFF9AIFIFHECHIEBIHHIHHHHIIIIFIIHICH?IIIHHEDCH?HEH;HHHHHFHHE,HGEHGEEGECF?EGDGG8*F=GBGGGDGFFGEC?EGEFGGG?G(GGGE*GG?GIII/IIHGGGFGADDDBDDBDB>HIHI=HIAFAHHFHHHFHIHHHIHIIHHHIHIHIHHHHHHHEEHIHEIIIGHFFI-FGHI8IHHHHFDHIHDIIHHGHHGHHHH8HHEHFHHBGGH/GHGGGHFFGDIFGECF*@GG;GFEGEFEGEFF?C:G;GEGGCCFFE9FFG?FEFGCGEGGG=EGEEFEGG:G2ED +chr1-107 16 chr1 695 99 74=1X125= * 0 0 AAAGCGTCCTGCGTGTAGCGTTTATGTTGGTTTCATGGTTTTGTCTAACTTTATCGCTTTTACCGTCTTTCCAGTAATTGTTCCAAGTATCGGCTTGTTTACGAATTAAATCGAAGTTACCGTCTTTCCAGAAATTGTTCCAAGTATCGGCTTGTTTACGAATTAAATCGAAGTGGACTGCTGGCGTTATAACGCTGGTT GE;GEFGEGFGEF:GG;FGG?GGGEG.?FEGECFGGGEFGGGGGGCGEE3GEFGGCEGEC@CFEGGE@EGHCGF.GHHFCGHFFHDHDHFHHFH?HFHDDIHDDHFGHGHIDHFHHHHHIIIIHHHHFHH-IIIIIIIIF@HHIIG.IHHEHGFIHI>FIIEIIII+IIHIEIEIIIHG>FGFGBDBBD?DD?.B???A? +chr1-72 16 chr1 698 99 86=1X113= * 0 0 GCGTCCTGCGTGTAGCGTTTATGTTGGTTTCATGGTTTTGTCTAACTTTATCGCTTTTACCGTCTTTCCAGAAATTGTTCCAAGTACCGGCTTGTTTACGAATTAAATCGAAGTTACCGTCTTTCCAGAAATTGTTCCAAGTATCGGCTTGTTTACGAATTAAATCGAAGTGGACTGCTGGCGTTATAACGCTGGTTTTG *E?FEGGGGG?GGEE:EGEGFGGGGB????? 
+chr1-114 0 chr1 699 99 157=1X42= * 0 0 CGTCCTGCGTGTAGCGTTTATGTTGGTTTCATGGTTTTGTCTAACTTTATCGCTTTTACCGTCTTTCCAGAAATTGTTCCAAGTATCGGCTTGTTTACGAATTAAATCGAAGTTACCGTCTTTCCAGAAATTGTTCCAAGTATCGGCTTGTTTACGAGTTAAATCGAAGTGGACTGCTGGCGTTATAACGCTGGTTTTGT ??=??BBBDEDDDD@DFG>>FFIHIHIIHIICHIIHHFF7FIHHHHEAHFCIHIHGF@IHIIHBHHHFIIGIHIHDFHEIIFHFEIHH*HIHEHHI?EGGECDEGGGEGFGGC*GGGEACFGHHHFFF+GFCEFHHHDH+FHEHFHHHIGFHIHHHHI>IH-HHHHIIIEIIHIIHHFHHHH@HFHHHH=HIHIHHIID@IAIIFIFGIIG@HH@ICH,IHIF/EIFG;AFCD?DEHEEF6GEA3CFEGEF(FGBEBFHEGG;GGCGGFG:GGEGGFA*EFFE*AFEEGDGF6G?GGGCFGE:EGGC +chr1-31 0 chr1 736 99 78=1X16=1X104= * 0 0 TGTCTAACTTTATCGCTTTTACCGTCTTTCCAGAAATTGTTCCAAGTATCGGCTTGTTTACGAATTAAATCGAAGTTAACGTCTTTCCAGAAATTCTTCCAAGTATCGGCTTGTTTACGAATTAAATCGAAGTGGACTGCTGGCGTTATAACGCTGGTTTTGTCTAACTTTATCGCTGGTTTTGTCTAACTTTATCGCCC ??=??B9?D?DEDDDBGGE+GFIHIHHHI>HHFHAHICHHEGHHIIIIHIIECIH+FIHIIIFDHFHFHIHHD)ICHI'@HIFHIIHIH=IHIIHEFDHHI@IA@IEHHDHF@HHHHGHFGGHFFGGGG@EGCDGDC*GGCG=EG*:EGGGEEGGGEEECFGGGGGGHGGG.FGEDGEGFGGGGGGGGGFGA(GFCF/ +chr1-76 0 chr1 791 99 200= * 0 0 GTTTACGAATTAAATCGAAGTTACCGTCTTTCCAGAAATTGTTCCAAGTATCGGCTTGTTTACGAATTAAATCGAAGTGGACTGCTGGCGTTATAACGCTGGTTTTGTCTAACTTTATCGCTGGTTTTGTCTAACTTTATCGCCCTGTGGCCTGTTGATTCTAAATGGTTTTGTCTAACTTTATCGCTTTTACCGTCTTT ????,B?BDDDBDEDEFGFFFEIFIHHIIFH7I@IIH7IHIGIHGIHIHIDI;A7IHHHFI?FHCCGHDEFIHIHHHIHAIHIIHIHCGEHIEHHFHIIHIEHGDCIH)FHHHHHEG@FHEGHFEEG3@GG9GFEIGEGGGFEEEHGG;GGEGEGGGE*GGGGGECG*FEGA*8FE6A4>?GEG(:GGEGEEGCA0EG8G +chr1-19 0 chr1 796 99 125=1X74= * 0 0 CGAATTAAATCGAAGTTACCGTCTTTCCAGAAATTGTTCCAAGTATCGGCTTGTTTACGAATTAAATCGAAGTGGACTGCTGGCGTTATAACGCTGGTTTTGTCTAACTTTATCGCTGGTTTTGTGTAACTTTATCGCCCTGTGGCCTGTTGATTCTAAATGGTTTTGTCTAACTTTATCGCTTTTACCGTCTTTCCAGA EIHHHHHHHHIIHI7HHHCHIIHG=GIHIIHIHDFIHHHI-FIHDIIHGIIFHHHHIHDHGHHIIIIGHFFHHCHHIHFEFEHHHIHGGHIHFGGEEGGEFGC)EEGB6GEF?GG?EEEG:FCGGEG +chr1-56 16 chr1 881 99 44=1X155= * 0 0 
TTATAACGCTGGTTTTGTCTAACTTTATCGCTGGTTTTGTCTAAATTTATCGCCCTGTGGCCTGTTGATTCTAAATGGTTTTGTCTAACTTTATCGCTTTTACCGTCTTTCCAGAAATTGTTCCAAGTATCGGCTTGTTTACGAATTAAATCGAAGTTACCGTCTTTCCAGAAATTGTTCCAAGTATCGGCTTGTTTACG CAGFEEGEGGGDGE:*EGAG>EGGEBGFGE;GGEGGG6FFGGCG(EGEGG@E7GGGEGEEFGGGGGE:?HEEGHHGHCEDHGHDFCGI=HHHIHHHHHHHGHHI8HHHHIHHCHIHAIHHIIFFA,55BEFHHIHHFHCIIIIIH+II+IDHIGF@IIIIHHICIIHGIFF9HIII+HGG2GFGDDBDDDDDBBB???CG6FGEGEG:GEC)GGF)EGECGGGGGGE(:G0GGFFGEFGGGFFGEGGBCGEGGBGGGGHE6F@G77;GGFFC?HHEGHHFHE?IG?HEHGFGH?HHFHFHGHEIGAHD,HHII+EGHHIFIGIBIIFIHIHHFCHF@IICIHIHHIHGHHHIHIIDHHFIHHE-AHHIEHHHIC>FFGGGEDEDBDDDDBBB???=? +chr1-50 0 chr1 904 99 200= * 0 0 TTTATCGCTGGTTTTGTCTAACTTTATCGCCCTGTGGCCTGTTGATTCTAAATGGTTTTGTCTAACTTTATCGCTTTTACCGTCTTTCCAGAAATTGTTCCAAGTATCGGCTTGTTTACGAATTAAATCGAAGTTACCGTCTTTCCAGAAATTGTTCCAAGTATCGGCTTGTTTACGAATTAAATCGAAGTGGACTGCTG 5???A?BBDBDDDBDDGFGDFF7HIIFFIEHIHIIH@HIIIGHHHBIEHIGIEGG@IHGIIIHFIGHIIHIHICACE>FIIHHIII=IHHHDFFG*HIHGFHIIHI=H+FHHHBHHIHFFEHGFDHFGGE?AG'FFGEEBEGFIIGI;I-IHIIHFFHIHIEHEGFI.HIHHIHFHD?H9@HHHGH@HF)FEDBFFFEFGEAEEHFI?GGAGEGFGFGGGG0BGAFEFGGECGGEGDEGGA3FFG?ECG8?E:ECCGEGGC>G:GEG6GGG +chr1-6 0 chr1 971 99 120=1X79= * 0 0 TTATCGCTTTTACCGTCTTTCCAGAAATTGTTCCAAGTATCGGCTTGTTTACGAATTAAATCGAAGTTACCGTCTTTCCAGAAATTGTTCCAAGTATCGGCTTGTTTACGAATTAAATCGCAGTGGACTGCTGGCGTTATAACGCCTTTACCGTCTTTCCAGAAATTGTTCCAAGTATCGGCTTGTTTACGAATTAAATC ????ABB<:DDDDDDDFGGGFGHIFBHIICGHHIIHHGHHIHIHIAFEIFCFIHCIHHIHIFHFFFHHHEIGHIIHICHHFHIADI=HH+IDFHGHIIIHCIHHHH>FHHHHFHHGG,@H->:EGFGGFGHFFG>IEBDGG8G?GGFCGG?GGA?EFGGGEGEGGEGGGGGEGGEGFGGEGGEE(EGF;GEEFG2CCG?G +chr1-93 0 chr1 973 99 95=1X66=1X37= * 0 0 ATCGCTTTTACCGTCTTTCCAGAAATTGTTCCAAGTATCGGCTTGTTTACGAATTAAATCGAAGTTACCGTCTTTCCAGAAATTGTTCCAAGTATGGGCTTGTTTACGAATTAAATCGAAGTGGACTGCTGGCGTTATAACGCCTTTACCGTCTTTCCAGAAGTTGTTCCAAGTATCGGCTTGTTTACGAATTAAATCGA 
???A?BBADDDDDBD@>FGFCFHHHIHIIHFIGIHIIGCEIIIHIIIIEHFFHHHFHIIHHBCHIHHHIHIIHHGGGIGHGHHIIFDHA7IHC+I,HHHHIGGEIHHFHHHHEFHEGHHGHGI@GH@EFGHE;EF,GIEFGGEHEEDGEGEDGEEEEEGG?F;CGGCGFEEEEGEGGFFAEGE;EGEGBBDD?BBDDDGGFGGFHIHCHFFAIHIHHCHIHIIIIIHHIGFEIAHHIAHHHHHA5HHHHIFFIIIIIECHHGIHHFHGG?IHHHHH.EDHDGHIFHH=HHHEBFGGHDHHEGGH=DG>EGGFHFEEB?EGGG?'EGEGGBG/GEGGFFGG?FD?0GEBGG;GGCGGG1GGAFGGGFGC*E-?.DC8GFCFCE +chr1-154 16 chr1 984 99 200= * 0 0 CGTCTTTCCAGAAATTGTTCCAAGTATCGGCTTGTTTACGAATTAAATCGAAGTTACCGTCTTTCCAGAAATTGTTCCAAGTATCGGCTTGTTTACGAATTAAATCGAAGTGGACTGCTGGCGTTATAACGCCTTTACCGTCTTTCCAGAAATTGTTCCAAGTATCGGCTTGTTTACGAATTAAATCGAAGGAAGCGGTA GFGAGGECCGGEE8GGE4CGGGCCGFGE)6GFGGGGGEEGFGGGGFGE=FGGCGEEFGEFE*GABFEGGFDH?D*GFCGFEDGHAFH4HGHEH;HFHIHHGFHIFAGGCFBDBDDDDDB?B????A +chr1-32 16 chr1 984 99 2=1X65=1X131= * 0 0 CGACTTTCCAGAAATTGTTCCAAGTATCGGCTTGTTTACGAATTAAATCGAAGTTACCGTCTTTCCAGGAATTGTTCCAAGTATCGGCTTGTTTACGAATTAAATCGAAGTGGACTGCTGGCGTTATAACGCCTTTACCGTCTTTCCAGAAATTGTTCCAAGTATCGGCTTGTTTACGAATTAAATCGAAGGAAGCGGTA E(*F=EG*GGGEC?FGA>EEE>GE:>:EF>EGGGG=GGAEGGGFGEEGGEGG0GEGGGCGDG3GG?HE'FGEGFDEGHCHFHHFDFGHHHHGHIHHCHHHHE8HHFDIHGEIHG-FHIHHIIHGIGIHIHIFHIHIHIIIHIIHHEIGCIIHIHHHHCHIFIIIDHDIFIIFFIHHCFGGGFGFEDDDDDDDBBB????A +chr1-150 16 chr1 987 99 34=1X165= * 0 0 CTTTCCAGAAATTGTTCCAAGTATCGGCTTGTTTTCGAATTAAATCGAAGTTACCGTCTTTCCAGAAATTGTTCCAAGTATCGGCTTGTTTACGAATTAAATCGAAGTGGACTGCTGGCGTTATAACGCCTTTACCGTCTTTCCAGAAATTGTTCCAAGTATCGGCTTGTTTACGAATTAAATCGAAGGAAGCGGTAAAA GBEEEGEAFGHFGBGHGFDHHHBGHFIHH?HHHH?F?HFD3HHHHGIHHHIGIIHGIIIIHIHHIH?IHHHFFHIIIHIGHIIH8HH?HIEIFFHIIHHHGCHGIHCHIIHAIFCG;FGGDEDDDDDDBBBA?A?? 
+chr1-90 0 chr1 1006 99 126=1X73= * 0 0 AGTATCGGCTTGTTTACGAATTAAATCGAAGTTACCGTCTTTCCAGAAATTGTTCCAAGTATCGGCTTGTTTACGAATTAAATCGAAGTGGACTGCTGGCGTTATAACGCCTTTACCGTCTTTCCATAAATTGTTCCAAGTATCGGCTTGTTTACGAATTAAATCGAAGGAAGCGGTAAAAATTTTTATTTTTTTTCTCA ?????BBBDDDDDEDDFFGFGFHII;HICHEI=IFHHEFIHII,IHIH+III+CHIDIHFHH5HHFIIHIHIIFIIIIGIHBHHEIGGHIHIHHGHH:HAIAIIFHH>H@HFDFHF?DGGH?GEGH+EHFEHGEGGDGHGGGCG,6@?CGG?GEEECEG?G,/FEGEGEEF;AGGCGGEGG*:EEEGFGEGGFGEGFGEG +chr1-135 16 chr1 1007 99 200= * 0 0 GTATCGGCTTGTTTACGAATTAAATCGAAGTTACCGTCTTTCCAGAAATTGTTCCAAGTATCGGCTTGTTTACGAATTAAATCGAAGTGGACTGCTGGCGTTATAACGCCTTTACCGTCTTTCCAGAAATTGTTCCAAGTATCGGCTTGTTTACGAATTAAATCGAAGGAAGCGGTAAAAATTTTTATTTTTTTTCTCAC GGGE:G:FGGGEG6*,E:EGGEGGECGEGEC9DGE-3EFAF@HGGGH,HG@BHHHHCFFDHGHEH3HIIHFIHEIH+EIHIHFIHHHIHIHIHIHIEEI-IAC-FHHHHHH>IHDHFIHIHHDIHHFEHHIIIHHIG>CHIIIFHFGFF;GD-DDDBDBBBB????? +chr1-144 16 chr1 1008 99 200= * 0 0 TATCGGCTTGTTTACGAATTAAATCGAAGTTACCGTCTTTCCAGAAATTGTTCCAAGTATCGGCTTGTTTACGAATTAAATCGAAGTGGACTGCTGGCGTTATAACGCCTTTACCGTCTTTCCAGAAATTGTTCCAAGTATCGGCTTGTTTACGAATTAAATCGAAGGAAGCGGTAAAAATTTTTATTTTTTTTCTCACT AEGGEGEGFGEG'?EEABE?*E;EF?EGGEE/+GFEGEGEC1EFGEGGGC2GG +chr1-54 0 chr1 1044 99 152=1X47= * 0 0 CTTTCCAGAAATTGTTCCAAGTATCGGCTTGTTTACGAATTAAATCGAAGTGGACTGCTGGCGTTATAACGCCTTTACCGTCTTTCCAGAAATTGTTCCAAGTATCGGCTTGTTTACGAATTAAATCGAAGGAAGCGGTAAAAATTTTTATTCTTTTTCTCACTTCTGTTACTCCAGCTTCTTCGGCATGGTTTTGTCTA ???=ABBBDDD9DDD@GGCFFFHDHFIFIIHHIFHIHIGHHCHDIIFHIGDIHH9IIIEHIIIIIHIHH5IICHIIFCHIHHIICIIIIIHHHGGHI=DF@@CDHIIHCGHGHFF:EEH*DEGHGHGEHGGHGG@EGHIIIE/EHDCIICIIIHICHHHGFGFFFEGBDDDDDDHIGHIIIHIFB?IHFFFDGCG@GDDDDDBDD-+BA?A?? 
+chr1-21 0 chr1 1066 99 200= * 0 0 ATCGGCTTGTTTACGAATTAAATCGAAGTGGACTGCTGGCGTTATAACGCCTTTACCGTCTTTCCAGAAATTGTTCCAAGTATCGGCTTGTTTACGAATTAAATCGAAGGAAGCGGTAAAAATTTTTATTTTTTTTCTCACTTCTGTTACTCCAGCTTCTTCGGCATGGTTTTGTCTAACTTTATCGCTGGTTAGTTTCT ?????95BDDBDDDBEGCGGGCICBIIHFHIIHHHFHHIHDFIHIIHH@H?IHIIHHHIIIIIGHEHIHHHIHHGHHIIHEIEHII,HHIFGIIHFCDFHHHHF4HHFHFHHDHFHHFFFEGG@FEEFEFEHDGDDEGFG@EGEAGEGDFEF6GFFAGHFECEGGGGCEE=FGGGGG;GGG*EGGG?6G?F?E*GCGFE? +chr1-133 16 chr1 1120 99 200= * 0 0 ACCGTCTTTCCAGAAATTGTTCCAAGTATCGGCTTGTTTACGAATTAAATCGAAGGAAGCGGTAAAAATTTTTATTTTTTTTCTCACTTCTGTTACTCCAGCTTCTTCGGCATGGTTTTGTCTAACTTTATCGCTGGTTAGTTTCTTCACGCTTACCGTCTTTCCAGAAATTGTTCCAAGTATCGGCTTGTTTACGAATT GF1ECG4:GGABG:GE??FGGHEFHHHDFHHHCHEHH?HIIIHIEIHIDHIEIHHIHHFHHHIHIDIHFIFIHIHHIBIIHHIGIDH>IIIBHHHHIIHHGHHG8FHIHHHHGGGGFGBDDBDBDDBBBIHIHIIIHIHIIIHHHHIIFIIH,IIIFHHFHIIIIIGGIIIIHHFDI?-F>II?IHIIIDEHI.CHIHIHFIGHFHIFHHGHHFHFHGEHGFEGFEEDGEHHDDGFGGGEFCHAEGEEAGAGGEDEGFFEGEEGFGECG7F=CFCGCGGEE0GCECF6GGEEEGCGGF6EGGE +chr1-43 16 chr1 1135 99 200= * 0 0 ATTGTTCCAAGTATCGGCTTGTTTACGAATTAAATCGAAGGAAGCGGTAAAAATTTTTATTTTTTTTCTCACTTCTGTTACTCCAGCTTCTTCGGCATGGTTTTGTCTAACTTTATCGCTGGTTAGTTTCTTCACGCTTACCGTCTTTCCAGAAATTGTTCCAAGTATCGGCTTGTTTACGAATTAAATCGAAGTAGAAC GGEGEGEGGGEFGEEGGGEGEDGGFACEEG/GEGEGGFEEFFFGGFGFGGDFEGGGGEEGEGEEFGFE<GGGG)GEGFEE +chr1-45 16 chr1 1210 99 4=1X195= * 0 0 TGTTCCTCCAGCTTCTTCGGCATGGTTTTGTCTAACTTTATCGCTGGTTAGTTTCTTCACGCTTACCGTCTTTCCAGAAATTGTTCCAAGTATCGGCTTGTTTACGAATTAAATCGAAGTAGAACTTCATGTGCCTGTAAAACGAAGCGGTAAAAATTTTTATTTTTTTTCTCACTTCTGTTACTCCAGCTTCTTCGGCA ?EG8(EGGCGECGGGCEGGEFEECEG?*GGE;EECCBGF*?GFFEGEGEF?EGGBFGEFGE1GBEEGCGGGGFGDFGHHIGFDFBHHH=HIEHHHDGHHGH+GIIGHHFHIFGHHHHHIIIHIHFHHCHHIH@+GHDFI-EHIIICHIIHEDEDEFGIDIHIGIIDHDBHHFHIHIHFGGF?GGDB?DDBDD>???EE;BGE.GGHGEAEFG:G>GEEGGEGGGGG,=GGCGE2GFGFGEEGGEEGDFHGEGEHGGHEHHFCHHEGHHEIHIHIDIHHEGHFIH6HHIII@HIHDIGIIFHIIIEIIHIIHIFHE@IIIFIHHFEHI=HFHIHEIIIICFIIHFIHEHIGIIHCHCGGGGGDDDDBDDB>BB??=?? 
+chr1-101 0 chr1 1214 99 159=1X40= * 0 0 ACTCCAGCTTCTTCGGCATGGTTTTGTCTAACTTTATCGCTGGTTAGTTTCTTCACGCTTACCGTCTTTCCAGAAATTGTTCCAAGTATCGGCTTGTTTACGAATTAAATCGAAGTAGAACTTCATGTGCCTGTAAAACGAAGCGGTAAAAATTTTTATCTTTTTTCTCACTTCTGTTACTCCAGCTTCTTCGGCACAAG ?????B>?DED@DDADFCFGGGIHFIEFCHIHFEHHIHIHHCHIIHIEHAIHIHIDHIHHF>,HEG=IIIE5IHIIEIIIIHDHEIIHHDIIEIHGFHCIFFIDHHHIHHHFFHHGHHIFHHEHHGE=;EHEGGEFGEEE2@GEGGGGEG*BGE?GGEG*GGEEFGGEGAGGEEED8CGE?GFGCGFA*DAGGE8E?GG: +chr1-47 16 chr1 1218 99 67=1X132= * 0 0 CAGCTTCTTCGGCATGGTTTTGTCTAACTTTATCGCTGGTTAGTTTCTTCACGCTTACCGTCTTTCCTGAAATTGTTCCAAGTATCGGCTTGTTTACGAATTAAATCGAAGTAGAACTTCATGTGCCTGTAAAACGAAGCGGTAAAAATTTTTATTTTTTTTCTCACTTCTGTTACTCCAGCTTCTTCGGCACAAGTACC G1GACFEGGGE;GFDEGEE0GEEEFEEGGGEFGAGEGGEGGGGEGGGGG;GFGGGGGFEE?EGFEDG2GFHGDHFHEHBDEHG6EGGFF.HHHGHGHGDFGIDFHHIDHHHFHDHI?HHIDGIHIGFFIFCEGHHHIHHHIHHHBFHGGHIHGIGIGAEIIHIIII+HIAIHHHFIIAFG8CFFDBDDBD<@BBB??A?? +chr1-22 16 chr1 1221 99 141=1X58= * 0 0 CTTCTTCGGCATGGTTTTGTCTAACTTTATCGCTGGTTAGTTTCTTCACGCTTACCGTCTTTCCAGAAATTGTTCCAAGTATCGGCTTGTTTACGAATTAAATCGAAGTAGAACTTCATGTGCCTGTAAAACGAAGCGGTAGAAATTTTTATTTTTTTTCTCACTTCTGTTACTCCAGCTTCTTCGGCACAAGTACCAAC GGCCGGE;EGG>GGGGGGEEECGGEGAGGBGF*GGGEEECCGEG;GFGF:FGG?FEGH8ECDGDEFF?EEHEGEFFFF?HDFEGEGFHHHHHHEHFEDDIHH,GIIHHGHHHFHCHIHIIIHFI,HCGHHIFIDIGHIIHH#HHIHIIHHIFHIHIIHHHIIHHHFH7HIII>BIEIHEFG/GGDHEEGIHH3HIHIHFHIH23HHFHGHG@HAEHHFH@EFGEEG@CEFHEG'EGFGCGFG,EGE,FGGGGECCGGEG=GGEFGG?EEEEGGEG8GGGFGCG1CFG@G;E?86E'EAGGGEFECGCE:GGG*E:?GGGG3EG:GCEFFEEE?G:GGGGFGEGHHDFHHG=HHGHBH@FCEHGFHHDHIHIHHHH-GIHIIHGHIHIHIHIIIIDHHIHGIHCH=IGH9FHGHIIFIGIIHIIIHHIGI.FHHHFHIEIIHIHHIHFGGGCGDDDBDDEIFHFIHIHICGGHHCAGHHHIEIF,5HHDHICIHGHIF;HGGIIIIICHHHFHFHHFIEFG=GFGHHF)HHEBGEHGDGEGG4GGEGHFGGAGEGD4EEGFF>EEHHGFHFHDHCHHHFG,FHHGFIHIIHFDHGHHIEHIHIHIFGHIDIHIGIIHDIHIFIHIHHIEHIHIHFHHFHHFHI+IHDIHHIHGHIIFEHIHFFHCGGG;8DBD?DBBDBBB????? 
+chr1-82 0 chr1 1373 99 200= * 0 0 TTTTTTTCTCACTTCTGTTACTCCAGCTTCTTCGGCACAAGTACCAACCAGAACGTGAAAAAGCGTCCTGCGTGTAGCGTTTATGTTGGTTTCATGGTTTTGTCTAACTTTATCGCTTTTACCGTCTTTCCAGAAATTGTTCCAAGTATCGGCTTGTTTACGAATTAAATCGAAGTTACCGTCTTTCCAGAAATTGTTCC A????B?@DDD5DFHIFHEIHIIIIH?FHHGIFIDFHIHIDHFEIHI@ICIHIIFIEGIHIEG?DHFIFHHHGIHDHHEHHEIGIA.,GIHF=HFDFGHHDHHFGFGHHGEFHBGGDGGFGEGGE7GGFGEGEBAGFGGEE(GE@E6E:GGGCGEFG>ACGEG?F+G:GGE=GAEGFE:GCGEEFF +chr1-116 0 chr1 1402 99 200= * 0 0 CTTCGGCACAAGTACCAACCAGAACGTGAAAAAGCGTCCTGCGTGTAGCGTTTATGTTGGTTTCATGGTTTTGTCTAACTTTATCGCTTTTACCGTCTTTCCAGAAATTGTTCCAAGTATCGGCTTGTTTACGAATTAAATCGAAGTTACCGTCTTTCCAGAAATTGTTCCAAGTATCGGCTTGTTTACGAATTAAATCG GGDDHHBGHHDIEHHAIHCHIAH/HHFI)AIHIH>HIHHIHHEEHHIFH=AIH?IHIEIHHHHHIH8>FIIFIIFHIIEHH0EIHIIEIIF8IIHIFFFGGG?DDBDBDABBB????5 +chr1-44 0 chr1 1422 99 105=1X94= * 0 0 AGAACGTGAAAAAGCGTCCTGCGTGTAGCGTTTATGTTGGTTTCATGGTTTTGTCTAACTTTATCGCTTTTACCGTCTTTCCAGAAATTGTTCCAAGTATCGGCTCGTTTACGAATTAAATCGAAGTTACCGTCTTTCCAGAAATTGTTCCAAGTATCGGCTTGTTTACGAATTAAATCGAAGTGGACTGCTGGCGTTAT ??A9?BB?DDADD?DBGAEGGGIHIIIHIHIIIIIHDDHIIHGHIIIG=IIIHIFFIDIIHHHHHEIHGHH5DHHIHG=HFIHIIH@IIIHHH7IHEIEHHHHHB'FHFGEGFHFEEF.HBGFFGFDGFFEGHGEIGGGH>GEEFGGG@GGDE@GGFGGGEGGCG?BEGGEGGGE?F8GGGFG9GGGCFG?GGGGEGAGG diff -r 000000000000 -r b6794f4cb1c6 test-data/input_2.bam Binary file test-data/input_2.bam has changed diff -r 000000000000 -r b6794f4cb1c6 test-data/output_1.psl --- /dev/null Thu Jan 01 00:00:00 1970 +0000 +++ b/test-data/output_1.psl Mon Dec 12 14:42:58 2022 +0000 @@ -0,0 +1,50 @@ +197 6 0 0 0 0 0 0 + chr1-106 200 0 200 chr1 1626 3 203 4 125,8,52,12, 0,126,135,188, 3,129,138,191, +199 2 0 0 0 0 0 0 + chr1-99 200 0 200 chr1 1626 13 213 2 101,98, 0,102, 13,115, +200 0 0 0 0 0 0 0 - chr1-68 200 0 200 chr1 1626 13 213 1 200, 0, 13, +200 0 0 0 0 0 0 0 - chr1-3 200 0 200 chr1 1626 16 216 1 200, 0, 16, +200 0 0 0 0 0 0 0 + chr1-152 200 0 200 chr1 1626 23 223 1 200, 0, 23, +199 2 0 0 0 0 0 0 + chr1-74 200 0 200 chr1 1626 42 242 2 156,43, 0,157, 42,199, +199 2 0 0 0 0 0 0 
+ chr1-160 200 0 200 chr1 1626 47 247 2 183,16, 0,184, 47,231, +199 2 0 0 0 0 0 0 - chr1-117 200 0 200 chr1 1626 63 263 2 24,175, 0,25, 63,88, +199 2 0 0 0 0 0 0 + chr1-37 200 0 200 chr1 1626 69 269 2 176,23, 0,177, 69,246, +200 0 0 0 0 0 0 0 - chr1-121 200 0 200 chr1 1626 78 278 1 200, 0, 78, +200 0 0 0 0 0 0 0 - chr1-89 200 0 200 chr1 1626 108 308 1 200, 0, 108, +200 0 0 0 0 0 0 0 - chr1-14 200 0 200 chr1 1626 110 310 1 200, 0, 110, +200 0 0 0 0 0 0 0 - chr1-61 200 0 200 chr1 1626 117 317 1 200, 0, 117, +199 2 0 0 0 0 0 0 - chr1-85 200 0 200 chr1 1626 124 324 2 6,193, 0,7, 124,131, +199 2 0 0 0 0 0 0 + chr1-148 200 0 200 chr1 1626 134 334 2 41,158, 0,42, 134,176, +200 0 0 0 0 0 0 0 - chr1-102 200 0 200 chr1 1626 135 335 1 200, 0, 135, +200 0 0 0 0 0 0 0 + chr1-29 200 0 200 chr1 1626 136 336 1 200, 0, 136, +199 2 0 0 0 0 0 0 - chr1-92 200 0 200 chr1 1626 142 342 2 65,134, 0,66, 142,208, +199 2 0 0 0 0 0 0 + chr1-139 200 0 200 chr1 1626 148 348 2 117,82, 0,118, 148,266, +198 4 0 0 0 0 0 0 + chr1-84 200 0 200 chr1 1626 163 363 3 57,100,41, 0,58,159, 163,221,322, +200 0 0 0 0 0 0 0 + chr1-125 200 0 200 chr1 1626 169 369 1 200, 0, 169, +199 2 0 0 0 0 0 0 - chr1-11 200 0 200 chr1 1626 198 398 2 112,87, 0,113, 198,311, +198 4 0 0 0 0 0 0 + chr1-53 200 0 200 chr1 1626 210 410 3 134,1,63, 0,135,137, 210,345,347, +200 0 0 0 0 0 0 0 + chr1-105 200 0 200 chr1 1626 225 425 1 200, 0, 225, +199 2 0 0 0 0 0 0 - chr1-127 200 0 200 chr1 1626 244 444 2 97,102, 0,98, 244,342, +199 2 0 0 0 0 0 0 + chr1-147 200 0 200 chr1 1626 269 469 2 64,135, 0,65, 269,334, +200 0 0 0 0 0 0 0 + chr1-83 200 0 200 chr1 1626 270 470 1 200, 0, 270, +199 2 0 0 0 0 0 0 + chr1-36 200 0 200 chr1 1626 271 471 2 123,76, 0,124, 271,395, +200 0 0 0 0 0 0 0 - chr1-55 200 0 200 chr1 1626 273 473 1 200, 0, 273, +200 0 0 0 0 0 0 0 + chr1-136 200 0 200 chr1 1626 279 479 1 200, 0, 279, +200 0 0 0 0 0 0 0 + chr1-64 200 0 200 chr1 1626 280 480 1 200, 0, 280, +200 0 0 0 0 0 0 0 - chr1-130 200 0 200 chr1 1626 288 488 1 
200, 0, 288, +200 0 0 0 0 0 0 0 + chr1-78 200 0 200 chr1 1626 302 502 1 200, 0, 302, +199 2 0 0 0 0 0 0 - chr1-111 200 0 200 chr1 1626 314 514 2 130,69, 0,131, 314,445, +199 2 0 0 0 0 0 0 - chr1-75 200 0 200 chr1 1626 317 517 2 36,163, 0,37, 317,354, +198 4 0 0 0 0 0 0 + chr1-103 200 0 200 chr1 1626 323 523 3 101,48,49, 0,102,151, 323,425,474, +200 0 0 0 0 0 0 0 - chr1-69 200 0 200 chr1 1626 334 534 1 200, 0, 334, +200 0 0 0 0 0 0 0 - chr1-146 200 0 200 chr1 1626 350 550 1 200, 0, 350, +200 0 0 0 0 0 0 0 - chr1-42 200 0 200 chr1 1626 352 552 1 200, 0, 352, +200 0 0 0 0 0 0 0 + chr1-66 200 0 200 chr1 1626 364 564 1 200, 0, 364, +200 0 0 0 0 0 0 0 + chr1-81 200 0 200 chr1 1626 365 565 1 200, 0, 365, +199 2 0 0 0 0 0 0 - chr1-120 200 0 200 chr1 1626 373 573 2 89,110, 0,90, 373,463, +200 0 0 0 0 0 0 0 + chr1-143 200 0 200 chr1 1626 378 578 1 200, 0, 378, +200 0 0 0 0 0 0 0 - chr1-58 200 0 200 chr1 1626 382 582 1 200, 0, 382, +200 0 0 0 0 0 0 0 + chr1-48 200 0 200 chr1 1626 384 584 1 200, 0, 384, +199 2 0 0 0 0 0 0 + chr1-86 200 0 200 chr1 1626 385 585 2 162,37, 0,163, 385,548, +199 2 0 0 0 0 0 0 - chr1-34 200 0 200 chr1 1626 391 591 2 49,150, 0,50, 391,441, +199 2 0 0 0 0 0 0 + chr1-15 200 0 199 chr1 1626 394 593 1 199, 0, 394, +199 2 0 0 0 0 0 0 + chr1-8 200 0 200 chr1 1626 395 595 2 99,100, 0,100, 395,495, +199 2 0 0 0 0 0 0 - chr1-140 200 0 200 chr1 1626 398 598 2 96,103, 0,97, 398,495, diff -r 000000000000 -r b6794f4cb1c6 test-data/output_2.psl --- /dev/null Thu Jan 01 00:00:00 1970 +0000 +++ b/test-data/output_2.psl Mon Dec 12 14:42:58 2022 +0000 @@ -0,0 +1,50 @@ +180 0 0 0 0 0 0 0 + M01368:8:000000000-A3GHV:1:1101:6911:8255 251 71 251 gi|251831106|ref|NC_012920.1| 16569 0 180 1 180, 71, 0, +241 0 0 0 0 0 0 0 + M01368:8:000000000-A3GHV:1:1101:14518:9998 251 10 251 gi|251831106|ref|NC_012920.1| 16569 0 241 1 241, 10, 0, +171 0 0 0 0 0 0 0 + M01368:8:000000000-A3GHV:1:1101:18422:19051 251 80 251 gi|251831106|ref|NC_012920.1| 16569 0 171 1 171, 80, 0, +138 0 0 0 0 0 
0 0 + M01368:8:000000000-A3GHV:1:1101:25545:21098 251 113 251 gi|251831106|ref|NC_012920.1| 16569 0 138 1 138, 113, 0, +173 0 0 0 0 0 0 0 + M01368:8:000000000-A3GHV:1:1101:5446:12248 251 78 251 gi|251831106|ref|NC_012920.1| 16569 0 173 1 173, 78, 0, +171 0 0 0 0 0 0 0 + M01368:8:000000000-A3GHV:1:1101:5861:6452 251 80 251 gi|251831106|ref|NC_012920.1| 16569 0 171 1 171, 80, 0, +130 0 0 0 0 0 0 0 + M01368:8:000000000-A3GHV:1:1102:10403:6021 251 121 251 gi|251831106|ref|NC_012920.1| 16569 0 130 1 130, 121, 0, +213 0 0 0 0 0 0 0 + M01368:8:000000000-A3GHV:1:1102:10677:23253 251 22 235 gi|251831106|ref|NC_012920.1| 16569 0 213 1 213, 22, 0, +179 0 0 0 0 0 0 0 + M01368:8:000000000-A3GHV:1:1102:13809:1733 251 50 229 gi|251831106|ref|NC_012920.1| 16569 0 179 1 179, 50, 0, +138 0 0 0 0 0 0 0 + M01368:8:000000000-A3GHV:1:1102:17584:10050 251 52 190 gi|251831106|ref|NC_012920.1| 16569 0 138 1 138, 52, 0, +146 0 0 0 0 0 0 0 + M01368:8:000000000-A3GHV:1:1102:18842:24844 251 105 251 gi|251831106|ref|NC_012920.1| 16569 0 146 1 146, 105, 0, +213 0 0 0 0 0 0 0 + M01368:8:000000000-A3GHV:1:1102:21788:11027 251 35 248 gi|251831106|ref|NC_012920.1| 16569 0 213 1 213, 35, 0, +146 0 0 0 0 0 0 0 + M01368:8:000000000-A3GHV:1:1102:5728:8777 251 105 251 gi|251831106|ref|NC_012920.1| 16569 0 146 1 146, 105, 0, +171 0 0 0 0 0 0 0 + M01368:8:000000000-A3GHV:1:1102:5983:21093 251 80 251 gi|251831106|ref|NC_012920.1| 16569 0 171 1 171, 80, 0, +132 0 0 0 0 0 0 0 + M01368:8:000000000-A3GHV:1:1102:7765:18353 251 119 251 gi|251831106|ref|NC_012920.1| 16569 0 132 1 132, 119, 0, +171 0 0 0 0 0 0 0 + M01368:8:000000000-A3GHV:1:1103:10405:17879 251 80 251 gi|251831106|ref|NC_012920.1| 16569 0 171 1 171, 80, 0, +155 0 0 0 0 0 0 0 + M01368:8:000000000-A3GHV:1:1103:13493:8205 251 96 251 gi|251831106|ref|NC_012920.1| 16569 0 155 1 155, 96, 0, +156 0 0 0 0 0 0 0 + M01368:8:000000000-A3GHV:1:1103:14060:21273 251 80 236 gi|251831106|ref|NC_012920.1| 16569 0 156 1 156, 80, 0, +138 0 0 0 0 0 0 0 + 
M01368:8:000000000-A3GHV:1:1103:14528:12993 251 113 251 gi|251831106|ref|NC_012920.1| 16569 0 138 1 138, 113, 0, +161 0 0 0 0 0 0 0 + M01368:8:000000000-A3GHV:1:1103:17657:20856 251 90 251 gi|251831106|ref|NC_012920.1| 16569 0 161 1 161, 90, 0, +134 0 0 0 0 0 0 0 + M01368:8:000000000-A3GHV:1:1103:23099:3794 251 59 193 gi|251831106|ref|NC_012920.1| 16569 0 134 1 134, 59, 0, +120 0 0 0 0 0 0 0 + M01368:8:000000000-A3GHV:1:1103:25465:20010 251 45 165 gi|251831106|ref|NC_012920.1| 16569 0 120 1 120, 45, 0, +184 0 0 0 0 0 0 0 + M01368:8:000000000-A3GHV:1:1103:25519:6301 251 18 202 gi|251831106|ref|NC_012920.1| 16569 0 184 1 184, 18, 0, +143 0 0 0 0 0 0 0 + M01368:8:000000000-A3GHV:1:1103:6074:6549 251 108 251 gi|251831106|ref|NC_012920.1| 16569 0 143 1 143, 108, 0, +171 0 0 0 0 0 0 0 + M01368:8:000000000-A3GHV:1:1104:11572:8264 251 80 251 gi|251831106|ref|NC_012920.1| 16569 0 171 1 171, 80, 0, +127 0 0 0 0 0 0 0 + M01368:8:000000000-A3GHV:1:1104:11928:24197 251 124 251 gi|251831106|ref|NC_012920.1| 16569 0 127 1 127, 124, 0, +146 0 0 0 0 0 0 0 + M01368:8:000000000-A3GHV:1:1104:12288:20635 251 105 251 gi|251831106|ref|NC_012920.1| 16569 0 146 1 146, 105, 0, +132 0 0 0 0 0 0 0 + M01368:8:000000000-A3GHV:1:1104:13832:4398 251 7 139 gi|251831106|ref|NC_012920.1| 16569 0 132 1 132, 7, 0, +176 0 0 0 0 0 0 0 + M01368:8:000000000-A3GHV:1:1104:23670:4161 251 75 251 gi|251831106|ref|NC_012920.1| 16569 0 176 1 176, 75, 0, +157 0 0 0 0 0 0 0 + M01368:8:000000000-A3GHV:1:1104:24927:22253 251 94 251 gi|251831106|ref|NC_012920.1| 16569 0 157 1 157, 94, 0, +187 0 0 0 0 0 0 0 + M01368:8:000000000-A3GHV:1:1104:4705:7727 251 64 251 gi|251831106|ref|NC_012920.1| 16569 0 187 1 187, 64, 0, +137 0 0 0 0 0 0 0 + M01368:8:000000000-A3GHV:1:1104:7756:4776 251 114 251 gi|251831106|ref|NC_012920.1| 16569 0 137 1 137, 114, 0, +144 0 0 0 0 0 0 0 + M01368:8:000000000-A3GHV:1:1105:11310:21761 251 104 248 gi|251831106|ref|NC_012920.1| 16569 0 144 1 144, 104, 0, +131 0 0 0 0 0 0 0 + 
M01368:8:000000000-A3GHV:1:1105:11578:14676 251 120 251 gi|251831106|ref|NC_012920.1| 16569 0 131 1 131, 120, 0, +184 0 0 0 0 0 0 0 + M01368:8:000000000-A3GHV:1:1105:13575:19255 251 67 251 gi|251831106|ref|NC_012920.1| 16569 0 184 1 184, 67, 0, +231 0 0 0 0 0 0 0 + M01368:8:000000000-A3GHV:1:1105:15502:11453 251 0 231 gi|251831106|ref|NC_012920.1| 16569 0 231 1 231, 0, 0, +187 0 0 0 0 0 0 0 + M01368:8:000000000-A3GHV:1:1105:16787:9771 251 64 251 gi|251831106|ref|NC_012920.1| 16569 0 187 1 187, 64, 0, +173 0 0 0 0 0 0 0 + M01368:8:000000000-A3GHV:1:1105:17564:15723 251 78 251 gi|251831106|ref|NC_012920.1| 16569 0 173 1 173, 78, 0, +156 0 0 0 0 0 0 0 + M01368:8:000000000-A3GHV:1:1105:18108:12091 251 80 236 gi|251831106|ref|NC_012920.1| 16569 0 156 1 156, 80, 0, +181 0 0 0 0 0 0 0 + M01368:8:000000000-A3GHV:1:1105:18331:16683 251 70 251 gi|251831106|ref|NC_012920.1| 16569 0 181 1 181, 70, 0, +151 0 0 0 0 0 0 0 + M01368:8:000000000-A3GHV:1:1105:20577:18421 251 100 251 gi|251831106|ref|NC_012920.1| 16569 0 151 1 151, 100, 0, +156 0 0 0 0 0 0 0 + M01368:8:000000000-A3GHV:1:1105:21099:2895 251 95 251 gi|251831106|ref|NC_012920.1| 16569 0 156 1 156, 95, 0, +152 0 0 0 0 0 0 0 + M01368:8:000000000-A3GHV:1:1105:26469:19245 251 99 251 gi|251831106|ref|NC_012920.1| 16569 0 152 1 152, 99, 0, +206 0 0 0 0 0 0 0 + M01368:8:000000000-A3GHV:1:1105:7169:17145 251 45 251 gi|251831106|ref|NC_012920.1| 16569 0 206 1 206, 45, 0, +161 0 0 0 0 0 0 0 + M01368:8:000000000-A3GHV:1:1106:15481:16176 251 90 251 gi|251831106|ref|NC_012920.1| 16569 0 161 1 161, 90, 0, +140 0 0 0 0 0 0 0 + M01368:8:000000000-A3GHV:1:1106:17389:18671 251 111 251 gi|251831106|ref|NC_012920.1| 16569 0 140 1 140, 111, 0, +130 0 0 0 0 0 0 0 + M01368:8:000000000-A3GHV:1:1106:22927:3863 251 80 210 gi|251831106|ref|NC_012920.1| 16569 0 130 1 130, 80, 0, +156 0 0 0 0 0 0 0 + M01368:8:000000000-A3GHV:1:1106:23625:4236 251 95 251 gi|251831106|ref|NC_012920.1| 16569 0 156 1 156, 95, 0, +184 0 0 0 0 0 0 0 + 
M01368:8:000000000-A3GHV:1:1106:26031:14826 251 0 184 gi|251831106|ref|NC_012920.1| 16569 0 184 1 184, 0, 0, +132 0 0 0 0 0 0 0 + M01368:8:000000000-A3GHV:1:1106:27607:15990 251 24 156 gi|251831106|ref|NC_012920.1| 16569 0 132 1 132, 24, 0,