# HG changeset patch # User iuc # Date 1765443217 0 # Node ID faec698e3f98c1abca445dde1df5c85831e4f364 planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/main/tools/detect_circular_sequences commit 7ea9f729b44c6351c52b6295c780f496d239488e diff -r 000000000000 -r faec698e3f98 detect_circular_sequences.py --- /dev/null Thu Jan 01 00:00:00 1970 +0000 +++ b/detect_circular_sequences.py Thu Dec 11 08:53:37 2025 +0000 @@ -0,0 +1,248 @@ +#!/usr/bin/env python3 + +######################################################################################### +# This script detect circular contigs by looking for exact identical k-mer at the two +# ends of the sequences provided in fasta file. In order to be able to predict genes +# spanning the origin of circular contigs, the first 1,000 nucleotides of each circular +# contigs are duplicated and added at the contig's end. +# +# Inspired by Simon Roux work for Metavir2 (2014) and Corentin Hochart work in PlasSuite +# +######################################################################################### + +import argparse +import logging +from pathlib import Path + +from Bio import SeqIO + +log_levels = { + 0: logging.CRITICAL, + 1: logging.ERROR, + 2: logging.WARN, + 3: logging.INFO, + 4: logging.DEBUG, +} +logging.basicConfig(level=log_levels[3]) +logger = logging.getLogger() + + +def setup_logger(verbosity: int) -> None: + """ + Configure the logger based on verbosity level. + + :param verbosity: verbosity level + """ + logging.basicConfig( + format="%(asctime)s - %(levelname)s - %(message)s", + level=log_levels.get(verbosity, logging.INFO), + ) + + +def find_occurrences(s, substring) -> list: + """ + Find all starting positions of a substring in a string + + :param s: String to be searched + :param substring: Substring to search in s + """ + return [i for i in range(len(s)) if s.startswith(substring, i)] + + +def is_circular(sequence, length, pos) -> bool: + """ + Determines if a sequence is circular by comparing segments starting at `start_pos`. + + A sequence is considered circular if the `length` elements at the beginning of the sequence match the `length` + elements starting at `start_pos` in the sequence. This is useful for detecting repeating patterns or cycles + in sequences. + + :param sequence: The input sequence + :param length: The number of elements to compare for circularity. + :param pos: The starting index in the sequence to begin the comparison. + + :return bool: True if circular, False otherwise + """ + for i in range(length): + if sequence[i] != sequence[pos + i]: + return False + return True + + +def check_circularity(seq_record, subseq_length=10) -> int: + """ + Process a single sequence to detect circularity and return the overlap length if circular. + + :param seq_record: SeqRecord object + :param subseq_length: Length of 3' fragment to check on the 5' end + + :return: overlap length if circular, 0 otherwise + """ + seq_len = len(seq_record) + + if seq_len < subseq_length: + logging.error(f"Sequence too short ({seq_len}bp): {seq_record.id}") + return 0 + + begin = "".join(seq_record[:subseq_length]) + end = "".join(seq_record[subseq_length:]) + positions = [x + subseq_length for x in find_occurrences(end, begin)] + + for pos in positions: + overlap_length = seq_len - pos + if is_circular(seq_record, overlap_length, pos): + return overlap_length + return 0 + + +def extend_sequence( + seq_record, + overlap_length, + duplication_length=1000, +): + """ + Extends the 5' end of a sequence by duplicating a fragment from the 3' end. + + This function is useful for simulating circular sequences by extending the 5' end + with a fragment from the 3' end, based on the specified `overlap_length` and `duplication_length`. + + :param seq_record: The input sequence record to be extended. + :param overlap_length: The length of the overlapping segment that was previously identified as circular. + :param duplication_length: The length of the 3' end fragment to duplicate and add to the 5' end. + + :return: The modified sequence record with the extended 5' end. + """ + # Remove the overlapping segment from the 3' end + modified_seq = seq_record.seq[: len(seq_record.seq) - overlap_length] + # Duplicate the first `duplication_length` nucleotides from the original sequence + # and append them to the 5' end of the modified sequence + if len(modified_seq) < duplication_length: + # If the modified sequence is shorter than `duplication_length`, + # duplicate the entire modified sequence + extension = modified_seq + else: + # Otherwise, duplicate the first `duplication_length` nucleotides + extension = seq_record.seq[:duplication_length] + # Combine the modified sequence with the duplicated fragment + extended_seq = modified_seq + extension + # Update the sequence in the SeqRecord object + seq_record.seq = extended_seq + return seq_record + + +def detect_circular( + fasta_in, + fasta_out, + id_out, + subseq_length=10, + duplication_length=1000, +): + """ + Detect and process circular sequences in a FASTA file. + + This function reads sequences from `fasta_in`, checks for circularity, + extends circular sequences, and writes the results to `fasta_out` and `id_out`. + + :param fasta_in: Path to the input FASTA file. + :param fasta_out: Path to the output FASTA file for extended circular sequences. + :param id_out: Path to the output file for recording IDs of circular sequences. + :param subseq_length: Length of the 3' fragment to check for circularity. + :param duplication_length: Length of the 3' fragment to duplicate and add to the 5' end. + """ + records = [] + ids = [] + try: + with fasta_in.open("r") as fasta_in_f: + for seq_record in SeqIO.parse(fasta_in_f, "fasta"): + overlap_length = check_circularity( + seq_record, + subseq_length=subseq_length, + ) + if overlap_length > 0: + records.append( + extend_sequence( + seq_record, + overlap_length, + duplication_length, + ) + ) + ids.append(seq_record.id) + except Exception as e: + logging.error(f"Error processing {fasta_in}: {e}") + raise + + if not records: + logging.warning("Warning: No circular sequences found.") + + try: + with fasta_out.open("w") as fasta_out_f: + SeqIO.write(records, fasta_out_f, "fasta") + with id_out.open("w") as id_out_f: + id_out_f.write("\n".join(ids) + "\n") + except IOError as e: + logging.error(f"Error writing output files: {e}") + raise + + +def main(): + """ + Main function to detect circular contigs in a FASTA file. + + This function parses command-line arguments, launches function to read the input + FASTA file, process each sequence to detect circular contigs, and generate the + output files. + """ + parser = argparse.ArgumentParser( + description=""" + Detect circular contigs by looking for exact identical subsequences at the two + ends of the sequences provided in a FASTA file and output the circular contigs + extended on 5' end by duplication of the first nucleotides on 3' end to be able + to predict genes spanning the origin of circular contigs. + """ + ) + parser.add_argument("--fasta-in", required=True, help="Input FASTA file") + parser.add_argument( + "--subseq-length", + type=int, + default=10, + help="Length of 3' fragment to check on the 5' end (default: 10)", + ) + parser.add_argument( + "--duplication-length", + type=int, + default=1000, + help="Length of the 3' end fragment to duplicate and add on the 5' end (default: 1000)", + ) + parser.add_argument( + "-v", + "--verbose", + type=int, + default=3, + choices=log_levels.keys(), + help="Verbosity level (0=CRITICAL, 1=ERROR, 2=WARN, 3=INFO, 4=DEBUG)", + ) + parser.add_argument( + "--fasta-out", + required=True, + help="Output FASTA file with extended circular contigs", + ) + parser.add_argument( + "--id-out", required=True, help="Output TXT file with circular sequence IDs" + ) + + args = parser.parse_args() + setup_logger(args.verbose) + + logging.info("Starting script execution.") + detect_circular( + Path(args.fasta_in), + Path(args.fasta_out), + Path(args.id_out), + subseq_length=args.subseq_length, + duplication_length=args.duplication_length, + ) + logging.info("Script execution completed.") + + +if __name__ == "__main__": + main() diff -r 000000000000 -r faec698e3f98 detect_circular_sequences.xml --- /dev/null Thu Jan 01 00:00:00 1970 +0000 +++ b/detect_circular_sequences.xml Thu Dec 11 08:53:37 2025 +0000 @@ -0,0 +1,65 @@ + + (e.g. circular contigs) in a FASTA file + + 1.0 + 0 + 24.0 + + + python + biopython + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + \ No newline at end of file diff -r 000000000000 -r faec698e3f98 test-data/input.fasta --- /dev/null Thu Jan 01 00:00:00 1970 +0000 +++ b/test-data/input.fasta Thu Dec 11 08:53:37 2025 +0000 @@ -0,0 +1,359 @@ +>SRR17300492_25544 +ACACCATATATCTCATTTTGTCTGTTGAGAGCGTCGCTCGATACTACGAAGTAGATATCT +CACTCCGCTGGGTTTTGTGTTTTCTTTTGTTTTCGATTTCGCGACTTGCCTGACAGCAAG +CCTCTCATCTGGAGCCCACCGCGAGGGGTGGTACAGACTTTATATCTCTTAAATTCCTTA +AATTCCATTTAACAAACTCGAGCCTTATTACCACCTAGTTACGCGTCGCGAGGCTTTGTT +CGAAGCTGCACAAGTAACTTAATAAGCTTGACATAAATCACAACGGCGCCTCGAAAGAAA +GCGTCGAAAGTAGTTAAAGACAAGCCCGAAGAATTAGAAGTTGAGGAGGAAACTACTCAA +CCAAAACCCACCAAAGGCCCAGTACGAAAAGCAGCTCCAGCTAAAGGCGCTAAAACAGTC +GCGATCCCAGTTCCTGTCTTAGCACCTAAAACTCGAGCATCGCAAAGGGCAACAACTAGT +AAAACAGTAGTTGAGGCAGACGCAACACCCGAAGCAGTCGGGAAGCCTGGCAAAAGATTC +GTTGTACCTGCTCGATTACCAGGACCATATTCTAAATTCTTAACTGAGCCATCAGTTGTA +AACCCAGTTGGTGAACCCAGGACAGTACCGACCGGATTATTTGAGGGATATCAGAGACCA +GACCGATCATACGAGCAGTCGCGACAGACACTTCCAAAAGCCCCGGAAGACTTTGCTGAA +ACATCTTTTACGGAAGATCTTCACGATAGTCCGGAGAGTGACAAGGTTGAGTTTGAAGTT +GCTGTGAATATATTACAAGGCTTGGGAGACGAGAATCCTTACCAGAGACCGATCGCGATC +CATCCTACACCACTTGCAGCCAAGCTCAAAGCCCCATTTGAAACAGATAGCCCTTTAACA +CCTTTGCCGAGTGATTACCAGTCTCCAGAAGCGAATTACGCTAAAAGCCAGACAGCTCGC +GATCCAACTGAACCGGATCTAGAGCCGTGGGGTCAACCGCGCGCTAGTTATACTTTCGGA +GAAAGTTCCGCAGCAGGTTTACAAGAGCCACCTGCATATTCTTGGGGAGAAGCATCAGAA +CAACAAAGGGAGAGAGAAGAGAGAATCCAGCGTTATCTTCAGTCACAAATTATTGAACCA +CAAGAGCCTTCGGTTAAAGAAGAAGTTAGATCGGATATCTCGTATCTTACCCAACAAGAA +TATCCACCGCTACCAAGTTCACCTAGACCAGACTTAAGAGGCTCTAGAAGATCTAGATCA +CGATCCAGCACACACCAAAGCAGTAACCACGAAACTAGACACTCGCGATCCGAAATGAGT +GACCATGGAGGAGATGCCGGAGGAGTACGGCGCCAGTACAAACCTATGCCGGCCAGGAGA +TCGAAGGATGCACCTGAATTCGATGAGACTGAGCCAGAGAGTTTGATGCGATATTTCGAG +GATCTAGAGGCGTGTTTCGAGAACGCAGGATTGACAAATGACACAGAGAAAAAGAAATAT +GTAGGAAGATATGTAAAAGCTCGACTAGAGTCGGAGTGGAGCACGCTGAGTGGAGCTGAG +GATGGAAATTCCTACCAGGATTATAAAGCGCAAATTATGGGGGATTATTACGCTGTAGGA +AGCCTGAAACGAGGCTCGATCAAGCGTCTTACTCAGATTTGCAAAGAGCATCAGCGTATT +AGTGCGAACGATATAGACGATCTGTTAACCCTGAAACGACAATTCAGCGCGGAGGCTAAG +AAATTAATGGAGCCGCCGGCTCTATTGGCTAACCATACGCTGGTAGAAAATTTCATGGGA +TGTCTGACTCGCGACTTCCGCGAGAAAGTCTATCAGCAGTTAGAGTCGAACGCGCGCACC +GATATCAGAATAAAGAAAGCTATCACAGCTAATGCGCCAGCTGGTTTGGTACCACCGGCA +CCAGTACCTGCGAGACCCACTCGTCACAGGCCGGAAGATCGTTTCGAGTTAGACGAAGTG +ATCGCGATGGCTGAGGAAATTGCTCGCGAGCAAAATCCAGGTGTCGCGGCGGTATCTTTA +AATTCGCGAACAGGAGGAGCGGCTGCAGCCCCACCAATGGTTGTCAAGACGGAGAGCTTT +AAGCTGGAACCCTTGACCCAGCAATTAGAAGAGCTCAGGGCTGAACTCGCCATGAGTCGC +GATCGTGAGGTGGAGCGTCAGAAGCGCTTTGTCGAAGAAGTAAGGGCTGCCATGCAGCAA +GGGATGCATAATGCGCCGGCGCCACTGCCTGCGCAGCCTAAATTGTATGAGCCTCGCGCT +CCAAATCCCAGCTATGCACGCCCTGAGTACCCTACCACGATGAAGTGTTTCTATTGCGGT +TTACAAGGACACACGTTCAATAGATGTCCCGCGAAAGAAGCGCATATTCAGCTGGGGAAA +ATCATCGACAAAGGATCGCGAGTGCATCTCCCGGATCATACCTACTTAGGTGTCGATCCG +AATAGAACTATTCTATCGCGAGTGGAGGAATACCACGCGCAGAAAAAGCTGGACAGTAAT +TATTTAAATTATGGAGGCCAAAGCGTGCTTCAGCTAGCGCAGATACAGCAGCAGGTCGGG +CCTAACTCAGTCTTTACCAATAAGGCTAAAGATACCAGGGACGATCTGATCTCTGCGCTG +CAAAAGGAAAACGCTTCGCTTAAGGTGTTGATGAATGGACACTCTGAGGTCTTGCCGACG +ATGGCAGCGTCAAGCTCGTCGTCGGATCTAGATCTAGTACCTAGACGCCTACCGGACCCT +GAGGAATACGGGGACCGGTACCACGACGCACTGCGCAAAGAGCGCGAGGAGTTGATGAGT +CTTATTAGTCAACTGGACTATTCGCAGCCGGAAGCGGCGGGTTTCACCAGTACCTGAGGA +AGGCAGTGCTGGCAAACGCGCGCAAGACGCTGGCGCGATCTGCCAAAACTCCGGAGGGTG +CATCAGCAAAATCGAAAGCAGTGCCTAATAAAAATATTAAATCTATTCTGAAAGAGAAAC +AGCCAGTAGAGGAAGAGCCAGAAGAAAGTGATGATGAAGAAAATGAGGTAGCGGAGAAGG +AAATACCCATACAAAAGGATCGCGATCCGGCTGTAAAGCAGGTACCTACTACAGCAGTAC +CCCGTTCTATGCAGAAACATGTAGAGTTCGAAGTCTTACCAGAGGGAGGGTTACCAATGA +GAGCTAAGCCCACAAAGTCGGGGATGATACCGTTCGTGGACATCCCGCCAATGAATCCAG +CCTTGCGGCAAAAGAAACCTGTCGCGATCGAAGCAGAACCCTTACCCACTATTGATAAGA +AAGGACCAGCGTACAAACATCGTGCTCCAATTGAGGACGACGCTAACTGGTCTGGTTTCA +TAAAAACGTTGCGCGATCTGCCTGTAACGATCTCTCAAGGGCAATTAATGGGATTAATTA +ATGCTCAGAGCCGTAAACGGGTAATTGAAGAATTAACTGCTAAGCGAATGCCTGTAAATG +AGGATAAGCCAGTTAAACGCGGCGTGACTATGGTGGAAGAAGTGGAGGGCATGCTAGACG +ACGACGGAAATGCGTATGAGCAGTTAGTATTTACTGAGCTGCCAGAACCGACCTATACAA +TCCTTGGGCAGGATGAGGGTGAGTTAAAAGCGGGGTCAATCATCGCGAGCGATCCAGTAA +CTCAATATCTCAACGGACTCGCTCCTGAGGAGGCGGCTAGGAAAATTATGGTTGCTCGTG +AATCTTATTTACTAAAAACGCTATATCCATTAGTAAACGCACAAGCAGAGGTGGAGTCGA +TTATAGACGGGGGATCACAAATCATATCGATGTCATCAGATGTCGCGATCCAAGTAGGAG +CGACCTGGGACCCAGATGTCACGATCCAAATGCAGAGCGCCAATAAACAGCTTGAAAAGA +CACAAGGGCTAGTAAGAAACATGCCGTTCAAATTCGGTGATGAAATTACTGTCTACTTTC +AAGTACATGTAATGCAGAATGCGGCGTACGACGTGCTACTCGGGCGACCGTTCGAGGTAC +TCACGGCGTCGGTATTCGAAAACGCTCTAGATGGATCACAAATGGTGACGTTGACGGAAC +CGAATTCAGGGAAGCGTTGTAAAATGCCAACTTACGACAGAGGGAAACCACGTAAAGTAA +TCAGCCGTAAGCACCCTGAGACGGTAGAGTCTTTTTAAACCTCGATGAGCTGGTTATAGA +TCAGGGAGAAGTTGCATTTATTATTGGGTCGGACGGCAATGAAGGCTATGTGATCGAAGG +CTATCAATTTCCTCAGGAAGGCCAGAAGTTCACTCAGCACGCACTTAGAAATGCGTACTT +AGAGAGAGCTATCCTGGAAGACGGACATGAGGATGCAGAACGAGAGAAAATAATTAAATA +TTTAGTAGATACACGAAAAACAAAGCCAGTAGAAGGATCGCGATCCAATCGTGGCACGTT +TGGAAGCATCGCGAGCCAATTCCATATGGCAGAATGTGTCGAGAAAGCCCCAAAACAAGT +ATTTGCTGCGACAAAGAAGTACAAGAAGGTGGCAGATAAAATACGGCCCGTATATCAAGA +ATTACCCGACAAATATCGGATCGTGCGCGACATTAAAGGGGATCCATTGAAAAACATGCC +TATGCTATCTAAGCAGCCGCCAGAATTCGTACCCACTGGCCGATACTCTCGCGAGCGCAA +GGAGCAAATGGACATAGTCCATGGCGGAGATTTTCTATGGGAAGAAGAGCGAAAGCTCGT +GCATCAGTTAATCATGCAGCAAAATGAGGCGTTTGCGTGGGACGACACAGAGAAGGGAAG +CTTCAAGTCTGAATTCTTCCCGCCTGTCGAGATCCCCGCGATCGAACATGTGCCCTGGGT +ATTAAAGAATATTCCTATCCCACCGGGTATGCACACCGAGATTTGCGATTTTATTCGGCG +CAAAGTAGAAGCAGGGACCTATGAGCCGTCTAGCTCGTCCTATAGGACGAGGTGGTTTAT +AGTGATGAAAAAGGACGGCAAGACATTTAGGATCGTGCACAGTCTAGAGCCTTTAAATGC +TGTCACGATCGCTCATTCTGGCTTACCGCCGGCTATGGAATCGTTAGCAGAACATTTCGC +AGGACGCGCGTGCGGCGGAATACTGGATTTATACGTTGGGTATGACGAGCGACTACTTGC +AGAAGTGTCGCGAGACATGACGACGTTCCAGACTCCGTTCGGCGCGCTCAGACTCGTCAC +GCTCCCTATGGGATGGACCAATTCGGTGCCAATCTTTCACGAGGATGTTACATATATTCT +TAGGGAAGAAATACCCGAATTTACGGAGCCATACATAGACGATGTACCTATCAGAGGGCC +TAAAACACGCTATGAACTGCCTGATGGTGGCTACGAAGTTATTCCAGAAAATCCAGGAAT +ACGAAGGTTCGTGTGGGAGCATATGGTTAACGTAAACCGGATCGTGCAGCGAATGAAATA +TAGCGGAGGCACGTTTTCAGGTTACAAATCACTATTATGCGCTGCCGAAATCGTTGTCGT +AGGGCATTTATGTACCTTTGAAGGAAGGAAGCCTATGCCGGATAAAGTGCATGTTATTCA +GAATTGGGGATCGTGCAAGAATATTAGTGATGTACGAGCGTTTATGGGAACTATGGGATT +ATTGCGGATATACATATCTGATTATGCGTCGCGAGCCCATCATATCCAGAAACTGCTGCG +TAACAACACGCCGTTCGAGTGGGGACCTGATCAAGAGGAAAGCATGCGCCTGCTGAAAGA +AGGCGTAACGGATGCACATTGTATAACGCCACTAGATTACACGATGTCAGGTAAAATAAT +ACTGTCCGTGGATACATCGTGGCGAGCCGTGGGATTCTATATCCGACAAGAGGATGAGAA +TGATAAGAAGAAAAAGAGATATGCGCGCTTTGGTTCGATATTATTGGGGGATCGCGAGCA +AAGGTTCTCGCAGCCAAAACGCGAGCTGTACGGCTTACTTCGCGCCTTGACAGCGTGCTA +TTATTGGCTCATTGGAGCACGGAACCTAGTGATCGAGACGGATGCTAAATATATTAAAGG +CATGCTCGAAAATCCAGGCATGGGTCCGAACGCCACTATAAATAGATGGATCGATCAGAT +ATTGATGTTCCATTTTGAGCTCAGGCACGTTGCGGGGAAGACATTTGGTCCAGATGGACT +GTCGCGACGCGAATGGCAGCCCGGGGATGAGGAATACGAGAACCCGGAACAGCAAGTGGA +GGATGGATTAGGATCGCTCACCTATGTAAAGAAATTTAAGAGTGATCCAGATCCTTTAGA +GTTTGAAGAGTTTAAAGAGACTATAGATACGCGTGGAGGTTATCAACAGGAGGTGGCGCC +CCAGTTCATACTGGAGGAAACTACAGACCTAGCTGTGTCAGTGGAATGTTTTCAGAAGGA +GTTAGACGCCGCGAGGCATCAAAACAAGTTGGAGCGAGAGATCGCGATCCAATACATCAG +CGCGGGAAGCGGCTCACCAGAGCAGCGCGACTTCTTGCAGCAGTTTATGCTCTCGCCAGA +ACTGCCCAGCGATAAGATAACGGAGAGCTCGGACGAAGCCGAGTACGATGAAAGGAACCG +GACGCCGGCGGGGACGGAACTAGATAATAAAATTCCGTTGATCAAGCAATGGTTAAAAGA +CCCGACCTCGAGGCCTGCTGGGATGTCCACCAAGGAGTATTTTAATTTCGCAAGGAGCGC +GAGAAATTTCTTTGTAGATAAGAAGGGAAGATTATACCGACGCTCTATAGATGAGGCGCA +CAAATTATTTGTAGAAAAGAAAGACCGTACGCGATTAATGCAGAGCGCTCACGATAGTCT +GGGACACAGAGGATCATACGCTACACGCACTATGCTGCAGGAGCGTTTCTGGTGGCCAGA +ATTGGATCGCGACGTGCATTGGTATGTTAAAACGTGCCATTTATGCCAAGAGCGTCAGAA +GACTATGATAAGGATACCTAGGACGGAGACTCACACGCCGTCAATCTTCCAGCAATTGCA +CGTAGACACTATGCACATGACGCCGCAGTCGCATGGGTGTGGGTACATTGTGCATGGAAG +GTGCGGGTTAACTTCGTATCCGGAAGGACGGCCGCTCCGCAAAGAAAATGCAGAATCGAT +CGCGAACTGGCTGTTCGAGGACATAATCTGTCGGTGGGGAAGTCTTAGGGAAATTATCAC +AGATAATGGCGGGCCATTTGTAAAGGCGTTAGCGCATTTGAAGCAGAGGTGGGGCATAGA +TTGGATCACGATCTCTGCGTACAACTCTAGAGCGAACGGAAAGATCGAGAGACCGCACTG +GGATATTAGACAAATGTTATTCAAGGCTTGCGGAGGCGAAGAATTCGCAAGTAAATGGTA +TAAATATTTTTACCATGTGCTTTGGGCGGATCGCGTGTCAATTAGGAAAGGTTTCGGGGC +CTCGCCCTTCTTTCTCGTGACAGGAGCGCACCCTGTATTGCCTATGGACATCATAGAAGC +CACTTGGCTTGTCGAATTACCGGACCGTGTGCTCACGACCGAAGAACTCATTGGATTCAG +AGCGCGAGCGCTCGCAAAGCATAAAGAACACATCGACGAAATGCGCGAGCGCGTATCTAA +ACAAAAGCGCGATGCACTGTTAAAATTCGAGGAGAAACATGTACATAAAATTAAAGATTA +CAAATTTAAAAGCGGAGACTTAGTGCTGGTACGAAATTCGCCGGTAGAAATGTCCTTGAA +CAGAAAAATGAGACGTCGTTGGGAAGGTCCATTTATTGTTATTACAAGGAAAGCTGGCGG +TGCGTATATACTAGCAGACATGAGCGGAAAAGTGTATAAAGATAAAATTGCGGCGTTCAG +AGTAATCCCTTACTTTGCGCGGCGTCATATTCAAGTGCCCGAAAATATTACAGAGATTTT +AGACCAAAATAAAGAGGATCTAGATGCGTTAGCCAACGCTCCAGACAATGAGGAAGCGGA +CAAATTAGAACGTTTAGTTTATAACGAAAACGATCGCGATCCGCAGATTATTGACTGGGA +CGATGATGAGGAACGCTGGTGGGACGATGATATATGGCCTTAGGCCCAACAGGTTTATTC +AATATACGGATCGTGACAAAAGTATAACTACAACAGGCCCCTTTAAGGCTGTAAAGACGG +GCGCACGCGCCGGAACGACTACCCTACTCGGCCTCAATCCCCGCCGGGTTGAAAGTGGCA +CGAAGGCGAGTCAACTCCTCCGAAAGCAAAGAACGGTGCTTCAAGAGGAAGTCGAGCTTG +TAGAGGTTGGTAATGAGCTCCGAGCGGAGCTCGCCTTCAACGCGCCTAAATGCGAGAACA +GGCCCATCGGTAGGGAGACCGATCGCGACAACTTCTGCTGCTTCCACAGCGACCGCAGGG +GACGGCGCGCCGGCTTCCTGCGCCTCTAAAAACATGAAATAAAAATTATTTTAATCAAAA +ATTAAAAAGAGAGGAAGGGGGAGCTGAAGCTCACCGGTGACAGTAGCGGCAGGAGGAGTA +GCAGGAGGAGTCGCAGCGCCATCCAAGCGAGCCCGCTTGGACGGACCAGACTCGGTAGAG +CCATCCTCGGCCGCAGAGAGAATTTGGACGGCCTTCAGATAAGCGTAACTGGTCAAATCC +ATACGTGGAACAAGGTGATAAGGGAGACGTACAACTTCGGCACGTTTGGAGGTGGTCGCC +TAAAATTTGAGGTTTAATGTTGGATCGCGATCCTCATTTAGAGAAAATATAACTCACGCG +GGAAGAAAAGCCACTCGCAGGCGGCTCGCGACGCTTCTTGGACGGGCCAGGGACCTCGGA +AGATAAAGAAGGTACACCGGGATCGGTAGCGCACTCGAGAGTGGTCGACTCTTGACCCAA +AAGCATCTGAGAAAATGCCCAAGCGAGCGTTCGTTCGCAGTCAGCAAACGAGAGACCTTA +AAAAATTCATAAGTACACACTTCGATGTCAGTGTCCTCTGAAGTACCTGCTGGGGCAGAA +GCAGTCTCAAGAGGGTCGATGCGCTTGCCCTTACCCGCGATATGGCCACGCGGAACGCGC +TGTAAAAATATTAAGTTAGGAAATAAAGAAAAGAGGAGAAAAATAAAGCATACAGGGCCA +GTCGGGTGGGTATCTTTGTACGTGACCACAGGAGAGCTGGTCGCAGACAGGTGGAAGCTA +GGGTTAATCCTCGCAAGAGCCAAATGAAGGCCGAAGAAGTCGCGGACTGCGCTAGACATA +GTATATCCCTTCTGTGTAACCACTGCCTGGAAAGCCCGGCGAACCGAGACCACCAAAGCG +GCAGCTTCAGGATTGGCTGCAATAGCAGGCGCGAGGCCAGACCACTTCCGGAGTACCACT +GCAATATCCTCCAGAATGTTGGCATAATGCGCAGGAACGGCGGAGGGCGAAGAACGTATG +CTCTCTAAGAGTGCGACGCGTTCGGCGATCTCAGTAAAGGCAGGAAGGTTGCGACGAGGG +GAAGCCATGACTGACTAAAGAAACACGGTCAGAGGAAGACCGTTTTATACCATCTACAAG +GATCGCGATCCACAACACGCGTAAATTGGGAGACCAGGGAACTAGTGCAACTCAGTAGCG +AGGCGTGCAAGTAGAAAAATACCCGGTTACCGAACAAAAAGCAGAGCTAGCGAGAAAATC +TGCTGCGCATGGGTCGTAAATACTTGGAAAGATATGGAGTAAAATGAATCGCGATCCTTT +GAAACATGAGGCAGAGACGATATCTCAAGCCAAAACAGTGGCAGTCAAGGTCTGGAATAA +TAAAATAATGTTTTATTGAAGATAAAATACGCGCGACGCGCTCAATATAGAGTAGTAGCC +AAATTCGGACGCTTAAGCGGTGTAAGCCTAAGTAGGCACACTGTGTACGGCAGTACGGTA +ATGGGATGTCCACTTGACGACATATTCATTAAACCACCGAACGGAATCCAAAAATAATAC +ATTTCAAATAAGAAGCTTGGCGAGTCTACAGATGGATCGCGAGCACAAGAAAAGGTACAC +TAGTCGGGCAACTCGAGCGCAGATAGGGTAACAGTGCCTGCAGGCTGCGGAAACGCGCGG +CCTTGCTGCAATACCAAAAGTCAGCTACGCTCAGTAAGCACGGAAGAAATAAGGCGTACA +GAGACCATGAACTGGTAGCAGGAGATATCGCGAGCTGCGTGTACGAGGTTACGGAGACGG +CAGTGCTCGTCGCCCAGATAGGGCATGCGCTGATGATTGAGGATAGCGAAATGCGCCACG +ACAGAAGAGTGAACGCCGAGTAATTCTGACAATAAGTGCAGAAGCTCGGGGTCACCAAAC +AAATGCTCTGGTGTGAGATCAAGGCGACACTGGATCGCGAGACTTCAGATGGGCAAAAAT +ACATGATAGTAAAAGACTTACCGCCGCGCGAATCATGGACTGGACGGTGTACAAATTGGC +ACGCGTACCCGCCATGGTATTAGTCTGGTCATAAGTCGAAATGCGCCGCTTGAGAGCGAT +AATGCCAATCACCAGTTCGTTAACAGATGGACTGGGCGGAGGAGATTCTAGATCCCCGTC +GAGAATAAAGAGGTCGATAGAGGGATGTGCCGGGTTCAAGCCATTAGCGGTGCGGGGTGT +AATAGGTTGATCGCGAGCGTCGGGAGTGTCGAACAAAGGAGTCTCGAGCACTTCACCATT +AAGGTGGGACGCGCTAGAGTTCTCAGATTGACGCGGGAGACCAGGCATAAGGCGAAAATG +AATACAATTCCATTCGCAAAAACTACATGTCTATATATGCTCGTAATCAAAAGCTCCGCA +GAGCTGAAACGCCTTAGGAAGTGTGAACGCGTGCGAGATGACGATACTAGAATCGTGTTA +GATATCTGGAGTGATAAAATCAAAAATATCCACGTACAGATGGATCGTGAACCATCAGAT +GCGTAAACGCAAGCAACCCTTCTAATCCCAGGCGCTCGTCACAGAAATGGAACGGACGCT +TGTGCTGCAAAAAGGGAGCGCGATCGCAGATCTTGATGACGGCAAGTTCGAGCCGAAATA +AGTACAGAATGTGCAAAACTAAAGTAGGGTTGGTGGCGAGATTATGAGCAGAAAGACGCC +AGGACGTCTGGATCTCGAGACAAATTAATCAATAATAAATGAATAAATAATTGTGATACG +CACCAGACGACGGTACAAAGCGTGGATACGCTCTAGAGTGCCTTCTGGATCGTCCTTGCC +CACAGTAGACAAGTAACGAGCATCGAATGAATCCAAATCAACAAGCAATTGCTTGAAAAG +TTTGGATCGCGACTCATCGTCGAGGCGATGAAGGAAGATACCGGCGTCGGATGCCTCGCG +AATATTCGTAGAGCAAAGAGGCACGTCGGGGACATAGGGAAAAGCCATCGTGCGCCTGAT +ATGTCTGACGTGTACGCAGAGAATTTTATACAAAACAAACAGAGATCGCGATCTCGATAT +TCCATTCAGAGACCAACTGGGGTCAGTTGCTTTTTGTTGGGGGGGAGAGATAAGATCTAT +CTAGAGAAAATTTAACCCGAATAATTTTCGAGTTTTTTCACTTAGAAATCACACTTCAAA +TCAGGCAAATTTGGAAAGACAAAGCGAAGTTTTTATTGAGAAGAAAACACAAGTACTACA +GGGAACTTCAAAAACCCTATAGTAAAAGAAGAGATGAGATATGAAAAATATAAAAAAAAA +AAGAGAAAAATGCTGTCAACGGCGAGCCCTCTTGACCCTAGGACGAGGAACAGGAGACGA +GCCAGAGCGCTTGAGGCGGAGGAGCTTCTGACGCAGGGGAGAAGGCGAACGGTCACCAGC +ACCGCTCCCAGCCTTATCCTCCTCGTCCTGATTGCCACCAACGCTCTCACCCTGGTCGTC +CTCTTCGTCCTCTTCCTCATCACCATCACCTTCGCCAGAGCTTTCTATAGCTTCGTCGTC +GATAAGAACAGATCGACGAGGAAGAGCGCGTTGTGGACGAATGGAAGCACTAGCACGGCA +AGTGCGCGTTGGCGCGCGCGTCGAAGATGCGCCGGTCGCGACAGTTGCTACAGGCACCGA +AGGGGCGGGAGCTGTAGATAGCGCGGGATGAACCGTGAGTGGAGACCGATCCGGGGTAGG +GGTAGCCCAGATGGAGAGCTGCGCGAATAAGTTAGCGAGCTCGTCCGGAGACGAAAGCAC +GCTGGGTGTCGGCTCCAGTCGCACGCGCTGTGCGTCGATATCAGGGAGCTCCAGGAACCA +GCGAAAGATGTCGAAGGCCTCGGGGTCCGAGTGAAATAGAGTCGCGATAGGTGTGGAAGC +GCTAAGGCGCTCGGATAGTTGGAGCGCGCGGTTAAGCGCGCGGGCACTGGCTTCGGCCGA +CCGGATCGCGAGCTCTTGTTGACGGAACGCCTGTTGCGCGTGAAGCACAGCTTCGGCCAA +CAAGGACTTCAACACTGCAAAAATAGTTTAGACTGAAGAAATAAAGAAGAATAGAATAAA +GAAAGCACCGTTGGGATCAAGATCATTCCATGGCGCAAGAATAGCCGCGAGCTCCCCGAG +AATCTTGGGGGAAGCTGCGAAAGTACAGCCAGTCTTGCGGCCGGTCAGGCAGGCCTTGCA +TTGGAGGCCCCAGCCGCGGAATTCGCAAAATAAAAGAGTCCCGTCGGCATGAGGGATGGT +ACAGGGAATGCACCGGGCTGGGGCCTAAAAATAAAATAAATAAATCAAGATAATAGAGCA +GAAAAGAAATAAACTCACCAATAGAGTCTTGATCACCGCTAACGCCTTCTGAGCGTCGCG +GAGGAGCGCAGAGTCGCGCATGGGGCCCAGGGCGACGGCCAGATACGCGCCAGCAGCGTC +GCGAGGCGTGAGGGACTTGAATAATTCGAGAGTCTCCTCGTCTGGCTCCGGCAGGGAATC +AAAAGCGGCGTTGGGATGGCCGACCGAGGGCGGGACGACTTGTTGGATCTCGACCGAGCT +CACGGCCTTCTTGAATAAGTTGATGGCCCGTTGGCTTTTGGACCTCATAGTGACAACCTT +CGACCCGTCCTTGCCGTGGTTGGATGTCGACGGGCGCAGCGCAATAGTGGGCTAAAAATA +AGGCATCAAAAGATAGGCAGTAAATTAAAAATAGACAAATACCTCGAGAGGGAGCGTATT +GAAGAAAGTTTGCGCATTAGAGGTGAGCCGAGCGCGAGAAAGGAGAAGAGCGGCAAGCTC +CTCCTCGGCATCGGCGTCCTCATCACCTTGATCAGAGGGATCGCGCTCTTCCTCCGACGG +AACTATAAAAACCGTGAATAATAAGAAAACAGAAAAGAATGATAACTTACCGGGTGTAGT +AGCATGGCCTTTCCCCTTGTGCGCCCTGGATAAGCGCGGGGTGGACTCGTGATCCGACTC +CTCGAGCTGATCGACCTCAATAGGTTGAGGCTCTTCGGGAGGCGACGACGCGGGTTCTGT +AAAAATATAAACCAGAATTAAAAAAGGGTACGCGAGTAATGAAAAACAAAAGAAAATAAG +TACCTTGTAACGCCGCTACAGGAGGAGCAGCAGCAGAAGAAATAGTAATCTCCATGTCCT +CGCGACCGGAGAAGTCATCGTCCTCGGGAGGGGGCAGAGCTGGGACACCAATGGGGAACT +GCGCCTCGGCAAGCTTGAGAAGATCCTCGTCGACGGGAGGATCGCGAGCGACGTGAATAG +GGTCTTCCAGGTTGTCGACAGGAGAAGCTGGTTGAAAACGCCTCGCGATAGCAGATAAAG +ACAAGAGGCGCTCACCAAGAGAAGAAGGAGCGGACACAGCGGGCCGGGGAGTAGCGAAGA +CGGAGCTGTTGGAAGTAGAGGCTGCCACCACGGAAACAGAAGCGGAGGCGGCAGCTGCAG +GCACAGAGAGAGAACCCGCCACGCTTGCGGCGTCTGGCTCCGGAAGAGCGTCGACCGGAA +GTAGGAGCGGGCGAATAAAGGACAGAAGAATATTGGCGGCCTCTTGATCAGCCGAGCGCG +GCGTCGACGACAGAGGCTCTTGATCCTGATGGACCGAAGAATCGCCCGCGGTGAGATTGG +GAGAAGGTTCGCGAGTCGGCGAGGCAGTCATGAGCAAAGGAGATGGCGGTGGAGAAGGGT +CGCGAGCTGATAAAGGTGGCGACGGCGCGTCGCGCGCGGGAGATGGAGGCCGGTCGTCGC +GTAAAAGCGCCCCGCTGTCGAGAGGGGTGTCCATGAACGACGAGGGCTCTCGCCAGGTCG +AAGGAGGGCTGCCGCTAGCAGCCAGCGCGGCAGAAAGACCAGGTGGGGGTGAAAAAGCAT +CGTTAGGGTCGTACCGGAGGTCGGCGCTGCAGGGGAAGCTCATGTCGATAGGTGGTGGAA +TAGGGAGTTGCTGCACGTAGCAGCCGATCTGTCCGGCATCGAGCCATCGGTGTCCAAAAA +GATGCGCTTGGTCTGGAAACCATAGCGCGGGATCGGTGCTAAAGAACAAAAGTTCAGCGT +CGTACTAAACCAAAATATGTAAACGTTAGTAAGACATGGCAAACGAGGAAAAAGGATCGC +GACACGTACTATGACAACGTCCCGGTACCAGCCATGCGATAGATGTTCCAGCGTCGCGCT +GGAAGGCACAGCATCGCAAACACGGGAGATGGAATACAGGAAACGCTCGACGGGAGCGCG +CAGGAAGTGGTCAGCGGGAAATCTCGCCAGTCGGTCATTCAGAACTCCCTGAATACGACA +CAGTTTAGCTAGAAAAATTTAAAAGAGACGGAATATGACGCTCACGAGGTGAGACGACCA +CTCAGTGATCAGCGCTCTTAGCCAGGCGTGGCTGGGCGTCTCTTGAGCAAGGAAGGCGGC +TATGATCTTGCTGAAGCGGAAAAAGGAAAGAGCGAAGGAAGAGGAATAATTAGTATCCGG +GGAGAAAAGTGTCCCCTGGAAAGTAGGAAAGAGGATAGGGTGTGTATGCATAGTGAAAGG +ATGAGGAAAGTGGGAAACATACGCGACAAGGGATCGCGACTTAAATACGTCGTGAACCAG +CGGCGTACGCGGACAGTCAAAGTCTCGCGAGAGCCCACCGGCAATCTAGGAAGCGTTGAT +TTGCGTCTATAATGGGCAGTTAACTTCCTAGTGATAGCTTCATGGATCGCGAGAGACGTC +ATAGCGTAAAACTTATGTTGCGCGGCGTGTATGTCGCGAGAGTAATGCTGGGCTAGGGCC +AAATTCTAAAAAGTTTAATTGATTGATGGGGAAATTCTTCTGCGACGCCGCTACAAAGGT +CGCGATGCATCCTCACGCCTAGTTGGAGGATCGCGACGAAAGAACTATCAAAATAATGGC +CTTGCGCGCCTTAAGCGCTCAGGATAGACTATGCGGAAGGGACGTACCAGGATGAGGAGA +TGCCGAGGAAGGAAGCGCGTCGCAATCTAAAAATAGATAGGTGCAGCGCCGTAGCAACGG +CTTCGATGTCTAGCCCAGGAAGCTGGAACCAGGCCAGAAGGCTGTCCGTGGGCGCCGATA +TGAAAGAGCGGTGGCGCCCACTGATAGAATACCAAGGAATAATGACCAAAGCAGCAGGGG +AAGTGCCCGTCTAGGGATCGGTCGTACGGAGTGTCCAGAAAACGGATCGCGACAGAACCG +AATAGCGTTTTAAAAATAGAATCAGGTCGGGGAAACTCTGAATGGGTGTCGACTGGGGAC +AGTCGATATTTGTTAGGGGGGAGATGATAGGGTAGTTACATGGCTACGCCTGAAAATTCG +AAATTTTCACATTTCCCTTACAAAATAAATAATGATTAAGAGGAGCTAAGGCCGTCCCGG +GCTGAGAGCTCAGAGCAAATGCGCGTGCGGGCGATAATGATCGCGAGCCTGTGACGAAGG +TAGCCGCGCGCTGTGCTAAATATAGGTGCACGTTCGGCAAGCTGGGAGACAGTGTACAAA +GCTCGCGATCCATTATTATTGTAGTAAAACTGCACGGCGGCTCCATTACACTAAGGGACA +GGAGGACTAGACGCTATGAGGGAGTCGCGAGACTAATACAGGTCGTCCAGGACGCTCGCG +ATCGCTAGTACGGAAGACACACGCCTACCGGCGGACCGGCAATAATAGCACACCGGCCGG +ATAGCGCTAAACCGTTGGCGCGCGCTTAAGCTATGAAGGCACGGCAAATGCCGAGCGCGC +CCGAGCGCGCTTCCGAGGATGCCTGCAGAAGGCGTATCTGCGCCAATACGGGCTCACGAT +CTGACTTATCAGGTCGCGGAGTACCTAAACAATAAACGGGTAGGATCCGAGGGGCTTATC +TCGAGCCCCGTGTCCTAAAAACGCTCAGAAACAGTAGATAGAAGGTGACTCATACGAGGT +AGCACATGGATCGCGAGCCTCGAGGAGGGCAACCCTTCGCCCATTTGTTTGTATAACGGT +TTGATCATATTAGACTTAGAGATATTTTCCATACAACCTGTGTACTATTTAACTAGCTGT +AGAGTACAGAATAAAATCAAGCAATCGTACCCCACATTTTACAAGAGCTAAACCTGCAAA +GGCGCGAGCTCGACTAAAACTAAGGAATTTACACATTTGACTTCCGAGCTTCGAACTTAA +GCACTTCGTAAGATCGTGATCCCGTTAGCGCCGTCAGTGATAGTAGATTTAAGACCGAGC +CTACTGAGAGTGGTAGAGAAGCTAGTTTTAAAGAAAATATTGCAGACGGATAGCGCGAGA +CTACGAGAATTTTGAGGTGCCGTAGAGTGCAAACGCTCCAGATCCAAGGCTACTAGACGT +TTTCGAGTGCCCTAGTGATTGATTGATATTTTACTCTCGCGATACATTGGAAGTTTTGGC +CGGAGTGTTATACAACGGAAAAGCTGAAGATAAATAAATCTAAAATCTGTTTAAATCCCC +CTCAACCTTGAAGAACATCGCAGCACTCGCTGTCGAGGATCGCGACTACTTCTACACGTA +TATAAAACAATAAAACCCCTAAAACTACACTTTTGCTTCGTTTTCACCCTAGGAGCTAGA +CCACACCATATATCTCATTTTGTCTGTTGAGAGCGTCGCTCGATACTACGAAGTAGATAT +CTCACTCCGCTGGGTTTTGTGTTTTCTTTTGTTTTCGATTTCGCGACTTGCCTGACAGCA +AGCCTCTCA +>SRR17300492_42243 +TAATTAGGAAATTAGACACTTTTAGATGCTATTAATACTTTTAGATACTTTTAGACACTA +TTAGATATAATCCGGAGCTAATACAAGGGGGTGGTTTTCCAGATGTGTCCAGCTTCTTGT +AAACAGAGATTCTAGGATATTGAGTGCCATAAGGAATTGTATCGGTGCTTGCGATATCAT +TGTCCCAGCTCTGGCCACCCTGATGAAGATTGCCATGGCAAGCACATGGATCATCTACAT +TGGCGCAAGTACGGACGAGGCCAAGACTAGAGCAAATTCCAGTACTTTCGATGATTCTGA +TCTAGAGATACAATAAATGTTCAAGGCTCACCTAAATTTGAGGCAACACACTCACCAACT +TAGCCTGGATGTTGTCACCCTGCTTGAATTTTGTGAACTGTTACTCACAAAAATAGGGCA +AATGTCATGGCAATGCGTGTAAAAAAAGTCTTGAAAAAATCGTTTATTGGCATAGGGCCA +ATGAAGCTGTAGTCCATGTCTATAACCGATGGTACTGTGCTGAGGAGGGATGATCTCATA +TCAGTCCGAGGATGTGTAAGCAGTGAGCAACTAGAGTGAGAGTTCAGGAGGTCAGAAAGA +AGAAGGATGGTGTCGCCGACATACCCAGGCTAGTAGTGATTACAAGTCCAACGAAGAGCA +AGATGTTGAGCCATTGAGGACTCGAGCCACCACACGTTCAATTGGCTGGGTTTGAATTAC +ACATTTAAAACTCCAAAGTACACGTGACCTGGCATCCAGTGACAATGTGGCATAGTACAC +ACTGCTCTCTAGAGTCTAGTCCATAGAATAGGGTAGCTTTTCATTTGGGCGGGGAATCAT +ATACGCCGGCATGGGCATCAATCACTCGACTCAACACAGCATACAAGTAATCTTAGTGAA +TATCACGAAACTAGACACTGAGATCTGGTAGTGGGCACTGAACTCCTTGGGTCATCGCAC +GAGCCTTGAGTCACAAGCAGAGACACCAGAATAAGCTACAAGACGGTGCAGTAACAGTCG +CATCACAACTACGCCGTCTTTCGTTTACCACTGGCCCTCTGCAACGCAACTTCGTCCAAG +CTGCGCCTAGCTCCGGCCAGCTTGTAGTATAACGATTCTCCATGTAAGCTGTCGCTCTGG +TCATTCCTATTACTTCCCCATCCCACCGAGGACAGGTGGTTGTGGAAAATCTTGGTGAGG +GAGTCTGACGCAGTCAATGCAGTGCGAGCTTCGTCAGTGGTGGGGAGCAAAGAAAGGTCA +ATTCTCGATGGTCGGTCAGAGTAAAGGGGAACAAACAGCCACCGAAGTTCATGAATAAGT +TCGACGAGTACTAGACTGAAGAACTGCAGAAGAGTGCTCTCGTTGAAGTGTGTGGTTGCG +ATCTGAAAGAAAGCCCGTTTGCCTTCCCCGCCAGTAGCAACACCATCATCGTCGACTTCA +CATTGATCGAATACTACTTTCATCGACTTGGTTAGTTGTGAACGAAGCGGTTTCGGTATT +TTGTGAGTTTGAAACTAAACACAGTGATATACCAGAACATGGAGAAATGATTCCAAGTCA +TCACAGAGTTGATGGGGCTGCGATCCAGGTTGACTCAGTCGAGTTAACAACATGAATTGC +CATGTTCCCTGATAAAATATATTACGATGCAGAAGTTAAATAATCAAATAGTACCAGCTC +ACCGTTCTCCGATTGAGCCTTGCTCCTGAAACGGGGCAATCTGATCTTCTTGCAAAGTCC +CAGTCTATGAGCAGAGCGTGGCCCTCGTTCGTGATTAGAATATTCCCACTGCTTATATCT +TGATGCAGCATGCCAGAGACAAAAGCCTCCTGATGGGCTGGCTCAGAAATAAATTAGTTG +GTATGGGGCTGTGGATGCGTAATAGGCAACATACAGATAATGGCTTTATAGAGCACCTTG +CAGAGTTGCTCTGTAGAATTGTACTGGCTCAACACATCTGGAAAACCACCCCCTTGTATT +AGCTCTGGATTATATCTAATAGTGTCTAAAAGTATCTAAAAGTATTAATAGCATCTAAAA +GTGTCTAATTTCCTAATTAGGAGCAACACA +>SRR17300492_101362 +CCATGGTGCGCCGCGGCTTTCTTCCACCCTATTGCATATGGACCGTGAAGTGAAGGTGCC +TGACCCTATGGCTGGTCTAGCAGAGCTTCACTCAGGCGCTCTACCACCTCGCCGCGAATC +CAGAGTACGCATGCGTGCTGCGCAAGGAGGTCGAGTCCGCGGTCGCGGAAGACGGGTGGA +CGAAGCACGCGGTGGGTAAGATGCTCAAACTCGACAGCTTCATTCGGGAATCGCAGCGCC +TCAATGGACTTGGTCTATGTTAGTTTCTTCCTTGCCTTCGACCCGTGTCTGTTTACTAAC +CTCACCCGTCAATCTCTCCTATTACGGCACTGCCATGGGTATGATTGCCAGTGACACTTC +AGCGCTATGCCCTCAAACCTTTCACGCTCTCGACCGGTCAGACGATCCCAGCGGGAACGT +TTCTCTCGTGCACATCGCTGCCGACACATCATGATCCTGAACTGTATGCCGATCCCGACG +TCTTCGATCCCTGGCGCTTCGCTAGCATGCGCGAATCACACACCAATTCGGATGACGACC +TGAGCGCCCTGGCCAGGGCCAAACTCCAGATGGTGTCCACCAGCACAGACTTCCTAGCCT +TCGGGCACGGCAAGCACGCCTGGTAAGTCGACCTCCCCTCCGGCACGCCCCTCGATCTTC +AGGAAAGCACGCCCTACTGCACGCGACGTCTTTCACGACACATGTTGACCTCGTTTCCGC +AGCCCCGGGCGCTTCTTCGCCGCCTACGAGATGAAAGCAATGCTTGCGCACGTCGTCGTC +GCCTACGACGTCAAGTTCGAGAACGGCGCTGCGGACTTCCCGCCAAATTTGTTCATCGGA +TCTGCCTGTTTGCCGGGAAAGGGACAGGTCATGTTCAGGAAGCGGCAGGTGAGCGACGAG +TTGACTCTCGCTTCCCTAGAAAAGTAGTCATGTTGAGTACTCGTGTGTAACGTACCTTGA +GTCAAGGAGATTGACTGAAGGTACAATTATGGTTTCTTGCATAGTGCTGATAAAATAGTG +AGAGTAACAGAGGAAGGTGTGAAACAAACGACTCCGGGAGATATACAGTCATCACGAGCA +ATATAGTACATGCATTACCACTGGCACTACGAGATCGGACTCTCCTTCAATAATACCCAC +AGAAAGCAGCTAGGAAAAACCCCTACTCTAAGAAGACTTCGGTAGGCCACATGTGGGGCA +TACGATAGGCCTAGTCTTGCACGCCTTGTATACTGCGTATCCCAGTCCTGCTACCGCCAT +CCCGCCTGCAGCGCTGATGATGAAGCCTACGACAGGAAGTGCACCTCCGGCTCCTACGCT +GGTAGCGACGGCGAACGGGGATCCCGCGACAACGTTACCGATGCTAGCTTGCACTGCGGC +TGCCCATGATGCTACGCATAATATAAAGTCATTGTCTGTTGGTGGGCAGCAAATGGTGCG +AATGAGCGCACTTGCAATGATACCCTCAGATCCGAAACCAAGTAGAGCTAGGACACCTGG +GGCTGCAGCTGGAGCAGCAGCCAGTCCTATCACTGCACCCGTACCCGTGACAGCGACCTT +AGTATGGTCGCCACAGGTACAGAATTGAGGGCCAGCAGCTTCAGCACCCTCTCCAGCAGG +ATTTATTGCGTCTAGATTGCAAGAGGTGATCAGCAGTCGATGTGTAGTGCACACTCGATC +TCGATGAAGAACTTACTATTCATGTTGCTCCTATTATTCACGACGGTCGAGCGATAGAGA +CTTAGAGTCTGAGGATGTTTCAAGATTCGATTGGTTGTACTGAGTGGGTCGAAGGGTGTT +GGCCAGTCTGCCCCCCACGAGCGTCCTTATATACTTCGACACGTTCCCATCGAAGATTCT +GGGTTATTAGGGTACCTAGCGCTCATCCTATTTTGATATACAAGGTAGAGCTTATGATAA +TATCATATTTGACTCGAAGTATGCCTGGTAGACAAAAGTCAGCCGCTCGTCGAAAGATAG +AAGGACCGCCCACTGCCAAATGTATCGTATCATGTTCCCTTCGGGACCTTGTTTCCAAAC +ACACGCCTGTGCTCTTTGTTCTCATCGGAAAGCATAGCATGGTGACTCCACCTACCCTG \ No newline at end of file