Mercurial > repos > iuc > detect_circular_sequences
changeset 0:faec698e3f98 draft default tip
planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/main/tools/detect_circular_sequences commit 7ea9f729b44c6351c52b6295c780f496d239488e
| author | iuc |
|---|---|
| date | Thu, 11 Dec 2025 08:53:37 +0000 |
| parents | |
| children | |
| files | detect_circular_sequences.py detect_circular_sequences.xml test-data/input.fasta |
| diffstat | 3 files changed, 672 insertions(+), 0 deletions(-) [+] |
line wrap: on
line diff
--- /dev/null Thu Jan 01 00:00:00 1970 +0000 +++ b/detect_circular_sequences.py Thu Dec 11 08:53:37 2025 +0000 @@ -0,0 +1,248 @@ +#!/usr/bin/env python3 + +######################################################################################### +# This script detect circular contigs by looking for exact identical k-mer at the two +# ends of the sequences provided in fasta file. In order to be able to predict genes +# spanning the origin of circular contigs, the first 1,000 nucleotides of each circular +# contigs are duplicated and added at the contig's end. +# +# Inspired by Simon Roux work for Metavir2 (2014) and Corentin Hochart work in PlasSuite +# +######################################################################################### + +import argparse +import logging +from pathlib import Path + +from Bio import SeqIO + +log_levels = { + 0: logging.CRITICAL, + 1: logging.ERROR, + 2: logging.WARN, + 3: logging.INFO, + 4: logging.DEBUG, +} +logging.basicConfig(level=log_levels[3]) +logger = logging.getLogger() + + +def setup_logger(verbosity: int) -> None: + """ + Configure the logger based on verbosity level. + + :param verbosity: verbosity level + """ + logging.basicConfig( + format="%(asctime)s - %(levelname)s - %(message)s", + level=log_levels.get(verbosity, logging.INFO), + ) + + +def find_occurrences(s, substring) -> list: + """ + Find all starting positions of a substring in a string + + :param s: String to be searched + :param substring: Substring to search in s + """ + return [i for i in range(len(s)) if s.startswith(substring, i)] + + +def is_circular(sequence, length, pos) -> bool: + """ + Determines if a sequence is circular by comparing segments starting at `start_pos`. + + A sequence is considered circular if the `length` elements at the beginning of the sequence match the `length` + elements starting at `start_pos` in the sequence. This is useful for detecting repeating patterns or cycles + in sequences. + + :param sequence: The input sequence + :param length: The number of elements to compare for circularity. + :param pos: The starting index in the sequence to begin the comparison. + + :return bool: True if circular, False otherwise + """ + for i in range(length): + if sequence[i] != sequence[pos + i]: + return False + return True + + +def check_circularity(seq_record, subseq_length=10) -> int: + """ + Process a single sequence to detect circularity and return the overlap length if circular. + + :param seq_record: SeqRecord object + :param subseq_length: Length of 3' fragment to check on the 5' end + + :return: overlap length if circular, 0 otherwise + """ + seq_len = len(seq_record) + + if seq_len < subseq_length: + logging.error(f"Sequence too short ({seq_len}bp): {seq_record.id}") + return 0 + + begin = "".join(seq_record[:subseq_length]) + end = "".join(seq_record[subseq_length:]) + positions = [x + subseq_length for x in find_occurrences(end, begin)] + + for pos in positions: + overlap_length = seq_len - pos + if is_circular(seq_record, overlap_length, pos): + return overlap_length + return 0 + + +def extend_sequence( + seq_record, + overlap_length, + duplication_length=1000, +): + """ + Extends the 5' end of a sequence by duplicating a fragment from the 3' end. + + This function is useful for simulating circular sequences by extending the 5' end + with a fragment from the 3' end, based on the specified `overlap_length` and `duplication_length`. + + :param seq_record: The input sequence record to be extended. + :param overlap_length: The length of the overlapping segment that was previously identified as circular. + :param duplication_length: The length of the 3' end fragment to duplicate and add to the 5' end. + + :return: The modified sequence record with the extended 5' end. + """ + # Remove the overlapping segment from the 3' end + modified_seq = seq_record.seq[: len(seq_record.seq) - overlap_length] + # Duplicate the first `duplication_length` nucleotides from the original sequence + # and append them to the 5' end of the modified sequence + if len(modified_seq) < duplication_length: + # If the modified sequence is shorter than `duplication_length`, + # duplicate the entire modified sequence + extension = modified_seq + else: + # Otherwise, duplicate the first `duplication_length` nucleotides + extension = seq_record.seq[:duplication_length] + # Combine the modified sequence with the duplicated fragment + extended_seq = modified_seq + extension + # Update the sequence in the SeqRecord object + seq_record.seq = extended_seq + return seq_record + + +def detect_circular( + fasta_in, + fasta_out, + id_out, + subseq_length=10, + duplication_length=1000, +): + """ + Detect and process circular sequences in a FASTA file. + + This function reads sequences from `fasta_in`, checks for circularity, + extends circular sequences, and writes the results to `fasta_out` and `id_out`. + + :param fasta_in: Path to the input FASTA file. + :param fasta_out: Path to the output FASTA file for extended circular sequences. + :param id_out: Path to the output file for recording IDs of circular sequences. + :param subseq_length: Length of the 3' fragment to check for circularity. + :param duplication_length: Length of the 3' fragment to duplicate and add to the 5' end. + """ + records = [] + ids = [] + try: + with fasta_in.open("r") as fasta_in_f: + for seq_record in SeqIO.parse(fasta_in_f, "fasta"): + overlap_length = check_circularity( + seq_record, + subseq_length=subseq_length, + ) + if overlap_length > 0: + records.append( + extend_sequence( + seq_record, + overlap_length, + duplication_length, + ) + ) + ids.append(seq_record.id) + except Exception as e: + logging.error(f"Error processing {fasta_in}: {e}") + raise + + if not records: + logging.warning("Warning: No circular sequences found.") + + try: + with fasta_out.open("w") as fasta_out_f: + SeqIO.write(records, fasta_out_f, "fasta") + with id_out.open("w") as id_out_f: + id_out_f.write("\n".join(ids) + "\n") + except IOError as e: + logging.error(f"Error writing output files: {e}") + raise + + +def main(): + """ + Main function to detect circular contigs in a FASTA file. + + This function parses command-line arguments, launches function to read the input + FASTA file, process each sequence to detect circular contigs, and generate the + output files. + """ + parser = argparse.ArgumentParser( + description=""" + Detect circular contigs by looking for exact identical subsequences at the two + ends of the sequences provided in a FASTA file and output the circular contigs + extended on 5' end by duplication of the first nucleotides on 3' end to be able + to predict genes spanning the origin of circular contigs. + """ + ) + parser.add_argument("--fasta-in", required=True, help="Input FASTA file") + parser.add_argument( + "--subseq-length", + type=int, + default=10, + help="Length of 3' fragment to check on the 5' end (default: 10)", + ) + parser.add_argument( + "--duplication-length", + type=int, + default=1000, + help="Length of the 3' end fragment to duplicate and add on the 5' end (default: 1000)", + ) + parser.add_argument( + "-v", + "--verbose", + type=int, + default=3, + choices=log_levels.keys(), + help="Verbosity level (0=CRITICAL, 1=ERROR, 2=WARN, 3=INFO, 4=DEBUG)", + ) + parser.add_argument( + "--fasta-out", + required=True, + help="Output FASTA file with extended circular contigs", + ) + parser.add_argument( + "--id-out", required=True, help="Output TXT file with circular sequence IDs" + ) + + args = parser.parse_args() + setup_logger(args.verbose) + + logging.info("Starting script execution.") + detect_circular( + Path(args.fasta_in), + Path(args.fasta_out), + Path(args.id_out), + subseq_length=args.subseq_length, + duplication_length=args.duplication_length, + ) + logging.info("Script execution completed.") + + +if __name__ == "__main__": + main()
--- /dev/null Thu Jan 01 00:00:00 1970 +0000 +++ b/detect_circular_sequences.xml Thu Dec 11 08:53:37 2025 +0000 @@ -0,0 +1,65 @@ +<tool id="detect_circular_sequences" name="Detect circular sequences" version="@TOOL_VERSION@+galaxy@VERSION_SUFFIX@" profile="@PROFILE@"> + <description>(e.g. circular contigs) in a FASTA file</description> + <macros> + <token name="@TOOL_VERSION@">1.0</token> + <token name="@VERSION_SUFFIX@">0</token> + <token name="@PROFILE@">24.0</token> + </macros> + <requirements> + <requirement type="package" version="3.13">python</requirement> + <requirement type="package" version="1.86">biopython</requirement> + </requirements> + <command><![CDATA[ +python '${__tool_directory__}/detect_circular_sequences.py' + --fasta-in '$fasta_in' + --subseq-length $subseq_length + --duplication-length $duplication_length + --verbose $verbose + --fasta-out '$fasta_out' + --id-out '$id_out' + ]]></command> + <inputs> + <param argument="--fasta-in" type="data" format="fasta" label="Input FASTA file"/> + <param argument="--subseq-length" type="integer" min="0" value="10" label="Length of 3' fragment to check on the 5' end"/> + <param argument="--duplication-length" type="integer" min="0" value="1000" label="Length of the 3' end fragment to duplicate and add on the 5' end"/> + <param argument="--verbose" type="select" label="Verbosity level"> + <option value="0">CRITICAL</option> + <option value="1">ERROR</option> + <option value="2">WARN</option> + <option value="3" selected="true">INFO</option> + <option value="4">DEBUG</option> + </param> + </inputs> + <outputs> + <data name="fasta_out" format="fasta" label="${tool.name} on ${on_string}: Extended circular sequences"/> + <data name="id_out" format="txt" label="${tool.name} on ${on_string}: Circular sequence IDs"/> + </outputs> + <tests> + <test expect_num_outputs="2"> + <param name="fasta_in" value="input.fasta"/> + <param name="subseq_length" value="10"/> + <param name="duplication_length" value="1000"/> + <param name="verbose" value="3"/> + <output name="fasta_out"> + <assert_contents> + <has_text text=">SRR17300492_25544"/> + <has_text text="GCGATCCAACTGAACCGGATCTAGAGCCGTGGGGTCAACCGC"/> + </assert_contents> + </output> + <output name="id_out"> + <assert_contents> + <has_text text="SRR17300492_25544"/> + <has_n_lines n="1"/> + </assert_contents> + </output> + </test> + </tests> + <help><![CDATA[ +This tool detects circular contigs by looking for exact identical subsequences at the two +ends of the sequences provided in a FASTA file and output the circular contigs +extended on 5' end by duplication of the first nucleotides on 3' end to be able +to predict genes spanning the origin of circular contigs. + +Inspired by Simon Roux work for Metavir2 (2014) and Corentin Hochart work in PlasSuite + ]]></help> +</tool> \ No newline at end of file
--- /dev/null Thu Jan 01 00:00:00 1970 +0000 +++ b/test-data/input.fasta Thu Dec 11 08:53:37 2025 +0000 @@ -0,0 +1,359 @@ +>SRR17300492_25544 +ACACCATATATCTCATTTTGTCTGTTGAGAGCGTCGCTCGATACTACGAAGTAGATATCT +CACTCCGCTGGGTTTTGTGTTTTCTTTTGTTTTCGATTTCGCGACTTGCCTGACAGCAAG +CCTCTCATCTGGAGCCCACCGCGAGGGGTGGTACAGACTTTATATCTCTTAAATTCCTTA +AATTCCATTTAACAAACTCGAGCCTTATTACCACCTAGTTACGCGTCGCGAGGCTTTGTT +CGAAGCTGCACAAGTAACTTAATAAGCTTGACATAAATCACAACGGCGCCTCGAAAGAAA +GCGTCGAAAGTAGTTAAAGACAAGCCCGAAGAATTAGAAGTTGAGGAGGAAACTACTCAA +CCAAAACCCACCAAAGGCCCAGTACGAAAAGCAGCTCCAGCTAAAGGCGCTAAAACAGTC +GCGATCCCAGTTCCTGTCTTAGCACCTAAAACTCGAGCATCGCAAAGGGCAACAACTAGT +AAAACAGTAGTTGAGGCAGACGCAACACCCGAAGCAGTCGGGAAGCCTGGCAAAAGATTC +GTTGTACCTGCTCGATTACCAGGACCATATTCTAAATTCTTAACTGAGCCATCAGTTGTA +AACCCAGTTGGTGAACCCAGGACAGTACCGACCGGATTATTTGAGGGATATCAGAGACCA +GACCGATCATACGAGCAGTCGCGACAGACACTTCCAAAAGCCCCGGAAGACTTTGCTGAA +ACATCTTTTACGGAAGATCTTCACGATAGTCCGGAGAGTGACAAGGTTGAGTTTGAAGTT +GCTGTGAATATATTACAAGGCTTGGGAGACGAGAATCCTTACCAGAGACCGATCGCGATC +CATCCTACACCACTTGCAGCCAAGCTCAAAGCCCCATTTGAAACAGATAGCCCTTTAACA +CCTTTGCCGAGTGATTACCAGTCTCCAGAAGCGAATTACGCTAAAAGCCAGACAGCTCGC +GATCCAACTGAACCGGATCTAGAGCCGTGGGGTCAACCGCGCGCTAGTTATACTTTCGGA +GAAAGTTCCGCAGCAGGTTTACAAGAGCCACCTGCATATTCTTGGGGAGAAGCATCAGAA +CAACAAAGGGAGAGAGAAGAGAGAATCCAGCGTTATCTTCAGTCACAAATTATTGAACCA +CAAGAGCCTTCGGTTAAAGAAGAAGTTAGATCGGATATCTCGTATCTTACCCAACAAGAA +TATCCACCGCTACCAAGTTCACCTAGACCAGACTTAAGAGGCTCTAGAAGATCTAGATCA +CGATCCAGCACACACCAAAGCAGTAACCACGAAACTAGACACTCGCGATCCGAAATGAGT +GACCATGGAGGAGATGCCGGAGGAGTACGGCGCCAGTACAAACCTATGCCGGCCAGGAGA +TCGAAGGATGCACCTGAATTCGATGAGACTGAGCCAGAGAGTTTGATGCGATATTTCGAG +GATCTAGAGGCGTGTTTCGAGAACGCAGGATTGACAAATGACACAGAGAAAAAGAAATAT +GTAGGAAGATATGTAAAAGCTCGACTAGAGTCGGAGTGGAGCACGCTGAGTGGAGCTGAG +GATGGAAATTCCTACCAGGATTATAAAGCGCAAATTATGGGGGATTATTACGCTGTAGGA +AGCCTGAAACGAGGCTCGATCAAGCGTCTTACTCAGATTTGCAAAGAGCATCAGCGTATT +AGTGCGAACGATATAGACGATCTGTTAACCCTGAAACGACAATTCAGCGCGGAGGCTAAG +AAATTAATGGAGCCGCCGGCTCTATTGGCTAACCATACGCTGGTAGAAAATTTCATGGGA +TGTCTGACTCGCGACTTCCGCGAGAAAGTCTATCAGCAGTTAGAGTCGAACGCGCGCACC +GATATCAGAATAAAGAAAGCTATCACAGCTAATGCGCCAGCTGGTTTGGTACCACCGGCA +CCAGTACCTGCGAGACCCACTCGTCACAGGCCGGAAGATCGTTTCGAGTTAGACGAAGTG +ATCGCGATGGCTGAGGAAATTGCTCGCGAGCAAAATCCAGGTGTCGCGGCGGTATCTTTA +AATTCGCGAACAGGAGGAGCGGCTGCAGCCCCACCAATGGTTGTCAAGACGGAGAGCTTT +AAGCTGGAACCCTTGACCCAGCAATTAGAAGAGCTCAGGGCTGAACTCGCCATGAGTCGC +GATCGTGAGGTGGAGCGTCAGAAGCGCTTTGTCGAAGAAGTAAGGGCTGCCATGCAGCAA +GGGATGCATAATGCGCCGGCGCCACTGCCTGCGCAGCCTAAATTGTATGAGCCTCGCGCT +CCAAATCCCAGCTATGCACGCCCTGAGTACCCTACCACGATGAAGTGTTTCTATTGCGGT +TTACAAGGACACACGTTCAATAGATGTCCCGCGAAAGAAGCGCATATTCAGCTGGGGAAA +ATCATCGACAAAGGATCGCGAGTGCATCTCCCGGATCATACCTACTTAGGTGTCGATCCG +AATAGAACTATTCTATCGCGAGTGGAGGAATACCACGCGCAGAAAAAGCTGGACAGTAAT +TATTTAAATTATGGAGGCCAAAGCGTGCTTCAGCTAGCGCAGATACAGCAGCAGGTCGGG +CCTAACTCAGTCTTTACCAATAAGGCTAAAGATACCAGGGACGATCTGATCTCTGCGCTG +CAAAAGGAAAACGCTTCGCTTAAGGTGTTGATGAATGGACACTCTGAGGTCTTGCCGACG +ATGGCAGCGTCAAGCTCGTCGTCGGATCTAGATCTAGTACCTAGACGCCTACCGGACCCT +GAGGAATACGGGGACCGGTACCACGACGCACTGCGCAAAGAGCGCGAGGAGTTGATGAGT +CTTATTAGTCAACTGGACTATTCGCAGCCGGAAGCGGCGGGTTTCACCAGTACCTGAGGA +AGGCAGTGCTGGCAAACGCGCGCAAGACGCTGGCGCGATCTGCCAAAACTCCGGAGGGTG +CATCAGCAAAATCGAAAGCAGTGCCTAATAAAAATATTAAATCTATTCTGAAAGAGAAAC +AGCCAGTAGAGGAAGAGCCAGAAGAAAGTGATGATGAAGAAAATGAGGTAGCGGAGAAGG +AAATACCCATACAAAAGGATCGCGATCCGGCTGTAAAGCAGGTACCTACTACAGCAGTAC +CCCGTTCTATGCAGAAACATGTAGAGTTCGAAGTCTTACCAGAGGGAGGGTTACCAATGA +GAGCTAAGCCCACAAAGTCGGGGATGATACCGTTCGTGGACATCCCGCCAATGAATCCAG +CCTTGCGGCAAAAGAAACCTGTCGCGATCGAAGCAGAACCCTTACCCACTATTGATAAGA +AAGGACCAGCGTACAAACATCGTGCTCCAATTGAGGACGACGCTAACTGGTCTGGTTTCA +TAAAAACGTTGCGCGATCTGCCTGTAACGATCTCTCAAGGGCAATTAATGGGATTAATTA +ATGCTCAGAGCCGTAAACGGGTAATTGAAGAATTAACTGCTAAGCGAATGCCTGTAAATG +AGGATAAGCCAGTTAAACGCGGCGTGACTATGGTGGAAGAAGTGGAGGGCATGCTAGACG +ACGACGGAAATGCGTATGAGCAGTTAGTATTTACTGAGCTGCCAGAACCGACCTATACAA +TCCTTGGGCAGGATGAGGGTGAGTTAAAAGCGGGGTCAATCATCGCGAGCGATCCAGTAA +CTCAATATCTCAACGGACTCGCTCCTGAGGAGGCGGCTAGGAAAATTATGGTTGCTCGTG +AATCTTATTTACTAAAAACGCTATATCCATTAGTAAACGCACAAGCAGAGGTGGAGTCGA +TTATAGACGGGGGATCACAAATCATATCGATGTCATCAGATGTCGCGATCCAAGTAGGAG +CGACCTGGGACCCAGATGTCACGATCCAAATGCAGAGCGCCAATAAACAGCTTGAAAAGA +CACAAGGGCTAGTAAGAAACATGCCGTTCAAATTCGGTGATGAAATTACTGTCTACTTTC +AAGTACATGTAATGCAGAATGCGGCGTACGACGTGCTACTCGGGCGACCGTTCGAGGTAC +TCACGGCGTCGGTATTCGAAAACGCTCTAGATGGATCACAAATGGTGACGTTGACGGAAC +CGAATTCAGGGAAGCGTTGTAAAATGCCAACTTACGACAGAGGGAAACCACGTAAAGTAA +TCAGCCGTAAGCACCCTGAGACGGTAGAGTCTTTTTAAACCTCGATGAGCTGGTTATAGA +TCAGGGAGAAGTTGCATTTATTATTGGGTCGGACGGCAATGAAGGCTATGTGATCGAAGG +CTATCAATTTCCTCAGGAAGGCCAGAAGTTCACTCAGCACGCACTTAGAAATGCGTACTT +AGAGAGAGCTATCCTGGAAGACGGACATGAGGATGCAGAACGAGAGAAAATAATTAAATA +TTTAGTAGATACACGAAAAACAAAGCCAGTAGAAGGATCGCGATCCAATCGTGGCACGTT +TGGAAGCATCGCGAGCCAATTCCATATGGCAGAATGTGTCGAGAAAGCCCCAAAACAAGT +ATTTGCTGCGACAAAGAAGTACAAGAAGGTGGCAGATAAAATACGGCCCGTATATCAAGA +ATTACCCGACAAATATCGGATCGTGCGCGACATTAAAGGGGATCCATTGAAAAACATGCC +TATGCTATCTAAGCAGCCGCCAGAATTCGTACCCACTGGCCGATACTCTCGCGAGCGCAA +GGAGCAAATGGACATAGTCCATGGCGGAGATTTTCTATGGGAAGAAGAGCGAAAGCTCGT +GCATCAGTTAATCATGCAGCAAAATGAGGCGTTTGCGTGGGACGACACAGAGAAGGGAAG +CTTCAAGTCTGAATTCTTCCCGCCTGTCGAGATCCCCGCGATCGAACATGTGCCCTGGGT +ATTAAAGAATATTCCTATCCCACCGGGTATGCACACCGAGATTTGCGATTTTATTCGGCG +CAAAGTAGAAGCAGGGACCTATGAGCCGTCTAGCTCGTCCTATAGGACGAGGTGGTTTAT +AGTGATGAAAAAGGACGGCAAGACATTTAGGATCGTGCACAGTCTAGAGCCTTTAAATGC +TGTCACGATCGCTCATTCTGGCTTACCGCCGGCTATGGAATCGTTAGCAGAACATTTCGC +AGGACGCGCGTGCGGCGGAATACTGGATTTATACGTTGGGTATGACGAGCGACTACTTGC +AGAAGTGTCGCGAGACATGACGACGTTCCAGACTCCGTTCGGCGCGCTCAGACTCGTCAC +GCTCCCTATGGGATGGACCAATTCGGTGCCAATCTTTCACGAGGATGTTACATATATTCT +TAGGGAAGAAATACCCGAATTTACGGAGCCATACATAGACGATGTACCTATCAGAGGGCC +TAAAACACGCTATGAACTGCCTGATGGTGGCTACGAAGTTATTCCAGAAAATCCAGGAAT +ACGAAGGTTCGTGTGGGAGCATATGGTTAACGTAAACCGGATCGTGCAGCGAATGAAATA +TAGCGGAGGCACGTTTTCAGGTTACAAATCACTATTATGCGCTGCCGAAATCGTTGTCGT +AGGGCATTTATGTACCTTTGAAGGAAGGAAGCCTATGCCGGATAAAGTGCATGTTATTCA +GAATTGGGGATCGTGCAAGAATATTAGTGATGTACGAGCGTTTATGGGAACTATGGGATT +ATTGCGGATATACATATCTGATTATGCGTCGCGAGCCCATCATATCCAGAAACTGCTGCG +TAACAACACGCCGTTCGAGTGGGGACCTGATCAAGAGGAAAGCATGCGCCTGCTGAAAGA +AGGCGTAACGGATGCACATTGTATAACGCCACTAGATTACACGATGTCAGGTAAAATAAT +ACTGTCCGTGGATACATCGTGGCGAGCCGTGGGATTCTATATCCGACAAGAGGATGAGAA +TGATAAGAAGAAAAAGAGATATGCGCGCTTTGGTTCGATATTATTGGGGGATCGCGAGCA +AAGGTTCTCGCAGCCAAAACGCGAGCTGTACGGCTTACTTCGCGCCTTGACAGCGTGCTA +TTATTGGCTCATTGGAGCACGGAACCTAGTGATCGAGACGGATGCTAAATATATTAAAGG +CATGCTCGAAAATCCAGGCATGGGTCCGAACGCCACTATAAATAGATGGATCGATCAGAT +ATTGATGTTCCATTTTGAGCTCAGGCACGTTGCGGGGAAGACATTTGGTCCAGATGGACT +GTCGCGACGCGAATGGCAGCCCGGGGATGAGGAATACGAGAACCCGGAACAGCAAGTGGA +GGATGGATTAGGATCGCTCACCTATGTAAAGAAATTTAAGAGTGATCCAGATCCTTTAGA +GTTTGAAGAGTTTAAAGAGACTATAGATACGCGTGGAGGTTATCAACAGGAGGTGGCGCC +CCAGTTCATACTGGAGGAAACTACAGACCTAGCTGTGTCAGTGGAATGTTTTCAGAAGGA +GTTAGACGCCGCGAGGCATCAAAACAAGTTGGAGCGAGAGATCGCGATCCAATACATCAG +CGCGGGAAGCGGCTCACCAGAGCAGCGCGACTTCTTGCAGCAGTTTATGCTCTCGCCAGA +ACTGCCCAGCGATAAGATAACGGAGAGCTCGGACGAAGCCGAGTACGATGAAAGGAACCG +GACGCCGGCGGGGACGGAACTAGATAATAAAATTCCGTTGATCAAGCAATGGTTAAAAGA +CCCGACCTCGAGGCCTGCTGGGATGTCCACCAAGGAGTATTTTAATTTCGCAAGGAGCGC +GAGAAATTTCTTTGTAGATAAGAAGGGAAGATTATACCGACGCTCTATAGATGAGGCGCA +CAAATTATTTGTAGAAAAGAAAGACCGTACGCGATTAATGCAGAGCGCTCACGATAGTCT +GGGACACAGAGGATCATACGCTACACGCACTATGCTGCAGGAGCGTTTCTGGTGGCCAGA +ATTGGATCGCGACGTGCATTGGTATGTTAAAACGTGCCATTTATGCCAAGAGCGTCAGAA +GACTATGATAAGGATACCTAGGACGGAGACTCACACGCCGTCAATCTTCCAGCAATTGCA +CGTAGACACTATGCACATGACGCCGCAGTCGCATGGGTGTGGGTACATTGTGCATGGAAG +GTGCGGGTTAACTTCGTATCCGGAAGGACGGCCGCTCCGCAAAGAAAATGCAGAATCGAT +CGCGAACTGGCTGTTCGAGGACATAATCTGTCGGTGGGGAAGTCTTAGGGAAATTATCAC +AGATAATGGCGGGCCATTTGTAAAGGCGTTAGCGCATTTGAAGCAGAGGTGGGGCATAGA +TTGGATCACGATCTCTGCGTACAACTCTAGAGCGAACGGAAAGATCGAGAGACCGCACTG +GGATATTAGACAAATGTTATTCAAGGCTTGCGGAGGCGAAGAATTCGCAAGTAAATGGTA +TAAATATTTTTACCATGTGCTTTGGGCGGATCGCGTGTCAATTAGGAAAGGTTTCGGGGC +CTCGCCCTTCTTTCTCGTGACAGGAGCGCACCCTGTATTGCCTATGGACATCATAGAAGC +CACTTGGCTTGTCGAATTACCGGACCGTGTGCTCACGACCGAAGAACTCATTGGATTCAG +AGCGCGAGCGCTCGCAAAGCATAAAGAACACATCGACGAAATGCGCGAGCGCGTATCTAA +ACAAAAGCGCGATGCACTGTTAAAATTCGAGGAGAAACATGTACATAAAATTAAAGATTA +CAAATTTAAAAGCGGAGACTTAGTGCTGGTACGAAATTCGCCGGTAGAAATGTCCTTGAA +CAGAAAAATGAGACGTCGTTGGGAAGGTCCATTTATTGTTATTACAAGGAAAGCTGGCGG +TGCGTATATACTAGCAGACATGAGCGGAAAAGTGTATAAAGATAAAATTGCGGCGTTCAG +AGTAATCCCTTACTTTGCGCGGCGTCATATTCAAGTGCCCGAAAATATTACAGAGATTTT +AGACCAAAATAAAGAGGATCTAGATGCGTTAGCCAACGCTCCAGACAATGAGGAAGCGGA +CAAATTAGAACGTTTAGTTTATAACGAAAACGATCGCGATCCGCAGATTATTGACTGGGA +CGATGATGAGGAACGCTGGTGGGACGATGATATATGGCCTTAGGCCCAACAGGTTTATTC +AATATACGGATCGTGACAAAAGTATAACTACAACAGGCCCCTTTAAGGCTGTAAAGACGG +GCGCACGCGCCGGAACGACTACCCTACTCGGCCTCAATCCCCGCCGGGTTGAAAGTGGCA +CGAAGGCGAGTCAACTCCTCCGAAAGCAAAGAACGGTGCTTCAAGAGGAAGTCGAGCTTG +TAGAGGTTGGTAATGAGCTCCGAGCGGAGCTCGCCTTCAACGCGCCTAAATGCGAGAACA +GGCCCATCGGTAGGGAGACCGATCGCGACAACTTCTGCTGCTTCCACAGCGACCGCAGGG +GACGGCGCGCCGGCTTCCTGCGCCTCTAAAAACATGAAATAAAAATTATTTTAATCAAAA +ATTAAAAAGAGAGGAAGGGGGAGCTGAAGCTCACCGGTGACAGTAGCGGCAGGAGGAGTA +GCAGGAGGAGTCGCAGCGCCATCCAAGCGAGCCCGCTTGGACGGACCAGACTCGGTAGAG +CCATCCTCGGCCGCAGAGAGAATTTGGACGGCCTTCAGATAAGCGTAACTGGTCAAATCC +ATACGTGGAACAAGGTGATAAGGGAGACGTACAACTTCGGCACGTTTGGAGGTGGTCGCC +TAAAATTTGAGGTTTAATGTTGGATCGCGATCCTCATTTAGAGAAAATATAACTCACGCG +GGAAGAAAAGCCACTCGCAGGCGGCTCGCGACGCTTCTTGGACGGGCCAGGGACCTCGGA +AGATAAAGAAGGTACACCGGGATCGGTAGCGCACTCGAGAGTGGTCGACTCTTGACCCAA +AAGCATCTGAGAAAATGCCCAAGCGAGCGTTCGTTCGCAGTCAGCAAACGAGAGACCTTA +AAAAATTCATAAGTACACACTTCGATGTCAGTGTCCTCTGAAGTACCTGCTGGGGCAGAA +GCAGTCTCAAGAGGGTCGATGCGCTTGCCCTTACCCGCGATATGGCCACGCGGAACGCGC +TGTAAAAATATTAAGTTAGGAAATAAAGAAAAGAGGAGAAAAATAAAGCATACAGGGCCA +GTCGGGTGGGTATCTTTGTACGTGACCACAGGAGAGCTGGTCGCAGACAGGTGGAAGCTA +GGGTTAATCCTCGCAAGAGCCAAATGAAGGCCGAAGAAGTCGCGGACTGCGCTAGACATA +GTATATCCCTTCTGTGTAACCACTGCCTGGAAAGCCCGGCGAACCGAGACCACCAAAGCG +GCAGCTTCAGGATTGGCTGCAATAGCAGGCGCGAGGCCAGACCACTTCCGGAGTACCACT +GCAATATCCTCCAGAATGTTGGCATAATGCGCAGGAACGGCGGAGGGCGAAGAACGTATG +CTCTCTAAGAGTGCGACGCGTTCGGCGATCTCAGTAAAGGCAGGAAGGTTGCGACGAGGG +GAAGCCATGACTGACTAAAGAAACACGGTCAGAGGAAGACCGTTTTATACCATCTACAAG +GATCGCGATCCACAACACGCGTAAATTGGGAGACCAGGGAACTAGTGCAACTCAGTAGCG +AGGCGTGCAAGTAGAAAAATACCCGGTTACCGAACAAAAAGCAGAGCTAGCGAGAAAATC +TGCTGCGCATGGGTCGTAAATACTTGGAAAGATATGGAGTAAAATGAATCGCGATCCTTT +GAAACATGAGGCAGAGACGATATCTCAAGCCAAAACAGTGGCAGTCAAGGTCTGGAATAA +TAAAATAATGTTTTATTGAAGATAAAATACGCGCGACGCGCTCAATATAGAGTAGTAGCC +AAATTCGGACGCTTAAGCGGTGTAAGCCTAAGTAGGCACACTGTGTACGGCAGTACGGTA +ATGGGATGTCCACTTGACGACATATTCATTAAACCACCGAACGGAATCCAAAAATAATAC +ATTTCAAATAAGAAGCTTGGCGAGTCTACAGATGGATCGCGAGCACAAGAAAAGGTACAC +TAGTCGGGCAACTCGAGCGCAGATAGGGTAACAGTGCCTGCAGGCTGCGGAAACGCGCGG +CCTTGCTGCAATACCAAAAGTCAGCTACGCTCAGTAAGCACGGAAGAAATAAGGCGTACA +GAGACCATGAACTGGTAGCAGGAGATATCGCGAGCTGCGTGTACGAGGTTACGGAGACGG +CAGTGCTCGTCGCCCAGATAGGGCATGCGCTGATGATTGAGGATAGCGAAATGCGCCACG +ACAGAAGAGTGAACGCCGAGTAATTCTGACAATAAGTGCAGAAGCTCGGGGTCACCAAAC +AAATGCTCTGGTGTGAGATCAAGGCGACACTGGATCGCGAGACTTCAGATGGGCAAAAAT +ACATGATAGTAAAAGACTTACCGCCGCGCGAATCATGGACTGGACGGTGTACAAATTGGC +ACGCGTACCCGCCATGGTATTAGTCTGGTCATAAGTCGAAATGCGCCGCTTGAGAGCGAT +AATGCCAATCACCAGTTCGTTAACAGATGGACTGGGCGGAGGAGATTCTAGATCCCCGTC +GAGAATAAAGAGGTCGATAGAGGGATGTGCCGGGTTCAAGCCATTAGCGGTGCGGGGTGT +AATAGGTTGATCGCGAGCGTCGGGAGTGTCGAACAAAGGAGTCTCGAGCACTTCACCATT +AAGGTGGGACGCGCTAGAGTTCTCAGATTGACGCGGGAGACCAGGCATAAGGCGAAAATG +AATACAATTCCATTCGCAAAAACTACATGTCTATATATGCTCGTAATCAAAAGCTCCGCA +GAGCTGAAACGCCTTAGGAAGTGTGAACGCGTGCGAGATGACGATACTAGAATCGTGTTA +GATATCTGGAGTGATAAAATCAAAAATATCCACGTACAGATGGATCGTGAACCATCAGAT +GCGTAAACGCAAGCAACCCTTCTAATCCCAGGCGCTCGTCACAGAAATGGAACGGACGCT +TGTGCTGCAAAAAGGGAGCGCGATCGCAGATCTTGATGACGGCAAGTTCGAGCCGAAATA +AGTACAGAATGTGCAAAACTAAAGTAGGGTTGGTGGCGAGATTATGAGCAGAAAGACGCC +AGGACGTCTGGATCTCGAGACAAATTAATCAATAATAAATGAATAAATAATTGTGATACG +CACCAGACGACGGTACAAAGCGTGGATACGCTCTAGAGTGCCTTCTGGATCGTCCTTGCC +CACAGTAGACAAGTAACGAGCATCGAATGAATCCAAATCAACAAGCAATTGCTTGAAAAG +TTTGGATCGCGACTCATCGTCGAGGCGATGAAGGAAGATACCGGCGTCGGATGCCTCGCG +AATATTCGTAGAGCAAAGAGGCACGTCGGGGACATAGGGAAAAGCCATCGTGCGCCTGAT +ATGTCTGACGTGTACGCAGAGAATTTTATACAAAACAAACAGAGATCGCGATCTCGATAT +TCCATTCAGAGACCAACTGGGGTCAGTTGCTTTTTGTTGGGGGGGAGAGATAAGATCTAT +CTAGAGAAAATTTAACCCGAATAATTTTCGAGTTTTTTCACTTAGAAATCACACTTCAAA +TCAGGCAAATTTGGAAAGACAAAGCGAAGTTTTTATTGAGAAGAAAACACAAGTACTACA +GGGAACTTCAAAAACCCTATAGTAAAAGAAGAGATGAGATATGAAAAATATAAAAAAAAA +AAGAGAAAAATGCTGTCAACGGCGAGCCCTCTTGACCCTAGGACGAGGAACAGGAGACGA +GCCAGAGCGCTTGAGGCGGAGGAGCTTCTGACGCAGGGGAGAAGGCGAACGGTCACCAGC +ACCGCTCCCAGCCTTATCCTCCTCGTCCTGATTGCCACCAACGCTCTCACCCTGGTCGTC +CTCTTCGTCCTCTTCCTCATCACCATCACCTTCGCCAGAGCTTTCTATAGCTTCGTCGTC +GATAAGAACAGATCGACGAGGAAGAGCGCGTTGTGGACGAATGGAAGCACTAGCACGGCA +AGTGCGCGTTGGCGCGCGCGTCGAAGATGCGCCGGTCGCGACAGTTGCTACAGGCACCGA +AGGGGCGGGAGCTGTAGATAGCGCGGGATGAACCGTGAGTGGAGACCGATCCGGGGTAGG +GGTAGCCCAGATGGAGAGCTGCGCGAATAAGTTAGCGAGCTCGTCCGGAGACGAAAGCAC +GCTGGGTGTCGGCTCCAGTCGCACGCGCTGTGCGTCGATATCAGGGAGCTCCAGGAACCA +GCGAAAGATGTCGAAGGCCTCGGGGTCCGAGTGAAATAGAGTCGCGATAGGTGTGGAAGC +GCTAAGGCGCTCGGATAGTTGGAGCGCGCGGTTAAGCGCGCGGGCACTGGCTTCGGCCGA +CCGGATCGCGAGCTCTTGTTGACGGAACGCCTGTTGCGCGTGAAGCACAGCTTCGGCCAA +CAAGGACTTCAACACTGCAAAAATAGTTTAGACTGAAGAAATAAAGAAGAATAGAATAAA +GAAAGCACCGTTGGGATCAAGATCATTCCATGGCGCAAGAATAGCCGCGAGCTCCCCGAG +AATCTTGGGGGAAGCTGCGAAAGTACAGCCAGTCTTGCGGCCGGTCAGGCAGGCCTTGCA +TTGGAGGCCCCAGCCGCGGAATTCGCAAAATAAAAGAGTCCCGTCGGCATGAGGGATGGT +ACAGGGAATGCACCGGGCTGGGGCCTAAAAATAAAATAAATAAATCAAGATAATAGAGCA +GAAAAGAAATAAACTCACCAATAGAGTCTTGATCACCGCTAACGCCTTCTGAGCGTCGCG +GAGGAGCGCAGAGTCGCGCATGGGGCCCAGGGCGACGGCCAGATACGCGCCAGCAGCGTC +GCGAGGCGTGAGGGACTTGAATAATTCGAGAGTCTCCTCGTCTGGCTCCGGCAGGGAATC +AAAAGCGGCGTTGGGATGGCCGACCGAGGGCGGGACGACTTGTTGGATCTCGACCGAGCT +CACGGCCTTCTTGAATAAGTTGATGGCCCGTTGGCTTTTGGACCTCATAGTGACAACCTT +CGACCCGTCCTTGCCGTGGTTGGATGTCGACGGGCGCAGCGCAATAGTGGGCTAAAAATA +AGGCATCAAAAGATAGGCAGTAAATTAAAAATAGACAAATACCTCGAGAGGGAGCGTATT +GAAGAAAGTTTGCGCATTAGAGGTGAGCCGAGCGCGAGAAAGGAGAAGAGCGGCAAGCTC +CTCCTCGGCATCGGCGTCCTCATCACCTTGATCAGAGGGATCGCGCTCTTCCTCCGACGG +AACTATAAAAACCGTGAATAATAAGAAAACAGAAAAGAATGATAACTTACCGGGTGTAGT +AGCATGGCCTTTCCCCTTGTGCGCCCTGGATAAGCGCGGGGTGGACTCGTGATCCGACTC +CTCGAGCTGATCGACCTCAATAGGTTGAGGCTCTTCGGGAGGCGACGACGCGGGTTCTGT +AAAAATATAAACCAGAATTAAAAAAGGGTACGCGAGTAATGAAAAACAAAAGAAAATAAG +TACCTTGTAACGCCGCTACAGGAGGAGCAGCAGCAGAAGAAATAGTAATCTCCATGTCCT +CGCGACCGGAGAAGTCATCGTCCTCGGGAGGGGGCAGAGCTGGGACACCAATGGGGAACT +GCGCCTCGGCAAGCTTGAGAAGATCCTCGTCGACGGGAGGATCGCGAGCGACGTGAATAG +GGTCTTCCAGGTTGTCGACAGGAGAAGCTGGTTGAAAACGCCTCGCGATAGCAGATAAAG +ACAAGAGGCGCTCACCAAGAGAAGAAGGAGCGGACACAGCGGGCCGGGGAGTAGCGAAGA +CGGAGCTGTTGGAAGTAGAGGCTGCCACCACGGAAACAGAAGCGGAGGCGGCAGCTGCAG +GCACAGAGAGAGAACCCGCCACGCTTGCGGCGTCTGGCTCCGGAAGAGCGTCGACCGGAA +GTAGGAGCGGGCGAATAAAGGACAGAAGAATATTGGCGGCCTCTTGATCAGCCGAGCGCG +GCGTCGACGACAGAGGCTCTTGATCCTGATGGACCGAAGAATCGCCCGCGGTGAGATTGG +GAGAAGGTTCGCGAGTCGGCGAGGCAGTCATGAGCAAAGGAGATGGCGGTGGAGAAGGGT +CGCGAGCTGATAAAGGTGGCGACGGCGCGTCGCGCGCGGGAGATGGAGGCCGGTCGTCGC +GTAAAAGCGCCCCGCTGTCGAGAGGGGTGTCCATGAACGACGAGGGCTCTCGCCAGGTCG +AAGGAGGGCTGCCGCTAGCAGCCAGCGCGGCAGAAAGACCAGGTGGGGGTGAAAAAGCAT +CGTTAGGGTCGTACCGGAGGTCGGCGCTGCAGGGGAAGCTCATGTCGATAGGTGGTGGAA +TAGGGAGTTGCTGCACGTAGCAGCCGATCTGTCCGGCATCGAGCCATCGGTGTCCAAAAA +GATGCGCTTGGTCTGGAAACCATAGCGCGGGATCGGTGCTAAAGAACAAAAGTTCAGCGT +CGTACTAAACCAAAATATGTAAACGTTAGTAAGACATGGCAAACGAGGAAAAAGGATCGC +GACACGTACTATGACAACGTCCCGGTACCAGCCATGCGATAGATGTTCCAGCGTCGCGCT +GGAAGGCACAGCATCGCAAACACGGGAGATGGAATACAGGAAACGCTCGACGGGAGCGCG +CAGGAAGTGGTCAGCGGGAAATCTCGCCAGTCGGTCATTCAGAACTCCCTGAATACGACA +CAGTTTAGCTAGAAAAATTTAAAAGAGACGGAATATGACGCTCACGAGGTGAGACGACCA +CTCAGTGATCAGCGCTCTTAGCCAGGCGTGGCTGGGCGTCTCTTGAGCAAGGAAGGCGGC +TATGATCTTGCTGAAGCGGAAAAAGGAAAGAGCGAAGGAAGAGGAATAATTAGTATCCGG +GGAGAAAAGTGTCCCCTGGAAAGTAGGAAAGAGGATAGGGTGTGTATGCATAGTGAAAGG +ATGAGGAAAGTGGGAAACATACGCGACAAGGGATCGCGACTTAAATACGTCGTGAACCAG +CGGCGTACGCGGACAGTCAAAGTCTCGCGAGAGCCCACCGGCAATCTAGGAAGCGTTGAT +TTGCGTCTATAATGGGCAGTTAACTTCCTAGTGATAGCTTCATGGATCGCGAGAGACGTC +ATAGCGTAAAACTTATGTTGCGCGGCGTGTATGTCGCGAGAGTAATGCTGGGCTAGGGCC +AAATTCTAAAAAGTTTAATTGATTGATGGGGAAATTCTTCTGCGACGCCGCTACAAAGGT +CGCGATGCATCCTCACGCCTAGTTGGAGGATCGCGACGAAAGAACTATCAAAATAATGGC +CTTGCGCGCCTTAAGCGCTCAGGATAGACTATGCGGAAGGGACGTACCAGGATGAGGAGA +TGCCGAGGAAGGAAGCGCGTCGCAATCTAAAAATAGATAGGTGCAGCGCCGTAGCAACGG +CTTCGATGTCTAGCCCAGGAAGCTGGAACCAGGCCAGAAGGCTGTCCGTGGGCGCCGATA +TGAAAGAGCGGTGGCGCCCACTGATAGAATACCAAGGAATAATGACCAAAGCAGCAGGGG +AAGTGCCCGTCTAGGGATCGGTCGTACGGAGTGTCCAGAAAACGGATCGCGACAGAACCG +AATAGCGTTTTAAAAATAGAATCAGGTCGGGGAAACTCTGAATGGGTGTCGACTGGGGAC +AGTCGATATTTGTTAGGGGGGAGATGATAGGGTAGTTACATGGCTACGCCTGAAAATTCG +AAATTTTCACATTTCCCTTACAAAATAAATAATGATTAAGAGGAGCTAAGGCCGTCCCGG +GCTGAGAGCTCAGAGCAAATGCGCGTGCGGGCGATAATGATCGCGAGCCTGTGACGAAGG +TAGCCGCGCGCTGTGCTAAATATAGGTGCACGTTCGGCAAGCTGGGAGACAGTGTACAAA +GCTCGCGATCCATTATTATTGTAGTAAAACTGCACGGCGGCTCCATTACACTAAGGGACA +GGAGGACTAGACGCTATGAGGGAGTCGCGAGACTAATACAGGTCGTCCAGGACGCTCGCG +ATCGCTAGTACGGAAGACACACGCCTACCGGCGGACCGGCAATAATAGCACACCGGCCGG +ATAGCGCTAAACCGTTGGCGCGCGCTTAAGCTATGAAGGCACGGCAAATGCCGAGCGCGC +CCGAGCGCGCTTCCGAGGATGCCTGCAGAAGGCGTATCTGCGCCAATACGGGCTCACGAT +CTGACTTATCAGGTCGCGGAGTACCTAAACAATAAACGGGTAGGATCCGAGGGGCTTATC +TCGAGCCCCGTGTCCTAAAAACGCTCAGAAACAGTAGATAGAAGGTGACTCATACGAGGT +AGCACATGGATCGCGAGCCTCGAGGAGGGCAACCCTTCGCCCATTTGTTTGTATAACGGT +TTGATCATATTAGACTTAGAGATATTTTCCATACAACCTGTGTACTATTTAACTAGCTGT +AGAGTACAGAATAAAATCAAGCAATCGTACCCCACATTTTACAAGAGCTAAACCTGCAAA +GGCGCGAGCTCGACTAAAACTAAGGAATTTACACATTTGACTTCCGAGCTTCGAACTTAA +GCACTTCGTAAGATCGTGATCCCGTTAGCGCCGTCAGTGATAGTAGATTTAAGACCGAGC +CTACTGAGAGTGGTAGAGAAGCTAGTTTTAAAGAAAATATTGCAGACGGATAGCGCGAGA +CTACGAGAATTTTGAGGTGCCGTAGAGTGCAAACGCTCCAGATCCAAGGCTACTAGACGT +TTTCGAGTGCCCTAGTGATTGATTGATATTTTACTCTCGCGATACATTGGAAGTTTTGGC +CGGAGTGTTATACAACGGAAAAGCTGAAGATAAATAAATCTAAAATCTGTTTAAATCCCC +CTCAACCTTGAAGAACATCGCAGCACTCGCTGTCGAGGATCGCGACTACTTCTACACGTA +TATAAAACAATAAAACCCCTAAAACTACACTTTTGCTTCGTTTTCACCCTAGGAGCTAGA +CCACACCATATATCTCATTTTGTCTGTTGAGAGCGTCGCTCGATACTACGAAGTAGATAT +CTCACTCCGCTGGGTTTTGTGTTTTCTTTTGTTTTCGATTTCGCGACTTGCCTGACAGCA +AGCCTCTCA +>SRR17300492_42243 +TAATTAGGAAATTAGACACTTTTAGATGCTATTAATACTTTTAGATACTTTTAGACACTA +TTAGATATAATCCGGAGCTAATACAAGGGGGTGGTTTTCCAGATGTGTCCAGCTTCTTGT +AAACAGAGATTCTAGGATATTGAGTGCCATAAGGAATTGTATCGGTGCTTGCGATATCAT +TGTCCCAGCTCTGGCCACCCTGATGAAGATTGCCATGGCAAGCACATGGATCATCTACAT +TGGCGCAAGTACGGACGAGGCCAAGACTAGAGCAAATTCCAGTACTTTCGATGATTCTGA +TCTAGAGATACAATAAATGTTCAAGGCTCACCTAAATTTGAGGCAACACACTCACCAACT +TAGCCTGGATGTTGTCACCCTGCTTGAATTTTGTGAACTGTTACTCACAAAAATAGGGCA +AATGTCATGGCAATGCGTGTAAAAAAAGTCTTGAAAAAATCGTTTATTGGCATAGGGCCA +ATGAAGCTGTAGTCCATGTCTATAACCGATGGTACTGTGCTGAGGAGGGATGATCTCATA +TCAGTCCGAGGATGTGTAAGCAGTGAGCAACTAGAGTGAGAGTTCAGGAGGTCAGAAAGA +AGAAGGATGGTGTCGCCGACATACCCAGGCTAGTAGTGATTACAAGTCCAACGAAGAGCA +AGATGTTGAGCCATTGAGGACTCGAGCCACCACACGTTCAATTGGCTGGGTTTGAATTAC +ACATTTAAAACTCCAAAGTACACGTGACCTGGCATCCAGTGACAATGTGGCATAGTACAC +ACTGCTCTCTAGAGTCTAGTCCATAGAATAGGGTAGCTTTTCATTTGGGCGGGGAATCAT +ATACGCCGGCATGGGCATCAATCACTCGACTCAACACAGCATACAAGTAATCTTAGTGAA +TATCACGAAACTAGACACTGAGATCTGGTAGTGGGCACTGAACTCCTTGGGTCATCGCAC +GAGCCTTGAGTCACAAGCAGAGACACCAGAATAAGCTACAAGACGGTGCAGTAACAGTCG +CATCACAACTACGCCGTCTTTCGTTTACCACTGGCCCTCTGCAACGCAACTTCGTCCAAG +CTGCGCCTAGCTCCGGCCAGCTTGTAGTATAACGATTCTCCATGTAAGCTGTCGCTCTGG +TCATTCCTATTACTTCCCCATCCCACCGAGGACAGGTGGTTGTGGAAAATCTTGGTGAGG +GAGTCTGACGCAGTCAATGCAGTGCGAGCTTCGTCAGTGGTGGGGAGCAAAGAAAGGTCA +ATTCTCGATGGTCGGTCAGAGTAAAGGGGAACAAACAGCCACCGAAGTTCATGAATAAGT +TCGACGAGTACTAGACTGAAGAACTGCAGAAGAGTGCTCTCGTTGAAGTGTGTGGTTGCG +ATCTGAAAGAAAGCCCGTTTGCCTTCCCCGCCAGTAGCAACACCATCATCGTCGACTTCA +CATTGATCGAATACTACTTTCATCGACTTGGTTAGTTGTGAACGAAGCGGTTTCGGTATT +TTGTGAGTTTGAAACTAAACACAGTGATATACCAGAACATGGAGAAATGATTCCAAGTCA +TCACAGAGTTGATGGGGCTGCGATCCAGGTTGACTCAGTCGAGTTAACAACATGAATTGC +CATGTTCCCTGATAAAATATATTACGATGCAGAAGTTAAATAATCAAATAGTACCAGCTC +ACCGTTCTCCGATTGAGCCTTGCTCCTGAAACGGGGCAATCTGATCTTCTTGCAAAGTCC +CAGTCTATGAGCAGAGCGTGGCCCTCGTTCGTGATTAGAATATTCCCACTGCTTATATCT +TGATGCAGCATGCCAGAGACAAAAGCCTCCTGATGGGCTGGCTCAGAAATAAATTAGTTG +GTATGGGGCTGTGGATGCGTAATAGGCAACATACAGATAATGGCTTTATAGAGCACCTTG +CAGAGTTGCTCTGTAGAATTGTACTGGCTCAACACATCTGGAAAACCACCCCCTTGTATT +AGCTCTGGATTATATCTAATAGTGTCTAAAAGTATCTAAAAGTATTAATAGCATCTAAAA +GTGTCTAATTTCCTAATTAGGAGCAACACA +>SRR17300492_101362 +CCATGGTGCGCCGCGGCTTTCTTCCACCCTATTGCATATGGACCGTGAAGTGAAGGTGCC +TGACCCTATGGCTGGTCTAGCAGAGCTTCACTCAGGCGCTCTACCACCTCGCCGCGAATC +CAGAGTACGCATGCGTGCTGCGCAAGGAGGTCGAGTCCGCGGTCGCGGAAGACGGGTGGA +CGAAGCACGCGGTGGGTAAGATGCTCAAACTCGACAGCTTCATTCGGGAATCGCAGCGCC +TCAATGGACTTGGTCTATGTTAGTTTCTTCCTTGCCTTCGACCCGTGTCTGTTTACTAAC +CTCACCCGTCAATCTCTCCTATTACGGCACTGCCATGGGTATGATTGCCAGTGACACTTC +AGCGCTATGCCCTCAAACCTTTCACGCTCTCGACCGGTCAGACGATCCCAGCGGGAACGT +TTCTCTCGTGCACATCGCTGCCGACACATCATGATCCTGAACTGTATGCCGATCCCGACG +TCTTCGATCCCTGGCGCTTCGCTAGCATGCGCGAATCACACACCAATTCGGATGACGACC +TGAGCGCCCTGGCCAGGGCCAAACTCCAGATGGTGTCCACCAGCACAGACTTCCTAGCCT +TCGGGCACGGCAAGCACGCCTGGTAAGTCGACCTCCCCTCCGGCACGCCCCTCGATCTTC +AGGAAAGCACGCCCTACTGCACGCGACGTCTTTCACGACACATGTTGACCTCGTTTCCGC +AGCCCCGGGCGCTTCTTCGCCGCCTACGAGATGAAAGCAATGCTTGCGCACGTCGTCGTC +GCCTACGACGTCAAGTTCGAGAACGGCGCTGCGGACTTCCCGCCAAATTTGTTCATCGGA +TCTGCCTGTTTGCCGGGAAAGGGACAGGTCATGTTCAGGAAGCGGCAGGTGAGCGACGAG +TTGACTCTCGCTTCCCTAGAAAAGTAGTCATGTTGAGTACTCGTGTGTAACGTACCTTGA +GTCAAGGAGATTGACTGAAGGTACAATTATGGTTTCTTGCATAGTGCTGATAAAATAGTG +AGAGTAACAGAGGAAGGTGTGAAACAAACGACTCCGGGAGATATACAGTCATCACGAGCA +ATATAGTACATGCATTACCACTGGCACTACGAGATCGGACTCTCCTTCAATAATACCCAC +AGAAAGCAGCTAGGAAAAACCCCTACTCTAAGAAGACTTCGGTAGGCCACATGTGGGGCA +TACGATAGGCCTAGTCTTGCACGCCTTGTATACTGCGTATCCCAGTCCTGCTACCGCCAT +CCCGCCTGCAGCGCTGATGATGAAGCCTACGACAGGAAGTGCACCTCCGGCTCCTACGCT +GGTAGCGACGGCGAACGGGGATCCCGCGACAACGTTACCGATGCTAGCTTGCACTGCGGC +TGCCCATGATGCTACGCATAATATAAAGTCATTGTCTGTTGGTGGGCAGCAAATGGTGCG +AATGAGCGCACTTGCAATGATACCCTCAGATCCGAAACCAAGTAGAGCTAGGACACCTGG +GGCTGCAGCTGGAGCAGCAGCCAGTCCTATCACTGCACCCGTACCCGTGACAGCGACCTT +AGTATGGTCGCCACAGGTACAGAATTGAGGGCCAGCAGCTTCAGCACCCTCTCCAGCAGG +ATTTATTGCGTCTAGATTGCAAGAGGTGATCAGCAGTCGATGTGTAGTGCACACTCGATC +TCGATGAAGAACTTACTATTCATGTTGCTCCTATTATTCACGACGGTCGAGCGATAGAGA +CTTAGAGTCTGAGGATGTTTCAAGATTCGATTGGTTGTACTGAGTGGGTCGAAGGGTGTT +GGCCAGTCTGCCCCCCACGAGCGTCCTTATATACTTCGACACGTTCCCATCGAAGATTCT +GGGTTATTAGGGTACCTAGCGCTCATCCTATTTTGATATACAAGGTAGAGCTTATGATAA +TATCATATTTGACTCGAAGTATGCCTGGTAGACAAAAGTCAGCCGCTCGTCGAAAGATAG +AAGGACCGCCCACTGCCAAATGTATCGTATCATGTTCCCTTCGGGACCTTGTTTCCAAAC +ACACGCCTGTGCTCTTTGTTCTCATCGGAAAGCATAGCATGGTGACTCCACCTACCCTG \ No newline at end of file
